From dfc06b0a6d104f753ca6c341e1ce62f459449fc6 Mon Sep 17 00:00:00 2001
From: Jark Wu <jark@apache.org>
Date: Mon, 25 Aug 2025 17:31:09 +0800
Subject: [PATCH 001/287] Initial Commit

---
 fluss-rust/.DS_Store                          | Bin 0 -> 6148 bytes
 fluss-rust/.asf.yaml                          |  45 ++++
 fluss-rust/.github/.DS_Store                  | Bin 0 -> 6148 bytes
 fluss-rust/.github/ISSUE_TEMPLATE/bug.yml     |  58 +++++
 fluss-rust/.github/ISSUE_TEMPLATE/config.yml  |  19 ++
 fluss-rust/.github/ISSUE_TEMPLATE/feature.yml |  58 +++++
 fluss-rust/.github/ISSUE_TEMPLATE/task.yml    |  51 +++++
 fluss-rust/.github/PULL_REQUEST_TEMPLATE.md   |  41 ++++
 fluss-rust/.gitignore                         |  19 ++
 fluss-rust/DISCLAIMER                         |  10 +
 fluss-rust/LICENSE                            | 201 ++++++++++++++++++
 fluss-rust/NOTICE                             |   5 +
 fluss-rust/README.md                          | 138 ++++++++++++
 13 files changed, 645 insertions(+)
 create mode 100644 fluss-rust/.DS_Store
 create mode 100644 fluss-rust/.asf.yaml
 create mode 100644 fluss-rust/.github/.DS_Store
 create mode 100644 fluss-rust/.github/ISSUE_TEMPLATE/bug.yml
 create mode 100644 fluss-rust/.github/ISSUE_TEMPLATE/config.yml
 create mode 100644 fluss-rust/.github/ISSUE_TEMPLATE/feature.yml
 create mode 100644 fluss-rust/.github/ISSUE_TEMPLATE/task.yml
 create mode 100644 fluss-rust/.github/PULL_REQUEST_TEMPLATE.md
 create mode 100644 fluss-rust/.gitignore
 create mode 100644 fluss-rust/DISCLAIMER
 create mode 100644 fluss-rust/LICENSE
 create mode 100644 fluss-rust/NOTICE
 create mode 100644 fluss-rust/README.md

diff --git a/fluss-rust/.DS_Store b/fluss-rust/.DS_Store
new file mode 100644
index 0000000000000000000000000000000000000000..aa422df10c54b59dcb4bd4dcfc37bcac4de3fc93
GIT binary patch
literal 6148
zcmeHKO>fgc5S>j!VpAdI08%eVmbg|SK&gbdIA4cK1*Euw1E3J&sI_ptRpO9C6v=1!
zF<kj2{2h3+yG4xymmUzRW~A9SyE|{a`<(20iAePp$s?i`5qWUNnvdcS#{KMDR&y;4
zpfY2e(SqW5IlqXrt!!!d9~Izt*Q7R`Qc49~d4D=a&-eHuOXo$W^F!5k>bDwAuj%c2
z@1rxljEYIInD-{Lw_H2XI*TvkN&GsUF2}9AeVrGRG@s54Ax)-8dG{vG6TR%|MV`zJ
zH?kd`@A>1_-fH!<)7cLW4iDD*!Rpy#j-MQ^*S>e}!NcdH@u%!O*I%rZ3cosIcN|{A
zR|J(+eU4^%rt?$uFzYrA=!hcf(=l}sy`UkDjxzl*&dkdB57C9Ue;Px?BOW8OkIa`~
z4lCK;D%lNWy`mG#*vwV;E4e<6FlrZb;(4^`oRSKIS9EnQsEUaKqJSuHZ3W!!>Fr*7
z1R;t7qQFg6fcJ+0&KNo@Et;(Zg}DL%>u5HHm_MDE6F3YVmKM<iQ<e&}ROPN1%F@vu
zxV+F|Y0=V2xyy%gPgd@RqRi7Veqho`g%+h01w?^O1$Jz;#pnO<@Av;rlGH>2QQ$@?
zpz4EY(8H44*}AnjK5GN`2RIw&l@@<f5SXJFxqKAw!HuCk-~bppEG?o1CLaPu1}Q{=
Hf2zPQka~Qh

literal 0
HcmV?d00001

diff --git a/fluss-rust/.asf.yaml b/fluss-rust/.asf.yaml
new file mode 100644
index 0000000000..b71e0264e3
--- /dev/null
+++ b/fluss-rust/.asf.yaml
@@ -0,0 +1,45 @@
+#  Licensed to the Apache Software Foundation (ASF) under one
+#  or more contributor license agreements.  See the NOTICE file
+#  distributed with this work for additional information
+#  regarding copyright ownership.  The ASF licenses this file
+#  to you under the Apache License, Version 2.0 (the
+#  "License"); you may not use this file except in compliance
+#  with the License.  You may obtain a copy of the License at
+#
+#    http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing,
+#  software distributed under the License is distributed on an
+#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+#  KIND, either express or implied.  See the License for the
+#  specific language governing permissions and limitations
+#  under the License.
+
+# See: https://cwiki.apache.org/confluence/display/INFRA/git+-+.asf.yaml+features
+
+github:
+  description: "Rust Client for Apache Fluss (Incubating)"
+  homepage: https://fluss.apache.org/
+  features:
+    issues: true
+    projects: false
+    discussions: false
+    wiki: false
+  labels:
+    - fluss
+    - streaming
+    - real-time-analytics
+    - lakehouse
+    - rust
+    - python
+  enabled_merge_buttons:
+    squash:  true
+    merge:   false
+    rebase:  true
+
+notifications:
+  commits:      commits@fluss.apache.org
+  issues:       issues@fluss.apache.org
+  pullrequests: issues@fluss.apache.org
+  jobs:         builds@fluss.apache.org
+  discussions:  issues@fluss.apache.org
\ No newline at end of file
diff --git a/fluss-rust/.github/.DS_Store b/fluss-rust/.github/.DS_Store
new file mode 100644
index 0000000000000000000000000000000000000000..7adc49df07876bc71be2a10c09a4f4452106ddaf
GIT binary patch
literal 6148
zcmeHKQA+|r5S~@b6DfQs@bREmAuAK2m+R7ppddP{hYGtxsiW&w^vnkl?z#R@zog&O
z%<fu<)k_c|Gcx<l&d%(z-^$J{00?*3*#am5fQ3q!DPZ%3&^YOwWQ>PUs5zR@h88s8
z1WxCo+3_D4ptD<rBk=Hdjwknde#dY?XBmtJy&#eS#=Qo;C>$i!>YK=9b4$y4D{mF8
z8}D9@yu?q21K00gQLiOs6ijVDxCpzWc4_TU#)%)s-M&f)J6#O9z6|4z9Jz8BcLplg
z(*st)Dzr=G@p!jdt=P4CZBntvd)s91)F+dIwZ5^rf7X789%K2ei52)CRI*}l3NL8<
zxW^~2A4f92!?@`j(_BVofEi#07LfsS*IC6y+#K(T8DIu}#Q@z8HY%ZGFx9B84s7W2
zk;Zd`BxuuHg3vbT7)&+d2#V0Dh&ol6Cx+1J=(kOrV=&dI(?O_}aUQd>FfSCLR!6_B
z!a+D1xn%~JfmsH!x?7_9-~9glKbyooW`G%3C<a8X;Wb>`lBun8o1<E5qu!#DP+Y3<
lBLxjriZPZ-aT!$!`fV~09fPSx^q}yEfTDpLX5dd5cn5ScO<w>2

literal 0
HcmV?d00001

diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml b/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml
new file mode 100644
index 0000000000..43fbc90d8b
--- /dev/null
+++ b/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml
@@ -0,0 +1,58 @@
+################################################################################
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+################################################################################
+
+name: Bug report 🐞
+description: Problems, bugs and issues with Fluss
+type: "bug"
+body:
+  - type: markdown
+    attributes:
+      value: |
+        Thank you very much for your feedback!
+  - type: checkboxes
+    attributes:
+      label: Search before asking
+      description: >
+        Please search [issues](https://github.com/apache/fluss-rust/issues) to check if your issue has already been reported.
+      options:
+        - label: >
+            I searched in the [issues](https://github.com/apache/fluss-rust/issues) and found nothing similar.
+          required: true
+  - type: textarea
+    attributes:
+      label: Please describe the bug 🐞
+      description: >
+        Please describe the problem, what to expect, and how to reproduce.
+        Feel free to include stacktraces and the Fluss server/client configuration.
+        You can include files by dragging and dropping them here.
+    validations:
+      required: true
+  - type: textarea
+    attributes:
+      label: Solution
+      description: Describe the proposed solution for fixing it, if any.
+  - type: checkboxes
+    attributes:
+      label: Are you willing to submit a PR?
+      description: >
+        We look forward to the community of developers or users helping solve Fluss problems together. If you are willing to submit a PR to fix this problem, please check the box.
+      options:
+        - label: I'm willing to submit a PR!
+  - type: markdown
+    attributes:
+      value: "Thanks for completing our form!"
diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/config.yml b/fluss-rust/.github/ISSUE_TEMPLATE/config.yml
new file mode 100644
index 0000000000..c2520da489
--- /dev/null
+++ b/fluss-rust/.github/ISSUE_TEMPLATE/config.yml
@@ -0,0 +1,19 @@
+################################################################################
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+################################################################################
+
+blank_issues_enabled: false
diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml b/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml
new file mode 100644
index 0000000000..fc7357165d
--- /dev/null
+++ b/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml
@@ -0,0 +1,58 @@
+################################################################################
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+################################################################################
+
+name: Feature Request 🚀
+description: User-facing functionality or improvement you’d like to see added
+type: "feature"
+body:
+  - type: markdown
+    attributes:
+      value: |
+        Thank you very much for your feature proposal!
+  - type: checkboxes
+    attributes:
+      label: Search before asking
+      description: >
+        Please search [issues](https://github.com/apache/fluss-rust/issues) to check if your issue has already been reported.
+      options:
+        - label: >
+            I searched in the [issues](https://github.com/apache/fluss-rust/issues) and found nothing similar.
+          required: true
+  - type: textarea
+    attributes:
+      label: Motivation
+      description: Please describe the feature and elaborate on the use case and motivation behind it
+    validations:
+      required: true
+  - type: textarea
+    attributes:
+      label: Solution
+      description: Describe the proposed solution and add related materials like links if any.
+  - type: textarea
+    attributes:
+      label: Anything else?
+  - type: checkboxes
+    attributes:
+      label: Willingness to contribute
+      description: >
+        We look forward to the community of developers or users helping develop Fluss features together. If you are willing to submit a PR to implement the feature, please check the box.
+      options:
+        - label: I'm willing to submit a PR!
+  - type: markdown
+    attributes:
+      value: "Thanks for completing our form!"
diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/task.yml b/fluss-rust/.github/ISSUE_TEMPLATE/task.yml
new file mode 100644
index 0000000000..70b5369a45
--- /dev/null
+++ b/fluss-rust/.github/ISSUE_TEMPLATE/task.yml
@@ -0,0 +1,51 @@
+################################################################################
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+################################################################################
+
+name: Task 📌
+description: Specific work item - either part of a larger feature or independent project maintenance
+type: "task"
+body:
+  - type: markdown
+    attributes:
+      value: |
+        Thank you very much for your work!
+  - type: checkboxes
+    attributes:
+      label: Search before asking
+      description: >
+        Please search [issues](https://github.com/apache/fluss-rust/issues) to check if your issue has already been reported.
+      options:
+        - label: >
+            I searched in the [issues](https://github.com/apache/fluss-rust/issues) and found nothing similar.
+          required: true
+  - type: textarea
+    attributes:
+      label: Description
+      description: Please describe the task and the purpose of the work.
+    validations:
+      required: true
+  - type: checkboxes
+    attributes:
+      label: Willingness to contribute
+      description: >
+        We look forward to the community of developers or users helping develop Fluss together. If you are willing to submit a PR to implement the task, please check the box.
+      options:
+        - label: I'm willing to submit a PR!
+  - type: markdown
+    attributes:
+      value: "Thanks for completing our form!"
diff --git a/fluss-rust/.github/PULL_REQUEST_TEMPLATE.md b/fluss-rust/.github/PULL_REQUEST_TEMPLATE.md
new file mode 100644
index 0000000000..5e03d8df9c
--- /dev/null
+++ b/fluss-rust/.github/PULL_REQUEST_TEMPLATE.md
@@ -0,0 +1,41 @@
+<!--
+*Thank you very much for contributing to Fluss - we are happy that you want to help us improve Fluss. To help the community review your contribution in the best possible way, please go through the checklist below, which will get the contribution into a shape in which it can be best reviewed.*
+
+## Contribution Checklist
+
+  - Make sure that the pull request corresponds to a [GitHub issue](https://github.com/apache/fluss-rust/issues). Exceptions are made for typos in doc comments or documentation files, which need no issue.
+
+  - Name the pull request in the format "[component] Title of the pull request", where *[component]* should be replaced by the name of the component being changed. Typically, this corresponds to the component label assigned to the issue (e.g., [kv], [log], [client], [flink]). Skip *[component]* if you are unsure about which is the best component.
+
+  - Fill out the template below to describe the changes contributed by the pull request. That will give reviewers the context they need to do the review.
+
+  - Make sure that the change passes the automated tests, i.e., `cargo test` passes.
+
+  - Each pull request should address only one issue, not mix up code from multiple issues.
+
+
+**(The sections below can be removed for hotfixes or typos)**
+-->
+
+### Purpose
+
+<!-- Linking this pull request to the issue -->
+Linked issue: close #xxx
+
+<!-- What is the purpose of the change -->
+
+### Brief change log
+
+<!-- Please describe the changes made in this pull request and explain how they address the issue -->
+
+### Tests
+
+<!-- List UT and IT cases to verify this change -->
+
+### API and Format
+
+<!-- Does this change affect API or storage format -->
+
+### Documentation
+
+<!-- Does this change introduce a new feature -->
diff --git a/fluss-rust/.gitignore b/fluss-rust/.gitignore
new file mode 100644
index 0000000000..0e51e8099b
--- /dev/null
+++ b/fluss-rust/.gitignore
@@ -0,0 +1,19 @@
+# Generated by Cargo
+# will have compiled files and executables
+debug/
+target/
+Cargo.lock
+
+# These are backup files generated by rustfmt
+**/*.rs.bk
+
+# MSVC Windows builds of rustc generate these, which store debugging information
+*.pdb
+
+# RustRover
+#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+#  and can be added to the global gitignore or merged into this file.  For a more nuclear
+#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
+.idea/
+.vscode/
\ No newline at end of file
diff --git a/fluss-rust/DISCLAIMER b/fluss-rust/DISCLAIMER
new file mode 100644
index 0000000000..ddc4f01632
--- /dev/null
+++ b/fluss-rust/DISCLAIMER
@@ -0,0 +1,10 @@
+Apache Fluss (incubating) is an effort undergoing incubation at The Apache
+Software Foundation (ASF), sponsored by the Apache Incubator PMC.
+
+Incubation is required of all newly accepted projects until a further review
+indicates that the infrastructure, communications, and decision making process
+have stabilized in a manner consistent with other successful ASF projects.
+
+While incubation status is not necessarily a reflection of the completeness
+or stability of the code, it does indicate that the project has yet to be
+fully endorsed by the ASF.
\ No newline at end of file
diff --git a/fluss-rust/LICENSE b/fluss-rust/LICENSE
new file mode 100644
index 0000000000..261eeb9e9f
--- /dev/null
+++ b/fluss-rust/LICENSE
@@ -0,0 +1,201 @@
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright [yyyy] [name of copyright owner]
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/fluss-rust/NOTICE b/fluss-rust/NOTICE
new file mode 100644
index 0000000000..1ec5da05df
--- /dev/null
+++ b/fluss-rust/NOTICE
@@ -0,0 +1,5 @@
+Apache Fluss Rust (incubating)
+Copyright 2025 The Apache Software Foundation
+
+This product includes software developed at
+The Apache Software Foundation (http://www.apache.org/).
\ No newline at end of file
diff --git a/fluss-rust/README.md b/fluss-rust/README.md
new file mode 100644
index 0000000000..6caaebb154
--- /dev/null
+++ b/fluss-rust/README.md
@@ -0,0 +1,138 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# Apache Fluss™ Rust (Incubating)
+
+![Experimental](https://img.shields.io/badge/status-experimental-orange)
+
+Rust implementation of [Apache Fluss™](https://fluss.apache.org/).
+
+
+## Why Fluss?
+[Fluss](https://fluss.apache.org/) is a streaming storage built for real-time analytics which can serve as the real-time data layer for Lakehouse architectures.
+It bridges the gap between streaming data and the data Lakehouse by enabling low-latency, high-throughput data ingestion and processing while seamlessly integrating with popular compute engines.
+
+## Why Fluss Rust Client
+It's an unofficial experimental Rust client for interacting with Fluss. This client provides foundational capabilities for table management and log streaming operations, enabling developers to explore Fluss within Rust ecosystems.
+
+## Quick-Start
+
+### Step1 Start Fluss cluster
+#### Requirements
+Fluss runs on all UNIX-like environments, e.g. Linux, Mac OS X. Before you start to set up the system, make sure you have the following software installed on your test machine:
+
+Java 17 or higher (Java 8 and Java 11 are not recommended)
+If your cluster does not fulfill these software requirements you will need to install/upgrade it.
+
+Fluss requires the JAVA_HOME environment variable to be set on all nodes and point to the directory of your Java installation.
+
+#### Fluss Setup
+Go to the [downloads](https://fluss.apache.org/downloads/) page and download a Fluss binary release. Make sure to pick the Fluss package matching your Java version. After downloading the release, extract it (the commands below use `fluss-0.7-SNAPSHOT`; substitute the version you downloaded):
+```shell
+tar -xzf fluss-0.7-SNAPSHOT-bin.tgz
+cd fluss-0.7-SNAPSHOT/
+```
+You can start Fluss local cluster by running the following command:
+```shell
+./bin/local-cluster.sh start
+```
+After that, the Fluss local cluster is started.
+
+### Run Provided Example
+Only Linux and macOS are supported. You will need to [install Rust](https://www.rust-lang.org/tools/install) first.
+
+After that, go to the project directory, build it and run the example:
+```shell
+cargo build --example example-table --release
+cd target/release/examples
+./example-table
+```
+The example code is as follows:
+```rust
+#[tokio::main]
+pub async fn main() -> Result<()> {
+    // 1: connect to the cluster and create the table
+    let mut args = Args::default();
+    args.bootstrap_server = "127.0.0.1:9123".to_string();
+    let conn_config = ConnectionConfig::from_args(args);
+    let conn = FlussConnection::new(conn_config).await;
+
+    let admin = conn.get_admin();
+
+    let table_descriptor = TableDescriptor::builder()
+        .schema(
+            Schema::builder()
+                .column("c1", DataTypes::int())
+                .column("c2", DataTypes::string())
+                .build(),
+        )
+        .build();
+
+    let table_path = TablePath::new("fluss".to_owned(), "rust_test".to_owned());
+
+    admin
+        .create_table(&table_path, &table_descriptor, true)
+        .await
+        .unwrap();
+
+    // 2: get the table
+    let table_info = admin.get_table(&table_path).await.unwrap();
+    print!("Get created table:\n {}\n", table_info);
+
+    // wait 2 seconds for the leader to become ready (async sleep, so the runtime thread is not blocked)
+    tokio::time::sleep(Duration::from_secs(2)).await;
+
+    // 3: append log to the table
+    let table = conn.get_table(&table_path).await;
+    let append_writer = table.new_append().create_writer();
+    let batch = record_batch!(("c1", Int32, [1, 2, 3, 4, 5, 6]), ("c2", Utf8, ["a1", "a2", "a3", "a4", "a5", "a6"])).unwrap();
+    append_writer.append(batch).await?;
+    println!("Start to scan log records......");
+    // 4: scan the records
+    let log_scanner = table.new_scan().create_log_scanner();
+    log_scanner.subscribe(0, 0).await;
+
+    // poll forever: the loop never breaks, so `main` only returns through a `?` error
+    loop {
+        let scan_records = log_scanner.poll(Duration::from_secs(10)).await?;
+        println!("Start to poll records......");
+        for record in scan_records {
+            let row = record.row();
+            println!(
+                "{{{}, {}}}@{}",
+                row.get_int(0),
+                row.get_string(1),
+                record.offset()
+            );
+        }
+    }
+}
+```
+
+You can change it according to your needs, have fun!
+
+#### Clear environment
+When you are done, stop your Fluss cluster: go to your Fluss home directory and run the following command:
+```shell
+./bin/local-cluster.sh stop
+```
+
+
+## License
+
+Licensed under the [Apache License, Version 2.0](http://www.apache.org/licenses/LICENSE-2.0)
\ No newline at end of file

From 2ab9022c1ec609c195ae28e3fbf852700e66449c Mon Sep 17 00:00:00 2001
From: Jark Wu <jark@apache.org>
Date: Mon, 25 Aug 2025 17:32:17 +0800
Subject: [PATCH 002/287] Initial Commit

---
 fluss-rust/.DS_Store  | Bin 6148 -> 0 bytes
 fluss-rust/.gitignore |   1 +
 2 files changed, 1 insertion(+)
 delete mode 100644 fluss-rust/.DS_Store

diff --git a/fluss-rust/.DS_Store b/fluss-rust/.DS_Store
deleted file mode 100644
index aa422df10c54b59dcb4bd4dcfc37bcac4de3fc93..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 6148
zcmeHKO>fgc5S>j!VpAdI08%eVmbg|SK&gbdIA4cK1*Euw1E3J&sI_ptRpO9C6v=1!
zF<kj2{2h3+yG4xymmUzRW~A9SyE|{a`<(20iAePp$s?i`5qWUNnvdcS#{KMDR&y;4
zpfY2e(SqW5IlqXrt!!!d9~Izt*Q7R`Qc49~d4D=a&-eHuOXo$W^F!5k>bDwAuj%c2
z@1rxljEYIInD-{Lw_H2XI*TvkN&GsUF2}9AeVrGRG@s54Ax)-8dG{vG6TR%|MV`zJ
zH?kd`@A>1_-fH!<)7cLW4iDD*!Rpy#j-MQ^*S>e}!NcdH@u%!O*I%rZ3cosIcN|{A
zR|J(+eU4^%rt?$uFzYrA=!hcf(=l}sy`UkDjxzl*&dkdB57C9Ue;Px?BOW8OkIa`~
z4lCK;D%lNWy`mG#*vwV;E4e<6FlrZb;(4^`oRSKIS9EnQsEUaKqJSuHZ3W!!>Fr*7
z1R;t7qQFg6fcJ+0&KNo@Et;(Zg}DL%>u5HHm_MDE6F3YVmKM<iQ<e&}ROPN1%F@vu
zxV+F|Y0=V2xyy%gPgd@RqRi7Veqho`g%+h01w?^O1$Jz;#pnO<@Av;rlGH>2QQ$@?
zpz4EY(8H44*}AnjK5GN`2RIw&l@@<f5SXJFxqKAw!HuCk-~bppEG?o1CLaPu1}Q{=
Hf2zPQka~Qh

diff --git a/fluss-rust/.gitignore b/fluss-rust/.gitignore
index 0e51e8099b..c6edfb706d 100644
--- a/fluss-rust/.gitignore
+++ b/fluss-rust/.gitignore
@@ -1,3 +1,4 @@
+.DS_Store
 # Generated by Cargo
 # will have compiled files and executables
 debug/

From c912ccd7ce4228451b966f1ab78a0a64caba1591 Mon Sep 17 00:00:00 2001
From: Jark Wu <jark@apache.org>
Date: Mon, 25 Aug 2025 17:35:53 +0800
Subject: [PATCH 003/287] [github] Update GitHub issue template

---
 fluss-rust/.github/ISSUE_TEMPLATE/bug.yml     | 4 ++--
 fluss-rust/.github/ISSUE_TEMPLATE/feature.yml | 4 ++--
 fluss-rust/.github/ISSUE_TEMPLATE/task.yml    | 4 ++--
 3 files changed, 6 insertions(+), 6 deletions(-)

diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml b/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml
index 43fbc90d8b..aadd86da4e 100644
--- a/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml
+++ b/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml
@@ -28,10 +28,10 @@ body:
     attributes:
       label: Search before asking
       description: >
-        Please search [issues](https://github.com/apache/fluss-benchmarks/issues) to check if your issue has already been reported.
+        Please search [issues](https://github.com/apache/fluss-rust/issues) to check if your issue has already been reported.
       options:
         - label: >
-            I searched in the [issues](https://github.com/apache/fluss-benchmarks/issues) and found nothing similar.
+            I searched in the [issues](https://github.com/apache/fluss-rust/issues) and found nothing similar.
           required: true
   - type: textarea
     attributes:
diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml b/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml
index fc7357165d..9f08a60008 100644
--- a/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml
+++ b/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml
@@ -28,10 +28,10 @@ body:
     attributes:
       label: Search before asking
       description: >
-        Please search [issues](https://github.com/apache/fluss-benchmarks/issues) to check if your issue has already been reported.
+        Please search [issues](https://github.com/apache/fluss-rust/issues) to check if your issue has already been reported.
       options:
         - label: >
-            I searched in the [issues](https://github.com/apache/fluss-benchmarks/issues) and found nothing similar.
+            I searched in the [issues](https://github.com/apache/fluss-rust/issues) and found nothing similar.
           required: true
   - type: textarea
     attributes:
diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/task.yml b/fluss-rust/.github/ISSUE_TEMPLATE/task.yml
index 70b5369a45..dddc621f28 100644
--- a/fluss-rust/.github/ISSUE_TEMPLATE/task.yml
+++ b/fluss-rust/.github/ISSUE_TEMPLATE/task.yml
@@ -28,10 +28,10 @@ body:
     attributes:
       label: Search before asking
       description: >
-        Please search [issues](https://github.com/apache/fluss-benchmarks/issues) to check if your issue has already been reported.
+        Please search [issues](https://github.com/apache/fluss-rust/issues) to check if your issue has already been reported.
       options:
         - label: >
-            I searched in the [issues](https://github.com/apache/fluss-benchmarks/issues) and found nothing similar.
+            I searched in the [issues](https://github.com/apache/fluss-rust/issues) and found nothing similar.
           required: true
   - type: textarea
     attributes:

From f83b32ca6b89c721735c133a7041cb88b2f48ac1 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Tue, 26 Aug 2025 20:51:06 +0800
Subject: [PATCH 004/287] [feat] Support basic write & read (#2)

---
 fluss-rust/.github/dependabot.yml             |  30 +
 fluss-rust/.github/workflows/ci.yml           |  94 ++
 fluss-rust/Cargo.toml                         |  36 +
 fluss-rust/copyright.txt                      |  17 +
 fluss-rust/crates/examples/Cargo.toml         |  34 +
 .../crates/examples/src/example_table.rs      |  86 ++
 fluss-rust/crates/fluss/Cargo.toml            |  55 ++
 fluss-rust/crates/fluss/src/build.rs          |  23 +
 fluss-rust/crates/fluss/src/client/admin.rs   |  93 ++
 .../crates/fluss/src/client/connection.rs     |  82 ++
 .../crates/fluss/src/client/metadata.rs       | 109 +++
 fluss-rust/crates/fluss/src/client/mod.rs     |  26 +
 .../crates/fluss/src/client/table/append.rs   |  69 ++
 .../crates/fluss/src/client/table/mod.rs      |  73 ++
 .../crates/fluss/src/client/table/scanner.rs  | 370 +++++++
 .../crates/fluss/src/client/table/writer.rs   |  88 ++
 .../fluss/src/client/write/accumulator.rs     | 442 +++++++++
 .../crates/fluss/src/client/write/batch.rs    | 176 ++++
 .../fluss/src/client/write/broadcast.rs       | 119 +++
 .../fluss/src/client/write/bucket_assigner.rs | 102 ++
 .../crates/fluss/src/client/write/mod.rs      |  68 ++
 .../crates/fluss/src/client/write/sender.rs   | 207 ++++
 .../fluss/src/client/write/writer_client.rs   | 147 +++
 .../crates/fluss/src/cluster/cluster.rs       | 243 +++++
 fluss-rust/crates/fluss/src/cluster/mod.rs    |  99 ++
 fluss-rust/crates/fluss/src/config.rs         |  39 +
 fluss-rust/crates/fluss/src/error.rs          |  50 +
 fluss-rust/crates/fluss/src/lib.rs            |  37 +
 .../crates/fluss/src/metadata/datatype.rs     | 814 ++++++++++++++++
 .../crates/fluss/src/metadata/json_serde.rs   | 464 +++++++++
 fluss-rust/crates/fluss/src/metadata/mod.rs   |  24 +
 fluss-rust/crates/fluss/src/metadata/table.rs | 920 ++++++++++++++++++
 .../crates/fluss/src/proto/fluss_api.proto    | 197 ++++
 fluss-rust/crates/fluss/src/record/arrow.rs   | 545 +++++++++++
 fluss-rust/crates/fluss/src/record/error.rs   |  27 +
 fluss-rust/crates/fluss/src/record/mod.rs     | 174 ++++
 fluss-rust/crates/fluss/src/row/column.rs     | 169 ++++
 fluss-rust/crates/fluss/src/row/datum.rs      | 287 ++++++
 fluss-rust/crates/fluss/src/row/mod.rs        | 148 +++
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |  54 +
 .../crates/fluss/src/rpc/api_version.rs       |  54 +
 fluss-rust/crates/fluss/src/rpc/convert.rs    |  43 +
 fluss-rust/crates/fluss/src/rpc/error.rs      |  50 +
 fluss-rust/crates/fluss/src/rpc/frame.rs      | 106 ++
 .../fluss/src/rpc/message/create_table.rs     |  62 ++
 .../crates/fluss/src/rpc/message/fetch.rs     |  56 ++
 .../crates/fluss/src/rpc/message/get_table.rs |  54 +
 .../crates/fluss/src/rpc/message/header.rs    |  73 ++
 .../crates/fluss/src/rpc/message/mod.rs       |  97 ++
 .../fluss/src/rpc/message/produce_log.rs      |  71 ++
 .../fluss/src/rpc/message/update_metadata.rs  |  60 ++
 fluss-rust/crates/fluss/src/rpc/mod.rs        |  31 +
 .../crates/fluss/src/rpc/server_connection.rs | 402 ++++++++
 fluss-rust/crates/fluss/src/rpc/transport.rs  |  83 ++
 fluss-rust/crates/fluss/src/util/mod.rs       | 176 ++++
 .../fluss/tests/integration/client/mod.rs     |  21 +
 fluss-rust/crates/fluss/tests/test_fluss.rs   |  25 +
 fluss-rust/rust-toolchain.toml                |  20 +
 fluss-rust/rustfmt.toml                       |  19 +
 59 files changed, 8340 insertions(+)
 create mode 100644 fluss-rust/.github/dependabot.yml 
 create mode 100644 fluss-rust/.github/workflows/ci.yml
 create mode 100644 fluss-rust/Cargo.toml
 create mode 100644 fluss-rust/copyright.txt
 create mode 100644 fluss-rust/crates/examples/Cargo.toml
 create mode 100644 fluss-rust/crates/examples/src/example_table.rs
 create mode 100644 fluss-rust/crates/fluss/Cargo.toml
 create mode 100644 fluss-rust/crates/fluss/src/build.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/admin.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/connection.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/metadata.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/table/append.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/table/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/table/scanner.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/table/writer.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/write/accumulator.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/write/batch.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/write/broadcast.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/write/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/write/sender.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/write/writer_client.rs
 create mode 100644 fluss-rust/crates/fluss/src/cluster/cluster.rs
 create mode 100644 fluss-rust/crates/fluss/src/cluster/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/config.rs
 create mode 100644 fluss-rust/crates/fluss/src/error.rs
 create mode 100644 fluss-rust/crates/fluss/src/lib.rs
 create mode 100644 fluss-rust/crates/fluss/src/metadata/datatype.rs
 create mode 100644 fluss-rust/crates/fluss/src/metadata/json_serde.rs
 create mode 100644 fluss-rust/crates/fluss/src/metadata/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/metadata/table.rs
 create mode 100644 fluss-rust/crates/fluss/src/proto/fluss_api.proto
 create mode 100644 fluss-rust/crates/fluss/src/record/arrow.rs
 create mode 100644 fluss-rust/crates/fluss/src/record/error.rs
 create mode 100644 fluss-rust/crates/fluss/src/record/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/column.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/datum.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/api_key.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/api_version.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/convert.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/error.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/frame.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/create_table.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/fetch.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/get_table.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/header.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/server_connection.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/transport.rs
 create mode 100644 fluss-rust/crates/fluss/src/util/mod.rs
 create mode 100644 fluss-rust/crates/fluss/tests/integration/client/mod.rs
 create mode 100644 fluss-rust/crates/fluss/tests/test_fluss.rs
 create mode 100644 fluss-rust/rust-toolchain.toml
 create mode 100644 fluss-rust/rustfmt.toml

diff --git a/fluss-rust/.github/dependabot.yml  b/fluss-rust/.github/dependabot.yml 
new file mode 100644
index 0000000000..7c12d72c0c
--- /dev/null
+++ b/fluss-rust/.github/dependabot.yml 	
@@ -0,0 +1,30 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+version: 2
+updates:
+  # Maintain dependencies for GitHub Actions
+  - package-ecosystem: "github-actions"
+    directory: "/"
+    schedule:
+      interval: "monthly"
+
+  # Maintain dependencies for rust
+  - package-ecosystem: "cargo"
+    directory: "/"
+    schedule:
+      interval: "monthly"
\ No newline at end of file
diff --git a/fluss-rust/.github/workflows/ci.yml b/fluss-rust/.github/workflows/ci.yml
new file mode 100644
index 0000000000..26616292b5
--- /dev/null
+++ b/fluss-rust/.github/workflows/ci.yml
@@ -0,0 +1,94 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+name: CI
+
+on:
+  push:
+    branches:
+      - main
+  pull_request:
+    branches:
+      - main
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
+  cancel-in-progress: true
+
+jobs:
+  check:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Check License Header
+        uses: apache/skywalking-eyes/header@v0.6.0
+
+      - name: Install protoc
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - name: Format
+        run: cargo fmt --all -- --check
+
+      - name: Clippy
+        run: cargo clippy --all-targets --workspace -- -D warnings
+
+  build:
+    runs-on: ${{ matrix.os }}
+    strategy:
+      matrix:
+        os:
+          - ubuntu-latest
+          - macos-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install protoc
+        run: |
+          if [ "$RUNNER_OS" == "Linux" ]; then
+            sudo apt-get update && sudo apt-get install -y protobuf-compiler
+          elif [ "$RUNNER_OS" == "macOS" ]; then
+            brew install protobuf
+          fi
+      - name: Build
+        run: cargo build
+
+  test:
+    runs-on: ${{ matrix.os }}
+    strategy:
+      matrix:
+        os:
+          - ubuntu-latest
+          - macos-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install protoc
+        run: |
+          if [ "$RUNNER_OS" == "Linux" ]; then
+            sudo apt-get update && sudo apt-get install -y protobuf-compiler
+          elif [ "$RUNNER_OS" == "macOS" ]; then
+            brew install protobuf
+          fi
+      - name: Unit Test
+        run: cargo test --all-targets --workspace
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
+      - name: Integration Test
+        run: cargo test --features integration_tests --all-targets --workspace
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
\ No newline at end of file
diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
new file mode 100644
index 0000000000..059236fccf
--- /dev/null
+++ b/fluss-rust/Cargo.toml
@@ -0,0 +1,36 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[workspace.package]
+categories = ["command-line-utilities"]
+description = "The rust implementation of fluss"
+repository = "https://github.com/apache/fluss-rust"
+# `name` is not an inheritable [workspace.package] key; each member crate declares its own name.
+edition = "2024"
+version = "0.1.0"
+license = "Apache-2.0"
+rust-version = "1.85"
+
+
+[workspace]
+resolver = "2"
+members = ["crates/fluss", "crates/examples"]
+
+[workspace.dependencies]
+fluss = { version = "0.1.0", path = "./crates/fluss" }
+tokio = { version = "1.44.2", features = ["full"] }
+clap = { version = "4.5.37", features = ["derive"] }
\ No newline at end of file
diff --git a/fluss-rust/copyright.txt b/fluss-rust/copyright.txt
new file mode 100644
index 0000000000..d5519133ed
--- /dev/null
+++ b/fluss-rust/copyright.txt
@@ -0,0 +1,17 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
\ No newline at end of file
diff --git a/fluss-rust/crates/examples/Cargo.toml b/fluss-rust/crates/examples/Cargo.toml
new file mode 100644
index 0000000000..82d864f818
--- /dev/null
+++ b/fluss-rust/crates/examples/Cargo.toml
@@ -0,0 +1,34 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[package]
+edition = { workspace = true }
+license = { workspace = true }
+name = "fluss-examples"
+rust-version = { workspace = true }
+version = { workspace = true }
+
+
+[dependencies]
+fluss = { workspace = true }
+tokio = { workspace = true }
+clap = { workspace = true}
+
+
+[[example]]
+name = "example-table"
+path = "src/example_table.rs"
\ No newline at end of file
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
new file mode 100644
index 0000000000..3eb8dd867f
--- /dev/null
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -0,0 +1,86 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use clap::Parser;
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+use fluss::error::Result;
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+use fluss::row::{GenericRow, InternalRow};
+use std::time::Duration;
+use tokio::try_join;
+
+#[tokio::main]
+pub async fn main() -> Result<()> {
+    let mut config = Config::parse();
+    // Keep a bootstrap server that is already set; else use the README quick-start address.
+    if config.bootstrap_server.is_none() {
+        config.bootstrap_server = Some("127.0.0.1:9123".to_string());
+    }
+    let conn = FlussConnection::new(config).await?;
+
+    // 1: create the table (the `true` argument is `ignore_if_exists`)
+    let table_descriptor = TableDescriptor::builder()
+        .schema(
+            Schema::builder()
+                .column("c1", DataTypes::int())
+                .column("c2", DataTypes::string())
+                .build()?,
+        )
+        .build()?;
+    let table_path = TablePath::new("fluss".to_owned(), "rust_test".to_owned());
+    let admin = conn.get_admin().await?;
+    admin
+        .create_table(&table_path, &table_descriptor, true)
+        .await?;
+
+    // 2: get the table
+    let table_info = admin.get_table(&table_path).await?;
+    print!("Get created table:\n {table_info}\n");
+
+    // 3: append two rows; both append futures are awaited together with the flush
+    let mut row = GenericRow::new();
+    row.set_field(0, 22222);
+    row.set_field(1, "t2t");
+
+    let table = conn.get_table(&table_path).await?;
+    let append_writer = table.new_append()?.create_writer();
+    let f1 = append_writer.append(row);
+    row = GenericRow::new();
+    row.set_field(0, 233333);
+    row.set_field(1, "tt44");
+    let f2 = append_writer.append(row);
+    try_join!(f1, f2, append_writer.flush())?;
+
+    // 4: scan the rows back
+    let log_scanner = table.new_scan().create_log_scanner();
+    log_scanner.subscribe(0, 0).await?;
+    // Poll forever: the loop never breaks, so `main` only returns through a `?` error.
+    loop {
+        let scan_records = log_scanner.poll(Duration::from_secs(10)).await?;
+        println!("Start to poll records......");
+        for record in scan_records {
+            let row = record.row();
+            println!(
+                "{{{}, {}}}@{}",
+                row.get_int(0),
+                row.get_string(1),
+                record.offset()
+            );
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
new file mode 100644
index 0000000000..cc26014a46
--- /dev/null
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -0,0 +1,55 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[package]
+edition = { workspace = true }
+rust-version = { workspace = true }
+version = { workspace = true }
+name = "fluss"
+build = "src/build.rs"
+
+[dependencies]
+arrow = "55.1.0"
+arrow-schema = "55.1.0"
+byteorder = "1.5"
+futures = "0.3"
+clap = { workspace = true }
+crc32c = "0.6.8"
+linked-hash-map = "0.5.6"
+prost = "0.13.5"
+rand = "0.9.1"
+serde = { version = "1.0.219", features = ["derive", "rc"] }
+serde_json = "1.0.140"
+thiserror = "1.0"
+tracing = "0.1"
+tokio = { workspace = true }
+parking_lot = "0.12"
+bytes = "1.10.1"
+dashmap = "6.1.0"
+rust_decimal = "1"
+ordered-float = { version = "4", features = ["serde"] }
+parse-display = "0.10"
+ref-cast = "1.0"
+chrono = { version = "0.4", features = ["clock", "std", "wasmbind"] }
+
+
+[features]
+integration_tests = []
+
+
+[build-dependencies]
+prost-build = {  version = "0.13.5"  }
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/src/build.rs b/fluss-rust/crates/fluss/src/build.rs
new file mode 100644
index 0000000000..a83cd056b5
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/build.rs
@@ -0,0 +1,23 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use std::io::Result;
+
+/// Build script entry point: compiles `src/proto/fluss_api.proto` with prost-build.
+fn main() -> Result<()> {
+    prost_build::compile_protos(&["src/proto/fluss_api.proto"], &["src/proto"])
+}
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
new file mode 100644
index 0000000000..8688a2d844
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -0,0 +1,93 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::metadata::Metadata;
+use crate::metadata::{JsonSerde, TableDescriptor, TableInfo, TablePath};
+use crate::rpc::message::{CreateTableRequest, GetTableRequest};
+use crate::rpc::{RpcClient, ServerConnection};
+use std::sync::Arc;
+
+use crate::error::Result;
+use crate::proto::GetTableInfoResponse;
+
+#[allow(dead_code)]
+pub struct FlussAdmin {
+    admin_gateway: ServerConnection,
+    metadata: Arc<Metadata>,
+    rpc_client: Arc<RpcClient>,
+}
+
+impl FlussAdmin {
+    /// Opens the admin gateway: a connection to the coordinator in the cached metadata.
+    ///
+    /// Panics if the cached cluster has no coordinator server.
+    pub async fn new(connections: Arc<RpcClient>, metadata: Arc<Metadata>) -> Result<Self> {
+        let cluster = metadata.get_cluster();
+        let coordinator = cluster
+            .get_coordinator_server()
+            .expect("Couldn't find coordinator server");
+        let admin_con = connections.get_connection(coordinator).await?;
+
+        Ok(FlussAdmin {
+            admin_gateway: admin_con,
+            metadata,
+            rpc_client: connections,
+        })
+    }
+
+    /// Sends a `CreateTableRequest` for `table_path` through the admin gateway.
+    ///
+    /// `ignore_if_exists` is forwarded to the request unchanged. The response body is
+    /// discarded, so only request-construction and RPC errors are reported.
+    pub async fn create_table(
+        &self,
+        table_path: &TablePath,
+        table_descriptor: &TableDescriptor,
+        ignore_if_exists: bool,
+    ) -> Result<()> {
+        let request = CreateTableRequest::new(table_path, table_descriptor, ignore_if_exists)?;
+
+        // Only success or failure matters here; the reply carries nothing we use.
+        let _reply = self.admin_gateway.request(request).await?;
+        Ok(())
+    }
+
+    /// Fetches the table's metadata through the admin gateway and decodes its descriptor.
+    ///
+    /// Panics if `serde_json` cannot parse the `table_json` payload of the response.
+    pub async fn get_table(&self, table_path: &TablePath) -> Result<TableInfo> {
+        let request = GetTableRequest::new(table_path);
+        let GetTableInfoResponse {
+            table_id,
+            schema_id,
+            table_json,
+            created_time,
+            modified_time,
+        } = self.admin_gateway.request(request).await?;
+        let raw_json: &[u8] = &table_json[..];
+        let table_descriptor =
+            TableDescriptor::deserialize_json(&serde_json::from_slice(raw_json).unwrap())?;
+        Ok(TableInfo::of(
+            table_path.clone(),
+            table_id,
+            schema_id,
+            table_descriptor,
+            created_time,
+            modified_time,
+        ))
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
new file mode 100644
index 0000000000..899ad597c1
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -0,0 +1,82 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::WriterClient;
+use crate::client::admin::FlussAdmin;
+use crate::client::metadata::Metadata;
+use crate::client::table::FlussTable;
+use crate::config::Config;
+use crate::rpc::RpcClient;
+use parking_lot::RwLock;
+use std::sync::Arc;
+
+use crate::error::Result;
+use crate::metadata::TablePath;
+
+pub struct FlussConnection {
+    metadata: Arc<Metadata>,
+    network_connects: Arc<RpcClient>,
+    args: Config,
+    writer_client: RwLock<Option<Arc<WriterClient>>>,
+}
+
+impl FlussConnection {
+    /// Bootstraps cluster metadata from `arg.bootstrap_server` and builds the connection.
+    pub async fn new(arg: Config) -> Result<Self> {
+        let connections = Arc::new(RpcClient::new());
+        let bootstrap = arg
+            .bootstrap_server
+            .as_ref()
+            .expect("Config::bootstrap_server must be set");
+        let metadata = Metadata::new(bootstrap.as_str(), connections.clone()).await?;
+        Ok(FlussConnection {
+            metadata: Arc::new(metadata),
+            network_connects: connections,
+            args: arg,
+            writer_client: Default::default(),
+        })
+    }
+
+    pub fn get_metadata(&self) -> Arc<Metadata> {
+        self.metadata.clone()
+    }
+
+    pub fn get_connections(&self) -> Arc<RpcClient> {
+        self.network_connects.clone()
+    }
+
+    pub async fn get_admin(&self) -> Result<FlussAdmin> {
+        FlussAdmin::new(self.network_connects.clone(), self.metadata.clone()).await
+    }
+
+    pub fn get_or_create_writer_client(&self) -> Result<Arc<WriterClient>> {
+        // Check and create under one write lock so racing callers share a single client.
+        let mut slot = self.writer_client.write();
+        if let Some(client) = slot.as_ref() {
+            return Ok(client.clone());
+        }
+        let client = Arc::new(WriterClient::new(self.args.clone(), self.metadata.clone())?);
+        *slot = Some(client.clone());
+        Ok(client)
+    }
+
+    pub async fn get_table(&self, table_path: &TablePath) -> Result<FlussTable<'_>> {
+        self.metadata.update_table_metadata(table_path).await?;
+        let table_info = self.metadata.get_cluster().get_table(table_path).clone();
+        Ok(FlussTable::new(self, self.metadata.clone(), table_info))
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
new file mode 100644
index 0000000000..ebfb959f65
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -0,0 +1,109 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::cluster::{Cluster, ServerNode, ServerType};
+use crate::metadata::{TableBucket, TablePath};
+use crate::rpc::{RpcClient, ServerConnection, UpdateMetadataRequest};
+use parking_lot::RwLock;
+use std::collections::HashSet;
+use std::net::SocketAddr;
+use std::sync::Arc;
+
+use crate::error::Result;
+use crate::proto::MetadataResponse;
+
+#[derive(Default)]
+pub struct Metadata {
+    cluster: RwLock<Arc<Cluster>>,
+    connections: Arc<RpcClient>,
+}
+
+impl Metadata {
+    /// Builds the metadata cache from the cluster returned by `init_cluster(boot_strap)`.
+    pub async fn new(boot_strap: &str, connections: Arc<RpcClient>) -> Result<Self> {
+        // Share the RPC client: one handle for the bootstrap call, one kept in the cache.
+        let initial = Self::init_cluster(boot_strap, Arc::clone(&connections)).await?;
+        let cluster = RwLock::new(Arc::new(initial));
+        Ok(Metadata { cluster, connections })
+    }
+
+    async fn init_cluster(boot_strap: &str, connections: Arc<RpcClient>) -> Result<Cluster> {
+        let addr: SocketAddr = boot_strap.parse().expect("bootstrap server must be ip:port");
+        let server_node = ServerNode::new(
+            -1,
+            addr.ip().to_string(),
+            u32::from(addr.port()),
+            ServerType::CoordinatorServer,
+        );
+        let con = connections.get_connection(&server_node).await?;
+        let response = con.request(UpdateMetadataRequest::new(&[])).await?;
+        Cluster::from_metadata_response(response, None)
+    }
+
+    /// Replaces the cached cluster with one rebuilt from `metadata_response`.
+    pub async fn update(&self, metadata_response: MetadataResponse) -> Result<()> {
+        // Take the snapshot in its own statement so the read guard is gone before rebuilding.
+        let previous = self.cluster.read().clone();
+        let rebuilt = Cluster::from_metadata_response(metadata_response, Some(&previous))?;
+        *self.cluster.write() = Arc::new(rebuilt);
+        Ok(())
+    }
+
+    /// Requests metadata for `table_paths` from the server picked by
+    /// `get_one_available_server` and applies the response to the cache.
+    pub async fn update_tables_metadata(&self, table_paths: &HashSet<&TablePath>) -> Result<()> {
+        // Clone the node in one statement so the read guard is dropped before awaiting.
+        let server = self.cluster.read().get_one_available_server().clone();
+        let conn = self.connections.get_connection(&server).await?;
+        let paths: Vec<&TablePath> = table_paths.iter().copied().collect();
+        let request = UpdateMetadataRequest::new(paths.as_slice());
+        let response = conn.request(request).await?;
+        self.update(response).await
+    }
+
+    pub async fn update_table_metadata(&self, table_path: &TablePath) -> Result<()> {
+        let only_path = HashSet::from([table_path]);
+        self.update_tables_metadata(&only_path).await
+    }
+
+    /// Refreshes metadata for those `table_paths` the cached cluster has no entry for.
+    pub async fn check_and_update_table_metadata(&self, table_paths: &[TablePath]) -> Result<()> {
+        let snapshot = self.cluster.read().clone();
+        let missing: HashSet<&TablePath> = table_paths
+            .iter()
+            .filter(|path| snapshot.opt_get_table(path).is_none())
+            .collect();
+        if missing.is_empty() {
+            return Ok(());
+        }
+        self.update_tables_metadata(&missing).await
+    }
+
+    pub async fn get_connection(&self, server_node: &ServerNode) -> Result<ServerConnection> {
+        let result = self.connections.get_connection(server_node).await?;
+        Ok(result)
+    }
+
+    /// Returns an `Arc` handle to the currently cached cluster.
+    pub fn get_cluster(&self) -> Arc<Cluster> {
+        self.cluster.read().clone()
+    }
+
+    pub fn leader_for(&self, _table_bucket: &TableBucket) -> Option<&ServerNode> {
+        todo!()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/mod.rs b/fluss-rust/crates/fluss/src/client/mod.rs
new file mode 100644
index 0000000000..5b6908eec1
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/mod.rs
@@ -0,0 +1,26 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+mod admin;
+mod connection;
+mod table;
+mod write;
+
+pub use connection::*;
+mod metadata;
+
+pub use write::*;
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
new file mode 100644
index 0000000000..bf15266706
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -0,0 +1,69 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::{WriteRecord, WriterClient};
+use crate::metadata::{TableInfo, TablePath};
+use crate::row::GenericRow;
+use std::sync::Arc;
+
+use crate::error::Result;
+
+#[allow(dead_code)]
+pub struct TableAppend {
+    table_path: TablePath,
+    table_info: TableInfo,
+    writer_client: Arc<WriterClient>,
+}
+
+impl TableAppend {
+    pub(super) fn new(
+        table_path: TablePath,
+        table_info: TableInfo,
+        writer_client: Arc<WriterClient>,
+    ) -> Self {
+        Self {
+            table_path,
+            table_info,
+            writer_client,
+        }
+    }
+
+    pub fn create_writer(&self) -> AppendWriter {
+        AppendWriter {
+            table_path: Arc::new(self.table_path.clone()),
+            writer_client: self.writer_client.clone(),
+        }
+    }
+}
+
+pub struct AppendWriter {
+    table_path: Arc<TablePath>,
+    writer_client: Arc<WriterClient>,
+}
+
+impl AppendWriter {
+    pub async fn append(&self, row: GenericRow<'_>) -> Result<()> {
+        let record = WriteRecord::new(self.table_path.clone(), row);
+        let result_handle = self.writer_client.send(&record).await?;
+        let result = result_handle.wait().await?;
+        result_handle.result(result)
+    }
+
+    pub async fn flush(&self) -> Result<()> {
+        self.writer_client.flush().await
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
new file mode 100644
index 0000000000..503a1edb39
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -0,0 +1,73 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::connection::FlussConnection;
+use crate::client::metadata::Metadata;
+use crate::client::table::append::TableAppend;
+use crate::client::table::scanner::TableScan;
+use crate::metadata::{TableInfo, TablePath};
+use std::sync::Arc;
+
+use crate::error::Result;
+
+mod append;
+
+mod scanner;
+mod writer;
+
+#[allow(dead_code)]
+pub struct FlussTable<'a> {
+    conn: &'a FlussConnection,
+    metadata: Arc<Metadata>,
+    table_info: TableInfo,
+    table_path: TablePath,
+    has_primary_key: bool,
+}
+
+impl<'a> FlussTable<'a> {
+    pub fn new(conn: &'a FlussConnection, metadata: Arc<Metadata>, table_info: TableInfo) -> Self {
+        FlussTable {
+            conn,
+            table_path: table_info.table_path.clone(),
+            has_primary_key: table_info.has_primary_key(),
+            table_info,
+            metadata,
+        }
+    }
+
+    pub fn get_table_info(&self) -> &TableInfo {
+        &self.table_info
+    }
+
+    pub fn new_append(&self) -> Result<TableAppend> {
+        Ok(TableAppend::new(
+            self.table_path.clone(),
+            self.table_info.clone(),
+            self.conn.get_or_create_writer_client()?,
+        ))
+    }
+
+    pub fn new_scan(&self) -> TableScan<'_> {
+        TableScan::new(self.conn, self.table_info.clone(), self.metadata.clone())
+    }
+}
+
+impl<'a> Drop for FlussTable<'a> {
+    fn drop(&mut self) {
+        // do-nothing now
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
new file mode 100644
index 0000000000..41fb17e8c8
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -0,0 +1,370 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::connection::FlussConnection;
+use crate::client::metadata::Metadata;
+use crate::error::Result;
+use crate::metadata::{TableBucket, TableInfo, TablePath};
+use crate::proto::{FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
+use crate::record::{LogRecordsBatchs, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
+use crate::rpc::RpcClient;
+use crate::util::FairBucketStatusMap;
+use parking_lot::RwLock;
+use std::collections::HashMap;
+use std::slice::from_ref;
+use std::sync::Arc;
+use std::time::Duration;
+
+const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
+#[allow(dead_code)]
+const LOG_FETCH_MAX_BYTES_FOR_BUCKET: i32 = 1024;
+const LOG_FETCH_MIN_BYTES: i32 = 1;
+const LOG_FETCH_WAIT_MAX_TIME: i32 = 500;
+
+pub struct TableScan<'a> {
+    conn: &'a FlussConnection,
+    table_info: TableInfo,
+    metadata: Arc<Metadata>,
+}
+
+impl<'a> TableScan<'a> {
+    pub fn new(conn: &'a FlussConnection, table_info: TableInfo, metadata: Arc<Metadata>) -> Self {
+        Self {
+            conn,
+            table_info,
+            metadata,
+        }
+    }
+
+    pub fn create_log_scanner(&self) -> LogScanner {
+        LogScanner::new(
+            &self.table_info,
+            self.metadata.clone(),
+            self.conn.get_connections(),
+        )
+    }
+}
+
+pub struct LogScanner {
+    table_path: TablePath,
+    table_id: i64,
+    metadata: Arc<Metadata>,
+    log_scanner_status: Arc<LogScannerStatus>,
+    log_fetcher: LogFetcher,
+}
+
+impl LogScanner {
+    pub fn new(
+        table_info: &TableInfo,
+        metadata: Arc<Metadata>,
+        connections: Arc<RpcClient>,
+    ) -> Self {
+        let log_scanner_status = Arc::new(LogScannerStatus::new());
+        Self {
+            table_path: table_info.table_path.clone(),
+            table_id: table_info.table_id,
+            metadata: metadata.clone(),
+            log_scanner_status: log_scanner_status.clone(),
+            log_fetcher: LogFetcher::new(
+                table_info.clone(),
+                connections,
+                metadata.clone(),
+                log_scanner_status.clone(),
+            ),
+        }
+    }
+
+    pub async fn poll(&self, _timeout: Duration) -> Result<ScanRecords> {
+        Ok(ScanRecords::new(self.poll_for_fetches().await?))
+    }
+
+    pub async fn subscribe(&self, bucket: i32, offset: i64) -> Result<()> {
+        let table_bucket = TableBucket::new(self.table_id, bucket);
+        self.metadata
+            .check_and_update_table_metadata(from_ref(&self.table_path))
+            .await?;
+        self.log_scanner_status
+            .assign_scan_bucket(table_bucket, offset);
+        Ok(())
+    }
+
+    async fn poll_for_fetches(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
+        self.log_fetcher.send_fetches_and_collect().await
+    }
+}
+
+#[allow(dead_code)]
+struct LogFetcher {
+    table_path: TablePath,
+    conns: Arc<RpcClient>,
+    table_info: TableInfo,
+    metadata: Arc<Metadata>,
+    log_scanner_status: Arc<LogScannerStatus>,
+}
+
+impl LogFetcher {
+    pub fn new(
+        table_info: TableInfo,
+        conns: Arc<RpcClient>,
+        metadata: Arc<Metadata>,
+        log_scanner_status: Arc<LogScannerStatus>,
+    ) -> Self {
+        LogFetcher {
+            table_path: table_info.table_path.clone(),
+            conns: conns.clone(),
+            table_info: table_info.clone(),
+            metadata: metadata.clone(),
+            log_scanner_status: log_scanner_status.clone(),
+        }
+    }
+
+    /// Sends one fetch request per leader and collects the decoded records per bucket.
+    ///
+    /// Each bucket's scan offset is advanced past every decoded batch. Panics if a leader
+    /// id has no tablet server in the current cluster.
+    async fn send_fetches_and_collect(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
+        let requests_by_leader = self.prepare_fetch_log_requests().await;
+        // The schema depends only on `table_info`, so build it once for all responses.
+        let arrow_schema = to_arrow_schema(self.table_info.get_row_type());
+        let mut result: HashMap<TableBucket, Vec<ScanRecord>> = HashMap::new();
+        for (leader, fetch_request) in requests_by_leader {
+            let cluster = self.metadata.get_cluster();
+            let server_node = cluster
+                .get_tablet_server(leader)
+                .expect("todo: handle leader not exist.");
+            let con = self.conns.get_connection(server_node).await?;
+            let fetch_response = con
+                .request(crate::rpc::message::FetchLogRequest::new(fetch_request))
+                .await?;
+            for table_resp in fetch_response.tables_resp {
+                let table_id = table_resp.table_id;
+                for bucket_resp in table_resp.buckets_resp {
+                    let table_bucket = TableBucket::new(table_id, bucket_resp.bucket_id);
+                    let mut fetch_records = vec![];
+                    if let Some(data) = bucket_resp.records {
+                        for batch in &mut LogRecordsBatchs::new(&data) {
+                            // Resume after the last offset covered by this batch.
+                            let next_offset = batch.last_log_offset() + 1;
+                            fetch_records
+                                .extend(batch.records(ReadContext::new(arrow_schema.clone())));
+                            self.log_scanner_status
+                                .update_offset(&table_bucket, next_offset);
+                        }
+                    }
+                    result.insert(table_bucket, fetch_records);
+                }
+            }
+        }
+        Ok(result)
+    }
+
+    async fn prepare_fetch_log_requests(&self) -> HashMap<i32, FetchLogRequest> {
+        let mut fetch_log_req_for_buckets = HashMap::new();
+        let mut table_id = None;
+        let mut ready_for_fetch_count = 0;
+        for bucket in self.fetchable_buckets() {
+            if table_id.is_none() {
+                table_id = Some(bucket.table_id());
+            }
+
+            let offset = match self.log_scanner_status.get_bucket_offset(&bucket) {
+                Some(offset) => offset,
+                None => {
+                    // todo: debug
+                    continue;
+                }
+            };
+
+            if let Some(leader) = self.get_table_bucket_leader(&bucket) {
+                let fetch_log_req_for_bucket = PbFetchLogReqForBucket {
+                    partition_id: None,
+                    bucket_id: bucket.bucket_id(),
+                    fetch_offset: offset,
+                    // 1M
+                    max_fetch_bytes: 1024 * 1024,
+                };
+
+                fetch_log_req_for_buckets
+                    .entry(leader)
+                    .or_insert_with(Vec::new)
+                    .push(fetch_log_req_for_bucket);
+                ready_for_fetch_count += 1;
+            }
+        }
+
+        if ready_for_fetch_count == 0 {
+            HashMap::new()
+        } else {
+            fetch_log_req_for_buckets
+                .into_iter()
+                .map(|(leader_id, feq_for_buckets)| {
+                    let req_for_table = PbFetchLogReqForTable {
+                        table_id: table_id.unwrap(),
+                        projection_pushdown_enabled: false,
+                        projected_fields: vec![],
+                        buckets_req: feq_for_buckets,
+                    };
+
+                    let fetch_log_request = FetchLogRequest {
+                        follower_server_id: -1,
+                        max_bytes: LOG_FETCH_MAX_BYTES,
+                        tables_req: vec![req_for_table],
+                        max_wait_ms: Some(LOG_FETCH_WAIT_MAX_TIME),
+                        min_bytes: Some(LOG_FETCH_MIN_BYTES),
+                    };
+                    (leader_id, fetch_log_request)
+                })
+                .collect()
+        }
+    }
+
+    fn fetchable_buckets(&self) -> Vec<TableBucket> {
+        // always available now
+        self.log_scanner_status.fetchable_buckets(|_| true)
+    }
+
+    fn get_table_bucket_leader(&self, tb: &TableBucket) -> Option<i32> {
+        let cluster = self.metadata.get_cluster();
+        cluster.leader_for(tb).map(|leader| leader.id())
+    }
+}
+
+pub struct LogScannerStatus {
+    bucket_status_map: Arc<RwLock<FairBucketStatusMap<BucketScanStatus>>>,
+}
+
+#[allow(dead_code)]
+impl LogScannerStatus {
+    pub fn new() -> Self {
+        Self {
+            bucket_status_map: Arc::new(RwLock::new(FairBucketStatusMap::new())),
+        }
+    }
+
+    pub fn prepare_to_poll(&self) -> bool {
+        let map = self.bucket_status_map.read();
+        map.size() > 0
+    }
+
+    pub fn move_bucket_to_end(&self, table_bucket: TableBucket) {
+        let mut map = self.bucket_status_map.write();
+        map.move_to_end(table_bucket);
+    }
+
+    /// Gets the offset of a bucket if it exists
+    pub fn get_bucket_offset(&self, table_bucket: &TableBucket) -> Option<i64> {
+        let map = self.bucket_status_map.read();
+        map.status_value(table_bucket).map(|status| status.offset())
+    }
+
+    pub fn update_high_watermark(&self, table_bucket: &TableBucket, high_watermark: i64) {
+        if let Some(status) = self.get_status(table_bucket) {
+            status.set_high_watermark(high_watermark);
+        }
+    }
+
+    pub fn update_offset(&self, table_bucket: &TableBucket, offset: i64) {
+        if let Some(status) = self.get_status(table_bucket) {
+            status.set_offset(offset);
+        }
+    }
+
+    pub fn assign_scan_buckets(&self, scan_bucket_offsets: HashMap<TableBucket, i64>) {
+        let mut map = self.bucket_status_map.write();
+        for (bucket, offset) in scan_bucket_offsets {
+            let status = map
+                .status_value(&bucket)
+                .cloned()
+                .unwrap_or_else(|| Arc::new(BucketScanStatus::new(offset)));
+            status.set_offset(offset);
+            map.update(bucket, status);
+        }
+    }
+
+    pub fn assign_scan_bucket(&self, table_bucket: TableBucket, offset: i64) {
+        let status = Arc::new(BucketScanStatus::new(offset));
+        self.bucket_status_map.write().update(table_bucket, status);
+    }
+
+    /// Unassigns scan buckets
+    pub fn unassign_scan_buckets(&self, buckets: &[TableBucket]) {
+        let mut map = self.bucket_status_map.write();
+        for bucket in buckets {
+            map.remove(bucket);
+        }
+    }
+
+    /// Gets fetchable buckets based on availability predicate
+    pub fn fetchable_buckets<F>(&self, is_available: F) -> Vec<TableBucket>
+    where
+        F: Fn(&TableBucket) -> bool,
+    {
+        let map = self.bucket_status_map.read();
+        let mut result = Vec::new();
+        map.for_each(|bucket, _| {
+            if is_available(bucket) {
+                result.push(bucket.clone());
+            }
+        });
+        result
+    }
+
+    /// Helper to get bucket status
+    fn get_status(&self, table_bucket: &TableBucket) -> Option<Arc<BucketScanStatus>> {
+        let map = self.bucket_status_map.read();
+        map.status_value(table_bucket).cloned()
+    }
+}
+
+impl Default for LogScannerStatus {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+#[derive(Debug)]
+#[allow(dead_code)]
+pub struct BucketScanStatus {
+    offset: RwLock<i64>,
+    high_watermark: RwLock<i64>,
+}
+
+#[allow(dead_code)]
+impl BucketScanStatus {
+    pub fn new(offset: i64) -> Self {
+        Self {
+            offset: RwLock::new(offset),
+            high_watermark: RwLock::new(0),
+        }
+    }
+
+    pub fn offset(&self) -> i64 {
+        *self.offset.read()
+    }
+
+    pub fn set_offset(&self, offset: i64) {
+        *self.offset.write() = offset
+    }
+
+    pub fn high_watermark(&self) -> i64 {
+        *self.high_watermark.read()
+    }
+
+    pub fn set_high_watermark(&self, high_watermark: i64) {
+        *self.high_watermark.write() = high_watermark
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/writer.rs b/fluss-rust/crates/fluss/src/client/table/writer.rs
new file mode 100644
index 0000000000..b2ba881b36
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/writer.rs
@@ -0,0 +1,88 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::{WriteRecord, WriterClient};
+use crate::row::GenericRow;
+use std::sync::Arc;
+
+use crate::error::Result;
+use crate::metadata::{TableInfo, TablePath};
+
+#[allow(dead_code)]
+pub trait TableWriter {
+    async fn flush(&self) -> Result<()>;
+}
+
+#[allow(dead_code)]
+pub trait AppendWriter: TableWriter {
+    async fn append(&self, row: GenericRow) -> Result<()>;
+}
+
+#[allow(dead_code)]
+pub trait UpsertWriter: TableWriter {
+    async fn upsert(&self, row: GenericRow) -> Result<()>;
+    async fn delete(&self, row: GenericRow) -> Result<()>;
+}
+
+#[allow(dead_code)]
+pub struct AbstractTableWriter {
+    table_path: Arc<TablePath>,
+    writer_client: Arc<WriterClient>,
+    field_count: i32,
+}
+
+#[allow(dead_code)]
+impl AbstractTableWriter {
+    pub fn new(
+        table_path: TablePath,
+        table_info: &TableInfo,
+        writer_client: Arc<WriterClient>,
+    ) -> Self {
+        // todo: partition
+        Self {
+            table_path: Arc::new(table_path),
+            writer_client,
+            field_count: table_info.row_type().fields().len() as i32,
+        }
+    }
+
+    pub async fn send(&self, write_record: &WriteRecord<'_>) -> Result<()> {
+        let result_handle = self.writer_client.send(write_record).await?;
+        let result = result_handle.wait().await?;
+        result_handle.result(result)
+    }
+}
+
+impl TableWriter for AbstractTableWriter {
+    async fn flush(&self) -> Result<()> {
+        todo!()
+    }
+}
+
+// Append writer implementation
+#[allow(dead_code)]
+pub struct AppendWriterImpl {
+    base: AbstractTableWriter,
+}
+
+#[allow(dead_code)]
+impl AppendWriterImpl {
+    pub async fn append(&self, row: GenericRow<'_>) -> Result<()> {
+        let record = WriteRecord::new(self.base.table_path.clone(), row);
+        self.base.send(&record).await
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
new file mode 100644
index 0000000000..0b77894025
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -0,0 +1,442 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::write::batch::WriteBatch::ArrowLog;
+use crate::client::write::batch::{ArrowLogWriteBatch, WriteBatch};
+use crate::client::{ResultHandle, WriteRecord};
+use crate::cluster::{BucketLocation, Cluster, ServerNode};
+use crate::config::Config;
+use crate::error::Result;
+use crate::metadata::{TableBucket, TablePath};
+use crate::util::current_time_ms;
+use crate::{BucketId, PartitionId, TableId};
+use dashmap::DashMap;
+use parking_lot::RwLock;
+use std::collections::{HashMap, HashSet, VecDeque};
+use std::sync::Arc;
+use std::sync::atomic::{AtomicI32, AtomicI64, Ordering};
+use tokio::sync::Mutex;
+
+#[allow(dead_code)]
+pub struct RecordAccumulator {
+    config: Config, // stored by `new`
+    write_batches: DashMap<TablePath, BucketAndWriteBatches>, // per table: the bucket deques
+    // batch_id -> complete callback
+    incomplete_batches: RwLock<HashMap<i64, ResultHandle>>,
+    batch_timeout_ms: i64, // waiting time after which a batch counts as expired
+    closed: bool, // when true, `batch_ready` treats every batch as sendable
+    flushes_in_progress: AtomicI32, // incremented by `begin_flush`
+    appends_in_progress: i32,
+    nodes_drain_index: Mutex<HashMap<i32, usize>>, // node id -> bucket index of the last drain
+    batch_id: AtomicI64, // source of ids for newly created batches
+}
+
+impl RecordAccumulator {
+    pub fn new(config: Config) -> Self {
+        Self {
+            config,
+            write_batches: DashMap::new(),
+            incomplete_batches: RwLock::new(HashMap::new()),
+            batch_timeout_ms: 500, // fixed value; not read from `config`
+            closed: false,
+            flushes_in_progress: AtomicI32::new(0),
+            appends_in_progress: 0,
+            nodes_drain_index: Mutex::new(HashMap::new()),
+            batch_id: AtomicI64::new(0), // the first batch gets id 0
+        }
+    }
+
+    /// Tries to add `record` to the newest batch queued in `dq`.
+    ///
+    /// Returns `Ok(None)` when `dq` is empty or that batch does not take the record.
+    fn try_append(
+        &self,
+        record: &WriteRecord,
+        dq: &mut VecDeque<WriteBatch>,
+    ) -> Result<Option<RecordAppendResult>> {
+        // Read the length first: `back_mut` keeps `dq` mutably borrowed below.
+        let queued = dq.len();
+        let Some(tail) = dq.back_mut() else {
+            return Ok(None);
+        };
+        let Some(handle) = tail.try_append(record)? else {
+            return Ok(None);
+        };
+        // More than one queued batch, or a closed tail, is reported as "batch is full".
+        let batch_is_full = queued > 1 || tail.is_closed();
+        Ok(Some(RecordAppendResult::new(handle, batch_is_full, false, false)))
+    }
+
+    fn append_new_batch(
+        &self,
+        cluster: &Cluster,
+        record: &WriteRecord,
+        bucket_id: BucketId,
+        dq: &mut VecDeque<WriteBatch>,
+    ) -> Result<RecordAppendResult> {
+        if let Some(append_result) = self.try_append(record, dq)? {
+            return Ok(append_result);
+        }
+        // The tail batch (if any) did not take the record: open a new Arrow log batch for it.
+        let table_path = &record.table_path;
+
+        let row_type = &cluster.get_table(table_path).row_type;
+
+        let mut batch = ArrowLog(ArrowLogWriteBatch::new(
+            self.batch_id.fetch_add(1, Ordering::Relaxed),
+            table_path.as_ref().clone(),
+            0, // schema_id argument, hard-coded for now
+            row_type,
+            bucket_id,
+            current_time_ms(),
+        ));
+
+        let batch_id = batch.batch_id();
+
+        let result_handle = batch
+            .try_append(record)?
+            .expect("must append to a new batch");
+
+        let batch_is_closed = batch.is_closed();
+        dq.push_back(batch);
+        // Register the handle under the batch id; `await_flush_completion` waits on these.
+        self.incomplete_batches
+            .write()
+            .insert(batch_id, result_handle.clone());
+        Ok(RecordAppendResult::new(
+            result_handle,
+            dq.len() > 1 || batch_is_closed,
+            true,
+            false,
+        ))
+    }
+
+    pub async fn append(
+        &self,
+        record: &WriteRecord<'_>,
+        bucket_id: BucketId,
+        cluster: &Cluster,
+        abort_if_batch_full: bool,
+    ) -> Result<RecordAppendResult> {
+        let table_path = &record.table_path;
+        let mut binding = self
+            .write_batches
+            .entry(table_path.as_ref().clone())
+            .or_insert_with(|| BucketAndWriteBatches {
+                table_id: 0, // placeholder values: nothing here derives them from `cluster`
+                is_partitioned_table: false,
+                partition_id: None,
+                batches: Default::default(),
+            });
+        let bucket_and_batches = binding.value_mut();
+        let dq = bucket_and_batches
+            .batches
+            .entry(bucket_id)
+            .or_insert_with(|| Mutex::new(VecDeque::new()));
+        let mut dq_guard = dq.lock().await; // NOTE(review): the map entry guard is held across this await
+        if let Some(append_result) = self.try_append(record, &mut dq_guard)? {
+            return Ok(append_result);
+        }
+        // No queued batch took the record: report that instead of opening a batch if asked to.
+        if abort_if_batch_full {
+            return Ok(RecordAppendResult::new_without_result_handle(
+                true, false, true,
+            ));
+        }
+        // Otherwise open a new batch for this bucket while still holding the deque lock.
+        self.append_new_batch(cluster, record, bucket_id, &mut dq_guard)
+    }
+
+    /// Collects the leader nodes that have at least one batch ready to be sent.
+    ///
+    /// The result also carries the tables for which some bucket has no known leader
+    /// and the delay in milliseconds until the next check, which starts at
+    /// `batch_timeout_ms` and is only ever lowered by `bucket_ready`.
+    pub async fn ready(&self, cluster: &Arc<Cluster>) -> ReadyCheckResult {
+        let mut ready_nodes = HashSet::new();
+        let mut unknown_leader_tables = HashSet::new();
+        let mut delay_ms = self.batch_timeout_ms;
+        for entry in self.write_batches.iter() {
+            let (table_path, batches) = entry.pair();
+            delay_ms = self
+                .bucket_ready(
+                    table_path,
+                    batches,
+                    &mut ready_nodes,
+                    &mut unknown_leader_tables,
+                    cluster,
+                    delay_ms,
+                )
+                .await;
+        }
+
+        ReadyCheckResult::new(ready_nodes, delay_ms, unknown_leader_tables)
+    }
+
+    /// Evaluates every bucket of one table and folds the outcome into the accumulators.
+    ///
+    /// Buckets whose leader is unknown add `table_path` to `unknown_leader_tables`.
+    /// Returns the, possibly lowered, delay until the next readiness check.
+    async fn bucket_ready(
+        &self,
+        table_path: &TablePath,
+        batches: &BucketAndWriteBatches,
+        ready_nodes: &mut HashSet<ServerNode>,
+        unknown_leader_tables: &mut HashSet<TablePath>,
+        cluster: &Cluster,
+        next_ready_check_delay_ms: i64,
+    ) -> i64 {
+        let mut delay_ms = next_ready_check_delay_ms;
+        for (bucket_id, queue) in &batches.batches {
+            let queue = queue.lock().await;
+            // Only the oldest batch of a bucket is inspected; empty deques are skipped.
+            let Some(oldest) = queue.front() else {
+                continue;
+            };
+            let waited_time_ms = oldest.waited_time_ms(current_time_ms());
+            let full = queue.len() > 1 || oldest.is_closed();
+            let table_bucket = cluster.get_table_bucket(table_path, *bucket_id);
+            if let Some(leader) = cluster.leader_for(&table_bucket) {
+                delay_ms = self.batch_ready(leader, waited_time_ms, full, ready_nodes, delay_ms);
+            } else {
+                unknown_leader_tables.insert(table_path.clone());
+            }
+        }
+        delay_ms
+    }
+
+    /// Marks `leader` as ready when its batch is sendable; otherwise returns the smaller of
+    /// the current delay and the time left until the batch times out.
+    fn batch_ready(
+        &self,
+        leader: &ServerNode,
+        waited_time_ms: i64,
+        full: bool,
+        ready_nodes: &mut HashSet<ServerNode>,
+        next_ready_check_delay_ms: i64,
+    ) -> i64 {
+        if ready_nodes.contains(leader) {
+            return next_ready_check_delay_ms;
+        }
+        let expired = waited_time_ms >= self.batch_timeout_ms;
+        if full || expired || self.closed || self.flush_in_progress() {
+            ready_nodes.insert(leader.clone());
+            return next_ready_check_delay_ms;
+        }
+        let time_left_ms = self.batch_timeout_ms.saturating_sub(waited_time_ms);
+        next_ready_check_delay_ms.min(time_left_ms)
+    }
+
+    /// Drains the sendable batches of every node in `nodes`, keyed by node id.
+    /// Nodes that yield no batch do not appear in the returned map.
+    pub async fn drain(
+        &self,
+        cluster: Arc<Cluster>,
+        nodes: &HashSet<ServerNode>,
+        max_size: i32,
+    ) -> Result<HashMap<i32, Vec<Arc<ReadyWriteBatch>>>> {
+        // An empty `nodes` set simply leaves the map empty.
+        let mut drained_by_node = HashMap::new();
+        for node in nodes {
+            let node_batches = self
+                .drain_batches_for_one_node(&cluster, node, max_size)
+                .await?;
+            // Keep only nodes that actually have something to send.
+            if !node_batches.is_empty() {
+                drained_by_node.insert(node.id(), node_batches);
+            }
+        }
+        Ok(drained_by_node)
+    }
+
+    /// Drains the front batch of each bucket led by `node`, starting at the bucket index
+    /// remembered from the previous drain, until one full round over the buckets is done
+    /// or adding the next batch would exceed `max_size`. A bucket whose deque is empty is
+    /// skipped and still counts towards the round, so the loop always terminates.
+    async fn drain_batches_for_one_node(
+        &self,
+        cluster: &Cluster,
+        node: &ServerNode,
+        max_size: i32,
+    ) -> Result<Vec<Arc<ReadyWriteBatch>>> {
+        let mut size = 0;
+        let buckets = self.get_all_buckets_in_current_node(node, cluster);
+        let mut ready = Vec::new();
+
+        if buckets.is_empty() {
+            return Ok(ready);
+        }
+
+        let mut nodes_drain_index_guard = self.nodes_drain_index.lock().await;
+        let drain_index = nodes_drain_index_guard.entry(node.id()).or_insert(0);
+        let start = *drain_index % buckets.len();
+        let mut current_index = start;
+
+        loop {
+            let bucket = &buckets[current_index];
+            let table_path = bucket.table_path.clone();
+            let table_bucket = bucket.table_bucket.clone();
+            nodes_drain_index_guard.insert(node.id(), current_index);
+            current_index = (current_index + 1) % buckets.len();
+
+            let bucket_and_write_batches = self.write_batches.get(&table_path);
+            if let Some(bucket_and_write_batches) = bucket_and_write_batches {
+                if let Some(deque) = bucket_and_write_batches
+                    .batches
+                    .get(&table_bucket.bucket_id())
+                {
+                    let drained = {
+                        let mut batch_lock = deque.lock().await;
+                        let over_limit = batch_lock.front().is_some_and(|first_batch| {
+                            size + first_batch.estimated_size_in_bytes() > max_size as i64
+                        });
+                        if over_limit && !ready.is_empty() {
+                            // A single batch may be larger than the request size (e.g. due
+                            // to compression); the `!ready.is_empty()` check lets such a
+                            // batch still be sent alone in its own request.
+                            break;
+                        }
+                        // `None` for an empty deque; a `continue` here would skip the exit check.
+                        batch_lock.pop_front()
+                    };
+
+                    if let Some(mut batch) = drained {
+                        size += batch.estimated_size_in_bytes();
+                        // mark the batch as drained.
+                        batch.drained(current_time_ms());
+                        ready.push(Arc::new(ReadyWriteBatch {
+                            table_bucket,
+                            write_batch: batch,
+                        }));
+                    }
+                }
+            }
+            if current_index == start {
+                break;
+            }
+        }
+        Ok(ready)
+    }
+
+    pub fn remove_incomplete_batches(&self, batch_id: i64) {
+        self.incomplete_batches.write().remove(&batch_id); // no-op when the id is not registered
+    }
+
+    /// Lists the bucket locations known to `cluster` whose leader has the same id as
+    /// `current`; locations without a leader are left out.
+    fn get_all_buckets_in_current_node(
+        &self,
+        current: &ServerNode,
+        cluster: &Cluster,
+    ) -> Vec<BucketLocation> {
+        cluster
+            .get_bucket_locations_by_path()
+            .values()
+            .flatten()
+            .filter(|location| {
+                matches!(location.leader(), Some(leader) if current.id() == leader.id())
+            })
+            .cloned()
+            .collect()
+    }
+
+    fn flush_in_progress(&self) -> bool {
+        self.flushes_in_progress.load(Ordering::SeqCst) > 0 // true once `begin_flush` has been called
+    }
+
+    pub fn begin_flush(&self) {
+        self.flushes_in_progress.fetch_add(1, Ordering::SeqCst); // no decrement is visible in this file
+    }
+
+    /// Waits for all currently incomplete batches without holding the lock across `.await`.
+    pub async fn await_flush_completion(&self) -> Result<()> {
+        // Clone the handles out first; the read guard is dropped at the end of this statement.
+        let pending: Vec<_> = self.incomplete_batches.read().values().cloned().collect();
+        for result_handle in pending {
+            let _ = result_handle.wait().await?; // the per-batch outcome is deliberately ignored
+        }
+        Ok(())
+    }
+}
+
+pub struct ReadyWriteBatch {
+    pub table_bucket: TableBucket, // bucket the batch was drained from
+    pub write_batch: WriteBatch, // the drained batch itself
+}
+
+#[allow(dead_code)]
+struct BucketAndWriteBatches {
+    table_id: TableId, // filled with 0 by `RecordAccumulator::append`
+    is_partitioned_table: bool, // filled with `false` by `RecordAccumulator::append`
+    partition_id: Option<PartitionId>, // filled with `None` by `RecordAccumulator::append`
+    batches: HashMap<BucketId, Mutex<VecDeque<WriteBatch>>>, // per bucket: batches, oldest first
+}
+
+pub struct RecordAppendResult {
+    pub batch_is_full: bool, // set when several batches are queued or the batch is closed
+    pub new_batch_created: bool, // true only when the append opened a new batch
+    pub abort_record_for_new_batch: bool, // true when the append was aborted instead
+    pub result_handle: Option<ResultHandle>, // `None` for an aborted append
+}
+
+impl RecordAppendResult {
+    fn new(
+        result_handle: ResultHandle,
+        batch_is_full: bool,
+        new_batch_created: bool,
+        abort_record_for_new_batch: bool,
+    ) -> Self {
+        Self {
+            batch_is_full,
+            new_batch_created,
+            abort_record_for_new_batch,
+            result_handle: Some(result_handle), // result of a record that was accepted
+        }
+    }
+
+    fn new_without_result_handle(
+        batch_is_full: bool,
+        new_batch_created: bool,
+        abort_record_for_new_batch: bool,
+    ) -> Self {
+        Self {
+            batch_is_full,
+            new_batch_created,
+            abort_record_for_new_batch,
+            result_handle: None, // nothing was appended, so there is nothing to wait on
+        }
+    }
+}
+
+pub struct ReadyCheckResult {
+    pub ready_nodes: HashSet<ServerNode>, // leaders with at least one sendable batch
+    pub next_ready_check_delay_ms: i64, // milliseconds until the next readiness check
+    pub unknown_leader_tables: HashSet<TablePath>, // tables with a bucket whose leader is unknown
+}
+
+impl ReadyCheckResult {
+    pub fn new(
+        ready_nodes: HashSet<ServerNode>,
+        next_ready_check_delay_ms: i64,
+        unknown_leader_tables: HashSet<TablePath>,
+    ) -> Self {
+        ReadyCheckResult {
+            ready_nodes, // fields are stored as given, without validation
+            next_ready_check_delay_ms,
+            unknown_leader_tables,
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
new file mode 100644
index 0000000000..64c5dd6517
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -0,0 +1,176 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::BucketId;
+use crate::client::broadcast::{BatchWriteResult, BroadcastOnce};
+use crate::client::{ResultHandle, WriteRecord};
+use crate::metadata::{DataType, TablePath};
+use std::cmp::max;
+
+use crate::error::Result;
+use crate::record::MemoryLogRecordsArrowBuilder;
+
+#[allow(dead_code)]
+pub struct InnerWriteBatch {
+    batch_id: i64,
+    table_path: TablePath,
+    create_ms: i64, // creation time in ms; the base for `waited_time_ms`
+    bucket_id: BucketId,
+    results: BroadcastOnce<BatchWriteResult>, // publishes the write result to every handle
+    completed: std::sync::atomic::AtomicBool, // set by the first `complete` call
+    drained_ms: i64, // -1 until `drained` is called
+}
+
+impl InnerWriteBatch {
+    fn new(batch_id: i64, table_path: TablePath, create_ms: i64, bucket_id: BucketId) -> Self {
+        InnerWriteBatch {
+            batch_id,
+            table_path,
+            create_ms,
+            bucket_id,
+            results: Default::default(),
+            completed: Default::default(), // starts as `false`
+            drained_ms: -1,
+        }
+    }
+
+    fn waited_time_ms(&self, now: i64) -> i64 {
+        max(0i64, now - self.create_ms) // never negative, even if `now` is before `create_ms`
+    }
+
+    fn complete(&self, write_result: BatchWriteResult) -> bool {
+        if !self.completed.swap(true, std::sync::atomic::Ordering::AcqRel) {
+            self.results.broadcast(write_result); // only the first call publishes; a second would panic
+        }
+        true // unchanged contract: callers always receive `true`
+    }
+
+    fn drained(&mut self, now_ms: i64) {
+        self.drained_ms = max(self.drained_ms, now_ms); // the stored time never decreases
+    }
+}
+
+pub enum WriteBatch {
+    ArrowLog(ArrowLogWriteBatch), // currently the only kind of batch
+}
+
+impl WriteBatch {
+    /// Gives access to the bookkeeping shared by every batch kind.
+    pub fn inner_batch(&self) -> &InnerWriteBatch {
+        let WriteBatch::ArrowLog(batch) = self;
+        &batch.write_batch
+    }
+
+    /// Forwards the record to the concrete batch; `Ok(None)` means it was not taken.
+    pub fn try_append(&mut self, write_record: &WriteRecord) -> Result<Option<ResultHandle>> {
+        let WriteBatch::ArrowLog(batch) = self;
+        batch.try_append(write_record)
+    }
+
+    pub fn waited_time_ms(&self, now: i64) -> i64 {
+        self.inner_batch().waited_time_ms(now)
+    }
+
+    /// Closes the underlying Arrow builder; `try_append` on the Arrow batch returns
+    /// `Ok(None)` once the builder reports closed.
+    pub fn close(&mut self) {
+        let WriteBatch::ArrowLog(batch) = self;
+        // Delegates to `ArrowLogWriteBatch::close`.
+        batch.close();
+    }
+
+    pub fn estimated_size_in_bytes(&self) -> i64 {
+        // todo: calculate estimated_size_in_bytes
+        0
+    }
+
+    /// Reports whether the concrete batch has been closed.
+    pub fn is_closed(&self) -> bool {
+        let WriteBatch::ArrowLog(batch) = self;
+        batch.is_closed()
+    }
+
+    /// Records `now_ms` as the drain time of the batch.
+    ///
+    /// The stored value never decreases: the larger of the old and new time is kept.
+    pub fn drained(&mut self, now_ms: i64) {
+        let WriteBatch::ArrowLog(batch) = self;
+        batch.write_batch.drained(now_ms);
+    }
+
+    /// Serializes the batch content into bytes via the concrete batch.
+    pub fn build(&self) -> Result<Vec<u8>> {
+        let WriteBatch::ArrowLog(batch) = self;
+        batch.build()
+    }
+
+    pub fn complete(&self, write_result: BatchWriteResult) -> bool {
+        self.inner_batch().complete(write_result)
+    }
+
+    pub fn batch_id(&self) -> i64 {
+        self.inner_batch().batch_id
+    }
+}
+
+pub struct ArrowLogWriteBatch {
+    pub write_batch: InnerWriteBatch, // bookkeeping: ids, timestamps, result broadcast
+    pub arrow_builder: MemoryLogRecordsArrowBuilder, // receives the appended rows
+}
+
+impl ArrowLogWriteBatch {
+    /// Creates an empty batch: fresh bookkeeping plus an Arrow builder for
+    /// `schema_id` / `row_type`.
+    pub fn new(
+        batch_id: i64,
+        table_path: TablePath,
+        schema_id: i32,
+        row_type: &DataType,
+        bucket_id: BucketId,
+        create_ms: i64,
+    ) -> Self {
+        Self {
+            write_batch: InnerWriteBatch::new(batch_id, table_path, create_ms, bucket_id),
+            arrow_builder: MemoryLogRecordsArrowBuilder::new(schema_id, row_type),
+        }
+    }
+
+    pub fn batch_id(&self) -> i64 {
+        self.write_batch.batch_id
+    }
+
+    pub fn try_append(&mut self, write_record: &WriteRecord) -> Result<Option<ResultHandle>> {
+        // A closed or full builder takes no more rows; the caller sees `Ok(None)`.
+        if self.arrow_builder.is_closed() || self.arrow_builder.is_full() {
+            return Ok(None);
+        }
+        self.arrow_builder.append(&write_record.row)?;
+        Ok(Some(ResultHandle::new(self.write_batch.results.receiver())))
+    }
+
+    pub fn build(&self) -> Result<Vec<u8>> {
+        self.arrow_builder.build()
+    }
+
+    pub fn is_closed(&self) -> bool {
+        self.arrow_builder.is_closed()
+    }
+
+    pub fn close(&mut self) {
+        self.arrow_builder.close()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/broadcast.rs b/fluss-rust/crates/fluss/src/client/write/broadcast.rs
new file mode 100644
index 0000000000..2dcc34cbc4
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/broadcast.rs
@@ -0,0 +1,119 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use parking_lot::RwLock;
+use std::sync::Arc;
+use thiserror::Error;
+use tokio::sync::Notify;
+use tracing::warn;
+
+pub type Result<T, E = Error> = std::result::Result<T, E>; // `E` defaults to this module's `Error`
+/// Outcome published through a `BroadcastOnce` for one write batch.
+pub type BatchWriteResult = Result<(), Error>;
+
+#[derive(Debug, Error, Clone, PartialEq, Eq)]
+pub enum Error {
+    #[error("BroadcastOnce dropped")]
+    Dropped, // stored by `BroadcastOnce`'s `Drop` when no value was ever published
+}
+
+#[derive(Debug, Clone)]
+pub struct BroadcastOnceReceiver<T> {
+    shared: Arc<Shared<T>>, // same state as the `BroadcastOnce` that created this receiver
+}
+
+impl<T: Clone + Send + Sync> BroadcastOnceReceiver<T> {
+    /// Returns `Some(_)` if data has been produced
+    pub fn peek(&self) -> Option<Result<T>> {
+        self.shared.data.read().clone()
+    }
+
+    /// Waits for [`BroadcastOnce::broadcast`] to be called or returns an error
+    /// if the [`BroadcastOnce`] is dropped without a value being published
+    pub async fn receive(&self) -> Result<T> {
+        let notified = self.shared.notify.notified();
+        // Created before the peek, presumably so a publish in between still wakes us — confirm.
+        if let Some(v) = self.peek() {
+            return v;
+        }
+        // Nothing published yet: wait for `notify_waiters` from `broadcast` or from `Drop`.
+        notified.await;
+
+        self.peek().expect("just got notified")
+    }
+}
+
+#[derive(Debug)]
+struct Shared<T> {
+    data: RwLock<Option<Result<T>>>, // `None` until a value or `Error::Dropped` is stored
+    notify: Notify, // wakes the receivers waiting in `receive`
+}
+
+#[derive(Debug)]
+pub struct BroadcastOnce<T>
+where
+    T: Send + Sync,
+{
+    shared: Arc<Shared<T>>, // state shared with every receiver handed out by `receiver`
+}
+
+impl<T> Default for BroadcastOnce<T>
+where
+    T: Send + Sync,
+{
+    fn default() -> Self {
+        Self {
+            shared: Arc::new(Shared {
+                data: RwLock::new(None), // nothing published yet
+                notify: Notify::new(),
+            }),
+        }
+    }
+}
+
+impl<T: Clone + Send + Sync> BroadcastOnce<T> {
+    /// Returns a [`BroadcastOnceReceiver`] that can be used to wait on
+    /// a call to [`BroadcastOnce::broadcast`] on this instance
+    pub fn receiver(&self) -> BroadcastOnceReceiver<T> {
+        BroadcastOnceReceiver {
+            shared: Arc::clone(&self.shared),
+        }
+    }
+
+    /// Broadcast a value to all [`BroadcastOnceReceiver`] handles
+    pub fn broadcast(&self, r: T) {
+        let mut locked = self.shared.data.write();
+        assert!(locked.is_none(), "double publish");
+        // Panics above if a value was already published; otherwise store it, then wake waiters.
+        *locked = Some(Ok(r));
+        self.shared.notify.notify_waiters();
+    }
+}
+
+impl<T> Drop for BroadcastOnce<T>
+where
+    T: Send + Sync,
+{
+    fn drop(&mut self) {
+        let mut data = self.shared.data.write();
+        if data.is_none() { // only when nothing was ever published
+            warn!("BroadcastOnce dropped without producing");
+            *data = Some(Err(Error::Dropped)); // receivers then get `Err(Error::Dropped)`
+            self.shared.notify.notify_waiters();
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
new file mode 100644
index 0000000000..991c5f9197
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
@@ -0,0 +1,102 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::cluster::Cluster;
+use crate::metadata::TablePath;
+use rand::Rng;
+use std::sync::atomic::{AtomicI32, Ordering};
+
+pub trait BucketAssigner: Sync + Send {
+    fn abort_if_batch_full(&self) -> bool; // the sticky assigner in this file returns `true`
+    /// Called with the previously used bucket id; the sticky assigner then picks its next bucket.
+    fn on_new_batch(&self, cluster: &Cluster, prev_bucket_id: i32);
+    /// Returns the bucket id to write to; the sticky assigner ignores `bucket_key`.
+    fn assign_bucket(&self, bucket_key: Option<&[u8]>, cluster: &Cluster) -> i32;
+}
+
+#[derive(Debug)]
+pub struct StickyBucketAssigner {
+    table_path: TablePath, // table whose buckets are looked up in the cluster
+    current_bucket_id: AtomicI32, // bucket currently in use; negative until the first pick
+}
+
+impl StickyBucketAssigner {
+    pub fn new(table_path: TablePath) -> Self {
+        Self {
+            table_path,
+            current_bucket_id: AtomicI32::new(-1), // -1 = no bucket chosen yet
+        }
+    }
+
+    fn next_bucket(&self, cluster: &Cluster, prev_bucket_id: i32) -> i32 {
+        let old_bucket = self.current_bucket_id.load(Ordering::Relaxed);
+        let mut new_bucket = old_bucket; // kept unless a new pick is made below
+        if old_bucket < 0 || old_bucket == prev_bucket_id {
+            let available_buckets = cluster.get_available_buckets_for_table_path(&self.table_path);
+            if available_buckets.is_empty() {
+                let mut rng = rand::rng();
+                let mut random: i32 = rng.random();
+                random &= i32::MAX; // clear the sign bit so the remainder is non-negative
+                new_bucket = random % cluster.get_bucket_count(&self.table_path); // NOTE(review): `%` panics if the count is 0 — confirm it cannot be
+            } else if available_buckets.len() == 1 {
+                new_bucket = available_buckets[0].table_bucket.bucket_id();
+            } else {
+                let mut rng = rand::rng();
+                while new_bucket < 0 || new_bucket == old_bucket { // retry until the pick differs from `old_bucket`
+                    let mut random: i32 = rng.random();
+                    random &= i32::MAX;
+                    new_bucket = available_buckets
+                        [(random % available_buckets.len() as i32) as usize]
+                        .bucket_id();
+                }
+            }
+        }
+        // A first pick is stored directly; later picks replace the value only if it is still `prev_bucket_id`.
+        if old_bucket < 0 {
+            self.current_bucket_id.store(new_bucket, Ordering::Relaxed);
+        } else {
+            self.current_bucket_id
+                .compare_exchange(
+                    prev_bucket_id,
+                    new_bucket,
+                    Ordering::Relaxed,
+                    Ordering::Relaxed,
+                )
+                .ok(); // a failed exchange (value is no longer `prev_bucket_id`) is ignored
+        }
+        self.current_bucket_id.load(Ordering::Relaxed)
+    }
+}
+
+impl BucketAssigner for StickyBucketAssigner {
+    fn abort_if_batch_full(&self) -> bool {
+        true
+    }
+
+    fn on_new_batch(&self, cluster: &Cluster, prev_bucket_id: i32) {
+        self.next_bucket(cluster, prev_bucket_id);
+    }
+
+    /// Returns the current sticky bucket; `_bucket_key` is not consulted.
+    fn assign_bucket(&self, _bucket_key: Option<&[u8]>, cluster: &Cluster) -> i32 {
+        // A negative id means no bucket has been picked yet, so choose one now.
+        match self.current_bucket_id.load(Ordering::Relaxed) {
+            unset if unset < 0 => self.next_bucket(cluster, unset),
+            sticky => sticky,
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
new file mode 100644
index 0000000000..74df951115
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -0,0 +1,68 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+mod accumulator;
+mod batch;
+
+use crate::client::broadcast::{BatchWriteResult, BroadcastOnceReceiver};
+use crate::error::Error;
+use crate::metadata::TablePath;
+use crate::row::GenericRow;
+pub use accumulator::*;
+use std::sync::Arc;
+
+pub(crate) mod broadcast;
+mod bucket_assigner;
+
+mod sender;
+mod writer_client;
+
+pub use writer_client::WriterClient;
+
+pub struct WriteRecord<'a> {
+    pub row: GenericRow<'a>, // the row to write
+    pub table_path: Arc<TablePath>, // table the row is written to
+}
+
+impl<'a> WriteRecord<'a> {
+    pub fn new(table_path: Arc<TablePath>, row: GenericRow<'a>) -> Self {
+        Self { row, table_path } // note: parameter order differs from field order
+    }
+}
+
+#[derive(Debug, Clone)]
+pub struct ResultHandle {
+    receiver: BroadcastOnceReceiver<BatchWriteResult>, // receives the batch's write result
+}
+
+impl ResultHandle {
+    pub fn new(receiver: BroadcastOnceReceiver<BatchWriteResult>) -> Self {
+        ResultHandle { receiver }
+    }
+    /// Waits for the batch result; a receive error is mapped to `Error::WriteError`.
+    pub async fn wait(&self) -> Result<BatchWriteResult, Error> {
+        self.receiver
+            .receive()
+            .await
+            .map_err(|e| Error::WriteError(e.to_string()))
+    }
+    /// Converts a received batch result into this crate's `Result`, mapping its error.
+    pub fn result(&self, batch_result: BatchWriteResult) -> Result<(), Error> {
+        // do nothing, just return empty result
+        batch_result.map_err(|e| Error::WriteError(e.to_string()))
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
new file mode 100644
index 0000000000..381e10c5b1
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -0,0 +1,207 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::metadata::Metadata;
+use crate::client::{ReadyWriteBatch, RecordAccumulator};
+use crate::error::Error::WriteError;
+use crate::error::Result;
+use crate::metadata::TableBucket;
+use crate::proto::ProduceLogResponse;
+use crate::rpc::ProduceLogRequest;
+use parking_lot::Mutex;
+use std::collections::HashMap;
+use std::sync::Arc;
+use std::time::Duration;
+
+/// Drains ready batches from the record accumulator and sends them to the
+/// tablet servers as produce-log requests.
+#[allow(dead_code)]
+pub struct Sender {
+    /// Checked at the top of every `run` iteration; cleared by `close`.
+    running: bool,
+    /// Source of the cluster view and of server connections.
+    metadata: Arc<Metadata>,
+    /// Accumulator the batches are drained from.
+    accumulator: Arc<RecordAccumulator>,
+    /// Batches that were handed to a request and are not yet completed, per bucket.
+    in_flight_batches: Mutex<HashMap<TableBucket, Vec<Arc<ReadyWriteBatch>>>>,
+    /// Size limit passed to the accumulator when draining.
+    max_request_size: i32,
+    /// Acknowledgement setting passed to every produce request.
+    ack: i16,
+    /// Timeout (milliseconds) passed to every produce request.
+    max_request_timeout_ms: i32,
+    /// Configured retry count; stored but not read by the code in this file.
+    retries: i32,
+}
+
+impl Sender {
+    /// Creates a sender that starts in the running state with no in-flight batches.
+    ///
+    /// `max_request_size` is forwarded to the accumulator when draining;
+    /// `ack` and `max_request_timeout_ms` are forwarded to every produce request.
+    pub fn new(
+        metadata: Arc<Metadata>,
+        accumulator: Arc<RecordAccumulator>,
+        max_request_size: i32,
+        max_request_timeout_ms: i32,
+        ack: i16,
+        retries: i32,
+    ) -> Self {
+        Self {
+            running: true,
+            metadata,
+            accumulator,
+            in_flight_batches: Default::default(),
+            max_request_size,
+            ack,
+            max_request_timeout_ms,
+            retries,
+        }
+    }
+
+    /// Calls `run_once` repeatedly until the running flag is cleared.
+    ///
+    /// Returns the first error produced by an iteration.
+    pub async fn run(&self) -> Result<()> {
+        while self.running {
+            self.run_once().await?;
+        }
+        Ok(())
+    }
+
+    /// Performs one send cycle: refresh metadata for tables with unknown
+    /// leaders, then drain and send the batches of all ready nodes.
+    async fn run_once(&self) -> Result<()> {
+        let cluster = self.metadata.get_cluster();
+        let ready_check_result = self.accumulator.ready(&cluster).await;
+
+        // Update metadata if needed
+        if !ready_check_result.unknown_leader_tables.is_empty() {
+            self.metadata
+                .update_tables_metadata(&ready_check_result.unknown_leader_tables.iter().collect())
+                .await?;
+        }
+
+        // Nothing to send yet: wait for the delay suggested by the accumulator.
+        if ready_check_result.ready_nodes.is_empty() {
+            tokio::time::sleep(Duration::from_millis(
+                ready_check_result.next_ready_check_delay_ms as u64,
+            ))
+            .await;
+            return Ok(());
+        }
+
+        let batches = self
+            .accumulator
+            .drain(
+                cluster.clone(),
+                &ready_check_result.ready_nodes,
+                self.max_request_size,
+            )
+            .await?;
+
+        if !batches.is_empty() {
+            self.add_to_inflight_batches(&batches);
+            self.send_write_requests(&batches).await?;
+        }
+
+        Ok(())
+    }
+
+    /// Registers every drained batch as in flight under its table bucket.
+    fn add_to_inflight_batches(&self, batches: &HashMap<i32, Vec<Arc<ReadyWriteBatch>>>) {
+        let mut in_flight = self.in_flight_batches.lock();
+        for batch in batches.values().flatten() {
+            in_flight
+                .entry(batch.table_bucket.clone())
+                .or_default()
+                .push(Arc::clone(batch));
+        }
+    }
+
+    /// Sends the drained batches, one destination server after another.
+    ///
+    /// `collated` maps a destination server id to the batches it should receive.
+    async fn send_write_requests(
+        &self,
+        collated: &HashMap<i32, Vec<Arc<ReadyWriteBatch>>>,
+    ) -> Result<()> {
+        for (leader_id, batches) in collated {
+            self.send_write_request(*leader_id, self.ack, batches)
+                .await?;
+        }
+        Ok(())
+    }
+
+    /// Sends `batches` to the tablet server `destination`, one produce request
+    /// per table, and processes each response before sending the next request.
+    ///
+    /// Returns `WriteError` when the destination is not part of the current
+    /// cluster view.
+    async fn send_write_request(
+        &self,
+        destination: i32,
+        acks: i16,
+        batches: &Vec<Arc<ReadyWriteBatch>>,
+    ) -> Result<()> {
+        if batches.is_empty() {
+            return Ok(());
+        }
+        let mut records_by_bucket = HashMap::new();
+        let mut write_batch_by_table = HashMap::new();
+
+        for batch in batches {
+            records_by_bucket.insert(batch.table_bucket.clone(), batch.clone());
+            write_batch_by_table
+                .entry(batch.table_bucket.table_id())
+                .or_insert_with(Vec::new)
+                .push(batch);
+        }
+
+        let cluster = self.metadata.get_cluster();
+
+        // Build the error lazily so the success path does not allocate.
+        let destination_node = cluster
+            .get_tablet_server(destination)
+            .ok_or_else(|| WriteError(String::from("destination node not found")))?;
+        let connection = self.metadata.get_connection(destination_node).await?;
+
+        for (table_id, write_batches) in write_batch_by_table {
+            let request =
+                ProduceLogRequest::new(table_id, acks, self.max_request_timeout_ms, write_batches)?;
+            let response = connection.request(request).await?;
+            self.handle_produce_response(table_id, &records_by_bucket, response)?
+        }
+
+        Ok(())
+    }
+
+    /// Completes the batch of every bucket that the server acknowledged.
+    ///
+    /// Returns `WriteError` when the response names a bucket that was not part
+    /// of the request, or when a bucket response carries an error code.
+    fn handle_produce_response(
+        &self,
+        table_id: i64,
+        records_by_bucket: &HashMap<TableBucket, Arc<ReadyWriteBatch>>,
+        response: ProduceLogResponse,
+    ) -> Result<()> {
+        for bucket_resp in response.buckets_resp.iter() {
+            let bucket_id = bucket_resp.bucket_id;
+            let tb = TableBucket::new(table_id, bucket_id);
+
+            // A response for a bucket we never sent must not panic the sender task.
+            let ready_batch = records_by_bucket.get(&tb).ok_or_else(|| {
+                WriteError(format!(
+                    "produce response references bucket {bucket_id} of table {table_id} which was not part of the request"
+                ))
+            })?;
+
+            if let Some(error_code) = bucket_resp.error_code {
+                // TODO: retry or fail the batch; for now the batch stays in flight
+                // and the error is surfaced to the caller of `run`.
+                return Err(WriteError(format!(
+                    "produce request for bucket {bucket_id} of table {table_id} failed with error code {error_code}"
+                )));
+            }
+            self.complete_batch(ready_batch);
+        }
+        Ok(())
+    }
+
+    /// Marks the batch as successfully written; when that succeeds, removes it
+    /// from the in-flight map and from the accumulator's incomplete batches.
+    fn complete_batch(&self, ready_write_batch: &Arc<ReadyWriteBatch>) {
+        if ready_write_batch.write_batch.complete(Ok(())) {
+            // remove from in flight batches
+            let mut in_flight_guard = self.in_flight_batches.lock();
+            if let Some(in_flight) = in_flight_guard.get_mut(&ready_write_batch.table_bucket) {
+                // Identity comparison: drop exactly this batch instance.
+                in_flight.retain(|b| !Arc::ptr_eq(b, ready_write_batch));
+                if in_flight.is_empty() {
+                    in_flight_guard.remove(&ready_write_batch.table_bucket);
+                }
+            }
+            // remove from incomplete batches
+            self.accumulator
+                .remove_incomplete_batches(ready_write_batch.write_batch.batch_id())
+        }
+    }
+
+    /// Clears the running flag so that `run` stops before its next iteration.
+    pub async fn close(&mut self) {
+        self.running = false;
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
new file mode 100644
index 0000000000..01fe2899ba
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -0,0 +1,147 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::metadata::Metadata;
+use crate::client::write::bucket_assigner::{BucketAssigner, StickyBucketAssigner};
+use crate::client::write::sender::Sender;
+use crate::client::{RecordAccumulator, ResultHandle, WriteRecord};
+use crate::config::Config;
+use crate::metadata::TablePath;
+use dashmap::DashMap;
+use std::sync::Arc;
+use tokio::sync::mpsc;
+use tokio::task::JoinHandle;
+
+use crate::error::{Error, Result};
+
+/// Entry point for writing records: appends them to a shared accumulator that
+/// a background `Sender` task drains.
+#[allow(dead_code)]
+pub struct WriterClient {
+    /// Configuration this client was created with.
+    config: Config,
+    /// Copy of `config.request_max_size`.
+    max_request_size: i32,
+    /// Accumulator shared with the background sender task.
+    accumulate: Arc<RecordAccumulator>,
+    /// Signals the background task to shut down.
+    shutdown_tx: mpsc::Sender<()>,
+    /// Handle of the spawned background task; awaited by `close`.
+    sender_join_handle: JoinHandle<()>,
+    /// Source of the cluster view used when appending records.
+    metadata: Arc<Metadata>,
+    /// One bucket assigner per table path, created on first use in `send`.
+    bucket_assigners: DashMap<TablePath, Arc<Box<dyn BucketAssigner>>>,
+}
+
+impl WriterClient {
+    /// Creates the client and spawns its background sender task.
+    ///
+    /// Uses `tokio::spawn`, so it must be called from within a Tokio runtime.
+    /// Returns `Error::IllegalArgument` when `config.writer_acks` is neither
+    /// `"all"` nor a valid `i16`.
+    pub fn new(config: Config, metadata: Arc<Metadata>) -> Result<Self> {
+        let (shutdown_tx, mut shutdown_rx) = mpsc::channel(1);
+
+        let accumulator = Arc::new(RecordAccumulator::new(config.clone()));
+
+        let mut sender = Sender::new(
+            metadata.clone(),
+            accumulator.clone(),
+            config.request_max_size,
+            // request timeout in milliseconds (currently not configurable)
+            30_000,
+            Self::get_ack(&config)?,
+            config.writer_retries,
+        );
+
+        // The task ends when the send loop returns or when `shutdown_rx.recv()`
+        // resolves, whichever happens first.
+        let join_handle = tokio::spawn(async move {
+            tokio::select! {
+                _ = sender.run() => {
+                    // do-nothing
+                },
+                _ = shutdown_rx.recv() => {
+                    sender.close().await
+                }
+            }
+        });
+
+        Ok(Self {
+            max_request_size: config.request_max_size,
+            config,
+            shutdown_tx,
+            sender_join_handle: join_handle,
+            accumulate: accumulator,
+            metadata,
+            bucket_assigners: Default::default(),
+        })
+    }
+
+    /// Translates `config.writer_acks` into the numeric ack value: `"all"`
+    /// becomes `-1`, anything else must parse as an `i16`.
+    fn get_ack(config: &Config) -> Result<i16> {
+        match config.writer_acks.as_str() {
+            "all" => Ok(-1),
+            other => other
+                .parse::<i16>()
+                .map_err(|e| Error::IllegalArgument(e.to_string())),
+        }
+    }
+
+    /// Appends `record` to the accumulator and returns a handle for its batch result.
+    ///
+    /// The bucket is chosen by the table's bucket assigner. When the first
+    /// append is aborted because a new batch is needed, the assigner is
+    /// notified, a bucket is assigned again and the append is retried once.
+    pub async fn send(&self, record: &WriteRecord<'_>) -> Result<ResultHandle> {
+        let table_path = &record.table_path;
+        let cluster = self.metadata.get_cluster();
+
+        let bucket_assigner = {
+            if let Some(assigner) = self.bucket_assigners.get(table_path) {
+                assigner.clone()
+            } else {
+                let assigner = Arc::new(Self::create_bucket_assigner(table_path.as_ref()));
+                self.bucket_assigners
+                    .insert(table_path.as_ref().clone(), assigner.clone());
+                assigner
+            }
+        };
+
+        let bucket_id = bucket_assigner.assign_bucket(None, &cluster);
+
+        // Append to the bucket chosen by the assigner (this used to be a
+        // hard-coded bucket id, which ignored the assignment above).
+        let mut result = self
+            .accumulate
+            .append(record, bucket_id, &cluster, true)
+            .await?;
+
+        if result.abort_record_for_new_batch {
+            let prev_bucket_id = bucket_id;
+            bucket_assigner.on_new_batch(&cluster, prev_bucket_id);
+            let bucket_id = bucket_assigner.assign_bucket(None, &cluster);
+            result = self
+                .accumulate
+                .append(record, bucket_id, &cluster, false)
+                .await?;
+        }
+
+        if result.batch_is_full || result.new_batch_created {
+            // todo: wakeup
+        }
+
+        Ok(result.result_handle.expect("result_handle should exist"))
+    }
+
+    /// Signals the background task to stop and waits for it to finish.
+    ///
+    /// Returns `Error::WriteError` when the shutdown signal cannot be delivered
+    /// or when joining the task fails.
+    pub async fn close(self) -> Result<()> {
+        self.shutdown_tx
+            .send(())
+            .await
+            .map_err(|e| Error::WriteError(e.to_string()))?;
+
+        self.sender_join_handle
+            .await
+            .map_err(|e| Error::WriteError(e.to_string()))?;
+        Ok(())
+    }
+
+    /// Starts a flush on the accumulator and waits until it completes.
+    pub async fn flush(&self) -> Result<()> {
+        self.accumulate.begin_flush();
+        self.accumulate.await_flush_completion().await?;
+        Ok(())
+    }
+
+    /// Creates the bucket assigner for `table_path`; currently always a
+    /// `StickyBucketAssigner`.
+    pub fn create_bucket_assigner(table_path: &TablePath) -> Box<dyn BucketAssigner> {
+        // always sticky
+        Box::new(StickyBucketAssigner::new(table_path.clone()))
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/cluster/cluster.rs b/fluss-rust/crates/fluss/src/cluster/cluster.rs
new file mode 100644
index 0000000000..1f8341dd66
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/cluster/cluster.rs
@@ -0,0 +1,243 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::BucketId;
+use crate::cluster::{BucketLocation, ServerNode, ServerType};
+use crate::error::Result;
+use crate::metadata::{JsonSerde, TableBucket, TableDescriptor, TableInfo, TablePath};
+use crate::proto::MetadataResponse;
+use crate::rpc::{from_pb_server_node, from_pb_table_path};
+use rand::random_range;
+use std::collections::HashMap;
+
+/// Shared empty list handed out by `Cluster::get_available_buckets_for_table_path`
+/// when a table path has no entry.
+static EMPTY: Vec<BucketLocation> = Vec::new();
+
+/// Client-side view of the cluster: known servers, bucket locations and table metadata.
+#[derive(Default)]
+pub struct Cluster {
+    /// Coordinator server, when known.
+    coordinator_server: Option<ServerNode>,
+    /// Tablet servers indexed by server id.
+    alive_tablet_servers_by_id: HashMap<i32, ServerNode>,
+    /// The values of `alive_tablet_servers_by_id` as a list (built in `new`).
+    alive_tablet_servers: Vec<ServerNode>,
+    /// Bucket locations per table path.
+    available_locations_by_path: HashMap<TablePath, Vec<BucketLocation>>,
+    /// Bucket location per table bucket.
+    available_locations_by_bucket: HashMap<TableBucket, BucketLocation>,
+    /// Table id per table path.
+    table_id_by_path: HashMap<TablePath, i64>,
+    /// Inverse of `table_id_by_path` (built in `new`).
+    table_path_by_id: HashMap<i64, TablePath>,
+    /// Table info per table path.
+    table_info_by_path: HashMap<TablePath, TableInfo>,
+}
+
+impl Cluster {
+    /// Builds a cluster view from its parts.
+    ///
+    /// The server list and the id-to-path index are derived from
+    /// `alive_tablet_servers_by_id` and `table_id_by_path` respectively.
+    pub fn new(
+        coordinator_server: Option<ServerNode>,
+        alive_tablet_servers_by_id: HashMap<i32, ServerNode>,
+        available_locations_by_path: HashMap<TablePath, Vec<BucketLocation>>,
+        available_locations_by_bucket: HashMap<TableBucket, BucketLocation>,
+        table_id_by_path: HashMap<TablePath, i64>,
+        table_info_by_path: HashMap<TablePath, TableInfo>,
+    ) -> Self {
+        let alive_tablet_servers = alive_tablet_servers_by_id.values().cloned().collect();
+        let table_path_by_id = table_id_by_path
+            .iter()
+            .map(|(path, table_id)| (*table_id, path.clone()))
+            .collect();
+        Cluster {
+            coordinator_server,
+            alive_tablet_servers_by_id,
+            alive_tablet_servers,
+            available_locations_by_path,
+            available_locations_by_bucket,
+            table_id_by_path,
+            table_path_by_id,
+            table_info_by_path,
+        }
+    }
+
+    /// Replaces every field of this view with the corresponding field of `cluster`.
+    pub fn update(&mut self, cluster: Cluster) {
+        *self = cluster;
+    }
+
+    /// Builds a cluster view from a metadata response.
+    ///
+    /// Table infos and table ids of `origin_cluster` (if given) are carried
+    /// over and then overridden by the tables contained in the response.
+    /// Servers and bucket locations come from the response only.
+    ///
+    /// Returns an error when a table's JSON descriptor cannot be parsed or
+    /// deserialized.
+    pub fn from_metadata_response(
+        metadata_response: MetadataResponse,
+        origin_cluster: Option<&Cluster>,
+    ) -> Result<Cluster> {
+        let mut servers = HashMap::with_capacity(metadata_response.tablet_servers.len());
+        for pb_server in metadata_response.tablet_servers {
+            let server_id = pb_server.node_id;
+            let server_node = from_pb_server_node(pb_server, ServerType::TabletServer);
+            servers.insert(server_id, server_node);
+        }
+
+        let coordinator_server = metadata_response
+            .coordinator_server
+            .map(|node| from_pb_server_node(node, ServerType::CoordinatorServer));
+
+        let mut table_id_by_path = HashMap::new();
+        let mut table_info_by_path = HashMap::new();
+        if let Some(origin) = origin_cluster {
+            table_info_by_path.extend(origin.get_table_info_by_path().clone());
+            table_id_by_path.extend(origin.get_table_id_by_path().clone());
+        }
+
+        // Index the bucket locations by table path, and index bucket location by bucket
+        let mut tmp_available_location_by_bucket = HashMap::new();
+        let mut tmp_available_locations_by_path = HashMap::new();
+
+        for table_metadata in metadata_response.table_metadata {
+            let table_id = table_metadata.table_id;
+            let table_path = from_pb_table_path(&table_metadata.table_path);
+            // The JSON comes from the server; report malformed input instead of panicking.
+            let table_descriptor = TableDescriptor::deserialize_json(
+                &serde_json::from_slice(table_metadata.table_json.as_slice())
+                    .map_err(|e| crate::error::Error::JsonSerdeError(e.to_string()))?,
+            )?;
+            let table_info = TableInfo::of(
+                table_path.clone(),
+                table_id,
+                table_metadata.schema_id,
+                table_descriptor,
+                table_metadata.created_time,
+                table_metadata.modified_time,
+            );
+            table_info_by_path.insert(table_path.clone(), table_info);
+            // Keep the id index in sync with the info index; without this the
+            // tables of the response never appear in `table_id_by_path`.
+            table_id_by_path.insert(table_path.clone(), table_id);
+
+            // Now collect the bucket metadata. Only buckets whose leader is a
+            // known tablet server are recorded; when every bucket has such a
+            // leader this list is simply the full bucket list.
+            let mut available_bucket_for_table = vec![];
+            for bucket_metadata in table_metadata.bucket_metadata {
+                let bucket = TableBucket::new(table_id, bucket_metadata.bucket_id);
+                if let Some(leader_id) = bucket_metadata.leader_id
+                    && let Some(server_node) = servers.get(&leader_id)
+                {
+                    let bucket_location = BucketLocation::new(
+                        bucket.clone(),
+                        Some(server_node.clone()),
+                        table_path.clone(),
+                    );
+                    available_bucket_for_table.push(bucket_location.clone());
+                    tmp_available_location_by_bucket.insert(bucket, bucket_location);
+                }
+            }
+            tmp_available_locations_by_path.insert(table_path, available_bucket_for_table);
+        }
+        Ok(Cluster::new(
+            coordinator_server,
+            servers,
+            tmp_available_locations_by_path,
+            tmp_available_location_by_bucket,
+            table_id_by_path,
+            table_info_by_path,
+        ))
+    }
+
+    /// Returns the coordinator server, if known.
+    pub fn get_coordinator_server(&self) -> Option<&ServerNode> {
+        self.coordinator_server.as_ref()
+    }
+
+    /// Returns the leader of `table_bucket`, or `None` when the bucket has no
+    /// recorded location.
+    pub fn leader_for(&self, table_bucket: &TableBucket) -> Option<&ServerNode> {
+        self.available_locations_by_bucket
+            .get(table_bucket)
+            .and_then(|location| location.leader().as_ref())
+    }
+
+    /// Returns the tablet server with the given id, if known.
+    pub fn get_tablet_server(&self, id: i32) -> Option<&ServerNode> {
+        self.alive_tablet_servers_by_id.get(&id)
+    }
+
+    /// Builds the `TableBucket` for `bucket_id` of the table at `table_path`.
+    ///
+    /// Panics when the table is unknown (see `get_table`).
+    pub fn get_table_bucket(&self, table_path: &TablePath, bucket_id: BucketId) -> TableBucket {
+        let table_info = self.get_table(table_path);
+        TableBucket::new(table_info.table_id, bucket_id)
+    }
+
+    /// Returns the bucket locations of all tables, indexed by table path.
+    pub fn get_bucket_locations_by_path(&self) -> &HashMap<TablePath, Vec<BucketLocation>> {
+        &self.available_locations_by_path
+    }
+
+    /// Returns the table infos, indexed by table path.
+    pub fn get_table_info_by_path(&self) -> &HashMap<TablePath, TableInfo> {
+        &self.table_info_by_path
+    }
+
+    /// Returns the table ids, indexed by table path.
+    pub fn get_table_id_by_path(&self) -> &HashMap<TablePath, i64> {
+        &self.table_id_by_path
+    }
+
+    /// Returns the bucket locations recorded for `table_path`, or an empty
+    /// list when the path has no entry.
+    pub fn get_available_buckets_for_table_path(
+        &self,
+        table_path: &TablePath,
+    ) -> &Vec<BucketLocation> {
+        self.available_locations_by_path
+            .get(table_path)
+            .unwrap_or(&EMPTY)
+    }
+
+    /// Returns a randomly chosen tablet server.
+    ///
+    /// Panics when the cluster has no tablet server.
+    pub fn get_one_available_server(&self) -> &ServerNode {
+        assert!(
+            !self.alive_tablet_servers.is_empty(),
+            "no alive tablet server in cluster"
+        );
+        let offset = random_range(0..self.alive_tablet_servers.len());
+        self.alive_tablet_servers
+            .get(offset)
+            .unwrap_or_else(|| panic!("can't find alive tab server by offset {offset}"))
+    }
+
+    /// Returns the number of buckets of the table at `table_path`.
+    ///
+    /// Panics when the table is unknown (see `get_table`).
+    pub fn get_bucket_count(&self, table_path: &TablePath) -> i32 {
+        self.get_table(table_path).num_buckets
+    }
+
+    /// Returns the info of the table at `table_path`.
+    ///
+    /// Panics when the table is unknown; use `opt_get_table` for a
+    /// non-panicking lookup.
+    pub fn get_table(&self, table_path: &TablePath) -> &TableInfo {
+        self.table_info_by_path
+            .get(table_path)
+            .unwrap_or_else(|| panic!("can't find table info by path {table_path}"))
+    }
+
+    /// Returns the info of the table at `table_path`, or `None` when unknown.
+    pub fn opt_get_table(&self, table_path: &TablePath) -> Option<&TableInfo> {
+        self.table_info_by_path.get(table_path)
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/cluster/mod.rs b/fluss-rust/crates/fluss/src/cluster/mod.rs
new file mode 100644
index 0000000000..f9d42e4453
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/cluster/mod.rs
@@ -0,0 +1,99 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::BucketId;
+use crate::metadata::{TableBucket, TablePath};
+
+#[allow(clippy::module_inception)]
+mod cluster;
+
+pub use cluster::Cluster;
+
+/// Identity and address of a single server in the cluster.
+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
+pub struct ServerNode {
+    id: i32,
+    uid: String,
+    host: String,
+    port: u32,
+    server_type: ServerType,
+}
+
+impl ServerNode {
+    /// Creates a node whose `uid` is the id prefixed with `cs-` for a
+    /// coordinator server or `ts-` for a tablet server.
+    pub fn new(id: i32, host: String, port: u32, server_type: ServerType) -> ServerNode {
+        let uid = match server_type {
+            ServerType::TabletServer => format!("ts-{id}"),
+            ServerType::CoordinatorServer => format!("cs-{id}"),
+        };
+        Self {
+            id,
+            uid,
+            host,
+            port,
+            server_type,
+        }
+    }
+
+    /// Numeric id of the server.
+    pub fn id(&self) -> i32 {
+        self.id
+    }
+
+    /// Type-prefixed unique id, e.g. `ts-3`.
+    pub fn uid(&self) -> &String {
+        &self.uid
+    }
+
+    /// Address of the server in `host:port` form.
+    pub fn url(&self) -> String {
+        format!("{}:{}", self.host, self.port)
+    }
+}
+
+/// Role of a server; determines the uid prefix chosen in `ServerNode::new`.
+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
+pub enum ServerType {
+    /// Tablet server (uid prefix `ts-`).
+    TabletServer,
+    /// Coordinator server (uid prefix `cs-`).
+    CoordinatorServer,
+}
+
+/// Location of one table bucket: the bucket, its leader (if any) and the
+/// path of the table it belongs to.
+#[derive(Debug, Clone)]
+pub struct BucketLocation {
+    /// The bucket this location describes.
+    pub table_bucket: TableBucket,
+    /// Leader server of the bucket; `None` when no leader is recorded.
+    leader: Option<ServerNode>,
+    /// Path of the table that owns the bucket.
+    pub table_path: TablePath,
+}
+
+impl BucketLocation {
+    /// Creates a location from its bucket, optional leader and table path.
+    pub fn new(
+        table_bucket: TableBucket,
+        leader: Option<ServerNode>,
+        table_path: TablePath,
+    ) -> BucketLocation {
+        BucketLocation {
+            table_bucket,
+            leader,
+            table_path,
+        }
+    }
+
+    /// Returns the leader server, if one is recorded.
+    pub fn leader(&self) -> &Option<ServerNode> {
+        &self.leader
+    }
+
+    /// Returns the bucket this location describes.
+    pub fn table_bucket(&self) -> &TableBucket {
+        &self.table_bucket
+    }
+
+    /// Returns the bucket id of `table_bucket`.
+    pub fn bucket_id(&self) -> BucketId {
+        self.table_bucket.bucket_id()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
new file mode 100644
index 0000000000..08574965f4
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -0,0 +1,39 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use clap::Parser;
+use serde::{Deserialize, Serialize};
+
+/// Default for `Config::request_max_size` (10 MiB).
+const DEFAULT_REQUEST_MAX_SIZE: i32 = 10 * 1024 * 1024;
+/// Default for `Config::writer_acks`.
+const DEFAULT_WRITER_ACKS: &str = "all";
+/// Default for `Config::writer_retries`.
+const DEFAULT_WRITER_RETRIES: i32 = i32::MAX;
+/// Default for `Config::writer_batch_size` (2 MiB).
+const DEFAULT_WRITER_BATCH_SIZE: i32 = 2 * 1024 * 1024;
+
+/// Client configuration, usable from the command line (clap) and via serde.
+///
+/// `Config::default()` yields the same values as the command-line defaults.
+#[derive(Parser, Debug, Clone, Deserialize, Serialize)]
+#[command(author, version, about, long_about = None)]
+pub struct Config {
+    /// Bootstrap server address; omitted from serialized output when unset.
+    #[arg(long)]
+    #[serde(skip_serializing_if = "Option::is_none")]
+    pub bootstrap_server: Option<String>,
+
+    /// Maximum request size handed to the writer's sender.
+    #[arg(long, default_value_t = DEFAULT_REQUEST_MAX_SIZE)]
+    pub request_max_size: i32,
+
+    /// Acknowledgement setting: `"all"` or a number that fits in an `i16`.
+    #[arg(long, default_value_t = String::from(DEFAULT_WRITER_ACKS))]
+    pub writer_acks: String,
+
+    /// Retry count handed to the writer's sender.
+    #[arg(long, default_value_t = DEFAULT_WRITER_RETRIES)]
+    pub writer_retries: i32,
+
+    /// Writer batch size setting.
+    #[arg(long, default_value_t = DEFAULT_WRITER_BATCH_SIZE)]
+    pub writer_batch_size: i32,
+}
+
+impl Default for Config {
+    /// Mirrors the command-line defaults. A derived `Default` would produce
+    /// zero sizes and an empty `writer_acks`, which the writer rejects.
+    fn default() -> Self {
+        Self {
+            bootstrap_server: None,
+            request_max_size: DEFAULT_REQUEST_MAX_SIZE,
+            writer_acks: String::from(DEFAULT_WRITER_ACKS),
+            writer_retries: DEFAULT_WRITER_RETRIES,
+            writer_batch_size: DEFAULT_WRITER_BATCH_SIZE,
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
new file mode 100644
index 0000000000..58b88a4786
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -0,0 +1,50 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::RpcError;
+use arrow_schema::ArrowError;
+use std::{io, result};
+use thiserror::Error;
+
+pub type Result<T> = result::Result<T, Error>;
+
+/// Errors reported by the Fluss client.
+///
+/// Variants that carry a `String` include it in their display output;
+/// variants converted from another error type expose it through `source()`.
+#[derive(Debug, Error)]
+pub enum Error {
+    /// I/O failure; displayed exactly like the wrapped `io::Error`.
+    #[error(transparent)]
+    Io(#[from] io::Error),
+
+    /// A table is invalid; the payload describes why.
+    #[error("Invalid table: {0}")]
+    InvalidTableError(String),
+
+    /// JSON (de)serialization failed; the payload describes why.
+    #[error("Json serde error: {0}")]
+    JsonSerdeError(String),
+
+    /// An RPC call failed.
+    #[error("Rpc error")]
+    RpcError(#[from] RpcError),
+
+    /// A row could not be converted; the payload describes why.
+    #[error("Row convert error: {0}")]
+    RowConvertError(String),
+
+    /// An Arrow operation failed.
+    #[error("arrow error")]
+    ArrowError(#[from] ArrowError),
+
+    /// Writing records failed; the payload describes why.
+    #[error("Write error: {0}")]
+    WriteError(String),
+
+    /// An argument or configuration value is not acceptable.
+    #[error("Illegal argument error: {0}")]
+    IllegalArgument(String),
+}
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
new file mode 100644
index 0000000000..e63b5edfd8
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -0,0 +1,37 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+pub mod client;
+pub mod metadata;
+pub mod record;
+pub mod row;
+pub mod rpc;
+
+mod cluster;
+
+pub mod config;
+pub mod error;
+
+mod util;
+
+/// Identifier of a table.
+// NOTE(review): table ids are handled as `i64` elsewhere in this crate (e.g. the
+// cluster's path-to-id map) - confirm whether `u64` is intended here.
+pub type TableId = u64;
+/// Identifier of a partition.
+pub type PartitionId = u64;
+/// Identifier of a bucket within a table.
+pub type BucketId = i32;
+
+/// Types included from the `proto.rs` file found in the build's `OUT_DIR`.
+pub mod proto {
+    include!(concat!(env!("OUT_DIR"), "/proto.rs"));
+}
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
new file mode 100644
index 0000000000..0c00c6f08e
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -0,0 +1,814 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use serde::{Deserialize, Serialize};
+use std::fmt::{Display, Formatter};
+
+/// Data type for Fluss table. Each variant wraps the struct that carries that type's
+/// nullability flag and, where applicable, its parameters. Impl reference: <todo: link>
+#[derive(Debug, Clone, PartialEq, Eq, Hash, Serialize, Deserialize)]
+pub enum DataType {
+    Boolean(BooleanType),
+    TinyInt(TinyIntType),
+    SmallInt(SmallIntType),
+    Int(IntType),
+    BigInt(BigIntType),
+    Float(FloatType),
+    Double(DoubleType),
+    Char(CharType),
+    String(StringType),
+    Decimal(DecimalType),
+    Date(DateType),
+    Time(TimeType),
+    Timestamp(TimestampType),
+    TimestampLTz(TimestampLTzType),
+    Bytes(BytesType),
+    Binary(BinaryType),
+    Array(ArrayType),
+    Map(MapType),
+    Row(RowType),
+}
+
+impl DataType {
+    pub fn is_nullable(&self) -> bool {
+        match self {
+            Self::Boolean(t) => t.nullable, // every wrapped type stores its own flag
+            Self::TinyInt(t) => t.nullable,
+            Self::SmallInt(t) => t.nullable,
+            Self::Int(t) => t.nullable,
+            Self::BigInt(t) => t.nullable,
+            Self::Float(t) => t.nullable,
+            Self::Double(t) => t.nullable,
+            Self::Char(t) => t.nullable,
+            Self::String(t) => t.nullable,
+            Self::Decimal(t) => t.nullable,
+            Self::Date(t) => t.nullable,
+            Self::Time(t) => t.nullable,
+            Self::Timestamp(t) => t.nullable,
+            Self::TimestampLTz(t) => t.nullable,
+            Self::Bytes(t) => t.nullable,
+            Self::Binary(t) => t.nullable,
+            Self::Array(t) => t.nullable,
+            Self::Map(t) => t.nullable,
+            Self::Row(t) => t.nullable,
+        }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        match self {
+            Self::Boolean(t) => Self::Boolean(t.as_non_nullable()), // variant stays the same
+            Self::TinyInt(t) => Self::TinyInt(t.as_non_nullable()),
+            Self::SmallInt(t) => Self::SmallInt(t.as_non_nullable()),
+            Self::Int(t) => Self::Int(t.as_non_nullable()),
+            Self::BigInt(t) => Self::BigInt(t.as_non_nullable()),
+            Self::Float(t) => Self::Float(t.as_non_nullable()),
+            Self::Double(t) => Self::Double(t.as_non_nullable()),
+            Self::Char(t) => Self::Char(t.as_non_nullable()),
+            Self::String(t) => Self::String(t.as_non_nullable()),
+            Self::Decimal(t) => Self::Decimal(t.as_non_nullable()),
+            Self::Date(t) => Self::Date(t.as_non_nullable()),
+            Self::Time(t) => Self::Time(t.as_non_nullable()),
+            Self::Timestamp(t) => Self::Timestamp(t.as_non_nullable()),
+            Self::TimestampLTz(t) => Self::TimestampLTz(t.as_non_nullable()),
+            Self::Bytes(t) => Self::Bytes(t.as_non_nullable()),
+            Self::Binary(t) => Self::Binary(t.as_non_nullable()),
+            Self::Array(t) => Self::Array(t.as_non_nullable()),
+            Self::Map(t) => Self::Map(t.as_non_nullable()),
+            Self::Row(t) => Self::Row(t.as_non_nullable()),
+        }
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct BooleanType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for BooleanType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `BooleanType::new()`
+    }
+}
+
+impl BooleanType {
+    pub fn new() -> Self {
+        BooleanType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        BooleanType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        BooleanType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct TinyIntType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for TinyIntType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `TinyIntType::new()`
+    }
+}
+
+impl TinyIntType {
+    pub fn new() -> Self {
+        TinyIntType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        TinyIntType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        TinyIntType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct SmallIntType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for SmallIntType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `SmallIntType::new()`
+    }
+}
+
+impl SmallIntType {
+    pub fn new() -> Self {
+        SmallIntType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        SmallIntType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        SmallIntType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct IntType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for IntType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `IntType::new()`
+    }
+}
+
+impl IntType {
+    pub fn new() -> Self {
+        IntType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        IntType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        IntType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct BigIntType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for BigIntType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `BigIntType::new()`
+    }
+}
+
+impl BigIntType {
+    pub fn new() -> Self {
+        BigIntType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        BigIntType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        BigIntType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct FloatType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for FloatType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `FloatType::new()`
+    }
+}
+
+impl FloatType {
+    pub fn new() -> Self {
+        FloatType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        FloatType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        FloatType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct DoubleType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for DoubleType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `DoubleType::new()`
+    }
+}
+
+impl DoubleType {
+    pub fn new() -> Self {
+        DoubleType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        DoubleType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        DoubleType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+/// Character type rendered as `CHAR(n)`; `n` is kept in `length` and is not range-checked here.
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct CharType {
+    nullable: bool,
+    length: u32,
+}
+
+impl CharType {
+    pub fn new(length: u32) -> Self {
+        CharType::with_nullable(length, true)
+    }
+
+    pub fn with_nullable(length: u32, nullable: bool) -> Self {
+        CharType { nullable, length }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        CharType::with_nullable(self.length, false)
+    }
+
+    pub fn length(&self) -> u32 {
+        self.length
+    }
+}
+
+impl Display for CharType {
+    /// Writes `CHAR(n)`, followed by ` NOT NULL` when the type is not nullable.
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        let null_suffix = if self.nullable { "" } else { " NOT NULL" };
+        write!(f, "CHAR({})", self.length)?;
+        f.write_str(null_suffix)
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct StringType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for StringType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `StringType::new()`
+    }
+}
+
+impl StringType {
+    pub fn new() -> Self {
+        StringType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        StringType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        StringType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct DecimalType {
+    nullable: bool, // true when NULL is an accepted value
+    precision: u32, // total number of digits, the `p` in `DECIMAL(p, s)`
+    scale: u32, // digits right of the decimal point, the `s` in `DECIMAL(p, s)`
+}
+
+impl DecimalType {
+    pub const MIN_PRECISION: u32 = 1; // bounds are declared here; constructors do not check them
+
+    pub const MAX_PRECISION: u32 = 38;
+
+    pub const DEFAULT_PRECISION: u32 = 10;
+
+    pub const MIN_SCALE: u32 = 0;
+
+    pub const DEFAULT_SCALE: u32 = 0;
+
+    pub fn new(precision: u32, scale: u32) -> Self {
+        DecimalType::with_nullable(true, precision, scale)
+    }
+
+    pub fn with_nullable(nullable: bool, precision: u32, scale: u32) -> Self {
+        Self {
+            nullable,
+            precision,
+            scale,
+        }
+    }
+
+    pub fn precision(&self) -> u32 {
+        self.precision
+    }
+
+    pub fn scale(&self) -> u32 {
+        self.scale
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        DecimalType::with_nullable(false, self.precision, self.scale)
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct DateType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for DateType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `DateType::new()`
+    }
+}
+
+impl DateType {
+    pub fn new() -> Self {
+        DateType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        DateType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        DateType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct TimeType {
+    nullable: bool, // true when NULL is an accepted value
+    precision: u32, // digits of fractional seconds, the `p` in `TIME(p)`
+}
+
+impl Default for TimeType {
+    fn default() -> Self {
+        Self::new(Self::DEFAULT_PRECISION) // nullable; a derived impl would yield `nullable: false`
+    }
+}
+
+impl TimeType {
+    pub const MIN_PRECISION: u32 = 0; // bounds are declared here; constructors do not check them
+
+    pub const MAX_PRECISION: u32 = 9;
+
+    pub const DEFAULT_PRECISION: u32 = 0;
+
+    pub fn new(precision: u32) -> Self {
+        Self::with_nullable(true, precision)
+    }
+
+    pub fn with_nullable(nullable: bool, precision: u32) -> Self {
+        TimeType {
+            nullable,
+            precision,
+        }
+    }
+
+    pub fn precision(&self) -> u32 {
+        self.precision
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        Self::with_nullable(false, self.precision)
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct TimestampType {
+    nullable: bool, // true when NULL is an accepted value
+    precision: u32, // digits of fractional seconds, the `p` in `TIMESTAMP(p)`
+}
+
+impl Default for TimestampType {
+    fn default() -> Self {
+        TimestampType::with_nullable(true, Self::DEFAULT_PRECISION)
+    }
+}
+
+impl TimestampType {
+    pub const MIN_PRECISION: u32 = 0; // bounds are declared here; constructors do not check them
+
+    pub const MAX_PRECISION: u32 = 9;
+
+    pub const DEFAULT_PRECISION: u32 = 6;
+
+    pub fn new(precision: u32) -> Self {
+        TimestampType::with_nullable(true, precision)
+    }
+
+    pub fn with_nullable(nullable: bool, precision: u32) -> Self {
+        Self {
+            nullable,
+            precision,
+        }
+    }
+
+    pub fn precision(&self) -> u32 {
+        self.precision
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        TimestampType::with_nullable(false, self.precision)
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct TimestampLTzType {
+    nullable: bool, // true when NULL is an accepted value
+    precision: u32, // digits of fractional seconds
+}
+
+impl Default for TimestampLTzType {
+    fn default() -> Self {
+        TimestampLTzType::with_nullable(true, Self::DEFAULT_PRECISION)
+    }
+}
+
+impl TimestampLTzType {
+    pub const MIN_PRECISION: u32 = 0; // bounds are declared here; constructors do not check them
+
+    pub const MAX_PRECISION: u32 = 9;
+
+    pub const DEFAULT_PRECISION: u32 = 6;
+
+    pub fn new(precision: u32) -> Self {
+        TimestampLTzType::with_nullable(true, precision)
+    }
+
+    pub fn with_nullable(nullable: bool, precision: u32) -> Self {
+        Self {
+            nullable,
+            precision,
+        }
+    }
+
+    pub fn precision(&self) -> u32 {
+        self.precision
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        TimestampLTzType::with_nullable(false, self.precision)
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct BytesType {
+    nullable: bool, // true when NULL is an accepted value
+}
+
+impl Default for BytesType {
+    fn default() -> Self {
+        Self::with_nullable(true) // same value as `BytesType::new()`
+    }
+}
+
+impl BytesType {
+    pub fn new() -> Self {
+        BytesType { nullable: true } // nullable unless requested otherwise
+    }
+
+    pub fn with_nullable(nullable: bool) -> Self {
+        BytesType { nullable }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        BytesType { nullable: false } // copy with the nullable flag cleared
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+pub struct BinaryType {
+    nullable: bool, // true when NULL is an accepted value
+    length: usize, // declared length of the binary value
+}
+
+impl BinaryType {
+    pub const MIN_LENGTH: usize = 1; // bounds are declared here; constructors do not check them
+
+    pub const MAX_LENGTH: usize = usize::MAX;
+
+    pub const DEFAULT_LENGTH: usize = 1;
+
+    pub fn new(length: usize) -> Self {
+        BinaryType::with_nullable(true, length)
+    }
+
+    pub fn with_nullable(nullable: bool, length: usize) -> Self {
+        BinaryType { nullable, length }
+    }
+
+    pub fn length(&self) -> usize {
+        self.length
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        BinaryType::with_nullable(false, self.length)
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, Hash, Serialize, Deserialize)]
+pub struct ArrayType {
+    nullable: bool,
+    element_type: Box<DataType>, // boxed: `DataType` itself contains `ArrayType`
+}
+
+impl ArrayType {
+    pub fn new(element_type: DataType) -> Self {
+        ArrayType::with_nullable(true, element_type)
+    }
+
+    pub fn with_nullable(nullable: bool, element_type: DataType) -> Self {
+        let boxed_element = Box::new(element_type);
+        ArrayType {
+            nullable,
+            element_type: boxed_element,
+        }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        let mut copy = self.clone();
+        copy.nullable = false;
+        copy
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, Deserialize, Serialize, Hash)]
+pub struct MapType {
+    nullable: bool,
+    key_type: Box<DataType>, // boxed: `DataType` itself contains `MapType`
+    value_type: Box<DataType>,
+}
+
+impl MapType {
+    pub fn new(key_type: DataType, value_type: DataType) -> Self {
+        MapType::with_nullable(true, key_type, value_type)
+    }
+
+    pub fn with_nullable(nullable: bool, key_type: DataType, value_type: DataType) -> Self {
+        let boxed_key = Box::new(key_type);
+        let boxed_value = Box::new(value_type);
+        MapType {
+            nullable,
+            key_type: boxed_key,
+            value_type: boxed_value,
+        }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        let mut copy = self.clone();
+        copy.nullable = false;
+        copy
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, Deserialize, Serialize, Hash)]
+pub struct RowType {
+    nullable: bool, // true when NULL is an accepted value
+    fields: Vec<DataField>, // the row's fields, in declaration order
+}
+
+impl RowType {
+    pub const fn new(fields: Vec<DataField>) -> Self {
+        RowType::with_nullable(true, fields)
+    }
+
+    pub const fn with_nullable(nullable: bool, fields: Vec<DataField>) -> Self {
+        RowType { nullable, fields }
+    }
+
+    pub fn as_non_nullable(&self) -> Self {
+        RowType::with_nullable(false, self.fields.clone())
+    }
+
+    pub fn fields(&self) -> &Vec<DataField> {
+        &self.fields
+    }
+}
+
+pub struct DataTypes; // carries no data; groups the factory functions below
+
+impl DataTypes {
+    pub fn binary(length: usize) -> DataType {
+        DataType::Binary(BinaryType::with_nullable(true, length)) // nullable BINARY of `length`
+    }
+
+    pub fn bytes() -> DataType {
+        DataType::Bytes(BytesType::with_nullable(true)) // nullable BYTES
+    }
+
+    pub fn boolean() -> DataType {
+        DataType::Boolean(BooleanType::with_nullable(true)) // nullable BOOLEAN
+    }
+
+    pub fn int() -> DataType {
+        DataType::Int(IntType::with_nullable(true)) // nullable INTEGER
+    }
+
+    /// Data type of a 1-byte signed integer with values from -128 to 127.
+    pub fn tinyint() -> DataType {
+        DataType::TinyInt(TinyIntType::with_nullable(true))
+    }
+
+    /// Data type of a 2-byte signed integer with values from -32,768 to 32,767.
+    pub fn smallint() -> DataType {
+        DataType::SmallInt(SmallIntType::with_nullable(true))
+    }
+
+    pub fn bigint() -> DataType {
+        DataType::BigInt(BigIntType::with_nullable(true)) // nullable BIGINT
+    }
+
+    /// Data type of a 4-byte single precision floating point number.
+    pub fn float() -> DataType {
+        DataType::Float(FloatType::with_nullable(true))
+    }
+
+    /// Data type of an 8-byte double precision floating point number.
+    pub fn double() -> DataType {
+        DataType::Double(DoubleType::with_nullable(true))
+    }
+
+    pub fn char(length: u32) -> DataType {
+        DataType::Char(CharType::with_nullable(length, true)) // nullable CHAR(length)
+    }
+
+    /// Data type of a variable-length character string.
+    pub fn string() -> DataType {
+        DataType::String(StringType::with_nullable(true))
+    }
+
+    /// Data type of a decimal number with fixed precision and scale `DECIMAL(p, s)` where
+    /// `p` is the number of digits in a number (=precision) and `s` is the number of
+    /// digits to the right of the decimal point in a number (=scale). `p` must have a value
+    /// between 1 and 38 (both inclusive). `s` must have a value between 0 and `p` (both inclusive).
+    pub fn decimal(precision: u32, scale: u32) -> DataType {
+        DataType::Decimal(DecimalType::with_nullable(true, precision, scale))
+    }
+
+    pub fn date() -> DataType {
+        DataType::Date(DateType::with_nullable(true)) // nullable DATE
+    }
+
+    /// Data type of a time WITHOUT time zone `TIME` with no fractional seconds by default.
+    pub fn time() -> DataType {
+        DataType::Time(TimeType::new(TimeType::DEFAULT_PRECISION))
+    }
+
+    /// Data type of a time WITHOUT time zone `TIME(p)` where `p` is the number of digits
+    /// of fractional seconds (=precision). `p` must have a value between 0 and 9 (both inclusive).
+    pub fn time_with_precision(precision: u32) -> DataType {
+        DataType::Time(TimeType::with_nullable(true, precision))
+    }
+
+    /// Data type of a timestamp WITHOUT time zone `TIMESTAMP` with 6 digits of fractional
+    /// seconds by default.
+    pub fn timestamp() -> DataType {
+        DataType::Timestamp(TimestampType::new(TimestampType::DEFAULT_PRECISION))
+    }
+
+    /// Data type of a timestamp WITHOUT time zone `TIMESTAMP(p)` where `p` is the number
+    /// of digits of fractional seconds (=precision). `p` must have a value between 0 and 9
+    /// (both inclusive).
+    pub fn timestamp_with_precision(precision: u32) -> DataType {
+        DataType::Timestamp(TimestampType::with_nullable(true, precision))
+    }
+
+    /// Data type of a timestamp WITH LOCAL time zone `TIMESTAMP WITH LOCAL TIME ZONE` with
+    /// 6 digits of fractional seconds by default.
+    pub fn timestamp_ltz() -> DataType {
+        DataType::TimestampLTz(TimestampLTzType::new(TimestampLTzType::DEFAULT_PRECISION))
+    }
+
+    /// Data type of a timestamp WITH LOCAL time zone `TIMESTAMP(p) WITH LOCAL TIME ZONE` where `p`
+    /// is the number of digits of fractional seconds (=precision). `p` must be between 0 and 9.
+    pub fn timestamp_ltz_with_precision(precision: u32) -> DataType {
+        DataType::TimestampLTz(TimestampLTzType::with_nullable(true, precision))
+    }
+
+    /// Data type of an array of elements with same subtype.
+    pub fn array(element: DataType) -> DataType {
+        DataType::Array(ArrayType::with_nullable(true, element))
+    }
+
+    /// Data type of an associative array that maps keys to values.
+    pub fn map(key_type: DataType, value_type: DataType) -> DataType {
+        DataType::Map(MapType::with_nullable(true, key_type, value_type))
+    }
+
+    /// Field definition with field name and data type.
+    pub fn field(name: String, data_type: DataType) -> DataField {
+        DataField::new(name, data_type, None)
+    }
+
+    /// Field definition with field name, data type, and a description.
+    pub fn field_with_description(
+        name: String,
+        data_type: DataType,
+        description: String,
+    ) -> DataField {
+        DataField::new(name, data_type, Some(description))
+    }
+
+    /// Data type of a sequence of fields.
+    pub fn row(fields: Vec<DataField>) -> DataType {
+        DataType::Row(RowType::with_nullable(true, fields))
+    }
+
+    /// Data type of a sequence of fields with generated field names (f0, f1, f2, ...).
+    pub fn row_from_types(field_types: Vec<DataType>) -> DataType {
+        // The generated name is "f" followed by the zero-based position of the type.
+        let mut fields = Vec::with_capacity(field_types.len());
+        for (i, field_type) in field_types.into_iter().enumerate() {
+            fields.push(DataField::new(format!("f{i}"), field_type, None));
+        }
+        DataType::Row(RowType::with_nullable(true, fields))
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, Hash, Serialize, Deserialize)]
+pub struct DataField {
+    pub name: String,
+    pub data_type: DataType,
+    pub description: Option<String>, // `None` when the field carries no description
+}
+
+impl DataField {
+    pub fn new(name: String, data_type: DataType, description: Option<String>) -> Self {
+        Self {
+            name,
+            data_type,
+            description,
+        }
+    }
+
+    pub fn name(&self) -> &str {
+        self.name.as_str()
+    }
+
+    pub fn data_type(&self) -> &DataType {
+        &self.data_type
+    }
+}
+
+// todo: implement display for datatype
diff --git a/fluss-rust/crates/fluss/src/metadata/json_serde.rs b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
new file mode 100644
index 0000000000..1c7604c98a
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
@@ -0,0 +1,464 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Error::{InvalidTableError, JsonSerdeError};
+use crate::error::Result;
+use crate::metadata::datatype::{DataType, DataTypes};
+use crate::metadata::table::{Column, Schema, TableDescriptor};
+use serde_json::{Value, json};
+use std::collections::HashMap;
+
+pub trait JsonSerde: Sized {
+    fn serialize_json(&self) -> Result<Value>; // builds the JSON tree for `self`
+
+    fn deserialize_json(node: &Value) -> Result<Self>; // rebuilds a value from the tree `node`
+}
+
+impl DataType {
+    pub fn to_type_root(&self) -> &str {
+        match self {
+            Self::Boolean(..) => "BOOLEAN", // these names are written as the JSON `type` value
+            Self::TinyInt(..) => "TINYINT",
+            Self::SmallInt(..) => "SMALLINT",
+            Self::Int(..) => "INTEGER",
+            Self::BigInt(..) => "BIGINT",
+            Self::Float(..) => "FLOAT",
+            Self::Double(..) => "DOUBLE",
+            Self::Char(..) => "CHAR",
+            Self::String(..) => "STRING",
+            Self::Decimal(..) => "DECIMAL",
+            Self::Date(..) => "DATE",
+            Self::Time(..) => "TIME_WITHOUT_TIME_ZONE",
+            Self::Timestamp(..) => "TIMESTAMP_WITHOUT_TIME_ZONE",
+            Self::TimestampLTz(..) => "TIMESTAMP_WITH_LOCAL_TIME_ZONE",
+            Self::Bytes(..) => "BYTES",
+            Self::Binary(..) => "BINARY",
+            Self::Array(..) => "ARRAY",
+            Self::Map(..) => "MAP",
+            Self::Row(..) => "ROW",
+        }
+    }
+}
+
+impl DataType {
+    const FIELD_NAME_TYPE_NAME: &'static str = "type"; // JSON key holding the type root name
+    const FIELD_NAME_NULLABLE: &'static str = "nullable"; // written only for non-nullable types
+    const FIELD_NAME_LENGTH: &'static str = "length"; // written for CHAR and BINARY
+    #[allow(dead_code)]
+    const FIELD_NAME_PRECISION: &'static str = "precision";
+    #[allow(dead_code)]
+    const FILED_NAME_SCALE: &'static str = "scale"; // NOTE(review): "FILED" is a typo of "FIELD"
+    #[allow(dead_code)]
+    const FIELD_NAME_ELEMENT_TYPE: &'static str = "element_type";
+    #[allow(dead_code)]
+    const FIELD_NAME_KEY_TYPE: &'static str = "key_type";
+    #[allow(dead_code)]
+    const FIELD_NAME_VALUE_TYPE: &'static str = "value_type";
+    #[allow(dead_code)]
+    const FIELD_NAME_FIELDS: &'static str = "fields";
+    #[allow(dead_code)]
+    const FIELD_NAME_FIELD_NAME: &'static str = "name";
+    // ROW (presumably the per-field keys of a ROW type; not referenced yet - TODO confirm)
+    #[allow(dead_code)]
+    const FIELD_NAME_FIELD_TYPE: &'static str = "field_type";
+    #[allow(dead_code)]
+    const FIELD_NAME_FIELD_DESCRIPTION: &'static str = "description";
+}
+
+impl JsonSerde for DataType {
+    /// Writes the type root, `nullable: false` for non-nullable types and the `length` of
+    /// CHAR/BINARY. Types whose encoding is not implemented yet yield `JsonSerdeError`.
+    fn serialize_json(&self) -> Result<Value> {
+        let mut obj = serde_json::Map::new();
+
+        obj.insert(
+            Self::FIELD_NAME_TYPE_NAME.to_string(),
+            json!(Self::to_type_root(self)),
+        );
+        if !self.is_nullable() {
+            obj.insert(Self::FIELD_NAME_NULLABLE.to_string(), json!(false));
+        }
+
+        match self {
+            DataType::Boolean(_)
+            | DataType::TinyInt(_)
+            | DataType::SmallInt(_)
+            | DataType::Int(_)
+            | DataType::BigInt(_)
+            | DataType::Float(_)
+            | DataType::Double(_)
+            | DataType::String(_)
+            | DataType::Bytes(_)
+            | DataType::Date(_) => {
+                // do nothing
+            }
+            DataType::Char(_type) => {
+                obj.insert(Self::FIELD_NAME_LENGTH.to_string(), json!(_type.length()));
+            }
+            DataType::Binary(_type) => {
+                obj.insert(Self::FIELD_NAME_LENGTH.to_string(), json!(_type.length()));
+            }
+            DataType::Decimal(_)
+            | DataType::Time(_)
+            | DataType::Timestamp(_)
+            | DataType::TimestampLTz(_)
+            | DataType::Array(_)
+            | DataType::Map(_)
+            | DataType::Row(_) => {
+                return Err(JsonSerdeError(format!(
+                    "Serializing data type {} is not supported yet.",
+                    self.to_type_root()
+                )));
+            }
+        }
+        Ok(Value::Object(obj))
+    }
+
+    /// Rebuilds a type from its root name and optional `nullable` flag. A missing or unknown
+    /// root, or a type whose decoding is not implemented yet, yields `JsonSerdeError`.
+    fn deserialize_json(node: &Value) -> Result<Self> {
+        let type_root = node
+            .get(Self::FIELD_NAME_TYPE_NAME)
+            .and_then(|v| v.as_str())
+            .ok_or_else(|| {
+                JsonSerdeError(format!(
+                    "Couldn't find field {} while deserializing datatype.",
+                    Self::FIELD_NAME_TYPE_NAME
+                ))
+            })?;
+
+        let mut data_type = match type_root {
+            "BOOLEAN" => DataTypes::boolean(),
+            "TINYINT" => DataTypes::tinyint(),
+            "SMALLINT" => DataTypes::smallint(),
+            "INTEGER" => DataTypes::int(),
+            "BIGINT" => DataTypes::bigint(),
+            "FLOAT" => DataTypes::float(),
+            "DOUBLE" => DataTypes::double(),
+            "STRING" => DataTypes::string(),
+            "DATE" => DataTypes::date(),
+            "BYTES" => DataTypes::bytes(),
+            "CHAR"
+            | "DECIMAL"
+            | "TIME_WITHOUT_TIME_ZONE"
+            | "TIMESTAMP_WITHOUT_TIME_ZONE"
+            | "TIMESTAMP_WITH_LOCAL_TIME_ZONE"
+            | "BINARY"
+            | "ARRAY"
+            | "MAP"
+            | "ROW" => {
+                return Err(JsonSerdeError(format!(
+                    "Deserializing data type {type_root} is not supported yet."
+                )));
+            }
+            _ => return Err(JsonSerdeError(format!("Unknown type root: {type_root}"))),
+        };
+
+        if node.get(Self::FIELD_NAME_NULLABLE).and_then(|v| v.as_bool()) == Some(false) {
+            data_type = data_type.as_non_nullable();
+        }
+        Ok(data_type)
+    }
+}
+
+impl Column {
+    const NAME: &'static str = "name";
+    const DATA_TYPE: &'static str = "data_type";
+    const COMMENT: &'static str = "comment";
+}
+
+impl JsonSerde for Column {
+    /// Writes `name`, `data_type` and, when one is set, `comment`.
+    fn serialize_json(&self) -> Result<Value> {
+        let mut obj = serde_json::Map::new();
+
+        // Common fields
+        obj.insert(Self::NAME.to_string(), json!(self.name()));
+        obj.insert(
+            Self::DATA_TYPE.to_string(),
+            self.data_type().serialize_json()?,
+        );
+
+        if let Some(comment) = &self.comment() {
+            obj.insert(Self::COMMENT.to_string(), json!(comment));
+        }
+
+        Ok(Value::Object(obj))
+    }
+
+    /// Reads a column; a missing `name` or `data_type` yields `JsonSerdeError` (never a panic).
+    fn deserialize_json(node: &Value) -> Result<Column> {
+        let name = node
+            .get(Self::NAME)
+            .and_then(|v| v.as_str())
+            .ok_or_else(|| JsonSerdeError(format!("Missing required field: {}", Self::NAME)))?
+            .to_string();
+
+        let data_type_node = node.get(Self::DATA_TYPE).ok_or_else(|| {
+            JsonSerdeError(format!("Missing required field: {}", Self::DATA_TYPE))
+        })?;
+        let data_type = DataType::deserialize_json(data_type_node)?;
+        let mut column = Column::new(&name, data_type);
+
+        if let Some(comment) = node.get(Self::COMMENT).and_then(|v| v.as_str()) {
+            column = column.with_comment(comment);
+        }
+
+        Ok(column)
+    }
+}
+
+impl Schema {
+    const COLUMNS_NAME: &'static str = "columns";
+    const PRIMARY_KEY_NAME: &'static str = "primary_key";
+    const VERSION_KEY: &'static str = "version";
+    const VERSION: u32 = 1;
+}
+
+impl JsonSerde for Schema {
+    /// Writes `version`, the `columns` array and, when one is defined, the `primary_key` array.
+    fn serialize_json(&self) -> Result<Value> {
+        let mut obj = serde_json::Map::new();
+
+        // Serialize version
+        obj.insert(Self::VERSION_KEY.to_string(), json!(Self::VERSION));
+
+        // Serialize columns
+        let mut columns = Vec::with_capacity(self.columns().len());
+        for col in self.columns().iter() {
+            columns.push(col.serialize_json()?);
+        }
+        obj.insert(Self::COLUMNS_NAME.to_string(), Value::Array(columns));
+
+        // Serialize primary key if present
+        if let Some(primary_key) = &self.primary_key() {
+            let mut pk_values = Vec::new();
+            for name in primary_key.column_names().iter() {
+                pk_values.push(json!(name));
+            }
+            obj.insert(Self::PRIMARY_KEY_NAME.to_string(), Value::Array(pk_values));
+        }
+        Ok(Value::Object(obj))
+    }
+
+    /// Reads the required `columns` array and the optional `primary_key` array of names.
+    fn deserialize_json(node: &Value) -> Result<Schema> {
+        let columns_node = node
+            .get(Self::COLUMNS_NAME)
+            .ok_or_else(|| {
+                JsonSerdeError(format!("Missing required field: {}", Self::COLUMNS_NAME))
+            })?
+            .as_array()
+            .ok_or_else(|| JsonSerdeError(format!("{} should be an array", Self::COLUMNS_NAME)))?;
+
+        let columns = columns_node
+            .iter()
+            .map(Column::deserialize_json)
+            .collect::<Result<Vec<_>>>()?;
+
+        let mut schema_builder = Schema::builder().with_columns(columns);
+
+        if let Some(pk_node) = node.get(Self::PRIMARY_KEY_NAME) {
+            let pk_array = pk_node
+                .as_array()
+                .ok_or_else(|| InvalidTableError("Primary key is not an array".to_string()))?;
+
+            let primary_keys = pk_array
+                .iter()
+                .map(|name_node| {
+                    name_node
+                        .as_str()
+                        .map(str::to_string)
+                        .ok_or_else(|| InvalidTableError("Primary key is not string".to_string()))
+                })
+                .collect::<Result<Vec<_>>>()?;
+
+            schema_builder = schema_builder.primary_key(primary_keys);
+        }
+
+        schema_builder.build()
+    }
+}
+
+impl TableDescriptor {
+    const SCHEMA_NAME: &'static str = "schema";
+    const COMMENT_NAME: &'static str = "comment";
+    const PARTITION_KEY_NAME: &'static str = "partition_key";
+    const BUCKET_KEY_NAME: &'static str = "bucket_key";
+    const BUCKET_COUNT_NAME: &'static str = "bucket_count";
+    const PROPERTIES_NAME: &'static str = "properties";
+    const CUSTOM_PROPERTIES_NAME: &'static str = "custom_properties";
+    const VERSION_KEY: &'static str = "version";
+    const VERSION: u32 = 1;
+
+    fn deserialize_properties(node: &Value) -> Result<HashMap<String, String>> {
+        let obj = node
+            .as_object()
+            .ok_or_else(|| JsonSerdeError("Properties should be an object".to_string()))?;
+        // Every value must be a JSON string; name the offending key when one is not.
+        let mut properties = HashMap::with_capacity(obj.len());
+        for (key, value) in obj {
+            properties.insert(
+                key.clone(),
+                value
+                    .as_str()
+                    .ok_or_else(|| JsonSerdeError(format!("Property '{key}' should be a string")))?
+                    .to_owned(),
+            );
+        }
+
+        Ok(properties)
+    }
+}
+
+impl JsonSerde for TableDescriptor {
+    fn serialize_json(&self) -> Result<Value> {
+        let mut obj = serde_json::Map::new();
+
+        // Serialize version
+        obj.insert(Self::VERSION_KEY.to_string(), json!(Self::VERSION));
+
+        // Serialize schema
+        obj.insert(
+            Self::SCHEMA_NAME.to_string(),
+            self.schema().serialize_json()?,
+        );
+
+        // Serialize comment if present
+        if let Some(comment) = &self.comment() {
+            obj.insert(Self::COMMENT_NAME.to_string(), json!(comment));
+        }
+
+        // Serialize partition keys
+        let partition_keys: Vec<Value> =
+            self.partition_keys().iter().map(|key| json!(key)).collect();
+        obj.insert(Self::PARTITION_KEY_NAME.to_string(), json!(partition_keys));
+
+        // Serialize table distribution if present
+        if let Some(dist) = &self.table_distribution() {
+            let bucket_keys: Vec<Value> = dist.bucket_keys().iter().map(|key| json!(key)).collect();
+            obj.insert(Self::BUCKET_KEY_NAME.to_string(), json!(bucket_keys));
+
+            if let Some(count) = dist.bucket_count() {
+                obj.insert(Self::BUCKET_COUNT_NAME.to_string(), json!(count));
+            }
+        }
+
+        // Serialize properties
+        obj.insert(Self::PROPERTIES_NAME.to_string(), json!(self.properties()));
+
+        obj.insert(
+            Self::CUSTOM_PROPERTIES_NAME.to_string(),
+            json!(self.custom_properties()),
+        );
+
+        Ok(Value::Object(obj))
+    }
+
+    fn deserialize_json(node: &Value) -> Result<Self> {
+        let mut builder = TableDescriptor::builder();
+
+        // Deserialize schema
+        let schema_node = node.get(Self::SCHEMA_NAME).ok_or_else(|| {
+            JsonSerdeError(format!("Missing required field: {}", Self::SCHEMA_NAME))
+        })?;
+        let schema = Schema::deserialize_json(schema_node)?;
+        builder = builder.schema(schema);
+
+        // Deserialize comment if present
+        if let Some(comment_node) = node.get(Self::COMMENT_NAME) {
+            let comment = comment_node
+                .as_str()
+                .ok_or_else(|| {
+                    JsonSerdeError(format!("{} should be a string", Self::COMMENT_NAME))
+                })?
+                .to_owned();
+            builder = builder.comment(comment.as_str());
+        }
+
+        let partition_node = node
+            .get(Self::PARTITION_KEY_NAME)
+            .ok_or_else(|| {
+                JsonSerdeError(format!(
+                    "Missing required field: {}",
+                    Self::PARTITION_KEY_NAME
+                ))
+            })?
+            .as_array()
+            .ok_or_else(|| {
+                JsonSerdeError(format!("{} should be an array", Self::PARTITION_KEY_NAME))
+            })?;
+
+        let mut partition_keys = Vec::with_capacity(partition_node.len());
+        for key_node in partition_node {
+            partition_keys.push(
+                key_node
+                    .as_str()
+                    .ok_or_else(|| {
+                        JsonSerdeError(format!("{} should be a string", Self::PARTITION_KEY_NAME))
+                    })?
+                    .to_owned(),
+            );
+        }
+        builder = builder.partitioned_by(partition_keys);
+
+        let mut bucket_count = None;
+        let mut bucket_keys = vec![];
+        if let Some(bucket_key_node) = node.get(Self::BUCKET_KEY_NAME) {
+            let bucket_key_node = bucket_key_node.as_array().ok_or_else(|| {
+                JsonSerdeError(format!("{} should be an array", Self::BUCKET_KEY_NAME))
+            })?;
+
+            for key_node in bucket_key_node {
+                bucket_keys.push(
+                    key_node
+                        .as_str()
+                        .ok_or_else(|| JsonSerdeError("Bucket key should be a string".to_string()))?
+                        .to_owned(),
+                );
+            }
+        }
+        // A count that does not fit in i32 is dropped rather than wrapped into a bogus value.
+        if let Some(bucket_count_node) = node.get(Self::BUCKET_COUNT_NAME) {
+            bucket_count = bucket_count_node.as_u64().and_then(|n| i32::try_from(n).ok());
+        }
+
+        if bucket_count.is_some() || !bucket_keys.is_empty() {
+            builder = builder.distributed_by(bucket_count, bucket_keys);
+        }
+
+        // Deserialize properties
+        let properties =
+            Self::deserialize_properties(node.get(Self::PROPERTIES_NAME).ok_or_else(|| {
+                JsonSerdeError(format!("Missing required field: {}", Self::PROPERTIES_NAME))
+            })?)?;
+        builder = builder.properties(properties);
+
+        // Deserialize custom properties
+        let custom_properties = Self::deserialize_properties(
+            node.get(Self::CUSTOM_PROPERTIES_NAME).ok_or_else(|| {
+                JsonSerdeError(format!(
+                    "Missing required field: {}",
+                    Self::CUSTOM_PROPERTIES_NAME
+                ))
+            })?,
+        )?;
+        builder = builder.custom_properties(custom_properties);
+
+        builder.build()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/metadata/mod.rs b/fluss-rust/crates/fluss/src/metadata/mod.rs
new file mode 100644
index 0000000000..79465474f7
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/metadata/mod.rs
@@ -0,0 +1,24 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+mod datatype;
+pub use datatype::*;
+mod json_serde;
+mod table;
+
+pub use json_serde::*;
+pub use table::*;
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
new file mode 100644
index 0000000000..a5ab61d67e
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -0,0 +1,920 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Error::InvalidTableError;
+use crate::error::Result;
+use crate::metadata::datatype::{DataField, DataType, RowType};
+use core::fmt;
+use serde::{Deserialize, Serialize};
+use std::collections::{HashMap, HashSet};
+use std::fmt::{Display, Formatter};
+
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub struct Column {
+    name: String,
+    data_type: DataType,
+    comment: Option<String>,
+}
+
+impl Column {
+    pub fn new(name: &str, data_type: DataType) -> Self {
+        Self {
+            name: name.to_string(),
+            data_type,
+            comment: None,
+        }
+    }
+
+    pub fn with_comment(mut self, comment: &str) -> Self {
+        self.comment = Some(comment.to_string());
+        self
+    }
+
+    pub fn with_data_type(&self, data_type: DataType) -> Self {
+        Self {
+            name: self.name.clone(),
+            data_type, // already owned by this call, so move it instead of cloning
+            comment: self.comment.clone(),
+        }
+    }
+
+    // Read-only accessors; each borrows from the column without copying.
+    pub fn name(&self) -> &str {
+        &self.name
+    }
+
+    pub fn data_type(&self) -> &DataType {
+        &self.data_type
+    }
+
+    pub fn comment(&self) -> Option<&str> {
+        self.comment.as_deref()
+    }
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub struct PrimaryKey {
+    constraint_name: String,
+    column_names: Vec<String>,
+}
+
+impl PrimaryKey {
+    pub fn new(constraint_name: &str, column_names: Vec<String>) -> Self {
+        Self {
+            constraint_name: constraint_name.to_string(),
+            column_names,
+        }
+    }
+
+    // Getters...
+    pub fn constraint_name(&self) -> &str {
+        &self.constraint_name
+    }
+
+    pub fn column_names(&self) -> &[String] {
+        &self.column_names
+    }
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub struct Schema {
+    columns: Vec<Column>,
+    primary_key: Option<PrimaryKey>,
+    // Must be a `DataType::Row`; `SchemaBuilder::build` derives it from `columns`.
+    row_type: DataType,
+}
+
+impl Schema {
+    pub fn empty() -> Result<Self> {
+        Self::builder().build()
+    }
+
+    pub fn builder() -> SchemaBuilder {
+        SchemaBuilder::new()
+    }
+
+    pub fn columns(&self) -> &[Column] {
+        &self.columns
+    }
+
+    pub fn primary_key(&self) -> Option<&PrimaryKey> {
+        self.primary_key.as_ref()
+    }
+
+    pub fn row_type(&self) -> &DataType {
+        &self.row_type
+    }
+
+    pub fn primary_key_indexes(&self) -> Vec<usize> {
+        self.primary_key
+            .as_ref()
+            .map(|pk| {
+                pk.column_names
+                    .iter()
+                    .filter_map(|name| self.columns.iter().position(|c| &c.name == name))
+                    .collect()
+            })
+            .unwrap_or_default()
+    }
+
+    pub fn primary_key_column_names(&self) -> Vec<&str> {
+        self.primary_key
+            .as_ref()
+            .map(|pk| pk.column_names.iter().map(|s| s.as_str()).collect())
+            .unwrap_or_default()
+    }
+
+    pub fn column_names(&self) -> Vec<&str> {
+        self.columns.iter().map(|c| c.name.as_str()).collect()
+    }
+}
+
+#[derive(Debug, Default)]
+pub struct SchemaBuilder {
+    columns: Vec<Column>,
+    primary_key: Option<PrimaryKey>,
+}
+
+impl SchemaBuilder {
+    pub fn new() -> Self {
+        Self::default()
+    }
+
+    pub fn with_row_type(mut self, row_type: &DataType) -> Self {
+        match row_type {
+            DataType::Row(row) => {
+                for data_field in row.fields() {
+                    self = self.column(&data_field.name, data_field.data_type.clone())
+                }
+                self
+            }
+            _ => {
+                panic!("data type must be row type")
+            }
+        }
+    }
+
+    pub fn column(mut self, name: &str, data_type: DataType) -> Self {
+        self.columns.push(Column::new(name, data_type));
+        self
+    }
+
+    pub fn with_columns(mut self, columns: Vec<Column>) -> Self {
+        self.columns.extend(columns); // move the owned columns in instead of cloning each one
+        self
+    }
+
+    pub fn with_comment(mut self, comment: &str) -> Self {
+        if let Some(last) = self.columns.last_mut() {
+            last.comment = Some(comment.to_string()); // set in place, no column clone
+        }
+        self
+    }
+
+    pub fn primary_key(self, column_names: Vec<String>) -> Self {
+        let constraint_name = format!("PK_{}", column_names.join("_"));
+        self.primary_key_named(&constraint_name, column_names)
+    }
+
+    pub fn primary_key_named(mut self, constraint_name: &str, column_names: Vec<String>) -> Self {
+        self.primary_key = Some(PrimaryKey::new(constraint_name, column_names));
+        self
+    }
+
+    pub fn build(&mut self) -> Result<Schema> {
+        let columns = Self::normalize_columns(&mut self.columns, self.primary_key.as_ref())?;
+
+        let data_fields = columns
+            .iter()
+            .map(|c| DataField {
+                name: c.name.clone(),
+                data_type: c.data_type.clone(),
+                description: c.comment.clone(),
+            })
+            .collect();
+
+        Ok(Schema {
+            columns,
+            primary_key: self.primary_key.clone(),
+            row_type: DataType::Row(RowType::new(data_fields)),
+        })
+    }
+
+    fn normalize_columns(
+        columns: &mut [Column],
+        primary_key: Option<&PrimaryKey>,
+    ) -> Result<Vec<Column>> {
+        let names: Vec<_> = columns.iter().map(|c| &c.name).collect();
+        if let Some(duplicates) = Self::find_duplicates(&names) {
+            return Err(InvalidTableError(format!(
+                "Duplicate column names found: {duplicates:?}"
+            )));
+        }
+
+        let Some(pk) = primary_key else {
+            return Ok(columns.to_vec());
+        };
+
+        let pk_set: HashSet<_> = pk.column_names.iter().collect();
+        let all_columns: HashSet<_> = columns.iter().map(|c| &c.name).collect();
+        if !pk_set.is_subset(&all_columns) {
+            return Err(InvalidTableError(format!(
+                "Primary key columns {pk_set:?} not found in schema"
+            )));
+        }
+
+        Ok(columns
+            .iter()
+            .map(|col| {
+                if pk_set.contains(&col.name) && col.data_type.is_nullable() {
+                    col.with_data_type(col.data_type.as_non_nullable())
+                } else {
+                    col.clone()
+                }
+            })
+            .collect())
+    }
+
+    fn find_duplicates<'a>(names: &'a [&String]) -> Option<HashSet<&'a String>> {
+        let mut seen = HashSet::new();
+        let mut duplicates = HashSet::new();
+
+        for name in names {
+            if !seen.insert(name) {
+                duplicates.insert(*name);
+            }
+        }
+
+        if duplicates.is_empty() {
+            None
+        } else {
+            Some(duplicates)
+        }
+    }
+}
+
+/// distribution of table
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub struct TableDistribution {
+    bucket_count: Option<i32>,
+    bucket_keys: Vec<String>,
+}
+
+impl TableDistribution {
+    pub fn bucket_keys(&self) -> &[String] {
+        &self.bucket_keys
+    }
+
+    pub fn bucket_count(&self) -> Option<i32> {
+        self.bucket_count
+    }
+}
+
+#[derive(Debug, Default)]
+pub struct TableDescriptorBuilder {
+    schema: Option<Schema>,
+    properties: HashMap<String, String>,
+    custom_properties: HashMap<String, String>,
+    partition_keys: Vec<String>,
+    comment: Option<String>,
+    table_distribution: Option<TableDistribution>,
+}
+
+impl TableDescriptorBuilder {
+    pub fn new() -> Self {
+        Self::default()
+    }
+
+    pub fn schema(mut self, schema: Schema) -> Self {
+        self.schema = Some(schema);
+        self
+    }
+
+    pub fn log_format(mut self, log_format: LogFormat) -> Self {
+        self.properties
+            .insert("table.log.format".to_string(), log_format.to_string());
+        self
+    }
+
+    pub fn kv_format(mut self, kv_format: KvFormat) -> Self {
+        self.properties
+            .insert("table.kv.format".to_string(), kv_format.to_string());
+        self
+    }
+
+    pub fn property<T: ToString>(mut self, key: &str, value: T) -> Self {
+        self.properties.insert(key.to_string(), value.to_string());
+        self
+    }
+
+    pub fn properties(mut self, properties: HashMap<String, String>) -> Self {
+        self.properties.extend(properties);
+        self
+    }
+
+    pub fn custom_property(mut self, key: &str, value: &str) -> Self {
+        self.custom_properties
+            .insert(key.to_string(), value.to_string());
+        self
+    }
+
+    pub fn custom_properties(mut self, custom_properties: HashMap<String, String>) -> Self {
+        self.custom_properties.extend(custom_properties);
+        self
+    }
+
+    pub fn partitioned_by(mut self, partition_keys: Vec<String>) -> Self {
+        self.partition_keys = partition_keys;
+        self
+    }
+
+    pub fn distributed_by(mut self, bucket_count: Option<i32>, bucket_keys: Vec<String>) -> Self {
+        self.table_distribution = Some(TableDistribution {
+            bucket_count,
+            bucket_keys,
+        });
+        self
+    }
+
+    pub fn comment(mut self, comment: &str) -> Self {
+        self.comment = Some(comment.to_string());
+        self
+    }
+
+    pub fn build(self) -> Result<TableDescriptor> {
+        let schema = self.schema.expect("Schema must be set");
+        let table_distribution = TableDescriptor::normalize_distribution(
+            &schema,
+            &self.partition_keys,
+            self.table_distribution,
+        )?;
+        Ok(TableDescriptor {
+            schema,
+            comment: self.comment,
+            partition_keys: self.partition_keys,
+            table_distribution,
+            properties: self.properties,
+            custom_properties: self.custom_properties,
+        })
+    }
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub struct TableDescriptor {
+    schema: Schema,
+    comment: Option<String>,
+    partition_keys: Vec<String>,
+    table_distribution: Option<TableDistribution>,
+    properties: HashMap<String, String>,
+    custom_properties: HashMap<String, String>,
+}
+
+impl TableDescriptor {
+    pub fn builder() -> TableDescriptorBuilder {
+        TableDescriptorBuilder::new()
+    }
+
+    pub fn schema(&self) -> &Schema {
+        &self.schema
+    }
+
+    pub fn bucket_keys(&self) -> Vec<&str> {
+        self.table_distribution
+            .as_ref()
+            .map(|td| td.bucket_keys.iter().map(|s| s.as_str()).collect())
+            .unwrap_or_default()
+    }
+
+    pub fn is_default_bucket_key(&self) -> Result<bool> {
+        if self.schema.primary_key().is_some() {
+            Ok(self.bucket_keys()
+                == Self::default_bucket_key_of_primary_key_table(
+                    self.schema(),
+                    &self.partition_keys,
+                )?
+                .iter()
+                .map(|s| s.as_str())
+                .collect::<Vec<_>>())
+        } else {
+            Ok(self.bucket_keys().is_empty())
+        }
+    }
+
+    pub fn is_partitioned(&self) -> bool {
+        !self.partition_keys.is_empty()
+    }
+
+    pub fn has_primary_key(&self) -> bool {
+        self.schema.primary_key().is_some()
+    }
+
+    pub fn partition_keys(&self) -> &[String] {
+        &self.partition_keys
+    }
+
+    pub fn table_distribution(&self) -> Option<&TableDistribution> {
+        self.table_distribution.as_ref()
+    }
+
+    pub fn properties(&self) -> &HashMap<String, String> {
+        &self.properties
+    }
+
+    pub fn custom_properties(&self) -> &HashMap<String, String> {
+        &self.custom_properties
+    }
+
+    pub fn replication_factor(&self) -> Result<i32> {
+        // Reads `table.replication.factor` and parses it as an i32; a missing or
+        // unparsable value is reported as `InvalidTableError` (built lazily on failure).
+        self.properties
+            .get("table.replication.factor")
+            .ok_or_else(|| InvalidTableError("Replication factor is not set".to_string()))?
+            .parse()
+            .map_err(|_e| {
+                InvalidTableError("Replication factor can't be convert into int".to_string())
+            })
+    }
+
+    pub fn with_properties(&self, new_properties: HashMap<String, String>) -> Self {
+        Self {
+            properties: new_properties,
+            ..self.clone()
+        }
+    }
+
+    pub fn with_replication_factor(&self, new_replication_factor: i32) -> Self {
+        let mut properties = self.properties.clone();
+        properties.insert(
+            "table.replication.factor".to_string(),
+            new_replication_factor.to_string(),
+        );
+        self.with_properties(properties)
+    }
+
+    pub fn with_bucket_count(&self, new_bucket_count: i32) -> Self {
+        Self {
+            table_distribution: Some(TableDistribution {
+                bucket_count: Some(new_bucket_count),
+                bucket_keys: self
+                    .table_distribution
+                    .as_ref()
+                    .map(|td| td.bucket_keys.clone())
+                    .unwrap_or_default(),
+            }),
+            ..self.clone()
+        }
+    }
+
+    pub fn comment(&self) -> Option<&str> {
+        self.comment.as_deref()
+    }
+
+    fn default_bucket_key_of_primary_key_table(
+        schema: &Schema,
+        partition_keys: &[String],
+    ) -> Result<Vec<String>> {
+        let mut bucket_keys = schema
+            .primary_key()
+            .expect("Primary key must be set")
+            .column_names()
+            .to_vec();
+
+        bucket_keys.retain(|k| !partition_keys.contains(k));
+
+        if bucket_keys.is_empty() {
+            return Err(InvalidTableError(format!(
+                "Primary Key constraint {:?} should not be same with partition fields {:?}.",
+                schema.primary_key().unwrap().column_names(),
+                partition_keys
+            )));
+        }
+
+        Ok(bucket_keys)
+    }
+
+    fn normalize_distribution(
+        schema: &Schema,
+        partition_keys: &[String],
+        origin_distribution: Option<TableDistribution>,
+    ) -> Result<Option<TableDistribution>> {
+        if let Some(distribution) = origin_distribution {
+            if distribution
+                .bucket_keys
+                .iter()
+                .any(|k| partition_keys.contains(k))
+            {
+                return Err(InvalidTableError(format!(
+                    "Bucket key {:?} shouldn't include any column in partition keys {:?}.",
+                    distribution.bucket_keys, partition_keys
+                )));
+            }
+
+            return if let Some(pk) = schema.primary_key() {
+                if distribution.bucket_keys.is_empty() {
+                    Ok(Some(TableDistribution {
+                        bucket_count: distribution.bucket_count,
+                        bucket_keys: Self::default_bucket_key_of_primary_key_table(
+                            schema,
+                            partition_keys,
+                        )?,
+                    }))
+                } else {
+                    let pk_columns: HashSet<_> = pk.column_names().iter().collect();
+                    if !distribution
+                        .bucket_keys
+                        .iter()
+                        .all(|k| pk_columns.contains(k))
+                    {
+                        return Err(InvalidTableError(format!(
+                            "Bucket keys must be a subset of primary keys excluding partition keys for primary-key tables. \
+                            The primary keys are {:?}, the partition keys are {:?}, but the user-defined bucket keys are {:?}.",
+                            pk.column_names(),
+                            partition_keys,
+                            distribution.bucket_keys
+                        )));
+                    }
+                    Ok(Some(distribution))
+                }
+            } else {
+                Ok(Some(distribution))
+            };
+        } else if schema.primary_key().is_some() {
+            return Ok(Some(TableDistribution {
+                bucket_count: None,
+                bucket_keys: Self::default_bucket_key_of_primary_key_table(schema, partition_keys)?,
+            }));
+        }
+
+        Ok(None)
+    }
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub enum LogFormat {
+    ARROW,
+    INDEXED,
+}
+
+impl Display for LogFormat {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        match self {
+            LogFormat::ARROW => {
+                write!(f, "ARROW")?;
+            }
+            LogFormat::INDEXED => {
+                write!(f, "INDEXED")?;
+            }
+        }
+        Ok(())
+    }
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub enum KvFormat {
+    INDEXED,
+    COMPACTED,
+}
+
+impl Display for KvFormat {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        match self {
+            KvFormat::COMPACTED => write!(f, "COMPACTED")?,
+            KvFormat::INDEXED => write!(f, "INDEXED")?,
+        }
+        Ok(())
+    }
+}
+
+#[derive(Debug, PartialEq, Eq, Hash, Clone, Serialize, Deserialize)]
+pub struct TablePath {
+    database: String,
+    table: String,
+}
+
+impl Display for TablePath {
+    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
+        write!(f, "{}.{}", self.database, self.table)
+    }
+}
+
+impl TablePath {
+    pub fn new(db: String, tbl: String) -> Self {
+        TablePath {
+            database: db,
+            table: tbl,
+        }
+    }
+
+    #[inline]
+    pub fn database(&self) -> &str {
+        &self.database
+    }
+
+    #[inline]
+    pub fn table(&self) -> &str {
+        &self.table
+    }
+}
+
+#[derive(Debug, Clone)]
+pub struct TableInfo {
+    pub table_path: TablePath,
+    pub table_id: i64,
+    pub schema_id: i32,
+    pub schema: Schema,
+    pub row_type: DataType,
+    pub primary_keys: Vec<String>,
+    pub physical_primary_keys: Vec<String>,
+    pub bucket_keys: Vec<String>,
+    pub partition_keys: Vec<String>,
+    pub num_buckets: i32,
+    pub properties: HashMap<String, String>,
+    pub table_config: TableConfig,
+    pub custom_properties: HashMap<String, String>,
+    pub comment: Option<String>,
+    pub created_time: i64,
+    pub modified_time: i64,
+}
+
+impl TableInfo {
+    pub fn row_type(&self) -> &RowType {
+        match &self.row_type {
+            DataType::Row(row_type) => row_type,
+            _ => panic!("should be a row type"),
+        }
+    }
+}
+
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+pub struct TableConfig {
+    pub properties: HashMap<String, String>,
+}
+
+impl TableConfig {
+    pub fn from_properties(properties: HashMap<String, String>) -> Self {
+        TableConfig { properties }
+    }
+}
+
+impl TableInfo {
+    pub fn of(
+        table_path: TablePath,
+        table_id: i64,
+        schema_id: i32,
+        table_descriptor: TableDescriptor,
+        created_time: i64,
+        modified_time: i64,
+    ) -> TableInfo {
+        let TableDescriptor {
+            schema,
+            table_distribution,
+            comment,
+            partition_keys,
+            properties,
+            custom_properties,
+        } = table_descriptor;
+        let TableDistribution {
+            bucket_count,
+            bucket_keys,
+        } = table_distribution.expect("TableDescriptor must define a table distribution");
+        TableInfo::new(
+            table_path,
+            table_id,
+            schema_id,
+            schema,
+            bucket_keys,
+            partition_keys,
+            bucket_count.expect("table distribution must define a bucket count"),
+            properties,
+            custom_properties,
+            comment,
+            created_time,
+            modified_time,
+        )
+    }
+
+    #[allow(clippy::too_many_arguments)]
+    pub fn new(
+        table_path: TablePath,
+        table_id: i64,
+        schema_id: i32,
+        schema: Schema,
+        bucket_keys: Vec<String>,
+        partition_keys: Vec<String>,
+        num_buckets: i32,
+        properties: HashMap<String, String>,
+        custom_properties: HashMap<String, String>,
+        comment: Option<String>,
+        created_time: i64,
+        modified_time: i64,
+    ) -> Self {
+        let row_type = schema.row_type.clone();
+        let primary_keys: Vec<String> = schema
+            .primary_key_column_names()
+            .iter()
+            .map(|col| (*col).to_string())
+            .collect();
+        let physical_primary_keys =
+            Self::generate_physical_primary_key(&primary_keys, &partition_keys);
+        let table_config = TableConfig::from_properties(properties.clone());
+
+        TableInfo {
+            table_path,
+            table_id,
+            schema_id,
+            schema,
+            row_type,
+            primary_keys,
+            physical_primary_keys,
+            bucket_keys,
+            partition_keys,
+            num_buckets,
+            properties,
+            table_config,
+            custom_properties,
+            comment,
+            created_time,
+            modified_time,
+        }
+    }
+
+    pub fn get_table_path(&self) -> &TablePath {
+        &self.table_path
+    }
+
+    pub fn get_table_id(&self) -> i64 {
+        self.table_id
+    }
+
+    pub fn get_schema_id(&self) -> i32 {
+        self.schema_id
+    }
+
+    pub fn get_schema(&self) -> &Schema {
+        &self.schema
+    }
+
+    pub fn get_row_type(&self) -> &DataType {
+        &self.row_type
+    }
+
+    pub fn has_primary_key(&self) -> bool {
+        !self.primary_keys.is_empty()
+    }
+
+    pub fn get_primary_keys(&self) -> &Vec<String> {
+        &self.primary_keys
+    }
+
+    pub fn get_physical_primary_keys(&self) -> &[String] {
+        &self.physical_primary_keys
+    }
+
+    pub fn has_bucket_key(&self) -> bool {
+        !self.bucket_keys.is_empty()
+    }
+
+    pub fn is_default_bucket_key(&self) -> bool {
+        if self.has_primary_key() {
+            self.bucket_keys == self.physical_primary_keys
+        } else {
+            self.bucket_keys.is_empty()
+        }
+    }
+
+    pub fn get_bucket_keys(&self) -> &[String] {
+        &self.bucket_keys
+    }
+
+    pub fn is_partitioned(&self) -> bool {
+        !self.partition_keys.is_empty()
+    }
+
+    pub fn is_auto_partitioned(&self) -> bool {
+        self.is_partitioned() && todo!() // FIXME: panics when the table is partitioned
+    }
+
+    pub fn get_partition_keys(&self) -> &[String] {
+        &self.partition_keys
+    }
+
+    pub fn get_num_buckets(&self) -> i32 {
+        self.num_buckets
+    }
+
+    pub fn get_properties(&self) -> &HashMap<String, String> {
+        &self.properties
+    }
+
+    pub fn get_table_config(&self) -> &TableConfig {
+        &self.table_config
+    }
+
+    pub fn get_custom_properties(&self) -> &HashMap<String, String> {
+        &self.custom_properties
+    }
+
+    pub fn get_comment(&self) -> Option<&str> {
+        self.comment.as_deref()
+    }
+
+    pub fn get_created_time(&self) -> i64 {
+        self.created_time
+    }
+
+    pub fn get_modified_time(&self) -> i64 {
+        self.modified_time
+    }
+
+    pub fn to_table_descriptor(&self) -> Result<TableDescriptor> {
+        let mut builder = TableDescriptor::builder()
+            .schema(self.schema.clone())
+            .partitioned_by(self.partition_keys.clone())
+            .distributed_by(Some(self.num_buckets), self.bucket_keys.clone())
+            .properties(self.properties.clone())
+            .custom_properties(self.custom_properties.clone());
+
+        if let Some(comment) = &self.comment {
+            builder = builder.comment(comment); // `&String` derefs to `&str`; no clone needed
+        }
+
+        builder.build()
+    }
+
+    fn generate_physical_primary_key(
+        primary_keys: &[String],
+        partition_keys: &[String],
+    ) -> Vec<String> {
+        primary_keys
+            .iter()
+            .filter(|pk| !partition_keys.contains(*pk))
+            .cloned()
+            .collect()
+    }
+}
+
+impl fmt::Display for TableInfo {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        write!(
+            f,
+            "TableInfo{{ table_path={:?}, table_id={}, schema_id={}, schema={:?}, physical_primary_keys={:?}, bucket_keys={:?}, partition_keys={:?}, num_buckets={}, properties={:?}, custom_properties={:?}, comment={:?}, created_time={}, modified_time={} }}",
+            self.table_path,
+            self.table_id,
+            self.schema_id,
+            self.schema,
+            self.physical_primary_keys,
+            self.bucket_keys,
+            self.partition_keys,
+            self.num_buckets,
+            self.properties,
+            self.custom_properties,
+            self.comment,
+            self.created_time,
+            self.modified_time
+        )
+    }
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize, Hash, PartialEq, Eq)]
+pub struct TableBucket {
+    table_id: i64,
+    partition_id: Option<i64>,
+    bucket: i32,
+}
+
+impl TableBucket {
+    pub fn new(table_id: i64, bucket: i32) -> Self {
+        TableBucket {
+            table_id,
+            partition_id: None,
+            bucket,
+        }
+    }
+
+    pub fn table_id(&self) -> i64 {
+        self.table_id
+    }
+
+    pub fn bucket_id(&self) -> i32 {
+        self.bucket
+    }
+
+    pub fn partition_id(&self) -> Option<i64> {
+        self.partition_id
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
new file mode 100644
index 0000000000..195b8f824c
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -0,0 +1,197 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+syntax = "proto2";
+
+package proto;
+
+// metadata request and response; the request is sent from the client to each server.
+message MetadataRequest {
+  repeated PbTablePath table_path = 1;
+  repeated PbPhysicalTablePath partitions_path = 2;
+
+  // note: currently, we assume the partition ids must belong to the table_paths in the
+  // metadata request
+  // todo: we won't need the assumption after we introduce metadata cache in server
+  repeated int64 partitions_id = 3 [packed = true];
+}
+
+message MetadataResponse {
+  optional PbServerNode coordinator_server = 1;
+  repeated PbServerNode tablet_servers = 2;
+  repeated PbTableMetadata table_metadata = 3;
+  repeated PbPartitionMetadata partition_metadata = 4;
+}
+
+// produce log request and response
+message ProduceLogRequest {
+  required int32 acks = 1;
+  required int64 table_id = 2;
+  required int32 timeout_ms = 3;
+  repeated PbProduceLogReqForBucket buckets_req = 4;
+}
+
+
+message ProduceLogResponse {
+  repeated PbProduceLogRespForBucket buckets_resp = 1;
+}
+
+
+// --------------- Inner classes ----------------
+message PbTablePath {
+  required string database_name = 1;
+  required string table_name = 2;
+}
+
+message PbPhysicalTablePath {
+  required string database_name = 1;
+  required string table_name = 2;
+  optional string partition_name = 3;
+}
+
+// For MetadataResponse, host and port are still used for all versions.
+// For UpdateMetadataRequest,
+//   * versions <= 0.6: host and port are used.
+//   * versions >= 0.7: listeners is used to replace host and port.
+message PbServerNode {
+  required int32 node_id = 1;
+  required string host = 2;
+  required int32 port = 3;
+  optional string listeners = 4;
+}
+
+message PbTableMetadata {
+  required PbTablePath table_path = 1;
+  required int64 table_id = 2;
+  required int32 schema_id = 3;
+  required bytes table_json = 4;
+  repeated PbBucketMetadata bucket_metadata = 5;
+  required int64 created_time = 6;
+  required int64 modified_time = 7;
+}
+
+message PbPartitionMetadata {
+  required int64 table_id = 1;
+  // the partition name and id for the partition
+  required string partition_name = 2;
+  required int64 partition_id = 3;
+  repeated PbBucketMetadata bucket_metadata = 4;
+}
+
+message PbBucketMetadata {
+  required int32 bucket_id = 1;
+  // optional because the leader may not have been elected yet
+  optional int32 leader_id = 2;
+  repeated int32 replica_id = 3 [packed = true];
+  // TODO: Add isr here.
+}
+
+message PbProduceLogReqForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  required bytes records = 3;
+}
+
+message PbProduceLogRespForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  optional int32 error_code = 3;
+  optional string error_message = 4;
+  optional int64 base_offset = 5;
+}
+
+message CreateTableRequest {
+  required PbTablePath table_path = 1;
+  required bytes table_json = 2;
+  required bool ignore_if_exists = 3;
+}
+
+message CreateTableResponse {
+}
+
+
+message GetTableInfoRequest {
+  required PbTablePath table_path = 1;
+}
+
+message GetTableInfoResponse {
+  required int64 table_id = 1;
+  required int32 schema_id = 2;
+  required bytes table_json = 3;
+  required int64 created_time = 4;
+  required int64 modified_time = 5;
+}
+
+
+// fetch log request and response
+message FetchLogRequest {
+  required int32 follower_server_id = 1;  // a value of -1 indicates the request comes from a client.
+  required int32 max_bytes = 2;
+  repeated PbFetchLogReqForTable tables_req = 3;
+  optional int32 max_wait_ms = 4;
+  optional int32 min_bytes = 5;
+}
+
+message FetchLogResponse {
+  repeated PbFetchLogRespForTable tables_resp = 1;
+}
+
+message PbFetchLogReqForTable {
+  required int64 table_id = 1;
+  required bool projection_pushdown_enabled = 2;
+  repeated int32 projected_fields = 3 [packed = true];
+  repeated PbFetchLogReqForBucket buckets_req = 4;
+}
+
+
+message PbFetchLogReqForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  // TODO leader epoch
+  required int64 fetch_offset = 3;
+  required int32 max_fetch_bytes = 4;
+}
+
+
+message PbFetchLogRespForTable {
+  required int64 table_id = 1;
+  repeated PbFetchLogRespForBucket buckets_resp = 2;
+}
+message PbFetchLogRespForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  optional int32 error_code = 3;
+  optional string error_message = 4;
+  optional int64 high_watermark = 5;
+  optional int64 log_start_offset = 6; // TODO: log start offset is not introduced yet, but the field is kept in the protobuf
+  optional PbRemoteLogFetchInfo remote_log_fetch_info = 7;
+  optional bytes records = 8;
+}
+
+message PbRemoteLogFetchInfo {
+  required string remote_log_tablet_dir = 1;
+  optional string partition_name = 2;
+  repeated PbRemoteLogSegment remote_log_segments = 3;
+  optional int32 first_start_pos = 4;
+}
+
+message PbRemoteLogSegment {
+  required string remote_log_segment_id = 1;
+  required int64 remote_log_start_offset = 2;
+  required int64 remote_log_end_offset = 3;
+  required int32 segment_size_in_bytes = 4;
+}
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
new file mode 100644
index 0000000000..2f595d0304
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -0,0 +1,545 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use arrow::array::{
+    ArrayBuilder, ArrayRef, BooleanBuilder, Float32Builder, Float64Builder, Int8Builder,
+    Int16Builder, Int32Builder, Int64Builder, StringBuilder, UInt8Builder, UInt16Builder,
+    UInt32Builder, UInt64Builder,
+};
+use arrow::{
+    array::RecordBatch,
+    ipc::{reader::StreamReader, writer::StreamWriter},
+};
+use arrow_schema::SchemaRef;
+use arrow_schema::{DataType as ArrowDataType, Field};
+use byteorder::WriteBytesExt;
+use byteorder::{ByteOrder, LittleEndian};
+use crc32c::crc32c;
+use parking_lot::Mutex;
+use std::{
+    io::{Cursor, Write},
+    sync::Arc,
+};
+
+use crate::error::Result;
+use crate::metadata::DataType;
+use crate::record::{ChangeType, ScanRecord};
+use crate::row::{ColumnarRow, GenericRow};
+
+/// const for record batch
+pub const BASE_OFFSET_LENGTH: usize = 8;
+pub const LENGTH_LENGTH: usize = 4;
+pub const MAGIC_LENGTH: usize = 1;
+pub const COMMIT_TIMESTAMP_LENGTH: usize = 8;
+pub const CRC_LENGTH: usize = 4;
+pub const SCHEMA_ID_LENGTH: usize = 2;
+pub const ATTRIBUTE_LENGTH: usize = 1;
+pub const LAST_OFFSET_DELTA_LENGTH: usize = 4;
+pub const WRITE_CLIENT_ID_LENGTH: usize = 8;
+pub const BATCH_SEQUENCE_LENGTH: usize = 4;
+pub const RECORDS_COUNT_LENGTH: usize = 4;
+
+pub const BASE_OFFSET_OFFSET: usize = 0;
+pub const LENGTH_OFFSET: usize = BASE_OFFSET_OFFSET + BASE_OFFSET_LENGTH;
+pub const MAGIC_OFFSET: usize = LENGTH_OFFSET + LENGTH_LENGTH;
+pub const COMMIT_TIMESTAMP_OFFSET: usize = MAGIC_OFFSET + MAGIC_LENGTH;
+pub const CRC_OFFSET: usize = COMMIT_TIMESTAMP_OFFSET + COMMIT_TIMESTAMP_LENGTH;
+pub const SCHEMA_ID_OFFSET: usize = CRC_OFFSET + CRC_LENGTH;
+pub const ATTRIBUTES_OFFSET: usize = SCHEMA_ID_OFFSET + SCHEMA_ID_LENGTH;
+pub const LAST_OFFSET_DELTA_OFFSET: usize = ATTRIBUTES_OFFSET + ATTRIBUTE_LENGTH;
+pub const WRITE_CLIENT_ID_OFFSET: usize = LAST_OFFSET_DELTA_OFFSET + LAST_OFFSET_DELTA_LENGTH;
+pub const BATCH_SEQUENCE_OFFSET: usize = WRITE_CLIENT_ID_OFFSET + WRITE_CLIENT_ID_LENGTH;
+pub const RECORDS_COUNT_OFFSET: usize = BATCH_SEQUENCE_OFFSET + BATCH_SEQUENCE_LENGTH;
+pub const RECORDS_OFFSET: usize = RECORDS_COUNT_OFFSET + RECORDS_COUNT_LENGTH;
+
+pub const RECORD_BATCH_HEADER_SIZE: usize = RECORDS_OFFSET;
+pub const ARROW_CHANGETYPE_OFFSET: usize = RECORD_BATCH_HEADER_SIZE;
+pub const LOG_OVERHEAD: usize = LENGTH_OFFSET + LENGTH_LENGTH;
+
+/// const for record
+/// The "magic" values.
+#[derive(Debug, Clone, Copy)]
+pub enum LogMagicValue {
+    V0 = 0,
+}
+
+pub const CURRENT_LOG_MAGIC_VALUE: u8 = LogMagicValue::V0 as u8;
+
+/// Value used if writer ID is not available or non-idempotent.
+pub const NO_WRITER_ID: i64 = -1;
+
+/// Value used if batch sequence is not available.
+pub const NO_BATCH_SEQUENCE: i32 = -1;
+
+pub const BUILDER_DEFAULT_OFFSET: i64 = 0;
+
+pub const DEFAULT_MAX_RECORD: i32 = 256;
+
+pub struct MemoryLogRecordsArrowBuilder {
+    base_log_offset: i64,
+    schema_id: i32,
+    magic: u8,
+    writer_id: i64,
+    batch_sequence: i32,
+    table_schema: SchemaRef,
+    record_count: i32,
+    arrow_column_builders: Mutex<Vec<Box<dyn ArrayBuilder>>>,
+    is_closed: bool,
+}
+
+impl MemoryLogRecordsArrowBuilder {
+    pub fn new(schema_id: i32, row_type: &DataType) -> Self {
+        let schema_ref = to_arrow_schema(row_type);
+        let builders = Mutex::new(
+            schema_ref
+                .fields()
+                .iter()
+                .map(|field| Self::create_builder(field.data_type()))
+                .collect(),
+        );
+        MemoryLogRecordsArrowBuilder {
+            base_log_offset: BUILDER_DEFAULT_OFFSET,
+            schema_id,
+            magic: CURRENT_LOG_MAGIC_VALUE,
+            writer_id: NO_WRITER_ID,
+            batch_sequence: NO_BATCH_SEQUENCE,
+            record_count: 0,
+            table_schema: schema_ref,
+            arrow_column_builders: builders,
+            is_closed: false,
+        }
+    }
+
+    pub fn append(&mut self, row: &GenericRow) -> Result<()> {
+        for (idx, value) in row.values.iter().enumerate() {
+            let mut builder_binding = self.arrow_column_builders.lock();
+            let builder = builder_binding.get_mut(idx).unwrap();
+            value.append_to(builder.as_mut())?;
+        }
+        self.record_count += 1;
+        // todo: consider write other change type
+        Ok(())
+    }
+
+    pub fn is_full(&self) -> bool {
+        self.record_count >= DEFAULT_MAX_RECORD
+    }
+
+    pub fn is_closed(&self) -> bool {
+        self.is_closed
+    }
+
+    pub fn close(&mut self) {
+        self.is_closed = true;
+    }
+
+    /// Serializes the buffered rows into a single log record batch (header + Arrow batch bytes).
+    pub fn build(&self) -> Result<Vec<u8>> {
+        // serialize arrow batch
+        let mut arrow_batch_bytes = vec![];
+        let mut writer = StreamWriter::try_new(&mut arrow_batch_bytes, &self.table_schema)?;
+
+        let arrays = self
+            .arrow_column_builders
+            .lock()
+            .iter_mut()
+            .map(|b| b.finish())
+            .collect::<Vec<ArrayRef>>();
+        let record_batch = RecordBatch::try_new(self.table_schema.clone(), arrays)?;
+        // length of what the writer emitted on creation, i.e. before any record batch is written
+        let header = writer.get_ref().len();
+        writer.write(&record_batch)?;
+        // keep only the bytes written after that prefix: the record batch itself
+        let real_arrow_batch_bytes = &arrow_batch_bytes[header..];
+
+        // now, write batch header and arrow batch
+        let mut batch_bytes = vec![0u8; RECORD_BATCH_HEADER_SIZE + real_arrow_batch_bytes.len()];
+        // write batch header
+        self.write_batch_header(&mut batch_bytes[..])?;
+
+        // write arrow batch bytes; propagate I/O failures instead of panicking
+        let mut cursor = Cursor::new(&mut batch_bytes[..]);
+        cursor.set_position(RECORD_BATCH_HEADER_SIZE as u64);
+        cursor.write_all(real_arrow_batch_bytes)?;
+
+        // the crc covers everything from the schema id to the end of the batch
+        let crc = crc32c(&cursor.get_ref()[SCHEMA_ID_OFFSET..]);
+        cursor.set_position(CRC_OFFSET as u64);
+        cursor.write_u32::<LittleEndian>(crc)?;
+
+        Ok(batch_bytes)
+    }
+
+    fn write_batch_header(&self, buffer: &mut [u8]) -> Result<()> {
+        let total_len = buffer.len();
+        let mut cursor = Cursor::new(buffer);
+        cursor.write_i64::<LittleEndian>(self.base_log_offset)?;
+        cursor
+            .write_i32::<LittleEndian>((total_len - BASE_OFFSET_LENGTH - LENGTH_LENGTH) as i32)?;
+        cursor.write_u8(self.magic)?;
+        cursor.write_i64::<LittleEndian>(0)?; // timestamp placeholder
+        cursor.write_u32::<LittleEndian>(0)?; // crc placeholder, overwritten by `build`
+        cursor.write_i16::<LittleEndian>(self.schema_id as i16)?;
+
+        // todo: currently, batches are always append-only
+        let append_only = true;
+        cursor.write_u8(if append_only { 1 } else { 0 })?;
+        cursor.write_i32::<LittleEndian>(if self.record_count > 0 {
+            self.record_count - 1
+        } else {
+            0
+        })?;
+
+        cursor.write_i64::<LittleEndian>(self.writer_id)?;
+        cursor.write_i32::<LittleEndian>(self.batch_sequence)?;
+        cursor.write_i32::<LittleEndian>(self.record_count)?;
+        Ok(())
+    }
+
+    fn create_builder(data_type: &arrow_schema::DataType) -> Box<dyn ArrayBuilder> {
+        match data_type {
+            arrow_schema::DataType::Int8 => Box::new(Int8Builder::new()),
+            arrow_schema::DataType::Int16 => Box::new(Int16Builder::new()),
+            arrow_schema::DataType::Int32 => Box::new(Int32Builder::new()),
+            arrow_schema::DataType::Int64 => Box::new(Int64Builder::new()),
+            arrow_schema::DataType::UInt8 => Box::new(UInt8Builder::new()),
+            arrow_schema::DataType::UInt16 => Box::new(UInt16Builder::new()),
+            arrow_schema::DataType::UInt32 => Box::new(UInt32Builder::new()),
+            arrow_schema::DataType::UInt64 => Box::new(UInt64Builder::new()),
+            arrow_schema::DataType::Float32 => Box::new(Float32Builder::new()),
+            arrow_schema::DataType::Float64 => Box::new(Float64Builder::new()),
+            arrow_schema::DataType::Boolean => Box::new(BooleanBuilder::new()),
+            arrow_schema::DataType::Utf8 => Box::new(StringBuilder::new()),
+            dt => panic!("Unsupported data type: {dt:?}"),
+        }
+    }
+}
+
+pub trait ToArrow {
+    fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()>;
+}
+
+pub struct LogRecordsBatchs<'a> {
+    data: &'a [u8],
+    current_pos: usize,
+    remaining_bytes: usize,
+}
+
+impl<'a> LogRecordsBatchs<'a> {
+    pub fn new(data: &'a [u8]) -> Self {
+        Self {
+            data,
+            current_pos: 0,
+            remaining_bytes: data.len(),
+        }
+    }
+
+    /// Size of the batch at the current position (length field + `LOG_OVERHEAD`), if readable.
+    pub fn next_batch_size(&self) -> Option<usize> {
+        if self.remaining_bytes < LOG_OVERHEAD {
+            return None;
+        }
+        let length_bytes = self.data.get(self.current_pos + LENGTH_OFFSET..)?;
+        // A negative length would wrap to a huge usize when cast; report no batch instead.
+        let batch_len = usize::try_from(LittleEndian::read_i32(length_bytes)).ok()?;
+        Some(batch_len + LOG_OVERHEAD)
+    }
+}
+
+impl<'a> Iterator for &'a mut LogRecordsBatchs<'a> {
+    type Item = LogRecordBatch<'a>;
+
+    /// Yields the next complete batch, or `None` once no full batch is left in the buffer.
+    fn next(&mut self) -> Option<Self::Item> {
+        let batch_size = self.next_batch_size()?;
+        // If the buffer ends mid-batch, stop rather than slice past its end (which would panic).
+        if batch_size > self.remaining_bytes {
+            return None;
+        }
+        let start = self.current_pos;
+        self.current_pos += batch_size;
+        self.remaining_bytes -= batch_size;
+        Some(LogRecordBatch::new(&self.data[start..start + batch_size]))
+    }
+}
+
+pub struct LogRecordBatch<'a> {
+    data: &'a [u8],
+}
+
+#[allow(dead_code)]
+impl<'a> LogRecordBatch<'a> {
+    pub fn new(data: &'a [u8]) -> Self {
+        LogRecordBatch { data }
+    }
+
+    pub fn magic(&self) -> u8 {
+        self.data[MAGIC_OFFSET]
+    }
+
+    pub fn commit_timestamp(&self) -> i64 {
+        let offset = COMMIT_TIMESTAMP_OFFSET;
+        LittleEndian::read_i64(&self.data[offset..offset + COMMIT_TIMESTAMP_LENGTH])
+    }
+
+    pub fn writer_id(&self) -> i64 {
+        let offset = WRITE_CLIENT_ID_OFFSET;
+        LittleEndian::read_i64(&self.data[offset..offset + WRITE_CLIENT_ID_LENGTH])
+    }
+
+    pub fn batch_sequence(&self) -> i32 {
+        let offset = BATCH_SEQUENCE_OFFSET;
+        LittleEndian::read_i32(&self.data[offset..offset + BATCH_SEQUENCE_LENGTH])
+    }
+
+    pub fn ensure_valid(&self) -> Result<()> {
+        // todo
+        Ok(())
+    }
+
+    pub fn is_valid(&self) -> bool {
+        self.size_in_bytes() >= RECORD_BATCH_HEADER_SIZE
+            && self.checksum() == self.compute_checksum()
+    }
+
+    fn compute_checksum(&self) -> u32 {
+        // The crc covers schema id .. end of batch (the range `build` checksums); clamp the end
+        // to the buffer so a short buffer yields a mismatching crc instead of an over-slice.
+        crc32c(&self.data[SCHEMA_ID_OFFSET..self.size_in_bytes().min(self.data.len())])
+    }
+
+    fn attributes(&self) -> u8 {
+        self.data[ATTRIBUTES_OFFSET]
+    }
+
+    pub fn next_log_offset(&self) -> i64 {
+        self.last_log_offset() + 1
+    }
+
+    /// Returns the CRC stored in the batch header (`CRC_LENGTH` bytes at `CRC_OFFSET`).
+    pub fn checksum(&self) -> u32 {
+        LittleEndian::read_u32(&self.data[CRC_OFFSET..CRC_OFFSET + CRC_LENGTH])
+    }
+
+    /// Schema id from the batch header (`SCHEMA_ID_LENGTH` bytes at `SCHEMA_ID_OFFSET`).
+    pub fn schema_id(&self) -> i16 {
+        LittleEndian::read_i16(&self.data[SCHEMA_ID_OFFSET..SCHEMA_ID_OFFSET + SCHEMA_ID_LENGTH])
+    }
+
+    pub fn base_log_offset(&self) -> i64 {
+        let offset = BASE_OFFSET_OFFSET;
+        LittleEndian::read_i64(&self.data[offset..offset + BASE_OFFSET_LENGTH])
+    }
+
+    pub fn last_log_offset(&self) -> i64 {
+        self.base_log_offset() + self.last_offset_delta() as i64
+    }
+
+    fn last_offset_delta(&self) -> i32 {
+        let offset = LAST_OFFSET_DELTA_OFFSET;
+        LittleEndian::read_i32(&self.data[offset..offset + LAST_OFFSET_DELTA_LENGTH])
+    }
+
+    pub fn size_in_bytes(&self) -> usize {
+        let offset = LENGTH_OFFSET;
+        LittleEndian::read_i32(&self.data[offset..offset + LENGTH_LENGTH]) as usize + LOG_OVERHEAD
+    }
+
+    pub fn record_count(&self) -> i32 {
+        let offset = RECORDS_COUNT_OFFSET;
+        LittleEndian::read_i32(&self.data[offset..offset + RECORDS_COUNT_LENGTH])
+    }
+
+    pub fn records(&self, read_context: ReadContext) -> LogRecordIterator {
+        let count = self.record_count();
+        if count == 0 {
+            return LogRecordIterator::empty();
+        }
+
+        // get arrow_metadata
+        let arrow_metadata_bytes = read_context.to_arrow_metadata().unwrap();
+        // arrow_batch_data
+        let data = &self.data[RECORDS_OFFSET..];
+
+        // need to combine arrow_metadata_bytes + arrow_batch_data
+        let cursor = Cursor::new([&arrow_metadata_bytes, data].concat());
+        let mut stream_reader = StreamReader::try_new(cursor, None).unwrap();
+
+        let mut record_batch = None;
+        if let Some(bath) = stream_reader.next() {
+            record_batch = Some(bath.unwrap());
+        }
+
+        if record_batch.is_none() {
+            return LogRecordIterator::empty();
+        }
+
+        let arrow_reader = ArrowReader::new(Arc::new(record_batch.unwrap()));
+        LogRecordIterator::Arrow(ArrowLogRecordIterator {
+            reader: arrow_reader,
+            base_offset: self.base_log_offset(),
+            timestamp: self.commit_timestamp(),
+            row_id: 0,
+            change_type: ChangeType::AppendOnly,
+        })
+    }
+}
+
+pub fn to_arrow_schema(fluss_schema: &DataType) -> SchemaRef {
+    match &fluss_schema {
+        DataType::Row(row_type) => {
+            let fields: Vec<Field> = row_type
+                .fields()
+                .iter()
+                .map(|f| {
+                    Field::new(
+                        f.name(),
+                        to_arrow_type(f.data_type()),
+                        f.data_type().is_nullable(),
+                    )
+                })
+                .collect();
+
+            SchemaRef::new(arrow_schema::Schema::new(fields))
+        }
+        _ => {
+            panic!("must be row data tyoe.")
+        }
+    }
+}
+
+pub fn to_arrow_type(fluss_type: &DataType) -> ArrowDataType {
+    match fluss_type {
+        DataType::Boolean(_) => ArrowDataType::Boolean,
+        DataType::TinyInt(_) => ArrowDataType::Int8,
+        DataType::SmallInt(_) => ArrowDataType::Int16,
+        DataType::BigInt(_) => ArrowDataType::Int64,
+        DataType::Int(_) => ArrowDataType::Int32,
+        DataType::Float(_) => ArrowDataType::Float32,
+        DataType::Double(_) => ArrowDataType::Float64,
+        DataType::Char(_) => ArrowDataType::Utf8,
+        DataType::String(_) => ArrowDataType::Utf8,
+        DataType::Decimal(_) => todo!(),
+        DataType::Date(_) => ArrowDataType::Date32,
+        DataType::Time(_) => todo!(),
+        DataType::Timestamp(_) => todo!(),
+        DataType::TimestampLTz(_) => todo!(),
+        DataType::Bytes(_) => todo!(),
+        DataType::Binary(_) => todo!(),
+        DataType::Array(_data_type) => todo!(),
+        DataType::Map(_data_type) => todo!(),
+        DataType::Row(_data_fields) => todo!(),
+    }
+}
+
+pub struct ReadContext {
+    arrow_schema: SchemaRef,
+}
+
+impl ReadContext {
+    pub fn new(arrow_schema: SchemaRef) -> ReadContext {
+        ReadContext { arrow_schema }
+    }
+
+    pub fn to_arrow_metadata(&self) -> Result<Vec<u8>> {
+        let mut arrow_schema_bytes = vec![];
+        let _writer = StreamWriter::try_new(&mut arrow_schema_bytes, &self.arrow_schema)?;
+        Ok(arrow_schema_bytes)
+    }
+}
+
+pub enum LogRecordIterator {
+    Empty,
+    Arrow(ArrowLogRecordIterator),
+}
+
+impl LogRecordIterator {
+    pub fn empty() -> Self {
+        LogRecordIterator::Empty
+    }
+}
+
+impl Iterator for LogRecordIterator {
+    type Item = ScanRecord;
+
+    fn next(&mut self) -> Option<Self::Item> {
+        match self {
+            LogRecordIterator::Empty => None,
+            LogRecordIterator::Arrow(iter) => iter.next(),
+        }
+    }
+}
+
+pub struct ArrowLogRecordIterator {
+    reader: ArrowReader,
+    base_offset: i64,
+    timestamp: i64,
+    row_id: usize,
+    change_type: ChangeType,
+}
+
+#[allow(dead_code)]
+impl ArrowLogRecordIterator {
+    fn new(reader: ArrowReader, base_offset: i64, timestamp: i64, change_type: ChangeType) -> Self {
+        Self {
+            reader,
+            base_offset,
+            timestamp,
+            row_id: 0,
+            change_type,
+        }
+    }
+}
+
+impl Iterator for ArrowLogRecordIterator {
+    type Item = ScanRecord;
+
+    fn next(&mut self) -> Option<Self::Item> {
+        if self.row_id >= self.reader.row_count() {
+            return None;
+        }
+
+        let columnar_row = self.reader.read(self.row_id);
+        let scan_record = ScanRecord::new(
+            columnar_row,
+            self.base_offset + self.row_id as i64,
+            self.timestamp,
+            self.change_type,
+        );
+        self.row_id += 1;
+        Some(scan_record)
+    }
+}
+
+pub struct ArrowReader {
+    record_batch: Arc<RecordBatch>,
+}
+
+impl ArrowReader {
+    pub fn new(record_batch: Arc<RecordBatch>) -> Self {
+        ArrowReader { record_batch }
+    }
+
+    pub fn row_count(&self) -> usize {
+        self.record_batch.num_rows()
+    }
+
+    pub fn read(&self, row_id: usize) -> ColumnarRow {
+        ColumnarRow::new_with_row_id(self.record_batch.clone(), row_id)
+    }
+}
+pub struct MyVec<T>(pub StreamReader<T>);
diff --git a/fluss-rust/crates/fluss/src/record/error.rs b/fluss-rust/crates/fluss/src/record/error.rs
new file mode 100644
index 0000000000..22704a0cdf
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/error.rs
@@ -0,0 +1,27 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use std::io;
+use thiserror::Error;
+
+#[derive(Error, Debug)]
+#[non_exhaustive]
+#[allow(dead_code)]
+pub enum Error {
+    #[error(transparent)]
+    Io(#[from] io::Error),
+}
diff --git a/fluss-rust/crates/fluss/src/record/mod.rs b/fluss-rust/crates/fluss/src/record/mod.rs
new file mode 100644
index 0000000000..d7872055b9
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/mod.rs
@@ -0,0 +1,174 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::TableBucket;
+use crate::row::ColumnarRow;
+use core::fmt;
+use std::collections::HashMap;
+
+mod arrow;
+mod error;
+
+pub use arrow::*;
+
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+pub enum ChangeType {
+    /// Append-only operation
+    AppendOnly,
+    /// Insert operation
+    Insert,
+    /// Update operation containing the previous content of the updated row
+    UpdateBefore,
+    /// Update operation containing the new content of the updated row
+    UpdateAfter,
+    /// Delete operation
+    Delete,
+}
+
+impl ChangeType {
+    /// Returns a short string representation of this ChangeType
+    pub fn short_string(&self) -> &'static str {
+        match self {
+            ChangeType::AppendOnly => "+A",
+            ChangeType::Insert => "+I",
+            ChangeType::UpdateBefore => "-U",
+            ChangeType::UpdateAfter => "+U",
+            ChangeType::Delete => "-D",
+        }
+    }
+
+    /// Returns the byte value representation used for serialization
+    pub fn to_byte_value(&self) -> u8 {
+        match self {
+            ChangeType::AppendOnly => 0,
+            ChangeType::Insert => 1,
+            ChangeType::UpdateBefore => 2,
+            ChangeType::UpdateAfter => 3,
+            ChangeType::Delete => 4,
+        }
+    }
+
+    /// Creates a ChangeType from its byte value representation
+    ///
+    /// # Errors
+    /// Returns an error if the byte value doesn't correspond to any ChangeType
+    pub fn from_byte_value(value: u8) -> Result<Self, String> {
+        match value {
+            0 => Ok(ChangeType::AppendOnly),
+            1 => Ok(ChangeType::Insert),
+            2 => Ok(ChangeType::UpdateBefore),
+            3 => Ok(ChangeType::UpdateAfter),
+            4 => Ok(ChangeType::Delete),
+            _ => Err(format!("Unsupported byte value '{value}' for change type")),
+        }
+    }
+}
+
+impl fmt::Display for ChangeType {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        write!(f, "{}", self.short_string())
+    }
+}
+
+pub struct ScanRecord {
+    pub row: ColumnarRow,
+    offset: i64,
+    timestamp: i64,
+    change_type: ChangeType,
+}
+
+impl ScanRecord {
+    const INVALID: i64 = -1;
+
+    pub fn new_default(row: ColumnarRow) -> Self {
+        ScanRecord {
+            row,
+            offset: Self::INVALID,
+            timestamp: Self::INVALID,
+            change_type: ChangeType::Insert,
+        }
+    }
+
+    pub fn new(row: ColumnarRow, offset: i64, timestamp: i64, change_type: ChangeType) -> Self {
+        ScanRecord {
+            row,
+            offset,
+            timestamp,
+            change_type,
+        }
+    }
+
+    pub fn row(&self) -> &ColumnarRow {
+        &self.row
+    }
+
+    /// Returns the position in the log
+    pub fn offset(&self) -> i64 {
+        self.offset
+    }
+
+    /// Returns the timestamp
+    pub fn timestamp(&self) -> i64 {
+        self.timestamp
+    }
+
+    /// Returns the change type
+    pub fn change_type(&self) -> &ChangeType {
+        &self.change_type
+    }
+}
+
+pub struct ScanRecords {
+    records: HashMap<TableBucket, Vec<ScanRecord>>,
+}
+
+impl ScanRecords {
+    pub fn empty() -> Self {
+        Self {
+            records: HashMap::new(),
+        }
+    }
+
+    pub fn new(records: HashMap<TableBucket, Vec<ScanRecord>>) -> Self {
+        Self { records }
+    }
+
+    pub fn records(&self, scan_bucket: &TableBucket) -> &[ScanRecord] {
+        self.records.get(scan_bucket).map_or(&[], |records| records)
+    }
+
+    pub fn count(&self) -> usize {
+        self.records.values().map(|v| v.len()).sum()
+    }
+
+    pub fn is_empty(&self) -> bool {
+        self.records.is_empty()
+    }
+}
+
+impl IntoIterator for ScanRecords {
+    type Item = ScanRecord;
+    type IntoIter = std::vec::IntoIter<ScanRecord>;
+
+    fn into_iter(self) -> Self::IntoIter {
+        self.records
+            .into_values()
+            .flatten()
+            .collect::<Vec<_>>()
+            .into_iter()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
new file mode 100644
index 0000000000..44ca640b51
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -0,0 +1,169 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::row::InternalRow;
+use arrow::array::{
+    AsArray, BinaryArray, FixedSizeBinaryArray, Float32Array, Float64Array, Int8Array, Int16Array,
+    Int32Array, Int64Array, RecordBatch, StringArray,
+};
+use std::sync::Arc;
+
+pub struct ColumnarRow {
+    record_batch: Arc<RecordBatch>, // shared Arrow batch that every getter reads from
+    row_id: usize, // index of the row within `record_batch` that this view points at
+}
+
+impl ColumnarRow {
+    /// Creates a row view positioned on the first row (`row_id` 0) of `batch`.
+    pub fn new(batch: Arc<RecordBatch>) -> Self {
+        Self::new_with_row_id(batch, 0)
+    }
+
+    /// Creates a row view of `batch` positioned on `row_id` (not bounds-checked here).
+    pub fn new_with_row_id(batch: Arc<RecordBatch>, row_id: usize) -> Self {
+        ColumnarRow {
+            record_batch: batch,
+            row_id,
+        }
+    }
+
+    /// Repositions this view on another row of the same batch.
+    pub fn set_row_id(&mut self, row_id: usize) {
+        self.row_id = row_id
+    }
+}
+
+impl InternalRow for ColumnarRow {
+    fn get_field_count(&self) -> usize {
+        self.record_batch.num_columns() // one field per column of the batch
+    }
+
+    fn is_null_at(&self, pos: usize) -> bool {
+        self.record_batch.column(pos).is_null(self.row_id) // checks the current row only
+    }
+
+    fn get_boolean(&self, pos: usize) -> bool {
+        // `as_boolean` comes from the imported `AsArray` helper trait.
+        let column = self.record_batch.column(pos);
+        let flags = column.as_boolean();
+        flags.value(self.row_id)
+    }
+
+    fn get_byte(&self, pos: usize) -> i8 {
+        // Columns are dynamically typed; a mismatching column type panics in `expect`.
+        let column = self.record_batch.column(pos).as_any();
+        let typed = column
+            .downcast_ref::<Int8Array>()
+            .expect("Expect byte array");
+        typed.value(self.row_id)
+    }
+
+    fn get_short(&self, pos: usize) -> i16 {
+        let column = self.record_batch.column(pos);
+        let typed = column
+            .as_any()
+            .downcast_ref::<Int16Array>()
+            .expect("Expect short array");
+        typed.value(self.row_id)
+    }
+
+    fn get_int(&self, pos: usize) -> i32 {
+        let column = self.record_batch.column(pos);
+        let typed = column
+            .as_any()
+            .downcast_ref::<Int32Array>()
+            .expect("Expect int array");
+        typed.value(self.row_id)
+    }
+
+    fn get_long(&self, pos: usize) -> i64 {
+        let column = self.record_batch.column(pos);
+        let typed = column
+            .as_any()
+            .downcast_ref::<Int64Array>()
+            .expect("Expect long array");
+        typed.value(self.row_id)
+    }
+
+    fn get_float(&self, pos: usize) -> f32 {
+        let column = self.record_batch.column(pos);
+        let typed = column
+            .as_any()
+            .downcast_ref::<Float32Array>()
+            .expect("Expect float32 array");
+        typed.value(self.row_id)
+    }
+
+    fn get_double(&self, pos: usize) -> f64 {
+        let column = self.record_batch.column(pos);
+        let typed = column
+            .as_any()
+            .downcast_ref::<Float64Array>()
+            .expect("Expect float64 array");
+        typed.value(self.row_id)
+    }
+
+    fn get_char(&self, pos: usize, length: usize) -> String {
+        let column = self.record_batch.column(pos).as_any();
+        let fixed = column
+            .downcast_ref::<FixedSizeBinaryArray>()
+            .expect("Expected fixed-size binary array for char type");
+
+        let raw = fixed.value(self.row_id);
+        if raw.len() != length {
+            panic!(
+                "Length mismatch for fixed-size char: expected {}, got {}",
+                length,
+                raw.len()
+            );
+        }
+        // Valid UTF-8 is returned as-is; invalid sequences are replaced lossily.
+        match std::str::from_utf8(raw) {
+            Ok(text) => text.to_owned(),
+            Err(_) => String::from_utf8_lossy(raw).into_owned(),
+        }
+    }
+
+    fn get_string(&self, pos: usize) -> &str {
+        // The returned slice borrows from the batch, so no copy is made.
+        let column = self.record_batch.column(pos).as_any();
+        let strings = column
+            .downcast_ref::<StringArray>()
+            .expect("Expected String array.");
+        strings.value(self.row_id)
+    }
+
+    fn get_binary(&self, pos: usize, _length: usize) -> Vec<u8> {
+        // NOTE(review): `_length` is ignored here, whereas `get_char` validates it.
+        let column = self.record_batch.column(pos).as_any();
+        let fixed = column
+            .downcast_ref::<FixedSizeBinaryArray>()
+            .expect("Expected binary array.");
+        // Copy the value out so the result does not borrow from the batch.
+        fixed.value(self.row_id).to_vec()
+    }
+
+    fn get_bytes(&self, pos: usize) -> Vec<u8> {
+        let column = self.record_batch.column(pos).as_any();
+        let blobs = column
+            .downcast_ref::<BinaryArray>()
+            .expect("Expected bytes array.");
+        // Variable-length value, copied into an owned vector.
+        let value: &[u8] = blobs.value(self.row_id);
+        value.to_vec()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
new file mode 100644
index 0000000000..3c65a7d4ee
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -0,0 +1,287 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use chrono::Datelike;
+
+use crate::error::Error::RowConvertError;
+use crate::error::Result;
+use arrow::array::{ArrayBuilder, Int8Builder, Int16Builder, Int32Builder, StringBuilder};
+use chrono::NaiveDate;
+use ordered_float::OrderedFloat;
+use parse_display::Display;
+use ref_cast::RefCast;
+use rust_decimal::Decimal;
+use serde::{Deserialize, Serialize};
+use std::fmt;
+use std::ops::Deref;
+
+#[allow(dead_code)]
+const THIRTY_YEARS_MICROSECONDS: i64 = 946_684_800_000_000; // = 946_684_800 s in µs; presumably the 1970→2000 offset — TODO confirm
+
+pub const UNIX_EPOCH_DAYS: i32 = 719_163; // added to a `Date`'s day count before `NaiveDate::from_num_days_from_ce_opt`
+
+#[derive(Debug, Clone, Display, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize)]
+pub enum Datum<'a> {
+    #[display("null")]
+    Null, // absence of a value; what `is_null()` tests for
+    #[display("{0}")]
+    Bool(bool),
+    #[display("{0}")]
+    Int16(i16),
+    #[display("{0}")]
+    Int32(i32),
+    #[display("{0}")]
+    Int64(i64),
+    #[display("{0}")]
+    Float64(F64), // `F64` is `OrderedFloat<f64>`, which lets the enum derive `Eq`/`Ord`/`Hash`
+    #[display("'{0}'")]
+    String(&'a str), // borrowed text; displayed wrapped in single quotes
+    #[display("{0}")]
+    Blob(Blob), // owned byte buffer
+    #[display("{0}")]
+    Decimal(Decimal),
+    #[display("{0}")]
+    Date(Date),
+    #[display("{0}")]
+    Timestamp(Timestamp),
+    #[display("{0}")]
+    TimestampTz(TimestampLtz), // note: the variant is named `Tz` but wraps `TimestampLtz`
+}
+
+impl Datum<'_> {
+    pub fn is_null(&self) -> bool {
+        *self == Datum::Null // only the `Null` variant counts as null
+    }
+
+    pub fn as_str(&self) -> &str {
+        let Self::String(text) = self else {
+            panic!("not a string: {self:?}") // reached for every non-`String` variant
+        };
+        text
+    }
+}
+
+// ----------- conversions: `From` / `TryFrom` implementations
+impl<'a> From<i32> for Datum<'a> {
+    #[inline]
+    fn from(value: i32) -> Self {
+        Self::Int32(value) // plain wrap; the integer is stored unchanged
+    }
+}
+
+impl<'a> From<&'a str> for Datum<'a> {
+    #[inline]
+    fn from(text: &'a str) -> Self {
+        Self::String(text) // keeps borrowing the caller's string; nothing is copied
+    }
+}
+
+impl From<Option<&()>> for Datum<'_> {
+    fn from(_: Option<&()>) -> Self {
+        Self::Null // the argument is ignored: `Some(&())` and `None` both become `Null`
+    }
+}
+
+impl TryFrom<&Datum<'_>> for i32 {
+    type Error = ();
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        if let Datum::Int32(value) = from {
+            return Ok(*value);
+        }
+        Err(()) // every other variant is rejected, with no detail attached
+    }
+}
+
+impl<'a> TryFrom<&Datum<'a>> for &'a str {
+    type Error = ();
+
+    #[inline]
+    fn try_from(from: &Datum<'a>) -> std::result::Result<Self, Self::Error> {
+        if let Datum::String(text) = from {
+            return Ok(*text);
+        }
+        Err(()) // every other variant is rejected, with no detail attached
+    }
+}
+
+pub trait ToArrow {
+    fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()>; // append `self` to a type-erased Arrow builder
+}
+
+impl Datum<'_> {
+    pub fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()> {
+        match self { // arms with a `ToArrow` impl delegate to it; the rest still panic via `todo!()`
+            Datum::Null => {
+                todo!()
+            }
+            Datum::Bool(_v) => {
+                todo!()
+            }
+            Datum::Int16(v) => {
+                v.append_to(builder)?; // `builder` must be an `Int16Builder`, else `RowConvertError`
+            }
+            Datum::Int32(v) => {
+                v.append_to(builder)?; // `builder` must be an `Int32Builder`, else `RowConvertError`
+            }
+            Datum::Int64(_v) => {
+                todo!()
+            }
+            Datum::Float64(_v) => {
+                todo!()
+            }
+            Datum::String(v) => {
+                v.append_to(builder)?; // `builder` must be a `StringBuilder`, else `RowConvertError`
+            }
+            Datum::Blob(_v) => {
+                todo!()
+            }
+            Datum::Decimal(_v) => {
+                todo!()
+            }
+            Datum::Date(_v) => {
+                todo!()
+            }
+            Datum::Timestamp(_v) => {
+                todo!()
+            }
+            Datum::TimestampTz(_v) => {
+                todo!()
+            }
+        }
+        Ok(())
+    }
+}
+
+macro_rules! impl_to_arrow {
+    ($ty:ty, $variant:ident) => {
+        impl ToArrow for $ty {
+            fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()> {
+                // Recover the concrete builder; a type mismatch is reported, not panicked on.
+                let Some(typed) = builder.as_any_mut().downcast_mut::<$variant>() else {
+                    return Err(RowConvertError(format!(
+                        "Cannot cast {} to {} builder",
+                        stringify!($ty),
+                        stringify!($variant)
+                    )));
+                };
+                typed.append_value(*self);
+                Ok(())
+            }
+        }
+    };
+}
+
+impl_to_arrow!(i8, Int8Builder); // each line pairs a Rust type with the builder it may append to
+impl_to_arrow!(i16, Int16Builder);
+impl_to_arrow!(i32, Int32Builder);
+impl_to_arrow!(&str, StringBuilder);
+
+#[allow(dead_code)]
+pub type F32 = OrderedFloat<f32>; // totally ordered `f32` wrapper from `ordered_float`
+pub type F64 = OrderedFloat<f64>; // payload type of `Datum::Float64`
+#[allow(dead_code)]
+pub type Str = Box<str>; // owned, fixed-size string
+
+#[derive(PartialEq, Eq, PartialOrd, Ord, Hash, Clone, Serialize, Deserialize, Default)]
+pub struct Blob(Box<[u8]>); // owned byte buffer; dereferences to `BlobRef`
+
+impl Deref for Blob {
+    type Target = BlobRef;
+
+    fn deref(&self) -> &Self::Target {
+        BlobRef::new(&self.0) // view the boxed bytes as a `BlobRef` without copying
+    }
+}
+
+impl BlobRef {
+    pub fn new(bytes: &[u8]) -> &Self {
+        // `BlobRef` is `#[repr(transparent)]` over `[u8]` and derives `RefCast`, so this is a safe reference cast.
+        BlobRef::ref_cast(bytes)
+    }
+}
+
+/// A borrowed, unsized view over the bytes of a blob (the target of `Blob`'s `Deref`).
+#[repr(transparent)]
+#[derive(PartialEq, Eq, PartialOrd, Ord, RefCast, Hash)]
+pub struct BlobRef([u8]);
+
+impl fmt::Debug for Blob {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        write!(f, "{:?}", self.as_ref()) // prints the bytes using the slice's `Debug` form
+    }
+}
+
+impl fmt::Display for Blob {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        write!(f, "{:?}", self.as_ref()) // same output as `Debug`: the slice's `{:?}` form
+    }
+}
+
+impl AsRef<[u8]> for BlobRef {
+    fn as_ref(&self) -> &[u8] {
+        &self.0 // the wrapped byte slice itself
+    }
+}
+
+impl Deref for BlobRef {
+    type Target = [u8];
+
+    fn deref(&self) -> &Self::Target {
+        &self.0 // exposes slice methods directly on `BlobRef`
+    }
+}
+
+#[derive(PartialOrd, Ord, Display, PartialEq, Eq, Debug, Copy, Clone, Default, Hash, Serialize)]
+pub struct Date(i32); // day count; `UNIX_EPOCH_DAYS` is added before the chrono conversion in `year()`/`month()`/`day()`
+
+#[derive(PartialOrd, Ord, Display, PartialEq, Eq, Debug, Copy, Clone, Default, Hash, Serialize)]
+pub struct Timestamp(i64); // unit and epoch are not visible here — TODO confirm with callers
+
+#[derive(PartialOrd, Ord, Display, PartialEq, Eq, Debug, Copy, Clone, Default, Hash, Serialize)]
+pub struct TimestampLtz(i64); // payload of `Datum::TimestampTz`; unit and epoch not visible here — TODO confirm
+
+impl From<Vec<u8>> for Blob {
+    fn from(vec: Vec<u8>) -> Self {
+        Self(vec.into_boxed_slice()) // takes ownership of the vector's bytes
+    }
+}
+
+impl Date {
+    pub const fn new(inner: i32) -> Self {
+        Self(inner)
+    }
+
+    /// Get the inner value of date type
+    pub fn get_inner(&self) -> i32 {
+        self.0
+    }
+    /// Shifts the inner day count by `UNIX_EPOCH_DAYS`; panics if chrono rejects the result.
+    fn to_naive_date(self) -> NaiveDate {
+        NaiveDate::from_num_days_from_ce_opt(self.0 + UNIX_EPOCH_DAYS).unwrap()
+    }
+    pub fn year(&self) -> i32 {
+        self.to_naive_date().year()
+    }
+    pub fn month(&self) -> i32 {
+        self.to_naive_date().month() as i32
+    }
+    pub fn day(&self) -> i32 {
+        self.to_naive_date().day() as i32
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
new file mode 100644
index 0000000000..ead6ff0067
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -0,0 +1,148 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::row::datum::Datum;
+
+mod column;
+
+mod datum;
+
+pub use column::*;
+
+pub trait InternalRow {
+    /// Returns the number of fields in this row
+    fn get_field_count(&self) -> usize;
+
+    /// Returns true if the element is null at the given position
+    fn is_null_at(&self, pos: usize) -> bool;
+
+    /// Returns the boolean value at the given position
+    fn get_boolean(&self, pos: usize) -> bool;
+
+    /// Returns the byte (`i8`) value at the given position
+    fn get_byte(&self, pos: usize) -> i8;
+
+    /// Returns the short (`i16`) value at the given position
+    fn get_short(&self, pos: usize) -> i16;
+
+    /// Returns the integer (`i32`) value at the given position
+    fn get_int(&self, pos: usize) -> i32;
+
+    /// Returns the long (`i64`) value at the given position
+    fn get_long(&self, pos: usize) -> i64;
+
+    /// Returns the float (`f32`) value at the given position
+    fn get_float(&self, pos: usize) -> f32;
+
+    /// Returns the double (`f64`) value at the given position
+    fn get_double(&self, pos: usize) -> f64;
+
+    /// Returns the fixed-length string value at the given position as an owned `String`
+    fn get_char(&self, pos: usize, length: usize) -> String;
+
+    /// Returns the string value at the given position, borrowed from the row
+    fn get_string(&self, pos: usize) -> &str;
+
+    // /// Returns the decimal value at the given position
+    // fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Decimal;
+
+    // /// Returns the timestamp value at the given position
+    // fn get_timestamp_ntz(&self, pos: usize, precision: usize) -> TimestampNtz;
+
+    // /// Returns the timestamp value at the given position
+    // fn get_timestamp_ltz(&self, pos: usize, precision: usize) -> TimestampLtz;
+
+    /// Returns the fixed-length binary value at the given position as an owned copy
+    fn get_binary(&self, pos: usize, length: usize) -> Vec<u8>;
+
+    /// Returns the binary value at the given position as an owned copy
+    fn get_bytes(&self, pos: usize) -> Vec<u8>;
+}
+
+pub struct GenericRow<'a> {
+    pub values: Vec<Datum<'a>>, // field values, indexed by field position
+}
+
+impl<'a> InternalRow for GenericRow<'a> {
+    fn get_field_count(&self) -> usize {
+        self.values.len()
+    }
+
+    fn is_null_at(&self, pos: usize) -> bool {
+        matches!(self.values.get(pos), Some(Datum::Null)) // out-of-range `pos` still reports false
+    }
+
+    fn get_boolean(&self, _pos: usize) -> bool {
+        todo!()
+    }
+
+    fn get_byte(&self, _pos: usize) -> i8 {
+        todo!()
+    }
+
+    fn get_short(&self, _pos: usize) -> i16 {
+        todo!()
+    }
+
+    fn get_int(&self, pos: usize) -> i32 {
+        self.values.get(pos).unwrap().try_into().unwrap() // panics if absent or not `Int32`
+    }
+
+    fn get_long(&self, _pos: usize) -> i64 {
+        todo!()
+    }
+
+    fn get_float(&self, _pos: usize) -> f32 {
+        todo!()
+    }
+
+    fn get_double(&self, _pos: usize) -> f64 {
+        todo!()
+    }
+
+    fn get_char(&self, _pos: usize, _length: usize) -> String {
+        todo!()
+    }
+
+    fn get_string(&self, pos: usize) -> &str {
+        self.values.get(pos).unwrap().try_into().unwrap() // panics if absent or not `String`
+    }
+
+    fn get_binary(&self, _pos: usize, _length: usize) -> Vec<u8> {
+        todo!()
+    }
+
+    fn get_bytes(&self, _pos: usize) -> Vec<u8> {
+        todo!()
+    }
+}
+
+impl<'a> Default for GenericRow<'a> {
+    fn default() -> Self {
+        Self::new() // same as `GenericRow::new()`: a row with no fields
+    }
+}
+
+impl<'a> GenericRow<'a> {
+    pub fn new() -> GenericRow<'a> {
+        GenericRow { values: vec![] }
+    }
+    pub fn set_field(&mut self, pos: usize, value: impl Into<Datum<'a>>) {
+        self.values.resize(self.values.len().max(pos + 1), Datum::Null); // pad gaps with Null
+        self.values[pos] = value.into(); // overwrite in place; later fields keep their positions
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
new file mode 100644
index 0000000000..49282084ef
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -0,0 +1,54 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::api_key::ApiKey::Unknown;
+
+#[derive(Debug, PartialEq, Eq, PartialOrd, Ord, Hash, Clone, Copy)]
+pub enum ApiKey {
+    CreateTable, // wire code 1005
+    ProduceLog, // wire code 1014
+    FetchLog, // wire code 1015
+    MetaData, // wire code 1012
+    GetTable, // wire code 1007
+    Unknown(i16), // any other code, kept verbatim
+}
+
+impl From<i16> for ApiKey {
+    fn from(key: i16) -> Self {
+        match key {
+            1005 => Self::CreateTable,
+            1007 => Self::GetTable,
+            1012 => Self::MetaData,
+            1014 => Self::ProduceLog,
+            1015 => Self::FetchLog,
+            other => Self::Unknown(other), // unrecognised codes are preserved as-is
+        }
+    }
+}
+
+impl From<ApiKey> for i16 {
+    fn from(key: ApiKey) -> Self {
+        match key {
+            ApiKey::CreateTable => 1005,
+            ApiKey::GetTable => 1007,
+            ApiKey::MetaData => 1012,
+            ApiKey::ProduceLog => 1014,
+            ApiKey::FetchLog => 1015,
+            ApiKey::Unknown(code) => code, // round-trips whatever code was stored
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/api_version.rs b/fluss-rust/crates/fluss/src/rpc/api_version.rs
new file mode 100644
index 0000000000..395c45cd0f
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/api_version.rs
@@ -0,0 +1,54 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#[derive(Debug, PartialEq, Eq, PartialOrd, Ord, Hash, Clone, Copy)]
+pub struct ApiVersion(pub i16); // version number; ordered by its inner value
+
+#[derive(Debug, PartialEq, Eq, Clone, Copy)]
+pub struct ApiVersionRange {
+    min: ApiVersion, // `new` asserts `min.0 <= max.0`
+    max: ApiVersion,
+}
+
+impl std::fmt::Display for ApiVersion {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.write_fmt(format_args!("{}", self.0)) // prints the bare version number
+    }
+}
+
+#[allow(dead_code)]
+impl ApiVersionRange {
+    pub const fn new(min: ApiVersion, max: ApiVersion) -> Self {
+        assert!(min.0 <= max.0); // rejects an inverted range by panicking
+
+        Self { min, max }
+    }
+
+    pub fn min(&self) -> ApiVersion {
+        self.min // lower bound as passed to `new`
+    }
+
+    pub fn max(&self) -> ApiVersion {
+        self.max // upper bound as passed to `new`
+    }
+}
+
+impl std::fmt::Display for ApiVersionRange {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.write_fmt(format_args!("{}:{}", self.min, self.max)) // rendered as `min:max`
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/convert.rs b/fluss-rust/crates/fluss/src/rpc/convert.rs
new file mode 100644
index 0000000000..6feb7eb8af
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/convert.rs
@@ -0,0 +1,43 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::cluster::{ServerNode, ServerType};
+use crate::metadata::TablePath;
+use crate::proto::{PbServerNode, PbTablePath};
+
+pub fn to_table_path(table_path: &TablePath) -> PbTablePath {
+    PbTablePath { // protobuf form of a table path; both names are copied into owned strings
+        database_name: table_path.database().to_string(),
+        table_name: table_path.table().to_string(),
+    }
+}
+
+pub fn from_pb_server_node(pb_server_node: PbServerNode, server_type: ServerType) -> ServerNode {
+    ServerNode::new( // consumes the protobuf node; `server_type` is supplied by the caller
+        pb_server_node.node_id,
+        pb_server_node.host,
+        pb_server_node.port as u32, // NOTE(review): `as` is unchecked — confirm `port` cannot be negative
+        server_type,
+    )
+}
+
+pub fn from_pb_table_path(pb_table_path: &PbTablePath) -> TablePath {
+    TablePath::new( // inverse of `to_table_path`; both names are cloned out of the message
+        pb_table_path.database_name.to_string(),
+        pb_table_path.table_name.to_string(),
+    )
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/error.rs b/fluss-rust/crates/fluss/src/rpc/error.rs
new file mode 100644
index 0000000000..84b20b102e
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/error.rs
@@ -0,0 +1,50 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use std::sync::Arc;
+use thiserror::Error;
+
+#[derive(Error, Debug)]
+#[non_exhaustive]
+pub enum RpcError {
+    #[error("Cannot write message: {0}")]
+    WriteMessageError(#[from] crate::rpc::frame::WriteError),
+    /// A framed message could not be read; wraps the frame-level `ReadError`.
+    #[error("Cannot read framed message: {0}")]
+    ReadMessageError(#[from] crate::rpc::frame::ReadError),
+    /// Connection-level failure; the `String` payload is included in the message.
+    #[error("connection error: {0}")]
+    ConnectionError(String),
+    /// Low-level I/O failure, converted from `std::io::Error`.
+    #[error("IO Error: {0}")]
+    IO(#[from] std::io::Error),
+    /// The connection is poisoned; carries the shared error reported with it.
+    #[error("Connection is poisoned: {0}")]
+    Poisoned(Arc<RpcError>),
+    /// The message held more bytes (`message_size`) than were consumed (`read`).
+    #[error(
+        "Data left at the end of the message. Got {message_size} bytes but only read {read} bytes. api_key={api_key:?} api_version={api_version}"
+    )]
+    TooMuchData {
+        message_size: u64,
+        read: u64,
+        api_key: ApiKey,
+        api_version: ApiVersion,
+    },
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/frame.rs b/fluss-rust/crates/fluss/src/rpc/frame.rs
new file mode 100644
index 0000000000..44dadc9408
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/frame.rs
@@ -0,0 +1,106 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use thiserror::Error;
+use tokio::io::{AsyncRead, AsyncReadExt, AsyncWrite, AsyncWriteExt};
+
+#[derive(Error, Debug)]
+#[non_exhaustive]
+pub enum ReadError {
+    #[error("Cannot read data: {0}")]
+    IO(#[from] std::io::Error), // any failure of the underlying reader
+
+    #[error("Negative message size: {size}")]
+    NegativeMessageSize { size: i32 }, // the 4-byte length prefix decoded to a negative value
+
+    #[error("Message too large, limit is {limit} bytes but got {actual} bytes")]
+    MessageTooLarge { limit: usize, actual: usize }, // the length prefix exceeded `max_message_size`
+}
+
+pub trait AsyncMessageRead {
+    fn read_message( // reads one length-prefixed message and returns its payload bytes
+        &mut self,
+        max_message_size: usize, // longer messages are rejected with `MessageTooLarge`
+    ) -> impl Future<Output = Result<Vec<u8>, ReadError>> + Send;
+}
+
+impl<R> AsyncMessageRead for R
+where
+    R: AsyncRead + Send + Unpin,
+{
+    /// Reads one frame: a 4-byte big-endian signed length followed by that many bytes.
+    /// An oversized frame is drained from the stream before `MessageTooLarge` is returned.
+    async fn read_message(&mut self, max_message_size: usize) -> Result<Vec<u8>, ReadError> {
+        let mut len_buf = [0u8; 4];
+        self.read_exact(&mut len_buf).await?;
+        let len = i32::from_be_bytes(len_buf);
+        let len = usize::try_from(len).map_err(|_| ReadError::NegativeMessageSize { size: len })?;
+        // check max message size to not blow up memory
+        if len > max_message_size {
+            // We need to seek so that next message is readable. However `self.seek` would require `R: AsyncSeek` which
+            // doesn't hold for many types we want to work with. So do some manual seeking.
+            let mut to_read = len;
+            let mut buf = vec![]; // allocate empty buffer
+            while to_read > 0 {
+                // Never let the step be 0: with `max_message_size == 0` the loop would
+                // otherwise read nothing, make no progress and spin forever.
+                let step = max_message_size.max(1).min(to_read);
+                // resize buffer if required
+                buf.resize(step, 0);
+                self.read_exact(&mut buf).await?;
+                to_read -= step;
+            }
+            return Err(ReadError::MessageTooLarge {
+                limit: max_message_size,
+                actual: len,
+            });
+        }
+
+        let mut buf = vec![0u8; len];
+        self.read_exact(&mut buf).await?;
+        Ok(buf)
+    }
+}
+
+#[derive(Error, Debug)]
+#[non_exhaustive]
+pub enum WriteError {
+    #[error("Cannot write data: {0}")]
+    IO(#[from] std::io::Error), // any failure of the underlying writer
+
+    #[error("Message too large: {size}")]
+    TooLarge { size: usize }, // the payload length does not fit the `i32` length prefix
+}
+
+pub trait AsyncMessageWrite {
+    fn write_message(&mut self, msg: &[u8]) -> impl Future<Output = Result<(), WriteError>> + Send; // writes `msg` as one length-prefixed message
+}
+
+impl<W> AsyncMessageWrite for W
+where
+    W: AsyncWrite + Send + Unpin,
+{
+    async fn write_message(&mut self, msg: &[u8]) -> Result<(), WriteError> {
+        let payload_len = i32::try_from(msg.len());
+        let header = payload_len.map_err(|_| WriteError::TooLarge { size: msg.len() })?;
+        self.write_all(&header.to_be_bytes()).await?; // 4-byte big-endian length prefix
+        match msg {
+            [] => Ok(()), // an empty message consists of the prefix alone
+            body => Ok(self.write_all(body).await?),
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_table.rs b/fluss-rust/crates/fluss/src/rpc/message/create_table.rs
new file mode 100644
index 0000000000..5802e71797
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_table.rs
@@ -0,0 +1,62 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::{JsonSerde, TableDescriptor, TablePath};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+
+use crate::error::Result as FlussResult;
+use crate::proto::CreateTableResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::convert::to_table_path;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct CreateTableRequest {
+    pub inner_request: proto::CreateTableRequest, // the protobuf message this type wraps
+}
+
+impl CreateTableRequest {
+    pub fn new(
+        table_path: &TablePath,
+        table_descriptor: &TableDescriptor,
+        ignore_if_exists: bool,
+    ) -> FlussResult<Self> {
+        let table_json = serde_json::to_vec(&table_descriptor.serialize_json()?).unwrap();
+        let inner_request = proto::CreateTableRequest {
+            table_path: to_table_path(table_path),
+            table_json, // NOTE(review): a `serde_json::to_vec` failure panics via `unwrap()` above
+            ignore_if_exists,
+        };
+        Ok(Self { inner_request })
+    }
+}
+
+impl RequestBody for CreateTableRequest {
+    type ResponseBody = CreateTableResponse; // response type paired with this request
+
+    const API_KEY: ApiKey = ApiKey::CreateTable; // maps to wire code 1005 in `From<ApiKey> for i16`
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(CreateTableRequest); // crate macro imported above; presumably implements `WriteVersionedType` — confirm
+impl_read_version_type!(CreateTableResponse); // crate macro imported above; presumably implements `ReadVersionedType` — confirm
diff --git a/fluss-rust/crates/fluss/src/rpc/message/fetch.rs b/fluss-rust/crates/fluss/src/rpc/message/fetch.rs
new file mode 100644
index 0000000000..6ebc5a2b33
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/fetch.rs
@@ -0,0 +1,56 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::FetchLogResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use prost::Message;
+
+use bytes::{Buf, BufMut};
+
+#[allow(dead_code)]
+const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024; // 16 MiB
+#[allow(dead_code)]
+const LOG_FETCH_MIN_BYTES: i32 = 1;
+#[allow(dead_code)]
+const LOG_FETCH_WAIT_MAX_TIME: i32 = 500; // presumably milliseconds — TODO confirm
+
+/// RPC request sent under `ApiKey::FetchLog`; wraps a caller-built protobuf `FetchLogRequest`.
+pub struct FetchLogRequest {
+    pub inner_request: proto::FetchLogRequest,
+}
+
+impl FetchLogRequest {
+    /// Wraps `fetch_log_request` without modifying it.
+    pub fn new(fetch_log_request: proto::FetchLogRequest) -> Self {
+        let inner_request = fetch_log_request;
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for FetchLogRequest {
+    type ResponseBody = FetchLogResponse;
+    const API_KEY: ApiKey = ApiKey::FetchLog;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+// The codec impls below are macro-generated: prost-encode `inner_request`, prost-decode the reply.
+impl_write_version_type!(FetchLogRequest);
+impl_read_version_type!(FetchLogResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_table.rs b/fluss-rust/crates/fluss/src/rpc/message/get_table.rs
new file mode 100644
index 0000000000..4f4d6c7a41
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_table.rs
@@ -0,0 +1,54 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::{GetTableInfoRequest, GetTableInfoResponse, PbTablePath};
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+
+use crate::metadata::TablePath;
+use crate::{impl_read_version_type, impl_write_version_type};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+/// RPC request sent under `ApiKey::GetTable`; the reply type is `GetTableInfoResponse`.
+#[derive(Debug)]
+pub struct GetTableRequest {
+    pub inner_request: GetTableInfoRequest,
+}
+
+impl GetTableRequest {
+    /// Builds the lookup for `table_path`, copying its database and table names into the message.
+    pub fn new(table_path: &TablePath) -> Self {
+        let table_path = PbTablePath {
+            database_name: table_path.database().to_owned(),
+            table_name: table_path.table().to_owned(),
+        };
+        let inner_request = GetTableInfoRequest { table_path };
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for GetTableRequest {
+    type ResponseBody = GetTableInfoResponse;
+    const API_KEY: ApiKey = ApiKey::GetTable;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(GetTableRequest);
+impl_read_version_type!(GetTableInfoResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/header.rs b/fluss-rust/crates/fluss/src/rpc/message/header.rs
new file mode 100644
index 0000000000..fe60f8c997
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/header.rs
@@ -0,0 +1,73 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, WriteVersionedType};
+use bytes::{Buf, BufMut};
+
+#[allow(dead_code)]
+const REQUEST_HEADER_LENGTH: i32 = 8; // matches the i16 + i16 + i32 that `RequestHeader` writes
+const SUCCESS_RESPONSE: u8 = 0; // the only response-type byte `ResponseHeader::read_versioned` accepts
+#[allow(dead_code)]
+const ERROR_RESPONSE: u8 = 1; // not handled yet: any non-success type byte currently hits `todo!`
+#[allow(dead_code)]
+const SERVER_FAILURE: u8 = 2; // not handled yet either
+
+/// Header written in front of every request body.
+#[derive(Debug, PartialEq, Eq)]
+pub struct RequestHeader {
+    /// The API key of this request.
+    pub request_api_key: ApiKey,
+    /// The API version of this request.
+    pub request_api_version: ApiVersion,
+    /// Id used to match the response to this request.
+    pub request_id: i32,
+    /// Client identifier; not written by `write_versioned`.
+    pub client_id: Option<String>,
+}
+
+impl<W: BufMut> WriteVersionedType<W> for RequestHeader {
+    /// Writes the API key and API version as `i16`s, then the request id as an `i32`.
+    fn write_versioned(&self, writer: &mut W, _version: ApiVersion) -> Result<(), WriteError> {
+        let api_key: i16 = self.request_api_key.into();
+        writer.put_i16(api_key);
+        writer.put_i16(self.request_api_version.0);
+        writer.put_i32(self.request_id);
+        Ok(())
+    }
+}
+
+/// Header parsed from the front of every response message.
+#[derive(Debug, PartialEq, Eq)]
+pub struct ResponseHeader {
+    pub request_id: i32,
+}
+
+impl<R: Buf> ReadVersionedType<R> for ResponseHeader {
+    /// Reads the response-type byte, then the `i32` request id.
+    /// NOTE(review): never returns `Err` today — a non-success type byte hits `todo!`, and the `Buf`
+    /// getters panic on a short buffer (see the `bytes::Buf` docs), so bad input panics the caller.
+    fn read_versioned(reader: &mut R, _version: ApiVersion) -> Result<Self, ReadError> {
+        if reader.get_u8() != SUCCESS_RESPONSE {
+            todo!("handle unsuccess response type");
+        }
+        let request_id = reader.get_i32();
+        Ok(Self { request_id })
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
new file mode 100644
index 0000000000..742c39369d
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -0,0 +1,97 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use bytes::{Buf, BufMut};
+
+mod create_table;
+mod fetch;
+mod get_table;
+mod header;
+mod produce_log;
+mod update_metadata;
+
+pub use create_table::*;
+pub use fetch::*;
+pub use get_table::*;
+pub use header::*;
+pub use produce_log::*;
+pub use update_metadata::*;
+
+pub trait RequestBody {
+    type ResponseBody; // type the reply to this request is decoded into
+    /// API key written into the request header for this request type.
+    const API_KEY: ApiKey;
+    /// Request version declared by this request type.
+    const REQUEST_VERSION: ApiVersion;
+}
+
+impl<T: RequestBody> RequestBody for &T {
+    type ResponseBody = T::ResponseBody;
+    // Everything is forwarded from `T`, so a `&T` carries the same metadata as the request it borrows.
+    const API_KEY: ApiKey = T::API_KEY;
+
+    const REQUEST_VERSION: ApiVersion = T::REQUEST_VERSION;
+}
+
+/// Implemented by types that can serialize themselves into a `BufMut`.
+pub trait WriteVersionedType<W: BufMut>: Sized {
+    /// Appends the encoding of `self` to `writer`.
+    /// `version` is the API version to encode for.
+    fn write_versioned(&self, writer: &mut W, version: ApiVersion) -> Result<(), WriteError>;
+}
+
+/// Implemented by types that can be parsed out of a `Buf`.
+pub trait ReadVersionedType<R: Buf>: Sized {
+    /// Decodes a value from `reader`, advancing it past the consumed bytes.
+    /// `version` is the API version the data is expected to be encoded with.
+    fn read_versioned(reader: &mut R, version: ApiVersion) -> Result<Self, ReadError>;
+}
+
+/// Implements `WriteVersionedType` for `$type` by prost-encoding its `inner_request` field.
+#[macro_export]
+macro_rules! impl_write_version_type {
+    ($type:ty) => {
+        impl<W: BufMut> WriteVersionedType<W> for $type {
+            fn write_versioned(
+                &self,
+                writer: &mut W,
+                _version: ApiVersion,
+            ) -> Result<(), WriteError> {
+                // NOTE(review): an encode error panics here instead of becoming a `WriteError`.
+                self.inner_request.encode(writer).unwrap();
+                Ok(())
+            }
+        }
+    };
+}
+
+/// Implements `ReadVersionedType` for the prost message `$type` by decoding it from the reader.
+#[macro_export]
+macro_rules! impl_read_version_type {
+    ($type:ty) => {
+        impl<R: Buf> ReadVersionedType<R> for $type {
+            fn read_versioned(reader: &mut R, _version: ApiVersion) -> Result<Self, ReadError> {
+                // NOTE(review): a payload that fails to decode panics here instead of returning `ReadError`.
+                let decoded = <$type>::decode(reader).unwrap();
+                Ok(decoded)
+            }
+        }
+    };
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
new file mode 100644
index 0000000000..7da2b59a2d
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
@@ -0,0 +1,71 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Result as FlussResult;
+use crate::proto::{PbProduceLogReqForBucket, ProduceLogResponse};
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use std::sync::Arc;
+
+use crate::client::ReadyWriteBatch;
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+/// RPC request sent under `ApiKey::ProduceLog`; the reply type is `ProduceLogResponse`.
+pub struct ProduceLogRequest {
+    pub inner_request: proto::ProduceLogRequest,
+}
+
+impl ProduceLogRequest {
+    /// Assembles a produce request for `table_id` with one bucket entry per ready batch.
+    ///
+    /// Returns the first error raised while building a batch's record payload.
+    pub fn new(
+        table_id: i64,
+        ack: i16,
+        max_request_timeout_ms: i32,
+        ready_batches: Vec<&Arc<ReadyWriteBatch>>,
+    ) -> FlussResult<Self> {
+        let mut inner_request = proto::ProduceLogRequest {
+            table_id,
+            acks: i32::from(ack),
+            timeout_ms: max_request_timeout_ms,
+            ..Default::default()
+        };
+        for batch in ready_batches {
+            let bucket = &batch.table_bucket;
+            inner_request.buckets_req.push(PbProduceLogReqForBucket {
+                partition_id: bucket.partition_id(),
+                bucket_id: bucket.bucket_id(),
+                records: batch.write_batch.build()?,
+            });
+        }
+        Ok(Self { inner_request })
+    }
+}
+
+impl RequestBody for ProduceLogRequest {
+    type ResponseBody = ProduceLogResponse;
+    const API_KEY: ApiKey = ApiKey::ProduceLog;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(ProduceLogRequest);
+impl_read_version_type!(ProduceLogResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs b/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
new file mode 100644
index 0000000000..0d8ad6464a
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
@@ -0,0 +1,60 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::{MetadataResponse, PbTablePath};
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+
+use crate::metadata::TablePath;
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+/// RPC request sent under `ApiKey::MetaData`; the reply type is `MetadataResponse`.
+pub struct UpdateMetadataRequest {
+    pub inner_request: proto::MetadataRequest,
+}
+
+impl UpdateMetadataRequest {
+    /// Builds a metadata request naming `table_paths`; both partition lists are left empty.
+    pub fn new(table_paths: &[&TablePath]) -> Self {
+        let mut table_path = Vec::with_capacity(table_paths.len());
+        for path in table_paths {
+            table_path.push(PbTablePath {
+                database_name: path.database().to_string(),
+                table_name: path.table().to_string(),
+            });
+        }
+        let inner_request = proto::MetadataRequest {
+            table_path,
+            partitions_path: Vec::new(),
+            partitions_id: Vec::new(),
+        };
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for UpdateMetadataRequest {
+    type ResponseBody = MetadataResponse;
+    const API_KEY: ApiKey = ApiKey::MetaData;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(UpdateMetadataRequest);
+impl_read_version_type!(MetadataResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/mod.rs b/fluss-rust/crates/fluss/src/rpc/mod.rs
new file mode 100644
index 0000000000..496c015073
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/mod.rs
@@ -0,0 +1,31 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+mod api_key;
+mod api_version;
+mod error;
+mod frame;
+pub mod message;
+pub use error::*;
+mod server_connection;
+pub use server_connection::*;
+mod convert;
+mod transport;
+
+pub use message::*;
+
+pub use convert::*;
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
new file mode 100644
index 0000000000..a102aa3ba6
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -0,0 +1,402 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::cluster::ServerNode;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::error::RpcError;
+use crate::rpc::error::RpcError::ConnectionError;
+use crate::rpc::frame::{AsyncMessageRead, AsyncMessageWrite};
+use crate::rpc::message::{
+    ReadVersionedType, RequestBody, RequestHeader, ResponseHeader, WriteVersionedType,
+};
+use crate::rpc::transport::Transport;
+use futures::future::BoxFuture;
+use parking_lot::{Mutex, RwLock};
+use std::collections::HashMap;
+use std::io::Cursor;
+use std::ops::DerefMut;
+use std::sync::Arc;
+use std::sync::atomic::{AtomicI32, Ordering};
+use std::task::Poll;
+use std::time::Duration;
+use tokio::io::{AsyncRead, AsyncWrite, AsyncWriteExt, BufStream, WriteHalf};
+use tokio::sync::Mutex as AsyncMutex;
+use tokio::sync::oneshot::{Sender, channel};
+use tokio::task::JoinHandle;
+use tracing::warn;
+
+pub type MessengerTransport = ServerConnectionInner<BufStream<Transport>>;
+/// Shared handle to a connection, as returned by `RpcClient::get_connection`.
+pub type ServerConnection = Arc<MessengerTransport>;
+
+#[derive(Debug)]
+pub struct RpcClient {
+    connections: RwLock<HashMap<String, ServerConnection>>,
+    client_id: Arc<str>,
+    timeout: Option<Duration>,
+    max_message_size: usize,
+}
+
+impl Default for RpcClient {
+    /// Same as [`RpcClient::new`]. The derived impl used to leave `max_message_size` at 0.
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+impl RpcClient {
+    /// Creates a client with an empty connection cache, no timeout and `usize::MAX` as size limit.
+    pub fn new() -> Self {
+        RpcClient {
+            connections: Default::default(),
+            client_id: Arc::from(""),
+            timeout: None,
+            max_message_size: usize::MAX,
+        }
+    }
+
+    /// Returns the cached connection for `server_node`, connecting first if there is none.
+    pub async fn get_connection(
+        &self,
+        server_node: &ServerNode,
+    ) -> Result<ServerConnection, RpcError> {
+        let server_id = server_node.uid();
+        if let Some(connection) = self.connections.read().get(server_id).cloned() {
+            return Ok(connection);
+        }
+        let new_server = self.connect(server_node).await?;
+        // Another task may have connected meanwhile: keep the first cached connection, drop ours.
+        let mut connections = self.connections.write();
+        let connection = connections.entry(server_id.clone()).or_insert(new_server);
+        Ok(connection.clone())
+    }
+
+    async fn connect(&self, server_node: &ServerNode) -> Result<ServerConnection, RpcError> {
+        let url = server_node.url();
+        let transport = Transport::connect(&url, self.timeout)
+            .await
+            .map_err(|error| ConnectionError(error.to_string()))?;
+        let (limit, client_id) = (self.max_message_size, self.client_id.clone());
+        let messenger = ServerConnectionInner::new(BufStream::new(transport), limit, client_id);
+        Ok(ServerConnection::new(messenger))
+    }
+}
+
+#[derive(Debug)]
+struct Response {
+    #[allow(dead_code)]
+    header: ResponseHeader, // header parsed off the front of the message by the reader task
+    data: Cursor<Vec<u8>>, // the whole message, with the cursor positioned just past the header
+}
+
+#[derive(Debug)]
+struct ActiveRequest {
+    channel: Sender<Result<Response, RpcError>>, // one-shot sender that delivers the response or the failure
+}
+
+#[derive(Debug)]
+enum ConnectionState {
+    /// Currently active requests by request ID.
+    ///
+    /// An active request is one that got prepared or sent but whose response wasn't received yet.
+    RequestMap(HashMap<i32, ActiveRequest>),
+
+    /// One of our streams died and we are unable to process any more requests.
+    Poison(Arc<RpcError>),
+}
+
+impl ConnectionState {
+    /// Switches to the poisoned state and returns the error that is stored in it.
+    ///
+    /// On the first call every pending request is failed with `RpcError::Poisoned` wrapping `err`.
+    /// If the state is already poisoned, `err` is discarded and the stored error is returned.
+    fn poison(&mut self, err: RpcError) -> Arc<RpcError> {
+        let pending = match self {
+            // already poisoned, use the existing error
+            Self::Poison(existing) => return Arc::clone(existing),
+            Self::RequestMap(map) => map,
+        };
+
+        // inform all active requests
+        let err = Arc::new(err);
+        for (_request_id, active_request) in pending.drain() {
+            // it's OK if the other side is gone
+            let notice = Err(RpcError::Poisoned(Arc::clone(&err)));
+            active_request.channel.send(notice).ok();
+        }
+
+        *self = Self::Poison(Arc::clone(&err));
+        err
+    }
+}
+
+#[derive(Debug)]
+pub struct ServerConnectionInner<RW> {
+    /// The half of the stream that we use to send data TO the broker.
+    ///
+    /// This will be used by [`request`](Self::request) to queue up messages.
+    stream_write: Arc<AsyncMutex<WriteHalf<RW>>>,
+    /// Client id copied into the header of every request.
+    client_id: Arc<str>,
+    /// Source of request ids; `request` takes the current value and increments it.
+    request_id: AtomicI32,
+    /// In-flight requests keyed by request id, or the poison marker once the connection has failed.
+    state: Arc<Mutex<ConnectionState>>,
+    /// Handle of the background reader task spawned in `new`; aborted when this value is dropped.
+    join_handle: JoinHandle<()>,
+}
+
+impl<RW> ServerConnectionInner<RW>
+where
+    RW: AsyncRead + AsyncWrite + Send + 'static,
+{
+    pub fn new(stream: RW, max_message_size: usize, client_id: Arc<str>) -> Self {
+        let (stream_read, stream_write) = tokio::io::split(stream);
+        let state = Arc::new(Mutex::new(ConnectionState::RequestMap(HashMap::default())));
+        let state_captured = Arc::clone(&state);
+        // Reader task: owns the read half and routes each incoming message to the request waiting for it.
+        let join_handle = tokio::spawn(async move {
+            let mut stream_read = stream_read;
+            loop {
+                match stream_read.read_message(max_message_size).await {
+                    Ok(msg) => {
+                        // message was read, so all subsequent errors should not poison the whole stream
+                        let mut cursor = Cursor::new(msg);
+                        let header =
+                            match ResponseHeader::read_versioned(&mut cursor, ApiVersion(0)) {
+                                Ok(header) => header,
+                                Err(e) => {
+                                    warn!(%e, "Cannot read message header, ignoring message");
+                                    continue;
+                                }
+                            };
+                        // Look up (and remove) the waiting request; the lock is released at the end of this statement.
+                        let active_request = match state_captured.lock().deref_mut() {
+                            ConnectionState::RequestMap(map) => {
+                                match map.remove(&header.request_id) {
+                                    Some(active_request) => active_request,
+                                    _ => {
+                                        warn!(
+                                            request_id = header.request_id,
+                                            "Got response for unknown request",
+                                        );
+                                        continue;
+                                    }
+                                }
+                            }
+                            ConnectionState::Poison(_) => {
+                                // stream is poisoned, no need to do anything
+                                return;
+                            }
+                        };
+
+                        // we don't care if the other side is gone
+                        active_request
+                            .channel
+                            .send(Ok(Response {
+                                header,
+                                data: cursor,
+                            }))
+                            .ok();
+                    }
+                    Err(e) => {
+                        state_captured.lock().poison(RpcError::ReadMessageError(e));
+                        return;
+                    }
+                }
+            }
+        });
+
+        Self {
+            stream_write: Arc::new(AsyncMutex::new(stream_write)),
+            client_id,
+            request_id: AtomicI32::new(0),
+            state,
+            join_handle,
+        }
+    }
+
+    /// Sends `msg` and waits for the matching response, decoded as `R::ResponseBody`.
+    ///
+    /// Fails if the connection is poisoned, if sending fails (which poisons it), or if decoding the
+    /// body does not consume the whole message (`RpcError::TooMuchData`).
+    pub async fn request<R>(&self, msg: R) -> Result<R::ResponseBody, RpcError>
+    where
+        R: RequestBody + Send + WriteVersionedType<Vec<u8>>,
+        R::ResponseBody: ReadVersionedType<Cursor<Vec<u8>>>,
+    {
+        // Announce and use the version the request type declares rather than a hard-coded 0.
+        let body_api_version = R::REQUEST_VERSION;
+        let header_version = ApiVersion(0);
+        let request_id = self.request_id.fetch_add(1, Ordering::SeqCst);
+        let header = RequestHeader {
+            request_api_key: R::API_KEY,
+            request_api_version: body_api_version,
+            request_id,
+            client_id: Some(String::from(self.client_id.as_ref())),
+        };
+
+        let mut buf = Vec::new();
+        header.write_versioned(&mut buf, header_version)?;
+        msg.write_versioned(&mut buf, body_api_version)?;
+
+        // to prevent stale data in inner state, ensure that we would remove the request again if we are cancelled while
+        // sending the request
+        let (tx, rx) = channel();
+        let cleanup_on_cancel =
+            CleanupRequestStateOnCancel::new(Arc::clone(&self.state), request_id);
+
+        match self.state.lock().deref_mut() {
+            ConnectionState::RequestMap(map) => {
+                map.insert(request_id, ActiveRequest { channel: tx });
+            }
+            ConnectionState::Poison(e) => return Err(RpcError::Poisoned(Arc::clone(e))),
+        }
+
+        self.send_message(buf).await?;
+        cleanup_on_cancel.message_sent();
+        let mut response = rx.await.expect("Who closed this channel?!")?;
+
+        let body = R::ResponseBody::read_versioned(&mut response.data, body_api_version)?;
+
+        let read_bytes = response.data.position();
+        let message_bytes = response.data.into_inner().len() as u64;
+        if read_bytes != message_bytes {
+            return Err(RpcError::TooMuchData {
+                message_size: message_bytes,
+                read: read_bytes,
+                api_key: R::API_KEY,
+                api_version: body_api_version,
+            });
+        }
+        Ok(body)
+    }
+
+    /// Sends `msg` over the write half.
+    /// On failure the connection is poisoned and the stored error is returned as `Poisoned`.
+    async fn send_message(&self, msg: Vec<u8>) -> Result<(), RpcError> {
+        let Err(e) = self.send_message_inner(msg).await else {
+            return Ok(());
+        };
+        // need to poison the stream because message framing might be out-of-sync
+        let poisoned = self.state.lock().poison(e);
+        Err(RpcError::Poisoned(poisoned))
+    }
+
+    async fn send_message_inner(&self, msg: Vec<u8>) -> Result<(), RpcError> {
+        let mut stream_write = Arc::clone(&self.stream_write).lock_owned().await;
+        // The owned guard moves into the future below, so the write half stays locked for as long as that future lives.
+        // use a wrapper so that cancellation doesn't cancel the send operation and leaves half-sent messages on the wire
+        let fut = CancellationSafeFuture::new(async move {
+            stream_write.write_message(&msg).await?;
+            stream_write.flush().await?;
+            Ok(())
+        });
+
+        fut.await
+    }
+}
+
+impl<RW> Drop for ServerConnectionInner<RW> {
+    fn drop(&mut self) {
+        // Stop the background reader task. TODO: should this also remove us from the server_connections map?
+        self.join_handle.abort();
+    }
+}
+
+/// Wrapper that keeps driving the inner future to completion even if the wrapper is dropped early,
+/// so that cancelling the caller cannot leave a half-written message on the wire.
+struct CancellationSafeFuture<F: Future + Send + 'static> {
+    /// Mark if the inner future finished. If not, we must spawn a helper task on drop.
+    done: bool,
+
+    /// Inner future; boxed and pinned so it stays pinned when moved out of this `Option` on drop.
+    inner: Option<BoxFuture<'static, F::Output>>,
+}
+
+impl<F: Future + Send + 'static> Drop for CancellationSafeFuture<F> {
+    fn drop(&mut self) {
+        if self.done {
+            return;
+        }
+        // Not finished yet: let a detached task drive the inner future to completion. Without a
+        // runtime there is nothing to spawn on, so the future is simply dropped.
+        let runtime = tokio::runtime::Handle::try_current();
+        if let (Some(inner), Ok(runtime)) = (self.inner.take(), runtime) {
+            drop(runtime.spawn(async move {
+                inner.await;
+            }));
+        }
+    }
+}
+
+impl<F: Future + Send> CancellationSafeFuture<F> {
+    fn new(fut: F) -> Self {
+        Self {
+            done: false,
+            inner: Some(Box::pin(fut)),
+        }
+    }
+}
+
+impl<F: Future + Send> Future for CancellationSafeFuture<F> {
+    type Output = F::Output;
+
+    fn poll(
+        mut self: std::pin::Pin<&mut Self>,
+        cx: &mut std::task::Context<'_>,
+    ) -> Poll<Self::Output> {
+        let res = std::task::ready!(self.inner.as_mut().expect("no dropped").as_mut().poll(cx));
+        self.done = true;
+        Poll::Ready(res)
+    }
+}
+
+/// Guard that drops a request's entry from the connection state unless the request got sent.
+struct CleanupRequestStateOnCancel {
+    state: Arc<Mutex<ConnectionState>>,
+    request_id: i32,
+    message_sent: bool,
+}
+
+impl CleanupRequestStateOnCancel {
+    /// Arms the guard for `request_id`.
+    /// Call [`message_sent`](Self::message_sent) once the request was sent to disarm it.
+    fn new(state: Arc<Mutex<ConnectionState>>, request_id: i32) -> Self {
+        Self {
+            message_sent: false,
+            request_id,
+            state,
+        }
+    }
+
+    /// Disarms the guard; `self` is consumed and dropped here with the flag already set.
+    fn message_sent(mut self) {
+        self.message_sent = true;
+    }
+}
+
+impl Drop for CleanupRequestStateOnCancel {
+    fn drop(&mut self) {
+        if self.message_sent {
+            return;
+        }
+        if let ConnectionState::RequestMap(map) = self.state.lock().deref_mut() {
+            map.remove(&self.request_id);
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/transport.rs b/fluss-rust/crates/fluss/src/rpc/transport.rs
new file mode 100644
index 0000000000..a6f721f6aa
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/transport.rs
@@ -0,0 +1,83 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::error::RpcError;
+use std::ops::DerefMut;
+use std::pin::Pin;
+use std::task::{Context, Poll};
+use std::time::Duration;
+use tokio::io::{AsyncRead, AsyncWrite, ReadBuf};
+use tokio::net::TcpStream;
+
+#[derive(Debug)]
+pub enum Transport {
+    Plain { inner: TcpStream },
+}
+
+impl AsyncRead for Transport {
+    fn poll_read(
+        mut self: Pin<&mut Self>,
+        cx: &mut Context<'_>,
+        buf: &mut ReadBuf<'_>,
+    ) -> Poll<std::io::Result<()>> {
+        match self.deref_mut() {
+            Self::Plain { inner } => Pin::new(inner).poll_read(cx, buf),
+        }
+    }
+}
+
+impl AsyncWrite for Transport {
+    fn poll_write(
+        mut self: Pin<&mut Self>,
+        cx: &mut Context<'_>,
+        buf: &[u8],
+    ) -> Poll<std::io::Result<usize>> {
+        match self.deref_mut() {
+            Self::Plain { inner } => Pin::new(inner).poll_write(cx, buf),
+        }
+    }
+
+    fn poll_flush(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<std::io::Result<()>> {
+        match self.deref_mut() {
+            Self::Plain { inner } => Pin::new(inner).poll_flush(cx),
+        }
+    }
+
+    fn poll_shutdown(mut self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<std::io::Result<()>> {
+        match self.deref_mut() {
+            Self::Plain { inner } => Pin::new(inner).poll_shutdown(cx),
+        }
+    }
+}
+
+impl Transport {
+    /// Connects to `server` over plain TCP, optionally bounded by `timeout`.
+    pub async fn connect(server: &str, timeout: Option<Duration>) -> Result<Self, RpcError> {
+        let inner = Self::connect_timeout(server, timeout).await?;
+        Ok(Self::Plain { inner })
+    }
+
+    /// Opens the TCP stream to `host`; an elapsed `timeout` becomes a `ConnectionError`.
+    async fn connect_timeout(host: &str, timeout: Option<Duration>) -> Result<TcpStream, RpcError> {
+        let Some(limit) = timeout else {
+            return Ok(TcpStream::connect(host).await?);
+        };
+        let timed_out = || RpcError::ConnectionError(format!("Timeout connecting to host {host}"));
+        let outcome = tokio::time::timeout(limit, TcpStream::connect(host)).await;
+        Ok(outcome.map_err(|_| timed_out())??)
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
new file mode 100644
index 0000000000..c26b4ec43a
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -0,0 +1,176 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::TableBucket;
+use linked_hash_map::LinkedHashMap;
+use std::collections::{HashMap, HashSet};
+use std::hash::Hash;
+use std::sync::Arc;
+use std::time::{SystemTime, UNIX_EPOCH};
+
+/// Milliseconds elapsed since the Unix epoch according to the system clock.
+pub fn current_time_ms() -> i64 {
+    let since_epoch = SystemTime::now().duration_since(UNIX_EPOCH);
+    // Panics only if the system clock reports a time before the epoch.
+    since_epoch.unwrap().as_millis() as i64
+}
+
+pub struct FairBucketStatusMap<S> {
+    map: LinkedHashMap<TableBucket, Arc<S>>,
+    size: usize,
+}
+
+#[allow(dead_code)]
+impl<S> FairBucketStatusMap<S> {
+    pub fn new() -> Self {
+        Self {
+            map: LinkedHashMap::new(),
+            size: 0,
+        }
+    }
+
+    /// Moves the bucket to the end of the iteration order
+    pub fn move_to_end(&mut self, table_bucket: TableBucket)
+    where
+        TableBucket: Eq + Hash,
+    {
+        if let Some(status) = self.map.remove(&table_bucket) {
+            self.map.insert(table_bucket, status);
+        }
+    }
+
+    /// Updates the status and moves the bucket to the end
+    pub fn update_and_move_to_end(&mut self, table_bucket: TableBucket, status: S)
+    where
+        TableBucket: Eq + Hash,
+    {
+        self.map.remove(&table_bucket);
+        self.map.insert(table_bucket, Arc::new(status));
+        self.update_size();
+    }
+
+    /// Updates the status without changing the order (a new bucket is appended at the end)
+    pub fn update(&mut self, table_bucket: TableBucket, status: Arc<S>) {
+        match self.map.get_mut(&table_bucket) {
+            Some(slot) => *slot = status,
+            None => drop(self.map.insert(table_bucket, status)),
+        }
+        self.update_size();
+    }
+
+    /// Removes a bucket
+    pub fn remove(&mut self, table_bucket: &TableBucket)
+    where
+        TableBucket: Eq + Hash,
+    {
+        self.map.remove(table_bucket);
+        self.update_size();
+    }
+
+    /// Collects references to all bucket keys into a new (unordered) `HashSet`
+    pub fn bucket_set(&self) -> HashSet<&TableBucket>
+    where
+        TableBucket: Eq + Hash,
+    {
+        self.map.keys().collect()
+    }
+
+    /// Clears all buckets
+    pub fn clear(&mut self) {
+        self.map.clear();
+        self.update_size();
+    }
+
+    /// Checks if a bucket exists
+    pub fn contains(&self, table_bucket: &TableBucket) -> bool
+    where
+        TableBucket: Eq + Hash,
+    {
+        self.map.contains_key(table_bucket)
+    }
+
+    /// Returns an immutable view of the bucket-status map
+    pub fn bucket_status_map(&self) -> &LinkedHashMap<TableBucket, Arc<S>> {
+        &self.map
+    }
+
+    /// Returns status values in current order
+    pub fn bucket_status_values(&self) -> Vec<&Arc<S>> {
+        self.map.values().collect()
+    }
+
+    /// Gets the status for a bucket
+    pub fn status_value(&self, table_bucket: &TableBucket) -> Option<&Arc<S>>
+    where
+        TableBucket: Eq + Hash,
+    {
+        self.map.get(table_bucket)
+    }
+
+    /// Applies a function to each bucket-status pair
+    pub fn for_each<F>(&self, mut f: F)
+    where
+        F: FnMut(&TableBucket, &S),
+    {
+        for (bucket, status) in &self.map {
+            f(bucket, status);
+        }
+    }
+
+    /// Returns the bucket count cached in `size` (kept in sync by `update_size`)
+    pub fn size(&self) -> usize {
+        self.size
+    }
+
+    /// Replaces all entries with `bucket_to_status`, inserting buckets grouped by table ID
+    pub fn set(&mut self, bucket_to_status: HashMap<TableBucket, Arc<S>>)
+    where
+        TableBucket: Eq + Hash + Clone,
+        S: Clone,
+    {
+        self.map.clear();
+        // Group bucket keys by table ID, keeping tables in first-seen order
+        let mut table_to_buckets: LinkedHashMap<i64, Vec<TableBucket>> = LinkedHashMap::new();
+        for bucket in bucket_to_status.keys() {
+            table_to_buckets
+                .entry(bucket.table_id())
+                .or_default()
+                .push(bucket.clone());
+        }
+
+        // Insert table by table so buckets of the same table end up adjacent
+        for (_, buckets) in table_to_buckets {
+            for bucket in buckets {
+                if let Some(status) = bucket_to_status.get(&bucket) {
+                    self.map.insert(bucket, status.clone());
+                }
+            }
+        }
+
+        self.update_size();
+    }
+
+    fn update_size(&mut self) {
+        self.size = self.map.len()
+    }
+}
+
+impl<S> Default for FairBucketStatusMap<S> {
+    fn default() -> Self {
+        Self::new()
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/integration/client/mod.rs b/fluss-rust/crates/fluss/tests/integration/client/mod.rs
new file mode 100644
index 0000000000..567c358cea
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/client/mod.rs
@@ -0,0 +1,21 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#[test]
+fn test() {
+    println!("Running integration tests");
+}
diff --git a/fluss-rust/crates/fluss/tests/test_fluss.rs b/fluss-rust/crates/fluss/tests/test_fluss.rs
new file mode 100644
index 0000000000..7840638c74
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/test_fluss.rs
@@ -0,0 +1,25 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#[cfg(feature = "integration_tests")]
+extern crate fluss;
+
+#[cfg(feature = "integration_tests")]
+mod integration {
+
+    mod client;
+}
diff --git a/fluss-rust/rust-toolchain.toml b/fluss-rust/rust-toolchain.toml
new file mode 100644
index 0000000000..56c3bf5df8
--- /dev/null
+++ b/fluss-rust/rust-toolchain.toml
@@ -0,0 +1,20 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[toolchain]
+channel = "stable"
+components = ["rustfmt", "clippy"]
\ No newline at end of file
diff --git a/fluss-rust/rustfmt.toml b/fluss-rust/rustfmt.toml
new file mode 100644
index 0000000000..18d114826f
--- /dev/null
+++ b/fluss-rust/rustfmt.toml
@@ -0,0 +1,19 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+edition = "2024"
+reorder_imports = true
\ No newline at end of file

From 40cfb79e6457ea05040b834745869e1cf98638df Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Tue, 26 Aug 2025 21:13:43 +0800
Subject: [PATCH 005/287] [hotfix] Ignore some file license check (#4)

---
 fluss-rust/.licenserc.yaml | 29 +++++++++++++++++++++++++++++
 1 file changed, 29 insertions(+)
 create mode 100644 fluss-rust/.licenserc.yaml

diff --git a/fluss-rust/.licenserc.yaml b/fluss-rust/.licenserc.yaml
new file mode 100644
index 0000000000..3813b484b3
--- /dev/null
+++ b/fluss-rust/.licenserc.yaml
@@ -0,0 +1,29 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+header:
+  license:
+    spdx-id: Apache-2.0
+    copyright-owner: Apache Software Foundation
+
+  paths-ignore:
+    - '.github/PULL_REQUEST_TEMPLATE.md'
+    - '.gitignore'
+    - 'LICENSE'
+    - 'NOTICE'
+    - 'DISCLAIMER'
+  comment: on-failure

From 69b0ead1a31bb3f7f06fea895f48aed583e5b382 Mon Sep 17 00:00:00 2001
From: naivedogger <59598718+naivedogger@users.noreply.github.com>
Date: Thu, 11 Sep 2025 16:25:12 +0800
Subject: [PATCH 006/287] [feat] Add more functions to the Rust client Admin
 (#5)

---
 .../{dependabot.yml  => dependabot.yml}       |   0
 fluss-rust/crates/fluss/src/client/admin.rs   | 133 +++++++++-
 fluss-rust/crates/fluss/src/client/mod.rs     |   6 +-
 .../crates/fluss/src/client/table/mod.rs      |   5 +-
 .../fluss/src/client/write/accumulator.rs     |   6 +-
 .../crates/fluss/src/cluster/cluster.rs       |   1 +
 .../crates/fluss/src/metadata/database.rs     | 234 ++++++++++++++++++
 .../crates/fluss/src/metadata/datatype.rs     |  12 +
 fluss-rust/crates/fluss/src/metadata/mod.rs   |   4 +-
 fluss-rust/crates/fluss/src/metadata/table.rs |  65 +++++
 .../crates/fluss/src/proto/fluss_api.proto    |  83 +++++++
 fluss-rust/crates/fluss/src/record/arrow.rs   |   7 +-
 fluss-rust/crates/fluss/src/row/datum.rs      | 103 +++++---
 fluss-rust/crates/fluss/src/row/mod.rs        |   3 +-
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |  39 ++-
 .../fluss/src/rpc/message/create_database.rs  |  67 +++++
 .../fluss/src/rpc/message/database_exists.rs  |  49 ++++
 .../fluss/src/rpc/message/drop_database.rs    |  51 ++++
 .../fluss/src/rpc/message/drop_table.rs       |  56 +++++
 .../src/rpc/message/get_database_info.rs      |  49 ++++
 .../rpc/message/get_latest_lake_snapshot.rs   |  55 ++++
 .../fluss/src/rpc/message/list_databases.rs   |  47 ++++
 .../fluss/src/rpc/message/list_tables.rs      |  53 ++++
 .../crates/fluss/src/rpc/message/mod.rs       |  18 ++
 .../fluss/src/rpc/message/table_exists.rs     |  55 ++++
 .../crates/fluss/src/rpc/server_connection.rs |   1 -
 26 files changed, 1144 insertions(+), 58 deletions(-)
 rename fluss-rust/.github/{dependabot.yml  => dependabot.yml} (100%)
 create mode 100644 fluss-rust/crates/fluss/src/metadata/database.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/create_database.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/database_exists.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/drop_database.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/drop_table.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/list_tables.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/table_exists.rs

diff --git a/fluss-rust/.github/dependabot.yml  b/fluss-rust/.github/dependabot.yml
similarity index 100%
rename from fluss-rust/.github/dependabot.yml 
rename to fluss-rust/.github/dependabot.yml
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 8688a2d844..2584034a69 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -16,18 +16,28 @@
 // under the License.
 
 use crate::client::metadata::Metadata;
-use crate::metadata::{JsonSerde, TableDescriptor, TableInfo, TablePath};
-use crate::rpc::message::{CreateTableRequest, GetTableRequest};
+use crate::metadata::{
+    DatabaseDescriptor, DatabaseInfo, JsonSerde, LakeSnapshot, TableBucket, TableDescriptor,
+    TableInfo, TablePath,
+};
+use crate::rpc::message::{
+    CreateDatabaseRequest, CreateTableRequest, DatabaseExistsRequest, DropDatabaseRequest,
+    DropTableRequest, GetDatabaseInfoRequest, GetLatestLakeSnapshotRequest, GetTableRequest,
+    ListDatabasesRequest, ListTablesRequest, TableExistsRequest,
+};
 use crate::rpc::{RpcClient, ServerConnection};
+
+use std::collections::HashMap;
 use std::sync::Arc;
 
 use crate::error::Result;
 use crate::proto::GetTableInfoResponse;
 
-#[allow(dead_code)]
 pub struct FlussAdmin {
     admin_gateway: ServerConnection,
+    #[allow(dead_code)]
     metadata: Arc<Metadata>,
+    #[allow(dead_code)]
     rpc_client: Arc<RpcClient>,
 }
 
@@ -49,6 +59,23 @@ impl FlussAdmin {
         })
     }
 
+    pub async fn create_database(
+        &self,
+        database_name: &str,
+        ignore_if_exists: bool,
+        database_descriptor: Option<&DatabaseDescriptor>,
+    ) -> Result<()> {
+        let _response = self
+            .admin_gateway
+            .request(CreateDatabaseRequest::new(
+                database_name,
+                ignore_if_exists,
+                database_descriptor,
+            )?)
+            .await?;
+        Ok(())
+    }
+
     pub async fn create_table(
         &self,
         table_path: &TablePath,
@@ -66,6 +93,14 @@ impl FlussAdmin {
         Ok(())
     }
 
+    pub async fn drop_table(&self, table_path: &TablePath, ignore_if_exists: bool) -> Result<()> {
+        let _response = self
+            .admin_gateway
+            .request(DropTableRequest::new(table_path, ignore_if_exists))
+            .await?;
+        Ok(())
+    }
+
     pub async fn get_table(&self, table_path: &TablePath) -> Result<TableInfo> {
         let response = self
             .admin_gateway
@@ -90,4 +125,96 @@ impl FlussAdmin {
             modified_time,
         ))
     }
+
+    /// List all tables in the given database
+    pub async fn list_tables(&self, database_name: &str) -> Result<Vec<String>> {
+        let response = self
+            .admin_gateway
+            .request(ListTablesRequest::new(database_name))
+            .await?;
+        Ok(response.table_name)
+    }
+
+    /// Check if a table exists
+    pub async fn table_exists(&self, table_path: &TablePath) -> Result<bool> {
+        let response = self
+            .admin_gateway
+            .request(TableExistsRequest::new(table_path))
+            .await?;
+        Ok(response.exists)
+    }
+
+    /// Drop a database
+    pub async fn drop_database(
+        &self,
+        database_name: &str,
+        ignore_if_not_exists: bool,
+        cascade: bool,
+    ) -> Result<()> {
+        let _response = self
+            .admin_gateway
+            .request(DropDatabaseRequest::new(
+                database_name,
+                ignore_if_not_exists,
+                cascade,
+            ))
+            .await?;
+        Ok(())
+    }
+
+    /// List all databases
+    pub async fn list_databases(&self) -> Result<Vec<String>> {
+        let response = self
+            .admin_gateway
+            .request(ListDatabasesRequest::new())
+            .await?;
+        Ok(response.database_name)
+    }
+
+    /// Check if a database exists
+    pub async fn database_exists(&self, database_name: &str) -> Result<bool> {
+        let response = self
+            .admin_gateway
+            .request(DatabaseExistsRequest::new(database_name))
+            .await?;
+        Ok(response.exists)
+    }
+
+    /// Get database information
+    pub async fn get_database_info(&self, database_name: &str) -> Result<DatabaseInfo> {
+        let request = GetDatabaseInfoRequest::new(database_name);
+        let response = self.admin_gateway.request(request).await?;
+
+        // Convert proto response to DatabaseInfo
+        let database_descriptor = DatabaseDescriptor::from_json_bytes(&response.database_json)?;
+
+        Ok(DatabaseInfo::new(
+            database_name.to_string(),
+            database_descriptor,
+            response.created_time,
+            response.modified_time,
+        ))
+    }
+
+    /// Get the latest lake snapshot for a table
+    pub async fn get_latest_lake_snapshot(&self, table_path: &TablePath) -> Result<LakeSnapshot> {
+        let response = self
+            .admin_gateway
+            .request(GetLatestLakeSnapshotRequest::new(table_path))
+            .await?;
+
+        // Convert proto response to LakeSnapshot
+        let mut table_buckets_offset = HashMap::new();
+        for bucket_snapshot in response.bucket_snapshots {
+            let table_bucket = TableBucket::new(response.table_id, bucket_snapshot.bucket_id);
+            if let Some(log_offset) = bucket_snapshot.log_offset {
+                table_buckets_offset.insert(table_bucket, log_offset);
+            }
+        }
+
+        Ok(LakeSnapshot::new(
+            response.snapshot_id,
+            table_buckets_offset,
+        ))
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/client/mod.rs b/fluss-rust/crates/fluss/src/client/mod.rs
index 5b6908eec1..a971439258 100644
--- a/fluss-rust/crates/fluss/src/client/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/mod.rs
@@ -17,10 +17,12 @@
 
 mod admin;
 mod connection;
+mod metadata;
 mod table;
 mod write;
 
+pub use admin::*;
 pub use connection::*;
-mod metadata;
-
+pub use metadata::*;
+pub use table::*;
 pub use write::*;
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 503a1edb39..4d6f8f045b 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -17,8 +17,6 @@
 
 use crate::client::connection::FlussConnection;
 use crate::client::metadata::Metadata;
-use crate::client::table::append::TableAppend;
-use crate::client::table::scanner::TableScan;
 use crate::metadata::{TableInfo, TablePath};
 use std::sync::Arc;
 
@@ -29,6 +27,9 @@ mod append;
 mod scanner;
 mod writer;
 
+pub use append::TableAppend;
+pub use scanner::TableScan;
+
 #[allow(dead_code)]
 pub struct FlussTable<'a> {
     conn: &'a FlussConnection,
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 0b77894025..32622c7b2d 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -93,13 +93,15 @@ impl RecordAccumulator {
         }
 
         let table_path = &record.table_path;
-
+        let table_info = cluster.get_table(table_path);
         let row_type = &cluster.get_table(table_path).row_type;
 
+        let schema_id = table_info.schema_id;
+
         let mut batch = ArrowLog(ArrowLogWriteBatch::new(
             self.batch_id.fetch_add(1, Ordering::Relaxed),
             table_path.as_ref().clone(),
-            0,
+            schema_id,
             row_type,
             bucket_id,
             current_time_ms(),
diff --git a/fluss-rust/crates/fluss/src/cluster/cluster.rs b/fluss-rust/crates/fluss/src/cluster/cluster.rs
index 1f8341dd66..a6f20a8262 100644
--- a/fluss-rust/crates/fluss/src/cluster/cluster.rs
+++ b/fluss-rust/crates/fluss/src/cluster/cluster.rs
@@ -126,6 +126,7 @@ impl Cluster {
                 table_metadata.modified_time,
             );
             table_info_by_path.insert(table_path.clone(), table_info);
+            table_id_by_path.insert(table_path.clone(), table_id);
 
             // now, get bucket matadata
             let mut found_unavailable_bucket = false;
diff --git a/fluss-rust/crates/fluss/src/metadata/database.rs b/fluss-rust/crates/fluss/src/metadata/database.rs
new file mode 100644
index 0000000000..2649421d6f
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/metadata/database.rs
@@ -0,0 +1,234 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Error::JsonSerdeError;
+use crate::error::Result;
+use crate::metadata::JsonSerde;
+use serde::{Deserialize, Serialize};
+use serde_json::{Value, json};
+use std::collections::HashMap;
+
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+pub struct DatabaseDescriptor {
+    comment: Option<String>,
+    custom_properties: HashMap<String, String>,
+}
+
+#[derive(Debug, Clone)]
+pub struct DatabaseInfo {
+    database_name: String,
+    database_descriptor: DatabaseDescriptor,
+    created_time: i64,
+    modified_time: i64,
+}
+
+impl DatabaseInfo {
+    pub fn new(
+        database_name: String,
+        database_descriptor: DatabaseDescriptor,
+        created_time: i64,
+        modified_time: i64,
+    ) -> Self {
+        Self {
+            database_name,
+            database_descriptor,
+            created_time,
+            modified_time,
+        }
+    }
+
+    pub fn database_name(&self) -> &str {
+        &self.database_name
+    }
+
+    pub fn database_descriptor(&self) -> &DatabaseDescriptor {
+        &self.database_descriptor
+    }
+
+    pub fn created_time(&self) -> i64 {
+        self.created_time
+    }
+
+    pub fn modified_time(&self) -> i64 {
+        self.modified_time
+    }
+}
+
+#[derive(Debug, Default)]
+pub struct DatabaseDescriptorBuilder {
+    comment: Option<String>,
+    custom_properties: HashMap<String, String>,
+}
+
+impl DatabaseDescriptor {
+    pub fn builder() -> DatabaseDescriptorBuilder {
+        DatabaseDescriptorBuilder::default()
+    }
+
+    pub fn comment(&self) -> Option<&str> {
+        self.comment.as_deref()
+    }
+
+    pub fn custom_properties(&self) -> &HashMap<String, String> {
+        &self.custom_properties
+    }
+}
+
+impl DatabaseDescriptorBuilder {
+    pub fn comment(mut self, comment: &str) -> Self {
+        self.comment = Some(comment.to_string());
+        self
+    }
+
+    pub fn custom_properties(mut self, properties: HashMap<String, String>) -> Self {
+        self.custom_properties = properties;
+        self
+    }
+
+    pub fn custom_property(mut self, key: &str, value: &str) -> Self {
+        self.custom_properties
+            .insert(key.to_string(), value.to_string());
+        self
+    }
+
+    pub fn build(self) -> Result<DatabaseDescriptor> {
+        Ok(DatabaseDescriptor {
+            comment: self.comment,
+            custom_properties: self.custom_properties,
+        })
+    }
+}
+
+impl DatabaseDescriptor {
+    const CUSTOM_PROPERTIES_NAME: &'static str = "custom_properties";
+    const COMMENT_NAME: &'static str = "comment";
+    const VERSION_KEY: &'static str = "version";
+    const VERSION: u32 = 1;
+}
+
+impl JsonSerde for DatabaseDescriptor {
+    fn serialize_json(&self) -> Result<Value> {
+        let mut obj = serde_json::Map::new();
+
+        // Serialize version
+        obj.insert(Self::VERSION_KEY.to_string(), json!(Self::VERSION));
+
+        // Serialize comment if present
+        if let Some(comment) = self.comment() {
+            obj.insert(Self::COMMENT_NAME.to_string(), json!(comment));
+        }
+
+        // Serialize custom properties
+        obj.insert(
+            Self::CUSTOM_PROPERTIES_NAME.to_string(),
+            json!(self.custom_properties()),
+        );
+
+        Ok(Value::Object(obj))
+    }
+
+    fn deserialize_json(node: &Value) -> Result<Self> {
+        let mut builder = DatabaseDescriptor::builder();
+
+        // Deserialize comment if present
+        if let Some(comment_node) = node.get(Self::COMMENT_NAME) {
+            let comment = comment_node
+                .as_str()
+                .ok_or_else(|| {
+                    JsonSerdeError(format!("{} should be a string", Self::COMMENT_NAME))
+                })?
+                .to_owned();
+            builder = builder.comment(&comment);
+        }
+
+        // Deserialize custom properties directly
+        let custom_properties = if let Some(props_node) = node.get(Self::CUSTOM_PROPERTIES_NAME) {
+            let obj = props_node.as_object().ok_or_else(|| {
+                JsonSerdeError("Custom properties should be an object".to_string())
+            })?;
+
+            let mut properties = HashMap::with_capacity(obj.len());
+            for (key, value) in obj {
+                properties.insert(
+                    key.clone(),
+                    value
+                        .as_str()
+                        .ok_or_else(|| {
+                            JsonSerdeError("Property value should be a string".to_string())
+                        })?
+                        .to_owned(),
+                );
+            }
+            properties
+        } else {
+            HashMap::new()
+        };
+        builder = builder.custom_properties(custom_properties);
+
+        builder.build()
+    }
+}
+
+impl DatabaseDescriptor {
+    /// Create DatabaseDescriptor from JSON bytes (equivalent to Java's fromJsonBytes)
+    pub fn from_json_bytes(bytes: &[u8]) -> Result<Self> {
+        let json_value: Value = serde_json::from_slice(bytes)
+            .map_err(|e| JsonSerdeError(format!("Failed to parse JSON: {}", e)))?;
+        Self::deserialize_json(&json_value)
+    }
+
+    /// Convert DatabaseDescriptor to JSON bytes
+    pub fn to_json_bytes(&self) -> Result<Vec<u8>> {
+        let json_value = self.serialize_json()?;
+        serde_json::to_vec(&json_value)
+            .map_err(|e| JsonSerdeError(format!("Failed to serialize to JSON: {}", e)))
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_database_descriptor_json_serde() {
+        let mut custom_props = HashMap::new();
+        custom_props.insert("key1".to_string(), "value1".to_string());
+        custom_props.insert("key2".to_string(), "value2".to_string());
+
+        let descriptor = DatabaseDescriptor::builder()
+            .comment("Test database")
+            .custom_properties(custom_props)
+            .build()
+            .unwrap();
+
+        // Test serialization
+        let json_bytes = descriptor.to_json_bytes().unwrap();
+        println!("Serialized JSON: {}", String::from_utf8_lossy(&json_bytes));
+
+        // Test deserialization
+        let deserialized = DatabaseDescriptor::from_json_bytes(&json_bytes).unwrap();
+        assert_eq!(descriptor, deserialized);
+    }
+
+    #[test]
+    fn test_empty_database_descriptor() {
+        let descriptor = DatabaseDescriptor::builder().build().unwrap();
+        let json_bytes = descriptor.to_json_bytes().unwrap();
+        let deserialized = DatabaseDescriptor::from_json_bytes(&json_bytes).unwrap();
+        assert_eq!(descriptor, deserialized);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 0c00c6f08e..09ca0c2c57 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -591,6 +591,10 @@ impl ArrayType {
             element_type: self.element_type.clone(),
         }
     }
+
+    pub fn get_element_type(&self) -> &DataType {
+        &self.element_type
+    }
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Deserialize, Serialize, Hash)]
@@ -620,6 +624,14 @@ impl MapType {
             value_type: self.value_type.clone(),
         }
     }
+
+    pub fn key_type(&self) -> &DataType {
+        &self.key_type
+    }
+
+    pub fn value_type(&self) -> &DataType {
+        &self.value_type
+    }
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Deserialize, Serialize, Hash)]
diff --git a/fluss-rust/crates/fluss/src/metadata/mod.rs b/fluss-rust/crates/fluss/src/metadata/mod.rs
index 79465474f7..87540071f3 100644
--- a/fluss-rust/crates/fluss/src/metadata/mod.rs
+++ b/fluss-rust/crates/fluss/src/metadata/mod.rs
@@ -15,10 +15,12 @@
 // specific language governing permissions and limitations
 // under the License.
 
+mod database;
 mod datatype;
-pub use datatype::*;
 mod json_serde;
 mod table;
 
+pub use database::*;
+pub use datatype::*;
 pub use json_serde::*;
 pub use table::*;
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index a5ab61d67e..90e3573eb8 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -584,6 +584,16 @@ impl Display for LogFormat {
     }
 }
 
+impl LogFormat {
+    pub fn parse(s: &str) -> Result<Self> {
+        Ok(match s.to_uppercase().as_str() {
+            "ARROW" => Self::ARROW,
+            "INDEXED" => Self::INDEXED,
+            _ => return Err(InvalidTableError(format!("Unknown log format: {}", s))),
+        })
+    }
+}
+
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
 pub enum KvFormat {
     INDEXED,
@@ -600,6 +610,16 @@ impl Display for KvFormat {
     }
 }
 
+impl KvFormat {
+    pub fn parse(s: &str) -> Result<Self> {
+        Ok(match s.to_uppercase().as_str() {
+            "INDEXED" => Self::INDEXED,
+            "COMPACTED" => Self::COMPACTED,
+            _ => return Err(InvalidTableError(format!("Unknown kv format: {}", s))),
+        })
+    }
+}
+
 #[derive(Debug, PartialEq, Eq, Hash, Clone, Serialize, Deserialize)]
 pub struct TablePath {
     database: String,
@@ -631,6 +651,28 @@ impl TablePath {
     }
 }
 
+/// Path of a physical table: a `TablePath` plus an optional partition.
+#[derive(Debug, Clone)]
+pub struct PhysicalTablePath {
+    table_path: TablePath,
+    #[allow(dead_code)]
+    partition: Option<String>,
+}
+
+impl PhysicalTablePath {
+    // TODO: support partition (`of` always leaves `partition` as `None`)
+    pub fn of(table_path: TablePath) -> Self {
+        Self {
+            table_path,
+            partition: None,
+        }
+    }
+
+    pub fn get_table_path(&self) -> &TablePath {
+        &self.table_path
+    }
+}
+
 #[derive(Debug, Clone)]
 pub struct TableInfo {
     pub table_path: TablePath,
@@ -918,3 +960,26 @@ impl TableBucket {
         self.partition_id
     }
 }
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
+pub struct LakeSnapshot {
+    pub snapshot_id: i64,
+    pub table_buckets_offset: HashMap<TableBucket, i64>,
+}
+
+impl LakeSnapshot {
+    pub fn new(snapshot_id: i64, table_buckets_offset: HashMap<TableBucket, i64>) -> Self {
+        Self {
+            snapshot_id,
+            table_buckets_offset,
+        }
+    }
+
+    pub fn snapshot_id(&self) -> i64 {
+        self.snapshot_id
+    }
+
+    pub fn table_buckets_offset(&self) -> &HashMap<TableBucket, i64> {
+        &self.table_buckets_offset
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index 195b8f824c..d71197b2b0 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -123,6 +123,21 @@ message CreateTableRequest {
 message CreateTableResponse {
 }
 
+message DropTableRequest {
+  required PbTablePath table_path = 1;
+  required bool ignore_if_not_exists = 2;
+}
+
+message DropTableResponse {
+}
+
+message TableExistsRequest {
+  required PbTablePath table_path = 1;
+}
+
+message TableExistsResponse {
+  required bool exists = 1;
+}
 
 message GetTableInfoRequest {
   required PbTablePath table_path = 1;
@@ -136,6 +151,57 @@ message GetTableInfoResponse {
   required int64 modified_time = 5;
 }
 
+message ListTablesRequest {
+  required string database_name = 1;
+}
+
+message ListTablesResponse {
+  repeated string table_name = 1;
+}
+
+message CreateDatabaseRequest {
+  required string database_name = 1;
+  required bool ignore_if_exists = 2;
+  optional bytes database_json = 3;
+}
+
+message CreateDatabaseResponse {
+}
+
+message GetDatabaseInfoRequest {
+  required string database_name = 1;
+}
+
+message GetDatabaseInfoResponse {
+  required bytes database_json = 3;
+  required int64 created_time = 4;
+  required int64 modified_time = 5;
+}
+
+message DropDatabaseRequest {
+  required string database_name = 1;
+  required bool ignore_if_not_exists = 2;
+  required bool cascade = 3;
+}
+
+message DropDatabaseResponse {
+}
+
+message DatabaseExistsRequest {
+  required string database_name = 1;
+}
+
+message DatabaseExistsResponse {
+  required bool exists = 1;
+}
+
+message ListDatabasesRequest {
+}
+
+message ListDatabasesResponse {
+  repeated string database_name = 1;
+}
+
 
 // fetch log request and response
 message FetchLogRequest {
@@ -194,4 +260,21 @@ message PbRemoteLogSegment {
   required int64 remote_log_start_offset = 2;
   required int64 remote_log_end_offset = 3;
   required int32 segment_size_in_bytes = 4;
+}
+
+// fetch latest lake snapshot
+message GetLatestLakeSnapshotRequest {
+  required PbTablePath table_path = 1;
+}
+
+message GetLatestLakeSnapshotResponse {
+  required int64 table_id = 1;
+  required int64 snapshot_id = 2;
+  repeated PbLakeSnapshotForBucket bucket_snapshots = 3;
+}
+
+message PbLakeSnapshotForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  optional int64 log_offset = 3;
 }
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 2f595d0304..fa63b00603 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -16,9 +16,9 @@
 // under the License.
 
 use arrow::array::{
-    ArrayBuilder, ArrayRef, BooleanBuilder, Float32Builder, Float64Builder, Int8Builder,
-    Int16Builder, Int32Builder, Int64Builder, StringBuilder, UInt8Builder, UInt16Builder,
-    UInt32Builder, UInt64Builder,
+    ArrayBuilder, ArrayRef, BinaryBuilder, BooleanBuilder, Float32Builder, Float64Builder,
+    Int8Builder, Int16Builder, Int32Builder, Int64Builder, StringBuilder, UInt8Builder,
+    UInt16Builder, UInt32Builder, UInt64Builder,
 };
 use arrow::{
     array::RecordBatch,
@@ -224,6 +224,7 @@ impl MemoryLogRecordsArrowBuilder {
             arrow_schema::DataType::Float64 => Box::new(Float64Builder::new()),
             arrow_schema::DataType::Boolean => Box::new(BooleanBuilder::new()),
             arrow_schema::DataType::Utf8 => Box::new(StringBuilder::new()),
+            arrow_schema::DataType::Binary => Box::new(BinaryBuilder::new()),
             dt => panic!("Unsupported data type: {dt:?}"),
         }
     }
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 3c65a7d4ee..d8c4f748ca 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -19,7 +19,10 @@ use chrono::Datelike;
 
 use crate::error::Error::RowConvertError;
 use crate::error::Result;
-use arrow::array::{ArrayBuilder, Int8Builder, Int16Builder, Int32Builder, StringBuilder};
+use arrow::array::{
+    ArrayBuilder, BinaryBuilder, BooleanBuilder, Float32Builder, Float64Builder, Int8Builder,
+    Int16Builder, Int32Builder, Int64Builder, StringBuilder,
+};
 use chrono::NaiveDate;
 use ordered_float::OrderedFloat;
 use parse_display::Display;
@@ -47,6 +50,8 @@ pub enum Datum<'a> {
     #[display("{0}")]
     Int64(i64),
     #[display("{0}")]
+    Float32(F32),
+    #[display("{0}")]
     Float64(F64),
     #[display("'{0}'")]
     String(&'a str),
@@ -96,6 +101,20 @@ impl From<Option<&()>> for Datum<'_> {
     }
 }
 
+impl<'a> From<f32> for Datum<'a> {
+    #[inline]
+    fn from(f: f32) -> Datum<'a> {
+        Datum::Float32(F32::from(f))
+    }
+}
+
+impl<'a> From<f64> for Datum<'a> {
+    #[inline]
+    fn from(f: f64) -> Datum<'a> {
+        Datum::Float64(F64::from(f))
+    }
+}
+
 impl TryFrom<&Datum<'_>> for i32 {
     type Error = ();
 
@@ -126,45 +145,56 @@ pub trait ToArrow {
 
 impl Datum<'_> {
     pub fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()> {
+        macro_rules! append_null_to_arrow {
+            ($builder_type:ty) => {
+                if let Some(b) = builder.as_any_mut().downcast_mut::<$builder_type>() {
+                    b.append_null();
+                    return Ok(());
+                }
+            };
+        }
+
+        macro_rules! append_value_to_arrow {
+            ($builder_type:ty, $value:expr) => {
+                if let Some(b) = builder.as_any_mut().downcast_mut::<$builder_type>() {
+                    b.append_value($value);
+                    return Ok(());
+                }
+            };
+        }
+
         match self {
             Datum::Null => {
-                todo!()
-            }
-            Datum::Bool(_v) => {
-                todo!()
-            }
-            Datum::Int16(_v) => {
-                todo!()
-            }
-            Datum::Int32(v) => {
-                v.append_to(builder)?;
-            }
-            Datum::Int64(_v) => {
-                todo!()
-            }
-            Datum::Float64(_v) => {
-                todo!()
-            }
-            Datum::String(v) => {
-                v.append_to(builder)?;
+                append_null_to_arrow!(BooleanBuilder);
+                append_null_to_arrow!(Int16Builder);
+                append_null_to_arrow!(Int32Builder);
+                append_null_to_arrow!(Int64Builder);
+                append_null_to_arrow!(Float32Builder);
+                append_null_to_arrow!(Float64Builder);
+                append_null_to_arrow!(StringBuilder);
+                append_null_to_arrow!(BinaryBuilder);
             }
-            Datum::Blob(_v) => {
-                todo!()
-            }
-            Datum::Decimal(_v) => {
-                todo!()
-            }
-            Datum::Date(_v) => {
-                todo!()
-            }
-            Datum::Timestamp(_v) => {
-                todo!()
-            }
-            Datum::TimestampTz(_v) => {
-                todo!()
+            Datum::Bool(v) => append_value_to_arrow!(BooleanBuilder, *v),
+            Datum::Int16(v) => append_value_to_arrow!(Int16Builder, *v),
+            Datum::Int32(v) => append_value_to_arrow!(Int32Builder, *v),
+            Datum::Int64(v) => append_value_to_arrow!(Int64Builder, *v),
+            Datum::Float32(v) => append_value_to_arrow!(Float32Builder, v.into_inner()),
+            Datum::Float64(v) => append_value_to_arrow!(Float64Builder, v.into_inner()),
+            Datum::String(v) => append_value_to_arrow!(StringBuilder, *v),
+            Datum::Blob(v) => append_value_to_arrow!(BinaryBuilder, v.as_ref()),
+            Datum::Decimal(_) | Datum::Date(_) | Datum::Timestamp(_) | Datum::TimestampTz(_) => {
+                return Err(RowConvertError(format!(
+                    "Type {:?} is not yet supported for Arrow conversion",
+                    self
+                )));
             }
         }
-        Ok(())
+
+        Err(RowConvertError(format!(
+            "Cannot append {:?} to builder of type {}",
+            self,
+            std::any::type_name_of_val(builder)
+        )))
     }
 }
 
@@ -190,9 +220,10 @@ macro_rules! impl_to_arrow {
 impl_to_arrow!(i8, Int8Builder);
 impl_to_arrow!(i16, Int16Builder);
 impl_to_arrow!(i32, Int32Builder);
+impl_to_arrow!(f32, Float32Builder);
+impl_to_arrow!(f64, Float64Builder);
 impl_to_arrow!(&str, StringBuilder);
 
-#[allow(dead_code)]
 pub type F32 = OrderedFloat<f32>;
 pub type F64 = OrderedFloat<f64>;
 #[allow(dead_code)]
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index ead6ff0067..b900cb51d5 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -15,13 +15,12 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::row::datum::Datum;
-
 mod column;
 
 mod datum;
 
 pub use column::*;
+pub use datum::*;
 
 pub trait InternalRow {
     /// Returns the number of fields in this row
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index 49282084ef..18ce44fbef 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -19,22 +19,40 @@ use crate::rpc::api_key::ApiKey::Unknown;
 
 #[derive(Debug, PartialEq, Eq, PartialOrd, Ord, Hash, Clone, Copy)]
 pub enum ApiKey {
+    CreateDatabase,
+    DropDatabase,
+    ListDatabases,
+    DatabaseExists,
     CreateTable,
+    DropTable,
+    GetTable,
+    ListTables,
+    TableExists,
+    MetaData,
     ProduceLog,
     FetchLog,
-    MetaData,
-    GetTable,
+    GetDatabaseInfo,
+    GetLatestLakeSnapshot,
     Unknown(i16),
 }
 
 impl From<i16> for ApiKey {
     fn from(key: i16) -> Self {
         match key {
+            1001 => ApiKey::CreateDatabase,
+            1002 => ApiKey::DropDatabase,
+            1003 => ApiKey::ListDatabases,
+            1004 => ApiKey::DatabaseExists,
             1005 => ApiKey::CreateTable,
+            1006 => ApiKey::DropTable,
+            1007 => ApiKey::GetTable,
+            1008 => ApiKey::ListTables,
+            1010 => ApiKey::TableExists,
+            1012 => ApiKey::MetaData,
             1014 => ApiKey::ProduceLog,
             1015 => ApiKey::FetchLog,
-            1012 => ApiKey::MetaData,
-            1007 => ApiKey::GetTable,
+            1032 => ApiKey::GetLatestLakeSnapshot,
+            1035 => ApiKey::GetDatabaseInfo,
             _ => Unknown(key),
         }
     }
@@ -43,11 +61,20 @@ impl From<i16> for ApiKey {
 impl From<ApiKey> for i16 {
     fn from(key: ApiKey) -> Self {
         match key {
+            ApiKey::CreateDatabase => 1001,
+            ApiKey::DropDatabase => 1002,
+            ApiKey::ListDatabases => 1003,
+            ApiKey::DatabaseExists => 1004,
             ApiKey::CreateTable => 1005,
-            ApiKey::ProduceLog => 1014,
-            ApiKey::MetaData => 1012,
+            ApiKey::DropTable => 1006,
             ApiKey::GetTable => 1007,
+            ApiKey::ListTables => 1008,
+            ApiKey::TableExists => 1010,
+            ApiKey::MetaData => 1012,
+            ApiKey::ProduceLog => 1014,
             ApiKey::FetchLog => 1015,
+            ApiKey::GetLatestLakeSnapshot => 1032,
+            ApiKey::GetDatabaseInfo => 1035,
             Unknown(x) => x,
         }
     }
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_database.rs b/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
new file mode 100644
index 0000000000..e4052ef361
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
@@ -0,0 +1,67 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::DatabaseDescriptor;
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+
+use crate::error::Result as FlussResult;
+use crate::proto::CreateDatabaseResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct CreateDatabaseRequest {
+    pub inner_request: proto::CreateDatabaseRequest,
+}
+
+impl CreateDatabaseRequest {
+    /// Builds a create-database request for `database_name`.
+    ///
+    /// When `database_descriptor` is given it is serialized to JSON bytes and attached;
+    /// a serialization failure is returned to the caller.
+    pub fn new(
+        database_name: &str,
+        ignore_if_exists: bool,
+        database_descriptor: Option<&DatabaseDescriptor>,
+    ) -> FlussResult<Self> {
+        let database_json = database_descriptor
+            .map(DatabaseDescriptor::to_json_bytes)
+            .transpose()?;
+        let inner_request = proto::CreateDatabaseRequest {
+            database_name: database_name.to_string(),
+            ignore_if_exists,
+            database_json,
+        };
+        Ok(Self { inner_request })
+    }
+}
+
+impl RequestBody for CreateDatabaseRequest {
+    type ResponseBody = CreateDatabaseResponse;
+
+    const API_KEY: ApiKey = ApiKey::CreateDatabase;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(CreateDatabaseRequest);
+impl_read_version_type!(CreateDatabaseResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs b/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs
new file mode 100644
index 0000000000..795eea1260
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs
@@ -0,0 +1,49 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct DatabaseExistsRequest {
+    pub inner_request: proto::DatabaseExistsRequest,
+}
+
+impl DatabaseExistsRequest {
+    /// Builds a database-exists request for `database_name`.
+    pub fn new(database_name: &str) -> Self {
+        let inner_request = proto::DatabaseExistsRequest {
+            database_name: database_name.to_string(),
+        };
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for DatabaseExistsRequest {
+    type ResponseBody = proto::DatabaseExistsResponse;
+
+    const API_KEY: ApiKey = ApiKey::DatabaseExists;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(DatabaseExistsRequest);
+impl_read_version_type!(proto::DatabaseExistsResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs b/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs
new file mode 100644
index 0000000000..49cbfaf8d4
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs
@@ -0,0 +1,51 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct DropDatabaseRequest {
+    pub inner_request: proto::DropDatabaseRequest,
+}
+
+impl DropDatabaseRequest {
+    /// Builds a drop-database request; both flags are forwarded to the proto message as given.
+    pub fn new(database_name: &str, ignore_if_not_exists: bool, cascade: bool) -> Self {
+        let inner_request = proto::DropDatabaseRequest {
+            database_name: database_name.to_string(),
+            ignore_if_not_exists,
+            cascade,
+        };
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for DropDatabaseRequest {
+    type ResponseBody = proto::DropDatabaseResponse;
+
+    const API_KEY: ApiKey = ApiKey::DropDatabase;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(DropDatabaseRequest);
+impl_read_version_type!(proto::DropDatabaseResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs b/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs
new file mode 100644
index 0000000000..0dbc21bbbe
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs
@@ -0,0 +1,56 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::TablePath;
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+
+use crate::proto::DropTableResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::convert::to_table_path;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct DropTableRequest {
+    pub inner_request: proto::DropTableRequest,
+}
+
+impl DropTableRequest {
+    /// Builds a drop-table request for `table_path`, converted via `to_table_path`.
+    pub fn new(table_path: &TablePath, ignore_if_not_exists: bool) -> Self {
+        let inner_request = proto::DropTableRequest {
+            table_path: to_table_path(table_path),
+            ignore_if_not_exists,
+        };
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for DropTableRequest {
+    type ResponseBody = DropTableResponse;
+
+    const API_KEY: ApiKey = ApiKey::DropTable;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(DropTableRequest);
+impl_read_version_type!(DropTableResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs b/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs
new file mode 100644
index 0000000000..85492a8bf0
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs
@@ -0,0 +1,49 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct GetDatabaseInfoRequest {
+    pub inner_request: proto::GetDatabaseInfoRequest,
+}
+
+impl GetDatabaseInfoRequest {
+    /// Builds a get-database-info request for `database_name`.
+    pub fn new(database_name: &str) -> Self {
+        let inner_request = proto::GetDatabaseInfoRequest {
+            database_name: database_name.to_string(),
+        };
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for GetDatabaseInfoRequest {
+    type ResponseBody = proto::GetDatabaseInfoResponse;
+
+    const API_KEY: ApiKey = ApiKey::GetDatabaseInfo;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(GetDatabaseInfoRequest);
+impl_read_version_type!(proto::GetDatabaseInfoResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs b/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
new file mode 100644
index 0000000000..a0e186efd2
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
@@ -0,0 +1,55 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto;
+use crate::proto::PbTablePath;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+
+use crate::metadata::TablePath;
+use crate::{impl_read_version_type, impl_write_version_type};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct GetLatestLakeSnapshotRequest {
+    pub inner_request: proto::GetLatestLakeSnapshotRequest,
+}
+
+impl GetLatestLakeSnapshotRequest {
+    /// Builds a latest-lake-snapshot request for the table at `table_path`.
+    pub fn new(table_path: &TablePath) -> Self {
+        let table_path = PbTablePath {
+            database_name: table_path.database().to_string(),
+            table_name: table_path.table().to_string(),
+        };
+        Self {
+            inner_request: proto::GetLatestLakeSnapshotRequest { table_path },
+        }
+    }
+}
+
+impl RequestBody for GetLatestLakeSnapshotRequest {
+    type ResponseBody = proto::GetLatestLakeSnapshotResponse;
+    const API_KEY: ApiKey = ApiKey::GetLatestLakeSnapshot;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(GetLatestLakeSnapshotRequest);
+impl_read_version_type!(proto::GetLatestLakeSnapshotResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs b/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
new file mode 100644
index 0000000000..ce5a091540
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
@@ -0,0 +1,47 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug, Default)]
+pub struct ListDatabasesRequest {
+    pub inner_request: proto::ListDatabasesRequest,
+}
+
+impl ListDatabasesRequest {
+    /// Builds a list-databases request; the proto message has no fields.
+    pub fn new() -> Self {
+        let inner_request = proto::ListDatabasesRequest {};
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for ListDatabasesRequest {
+    type ResponseBody = proto::ListDatabasesResponse;
+
+    const API_KEY: ApiKey = ApiKey::ListDatabases;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(ListDatabasesRequest);
+impl_read_version_type!(proto::ListDatabasesResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs b/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs
new file mode 100644
index 0000000000..daf57ea6b5
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs
@@ -0,0 +1,53 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+
+use crate::proto::ListTablesResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct ListTablesRequest {
+    pub inner_request: proto::ListTablesRequest,
+}
+
+impl ListTablesRequest {
+    /// Creates a request that carries an owned copy of `database_name`.
+    pub fn new(database_name: &str) -> Self {
+        let inner_request = proto::ListTablesRequest {
+            database_name: database_name.to_owned(),
+        };
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for ListTablesRequest {
+    type ResponseBody = ListTablesResponse;
+
+    const API_KEY: ApiKey = ApiKey::ListTables;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(ListTablesRequest);
+impl_read_version_type!(ListTablesResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 742c39369d..d5f8ebde89 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -20,18 +20,36 @@ use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::{ReadError, WriteError};
 use bytes::{Buf, BufMut};
 
+mod create_database;
 mod create_table;
+mod database_exists;
+mod drop_database;
+mod drop_table;
 mod fetch;
+mod get_database_info;
+mod get_latest_lake_snapshot;
 mod get_table;
 mod header;
+mod list_databases;
+mod list_tables;
 mod produce_log;
+mod table_exists;
 mod update_metadata;
 
+pub use create_database::*;
 pub use create_table::*;
+pub use database_exists::*;
+pub use drop_database::*;
+pub use drop_table::*;
 pub use fetch::*;
+pub use get_database_info::*;
+pub use get_latest_lake_snapshot::*;
 pub use get_table::*;
 pub use header::*;
+pub use list_databases::*;
+pub use list_tables::*;
 pub use produce_log::*;
+pub use table_exists::*;
 pub use update_metadata::*;
 
 pub trait RequestBody {
diff --git a/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs b/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs
new file mode 100644
index 0000000000..3b71f471ac
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs
@@ -0,0 +1,55 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::TablePath;
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+
+use crate::proto::TableExistsResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::convert::to_table_path;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct TableExistsRequest {
+    pub inner_request: proto::TableExistsRequest,
+}
+
+impl TableExistsRequest {
+    /// Creates a request whose `table_path` field is built by `to_table_path`.
+    pub fn new(table_path: &TablePath) -> Self {
+        let inner_request = proto::TableExistsRequest {
+            table_path: to_table_path(table_path),
+        };
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for TableExistsRequest {
+    type ResponseBody = TableExistsResponse;
+
+    const API_KEY: ApiKey = ApiKey::TableExists;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(TableExistsRequest);
+impl_read_version_type!(TableExistsResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index a102aa3ba6..4eeda46063 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -72,7 +72,6 @@ impl RpcClient {
                 return Ok(connection.clone());
             }
         }
-
         let new_server = self.connect(server_node).await?;
         self.connections
             .write()

From 4779328d24a274d98e29933785c78ffec819bb5b Mon Sep 17 00:00:00 2001
From: naivedogger <59598718+naivedogger@users.noreply.github.com>
Date: Tue, 16 Sep 2025 11:54:04 +0800
Subject: [PATCH 007/287] [feat] Set up uv, ruff, and other settings for Python
 binding (#7)

---
 fluss-rust/bindings/python/Cargo.toml     |  38 ++++++
 fluss-rust/bindings/python/README.md      | 149 ++++++++++++++++++++++
 fluss-rust/bindings/python/pyproject.toml |  96 ++++++++++++++
 3 files changed, 283 insertions(+)
 create mode 100644 fluss-rust/bindings/python/Cargo.toml
 create mode 100644 fluss-rust/bindings/python/README.md
 create mode 100644 fluss-rust/bindings/python/pyproject.toml

diff --git a/fluss-rust/bindings/python/Cargo.toml b/fluss-rust/bindings/python/Cargo.toml
new file mode 100644
index 0000000000..aee1a21314
--- /dev/null
+++ b/fluss-rust/bindings/python/Cargo.toml
@@ -0,0 +1,38 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[package]
+name = "fluss_python"
+edition = "2024"
+version = "0.1.0"
+license = "apache-2.0"
+rust-version = "1.85"
+
+[lib]
+name = "fluss"
+crate-type = ["cdylib"]
+
+[workspace]
+
+[dependencies]
+pyo3 = { version = "0.24", features = ["extension-module"] }
+fluss = { path = "../../crates/fluss" }
+tokio = { workspace = true }
+arrow = { workspace = true }
+arrow-pyarrow = "55.1.0"
+pyo3-async-runtimes = { version = "0.24.0", features = ["tokio-runtime"] }
+chrono = { workspace = true }
diff --git a/fluss-rust/bindings/python/README.md b/fluss-rust/bindings/python/README.md
new file mode 100644
index 0000000000..5258f53291
--- /dev/null
+++ b/fluss-rust/bindings/python/README.md
@@ -0,0 +1,149 @@
+<!--
+  ~ Licensed to the Apache Software Foundation (ASF) under one
+  ~ or more contributor license agreements.  See the NOTICE file
+  ~ distributed with this work for additional information
+  ~ regarding copyright ownership.  The ASF licenses this file
+  ~ to you under the Apache License, Version 2.0 (the
+  ~ "License"); you may not use this file except in compliance
+  ~ with the License.  You may obtain a copy of the License at
+  ~
+  ~   http://www.apache.org/licenses/LICENSE-2.0
+  ~
+  ~ Unless required by applicable law or agreed to in writing,
+  ~ software distributed under the License is distributed on an
+  ~ "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+  ~ KIND, either express or implied.  See the License for the
+  ~ specific language governing permissions and limitations
+  ~ under the License.
+-->
+
+# Apache Fluss™ Python Bindings
+
+Python bindings for Fluss using PyO3 and Maturin.
+
+## API Overview
+
+### Basic Usage
+
+TODO: Add basic usage examples here
+
+### Core Classes
+
+#### `Config`
+
+Configuration for Fluss connection parameters
+
+#### `FlussConnection`
+
+Main interface for connecting to Fluss cluster
+
+#### `FlussAdmin`
+
+Administrative operations for managing tables (create, delete, etc.)
+
+#### `FlussTable`
+
+Represents a Fluss table, providing read and write operations
+
+#### `TableWriter`
+
+Used for writing data to tables, supports PyArrow and Pandas
+
+#### `LogScanner`
+
+Used for scanning table log data
+
+## Development
+
+### Requirements
+
+- Python 3.9+
+- Rust 1.85+
+- [uv](https://docs.astral.sh/uv/) package manager
+- Linux or macOS
+
+> **⚠️ Before you start:**  
+> Please make sure you can successfully build and run the [Fluss Rust client](../../crates/fluss/README.md) on your machine.  
+> The Python bindings require a working Fluss Rust backend and compatible environment.
+
+### Install Development Dependencies
+
+```bash
+cd bindings/python
+uv sync --all-extras
+```
+
+### Build Development Version
+
+```bash
+source .venv/bin/activate
+uv run maturin develop
+```
+
+### Build Release Version
+
+```bash
+uv run maturin build --release
+```
+
+### Code Formatting and Linting
+
+```bash
+uv run ruff format python/
+uv run ruff check python/
+```
+
+### Type Checking
+
+```bash
+uv run mypy python/
+```
+
+### Run Examples
+
+```bash
+uv run python example/example.py
+```
+
+### Build API Docs
+
+```bash
+uv run pdoc fluss_python
+```
+
+### Release
+
+```bash
+# Build wheel
+uv run maturin build --release
+
+# Publish to PyPI
+uv run maturin publish
+```
+
+## Project Structure
+```
+bindings/python/
+├── Cargo.toml              # Rust dependency configuration
+├── pyproject.toml          # Python project configuration
+├── README.md              # This file
+├── src/                   # Rust source code
+│   ├── lib.rs            # Main entry module
+│   ├── config.rs         # Configuration related
+│   ├── connection.rs     # Connection management
+│   ├── admin.rs          # Admin operations
+│   ├── table.rs          # Table operations
+│   ├── types.rs          # Data types
+│   └── error.rs          # Error handling
+├── python/               # Python package source
+│   └── fluss_python/
+│       ├── __init__.py   # Python package entry
+│       ├── __init__.pyi  # Stub file
+│       └── py.typed      # Type declarations
+└── example/              # Example code
+    └── example.py
+```
+
+## License
+
+Apache 2.0 License
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
new file mode 100644
index 0000000000..fe9d58878d
--- /dev/null
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -0,0 +1,96 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[build-system]
+requires = ["maturin>=1.0,<2.0"]
+build-backend = "maturin"
+
+[project]
+name = "fluss"
+description = "Python bindings for Fluss on fluss-rust with Pandas integration"
+authors = [{name = "Fluss Team"}]
+license = {text = "Apache-2.0"}
+readme = "README.md"
+requires-python = ">=3.9"
+classifiers = [
+    "License :: OSI Approved :: Apache Software License",
+    "Programming Language :: Python :: 3.9",
+    "Programming Language :: Python :: 3.10",
+    "Programming Language :: Python :: 3.11",
+    "Programming Language :: Python :: 3.12",
+]
+
+dynamic = ["version"]
+
+dependencies = [
+    "pandas>=2.3.1",
+    "pyarrow>=10.0.0",
+]
+
+[project.urls]
+Repository = "https://github.com/apache/fluss-rust"
+
+[project.optional-dependencies]
+dev = [
+    "mypy>=1.17.1",
+    "pytest>=8.3.5",
+    "pytest-asyncio>=0.25.3",
+    "ruff>=0.9.10",
+    "maturin>=1.8.2",
+]
+docs = [
+    "pdoc>=15.0.4",
+]
+
+[tool.maturin]
+python-source = "python"
+module-name = "fluss._fluss"
+features = ["pyo3/extension-module"]
+
+[tool.uv]
+cache-keys = [
+  { file = "pyproject.toml" },
+  { file = "Cargo.toml" },
+  { file = "src/**/*.rs" },
+  { file = "../../crates/**/*.rs" },
+]
+
+[tool.ruff]
+line-length = 88
+fix = true
+
+[tool.ruff.lint]
+ignore = ["E402", "F403", "F405"]
+select = ["E", "F", "I"]
+
+[tool.ruff.lint.pycodestyle]
+max-doc-length = 88
+
+[tool.ruff.lint.pydocstyle]
+convention = "numpy"
+
+[tool.ruff.format]
+docstring-code-format = true
+
+[tool.ruff.lint.isort]
+known-first-party = ["fluss"]
+
+[tool.mypy]
+python_version = "3.9"
+warn_return_any = true
+warn_unused_configs = true
+ignore_missing_imports = true

From bb8abafa13d6323d9c668dfedd9a6dcc1c3d1b21 Mon Sep 17 00:00:00 2001
From: naivedogger <59598718+naivedogger@users.noreply.github.com>
Date: Wed, 17 Sep 2025 15:00:33 +0800
Subject: [PATCH 008/287] [feat] Create Python bindings for metadata (#8)

---
 fluss-rust/bindings/python/src/config.rs   | 117 +++++
 fluss-rust/bindings/python/src/metadata.rs | 581 +++++++++++++++++++++
 2 files changed, 698 insertions(+)
 create mode 100644 fluss-rust/bindings/python/src/config.rs
 create mode 100644 fluss-rust/bindings/python/src/metadata.rs

diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
new file mode 100644
index 0000000000..08b20b4d40
--- /dev/null
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -0,0 +1,117 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use pyo3::prelude::*;
+use pyo3::types::PyDict;
+use crate::*;
+
+/// Configuration for Fluss client
+#[pyclass]
+#[derive(Clone)]
+pub struct Config {
+    inner: fcore::config::Config,
+}
+
+#[pymethods]
+impl Config {
+    /// Create a new Config from an optional dict of properties (keys and values must be `str`).
+    ///
+    /// Raises `FlussError` for an unknown key or a numeric value that does not parse as `i32`.
+    #[new]
+    #[pyo3(signature = (properties = None))]
+    fn new(properties: Option<&Bound<'_, PyDict>>) -> PyResult<Self> {
+        let mut config = fcore::config::Config::default();
+
+        if let Some(props) = properties {
+            for (k, v) in props.iter() {
+                let key: String = k.extract()?;
+                let value: String = v.extract()?;
+
+                match key.as_str() {
+                    "bootstrap.servers" => {
+                        config.bootstrap_server = Some(value);
+                    },
+                    "request.max.size" => {
+                        config.request_max_size = value.parse::<i32>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{}' for property '{}': {}", value, key, e))
+                        })?;
+                    },
+                    "writer.acks" => {
+                        config.writer_acks = value;
+                    },
+                    "writer.retries" => {
+                        config.writer_retries = value.parse::<i32>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{}' for property '{}': {}", value, key, e))
+                        })?;
+                    },
+                    "writer.batch.size" => {
+                        config.writer_batch_size = value.parse::<i32>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{}' for property '{}': {}", value, key, e))
+                        })?;
+                    },
+                    _ => {
+                        return Err(FlussError::new_err(format!("Unknown property: {}", key)));
+                    }
+                }
+            }
+        }
+
+        Ok(Self { inner: config })
+    }
+    
+    /// Get the bootstrap server
+    #[getter]
+    fn bootstrap_server(&self) -> Option<String> {
+        self.inner.bootstrap_server.clone()
+    }
+    
+    /// Set the bootstrap server
+    #[setter]
+    fn set_bootstrap_server(&mut self, server: String) {
+        self.inner.bootstrap_server = Some(server);
+    }
+    
+    /// Get the request max size
+    #[getter]
+    fn request_max_size(&self) -> i32 {
+        self.inner.request_max_size
+    }
+    
+    /// Set the request max size
+    #[setter]
+    fn set_request_max_size(&mut self, size: i32) {
+        self.inner.request_max_size = size;
+    }
+    
+    /// Get the writer batch size
+    #[getter]
+    fn writer_batch_size(&self) -> i32 {
+        self.inner.writer_batch_size
+    }
+    
+    /// Set the writer batch size
+    #[setter]
+    fn set_writer_batch_size(&mut self, size: i32) {
+        self.inner.writer_batch_size = size;
+    }
+}
+
+impl Config {
+    pub fn get_core_config(&self) -> fcore::config::Config {
+        self.inner.clone()
+    }
+}
diff --git a/fluss-rust/bindings/python/src/metadata.rs b/fluss-rust/bindings/python/src/metadata.rs
new file mode 100644
index 0000000000..238dde2ec0
--- /dev/null
+++ b/fluss-rust/bindings/python/src/metadata.rs
@@ -0,0 +1,581 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use pyo3::prelude::*;
+use crate::*;
+use pyo3::types::PyDict;
+use std::collections::HashMap;
+
+/// Represents a table path with database and table name
+#[pyclass]
+#[derive(Clone)]
+pub struct TablePath {
+    database_name: String,
+    table_name: String,
+}
+
+#[pymethods]
+impl TablePath {
+    /// Create a new TablePath
+    #[new]
+    pub fn new(database_name: String, table_name: String) -> Self {
+        Self {
+            database_name,
+            table_name,
+        }
+    }
+    
+    /// Get the database name
+    #[getter]
+    pub fn database_name(&self) -> String {
+        self.database_name.clone()
+    }
+    
+    /// Get the table name  
+    #[getter]
+    pub fn table_name(&self) -> String {
+        self.table_name.clone()
+    }
+
+    /// Get table path as string
+    pub fn table_path_str(&self) -> String {
+        format!("{}.{}", self.database_name, self.table_name)
+    }
+
+    pub fn __str__(&self) -> String {
+        self.table_path_str()
+    }
+    
+    fn __repr__(&self) -> String {
+        format!("TablePath('{}', '{}')", self.database_name, self.table_name)
+    }
+
+    /// Hash implementation for Python
+    pub fn __hash__(&self) -> u64 {
+        use std::collections::hash_map::DefaultHasher;
+        use std::hash::{Hash, Hasher};
+        
+        let mut hasher = DefaultHasher::new();
+        self.database_name.hash(&mut hasher);
+        self.table_name.hash(&mut hasher);
+        hasher.finish()
+    }
+
+    /// Equality implementation for Python
+    pub fn __eq__(&self, other: &TablePath) -> bool {
+        self.database_name == other.database_name 
+            && self.table_name == other.table_name
+    }
+}
+
+impl TablePath {
+    /// Convert to core TablePath
+    pub fn to_core(&self) -> fcore::metadata::TablePath {
+        fcore::metadata::TablePath::new(self.database_name.clone(), self.table_name.clone())
+    }
+
+    pub fn from_core(core_path: fcore::metadata::TablePath) -> Self {
+        Self {
+            database_name: core_path.database().to_string(),
+            table_name: core_path.table().to_string(),
+        }
+    }
+}
+
+/// Schema wrapper for Fluss table schema
+#[pyclass]
+pub struct Schema {
+    __schema: fcore::metadata::Schema,
+}
+
+#[pymethods]
+impl Schema {
+    /// Create a new Schema from PyArrow schema with optional primary keys
+    #[new]
+    #[pyo3(signature = (schema, primary_keys=None))]
+    pub fn new(
+        schema: PyObject, // PyArrow schema
+        primary_keys: Option<Vec<String>>,
+    ) -> PyResult<Self> {
+        let arrow_schema = crate::utils::Utils::pyarrow_to_arrow_schema(&schema)?;
+        
+        let mut builder = fcore::metadata::Schema::builder();
+        
+        for field in arrow_schema.fields() {
+            let fluss_data_type = crate::utils::Utils::arrow_type_to_fluss_type(field.data_type())?;
+            builder = builder.column(field.name(), fluss_data_type);
+            
+            if let Some(comment) = field.metadata().get("comment") {
+                builder = builder.with_comment(comment);
+            }
+        }
+        
+        if let Some(pk_columns) = primary_keys {
+            if !pk_columns.is_empty() {
+                builder = builder.primary_key(pk_columns);
+            }
+        }
+        
+        let fluss_schema = builder.build()
+            .map_err(|e| FlussError::new_err(format!("Failed to build schema: {}", e)))?;
+        
+        Ok(Self {
+            __schema: fluss_schema,
+        })
+    }
+
+    /// Get column names
+    fn get_column_names(&self) -> Vec<String> {
+        self.__schema.columns().iter().map(|col| col.name().to_string()).collect()
+    }
+
+    /// Get column types
+    fn get_column_types(&self) -> Vec<String> {
+        self.__schema.columns().iter()
+            .map(|col| Utils::datatype_to_string(col.data_type()))
+            .collect()
+    }
+
+    /// Get columns as (name, type) pairs
+    fn get_columns(&self) -> Vec<(String, String)> {
+        self.__schema.columns().iter()
+            .map(|col| (col.name().to_string(), Utils::datatype_to_string(col.data_type())))
+            .collect()
+    }
+
+    // TODO: support primaryKey
+
+    fn __str__(&self) -> String {
+        format!("Schema: columns={:?}", self.get_columns())
+    }
+}
+
+impl Schema {
+    /// Convert to core Schema
+    pub fn to_core(&self) -> &fcore::metadata::Schema {
+        &self.__schema
+    }
+}
+
+/// Table distribution configuration
+#[pyclass]
+pub struct TableDistribution {
+    inner: fcore::metadata::TableDistribution,
+}
+
+#[pymethods]
+impl TableDistribution {
+    /// Get bucket keys
+    fn bucket_keys(&self) -> Vec<String> {
+        self.inner.bucket_keys().to_vec()
+    }
+
+    /// Get bucket count
+    fn bucket_count(&self) -> Option<i32> {
+        self.inner.bucket_count()
+    }
+}
+
+
+/// Table descriptor containing schema and metadata
+#[pyclass]
+#[derive(Clone)]
+pub struct TableDescriptor {
+    __tbl_desc: fcore::metadata::TableDescriptor,
+}
+
+#[pymethods]
+impl TableDescriptor {
+    /// Create a new TableDescriptor from a Fluss schema and optional keyword
+    /// arguments: `partition_keys`, `bucket_count`, `bucket_keys`, `properties`,
+    /// `custom_properties`, `comment`, `log_format` and `kv_format`.
+    /// Any other keyword argument is ignored.
+    #[new]
+    #[pyo3(signature = (schema, **kwargs))]
+    pub fn new(
+        schema: &Schema,  // fluss schema
+        kwargs: Option<&Bound<'_, PyDict>>,
+    ) -> PyResult<Self> {
+        let mut partition_keys = Vec::new();
+        let mut bucket_count = None;
+        let mut bucket_keys = Vec::new();
+        let mut properties = HashMap::new();
+        let mut custom_properties = HashMap::new();
+        let mut comment: Option<String> = None;
+        let mut log_format = None;
+        let mut kv_format = None;
+
+        // `get_item` failures are propagated with `?` rather than treated as "key absent".
+        if let Some(kwargs) = kwargs {
+            if let Some(pkeys) = kwargs.get_item("partition_keys")? {
+                partition_keys = pkeys.extract()?;
+            }
+            if let Some(bcount) = kwargs.get_item("bucket_count")? {
+                bucket_count = Some(bcount.extract()?);
+            }
+            if let Some(bkeys) = kwargs.get_item("bucket_keys")? {
+                bucket_keys = bkeys.extract()?;
+            }
+            if let Some(props) = kwargs.get_item("properties")? {
+                properties = props.extract()?;
+            }
+            if let Some(cprops) = kwargs.get_item("custom_properties")? {
+                custom_properties = cprops.extract()?;
+            }
+            if let Some(comm) = kwargs.get_item("comment")? {
+                comment = Some(comm.extract()?);
+            }
+            if let Some(lformat) = kwargs.get_item("log_format")? {
+                let format_str: String = lformat.extract()?;
+                log_format = Some(fcore::metadata::LogFormat::parse(&format_str)
+                    .map_err(|e| FlussError::new_err(e.to_string()))?);
+            }
+            if let Some(kformat) = kwargs.get_item("kv_format")? {
+                let format_str: String = kformat.extract()?;
+                kv_format = Some(fcore::metadata::KvFormat::parse(&format_str)
+                    .map_err(|e| FlussError::new_err(e.to_string()))?);
+            }
+        }
+
+        let fluss_schema = schema.to_core().clone();
+        let mut builder = fcore::metadata::TableDescriptor::builder()
+            .schema(fluss_schema)
+            .properties(properties)
+            .custom_properties(custom_properties)
+            .partitioned_by(partition_keys)
+            .distributed_by(bucket_count, bucket_keys);
+
+        if let Some(comment) = comment {
+            builder = builder.comment(&comment);
+        }
+        if let Some(log_format) = log_format {
+            builder = builder.log_format(log_format);
+        }
+        if let Some(kv_format) = kv_format {
+            builder = builder.kv_format(kv_format);
+        }
+
+        let core_descriptor = builder.build()
+            .map_err(|e| FlussError::new_err(format!("Failed to build TableDescriptor: {}", e)))?;
+        Ok(Self { __tbl_desc: core_descriptor })
+    }
+
+    /// Get the schema of this table descriptor
+    pub fn get_schema(&self) -> PyResult<Schema> {
+        Ok(Schema {
+            __schema: self.__tbl_desc.schema().clone(),
+        })
+    }
+}
+
+impl TableDescriptor {
+    /// Convert to core TableDescriptor
+    pub fn to_core(&self) -> &fcore::metadata::TableDescriptor {
+        &self.__tbl_desc
+    }
+}
+
+/// Information about a Fluss table
+#[pyclass]
+#[derive(Clone)]
+pub struct TableInfo {
+    __table_info: fcore::metadata::TableInfo,
+}
+
+#[pymethods]
+impl TableInfo {
+    /// Get the table ID
+    #[getter]
+    pub fn table_id(&self) -> i64 {
+        self.__table_info.get_table_id()
+    }
+    
+    /// Get the schema ID
+    #[getter]
+    pub fn schema_id(&self) -> i32 {
+        self.__table_info.get_schema_id()
+    }
+    
+    /// Get the table path
+    #[getter]
+    pub fn table_path(&self) -> TablePath {
+        TablePath::from_core(self.__table_info.get_table_path().clone())
+    }
+
+    /// Get the created time
+    #[getter]
+    pub fn created_time(&self) -> i64 {
+        self.__table_info.get_created_time()
+    }
+    
+    /// Get the modified time
+    #[getter]
+    pub fn modified_time(&self) -> i64 {
+        self.__table_info.get_modified_time()
+    }
+    
+    /// Get the primary keys
+    pub fn get_primary_keys(&self) -> Vec<String> {
+        self.__table_info.get_primary_keys().clone()
+    }
+
+    /// Get the bucket keys
+    pub fn get_bucket_keys(&self) -> Vec<String> {
+        self.__table_info.get_bucket_keys().to_vec()
+    }
+
+    /// Get the partition keys
+    pub fn get_partition_keys(&self) -> Vec<String> {
+        self.__table_info.get_partition_keys().to_vec()
+    }
+
+    /// Get number of buckets
+    #[getter]
+    pub fn num_buckets(&self) -> i32 {
+        self.__table_info.get_num_buckets()
+    }
+
+    /// Check if table has primary key
+    pub fn has_primary_key(&self) -> bool {
+        self.__table_info.has_primary_key()
+    }
+
+    /// Check if table is partitioned
+    pub fn is_partitioned(&self) -> bool {
+        self.__table_info.is_partitioned()
+    }
+
+    /// Get properties
+    pub fn get_properties(&self) -> std::collections::HashMap<String, String> {
+        self.__table_info.get_properties().clone()
+    }
+
+    /// Get custom properties
+    pub fn get_custom_properties(&self) -> std::collections::HashMap<String, String> {
+        self.__table_info.get_custom_properties().clone()
+    }
+
+    /// Get comment
+    #[getter]
+    pub fn comment(&self) -> Option<String> {
+        self.__table_info.get_comment().map(|s| s.to_string())
+    }
+
+    /// Get the Schema
+    pub fn get_schema(&self) -> Schema {
+        Schema {
+            __schema: self.__table_info.get_schema().clone(),
+        }
+    }
+
+    /// Get column names
+    pub fn get_column_names(&self) -> Vec<String> {
+        self.__table_info.get_schema().columns().iter()
+            .map(|col| col.name().to_string())
+            .collect()
+    }
+
+    /// Get column count
+    pub fn get_column_count(&self) -> usize {
+        self.__table_info.get_schema().columns().len()
+    }
+}
+
+impl TableInfo {
+    /// Create from core TableInfo (internal use)
+    pub fn from_core(info: fcore::metadata::TableInfo) -> Self {
+        Self {
+            __table_info: info,
+        }
+    }
+}
+
+/// Represents a lake snapshot with snapshot ID and table bucket offsets
+#[pyclass]
+#[derive(Clone)]
+pub struct LakeSnapshot {
+    snapshot_id: i64,
+    table_buckets_offset: HashMap<fcore::metadata::TableBucket, i64>,
+}
+
+/// Represents a table bucket with table ID, partition ID, and bucket ID
+#[pyclass]
+#[derive(Clone)]
+pub struct TableBucket {
+    table_id: i64,
+    partition_id: Option<i64>,
+    bucket: i32,
+}
+
+#[pymethods]
+impl TableBucket {
+    /// Build a bucket identified by table ID and bucket number only.
+    /// `partition_id` is left as `None`; use `with_partition` to set it.
+    #[new]
+    pub fn new(table_id: i64, bucket: i32) -> Self {
+        Self { table_id, partition_id: None, bucket }
+    }
+
+    /// Build a bucket that also records the partition it belongs to.
+    /// Exposed to Python as a static method.
+    #[staticmethod]
+    pub fn with_partition(table_id: i64, partition_id: i64, bucket: i32) -> Self {
+        Self { table_id, partition_id: Some(partition_id), bucket }
+    }
+
+    /// ID of the table this bucket belongs to.
+    #[getter]
+    pub fn table_id(&self) -> i64 {
+        self.table_id
+    }
+
+    /// Bucket number, exposed to Python as the `bucket_id` property.
+    #[getter]
+    pub fn bucket_id(&self) -> i32 {
+        self.bucket
+    }
+
+    /// Partition ID, or `None` when no partition was recorded.
+    #[getter]
+    pub fn partition_id(&self) -> Option<i64> {
+        self.partition_id
+    }
+
+    /// Human-readable form of the bucket.
+    /// The `partition_id` field is printed only when it is set.
+    pub fn __str__(&self) -> String {
+        match self.partition_id {
+            Some(partition_id) => format!(
+                "TableBucket(table_id={}, partition_id={}, bucket={})",
+                self.table_id, partition_id, self.bucket
+            ),
+            None => format!(
+                "TableBucket(table_id={}, bucket={})",
+                self.table_id, self.bucket
+            ),
+        }
+    }
+
+    /// Same text as `__str__`.
+    /// Kept as a separate method so Python's `repr()` works too.
+    pub fn __repr__(&self) -> String {
+        self.__str__()
+    }
+
+    /// Hash of `table_id`, `partition_id` and `bucket`, fed to the hasher in that order.
+    /// These are the same three fields that `__eq__` compares.
+    pub fn __hash__(&self) -> u64 {
+        use std::collections::hash_map::DefaultHasher;
+        use std::hash::{Hash, Hasher};
+
+        let mut state = DefaultHasher::new();
+        // A tuple hashes its elements one after another, left to right.
+        (self.table_id, self.partition_id, self.bucket).hash(&mut state);
+        state.finish()
+    }
+
+    /// Two buckets are equal when table ID, partition ID and bucket number all match.
+    /// Implements Python's `==` for `TableBucket` operands.
+    pub fn __eq__(&self, other: &TableBucket) -> bool {
+        let lhs = (self.table_id, self.partition_id, self.bucket);
+        let rhs = (other.table_id, other.partition_id, other.bucket);
+        lhs == rhs
+    }
+}
+
+impl TableBucket {
+    /// Copy the table ID, partition ID and bucket ID out of a core `TableBucket`.
+    pub fn from_core(bucket: fcore::metadata::TableBucket) -> Self {
+        let table_id = bucket.table_id();
+        let partition_id = bucket.partition_id();
+        let bucket = bucket.bucket_id();
+        Self { table_id, partition_id, bucket }
+    }
+
+    /// Rebuild the core `TableBucket` from the three stored fields.
+    pub fn to_core(&self) -> fcore::metadata::TableBucket {
+        let Self { table_id, partition_id, bucket } = self;
+        fcore::metadata::TableBucket::new(*table_id, *partition_id, *bucket)
+    }
+}
+
+#[pymethods]
+impl LakeSnapshot {
+    /// Create a snapshot with the given ID and an empty bucket-offset map.
+    #[new]
+    pub fn new(snapshot_id: i64) -> Self {
+        let table_buckets_offset = HashMap::new();
+        Self { snapshot_id, table_buckets_offset }
+    }
+
+    /// ID of this snapshot.
+    #[getter]
+    pub fn snapshot_id(&self) -> i64 {
+        self.snapshot_id
+    }
+
+    /// Build a Python dict mapping each bucket (as a Python `TableBucket`) to its offset.
+    /// A new dict and new key objects are created on every access.
+    #[getter]
+    pub fn table_buckets_offset(&self, py: Python) -> PyResult<PyObject> {
+        let offsets = PyDict::new(py);
+        for (core_bucket, offset) in self.table_buckets_offset.iter() {
+            let key = Py::new(py, TableBucket::from_core(core_bucket.clone()))?;
+            offsets.set_item(key, *offset)?;
+        }
+        Ok(offsets.into())
+    }
+
+    /// Look up the offset stored for `bucket`; `None` when the snapshot has no entry for it.
+    /// The Python `TableBucket` is converted to its core form for the lookup.
+    pub fn get_bucket_offset(&self, bucket: &TableBucket) -> Option<i64> {
+        self.table_buckets_offset.get(&bucket.to_core()).copied()
+    }
+
+    /// List every bucket that has an offset in this snapshot, as Python `TableBucket` objects.
+    /// The list follows the map's key iteration order.
+    pub fn get_table_buckets(&self, py: Python) -> PyResult<Vec<PyObject>> {
+        let mut py_buckets = Vec::new();
+        for core_bucket in self.table_buckets_offset.keys() {
+            let wrapped = Py::new(py, TableBucket::from_core(core_bucket.clone()))?;
+            py_buckets.push(wrapped.into());
+        }
+        Ok(py_buckets)
+    }
+
+    /// Short summary: the snapshot ID and how many buckets have an offset.
+    pub fn __str__(&self) -> String {
+        let buckets_count = self.table_buckets_offset.len();
+        format!("LakeSnapshot(snapshot_id={}, buckets_count={})", self.snapshot_id, buckets_count)
+    }
+
+    /// Same text as `__str__`.
+    pub fn __repr__(&self) -> String {
+        self.__str__()
+    }
+}
+
+impl LakeSnapshot {
+    /// Take over the snapshot ID and bucket-offset map of a core `LakeSnapshot`.
+    /// The offset map is moved out of `snapshot`, not cloned.
+    pub fn from_core(snapshot: fcore::metadata::LakeSnapshot) -> Self {
+        let snapshot_id = snapshot.snapshot_id;
+        let table_buckets_offset = snapshot.table_buckets_offset;
+        Self { snapshot_id, table_buckets_offset }
+    }
+}
+

From 757a833a868cb3bde4f1504ce73c11c58507985f Mon Sep 17 00:00:00 2001
From: naivedogger <59598718+naivedogger@users.noreply.github.com>
Date: Thu, 18 Sep 2025 12:09:53 +0800
Subject: [PATCH 009/287] [feat] Create Python bindings for Fluss Admin (#6)

---
 fluss-rust/bindings/python/fluss/__init__.py |  20 +++
 fluss-rust/bindings/python/src/admin.rs      | 107 +++++++++++
 fluss-rust/bindings/python/src/connection.rs | 117 ++++++++++++
 fluss-rust/bindings/python/src/error.rs      |  39 ++++
 fluss-rust/bindings/python/src/lib.rs        |  67 +++++++
 fluss-rust/bindings/python/src/utils.rs      | 178 +++++++++++++++++++
 6 files changed, 528 insertions(+)
 create mode 100644 fluss-rust/bindings/python/fluss/__init__.py
 create mode 100644 fluss-rust/bindings/python/src/admin.rs
 create mode 100644 fluss-rust/bindings/python/src/connection.rs
 create mode 100644 fluss-rust/bindings/python/src/error.rs
 create mode 100644 fluss-rust/bindings/python/src/lib.rs
 create mode 100644 fluss-rust/bindings/python/src/utils.rs

diff --git a/fluss-rust/bindings/python/fluss/__init__.py b/fluss-rust/bindings/python/fluss/__init__.py
new file mode 100644
index 0000000000..cceee102ad
--- /dev/null
+++ b/fluss-rust/bindings/python/fluss/__init__.py
@@ -0,0 +1,20 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+from .fluss_python import *  # re-export the public names of the compiled `fluss_python` extension module
+
+__version__ = "0.1.0"
diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
new file mode 100644
index 0000000000..7ec6eee93b
--- /dev/null
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -0,0 +1,107 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use pyo3::prelude::*;
+use pyo3_async_runtimes::tokio::future_into_py;
+use crate::*;
+use std::sync::Arc;
+
+/// Administrative client for managing Fluss tables (create a table, fetch table info, fetch the latest lake snapshot)
+#[pyclass]
+pub struct FlussAdmin {
+    __admin: Arc<fcore::client::FlussAdmin>, // shared core admin; each async method clones this handle into its future
+}
+
+#[pymethods]
+impl FlussAdmin {
+    /// Create a table at `table_path` as described by `table_descriptor`.
+    /// Returns an awaitable resolving to `None`; a core error is converted with `FlussError::new_err`.
+    /// `ignore_if_exists` is forwarded to the core admin and defaults to `false`.
+    #[pyo3(signature = (table_path, table_descriptor, ignore_if_exists=None))]
+    pub fn create_table<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+        table_descriptor: &TableDescriptor,
+        ignore_if_exists: Option<bool>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        // Everything the future needs is cloned up front so the `async move` block owns its inputs.
+        let ignore = ignore_if_exists.unwrap_or(false);
+        let path = table_path.to_core().clone();
+        let descriptor = table_descriptor.to_core().clone();
+        let admin = Arc::clone(&self.__admin);
+
+        future_into_py(py, async move {
+            let outcome = admin.create_table(&path, &descriptor, ignore).await;
+            outcome.map_err(|e| FlussError::new_err(e.to_string()))?;
+            Python::with_gil(|py| Ok(py.None()))
+        })
+    }
+
+    /// Fetch the metadata of the table at `table_path`.
+    /// Returns an awaitable resolving to a `TableInfo`; a core error is converted
+    /// with `FlussError::new_err` and prefixed with "Failed to get table".
+    pub fn get_table<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let path = table_path.to_core().clone();
+        let admin = Arc::clone(&self.__admin);
+
+        future_into_py(py, async move {
+            let fetched = admin.get_table(&path).await;
+            let info = fetched
+                .map_err(|e| FlussError::new_err(format!("Failed to get table: {}", e)))?;
+            // The Python object is allocated under the GIL once the async work is done.
+            Python::with_gil(|py| Py::new(py, TableInfo::from_core(info)))
+        })
+    }
+
+    /// Fetch the latest lake snapshot of the table at `table_path`.
+    /// Returns an awaitable resolving to a `LakeSnapshot`; a core error is converted
+    /// with `FlussError::new_err` and prefixed with "Failed to get lake snapshot".
+    pub fn get_latest_lake_snapshot<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let path = table_path.to_core().clone();
+        let admin = Arc::clone(&self.__admin);
+
+        future_into_py(py, async move {
+            let fetched = admin.get_latest_lake_snapshot(&path).await;
+            let snapshot = fetched
+                .map_err(|e| FlussError::new_err(format!("Failed to get lake snapshot: {}", e)))?;
+            // The Python object is allocated under the GIL once the async work is done.
+            Python::with_gil(|py| Py::new(py, LakeSnapshot::from_core(snapshot)))
+        })
+    }
+
+    fn __repr__(&self) -> String {
+        String::from("FlussAdmin()")
+    }
+}
+
+impl FlussAdmin {
+    // Wrap a core admin client in an `Arc` so the handle can be cloned cheaply.
+    // Rust-only: this `impl` block carries no `#[pymethods]` attribute.
+    pub fn from_core(admin: fcore::client::FlussAdmin) -> Self {
+        let __admin = Arc::new(admin);
+        Self { __admin }
+    }
+}
diff --git a/fluss-rust/bindings/python/src/connection.rs b/fluss-rust/bindings/python/src/connection.rs
new file mode 100644
index 0000000000..ba1fa50554
--- /dev/null
+++ b/fluss-rust/bindings/python/src/connection.rs
@@ -0,0 +1,117 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use pyo3::prelude::*;
+use crate::*;
+use std::sync::Arc;
+use pyo3_async_runtimes::tokio::future_into_py;
+
+/// Connection to a Fluss cluster; hands out the admin client and table handles
+#[pyclass]
+pub struct FlussConnection {
+    inner: Arc<fcore::client::FlussConnection>, // shared core connection; cloned into the futures built by get_admin/get_table
+}
+
+#[pymethods]
+impl FlussConnection {
+    /// Connect to a Fluss cluster using `config`; returns an awaitable that resolves to a `FlussConnection`
+    #[staticmethod]
+    fn connect<'py>(py: Python<'py>, config: &Config) -> PyResult<Bound<'py, PyAny>> {
+        let rust_config = config.get_core_config();
+
+        future_into_py(py, async move {
+            let connection = fcore::client::FlussConnection::new(rust_config)
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+        
+            let py_connection = FlussConnection {
+                inner: Arc::new(connection),
+            };
+
+            Python::with_gil(|py| {
+                Py::new(py, py_connection)
+            })
+        })
+    }
+    
+    /// Get the admin interface; returns an awaitable that resolves to a `FlussAdmin`
+    fn get_admin<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let client = self.inner.clone();
+
+        future_into_py(py, async move {
+            let admin = client.get_admin()
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+            let py_admin = FlussAdmin::from_core(admin);
+
+            Python::with_gil(|py| {
+                Py::new(py, py_admin)
+            })
+        })
+    }
+
+    /// Get the table at `table_path`; returns an awaitable that resolves to a `FlussTable`
+    fn get_table<'py>(&self, py: Python<'py>, table_path: &TablePath) -> PyResult<Bound<'py, PyAny>> {
+        let client = self.inner.clone();
+        let core_path = table_path.to_core().clone();
+
+        future_into_py(py, async move {
+            let core_table = client.get_table(&core_path)
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+        
+            let py_table = FlussTable::new_table(
+                client,
+                core_table.metadata,
+                core_table.table_info,
+                core_table.table_path,
+                core_table.has_primary_key,
+            );
+
+            Python::with_gil(|py| {
+                Py::new(py, py_table)
+            })
+        })
+    }
+
+    // Close the connection. NOTE(review): currently a no-op that only returns Ok(()); nothing is released here
+    fn close(&mut self) -> PyResult<()> {
+        Ok(())
+    }
+
+    // Enter the runtime context (for 'with' statement); returns the connection itself
+    fn __enter__(slf: PyRef<Self>) -> PyRef<Self> {
+        slf
+    }
+    
+    // Exit the runtime context (for 'with' statement): calls close() and returns false, so exceptions are not suppressed
+    #[pyo3(signature = (_exc_type=None, _exc_value=None, _traceback=None))]
+    fn __exit__(
+        &mut self,
+        _exc_type: Option<PyObject>,
+        _exc_value: Option<PyObject>,
+        _traceback: Option<PyObject>,
+    ) -> PyResult<bool> {
+        self.close()?;
+        Ok(false)
+    }
+
+    fn __repr__(&self) -> String {
+        "FlussConnection()".to_string()
+    }
+}
diff --git a/fluss-rust/bindings/python/src/error.rs b/fluss-rust/bindings/python/src/error.rs
new file mode 100644
index 0000000000..2db2991cfb
--- /dev/null
+++ b/fluss-rust/bindings/python/src/error.rs
@@ -0,0 +1,39 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use pyo3::prelude::*;
+
+/// Exception type raised to Python for Fluss failures; `message` is readable as an attribute
+#[pyclass(extends=pyo3::exceptions::PyException)] // full path: this file only imports `pyo3::prelude::*`, which does not bring `PyException` into scope
+#[derive(Debug, Clone)]
+pub struct FlussError {
+    #[pyo3(get)]
+    pub message: String,
+}
+
+#[pymethods]
+impl FlussError {
+    #[new] // constructor: without one, Python cannot instantiate the exception when the error from `new_err` is raised
+    fn new(message: String) -> Self { Self { message } }
+    fn __str__(&self) -> String { format!("FlussError: {}", self.message) } // text shown by `str(err)`
+}
+
+impl FlussError {
+    pub fn new_err(message: impl ToString) -> PyErr { // build a `PyErr` whose exception type is `FlussError`
+        PyErr::new::<FlussError, _>(message.to_string()) // `message` is stringified and passed as the error argument
+    }
+}
\ No newline at end of file
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
new file mode 100644
index 0000000000..0d8b7a5a80
--- /dev/null
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -0,0 +1,67 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+pub use ::fluss as fcore;
+use pyo3::prelude::*;
+use once_cell::sync::Lazy;
+use tokio::runtime::Runtime;
+
+mod config;
+mod connection;
+mod table;
+mod admin;
+mod types;
+mod error;
+mod utils;
+
+pub use config::*;
+pub use connection::*;
+pub use table::*;
+pub use admin::*;
+pub use types::*;
+pub use error::*;
+pub use utils::*;
+
+static TOKIO_RUNTIME: Lazy<Runtime> = Lazy::new(|| {
+    // Multi-threaded runtime with every driver enabled; panics if it cannot be built.
+    let mut builder = tokio::runtime::Builder::new_multi_thread();
+    let built = builder.enable_all().build();
+    built.expect("Failed to create Tokio runtime")
+});
+
+#[pymodule]
+fn fluss_python(m: &Bound<'_, PyModule>) -> PyResult<()> {
+    // Register every #[pyclass] that Python code can reach through this module
+    m.add_class::<Config>()?;
+    m.add_class::<FlussConnection>()?;
+    m.add_class::<TablePath>()?;
+    m.add_class::<TableInfo>()?;
+    m.add_class::<TableDescriptor>()?;
+    m.add_class::<FlussAdmin>()?;
+    m.add_class::<FlussTable>()?;
+    m.add_class::<AppendWriter>()?;
+    m.add_class::<Schema>()?;
+    m.add_class::<LogScanner>()?;
+    m.add_class::<LakeSnapshot>()?;
+    m.add_class::<TableBucket>()?;
+    
+    // Register exception types: the type object is added under the module attribute "FlussError"
+    // TODO: maybe implement a separate module for exceptions
+    m.add("FlussError", m.py().get_type::<FlussError>())?;
+    
+    Ok(())
+}
diff --git a/fluss-rust/bindings/python/src/utils.rs b/fluss-rust/bindings/python/src/utils.rs
new file mode 100644
index 0000000000..c40104bfc9
--- /dev/null
+++ b/fluss-rust/bindings/python/src/utils.rs
@@ -0,0 +1,178 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use pyo3::prelude::*;
+use arrow::datatypes::{Schema as ArrowSchema, SchemaRef};
+use std::sync::Arc;
+use arrow_pyarrow::ToPyArrow;
+use crate::*;
+
+/// Namespace for conversion helpers between PyArrow, Arrow, and Fluss (schemas, data types, format names, record batches)
+pub struct Utils;
+
+impl Utils {
+    /// Convert a PyArrow schema object into a shared Rust Arrow schema; a failed conversion is reported through `FlussError::new_err`
+    pub fn pyarrow_to_arrow_schema(py_schema: &PyObject) -> PyResult<SchemaRef> {
+        Python::with_gil(|py| {
+            let bound = py_schema.bind(py);
+            let converted = <ArrowSchema as arrow_pyarrow::FromPyArrow>::from_pyarrow_bound(bound);
+            converted
+                .map(Arc::new)
+                .map_err(|e| FlussError::new_err(format!("Failed to convert PyArrow schema: {}", e)))
+        })
+    }
+
+    /// Convert an Arrow DataType to the matching Fluss DataType; types with no mapping yield a `FlussError`
+    pub fn arrow_type_to_fluss_type(arrow_type: &arrow::datatypes::DataType) -> PyResult<fcore::metadata::DataType> {
+        use arrow::datatypes::DataType as ArrowDataType;
+        use fcore::metadata::DataTypes;
+
+        let fluss_type = match arrow_type {
+            ArrowDataType::Boolean => DataTypes::boolean(),
+            ArrowDataType::Int8 => DataTypes::tinyint(),
+            ArrowDataType::Int16 => DataTypes::smallint(),
+            ArrowDataType::Int32 => DataTypes::int(),
+            ArrowDataType::Int64 => DataTypes::bigint(),
+            ArrowDataType::UInt8 => DataTypes::tinyint(), // NOTE(review): all UInt* arms map to the same-named signed type; large unsigned values may not fit — confirm
+            ArrowDataType::UInt16 => DataTypes::smallint(),
+            ArrowDataType::UInt32 => DataTypes::int(),
+            ArrowDataType::UInt64 => DataTypes::bigint(),
+            ArrowDataType::Float32 => DataTypes::float(),
+            ArrowDataType::Float64 => DataTypes::double(),
+            ArrowDataType::Utf8 | ArrowDataType::LargeUtf8 => DataTypes::string(),
+            ArrowDataType::Binary | ArrowDataType::LargeBinary => DataTypes::bytes(),
+            ArrowDataType::Date32 => DataTypes::date(),
+            ArrowDataType::Date64 => DataTypes::date(),
+            ArrowDataType::Time32(_) | ArrowDataType::Time64(_) => DataTypes::time(),
+            ArrowDataType::Timestamp(_, _) => DataTypes::timestamp(),
+            ArrowDataType::Decimal128(precision, scale) if *scale >= 0 => DataTypes::decimal(*precision as u32, *scale as u32), // a negative scale would wrap in the `as u32` cast, so it falls through to the error arm
+            _ => {
+                return Err(FlussError::new_err(format!(
+                    "Unsupported Arrow data type: {:?}", arrow_type
+                )));
+            }
+        };
+
+        Ok(fluss_type)
+    }
+
+    /// Render a Fluss `DataType` as a lowercase type string such as `int`, `decimal(10,2)` or `array<string>`.
+    pub fn datatype_to_string(data_type: &fcore::metadata::DataType) -> String {
+        use fcore::metadata::DataType as FlussType;
+
+        match data_type {
+            // Types without parameters: a fixed keyword.
+            FlussType::Boolean(_) => String::from("boolean"),
+            FlussType::TinyInt(_) => String::from("tinyint"),
+            FlussType::SmallInt(_) => String::from("smallint"),
+            FlussType::Int(_) => String::from("int"),
+            FlussType::BigInt(_) => String::from("bigint"),
+            FlussType::Float(_) => String::from("float"),
+            FlussType::Double(_) => String::from("double"),
+            FlussType::String(_) => String::from("string"),
+            FlussType::Bytes(_) => String::from("bytes"),
+            FlussType::Date(_) => String::from("date"),
+            // Temporal types: precision 0 (time) or 6 (timestamps) is left unprinted.
+            FlussType::Time(t) => match t.precision() {
+                0 => String::from("time"),
+                precision => format!("time({})", precision),
+            },
+            FlussType::Timestamp(t) => match t.precision() {
+                6 => String::from("timestamp"),
+                precision => format!("timestamp({})", precision),
+            },
+            FlussType::TimestampLTz(t) => match t.precision() {
+                6 => String::from("timestamp_ltz"),
+                precision => format!("timestamp_ltz({})", precision),
+            },
+            // Parameterized types carry their length or precision/scale.
+            FlussType::Char(c) => format!("char({})", c.length()),
+            FlussType::Decimal(d) => format!("decimal({},{})", d.precision(), d.scale()),
+            FlussType::Binary(b) => format!("binary({})", b.length()),
+            // Nested types recurse into their element, key/value or field types.
+            FlussType::Array(arr) => format!("array<{}>", Self::datatype_to_string(arr.get_element_type())),
+            FlussType::Map(map) => {
+                let key = Self::datatype_to_string(map.key_type());
+                let value = Self::datatype_to_string(map.value_type());
+                format!("map<{},{}>", key, value)
+            }
+            FlussType::Row(row) => {
+                let mut fields = Vec::new();
+                for field in row.fields().iter() {
+                    fields.push(format!("{}: {}", field.name(), Self::datatype_to_string(field.data_type())));
+                }
+                format!("row<{}>", fields.join(", "))
+            }
+        }
+    }
+
+    /// Parse a log format string into a `LogFormat`; a parse failure becomes a `FlussError` that quotes the input
+    pub fn parse_log_format(format_str: &str) -> PyResult<fcore::metadata::LogFormat> {
+        fcore::metadata::LogFormat::parse(format_str)
+            .map_err(|e| FlussError::new_err(format!("Invalid log format '{}': {}", format_str, e)))
+    }
+
+    /// Parse a kv format string into a `KvFormat`; a parse failure becomes a `FlussError` that quotes the input
+    pub fn parse_kv_format(format_str: &str) -> PyResult<fcore::metadata::KvFormat> {
+        fcore::metadata::KvFormat::parse(format_str)
+            .map_err(|e| FlussError::new_err(format!("Invalid kv format '{}': {}", format_str, e)))
+    }
+
+    /// Collect the Arrow record batches referenced by the rows of `_scan_records` (one push per row whose row id is 0)
+    pub fn convert_scan_records_to_arrow(
+        _scan_records: fcore::record::ScanRecords,
+    ) -> Vec<Arc<arrow::record_batch::RecordBatch>> {
+        let mut result = Vec::new();
+        for(_, records) in _scan_records.into_records() {
+            for record in records {
+                let columnar_row = record.row();
+                let row_id = columnar_row.get_row_id();
+                if row_id == 0 { // NOTE(review): presumably row 0 is the first row of its batch, so each batch is pushed once; a batch whose row 0 is absent would be skipped — confirm
+                    let record_batch = columnar_row.get_record_batch();
+                    result.push(record_batch.clone());
+                }
+            }
+        }
+        result
+    }
+    
+    /// Combine multiple Arrow batches into a single PyArrow `Table`.
+    /// The batches are converted to PyArrow objects and passed to `pyarrow.Table.from_batches`.
+    /// Returns a `FlussError` when `batches` is empty or a batch cannot be converted.
+    pub fn combine_batches_to_table(py: Python, batches: Vec<Arc<arrow::record_batch::RecordBatch>>) -> PyResult<PyObject> {
+        // An empty input is rejected outright instead of producing an empty table.
+        if batches.is_empty() {
+            return Err(FlussError::new_err("No batches to combine"));
+        }
+
+        // Convert each Rust batch to its PyArrow counterpart, stopping at the first failure.
+        let mut py_batches: Vec<PyObject> = Vec::with_capacity(batches.len());
+        for batch in &batches {
+            let converted = batch.as_ref().to_pyarrow(py).map_err(|e| {
+                FlussError::new_err(format!("Failed to convert RecordBatch to PyObject: {}", e))
+            })?;
+            py_batches.push(converted);
+        }
+
+        // Hand the converted batches to `pyarrow.Table.from_batches`.
+        let pyarrow = py.import("pyarrow")?;
+        let table_class = pyarrow.getattr("Table")?;
+        let table = table_class.call_method1("from_batches", (py_batches,))?;
+
+        Ok(table.into())
+    }
+}

From 1d937bbe868719faf49efcf8486a4974223d85ec Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Wed, 15 Oct 2025 18:02:18 +0800
Subject: [PATCH 010/287] [chore] Introduce IT infra and add IT for database
 operations in admin (#28)

---
 fluss-rust/.github/workflows/ci.yml           |   6 +-
 fluss-rust/crates/fluss/Cargo.toml            |   4 +
 fluss-rust/crates/fluss/src/client/admin.rs   |   5 +-
 .../crates/fluss/src/metadata/database.rs     |  19 +-
 fluss-rust/crates/fluss/src/metadata/table.rs |   4 +-
 .../crates/fluss/tests/integration/admin.rs   | 131 ++++++++++++
 .../fluss/tests/integration/client/mod.rs     |  21 --
 .../fluss/tests/integration/fluss_cluster.rs  | 192 ++++++++++++++++++
 fluss-rust/crates/fluss/tests/test_fluss.rs   |   4 +-
 9 files changed, 347 insertions(+), 39 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/tests/integration/admin.rs
 delete mode 100644 fluss-rust/crates/fluss/tests/integration/client/mod.rs
 create mode 100644 fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs

diff --git a/fluss-rust/.github/workflows/ci.yml b/fluss-rust/.github/workflows/ci.yml
index 26616292b5..73e2b3f172 100644
--- a/fluss-rust/.github/workflows/ci.yml
+++ b/fluss-rust/.github/workflows/ci.yml
@@ -88,7 +88,11 @@ jobs:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
       - name: Integration Test
-        run: cargo test --features integration_tests --all-targets --workspace
+        # only run IT in linux since no docker in macos by default
+        run: |
+          if [ "$RUNNER_OS" == "Linux" ]; then
+            cargo test --features integration_tests --all-targets --workspace
+          fi
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index cc26014a46..a728bd74f8 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -46,6 +46,10 @@ parse-display = "0.10"
 ref-cast = "1.0"
 chrono = { version = "0.4", features = ["clock", "std", "wasmbind"] }
 
+[dev-dependencies]
+testcontainers = "0.25.0"
+once_cell = "1.19"
+test-env-helpers = "0.2.2"
 
 [features]
 integration_tests = []
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 2584034a69..fd0f316374 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -150,7 +150,7 @@ impl FlussAdmin {
         database_name: &str,
         ignore_if_not_exists: bool,
         cascade: bool,
-    ) -> Result<()> {
+    ) {
         let _response = self
             .admin_gateway
             .request(DropDatabaseRequest::new(
@@ -158,8 +158,7 @@ impl FlussAdmin {
                 ignore_if_not_exists,
                 cascade,
             ))
-            .await?;
-        Ok(())
+            .await;
     }
 
     /// List all databases
diff --git a/fluss-rust/crates/fluss/src/metadata/database.rs b/fluss-rust/crates/fluss/src/metadata/database.rs
index 2649421d6f..8eaa4d3eb0 100644
--- a/fluss-rust/crates/fluss/src/metadata/database.rs
+++ b/fluss-rust/crates/fluss/src/metadata/database.rs
@@ -22,7 +22,7 @@ use serde::{Deserialize, Serialize};
 use serde_json::{Value, json};
 use std::collections::HashMap;
 
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
 pub struct DatabaseDescriptor {
     comment: Option<String>,
     custom_properties: HashMap<String, String>,
@@ -105,11 +105,11 @@ impl DatabaseDescriptorBuilder {
         self
     }
 
-    pub fn build(self) -> Result<DatabaseDescriptor> {
-        Ok(DatabaseDescriptor {
+    pub fn build(self) -> DatabaseDescriptor {
+        DatabaseDescriptor {
             comment: self.comment,
             custom_properties: self.custom_properties,
-        })
+        }
     }
 }
 
@@ -179,7 +179,7 @@ impl JsonSerde for DatabaseDescriptor {
         };
         builder = builder.custom_properties(custom_properties);
 
-        builder.build()
+        Ok(builder.build())
     }
 }
 
@@ -187,7 +187,7 @@ impl DatabaseDescriptor {
     /// Create DatabaseDescriptor from JSON bytes (equivalent to Java's fromJsonBytes)
     pub fn from_json_bytes(bytes: &[u8]) -> Result<Self> {
         let json_value: Value = serde_json::from_slice(bytes)
-            .map_err(|e| JsonSerdeError(format!("Failed to parse JSON: {}", e)))?;
+            .map_err(|e| JsonSerdeError(format!("Failed to parse JSON: {e}")))?;
         Self::deserialize_json(&json_value)
     }
 
@@ -195,7 +195,7 @@ impl DatabaseDescriptor {
     pub fn to_json_bytes(&self) -> Result<Vec<u8>> {
         let json_value = self.serialize_json()?;
         serde_json::to_vec(&json_value)
-            .map_err(|e| JsonSerdeError(format!("Failed to serialize to JSON: {}", e)))
+            .map_err(|e| JsonSerdeError(format!("Failed to serialize to JSON: {e}")))
     }
 }
 
@@ -212,8 +212,7 @@ mod tests {
         let descriptor = DatabaseDescriptor::builder()
             .comment("Test database")
             .custom_properties(custom_props)
-            .build()
-            .unwrap();
+            .build();
 
         // Test serialization
         let json_bytes = descriptor.to_json_bytes().unwrap();
@@ -226,7 +225,7 @@ mod tests {
 
     #[test]
     fn test_empty_database_descriptor() {
-        let descriptor = DatabaseDescriptor::builder().build().unwrap();
+        let descriptor = DatabaseDescriptor::builder().build();
         let json_bytes = descriptor.to_json_bytes().unwrap();
         let deserialized = DatabaseDescriptor::from_json_bytes(&json_bytes).unwrap();
         assert_eq!(descriptor, deserialized);
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 90e3573eb8..2b48ec60db 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -589,7 +589,7 @@ impl LogFormat {
         match s.to_uppercase().as_str() {
             "ARROW" => Ok(LogFormat::ARROW),
             "INDEXED" => Ok(LogFormat::INDEXED),
-            _ => Err(InvalidTableError(format!("Unknown log format: {}", s))),
+            _ => Err(InvalidTableError(format!("Unknown log format: {s}"))),
         }
     }
 }
@@ -615,7 +615,7 @@ impl KvFormat {
         match s.to_uppercase().as_str() {
             "INDEXED" => Ok(KvFormat::INDEXED),
             "COMPACTED" => Ok(KvFormat::COMPACTED),
-            _ => Err(InvalidTableError(format!("Unknown kv format: {}", s))),
+            _ => Err(InvalidTableError(format!("Unknown kv format: {s}"))),
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
new file mode 100644
index 0000000000..73f52db936
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -0,0 +1,131 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::integration::fluss_cluster::FlussTestingCluster;
+use once_cell::sync::Lazy;
+use parking_lot::RwLock;
+use std::sync::Arc;
+
+#[cfg(test)]
+use test_env_helpers::*;
+
+// Module-level shared cluster instance (only for this test file)
+static SHARED_FLUSS_CLUSTER: Lazy<Arc<RwLock<Option<FlussTestingCluster>>>> =
+    Lazy::new(|| Arc::new(RwLock::new(None)));
+
+#[cfg(test)]
+#[before_all]
+#[after_all]
+mod admin_test {
+    use super::SHARED_FLUSS_CLUSTER;
+    use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
+    use fluss::metadata::DatabaseDescriptorBuilder;
+    use std::sync::Arc;
+
+    fn before_all() {
+        // Create a new tokio runtime in a separate thread
+        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
+        std::thread::spawn(move || {
+            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
+            rt.block_on(async {
+                let cluster = FlussTestingClusterBuilder::new().build().await;
+                let mut guard = cluster_guard.write();
+                *guard = Some(cluster);
+            });
+        })
+        .join()
+        .expect("Failed to create cluster");
+    }
+
+    fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
+        let cluster_guard = SHARED_FLUSS_CLUSTER.read();
+        if cluster_guard.is_none() {
+            panic!("Fluss cluster not initialized. Make sure before_all() was called.");
+        }
+        Arc::new(cluster_guard.as_ref().unwrap().clone())
+    }
+
+    fn after_all() {
+        // Create a new tokio runtime in a separate thread
+        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
+        std::thread::spawn(move || {
+            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
+            rt.block_on(async {
+                let mut guard = cluster_guard.write();
+                if let Some(cluster) = guard.take() {
+                    cluster.stop().await;
+                }
+            });
+        })
+        .join()
+        .expect("Failed to cleanup cluster");
+    }
+
+    #[tokio::test]
+    async fn test_create_database() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("should get admin");
+
+        let db_descriptor = DatabaseDescriptorBuilder::default()
+            .comment("test_db")
+            .custom_properties(
+                [
+                    ("k1".to_string(), "v1".to_string()),
+                    ("k2".to_string(), "v2".to_string()),
+                ]
+                .into(),
+            )
+            .build();
+
+        let db_name = "test_create_database";
+
+        assert_eq!(admin.database_exists(db_name).await.unwrap(), false);
+
+        // create database
+        admin
+            .create_database(db_name, false, Some(&db_descriptor))
+            .await
+            .expect("should create database");
+
+        // database should exist
+        assert_eq!(admin.database_exists(db_name).await.unwrap(), true);
+
+        // get database
+        let db_info = admin
+            .get_database_info(db_name)
+            .await
+            .expect("should get database info");
+
+        assert_eq!(db_info.database_name(), db_name);
+        assert_eq!(db_info.database_descriptor(), &db_descriptor);
+
+        // drop database
+        admin.drop_database(db_name, false, true).await;
+
+        // database shouldn't exist now
+        assert_eq!(admin.database_exists(db_name).await.unwrap(), false);
+
+        // Note: We don't stop the shared cluster here as it's used by other tests
+    }
+
+    #[tokio::test]
+    async fn test_create_table() {
+        // todo
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/integration/client/mod.rs b/fluss-rust/crates/fluss/tests/integration/client/mod.rs
deleted file mode 100644
index 567c358cea..0000000000
--- a/fluss-rust/crates/fluss/tests/integration/client/mod.rs
+++ /dev/null
@@ -1,21 +0,0 @@
-// Licensed to the Apache Software Foundation (ASF) under one
-// or more contributor license agreements.  See the NOTICE file
-// distributed with this work for additional information
-// regarding copyright ownership.  The ASF licenses this file
-// to you under the Apache License, Version 2.0 (the
-// "License"); you may not use this file except in compliance
-// with the License.  You may obtain a copy of the License at
-//
-//   http://www.apache.org/licenses/LICENSE-2.0
-//
-// Unless required by applicable law or agreed to in writing,
-// software distributed under the License is distributed on an
-// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-// KIND, either express or implied.  See the License for the
-// specific language governing permissions and limitations
-// under the License.
-
-#[test]
-fn test() {
-    println!("Running integration tests");
-}
diff --git a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
new file mode 100644
index 0000000000..83a47956ae
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
@@ -0,0 +1,192 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+use std::collections::HashMap;
+use std::string::ToString;
+use std::sync::Arc;
+use std::time::Duration;
+use testcontainers::core::ContainerPort;
+use testcontainers::runners::AsyncRunner;
+use testcontainers::{ContainerAsync, GenericImage, ImageExt};
+
+const FLUSS_VERSION: &str = "0.7.0";
+
+pub struct FlussTestingClusterBuilder {
+    number_of_tablet_servers: usize,
+    network: &'static str,
+    cluster_conf: HashMap<String, String>,
+}
+
+impl FlussTestingClusterBuilder {
+    pub fn new() -> Self {
+        // reduce testing resources
+        let mut cluster_conf = HashMap::new();
+        cluster_conf.insert(
+            "netty.server.num-network-threads".to_string(),
+            "1".to_string(),
+        );
+        cluster_conf.insert(
+            "netty.server.num-worker-threads".to_string(),
+            "3".to_string(),
+        );
+
+        FlussTestingClusterBuilder {
+            number_of_tablet_servers: 1,
+            cluster_conf,
+            network: "fluss-cluster-network",
+        }
+    }
+
+    pub async fn build(&mut self) -> FlussTestingCluster {
+        let zookeeper = Arc::new(
+            GenericImage::new("zookeeper", "3.9.2")
+                .with_network(self.network)
+                .with_container_name("zookeeper")
+                .start()
+                .await
+                .unwrap(),
+        );
+
+        let coordinator_server = Arc::new(self.start_coordinator_server().await);
+
+        let mut tablet_servers = HashMap::new();
+        for server_id in 0..self.number_of_tablet_servers {
+            tablet_servers.insert(
+                server_id,
+                Arc::new(self.start_tablet_server(server_id).await),
+            );
+        }
+
+        FlussTestingCluster {
+            zookeeper,
+            coordinator_server,
+            tablet_servers,
+            bootstrap_servers: "127.0.0.1:9123".to_string(),
+        }
+    }
+
+    async fn start_coordinator_server(&mut self) -> ContainerAsync<GenericImage> {
+        let mut coordinator_confs = HashMap::new();
+        coordinator_confs.insert("zookeeper.address", "zookeeper:2181");
+        coordinator_confs.insert(
+            "bind.listeners",
+            "INTERNAL://coordinator-server:0, CLIENT://coordinator-server:9123",
+        );
+        coordinator_confs.insert("advertised.listeners", "CLIENT://localhost:9123");
+        coordinator_confs.insert("internal.listener.name", "INTERNAL");
+        GenericImage::new("fluss/fluss", FLUSS_VERSION)
+            .with_container_name("coordinator-server")
+            .with_mapped_port(9123, ContainerPort::Tcp(9123))
+            .with_network(self.network)
+            .with_cmd(vec!["coordinatorServer"])
+            .with_env_var(
+                "FLUSS_PROPERTIES",
+                self.to_fluss_properties_with(coordinator_confs),
+            )
+            .start()
+            .await
+            .unwrap()
+    }
+
+    async fn start_tablet_server(&self, server_id: usize) -> ContainerAsync<GenericImage> {
+        let mut tablet_server_confs = HashMap::new();
+        let bind_listeners = format!(
+            "INTERNAL://tablet-server-{}:0, CLIENT://tablet-server-{}:9123",
+            server_id, server_id
+        );
+        let expose_host_port = 9124 + server_id;
+        let advertised_listeners = format!("CLIENT://localhost:{}", expose_host_port);
+        let tablet_server_id = format!("{}", server_id);
+        tablet_server_confs.insert("zookeeper.address", "zookeeper:2181");
+        tablet_server_confs.insert("bind.listeners", bind_listeners.as_str());
+        tablet_server_confs.insert("advertised.listeners", advertised_listeners.as_str());
+        tablet_server_confs.insert("internal.listener.name", "INTERNAL");
+        tablet_server_confs.insert("tablet-server.id", tablet_server_id.as_str());
+
+        GenericImage::new("fluss/fluss", FLUSS_VERSION)
+            .with_cmd(vec!["tabletServer"])
+            .with_mapped_port(expose_host_port as u16, ContainerPort::Tcp(9123))
+            .with_network(self.network)
+            .with_container_name(format!("tablet-server-{}", server_id))
+            .with_env_var(
+                "FLUSS_PROPERTIES",
+                self.to_fluss_properties_with(tablet_server_confs),
+            )
+            .start()
+            .await
+            .unwrap()
+    }
+
+    fn to_fluss_properties_with(&self, extra_properties: HashMap<&str, &str>) -> String {
+        let mut fluss_properties = Vec::new();
+        for (k, v) in self.cluster_conf.iter() {
+            fluss_properties.push(format!("{}: {}", k, v));
+        }
+        for (k, v) in extra_properties.iter() {
+            fluss_properties.push(format!("{}: {}", k, v));
+        }
+        fluss_properties.join("\n")
+    }
+}
+
+/// Provides an easy way to launch a Fluss cluster with coordinator and tablet servers.
+#[derive(Clone)]
+pub struct FlussTestingCluster {
+    zookeeper: Arc<ContainerAsync<GenericImage>>,
+    coordinator_server: Arc<ContainerAsync<GenericImage>>,
+    tablet_servers: HashMap<usize, Arc<ContainerAsync<GenericImage>>>,
+    bootstrap_servers: String,
+}
+
+impl FlussTestingCluster {
+    pub async fn stop(&self) {
+        for tablet_server in self.tablet_servers.values() {
+            tablet_server.stop().await.unwrap()
+        }
+        self.coordinator_server.stop().await.unwrap();
+        self.zookeeper.stop().await.unwrap();
+    }
+
+    pub async fn get_fluss_connection(&self) -> FlussConnection {
+        let mut config = Config::default();
+        config.bootstrap_server = Some(self.bootstrap_servers.clone());
+
+        // Retry mechanism: retry for up to 1 minute
+        let max_retries = 60; // 60 retry attempts
+        let retry_interval = Duration::from_secs(1); // 1 second interval between retries
+
+        for attempt in 1..=max_retries {
+            match FlussConnection::new(config.clone()).await {
+                Ok(connection) => {
+                    return connection;
+                }
+                Err(e) => {
+                    if attempt == max_retries {
+                        panic!(
+                            "Failed to connect to Fluss cluster after {} attempts: {}",
+                            max_retries, e
+                        );
+                    }
+                    tokio::time::sleep(retry_interval).await;
+                }
+            }
+        }
+        unreachable!()
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/test_fluss.rs b/fluss-rust/crates/fluss/tests/test_fluss.rs
index 7840638c74..28b9bef7d9 100644
--- a/fluss-rust/crates/fluss/tests/test_fluss.rs
+++ b/fluss-rust/crates/fluss/tests/test_fluss.rs
@@ -20,6 +20,6 @@ extern crate fluss;
 
 #[cfg(feature = "integration_tests")]
 mod integration {
-
-    mod client;
+    mod admin;
+    mod fluss_cluster;
 }

From 9533ce2e7445e3e6ea5dd0de87f9e2b58c020dc3 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Thu, 16 Oct 2025 14:17:30 +0800
Subject: [PATCH 011/287] [chore] Supports PyO3 in m1 arm 64 (#33)

---
 fluss-rust/.cargo/config.toml | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)
 create mode 100644 fluss-rust/.cargo/config.toml

diff --git a/fluss-rust/.cargo/config.toml b/fluss-rust/.cargo/config.toml
new file mode 100644
index 0000000000..57efc7ff75
--- /dev/null
+++ b/fluss-rust/.cargo/config.toml
@@ -0,0 +1,22 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[target.aarch64-apple-darwin]
+rustflags = [
+    "-C", "link-arg=-undefined",
+    "-C", "link-arg=dynamic_lookup",
+]
\ No newline at end of file

From a2cc54dd43503588ec6071d1e05f90406854dc0e Mon Sep 17 00:00:00 2001
From: naivedogger <59598718+naivedogger@users.noreply.github.com>
Date: Thu, 16 Oct 2025 19:32:50 +0800
Subject: [PATCH 012/287] [feat] Create Python bindings for table writing and
 reading (#9)

---------

Co-authored-by: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
---
 fluss-rust/Cargo.toml                         |   6 +-
 fluss-rust/bindings/python/Cargo.toml         |   3 +-
 fluss-rust/bindings/python/fluss/__init__.py  |   2 +-
 fluss-rust/bindings/python/pyproject.toml     |   2 +-
 fluss-rust/bindings/python/src/admin.rs       |  26 +-
 fluss-rust/bindings/python/src/config.rs      |  33 +-
 fluss-rust/bindings/python/src/connection.rs  |  45 +-
 fluss-rust/bindings/python/src/error.rs       |   8 +-
 fluss-rust/bindings/python/src/lib.rs         |  23 +-
 fluss-rust/bindings/python/src/metadata.rs    | 119 +++--
 fluss-rust/bindings/python/src/table.rs       | 412 ++++++++++++++++++
 fluss-rust/bindings/python/src/utils.rs       | 105 +++--
 fluss-rust/crates/fluss/Cargo.toml            |   7 +-
 .../crates/fluss/src/client/table/mod.rs      |  20 +-
 .../crates/fluss/src/client/table/scanner.rs  | 103 ++++-
 .../crates/fluss/src/proto/fluss_api.proto    |  20 +
 fluss-rust/crates/fluss/src/record/mod.rs     |   5 +
 fluss-rust/crates/fluss/src/row/column.rs     |   9 +
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |   3 +
 .../fluss/src/rpc/message/list_offsets.rs     | 124 ++++++
 .../crates/fluss/src/rpc/message/mod.rs       |   2 +
 21 files changed, 909 insertions(+), 168 deletions(-)
 create mode 100644 fluss-rust/bindings/python/src/table.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 059236fccf..54436ac17d 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -28,9 +28,11 @@ rust-version = "1.85"
 
 [workspace]
 resolver = "2"
-members = ["crates/fluss", "crates/examples"]
+members = ["crates/fluss", "crates/examples", "bindings/python"]
 
 [workspace.dependencies]
 fluss = { version = "0.1.0", path = "./crates/fluss" }
 tokio = { version = "1.44.2", features = ["full"] }
-clap = { version = "4.5.37", features = ["derive"] }
\ No newline at end of file
+clap = { version = "4.5.37", features = ["derive"] }
+arrow = "55.1.0"
+chrono = { version = "0.4", features = ["clock", "std", "wasmbind"] }
diff --git a/fluss-rust/bindings/python/Cargo.toml b/fluss-rust/bindings/python/Cargo.toml
index aee1a21314..04826fb289 100644
--- a/fluss-rust/bindings/python/Cargo.toml
+++ b/fluss-rust/bindings/python/Cargo.toml
@@ -26,8 +26,6 @@ rust-version = "1.85"
 name = "fluss"
 crate-type = ["cdylib"]
 
-[workspace]
-
 [dependencies]
 pyo3 = { version = "0.24", features = ["extension-module"] }
 fluss = { path = "../../crates/fluss" }
@@ -36,3 +34,4 @@ arrow = { workspace = true }
 arrow-pyarrow = "55.1.0"
 pyo3-async-runtimes = { version = "0.24.0", features = ["tokio-runtime"] }
 chrono = { workspace = true }
+once_cell = "1.21.3"
diff --git a/fluss-rust/bindings/python/fluss/__init__.py b/fluss-rust/bindings/python/fluss/__init__.py
index cceee102ad..098014adc6 100644
--- a/fluss-rust/bindings/python/fluss/__init__.py
+++ b/fluss-rust/bindings/python/fluss/__init__.py
@@ -15,6 +15,6 @@
 # specific language governing permissions and limitations
 # under the License.
 
-from .fluss_python import *
+from ._fluss import *
 
 __version__ = "0.1.0"
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index fe9d58878d..e28b3d2474 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -57,7 +57,7 @@ docs = [
 ]
 
 [tool.maturin]
-python-source = "python"
+python-source = "."
 module-name = "fluss._fluss"
 features = ["pyo3/extension-module"]
 
diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
index 7ec6eee93b..73b2dd3af0 100644
--- a/fluss-rust/bindings/python/src/admin.rs
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -15,9 +15,8 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use pyo3::prelude::*;
-use pyo3_async_runtimes::tokio::future_into_py;
 use crate::*;
+use pyo3_async_runtimes::tokio::future_into_py;
 use std::sync::Arc;
 
 /// Administrative client for managing Fluss tables
@@ -38,16 +37,17 @@ impl FlussAdmin {
         ignore_if_exists: Option<bool>,
     ) -> PyResult<Bound<'py, PyAny>> {
         let ignore = ignore_if_exists.unwrap_or(false);
-        
+
         let core_table_path = table_path.to_core().clone();
         let core_descriptor = table_descriptor.to_core().clone();
         let admin = self.__admin.clone();
 
         future_into_py(py, async move {
-            admin.create_table(&core_table_path, &core_descriptor, ignore)
+            admin
+                .create_table(&core_table_path, &core_descriptor, ignore)
                 .await
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
-        
+
             Python::with_gil(|py| Ok(py.None()))
         })
     }
@@ -60,10 +60,12 @@ impl FlussAdmin {
     ) -> PyResult<Bound<'py, PyAny>> {
         let core_table_path = table_path.to_core().clone();
         let admin = self.__admin.clone();
-        
+
         future_into_py(py, async move {
-            let core_table_info = admin.get_table(&core_table_path).await
-                .map_err(|e| FlussError::new_err(format!("Failed to get table: {}", e)))?;
+            let core_table_info = admin
+                .get_table(&core_table_path)
+                .await
+                .map_err(|e| FlussError::new_err(format!("Failed to get table: {e}")))?;
 
             Python::with_gil(|py| {
                 let table_info = TableInfo::from_core(core_table_info);
@@ -80,10 +82,12 @@ impl FlussAdmin {
     ) -> PyResult<Bound<'py, PyAny>> {
         let core_table_path = table_path.to_core().clone();
         let admin = self.__admin.clone();
-        
+
         future_into_py(py, async move {
-            let core_lake_snapshot = admin.get_latest_lake_snapshot(&core_table_path).await
-                .map_err(|e| FlussError::new_err(format!("Failed to get lake snapshot: {}", e)))?;
+            let core_lake_snapshot = admin
+                .get_latest_lake_snapshot(&core_table_path)
+                .await
+                .map_err(|e| FlussError::new_err(format!("Failed to get lake snapshot: {e}")))?;
 
             Python::with_gil(|py| {
                 let lake_snapshot = LakeSnapshot::from_core(core_lake_snapshot);
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index 08b20b4d40..70bd9cd770 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -15,9 +15,8 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use pyo3::prelude::*;
-use pyo3::types::PyDict;
 use crate::*;
+use pyo3::types::PyDict;
 
 /// Configuration for Fluss client
 #[pyclass]
@@ -33,7 +32,7 @@ impl Config {
     #[pyo3(signature = (properties = None))]
     fn new(properties: Option<&Bound<'_, PyDict>>) -> PyResult<Self> {
         let mut config = fcore::config::Config::default();
-        
+
         if let Some(props) = properties {
             for item in props.iter() {
                 let key: String = item.0.extract()?;
@@ -42,67 +41,65 @@ impl Config {
                 match key.as_str() {
                     "bootstrap.servers" => {
                         config.bootstrap_server = Some(value);
-                    },
+                    }
                     "request.max.size" => {
                         if let Ok(size) = value.parse::<i32>() {
                             config.request_max_size = size;
                         }
-                    },
+                    }
                     "writer.acks" => {
                         config.writer_acks = value;
-                    },
+                    }
                     "writer.retries" => {
                         if let Ok(retries) = value.parse::<i32>() {
                             config.writer_retries = retries;
                         }
-                    },
+                    }
                     "writer.batch.size" => {
                         if let Ok(size) = value.parse::<i32>() {
                             config.writer_batch_size = size;
                         }
-                    },
+                    }
                     _ => {
-                        return Err(FlussError::new_err(format!("Unknown property: {}", key)));
+                        return Err(FlussError::new_err(format!("Unknown property: {key}")));
                     }
                 }
             }
         }
 
-        Ok(Self {
-            inner: config,
-        })
+        Ok(Self { inner: config })
     }
-    
+
     /// Get the bootstrap server
     #[getter]
     fn bootstrap_server(&self) -> Option<String> {
         self.inner.bootstrap_server.clone()
     }
-    
+
     /// Set the bootstrap server
     #[setter]
     fn set_bootstrap_server(&mut self, server: String) {
         self.inner.bootstrap_server = Some(server);
     }
-    
+
     /// Get the request max size
     #[getter]
     fn request_max_size(&self) -> i32 {
         self.inner.request_max_size
     }
-    
+
     /// Set the request max size
     #[setter]
     fn set_request_max_size(&mut self, size: i32) {
         self.inner.request_max_size = size;
     }
-    
+
     /// Get the writer batch size
     #[getter]
     fn writer_batch_size(&self) -> i32 {
         self.inner.writer_batch_size
     }
-    
+
     /// Set the writer batch size
     #[setter]
     fn set_writer_batch_size(&mut self, size: i32) {
diff --git a/fluss-rust/bindings/python/src/connection.rs b/fluss-rust/bindings/python/src/connection.rs
index ba1fa50554..aeb8410ddf 100644
--- a/fluss-rust/bindings/python/src/connection.rs
+++ b/fluss-rust/bindings/python/src/connection.rs
@@ -15,10 +15,9 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use pyo3::prelude::*;
 use crate::*;
-use std::sync::Arc;
 use pyo3_async_runtimes::tokio::future_into_py;
+use std::sync::Arc;
 
 /// Connection to a Fluss cluster
 #[pyclass]
@@ -37,55 +36,55 @@ impl FlussConnection {
             let connection = fcore::client::FlussConnection::new(rust_config)
                 .await
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
-        
+
             let py_connection = FlussConnection {
                 inner: Arc::new(connection),
             };
 
-            Python::with_gil(|py| {
-                Py::new(py, py_connection)
-            })
+            Python::with_gil(|py| Py::new(py, py_connection))
         })
     }
-    
+
     /// Get admin interface
     fn get_admin<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
         let client = self.inner.clone();
 
         future_into_py(py, async move {
-            let admin = client.get_admin()
+            let admin = client
+                .get_admin()
                 .await
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
 
             let py_admin = FlussAdmin::from_core(admin);
 
-            Python::with_gil(|py| {
-                Py::new(py, py_admin)
-            })
+            Python::with_gil(|py| Py::new(py, py_admin))
         })
     }
 
     /// Get a table
-    fn get_table<'py>(&self, py: Python<'py>, table_path: &TablePath) -> PyResult<Bound<'py, PyAny>> {
+    fn get_table<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+    ) -> PyResult<Bound<'py, PyAny>> {
         let client = self.inner.clone();
         let core_path = table_path.to_core().clone();
 
         future_into_py(py, async move {
-            let core_table = client.get_table(&core_path)
+            let core_table = client
+                .get_table(&core_path)
                 .await
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
-        
+
             let py_table = FlussTable::new_table(
-                client,
-                core_table.metadata,
-                core_table.table_info,
-                core_table.table_path,
-                core_table.has_primary_key,
+                client.clone(),
+                core_table.metadata().clone(),
+                core_table.table_info().clone(),
+                core_table.table_path().clone(),
+                core_table.has_primary_key(),
             );
 
-            Python::with_gil(|py| {
-                Py::new(py, py_table)
-            })
+            Python::with_gil(|py| Py::new(py, py_table))
         })
     }
 
@@ -98,7 +97,7 @@ impl FlussConnection {
     fn __enter__(slf: PyRef<Self>) -> PyRef<Self> {
         slf
     }
-    
+
     // Exit the runtime context (for 'with' statement)
     #[pyo3(signature = (_exc_type=None, _exc_value=None, _traceback=None))]
     fn __exit__(
diff --git a/fluss-rust/bindings/python/src/error.rs b/fluss-rust/bindings/python/src/error.rs
index 2db2991cfb..35d9d9149f 100644
--- a/fluss-rust/bindings/python/src/error.rs
+++ b/fluss-rust/bindings/python/src/error.rs
@@ -15,6 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use pyo3::exceptions::PyException;
 use pyo3::prelude::*;
 
 /// Fluss errors
@@ -27,6 +28,11 @@ pub struct FlussError {
 
 #[pymethods]
 impl FlussError {
+    #[new]
+    fn new(message: String) -> Self {
+        Self { message }
+    }
+
     fn __str__(&self) -> String {
         format!("FlussError: {}", self.message)
     }
@@ -36,4 +42,4 @@ impl FlussError {
     pub fn new_err(message: impl ToString) -> PyErr {
         PyErr::new::<FlussError, _>(message.to_string())
     }
-}
\ No newline at end of file
+}
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 0d8b7a5a80..63e84b1f86 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -16,24 +16,24 @@
 // under the License.
 
 pub use ::fluss as fcore;
-use pyo3::prelude::*;
 use once_cell::sync::Lazy;
+use pyo3::prelude::*;
 use tokio::runtime::Runtime;
 
+mod admin;
 mod config;
 mod connection;
-mod table;
-mod admin;
-mod types;
 mod error;
+mod metadata;
+mod table;
 mod utils;
 
+pub use admin::*;
 pub use config::*;
 pub use connection::*;
-pub use table::*;
-pub use admin::*;
-pub use types::*;
 pub use error::*;
+pub use metadata::*;
+pub use table::*;
 pub use utils::*;
 
 static TOKIO_RUNTIME: Lazy<Runtime> = Lazy::new(|| {
@@ -44,7 +44,7 @@ static TOKIO_RUNTIME: Lazy<Runtime> = Lazy::new(|| {
 });
 
 #[pymodule]
-fn fluss_python(m: &Bound<'_, PyModule>) -> PyResult<()> {
+fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     // Register all classes
     m.add_class::<Config>()?;
     m.add_class::<FlussConnection>()?;
@@ -58,10 +58,9 @@ fn fluss_python(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<LogScanner>()?;
     m.add_class::<LakeSnapshot>()?;
     m.add_class::<TableBucket>()?;
-    
+
     // Register exception types
-    // TODO: maybe implement a separate module for exceptions
-    m.add("FlussError", m.py().get_type::<FlussError>())?;
-    
+    m.add_class::<FlussError>()?;
+
     Ok(())
 }
diff --git a/fluss-rust/bindings/python/src/metadata.rs b/fluss-rust/bindings/python/src/metadata.rs
index 238dde2ec0..66748ab316 100644
--- a/fluss-rust/bindings/python/src/metadata.rs
+++ b/fluss-rust/bindings/python/src/metadata.rs
@@ -15,7 +15,6 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use pyo3::prelude::*;
 use crate::*;
 use pyo3::types::PyDict;
 use std::collections::HashMap;
@@ -38,13 +37,13 @@ impl TablePath {
             table_name,
         }
     }
-    
+
     /// Get the database name
     #[getter]
     pub fn database_name(&self) -> String {
         self.database_name.clone()
     }
-    
+
     /// Get the table name  
     #[getter]
     pub fn table_name(&self) -> String {
@@ -59,7 +58,7 @@ impl TablePath {
     pub fn __str__(&self) -> String {
         self.table_path_str()
     }
-    
+
     fn __repr__(&self) -> String {
         format!("TablePath('{}', '{}')", self.database_name, self.table_name)
     }
@@ -68,7 +67,7 @@ impl TablePath {
     pub fn __hash__(&self) -> u64 {
         use std::collections::hash_map::DefaultHasher;
         use std::hash::{Hash, Hasher};
-        
+
         let mut hasher = DefaultHasher::new();
         self.database_name.hash(&mut hasher);
         self.table_name.hash(&mut hasher);
@@ -77,8 +76,7 @@ impl TablePath {
 
     /// Equality implementation for Python
     pub fn __eq__(&self, other: &TablePath) -> bool {
-        self.database_name == other.database_name 
-            && self.table_name == other.table_name
+        self.database_name == other.database_name && self.table_name == other.table_name
     }
 }
 
@@ -112,27 +110,28 @@ impl Schema {
         primary_keys: Option<Vec<String>>,
     ) -> PyResult<Self> {
         let arrow_schema = crate::utils::Utils::pyarrow_to_arrow_schema(&schema)?;
-        
+
         let mut builder = fcore::metadata::Schema::builder();
-        
+
         for field in arrow_schema.fields() {
             let fluss_data_type = crate::utils::Utils::arrow_type_to_fluss_type(field.data_type())?;
             builder = builder.column(field.name(), fluss_data_type);
-            
+
             if let Some(comment) = field.metadata().get("comment") {
                 builder = builder.with_comment(comment);
             }
         }
-        
+
         if let Some(pk_columns) = primary_keys {
             if !pk_columns.is_empty() {
                 builder = builder.primary_key(pk_columns);
             }
         }
-        
-        let fluss_schema = builder.build()
-            .map_err(|e| FlussError::new_err(format!("Failed to build schema: {}", e)))?;
-        
+
+        let fluss_schema = builder
+            .build()
+            .map_err(|e| FlussError::new_err(format!("Failed to build schema: {e}")))?;
+
         Ok(Self {
             __schema: fluss_schema,
         })
@@ -140,20 +139,33 @@ impl Schema {
 
     /// Get column names
     fn get_column_names(&self) -> Vec<String> {
-        self.__schema.columns().iter().map(|col| col.name().to_string()).collect()
+        self.__schema
+            .columns()
+            .iter()
+            .map(|col| col.name().to_string())
+            .collect()
     }
 
     /// Get column types
     fn get_column_types(&self) -> Vec<String> {
-        self.__schema.columns().iter()
+        self.__schema
+            .columns()
+            .iter()
             .map(|col| Utils::datatype_to_string(col.data_type()))
             .collect()
     }
 
     /// Get columns as (name, type) pairs
     fn get_columns(&self) -> Vec<(String, String)> {
-        self.__schema.columns().iter()
-            .map(|col| (col.name().to_string(), Utils::datatype_to_string(col.data_type())))
+        self.__schema
+            .columns()
+            .iter()
+            .map(|col| {
+                (
+                    col.name().to_string(),
+                    Utils::datatype_to_string(col.data_type()),
+                )
+            })
             .collect()
     }
 
@@ -190,7 +202,6 @@ impl TableDistribution {
     }
 }
 
-
 /// Table descriptor containing schema and metadata
 #[pyclass]
 #[derive(Clone)]
@@ -204,7 +215,7 @@ impl TableDescriptor {
     #[new]
     #[pyo3(signature = (schema, **kwargs))]
     pub fn new(
-        schema: &Schema,  // fluss schema
+        schema: &Schema, // fluss schema
         kwargs: Option<&Bound<'_, PyDict>>,
     ) -> PyResult<Self> {
         let mut partition_keys = Vec::new();
@@ -237,18 +248,22 @@ impl TableDescriptor {
             }
             if let Ok(Some(lformat)) = kwargs.get_item("log_format") {
                 let format_str: String = lformat.extract()?;
-                log_format = Some(fcore::metadata::LogFormat::parse(&format_str)
-                    .map_err(|e| FlussError::new_err(e.to_string()))?);
+                log_format = Some(
+                    fcore::metadata::LogFormat::parse(&format_str)
+                        .map_err(|e| FlussError::new_err(e.to_string()))?,
+                );
             }
             if let Ok(Some(kformat)) = kwargs.get_item("kv_format") {
                 let format_str: String = kformat.extract()?;
-                kv_format = Some(fcore::metadata::KvFormat::parse(&format_str)
-                    .map_err(|e| FlussError::new_err(e.to_string()))?);
+                kv_format = Some(
+                    fcore::metadata::KvFormat::parse(&format_str)
+                        .map_err(|e| FlussError::new_err(e.to_string()))?,
+                );
             }
         }
 
         let fluss_schema = schema.to_core().clone();
-        
+
         let mut builder = fcore::metadata::TableDescriptor::builder()
             .schema(fluss_schema)
             .properties(properties)
@@ -266,8 +281,9 @@ impl TableDescriptor {
             builder = builder.kv_format(kv_format);
         }
 
-        let core_descriptor = builder.build()
-            .map_err(|e| FlussError::new_err(format!("Failed to build TableDescriptor: {}", e)))?;
+        let core_descriptor = builder
+            .build()
+            .map_err(|e| FlussError::new_err(format!("Failed to build TableDescriptor: {e}")))?;
 
         Ok(Self {
             __tbl_desc: core_descriptor,
@@ -303,13 +319,13 @@ impl TableInfo {
     pub fn table_id(&self) -> i64 {
         self.__table_info.get_table_id()
     }
-    
+
     /// Get the schema ID
     #[getter]
     pub fn schema_id(&self) -> i32 {
         self.__table_info.get_schema_id()
     }
-    
+
     /// Get the table path
     #[getter]
     pub fn table_path(&self) -> TablePath {
@@ -321,13 +337,13 @@ impl TableInfo {
     pub fn created_time(&self) -> i64 {
         self.__table_info.get_created_time()
     }
-    
+
     /// Get the modified time
     #[getter]
     pub fn modified_time(&self) -> i64 {
         self.__table_info.get_modified_time()
     }
-    
+
     /// Get the primary keys
     pub fn get_primary_keys(&self) -> Vec<String> {
         self.__table_info.get_primary_keys().clone()
@@ -384,7 +400,10 @@ impl TableInfo {
 
     /// Get column names
     pub fn get_column_names(&self) -> Vec<String> {
-        self.__table_info.get_schema().columns().iter()
+        self.__table_info
+            .get_schema()
+            .columns()
+            .iter()
             .map(|col| col.name().to_string())
             .collect()
     }
@@ -398,9 +417,7 @@ impl TableInfo {
 impl TableInfo {
     /// Create from core TableInfo (internal use)
     pub fn from_core(info: fcore::metadata::TableInfo) -> Self {
-        Self {
-            __table_info: info,
-        }
+        Self { __table_info: info }
     }
 }
 
@@ -414,7 +431,7 @@ pub struct LakeSnapshot {
 
 /// Represents a table bucket with table ID, partition ID, and bucket ID
 #[pyclass]
-#[derive(Clone)]
+#[derive(Eq, Hash, PartialEq, Clone)]
 pub struct TableBucket {
     table_id: i64,
     partition_id: Option<i64>,
@@ -464,11 +481,15 @@ impl TableBucket {
     /// String representation
     pub fn __str__(&self) -> String {
         if let Some(partition_id) = self.partition_id {
-            format!("TableBucket(table_id={}, partition_id={}, bucket={})", 
-                    self.table_id, partition_id, self.bucket)
+            format!(
+                "TableBucket(table_id={}, partition_id={}, bucket={})",
+                self.table_id, partition_id, self.bucket
+            )
         } else {
-            format!("TableBucket(table_id={}, bucket={})", 
-                    self.table_id, self.bucket)
+            format!(
+                "TableBucket(table_id={}, bucket={})",
+                self.table_id, self.bucket
+            )
         }
     }
 
@@ -481,7 +502,7 @@ impl TableBucket {
     pub fn __hash__(&self) -> u64 {
         use std::collections::hash_map::DefaultHasher;
         use std::hash::{Hash, Hasher};
-        
+
         let mut hasher = DefaultHasher::new();
         self.table_id.hash(&mut hasher);
         self.partition_id.hash(&mut hasher);
@@ -491,8 +512,8 @@ impl TableBucket {
 
     /// Equality implementation for Python
     pub fn __eq__(&self, other: &TableBucket) -> bool {
-        self.table_id == other.table_id 
-            && self.partition_id == other.partition_id 
+        self.table_id == other.table_id
+            && self.partition_id == other.partition_id
             && self.bucket == other.bucket
     }
 }
@@ -509,7 +530,7 @@ impl TableBucket {
 
     /// Convert to core TableBucket (internal use)
     pub fn to_core(&self) -> fcore::metadata::TableBucket {
-        fcore::metadata::TableBucket::new(self.table_id, self.partition_id, self.bucket)
+        fcore::metadata::TableBucket::new(self.table_id, self.bucket)
     }
 }
 
@@ -559,8 +580,11 @@ impl LakeSnapshot {
 
     /// String representation
     pub fn __str__(&self) -> String {
-        format!("LakeSnapshot(snapshot_id={}, buckets_count={})", 
-                self.snapshot_id, self.table_buckets_offset.len())
+        format!(
+            "LakeSnapshot(snapshot_id={}, buckets_count={})",
+            self.snapshot_id,
+            self.table_buckets_offset.len()
+        )
     }
 
     /// String representation
@@ -578,4 +602,3 @@ impl LakeSnapshot {
         }
     }
 }
-
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
new file mode 100644
index 0000000000..98943b939a
--- /dev/null
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -0,0 +1,412 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::TOKIO_RUNTIME;
+use crate::*;
+use pyo3_async_runtimes::tokio::future_into_py;
+use std::collections::HashSet;
+use std::sync::Arc;
+
+const EARLIEST_OFFSET: i64 = -2;
+
+/// Represents a Fluss table for data operations
+#[pyclass]
+pub struct FlussTable {
+    connection: Arc<fcore::client::FlussConnection>,
+    metadata: Arc<fcore::client::Metadata>,
+    table_info: fcore::metadata::TableInfo,
+    table_path: fcore::metadata::TablePath,
+    has_primary_key: bool,
+}
+
+#[pymethods]
+impl FlussTable {
+    /// Create a new append writer for the table
+    fn new_append_writer<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let conn = self.connection.clone();
+        let metadata = self.metadata.clone();
+        let table_info = self.table_info.clone();
+
+        future_into_py(py, async move {
+            let fluss_table = fcore::client::FlussTable::new(&conn, metadata, table_info);
+
+            let table_append = fluss_table
+                .new_append()
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+            let rust_writer = table_append.create_writer();
+
+            let py_writer = AppendWriter::from_core(rust_writer);
+
+            Python::with_gil(|py| Py::new(py, py_writer))
+        })
+    }
+
+    /// Create a new log scanner for the table
+    fn new_log_scanner<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let conn = self.connection.clone();
+        let metadata = self.metadata.clone();
+        let table_info = self.table_info.clone();
+
+        future_into_py(py, async move {
+            // `metadata` and `table_info` are owned by this future, so one clone is enough.
+            let fluss_table = fcore::client::FlussTable::new(&conn, metadata, table_info.clone());
+
+            let table_scan = fluss_table.new_scan();
+
+            let rust_scanner = table_scan.create_log_scanner();
+
+            let py_scanner = LogScanner::from_core(rust_scanner, table_info);
+
+            Python::with_gil(|py| Py::new(py, py_scanner))
+        })
+    }
+
+    /// Get table information
+    pub fn get_table_info(&self) -> TableInfo {
+        TableInfo::from_core(self.table_info.clone())
+    }
+
+    /// Get table path
+    pub fn get_table_path(&self) -> TablePath {
+        TablePath::from_core(self.table_path.clone())
+    }
+
+    /// Check if table has primary key
+    pub fn has_primary_key(&self) -> bool {
+        self.has_primary_key
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "FlussTable(path={}.{})",
+            self.table_path.database(),
+            self.table_path.table()
+        )
+    }
+}
+
+impl FlussTable {
+    /// Create a FlussTable
+    pub fn new_table(
+        connection: Arc<fcore::client::FlussConnection>,
+        metadata: Arc<fcore::client::Metadata>,
+        table_info: fcore::metadata::TableInfo,
+        table_path: fcore::metadata::TablePath,
+        has_primary_key: bool,
+    ) -> Self {
+        Self {
+            connection,
+            metadata,
+            table_info,
+            table_path,
+            has_primary_key,
+        }
+    }
+}
+
+/// Writer for appending data to a Fluss table
+#[pyclass]
+pub struct AppendWriter {
+    inner: fcore::client::AppendWriter,
+}
+
+#[pymethods]
+impl AppendWriter {
+    /// Write Arrow table data
+    pub fn write_arrow(&mut self, py: Python, table: PyObject) -> PyResult<()> {
+        // Convert Arrow Table to batches and write each batch
+        let batches = table.call_method0(py, "to_batches")?;
+        let batch_list: Vec<PyObject> = batches.extract(py)?;
+
+        for batch in batch_list {
+            self.write_arrow_batch(py, batch)?;
+        }
+        Ok(())
+    }
+
+    /// Write Arrow batch data
+    pub fn write_arrow_batch(&mut self, py: Python, batch: PyObject) -> PyResult<()> {
+        // Extract number of rows and columns from the Arrow batch
+        let num_rows: usize = batch.getattr(py, "num_rows")?.extract(py)?;
+        let num_columns: usize = batch.getattr(py, "num_columns")?.extract(py)?;
+
+        // Fetch every column once up front; a per-cell lookup costs rows x columns Python calls
+        let columns = (0..num_columns)
+            .map(|col_idx| batch.call_method1(py, "column", (col_idx,)))
+            .collect::<PyResult<Vec<PyObject>>>()?;
+
+        for row_idx in 0..num_rows {
+            let mut generic_row = fcore::row::GenericRow::new();
+            for (col_idx, column) in columns.iter().enumerate() {
+                let value = column.call_method1(py, "__getitem__", (row_idx,))?;
+                // Convert the Python value to a Datum and add to the row
+                let datum = self.convert_python_value_to_datum(py, value)?;
+                generic_row.set_field(col_idx, datum);
+            }
+
+            // Append this row using the async append method
+            TOKIO_RUNTIME.block_on(async {
+                self.inner
+                    .append(generic_row)
+                    .await
+                    .map_err(|e| FlussError::new_err(e.to_string()))
+            })?;
+        }
+
+        Ok(())
+    }
+
+    /// Write Pandas DataFrame data
+    pub fn write_pandas(&mut self, py: Python, df: PyObject) -> PyResult<()> {
+        // Import pyarrow module
+        let pyarrow = py.import("pyarrow")?;
+
+        // Get the Table class from pyarrow module
+        let table_class = pyarrow.getattr("Table")?;
+
+        // Call Table.from_pandas(df) - from_pandas is a class method
+        let pa_table = table_class.call_method1("from_pandas", (df,))?;
+
+        // Then call write_arrow with the converted table
+        self.write_arrow(py, pa_table.into())
+    }
+
+    /// Flush any pending data
+    pub fn flush(&mut self) -> PyResult<()> {
+        TOKIO_RUNTIME.block_on(async {
+            self.inner
+                .flush()
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))
+        })
+    }
+
+    fn __repr__(&self) -> String {
+        "AppendWriter()".to_string()
+    }
+}
+
+impl AppendWriter {
+    /// Create an AppendWriter from a core append writer
+    pub fn from_core(append: fcore::client::AppendWriter) -> Self {
+        Self { inner: append }
+    }
+
+    fn convert_python_value_to_datum(
+        &self,
+        py: Python,
+        value: PyObject,
+    ) -> PyResult<fcore::row::Datum<'static>> {
+        use fcore::row::{Blob, Datum, F32, F64};
+
+        // Check for None (null)
+        if value.is_none(py) {
+            return Ok(Datum::Null);
+        }
+
+        // Try to extract different types
+        if let Ok(type_name) = value.bind(py).get_type().name() {
+            if type_name == "StringScalar" {
+                if let Ok(py_value) = value.call_method0(py, "as_py") {
+                    if let Ok(str_val) = py_value.extract::<String>(py) {
+                        let leaked_str: &'static str = Box::leak(str_val.into_boxed_str());
+                        return Ok(Datum::String(leaked_str));
+                    }
+                }
+            }
+        }
+
+        if let Ok(bool_val) = value.extract::<bool>(py) {
+            return Ok(Datum::Bool(bool_val));
+        }
+
+        if let Ok(int_val) = value.extract::<i32>(py) {
+            return Ok(Datum::Int32(int_val));
+        }
+
+        if let Ok(int_val) = value.extract::<i64>(py) {
+            return Ok(Datum::Int64(int_val));
+        }
+
+        if let Ok(float_val) = value.extract::<f32>(py) {
+            return Ok(Datum::Float32(F32::from(float_val)));
+        }
+
+        if let Ok(float_val) = value.extract::<f64>(py) {
+            return Ok(Datum::Float64(F64::from(float_val)));
+        }
+
+        if let Ok(str_val) = value.extract::<String>(py) {
+            // Convert String to &'static str by leaking memory
+            // This is a simplified approach - in production, you might want better lifetime management
+            let leaked_str: &'static str = Box::leak(str_val.into_boxed_str());
+            return Ok(Datum::String(leaked_str));
+        }
+
+        if let Ok(bytes_val) = value.extract::<Vec<u8>>(py) {
+            let blob = Blob::from(bytes_val);
+            return Ok(Datum::Blob(blob));
+        }
+
+        // If we can't convert, return an error
+        let type_name = value.bind(py).get_type().name()?;
+        Err(FlussError::new_err(format!(
+            "Cannot convert Python value to Datum: {type_name:?}"
+        )))
+    }
+}
+
+/// Scanner for reading log data from a Fluss table
+#[pyclass]
+pub struct LogScanner {
+    inner: fcore::client::LogScanner,
+    table_info: fcore::metadata::TableInfo,
+    #[allow(dead_code)]
+    start_timestamp: Option<i64>,
+    #[allow(dead_code)]
+    end_timestamp: Option<i64>,
+}
+
+#[pymethods]
+impl LogScanner {
+    /// Subscribe to log data with timestamp range
+    fn subscribe(
+        &mut self,
+        _start_timestamp: Option<i64>,
+        _end_timestamp: Option<i64>,
+    ) -> PyResult<()> {
+        if _start_timestamp.is_some() {
+            return Err(FlussError::new_err(
+                "Specifying start_timestamp is not yet supported. Please use None.".to_string(),
+            ));
+        }
+        if _end_timestamp.is_some() {
+            return Err(FlussError::new_err(
+                "Specifying end_timestamp is not yet supported. Please use None.".to_string(),
+            ));
+        }
+
+        let num_buckets = self.table_info.get_num_buckets();
+        for bucket_id in 0..num_buckets {
+            let start_offset = EARLIEST_OFFSET;
+
+            TOKIO_RUNTIME.block_on(async {
+                self.inner
+                    .subscribe(bucket_id, start_offset)
+                    .await
+                    .map_err(|e| FlussError::new_err(e.to_string()))
+            })?;
+        }
+
+        Ok(())
+    }
+
+    /// Convert all data to Arrow Table
+    fn to_arrow(&self, py: Python) -> PyResult<PyObject> {
+        use std::collections::HashMap;
+        use std::time::Duration;
+
+        let mut all_batches = Vec::new();
+
+        let bucket_ids: Vec<i32> = (0..self.table_info.get_num_buckets()).collect();
+
+        // todo: after supporting list_offsets with timestamp, we can use start_timestamp and end_timestamp here
+        let target_offsets: HashMap<i32, i64> = TOKIO_RUNTIME
+            .block_on(async { self.inner.list_offsets_latest(bucket_ids).await })
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+        // A bucket whose latest offset is <= 0 is empty and will never yield a record, so it
+        // starts out completed; otherwise the poll loop below would wait on it forever.
+        let mut completed_buckets: HashSet<i32> = target_offsets
+            .iter()
+            .filter(|(_, end_offset)| **end_offset <= 0)
+            .map(|(bucket_id, _)| *bucket_id)
+            .collect();
+
+        if completed_buckets.len() < target_offsets.len() {
+            loop {
+                let batch_result = TOKIO_RUNTIME
+                    .block_on(async { self.inner.poll(Duration::from_millis(500)).await });
+
+                match batch_result {
+                    Ok(scan_records) => {
+                        let mut filtered_records: HashMap<
+                            fcore::metadata::TableBucket,
+                            Vec<fcore::record::ScanRecord>,
+                        > = HashMap::new();
+                        for (bucket, records) in scan_records.records_by_buckets() {
+                            let bucket_id = bucket.bucket_id();
+                            if completed_buckets.contains(&bucket_id) {
+                                continue;
+                            }
+                            if let Some(last_record) = records.last() {
+                                let offset = last_record.offset();
+                                filtered_records.insert(bucket.clone(), records.clone());
+                                if offset >= target_offsets[&bucket_id] - 1 {
+                                    completed_buckets.insert(bucket_id);
+                                }
+                            }
+                        }
+
+                        if !filtered_records.is_empty() {
+                            let scan_batch = fcore::record::ScanRecords::new(filtered_records);
+                            all_batches.extend(Utils::convert_scan_records_to_arrow(scan_batch));
+                        }
+
+                        // completed bucket is equal to all target buckets,
+                        // we can break scan records
+                        if completed_buckets.len() == target_offsets.len() {
+                            break;
+                        }
+                    }
+                    Err(e) => return Err(FlussError::new_err(e.to_string())),
+                }
+            }
+        }
+
+        Utils::combine_batches_to_table(py, all_batches)
+    }
+
+    /// Convert all data to Pandas DataFrame
+    fn to_pandas(&self, py: Python) -> PyResult<PyObject> {
+        let arrow_table = self.to_arrow(py)?;
+
+        // Convert Arrow Table to Pandas DataFrame using pyarrow
+        let df = arrow_table.call_method0(py, "to_pandas")?;
+        Ok(df)
+    }
+
+    fn __repr__(&self) -> String {
+        format!("LogScanner(table={})", self.table_info.table_path)
+    }
+}
+
+impl LogScanner {
+    /// Create LogScanner from core LogScanner
+    pub fn from_core(
+        inner: fcore::client::LogScanner,
+        table_info: fcore::metadata::TableInfo,
+    ) -> Self {
+        Self {
+            inner,
+            table_info,
+            start_timestamp: None,
+            end_timestamp: None,
+        }
+    }
+}
diff --git a/fluss-rust/bindings/python/src/utils.rs b/fluss-rust/bindings/python/src/utils.rs
index c40104bfc9..9642e9d95b 100644
--- a/fluss-rust/bindings/python/src/utils.rs
+++ b/fluss-rust/bindings/python/src/utils.rs
@@ -15,11 +15,10 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use pyo3::prelude::*;
+use crate::*;
 use arrow::datatypes::{Schema as ArrowSchema, SchemaRef};
-use std::sync::Arc;
 use arrow_pyarrow::ToPyArrow;
-use crate::*;
+use std::sync::Arc;
 
 /// Utilities for schema conversion between PyArrow, Arrow, and Fluss
 pub struct Utils;
@@ -29,15 +28,19 @@ impl Utils {
     pub fn pyarrow_to_arrow_schema(py_schema: &PyObject) -> PyResult<SchemaRef> {
         Python::with_gil(|py| {
             let schema_bound = py_schema.bind(py);
-            
-            let schema: ArrowSchema = arrow_pyarrow::FromPyArrow::from_pyarrow_bound(&schema_bound)
-                .map_err(|e| FlussError::new_err(format!("Failed to convert PyArrow schema: {}", e)))?;
+
+            let schema: ArrowSchema = arrow_pyarrow::FromPyArrow::from_pyarrow_bound(schema_bound)
+                .map_err(|e| {
+                    FlussError::new_err(format!("Failed to convert PyArrow schema: {e}"))
+                })?;
             Ok(Arc::new(schema))
         })
     }
 
     /// Convert Arrow DataType to Fluss DataType
-    pub fn arrow_type_to_fluss_type(arrow_type: &arrow::datatypes::DataType) -> PyResult<fcore::metadata::DataType> {
+    pub fn arrow_type_to_fluss_type(
+        arrow_type: &arrow::datatypes::DataType,
+    ) -> PyResult<fcore::metadata::DataType> {
         use arrow::datatypes::DataType as ArrowDataType;
         use fcore::metadata::DataTypes;
 
@@ -59,10 +62,12 @@ impl Utils {
             ArrowDataType::Date64 => DataTypes::date(),
             ArrowDataType::Time32(_) | ArrowDataType::Time64(_) => DataTypes::time(),
             ArrowDataType::Timestamp(_, _) => DataTypes::timestamp(),
-            ArrowDataType::Decimal128(precision, scale) => DataTypes::decimal(*precision as u32, *scale as u32),
+            ArrowDataType::Decimal128(precision, scale) => {
+                DataTypes::decimal(*precision as u32, *scale as u32)
+            }
             _ => {
                 return Err(FlussError::new_err(format!(
-                    "Unsupported Arrow data type: {:?}", arrow_type
+                    "Unsupported Arrow data type: {arrow_type:?}"
                 )));
             }
         };
@@ -89,47 +94,62 @@ impl Utils {
                 } else {
                     format!("time({})", t.precision())
                 }
-            },
+            }
             fcore::metadata::DataType::Timestamp(t) => {
                 if t.precision() == 6 {
                     "timestamp".to_string()
                 } else {
                     format!("timestamp({})", t.precision())
                 }
-            },
+            }
             fcore::metadata::DataType::TimestampLTz(t) => {
                 if t.precision() == 6 {
                     "timestamp_ltz".to_string()
                 } else {
                     format!("timestamp_ltz({})", t.precision())
                 }
-            },
+            }
             fcore::metadata::DataType::Char(c) => format!("char({})", c.length()),
-            fcore::metadata::DataType::Decimal(d) => format!("decimal({},{})", d.precision(), d.scale()),
+            fcore::metadata::DataType::Decimal(d) => {
+                format!("decimal({},{})", d.precision(), d.scale())
+            }
             fcore::metadata::DataType::Binary(b) => format!("binary({})", b.length()),
-            fcore::metadata::DataType::Array(arr) => format!("array<{}>", Utils::datatype_to_string(arr.get_element_type())),
-            fcore::metadata::DataType::Map(map) => format!("map<{},{}>", 
-                                        Utils::datatype_to_string(map.key_type()), 
-                                        Utils::datatype_to_string(map.value_type())),
+            fcore::metadata::DataType::Array(arr) => format!(
+                "array<{}>",
+                Utils::datatype_to_string(arr.get_element_type())
+            ),
+            fcore::metadata::DataType::Map(map) => format!(
+                "map<{},{}>",
+                Utils::datatype_to_string(map.key_type()),
+                Utils::datatype_to_string(map.value_type())
+            ),
             fcore::metadata::DataType::Row(row) => {
-                let fields: Vec<String> = row.fields().iter()
-                    .map(|field| format!("{}: {}", field.name(), Utils::datatype_to_string(field.data_type())))
+                let fields: Vec<String> = row
+                    .fields()
+                    .iter()
+                    .map(|field| {
+                        format!(
+                            "{}: {}",
+                            field.name(),
+                            Utils::datatype_to_string(field.data_type())
+                        )
+                    })
                     .collect();
                 format!("row<{}>", fields.join(", "))
-            },
+            }
         }
     }
 
     /// Parse log format string to LogFormat enum
     pub fn parse_log_format(format_str: &str) -> PyResult<fcore::metadata::LogFormat> {
         fcore::metadata::LogFormat::parse(format_str)
-            .map_err(|e| FlussError::new_err(format!("Invalid log format '{}': {}", format_str, e)))
+            .map_err(|e| FlussError::new_err(format!("Invalid log format '{format_str}': {e}")))
     }
 
     /// Parse kv format string to KvFormat enum
     pub fn parse_kv_format(format_str: &str) -> PyResult<fcore::metadata::KvFormat> {
         fcore::metadata::KvFormat::parse(format_str)
-            .map_err(|e| FlussError::new_err(format!("Invalid kv format '{}': {}", format_str, e)))
+            .map_err(|e| FlussError::new_err(format!("Invalid kv format '{format_str}': {e}")))
     }
 
     /// Convert ScanRecords to Arrow RecordBatch
@@ -137,42 +157,41 @@ impl Utils {
         _scan_records: fcore::record::ScanRecords,
     ) -> Vec<Arc<arrow::record_batch::RecordBatch>> {
         let mut result = Vec::new();
-        for(_, records) in _scan_records.into_records() {
-            for record in records {
-                let columnar_row = record.row();
-                let row_id = columnar_row.get_row_id();
-                if row_id == 0 {
-                    let record_batch = columnar_row.get_record_batch();
-                    result.push(record_batch.clone());
-                }
+        for record in _scan_records {
+            let columnar_row = record.row();
+            let row_id = columnar_row.get_row_id();
+            if row_id == 0 {
+                let record_batch = columnar_row.get_record_batch();
+                result.push(Arc::new(record_batch.clone()));
             }
         }
         result
     }
-    
+
     /// Combine multiple Arrow batches into a single Table
-    pub fn combine_batches_to_table(py: Python, batches: Vec<Arc<arrow::record_batch::RecordBatch>>) -> PyResult<PyObject> {
-        if batches.is_empty() {
-            return Err(FlussError::new_err("No batches to combine"));
-        }
-        
+    pub fn combine_batches_to_table(
+        py: Python,
+        batches: Vec<Arc<arrow::record_batch::RecordBatch>>,
+    ) -> PyResult<PyObject> {
         // Convert Rust Arrow RecordBatch to PyObject
-        let py_batches: Result<Vec<PyObject>, _> = batches.iter()
+        let py_batches: Result<Vec<PyObject>, _> = batches
+            .iter()
             .map(|batch| {
-                batch.as_ref().to_pyarrow(py)
-                    .map_err(|e| FlussError::new_err(format!("Failed to convert RecordBatch to PyObject: {}", e)))
+                batch.as_ref().to_pyarrow(py).map_err(|e| {
+                    FlussError::new_err(format!("Failed to convert RecordBatch to PyObject: {e}"))
+                })
             })
             .collect();
-        
+
         let py_batches = py_batches?;
-        
+
         let pyarrow = py.import("pyarrow")?;
-        
+
         // Use pyarrow.Table.from_batches to combine batches
         let table = pyarrow
             .getattr("Table")?
             .call_method1("from_batches", (py_batches,))?;
-        
+
         Ok(table.into())
     }
 }
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index a728bd74f8..ab1efc26d2 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -23,7 +23,7 @@ name = "fluss"
 build = "src/build.rs"
 
 [dependencies]
-arrow = "55.1.0"
+arrow = { workspace = true }
 arrow-schema = "55.1.0"
 byteorder = "1.5"
 futures = "0.3"
@@ -44,7 +44,8 @@ rust_decimal = "1"
 ordered-float = { version = "4", features = ["serde"] }
 parse-display = "0.10"
 ref-cast = "1.0"
-chrono = { version = "0.4", features = ["clock", "std", "wasmbind"] }
+chrono = { workspace = true }
+oneshot = "0.1.11"
 
 [dev-dependencies]
 testcontainers = "0.25.0"
@@ -56,4 +57,4 @@ integration_tests = []
 
 
 [build-dependencies]
-prost-build = {  version = "0.13.5"  }
\ No newline at end of file
+prost-build = {  version = "0.13.5"  }
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 4d6f8f045b..07e64948fa 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -27,8 +27,8 @@ mod append;
 mod scanner;
 mod writer;
 
-pub use append::TableAppend;
-pub use scanner::TableScan;
+pub use append::{AppendWriter, TableAppend};
+pub use scanner::{LogScanner, TableScan};
 
 #[allow(dead_code)]
 pub struct FlussTable<'a> {
@@ -65,6 +65,22 @@ impl<'a> FlussTable<'a> {
     pub fn new_scan(&self) -> TableScan<'_> {
         TableScan::new(self.conn, self.table_info.clone(), self.metadata.clone())
     }
+
+    pub fn metadata(&self) -> &Arc<Metadata> {
+        &self.metadata
+    }
+
+    pub fn table_info(&self) -> &TableInfo {
+        &self.table_info
+    }
+
+    pub fn table_path(&self) -> &TablePath {
+        &self.table_path
+    }
+
+    pub fn has_primary_key(&self) -> bool {
+        self.has_primary_key
+    }
 }
 
 impl<'a> Drop for FlussTable<'a> {
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 41fb17e8c8..cbe724896e 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -22,12 +22,14 @@ use crate::metadata::{TableBucket, TableInfo, TablePath};
 use crate::proto::{FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
 use crate::record::{LogRecordsBatchs, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
 use crate::rpc::RpcClient;
+use crate::rpc::message::{ListOffsetsRequest, OffsetSpec};
 use crate::util::FairBucketStatusMap;
 use parking_lot::RwLock;
 use std::collections::HashMap;
 use std::slice::from_ref;
 use std::sync::Arc;
 use std::time::Duration;
+use tokio::task::JoinHandle;
 
 const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
 #[allow(dead_code)]
@@ -65,6 +67,7 @@ pub struct LogScanner {
     metadata: Arc<Metadata>,
     log_scanner_status: Arc<LogScannerStatus>,
     log_fetcher: LogFetcher,
+    conns: Arc<RpcClient>,
 }
 
 impl LogScanner {
@@ -81,10 +84,11 @@ impl LogScanner {
             log_scanner_status: log_scanner_status.clone(),
             log_fetcher: LogFetcher::new(
                 table_info.clone(),
-                connections,
+                connections.clone(),
                 metadata.clone(),
                 log_scanner_status.clone(),
             ),
+            conns: connections.clone(),
         }
     }
 
@@ -102,6 +106,103 @@ impl LogScanner {
         Ok(())
     }
 
+    /// Fetches the latest offset of each requested bucket of this scanner's table.
+    ///
+    /// Buckets are grouped by their leader tablet server, one `ListOffsetsRequest` is sent
+    /// per server, and the replies are merged into a single `bucket_id -> offset` map.
+    /// Fails if a bucket has no known leader, a request fails, or a reply carries an error.
+    pub async fn list_offsets_latest(&self, buckets: Vec<i32>) -> Result<HashMap<i32, i64>> {
+        // TODO: support partition_id
+        let partition_id = None;
+        let offset_spec = OffsetSpec::Latest;
+
+        // Check/update the table metadata before resolving the table id.
+        self.metadata
+            .check_and_update_table_metadata(from_ref(&self.table_path))
+            .await?;
+        let cluster = self.metadata.get_cluster();
+        let table_id = cluster.get_table(&self.table_path).table_id;
+
+        // Prepare one request per leader; `buckets` is moved, it is not needed afterwards.
+        let requests_by_server =
+            self.prepare_list_offsets_requests(table_id, partition_id, buckets, offset_spec)?;
+
+        // Send the requests; every server is queried by its own spawned task.
+        let response_futures = self.send_list_offsets_request(requests_by_server).await?;
+
+        let mut results = HashMap::new();
+        for response_future in response_futures {
+            let offsets = response_future.await.map_err(
+                // todo: consider using a more suitable error
+                |e| crate::error::Error::WriteError(format!("Fail to get result: {e}")),
+            )?;
+            results.extend(offsets?);
+        }
+        Ok(results)
+    }
+
+    /// Groups `buckets` by leader server id and builds one `ListOffsetsRequest` per leader.
+    ///
+    /// Returns an error when the cluster reports no leader for one of the buckets.
+    fn prepare_list_offsets_requests(
+        &self,
+        table_id: i64,
+        partition_id: Option<i64>,
+        buckets: Vec<i32>,
+        offset_spec: OffsetSpec,
+    ) -> Result<HashMap<i32, ListOffsetsRequest>> {
+        let cluster = self.metadata.get_cluster();
+        // leader server id -> ids of the buckets led by that server
+        let mut by_leader: HashMap<i32, Vec<i32>> = HashMap::new();
+        for bucket_id in buckets {
+            let table_bucket = TableBucket::new(table_id, bucket_id);
+            let Some(leader) = cluster.leader_for(&table_bucket) else {
+                // todo: consider use another suitable error
+                return Err(crate::error::Error::InvalidTableError(format!(
+                    "No leader found for table bucket: table_id={table_id}, bucket_id={bucket_id}"
+                )));
+            };
+            by_leader.entry(leader.id()).or_default().push(bucket_id);
+        }
+
+        let requests = by_leader
+            .into_iter()
+            .map(|(leader_id, ids)| {
+                let spec = offset_spec.clone();
+                (leader_id, ListOffsetsRequest::new(table_id, partition_id, ids, spec))
+            })
+            .collect();
+        Ok(requests)
+    }
+
+    /// Spawns one task per leader server that sends its request and decodes the offsets.
+    ///
+    /// The returned handles are not awaited here; the caller awaits them to collect results.
+    async fn send_list_offsets_request(
+        &self,
+        request_map: HashMap<i32, ListOffsetsRequest>,
+    ) -> Result<Vec<JoinHandle<Result<HashMap<i32, i64>>>>> {
+        let tasks = request_map
+            .into_iter()
+            .map(|(leader_id, request)| {
+                let rpc_client = self.conns.clone();
+                let metadata = self.metadata.clone();
+                tokio::spawn(async move {
+                    let cluster = metadata.get_cluster();
+                    let tablet_server = cluster.get_tablet_server(leader_id).ok_or_else(|| {
+                        // todo: consider use more suitable error
+                        crate::error::Error::InvalidTableError(format!(
+                            "Tablet server {leader_id} not found"
+                        ))
+                    })?;
+                    let connection = rpc_client.get_connection(tablet_server).await?;
+                    connection.request(request).await?.offsets()
+                })
+            })
+            .collect();
+        Ok(tasks)
+    }
+
     async fn poll_for_fetches(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
         self.log_fetcher.send_fetches_and_collect().await
     }
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index d71197b2b0..ef460fc559 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -202,6 +202,19 @@ message ListDatabasesResponse {
   repeated string database_name = 1;
 }
 
+// list offsets request and response
+message ListOffsetsRequest {
+  required int32 follower_server_id = 1;  // value -1 indicates that the request comes from a client.
+  required int32 offset_type = 2; // 0 = earliest, 1 = latest, 2 = from timestamp (see ListOffsetsParam for more details)
+  required int64 table_id = 3;
+  optional int64 partition_id = 4;
+  repeated int32 bucket_id = 5 [packed = true]; // packed is recommended for repeated numeric fields because it encodes more efficiently
+  optional int64 startTimestamp = 6; // set by the Rust client only for timestamp-based lookups (offset_type 2)
+}
+message ListOffsetsResponse {
+  repeated PbListOffsetsRespForBucket buckets_resp = 1;
+}
+
 
 // fetch log request and response
 message FetchLogRequest {
@@ -262,6 +275,13 @@ message PbRemoteLogSegment {
   required int32 segment_size_in_bytes = 4;
 }
 
+message PbListOffsetsRespForBucket {
+  required int32 bucket_id = 1;
+  optional int32 error_code = 2;
+  optional string error_message = 3;
+  optional int64 offset = 4;
+}
+
 // fetch latest lake snapshot
 message GetLatestLakeSnapshotRequest {
   required PbTablePath table_path = 1;
diff --git a/fluss-rust/crates/fluss/src/record/mod.rs b/fluss-rust/crates/fluss/src/record/mod.rs
index d7872055b9..07fbe0808c 100644
--- a/fluss-rust/crates/fluss/src/record/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/mod.rs
@@ -84,6 +84,7 @@ impl fmt::Display for ChangeType {
     }
 }
 
+#[derive(Clone)]
 pub struct ScanRecord {
     pub row: ColumnarRow,
     offset: i64,
@@ -158,6 +159,10 @@ impl ScanRecords {
     pub fn is_empty(&self) -> bool {
         self.records.is_empty()
     }
+
+    pub fn records_by_buckets(&self) -> &HashMap<TableBucket, Vec<ScanRecord>> {
+        &self.records
+    }
 }
 
 impl IntoIterator for ScanRecords {
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 44ca640b51..6d47836d9b 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -22,6 +22,7 @@ use arrow::array::{
 };
 use std::sync::Arc;
 
+#[derive(Clone)]
 pub struct ColumnarRow {
     record_batch: Arc<RecordBatch>,
     row_id: usize,
@@ -45,6 +46,14 @@ impl ColumnarRow {
     pub fn set_row_id(&mut self, row_id: usize) {
         self.row_id = row_id
     }
+
+    pub fn get_row_id(&self) -> usize {
+        self.row_id
+    }
+
+    pub fn get_record_batch(&self) -> &RecordBatch {
+        &self.record_batch
+    }
 }
 
 impl InternalRow for ColumnarRow {
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index 18ce44fbef..215bb39389 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -31,6 +31,7 @@ pub enum ApiKey {
     MetaData,
     ProduceLog,
     FetchLog,
+    ListOffsets,
     GetDatabaseInfo,
     GetLatestLakeSnapshot,
     Unknown(i16),
@@ -51,6 +52,7 @@ impl From<i16> for ApiKey {
             1012 => ApiKey::MetaData,
             1014 => ApiKey::ProduceLog,
             1015 => ApiKey::FetchLog,
+            1021 => ApiKey::ListOffsets,
             1032 => ApiKey::GetLatestLakeSnapshot,
             1035 => ApiKey::GetDatabaseInfo,
             _ => Unknown(key),
@@ -73,6 +75,7 @@ impl From<ApiKey> for i16 {
             ApiKey::MetaData => 1012,
             ApiKey::ProduceLog => 1014,
             ApiKey::FetchLog => 1015,
+            ApiKey::ListOffsets => 1021,
             ApiKey::GetLatestLakeSnapshot => 1032,
             ApiKey::GetDatabaseInfo => 1035,
             Unknown(x) => x,
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
new file mode 100644
index 0000000000..500db33e8c
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
@@ -0,0 +1,124 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+
+use crate::error::Error;
+use crate::error::Result as FlussResult;
+use crate::proto::ListOffsetsResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use std::collections::HashMap;
+
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+/// Offset type constants as per proto comments
+pub const LIST_EARLIEST_OFFSET: i32 = 0;
+pub const LIST_LATEST_OFFSET: i32 = 1;
+pub const LIST_OFFSET_FROM_TIMESTAMP: i32 = 2;
+
+/// Client follower server id constant
+pub const CLIENT_FOLLOWER_SERVER_ID: i32 = -1;
+
+/// Offset specification for list offsets request
+#[derive(Debug, Clone)]
+pub enum OffsetSpec {
+    /// Earliest offset spec
+    Earliest,
+    /// Latest offset spec  
+    Latest,
+    /// Timestamp offset spec
+    Timestamp(i64),
+}
+
+impl OffsetSpec {
+    pub fn offset_type(&self) -> i32 {
+        match self {
+            OffsetSpec::Earliest => LIST_EARLIEST_OFFSET,
+            OffsetSpec::Latest => LIST_LATEST_OFFSET,
+            OffsetSpec::Timestamp(_) => LIST_OFFSET_FROM_TIMESTAMP,
+        }
+    }
+
+    pub fn start_timestamp(&self) -> Option<i64> {
+        match self {
+            OffsetSpec::Timestamp(ts) => Some(*ts),
+            _ => None,
+        }
+    }
+}
+
+#[derive(Debug)]
+pub struct ListOffsetsRequest {
+    pub inner_request: proto::ListOffsetsRequest,
+}
+
+impl ListOffsetsRequest {
+    pub fn new(
+        table_id: i64,
+        partition_id: Option<i64>,
+        bucket_ids: Vec<i32>,
+        offset_spec: OffsetSpec,
+    ) -> Self {
+        ListOffsetsRequest {
+            inner_request: proto::ListOffsetsRequest {
+                follower_server_id: CLIENT_FOLLOWER_SERVER_ID,
+                offset_type: offset_spec.offset_type(),
+                table_id,
+                partition_id,
+                bucket_id: bucket_ids,
+                start_timestamp: offset_spec.start_timestamp(),
+            },
+        }
+    }
+}
+
+impl RequestBody for ListOffsetsRequest {
+    type ResponseBody = ListOffsetsResponse;
+
+    const API_KEY: ApiKey = ApiKey::ListOffsets;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(ListOffsetsRequest);
+impl_read_version_type!(ListOffsetsResponse);
+
+impl ListOffsetsResponse {
+    /// Collects the per-bucket replies into a `bucket_id -> offset` map.
+    ///
+    /// Fails on the first bucket that reports an error code or carries no offset.
+    pub fn offsets(&self) -> FlussResult<HashMap<i32, i64>> {
+        self.buckets_resp
+            .iter()
+            .map(|resp| match resp.offset {
+                Some(offset) if resp.error_code.is_none() => Ok((resp.bucket_id, offset)),
+                // server-reported error, or malformed reply without offset (previously a panic)
+                // todo: consider use another suitable error
+                _ => Err(Error::WriteError(format!(
+                    "Missing offset, error message: {}",
+                    resp.error_message
+                        .as_deref()
+                        .unwrap_or("unknown server exception")
+                ))),
+            })
+            .collect()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index d5f8ebde89..230d971a49 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -31,6 +31,7 @@ mod get_latest_lake_snapshot;
 mod get_table;
 mod header;
 mod list_databases;
+mod list_offsets;
 mod list_tables;
 mod produce_log;
 mod table_exists;
@@ -47,6 +48,7 @@ pub use get_latest_lake_snapshot::*;
 pub use get_table::*;
 pub use header::*;
 pub use list_databases::*;
+pub use list_offsets::*;
 pub use list_tables::*;
 pub use produce_log::*;
 pub use table_exists::*;

From 2f722d2857f6859b2632d1d6008704fea18856f6 Mon Sep 17 00:00:00 2001
From: Junbo Wang <beryllwang@gmail.com>
Date: Thu, 16 Oct 2025 21:02:37 +0800
Subject: [PATCH 013/287] [test] Add IT for table operation in admin (#32)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---------

Co-authored-by: 王俊博(wangjunbo) <wangjunbo@qiyi.com>
Co-authored-by: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
---
 fluss-rust/crates/fluss/src/metadata/table.rs |   6 +-
 .../crates/fluss/tests/integration/admin.rs   | 122 +++++++++++++++++-
 2 files changed, 123 insertions(+), 5 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 2b48ec60db..751dd6da02 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -23,7 +23,7 @@ use serde::{Deserialize, Serialize};
 use std::collections::{HashMap, HashSet};
 use std::fmt::{Display, Formatter};
 
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
 pub struct Column {
     name: String,
     data_type: DataType,
@@ -66,7 +66,7 @@ impl Column {
     }
 }
 
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
 pub struct PrimaryKey {
     constraint_name: String,
     column_names: Vec<String>,
@@ -90,7 +90,7 @@ impl PrimaryKey {
     }
 }
 
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
 pub struct Schema {
     columns: Vec<Column>,
     primary_key: Option<PrimaryKey>,
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index 73f52db936..0d958a5656 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -33,7 +33,10 @@ static SHARED_FLUSS_CLUSTER: Lazy<Arc<RwLock<Option<FlussTestingCluster>>>> =
 mod admin_test {
     use super::SHARED_FLUSS_CLUSTER;
     use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
-    use fluss::metadata::DatabaseDescriptorBuilder;
+    use fluss::metadata::{
+        DataTypes, DatabaseDescriptorBuilder, KvFormat, LogFormat, Schema, TableDescriptor,
+        TablePath,
+    };
     use std::sync::Arc;
 
     fn before_all() {
@@ -126,6 +129,121 @@ mod admin_test {
 
     #[tokio::test]
     async fn test_create_table() {
-        // todo
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection
+            .get_admin()
+            .await
+            .expect("Failed to get admin client");
+
+        let test_db_name = "test_create_table_db";
+        let db_descriptor = DatabaseDescriptorBuilder::default()
+            .comment("Database for test_create_table")
+            .build();
+
+        assert!(!admin.database_exists(test_db_name).await.unwrap());
+        admin
+            .create_database(test_db_name, false, Some(&db_descriptor))
+            .await
+            .expect("Failed to create test database");
+
+        let test_table_name = "test_user_table";
+        let table_path = TablePath::new(test_db_name.to_string(), test_table_name.to_string());
+
+        // build table schema
+        let table_schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .column("age", DataTypes::int())
+            .with_comment("User's age (optional)")
+            .column("email", DataTypes::string())
+            .primary_key(vec!["id".to_string()])
+            .build()
+            .expect("Failed to build table schema");
+
+        // build table descriptor
+        let table_descriptor = TableDescriptor::builder()
+            .schema(table_schema.clone())
+            .comment("Test table for user data (id, name, age, email)")
+            .distributed_by(Some(3), vec!["id".to_string()])
+            .property("table.replication.factor", "1")
+            .log_format(LogFormat::ARROW)
+            .kv_format(KvFormat::INDEXED)
+            .build()
+            .expect("Failed to build table descriptor");
+
+        // create test table
+        admin
+            .create_table(&table_path, &table_descriptor, false)
+            .await
+            .expect("Failed to create test table");
+
+        assert!(
+            admin.table_exists(&table_path).await.unwrap(),
+            "Table {:?} should exist after creation",
+            table_path
+        );
+
+        let tables = admin.list_tables(test_db_name).await.unwrap();
+        assert_eq!(
+            tables.len(),
+            1,
+            "There should be exactly one table in the database"
+        );
+        assert!(
+            tables.contains(&test_table_name.to_string()),
+            "Table list should contain the created table"
+        );
+
+        let table_info = admin
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table info");
+
+        // verify table comment
+        assert_eq!(
+            table_info.get_comment(),
+            Some("Test table for user data (id, name, age, email)"),
+            "Table comment mismatch"
+        );
+
+        // verify schema columns
+        let actual_schema = table_info.get_schema();
+        assert_eq!(actual_schema, table_descriptor.schema(), "Schema mismatch");
+
+        // verify primary key
+        assert_eq!(
+            table_info.get_primary_keys(),
+            &vec!["id".to_string()],
+            "Primary key columns mismatch"
+        );
+
+        // verify distribution and properties
+        assert_eq!(table_info.get_num_buckets(), 3, "Bucket count mismatch");
+        assert_eq!(
+            table_info.get_bucket_keys(),
+            &vec!["id".to_string()],
+            "Bucket keys mismatch"
+        );
+
+        assert_eq!(
+            table_info.get_properties(),
+            table_descriptor.properties(),
+            "Properties mismatch"
+        );
+
+        // drop table
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+        // table shouldn't exist now
+        assert!(!admin.table_exists(&table_path).await.unwrap());
+
+        // drop database; a failed drop must fail the test rather than be silently ignored
+        let dropped = admin.drop_database(test_db_name, false, true).await;
+        dropped.expect("Failed to drop database");
+        // database shouldn't exist now
+        assert!(!admin.database_exists(test_db_name).await.unwrap());
     }
 }

From 1ec45d3c3e2d34d3bc1781d45895c09ee4483b23 Mon Sep 17 00:00:00 2001
From: naivedogger <59598718+naivedogger@users.noreply.github.com>
Date: Fri, 17 Oct 2025 16:54:04 +0800
Subject: [PATCH 014/287] [feat] Add examples and stub files for Python
 bindings (#10)

---------

Co-authored-by: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
---
 fluss-rust/.licenserc.yaml                    |   1 +
 fluss-rust/bindings/python/README.md          |  19 +-
 fluss-rust/bindings/python/example/example.py | 188 ++++++++++++++++++
 fluss-rust/bindings/python/fluss/__init__.pyi | 171 ++++++++++++++++
 fluss-rust/bindings/python/fluss/py.typed     |   0
 5 files changed, 369 insertions(+), 10 deletions(-)
 create mode 100644 fluss-rust/bindings/python/example/example.py
 create mode 100644 fluss-rust/bindings/python/fluss/__init__.pyi
 create mode 100644 fluss-rust/bindings/python/fluss/py.typed

diff --git a/fluss-rust/.licenserc.yaml b/fluss-rust/.licenserc.yaml
index 3813b484b3..a3cfcd146b 100644
--- a/fluss-rust/.licenserc.yaml
+++ b/fluss-rust/.licenserc.yaml
@@ -26,4 +26,5 @@ header:
     - 'LICENSE'
     - 'NOTICE'
     - 'DISCLAIMER'
+    - 'bindings/python/fluss/py.typed'
   comment: on-failure
diff --git a/fluss-rust/bindings/python/README.md b/fluss-rust/bindings/python/README.md
index 5258f53291..44d6099c6c 100644
--- a/fluss-rust/bindings/python/README.md
+++ b/fluss-rust/bindings/python/README.md
@@ -108,7 +108,7 @@ uv run python example/example.py
 ### Build API docs:
 
 ```bash
-uv run pdoc fluss_python
+uv run pdoc fluss
 ```
 
 ### Release
@@ -124,10 +124,10 @@ uv run maturin publish
 ## Project Structure
 ```
 bindings/python/
-├── Cargo.toml              # Rust dependency configuration
-├── pyproject.toml          # Python project configuration
-├── README.md              # This file
-├── src/                   # Rust source code
+├── Cargo.toml            # Rust dependency configuration
+├── pyproject.toml        # Python project configuration
+├── README.md             # This file
+├── src/                  # Rust source code
 │   ├── lib.rs            # Main entry module
 │   ├── config.rs         # Configuration related
 │   ├── connection.rs     # Connection management
@@ -135,11 +135,10 @@ bindings/python/
 │   ├── table.rs          # Table operations
 │   ├── types.rs          # Data types
 │   └── error.rs          # Error handling
-├── python/               # Python package source
-│   └── fluss_python/
-│       ├── __init__.py   # Python package entry
-│       ├── __init__.pyi  # Stub file
-│       └── py.typed      # Type declarations
+├── fluss/                # Python package source
+│   ├── __init__.py       # Python package entry
+│   ├── __init__.pyi      # Stub file
+│   └── py.typed          # Type declarations
 └── example/              # Example code
     └── example.py
 ```
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
new file mode 100644
index 0000000000..0523f943e4
--- /dev/null
+++ b/fluss-rust/bindings/python/example/example.py
@@ -0,0 +1,188 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+import asyncio
+import time
+
+import pandas as pd
+import pyarrow as pa
+
+import fluss
+
+
+async def main():
+    # Create connection configuration
+    config_spec = {
+        "bootstrap.servers": "127.0.0.1:9123",
+        # Add other configuration options as needed
+        "request.max.size": "10485760",  # 10 MB
+        "writer.acks": "all",  # Wait for all replicas to acknowledge
+        "writer.retries": "3",  # Retry up to 3 times on failure
+        "writer.batch.size": "1000",  # Batch size for writes
+    }
+    config = fluss.Config(config_spec)
+
+    # Create connection using the static connect method
+    conn = await fluss.FlussConnection.connect(config)
+
+    # Define fields for PyArrow
+    fields = [
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("score", pa.float32()),
+        pa.field("age", pa.int32()),
+    ]
+
+    # Create a PyArrow schema
+    schema = pa.schema(fields)
+
+    # Create a Fluss Schema first (this is what TableDescriptor expects)
+    fluss_schema = fluss.Schema(schema)
+
+    # Create a Fluss TableDescriptor
+    table_descriptor = fluss.TableDescriptor(fluss_schema)
+
+    # Get the admin for Fluss
+    admin = await conn.get_admin()
+
+    # Create a Fluss table
+    table_path = fluss.TablePath("fluss", "sample_table")
+
+    try:
+        await admin.create_table(table_path, table_descriptor, True)
+        print(f"Created table: {table_path}")
+    except Exception as e:
+        print(f"Table creation failed: {e}")
+
+    # Get table information via admin
+    try:
+        table_info = await admin.get_table(table_path)
+        print(f"Table info: {table_info}")
+        print(f"Table ID: {table_info.table_id}")
+        print(f"Schema ID: {table_info.schema_id}")
+        print(f"Created time: {table_info.created_time}")
+        print(f"Primary keys: {table_info.get_primary_keys()}")
+    except Exception as e:
+        print(f"Failed to get table info: {e}")
+
+    # Get the table instance
+    table = await conn.get_table(table_path)
+    print(f"Got table: {table}")
+
+    # Create a writer for the table
+    append_writer = await table.new_append_writer()
+    print(f"Created append writer: {append_writer}")
+
+    try:
+        # Test 1: Write PyArrow Table
+        print("\n--- Testing PyArrow Table write ---")
+        pa_table = pa.Table.from_arrays(
+            [
+                pa.array([1, 2, 3], type=pa.int32()),
+                pa.array(["Alice", "Bob", "Charlie"], type=pa.string()),
+                pa.array([95.2, 87.2, 92.1], type=pa.float32()),
+                pa.array([25, 30, 35], type=pa.int32()),
+            ],
+            schema=schema,
+        )
+
+        append_writer.write_arrow(pa_table)
+        print("Successfully wrote PyArrow Table")
+
+        # Test 2: Write PyArrow RecordBatch
+        print("\n--- Testing PyArrow RecordBatch write ---")
+        pa_record_batch = pa.RecordBatch.from_arrays(
+            [
+                pa.array([4, 5], type=pa.int32()),
+                pa.array(["David", "Eve"], type=pa.string()),
+                pa.array([88.5, 91.0], type=pa.float32()),
+                pa.array([28, 32], type=pa.int32()),
+            ],
+            schema=schema,
+        )
+
+        append_writer.write_arrow_batch(pa_record_batch)
+        print("Successfully wrote PyArrow RecordBatch")
+
+        # Test 3: Write Pandas DataFrame
+        print("\n--- Testing Pandas DataFrame write ---")
+        df = pd.DataFrame(
+            {
+                "id": [6, 7],
+                "name": ["Frank", "Grace"],
+                "score": [89.3, 94.7],
+                "age": [29, 27],
+            }
+        )
+
+        append_writer.write_pandas(df)
+        print("Successfully wrote Pandas DataFrame")
+
+        # Flush all pending data
+        print("\n--- Flushing data ---")
+        append_writer.flush()
+        print("Successfully flushed data")
+
+    except Exception as e:
+        print(f"Error during writing: {e}")
+
+    # Now scan the table to verify data was written
+    print("\n--- Scanning table ---")
+    try:
+        log_scanner = await table.new_log_scanner()
+        print(f"Created log scanner: {log_scanner}")
+
+        # Subscribe to scan from earliest to latest
+        # start_timestamp=None (earliest), end_timestamp=None (latest)
+        log_scanner.subscribe(None, None)
+
+        print("Scanning results using to_arrow():")
+
+        # Try to get as PyArrow Table
+        try:
+            pa_table_result = log_scanner.to_arrow()
+            print(f"\nAs PyArrow Table: {pa_table_result}")
+        except Exception as e:
+            print(f"Could not convert to PyArrow: {e}")
+
+        # Let's subscribe from the beginning again.
+        # Reset subscription
+        log_scanner.subscribe(None, None)
+
+        # Try to get as Pandas DataFrame
+        try:
+            df_result = log_scanner.to_pandas()
+            print(f"\nAs Pandas DataFrame:\n{df_result}")
+        except Exception as e:
+            print(f"Could not convert to Pandas: {e}")
+
+        # TODO: support to_arrow_batch_reader()
+        # which is reserved for streaming use cases
+
+        # TODO: support to_duckdb()
+
+    except Exception as e:
+        print(f"Error during scanning: {e}")
+
+    # Close connection
+    conn.close()
+    print("\nConnection closed")
+
+
+if __name__ == "__main__":
+    # Run the async main function
+    asyncio.run(main())
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
new file mode 100644
index 0000000000..45652425ba
--- /dev/null
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -0,0 +1,171 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Type stubs for Fluss Python bindings."""
+
+from types import TracebackType
+from typing import Dict, List, Optional, Tuple
+
+import pandas as pd
+import pyarrow as pa
+
+class Config:
+    def __init__(self, properties: Optional[Dict[str, str]] = None) -> None: ...
+    @property
+    def bootstrap_server(self) -> Optional[str]: ...
+    @bootstrap_server.setter
+    def bootstrap_server(self, server: str) -> None: ...
+    @property
+    def request_max_size(self) -> int: ...
+    @request_max_size.setter
+    def request_max_size(self, size: int) -> None: ...
+    @property
+    def writer_batch_size(self) -> int: ...
+    @writer_batch_size.setter
+    def writer_batch_size(self, size: int) -> None: ...
+
+class FlussConnection:
+    @staticmethod
+    async def connect(config: Config) -> FlussConnection: ...
+    async def get_admin(self) -> FlussAdmin: ...
+    async def get_table(self, table_path: TablePath) -> FlussTable: ...
+    def close(self) -> None: ...
+    def __enter__(self) -> FlussConnection: ...
+    def __exit__(self, exc_type: Optional[type], exc_value: Optional[BaseException], traceback: Optional[TracebackType]) -> bool: ...
+    def __repr__(self) -> str: ...
+
+class FlussAdmin:
+    async def create_table(
+        self,
+        table_path: TablePath,
+        table_descriptor: TableDescriptor,
+        ignore_if_exists: Optional[bool] = False,
+    ) -> None: ...
+    async def get_table(self, table_path: TablePath) -> TableInfo: ...
+    async def get_latest_lake_snapshot(self, table_path: TablePath) -> LakeSnapshot: ...
+    def __repr__(self) -> str: ...
+
+class FlussTable:
+    async def new_append_writer(self) -> AppendWriter: ...
+    async def new_log_scanner(self) -> LogScanner: ...
+    def get_table_info(self) -> TableInfo: ...
+    def get_table_path(self) -> TablePath: ...
+    def has_primary_key(self) -> bool: ...
+    def __repr__(self) -> str: ...
+
+class AppendWriter:
+    def write_arrow(self, table: pa.Table) -> None: ...
+    def write_arrow_batch(self, batch: pa.RecordBatch) -> None: ...
+    def write_pandas(self, df: pd.DataFrame) -> None: ...
+    def flush(self) -> None: ...
+    def __repr__(self) -> str: ...
+
+class LogScanner:
+    def subscribe(
+        self, start_timestamp: Optional[int], end_timestamp: Optional[int]
+    ) -> None: ...
+    def to_pandas(self) -> pd.DataFrame: ...
+    def to_arrow(self) -> pa.Table: ...
+    def __repr__(self) -> str: ...
+
+class Schema:
+    def __init__(self, schema: pa.Schema, primary_keys: Optional[List[str]] = None) -> None: ...
+    def get_column_names(self) -> List[str]: ...
+    def get_column_types(self) -> List[str]: ...
+    def get_columns(self) -> List[Tuple[str,str]]: ...
+    def __str__(self) -> str: ...
+
+class TableDescriptor:
+    def __init__(self, schema: Schema, **kwargs: str) -> None: ...
+    def get_schema(self) -> Schema: ...
+
+class TablePath:
+    def __init__(self, database: str, table: str) -> None: ...
+    @property
+    def database_name(self) -> str: ...
+    @property
+    def table_name(self) -> str: ...
+    def table_path_str(self) -> str: ...
+    def __str__(self) -> str: ...
+    def __repr__(self) -> str: ...
+    def __hash__(self) -> int: ...
+    def __eq__(self, other: object) -> bool: ...
+
+class TableInfo:
+    @property
+    def table_id(self) -> int: ...
+    @property
+    def schema_id(self) -> int: ...
+    @property
+    def created_time(self) -> int: ...
+    @property
+    def modified_time(self) -> int: ...
+    @property
+    def table_path(self) -> TablePath: ...
+    @property
+    def num_buckets(self) -> int: ...
+    @property
+    def comment(self) -> Optional[str]: ...
+    def get_primary_keys(self) -> List[str]: ...
+    def get_bucket_keys(self) -> List[str]: ...
+    def get_partition_keys(self) -> List[str]: ...
+    def has_primary_key(self) -> bool: ...
+    def is_partitioned(self) -> bool: ...
+    def get_properties(self) -> Dict[str, str]: ...
+    def get_custom_properties(self) -> Dict[str, str]: ...
+    def get_schema(self) -> Schema: ...
+    def get_column_names(self) -> List[str]: ...
+    def get_column_count(self) -> int: ...
+
+class FlussError(Exception):
+    message: str
+    def __init__(self, message: str) -> None: ...
+    def __str__(self) -> str: ...
+
+class LakeSnapshot:
+    def __init__(self, snapshot_id: int) -> None: ...
+    @property
+    def snapshot_id(self) -> int: ...
+    @property
+    def table_buckets_offset(self) -> Dict[TableBucket, int]: ...
+    def get_bucket_offset(self, bucket: TableBucket) -> Optional[int]: ...
+    def get_table_buckets(self) -> List[TableBucket]: ...
+    def __str__(self) -> str: ...
+    def __repr__(self) -> str: ...
+
+class TableBucket:
+    def __init__(self, table_id: int, bucket: int) -> None: ...
+    @staticmethod
+    def with_partition(
+        table_id: int, partition_id: int, bucket: int
+    ) -> TableBucket: ...
+    @property
+    def table_id(self) -> int: ...
+    @property
+    def bucket_id(self) -> int: ...
+    @property
+    def partition_id(self) -> Optional[int]: ...
+    def __hash__(self) -> int: ...
+    def __eq__(self, other: object) -> bool: ...
+    def __str__(self) -> str: ...
+    def __repr__(self) -> str: ...
+
+class TableDistribution:
+    def bucket_keys(self) -> List[str]: ...
+    def bucket_count(self) -> Optional[int]: ...
+
+__version__: str
diff --git a/fluss-rust/bindings/python/fluss/py.typed b/fluss-rust/bindings/python/fluss/py.typed
new file mode 100644
index 0000000000..e69de29bb2

From c0374eb31673e5aca338989bfc2f6d3829a1477f Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Mon, 20 Oct 2025 14:14:28 +0800
Subject: [PATCH 015/287] [chore] Move list offsets to admin (#35)

---
 fluss-rust/bindings/python/src/table.rs       |  68 ++++++------
 fluss-rust/bindings/python/src/utils.rs       |   4 +-
 fluss-rust/crates/fluss/src/client/admin.rs   | 104 +++++++++++++++++-
 .../crates/fluss/src/client/metadata.rs       |   3 +-
 .../crates/fluss/src/client/table/mod.rs      |   2 +
 .../crates/fluss/src/client/table/scanner.rs  | 101 -----------------
 .../crates/fluss/src/client/write/sender.rs   |   2 +-
 fluss-rust/crates/fluss/src/record/mod.rs     |   4 +
 fluss-rust/crates/fluss/src/rpc/mod.rs        |   2 -
 9 files changed, 149 insertions(+), 141 deletions(-)

diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 98943b939a..c255fa6f8a 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -17,12 +17,11 @@
 
 use crate::TOKIO_RUNTIME;
 use crate::*;
+use fluss::client::EARLIEST_OFFSET;
+use fluss::rpc::message::OffsetSpec;
 use pyo3_async_runtimes::tokio::future_into_py;
-use std::collections::HashSet;
 use std::sync::Arc;
 
-const EARLIEST_OFFSET: i64 = -2;
-
 /// Represents a Fluss table for data operations
 #[pyclass]
 pub struct FlussTable {
@@ -70,8 +69,12 @@ impl FlussTable {
 
             let rust_scanner = table_scan.create_log_scanner();
 
-            let py_scanner = LogScanner::from_core(rust_scanner, table_info.clone());
+            let admin = conn
+                .get_admin()
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
 
+            let py_scanner = LogScanner::from_core(rust_scanner, admin, table_info.clone());
             Python::with_gil(|py| Py::new(py, py_scanner))
         })
     }
@@ -275,6 +278,7 @@ impl AppendWriter {
 #[pyclass]
 pub struct LogScanner {
     inner: fcore::client::LogScanner,
+    admin: fcore::client::FlussAdmin,
     table_info: fcore::metadata::TableInfo,
     #[allow(dead_code)]
     start_timestamp: Option<i64>,
@@ -327,50 +331,50 @@ impl LogScanner {
         let bucket_ids: Vec<i32> = (0..num_buckets).collect();
 
         // todo: after supporting list_offsets with timestamp, we can use start_timestamp and end_timestamp here
-        let target_offsets: HashMap<i32, i64> = TOKIO_RUNTIME
-            .block_on(async { self.inner.list_offsets_latest(bucket_ids).await })
+        let mut stopping_offsets: HashMap<i32, i64> = TOKIO_RUNTIME
+            .block_on(async {
+                self.admin
+                    .list_offsets(
+                        &self.table_info.table_path,
+                        bucket_ids.as_slice(),
+                        OffsetSpec::Latest,
+                    )
+                    .await
+            })
             .map_err(|e| FlussError::new_err(e.to_string()))?;
 
-        let mut current_offsets: HashMap<i32, i64> = HashMap::new();
-        let mut completed_buckets: HashSet<i32> = HashSet::new();
-
-        if !target_offsets.is_empty() {
+        if !stopping_offsets.is_empty() {
             loop {
                 let batch_result = TOKIO_RUNTIME
                     .block_on(async { self.inner.poll(Duration::from_millis(500)).await });
 
                 match batch_result {
                     Ok(scan_records) => {
-                        let mut filtered_records: HashMap<
-                            fcore::metadata::TableBucket,
-                            Vec<fcore::record::ScanRecord>,
-                        > = HashMap::new();
-                        for (bucket, records) in scan_records.records_by_buckets() {
-                            let bucket_id = bucket.bucket_id();
-                            if completed_buckets.contains(&bucket_id) {
+                        let mut result_records: Vec<fcore::record::ScanRecord> = vec![];
+                        for (bucket, records) in scan_records.into_records_by_buckets() {
+                            let stopping_offset = stopping_offsets.get(&bucket.bucket_id());
+
+                            if stopping_offset.is_none() {
+                                // no stopping offset is tracked for this bucket, i.e. its end
+                                // offset has already been reached, so skip its records
                                 continue;
                             }
                             if let Some(last_record) = records.last() {
                                 let offset = last_record.offset();
-                                current_offsets.insert(bucket_id, offset);
-                                filtered_records.insert(bucket.clone(), records.clone());
-                                if offset >= target_offsets[&bucket_id] - 1 {
-                                    completed_buckets.insert(bucket_id);
+                                result_records.extend(records);
+                                if offset >= stopping_offset.unwrap() - 1 {
+                                    stopping_offsets.remove(&bucket.bucket_id());
                                 }
                             }
                         }
 
-                        if !filtered_records.is_empty() {
-                            let filtered_scan_records =
-                                fcore::record::ScanRecords::new(filtered_records);
-                            let arrow_batch =
-                                Utils::convert_scan_records_to_arrow(filtered_scan_records);
+                        if !result_records.is_empty() {
+                            let arrow_batch = Utils::convert_scan_records_to_arrow(result_records);
                             all_batches.extend(arrow_batch);
                         }
 
-                        // completed bucket is equal to all target buckets,
-                        // we can break scan records
-                        if completed_buckets.len() == target_offsets.len() {
+                        // we have reached the end offsets of all buckets
+                        if stopping_offsets.is_empty() {
                             break;
                         }
                     }
@@ -399,11 +403,13 @@ impl LogScanner {
 impl LogScanner {
     /// Create LogScanner from core LogScanner
     pub fn from_core(
-        inner: fcore::client::LogScanner,
+        inner_scanner: fcore::client::LogScanner,
+        admin: fcore::client::FlussAdmin,
         table_info: fcore::metadata::TableInfo,
     ) -> Self {
         Self {
-            inner,
+            inner: inner_scanner,
+            admin,
             table_info,
             start_timestamp: None,
             end_timestamp: None,
diff --git a/fluss-rust/bindings/python/src/utils.rs b/fluss-rust/bindings/python/src/utils.rs
index 9642e9d95b..93933b3774 100644
--- a/fluss-rust/bindings/python/src/utils.rs
+++ b/fluss-rust/bindings/python/src/utils.rs
@@ -152,9 +152,9 @@ impl Utils {
             .map_err(|e| FlussError::new_err(format!("Invalid kv format '{format_str}': {e}")))
     }
 
-    /// Convert ScanRecords to Arrow RecordBatch
+    /// Convert Vec<ScanRecord> to Arrow RecordBatch
     pub fn convert_scan_records_to_arrow(
-        _scan_records: fcore::record::ScanRecords,
+        _scan_records: Vec<fcore::record::ScanRecord>,
     ) -> Vec<Arc<arrow::record_batch::RecordBatch>> {
         let mut result = Vec::new();
         for record in _scan_records {
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index fd0f316374..fefab43520 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -25,13 +25,16 @@ use crate::rpc::message::{
     DropTableRequest, GetDatabaseInfoRequest, GetLatestLakeSnapshotRequest, GetTableRequest,
     ListDatabasesRequest, ListTablesRequest, TableExistsRequest,
 };
+use crate::rpc::message::{ListOffsetsRequest, OffsetSpec};
 use crate::rpc::{RpcClient, ServerConnection};
 
-use std::collections::HashMap;
-use std::sync::Arc;
-
+use crate::BucketId;
 use crate::error::Result;
 use crate::proto::GetTableInfoResponse;
+use std::collections::HashMap;
+use std::slice::from_ref;
+use std::sync::Arc;
+use tokio::task::JoinHandle;
 
 pub struct FlussAdmin {
     admin_gateway: ServerConnection,
@@ -216,4 +219,99 @@ impl FlussAdmin {
             table_buckets_offset,
         ))
     }
+
+    /// List offsets for the specified buckets. This operation can be used to find the beginning
+    /// offset, the end offset, or the offset matching a timestamp for each bucket.
+    pub async fn list_offsets(
+        &self,
+        table_path: &TablePath,
+        buckets_id: &[BucketId],
+        offset_spec: OffsetSpec,
+    ) -> Result<HashMap<i32, i64>> {
+        self.metadata
+            .check_and_update_table_metadata(from_ref(table_path))
+            .await?;
+
+        let cluster = self.metadata.get_cluster();
+        let table_id = cluster.get_table(table_path).table_id;
+
+        // Prepare requests
+        let requests_by_server =
+            self.prepare_list_offsets_requests(table_id, None, buckets_id, offset_spec)?;
+
+        // Send Requests
+        let response_futures = self.send_list_offsets_request(requests_by_server).await?;
+
+        let mut results = HashMap::new();
+
+        for response_future in response_futures {
+            let offsets = response_future.await.map_err(
+                // todo: consider using a more suitable error
+                |e| crate::error::Error::WriteError(format!("Fail to get result: {e}")),
+            )?;
+            results.extend(offsets?);
+        }
+        Ok(results)
+    }
+
+    fn prepare_list_offsets_requests(
+        &self,
+        table_id: i64,
+        partition_id: Option<i64>,
+        buckets: &[BucketId],
+        offset_spec: OffsetSpec,
+    ) -> Result<HashMap<i32, ListOffsetsRequest>> {
+        let cluster = self.metadata.get_cluster();
+        let mut node_for_bucket_list: HashMap<i32, Vec<i32>> = HashMap::new();
+
+        for bucket_id in buckets {
+            let table_bucket = TableBucket::new(table_id, *bucket_id);
+            let leader = cluster.leader_for(&table_bucket).ok_or_else(|| {
+                // todo: consider using a more suitable error
+                crate::error::Error::InvalidTableError(format!(
+                    "No leader found for table bucket: table_id={table_id}, bucket_id={bucket_id}"
+                ))
+            })?;
+
+            node_for_bucket_list
+                .entry(leader.id())
+                .or_default()
+                .push(*bucket_id);
+        }
+
+        let mut list_offsets_requests = HashMap::new();
+        for (leader_id, bucket_ids) in node_for_bucket_list {
+            let request =
+                ListOffsetsRequest::new(table_id, partition_id, bucket_ids, offset_spec.clone());
+            list_offsets_requests.insert(leader_id, request);
+        }
+        Ok(list_offsets_requests)
+    }
+
+    async fn send_list_offsets_request(
+        &self,
+        request_map: HashMap<i32, ListOffsetsRequest>,
+    ) -> Result<Vec<JoinHandle<Result<HashMap<i32, i64>>>>> {
+        let mut tasks = Vec::new();
+
+        for (leader_id, request) in request_map {
+            let rpc_client = self.rpc_client.clone();
+            let metadata = self.metadata.clone();
+
+            let task = tokio::spawn(async move {
+                let cluster = metadata.get_cluster();
+                let tablet_server = cluster.get_tablet_server(leader_id).ok_or_else(|| {
+                    // todo: consider using a more suitable error
+                    crate::error::Error::InvalidTableError(format!(
+                        "Tablet server {leader_id} not found"
+                    ))
+                })?;
+                let connection = rpc_client.get_connection(tablet_server).await?;
+                let list_offsets_response = connection.request(request).await?;
+                list_offsets_response.offsets()
+            });
+            tasks.push(task);
+        }
+        Ok(tasks)
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index ebfb959f65..3c3ba4bd2e 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -17,7 +17,8 @@
 
 use crate::cluster::{Cluster, ServerNode, ServerType};
 use crate::metadata::{TableBucket, TablePath};
-use crate::rpc::{RpcClient, ServerConnection, UpdateMetadataRequest};
+use crate::rpc::message::UpdateMetadataRequest;
+use crate::rpc::{RpcClient, ServerConnection};
 use parking_lot::RwLock;
 use std::collections::HashSet;
 use std::net::SocketAddr;
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 07e64948fa..52ae700fc6 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -22,6 +22,8 @@ use std::sync::Arc;
 
 use crate::error::Result;
 
+pub const EARLIEST_OFFSET: i64 = -2;
+
 mod append;
 
 mod scanner;
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index cbe724896e..e1ab59ffbb 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -22,14 +22,12 @@ use crate::metadata::{TableBucket, TableInfo, TablePath};
 use crate::proto::{FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
 use crate::record::{LogRecordsBatchs, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
 use crate::rpc::RpcClient;
-use crate::rpc::message::{ListOffsetsRequest, OffsetSpec};
 use crate::util::FairBucketStatusMap;
 use parking_lot::RwLock;
 use std::collections::HashMap;
 use std::slice::from_ref;
 use std::sync::Arc;
 use std::time::Duration;
-use tokio::task::JoinHandle;
 
 const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
 #[allow(dead_code)]
@@ -67,7 +65,6 @@ pub struct LogScanner {
     metadata: Arc<Metadata>,
     log_scanner_status: Arc<LogScannerStatus>,
     log_fetcher: LogFetcher,
-    conns: Arc<RpcClient>,
 }
 
 impl LogScanner {
@@ -88,7 +85,6 @@ impl LogScanner {
                 metadata.clone(),
                 log_scanner_status.clone(),
             ),
-            conns: connections.clone(),
         }
     }
 
@@ -106,103 +102,6 @@ impl LogScanner {
         Ok(())
     }
 
-    pub async fn list_offsets_latest(&self, buckets: Vec<i32>) -> Result<HashMap<i32, i64>> {
-        // TODO: support partition_id
-        let partition_id = None;
-        let offset_spec = OffsetSpec::Latest;
-
-        self.metadata
-            .check_and_update_table_metadata(from_ref(&self.table_path))
-            .await?;
-
-        let cluster = self.metadata.get_cluster();
-        let table_id = cluster.get_table(&self.table_path).table_id;
-
-        // Prepare requests
-        let requests_by_server = self.prepare_list_offsets_requests(
-            table_id,
-            partition_id,
-            buckets.clone(),
-            offset_spec,
-        )?;
-
-        // Send Requests
-        let response_futures = self.send_list_offsets_request(requests_by_server).await?;
-
-        let mut results = HashMap::new();
-
-        for response_future in response_futures {
-            let offsets = response_future.await.map_err(
-                // todo: consider use suitable error
-                |e| crate::error::Error::WriteError(format!("Fail to get result: {e}")),
-            )?;
-            results.extend(offsets?);
-        }
-        Ok(results)
-    }
-
-    fn prepare_list_offsets_requests(
-        &self,
-        table_id: i64,
-        partition_id: Option<i64>,
-        buckets: Vec<i32>,
-        offset_spec: OffsetSpec,
-    ) -> Result<HashMap<i32, ListOffsetsRequest>> {
-        let cluster = self.metadata.get_cluster();
-        let mut node_for_bucket_list: HashMap<i32, Vec<i32>> = HashMap::new();
-
-        for bucket_id in buckets {
-            let table_bucket = TableBucket::new(table_id, bucket_id);
-            let leader = cluster.leader_for(&table_bucket).ok_or_else(|| {
-                // todo: consider use another suitable error
-                crate::error::Error::InvalidTableError(format!(
-                    "No leader found for table bucket: table_id={table_id}, bucket_id={bucket_id}"
-                ))
-            })?;
-
-            node_for_bucket_list
-                .entry(leader.id())
-                .or_default()
-                .push(bucket_id);
-        }
-
-        let mut list_offsets_requests = HashMap::new();
-        for (leader_id, bucket_ids) in node_for_bucket_list {
-            let request =
-                ListOffsetsRequest::new(table_id, partition_id, bucket_ids, offset_spec.clone());
-            list_offsets_requests.insert(leader_id, request);
-        }
-        Ok(list_offsets_requests)
-    }
-
-    async fn send_list_offsets_request(
-        &self,
-        request_map: HashMap<i32, ListOffsetsRequest>,
-    ) -> Result<Vec<JoinHandle<Result<HashMap<i32, i64>>>>> {
-        let mut tasks = Vec::new();
-
-        for (leader_id, request) in request_map {
-            let rpc_client = self.conns.clone();
-            let metadata = self.metadata.clone();
-
-            let task = tokio::spawn(async move {
-                let cluster = metadata.get_cluster();
-                let tablet_server = cluster.get_tablet_server(leader_id).ok_or_else(|| {
-                    // todo: consider use more suitable error
-                    crate::error::Error::InvalidTableError(format!(
-                        "Tablet server {leader_id} not found"
-                    ))
-                })?;
-                let connection = rpc_client.get_connection(tablet_server).await?;
-                let list_offsets_response = connection.request(request).await?;
-                list_offsets_response.offsets()
-            });
-            tasks.push(task);
-        }
-
-        Ok(tasks)
-    }
-
     async fn poll_for_fetches(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
         self.log_fetcher.send_fetches_and_collect().await
     }
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index 381e10c5b1..e25e2bace2 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -21,7 +21,7 @@ use crate::error::Error::WriteError;
 use crate::error::Result;
 use crate::metadata::TableBucket;
 use crate::proto::ProduceLogResponse;
-use crate::rpc::ProduceLogRequest;
+use crate::rpc::message::ProduceLogRequest;
 use parking_lot::Mutex;
 use std::collections::HashMap;
 use std::sync::Arc;
diff --git a/fluss-rust/crates/fluss/src/record/mod.rs b/fluss-rust/crates/fluss/src/record/mod.rs
index 07fbe0808c..35928ea082 100644
--- a/fluss-rust/crates/fluss/src/record/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/mod.rs
@@ -163,6 +163,10 @@ impl ScanRecords {
     pub fn records_by_buckets(&self) -> &HashMap<TableBucket, Vec<ScanRecord>> {
         &self.records
     }
+
+    pub fn into_records_by_buckets(self) -> HashMap<TableBucket, Vec<ScanRecord>> {
+        self.records
+    }
 }
 
 impl IntoIterator for ScanRecords {
diff --git a/fluss-rust/crates/fluss/src/rpc/mod.rs b/fluss-rust/crates/fluss/src/rpc/mod.rs
index 496c015073..b8705a3f65 100644
--- a/fluss-rust/crates/fluss/src/rpc/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/mod.rs
@@ -26,6 +26,4 @@ pub use server_connection::*;
 mod convert;
 mod transport;
 
-pub use message::*;
-
 pub use convert::*;

From b27625907e11d9ad51251db40e84d5c968a57409 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Tue, 21 Oct 2025 15:04:50 +0800
Subject: [PATCH 016/287] [feat] Support append arrow record batch (#34)

---
 fluss-rust/.github/workflows/ci.yml           |   2 +-
 .../crates/fluss/src/client/table/append.rs   |  11 +-
 .../fluss/src/client/write/accumulator.rs     |   4 +-
 .../crates/fluss/src/client/write/batch.rs    |  22 +-
 .../crates/fluss/src/client/write/mod.rs      |  20 +-
 .../crates/fluss/src/client/write/sender.rs   |   1 -
 .../fluss/src/client/write/writer_client.rs   |  33 +--
 fluss-rust/crates/fluss/src/record/arrow.rs   | 211 +++++++++++++-----
 .../crates/fluss/tests/integration/admin.rs   |   8 +-
 .../fluss/tests/integration/fluss_cluster.rs  |  67 ++++--
 .../crates/fluss/tests/integration/table.rs   | 132 +++++++++++
 .../crates/fluss/tests/integration/utils.rs   |  30 +++
 fluss-rust/crates/fluss/tests/test_fluss.rs   |   3 +
 13 files changed, 443 insertions(+), 101 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/tests/integration/table.rs
 create mode 100644 fluss-rust/crates/fluss/tests/integration/utils.rs

diff --git a/fluss-rust/.github/workflows/ci.yml b/fluss-rust/.github/workflows/ci.yml
index 73e2b3f172..69625f8f2e 100644
--- a/fluss-rust/.github/workflows/ci.yml
+++ b/fluss-rust/.github/workflows/ci.yml
@@ -91,7 +91,7 @@ jobs:
         # only run IT in linux since no docker in macos by default
         run: |
           if [ "$RUNNER_OS" == "Linux" ]; then
-            cargo test --features integration_tests --all-targets --workspace
+            RUST_TEST_THREADS=1 cargo test --features integration_tests --all-targets --workspace  -- --nocapture
           fi
         env:
           RUST_LOG: DEBUG
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
index bf15266706..ad3e55e288 100644
--- a/fluss-rust/crates/fluss/src/client/table/append.rs
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -16,12 +16,12 @@
 // under the License.
 
 use crate::client::{WriteRecord, WriterClient};
+use crate::error::Result;
 use crate::metadata::{TableInfo, TablePath};
 use crate::row::GenericRow;
+use arrow::array::RecordBatch;
 use std::sync::Arc;
 
-use crate::error::Result;
-
 #[allow(dead_code)]
 pub struct TableAppend {
     table_path: TablePath,
@@ -63,6 +63,13 @@ impl AppendWriter {
         result_handle.result(result)
     }
 
+    pub async fn append_arrow_batch(&self, batch: RecordBatch) -> Result<()> {
+        let record = WriteRecord::new_record_batch(self.table_path.clone(), batch);
+        let result_handle = self.writer_client.send(&record).await?;
+        let result = result_handle.wait().await?;
+        result_handle.result(result)
+    }
+
     pub async fn flush(&self) -> Result<()> {
         self.writer_client.flush().await
     }
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 32622c7b2d..e4ca957827 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -17,7 +17,7 @@
 
 use crate::client::write::batch::WriteBatch::ArrowLog;
 use crate::client::write::batch::{ArrowLogWriteBatch, WriteBatch};
-use crate::client::{ResultHandle, WriteRecord};
+use crate::client::{Record, ResultHandle, WriteRecord};
 use crate::cluster::{BucketLocation, Cluster, ServerNode};
 use crate::config::Config;
 use crate::error::Result;
@@ -105,6 +105,7 @@ impl RecordAccumulator {
             row_type,
             bucket_id,
             current_time_ms(),
+            matches!(record.row, Record::RecordBatch(_)),
         ));
 
         let batch_id = batch.batch_id();
@@ -159,7 +160,6 @@ impl RecordAccumulator {
                 true, false, true,
             ));
         }
-
         self.append_new_batch(cluster, record, bucket_id, &mut dq_guard)
     }
 
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index 64c5dd6517..13b3d36402 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -18,11 +18,10 @@
 use crate::BucketId;
 use crate::client::broadcast::{BatchWriteResult, BroadcastOnce};
 use crate::client::{ResultHandle, WriteRecord};
-use crate::metadata::{DataType, TablePath};
-use std::cmp::max;
-
 use crate::error::Result;
+use crate::metadata::{DataType, TablePath};
 use crate::record::MemoryLogRecordsArrowBuilder;
+use std::cmp::max;
 
 #[allow(dead_code)]
 pub struct InnerWriteBatch {
@@ -140,12 +139,16 @@ impl ArrowLogWriteBatch {
         row_type: &DataType,
         bucket_id: BucketId,
         create_ms: i64,
+        to_append_record_batch: bool,
     ) -> Self {
         let base = InnerWriteBatch::new(batch_id, table_path, create_ms, bucket_id);
-
         Self {
             write_batch: base,
-            arrow_builder: MemoryLogRecordsArrowBuilder::new(schema_id, row_type),
+            arrow_builder: MemoryLogRecordsArrowBuilder::new(
+                schema_id,
+                row_type,
+                to_append_record_batch,
+            ),
         }
     }
 
@@ -157,8 +160,13 @@ impl ArrowLogWriteBatch {
         if self.arrow_builder.is_closed() || self.arrow_builder.is_full() {
             Ok(None)
         } else {
-            self.arrow_builder.append(&write_record.row)?;
-            Ok(Some(ResultHandle::new(self.write_batch.results.receiver())))
+            // append successfully
+            if self.arrow_builder.append(write_record)? {
+                Ok(Some(ResultHandle::new(self.write_batch.results.receiver())))
+            } else {
+                // append fail
+                Ok(None)
+            }
         }
     }
 
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index 74df951115..e632cde451 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -23,6 +23,7 @@ use crate::error::Error;
 use crate::metadata::TablePath;
 use crate::row::GenericRow;
 pub use accumulator::*;
+use arrow::array::RecordBatch;
 use std::sync::Arc;
 
 pub(crate) mod broadcast;
@@ -34,13 +35,28 @@ mod writer_client;
 pub use writer_client::WriterClient;
 
 pub struct WriteRecord<'a> {
-    pub row: GenericRow<'a>,
+    pub row: Record<'a>,
     pub table_path: Arc<TablePath>,
 }
 
+pub enum Record<'a> {
+    Row(GenericRow<'a>),
+    RecordBatch(Arc<RecordBatch>),
+}
+
 impl<'a> WriteRecord<'a> {
     pub fn new(table_path: Arc<TablePath>, row: GenericRow<'a>) -> Self {
-        Self { row, table_path }
+        Self {
+            row: Record::Row(row),
+            table_path,
+        }
+    }
+
+    pub fn new_record_batch(table_path: Arc<TablePath>, row: RecordBatch) -> Self {
+        Self {
+            row: Record::RecordBatch(Arc::new(row)),
+            table_path,
+        }
     }
 }
 
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index e25e2bace2..27460e3863 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -122,7 +122,6 @@ impl Sender {
         collated: &HashMap<i32, Vec<Arc<ReadyWriteBatch>>>,
     ) -> Result<()> {
         for (leader_id, batches) in collated {
-            println!("send request batch");
             self.send_write_request(*leader_id, self.ack, batches)
                 .await?;
         }
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index 01fe2899ba..28f5371e8d 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -90,20 +90,12 @@ impl WriterClient {
         let table_path = &record.table_path;
         let cluster = self.metadata.get_cluster();
 
-        let bucket_assigner = {
-            if let Some(assigner) = self.bucket_assigners.get(table_path) {
-                assigner.clone()
-            } else {
-                let assigner = Arc::new(Self::create_bucket_assigner(table_path.as_ref()));
-                self.bucket_assigners
-                    .insert(table_path.as_ref().clone(), assigner.clone());
-                assigner
-            }
-        };
+        let (bucket_assigner, bucket_id) = self.assign_bucket(table_path);
 
-        let bucket_id = bucket_assigner.assign_bucket(None, &cluster);
-
-        let mut result = self.accumulate.append(record, 1, &cluster, true).await?;
+        let mut result = self
+            .accumulate
+            .append(record, bucket_id, &cluster, true)
+            .await?;
 
         if result.abort_record_for_new_batch {
             let prev_bucket_id = bucket_id;
@@ -121,6 +113,21 @@ impl WriterClient {
 
         Ok(result.result_handle.expect("result_handle should exist"))
     }
+    fn assign_bucket(&self, table_path: &Arc<TablePath>) -> (Arc<Box<dyn BucketAssigner>>, i32) {
+        let cluster = self.metadata.get_cluster();
+        let bucket_assigner = {
+            if let Some(assigner) = self.bucket_assigners.get(table_path) {
+                assigner.clone()
+            } else {
+                let assigner = Arc::new(Self::create_bucket_assigner(table_path.as_ref()));
+                self.bucket_assigners
+                    .insert(table_path.as_ref().clone(), assigner.clone());
+                assigner
+            }
+        };
+        let bucket_id = bucket_assigner.assign_bucket(None, &cluster);
+        (bucket_assigner, bucket_id)
+    }
 
     pub async fn close(self) -> Result<()> {
         self.shutdown_tx
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index fa63b00603..487f50c348 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -15,6 +15,11 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::client::{Record, WriteRecord};
+use crate::error::Result;
+use crate::metadata::DataType;
+use crate::record::{ChangeType, ScanRecord};
+use crate::row::{ColumnarRow, GenericRow};
 use arrow::array::{
     ArrayBuilder, ArrayRef, BinaryBuilder, BooleanBuilder, Float32Builder, Float64Builder,
     Int8Builder, Int16Builder, Int32Builder, Int64Builder, StringBuilder, UInt8Builder,
@@ -35,11 +40,6 @@ use std::{
     sync::Arc,
 };
 
-use crate::error::Result;
-use crate::metadata::DataType;
-use crate::record::{ChangeType, ScanRecord};
-use crate::row::{ColumnarRow, GenericRow};
-
 /// const for record batch
 pub const BASE_OFFSET_LENGTH: usize = 8;
 pub const LENGTH_LENGTH: usize = 4;
@@ -95,14 +95,71 @@ pub struct MemoryLogRecordsArrowBuilder {
     magic: u8,
     writer_id: i64,
     batch_sequence: i32,
+    arrow_record_batch_builder: Box<dyn ArrowRecordBatchInnerBuilder>,
+    is_closed: bool,
+}
+
+pub trait ArrowRecordBatchInnerBuilder: Send + Sync {
+    fn build_arrow_record_batch(&self) -> Result<Arc<RecordBatch>>;
+
+    fn append(&mut self, row: &GenericRow) -> Result<bool>;
+
+    fn append_batch(&mut self, record_batch: Arc<RecordBatch>) -> Result<bool>;
+
+    fn schema(&self) -> SchemaRef;
+
+    fn records_count(&self) -> i32;
+
+    fn is_full(&self) -> bool;
+}
+
+#[derive(Default)]
+pub struct PrebuiltRecordBatchBuilder {
+    arrow_record_batch: Option<Arc<RecordBatch>>,
+    records_count: i32,
+}
+
+impl ArrowRecordBatchInnerBuilder for PrebuiltRecordBatchBuilder {
+    fn build_arrow_record_batch(&self) -> Result<Arc<RecordBatch>> {
+        Ok(self.arrow_record_batch.as_ref().unwrap().clone())
+    }
+
+    fn append(&mut self, _row: &GenericRow) -> Result<bool> {
+        // Appending a single row is not supported here; always report `false`.
+        Ok(false)
+    }
+
+    fn append_batch(&mut self, record_batch: Arc<RecordBatch>) -> Result<bool> {
+        if self.arrow_record_batch.is_some() {
+            return Ok(false);
+        }
+        self.records_count = record_batch.num_rows() as i32;
+        self.arrow_record_batch = Some(record_batch);
+        Ok(true)
+    }
+
+    fn schema(&self) -> SchemaRef {
+        self.arrow_record_batch.as_ref().unwrap().schema()
+    }
+
+    fn records_count(&self) -> i32 {
+        self.records_count
+    }
+
+    fn is_full(&self) -> bool {
+        // Full as soon as a record batch has been stored.
+        self.arrow_record_batch.is_some()
+    }
+}
+
+pub struct RowAppendRecordBatchBuilder {
     table_schema: SchemaRef,
-    record_count: i32,
     arrow_column_builders: Mutex<Vec<Box<dyn ArrayBuilder>>>,
-    is_closed: bool,
+    records_count: i32,
 }
 
-impl MemoryLogRecordsArrowBuilder {
-    pub fn new(schema_id: i32, row_type: &DataType) -> Self {
+impl RowAppendRecordBatchBuilder {
+    pub fn new(row_type: &DataType) -> Self {
         let schema_ref = to_arrow_schema(row_type);
         let builders = Mutex::new(
             schema_ref
@@ -111,32 +168,106 @@ impl MemoryLogRecordsArrowBuilder {
                 .map(|field| Self::create_builder(field.data_type()))
                 .collect(),
         );
+        Self {
+            table_schema: schema_ref.clone(),
+            arrow_column_builders: builders,
+            records_count: 0,
+        }
+    }
+
+    fn create_builder(data_type: &arrow_schema::DataType) -> Box<dyn ArrayBuilder> {
+        match data_type {
+            arrow_schema::DataType::Int8 => Box::new(Int8Builder::new()),
+            arrow_schema::DataType::Int16 => Box::new(Int16Builder::new()),
+            arrow_schema::DataType::Int32 => Box::new(Int32Builder::new()),
+            arrow_schema::DataType::Int64 => Box::new(Int64Builder::new()),
+            arrow_schema::DataType::UInt8 => Box::new(UInt8Builder::new()),
+            arrow_schema::DataType::UInt16 => Box::new(UInt16Builder::new()),
+            arrow_schema::DataType::UInt32 => Box::new(UInt32Builder::new()),
+            arrow_schema::DataType::UInt64 => Box::new(UInt64Builder::new()),
+            arrow_schema::DataType::Float32 => Box::new(Float32Builder::new()),
+            arrow_schema::DataType::Float64 => Box::new(Float64Builder::new()),
+            arrow_schema::DataType::Boolean => Box::new(BooleanBuilder::new()),
+            arrow_schema::DataType::Utf8 => Box::new(StringBuilder::new()),
+            arrow_schema::DataType::Binary => Box::new(BinaryBuilder::new()),
+            dt => panic!("Unsupported data type: {dt:?}"),
+        }
+    }
+}
+
+impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
+    fn build_arrow_record_batch(&self) -> Result<Arc<RecordBatch>> {
+        let arrays = self
+            .arrow_column_builders
+            .lock()
+            .iter_mut()
+            .map(|b| b.finish())
+            .collect::<Vec<ArrayRef>>();
+        Ok(Arc::new(RecordBatch::try_new(
+            self.table_schema.clone(),
+            arrays,
+        )?))
+    }
+
+    fn append(&mut self, row: &GenericRow) -> Result<bool> {
+        // Take the builders lock once per row instead of once per column.
+        let mut builders = self.arrow_column_builders.lock();
+        for (idx, value) in row.values.iter().enumerate() {
+            value.append_to(builders.get_mut(idx).unwrap().as_mut())?;
+        }
+        self.records_count += 1;
+        Ok(true)
+    }
+
+    fn append_batch(&mut self, _record_batch: Arc<RecordBatch>) -> Result<bool> {
+        Ok(false)
+    }
+
+    fn schema(&self) -> SchemaRef {
+        self.table_schema.clone()
+    }
+
+    fn records_count(&self) -> i32 {
+        self.records_count
+    }
+
+    fn is_full(&self) -> bool {
+        self.records_count() >= DEFAULT_MAX_RECORD
+    }
+}
+
+impl MemoryLogRecordsArrowBuilder {
+    pub fn new(schema_id: i32, row_type: &DataType, to_append_record_batch: bool) -> Self {
+        let arrow_batch_builder: Box<dyn ArrowRecordBatchInnerBuilder> = {
+            if to_append_record_batch {
+                Box::new(PrebuiltRecordBatchBuilder::default())
+            } else {
+                Box::new(RowAppendRecordBatchBuilder::new(row_type))
+            }
+        };
         MemoryLogRecordsArrowBuilder {
             base_log_offset: BUILDER_DEFAULT_OFFSET,
             schema_id,
             magic: CURRENT_LOG_MAGIC_VALUE,
             writer_id: NO_WRITER_ID,
             batch_sequence: NO_BATCH_SEQUENCE,
-            record_count: 0,
-            table_schema: schema_ref,
-            arrow_column_builders: builders,
             is_closed: false,
+            arrow_record_batch_builder: arrow_batch_builder,
         }
     }
 
-    pub fn append(&mut self, row: &GenericRow) -> Result<()> {
-        for (idx, value) in row.values.iter().enumerate() {
-            let mut builder_binding = self.arrow_column_builders.lock();
-            let builder = builder_binding.get_mut(idx).unwrap();
-            value.append_to(builder.as_mut())?;
+    pub fn append(&mut self, record: &WriteRecord) -> Result<bool> {
+        match &record.row {
+            Record::Row(row) => Ok(self.arrow_record_batch_builder.append(row)?),
+            Record::RecordBatch(record_batch) => Ok(self
+                .arrow_record_batch_builder
+                .append_batch(record_batch.clone())?),
         }
-        self.record_count += 1;
         // todo: consider write other change type
-        Ok(())
     }
 
     pub fn is_full(&self) -> bool {
-        self.record_count >= DEFAULT_MAX_RECORD
+        self.arrow_record_batch_builder.is_full()
     }
 
     pub fn is_closed(&self) -> bool {
@@ -150,18 +281,12 @@ impl MemoryLogRecordsArrowBuilder {
     pub fn build(&self) -> Result<Vec<u8>> {
         // serialize arrow batch
         let mut arrow_batch_bytes = vec![];
-        let mut writer = StreamWriter::try_new(&mut arrow_batch_bytes, &self.table_schema)?;
-
-        let arrays = self
-            .arrow_column_builders
-            .lock()
-            .iter_mut()
-            .map(|b| b.finish())
-            .collect::<Vec<ArrayRef>>();
-        let record_batch = RecordBatch::try_new(self.table_schema.clone(), arrays)?;
+        let table_schema = self.arrow_record_batch_builder.schema();
+        let mut writer = StreamWriter::try_new(&mut arrow_batch_bytes, &table_schema)?;
         // get header len
         let header = writer.get_ref().len();
-        writer.write(&record_batch)?;
+        let record_batch = self.arrow_record_batch_builder.build_arrow_record_batch()?;
+        writer.write(record_batch.as_ref())?;
         // get real arrow batch bytes
         let real_arrow_batch_bytes = &arrow_batch_bytes[header..];
 
@@ -195,39 +320,21 @@ impl MemoryLogRecordsArrowBuilder {
         cursor.write_u32::<LittleEndian>(0)?; // crc placeholder
         cursor.write_i16::<LittleEndian>(self.schema_id as i16)?;
 
+        let record_count = self.arrow_record_batch_builder.records_count();
         // todo: curerntly, always is append only
         let append_only = true;
         cursor.write_u8(if append_only { 1 } else { 0 })?;
-        cursor.write_i32::<LittleEndian>(if self.record_count > 0 {
-            self.record_count - 1
+        cursor.write_i32::<LittleEndian>(if record_count > 0 {
+            record_count - 1
         } else {
             0
         })?;
 
         cursor.write_i64::<LittleEndian>(self.writer_id)?;
         cursor.write_i32::<LittleEndian>(self.batch_sequence)?;
-        cursor.write_i32::<LittleEndian>(self.record_count)?;
+        cursor.write_i32::<LittleEndian>(record_count)?;
         Ok(())
     }
-
-    fn create_builder(data_type: &arrow_schema::DataType) -> Box<dyn ArrayBuilder> {
-        match data_type {
-            arrow_schema::DataType::Int8 => Box::new(Int8Builder::new()),
-            arrow_schema::DataType::Int16 => Box::new(Int16Builder::new()),
-            arrow_schema::DataType::Int32 => Box::new(Int32Builder::new()),
-            arrow_schema::DataType::Int64 => Box::new(Int64Builder::new()),
-            arrow_schema::DataType::UInt8 => Box::new(UInt8Builder::new()),
-            arrow_schema::DataType::UInt16 => Box::new(UInt16Builder::new()),
-            arrow_schema::DataType::UInt32 => Box::new(UInt32Builder::new()),
-            arrow_schema::DataType::UInt64 => Box::new(UInt64Builder::new()),
-            arrow_schema::DataType::Float32 => Box::new(Float32Builder::new()),
-            arrow_schema::DataType::Float64 => Box::new(Float64Builder::new()),
-            arrow_schema::DataType::Boolean => Box::new(BooleanBuilder::new()),
-            arrow_schema::DataType::Utf8 => Box::new(StringBuilder::new()),
-            arrow_schema::DataType::Binary => Box::new(BinaryBuilder::new()),
-            dt => panic!("Unsupported data type: {dt:?}"),
-        }
-    }
 }
 
 pub trait ToArrow {
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index 0d958a5656..c51373d2cb 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -38,20 +38,24 @@ mod admin_test {
         TablePath,
     };
     use std::sync::Arc;
+    use std::thread;
 
     fn before_all() {
         // Create a new tokio runtime in a separate thread
         let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
-        std::thread::spawn(move || {
+        thread::spawn(move || {
             let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
             rt.block_on(async {
-                let cluster = FlussTestingClusterBuilder::new().build().await;
+                let cluster = FlussTestingClusterBuilder::new("test-admin").build().await;
                 let mut guard = cluster_guard.write();
                 *guard = Some(cluster);
             });
         })
         .join()
         .expect("Failed to create cluster");
+        // wait for 20 seconds to avoid the error like
+        // CoordinatorEventProcessor is not initialized yet
+        thread::sleep(std::time::Duration::from_secs(20));
     }
 
     fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
diff --git a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
index 83a47956ae..e827e14932 100644
--- a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
+++ b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
@@ -28,13 +28,14 @@ use testcontainers::{ContainerAsync, GenericImage, ImageExt};
 const FLUSS_VERSION: &str = "0.7.0";
 
 pub struct FlussTestingClusterBuilder {
-    number_of_tablet_servers: usize,
+    number_of_tablet_servers: i32,
     network: &'static str,
     cluster_conf: HashMap<String, String>,
+    testing_name: String,
 }
 
 impl FlussTestingClusterBuilder {
-    pub fn new() -> Self {
+    pub fn new(testing_name: impl Into<String>) -> Self {
         // reduce testing resources
         let mut cluster_conf = HashMap::new();
         cluster_conf.insert(
@@ -50,14 +51,27 @@ impl FlussTestingClusterBuilder {
             number_of_tablet_servers: 1,
             cluster_conf,
             network: "fluss-cluster-network",
+            testing_name: testing_name.into(),
         }
     }
 
+    fn tablet_server_container_name(&self, server_id: i32) -> String {
+        format!("tablet-server-{}-{}", self.testing_name, server_id)
+    }
+
+    fn coordinator_server_container_name(&self) -> String {
+        format!("coordinator-server-{}", self.testing_name)
+    }
+
+    fn zookeeper_container_name(&self) -> String {
+        format!("zookeeper-{}", self.testing_name)
+    }
+
     pub async fn build(&mut self) -> FlussTestingCluster {
         let zookeeper = Arc::new(
             GenericImage::new("zookeeper", "3.9.2")
                 .with_network(self.network)
-                .with_container_name("zookeeper")
+                .with_container_name(self.zookeeper_container_name())
                 .start()
                 .await
                 .unwrap(),
@@ -83,15 +97,25 @@ impl FlussTestingClusterBuilder {
 
     async fn start_coordinator_server(&mut self) -> ContainerAsync<GenericImage> {
         let mut coordinator_confs = HashMap::new();
-        coordinator_confs.insert("zookeeper.address", "zookeeper:2181");
+        coordinator_confs.insert(
+            "zookeeper.address",
+            format!("{}:2181", self.zookeeper_container_name()),
+        );
         coordinator_confs.insert(
             "bind.listeners",
-            "INTERNAL://coordinator-server:0, CLIENT://coordinator-server:9123",
+            format!(
+                "INTERNAL://{}:0, CLIENT://{}:9123",
+                self.coordinator_server_container_name(),
+                self.coordinator_server_container_name()
+            ),
         );
-        coordinator_confs.insert("advertised.listeners", "CLIENT://localhost:9123");
-        coordinator_confs.insert("internal.listener.name", "INTERNAL");
+        coordinator_confs.insert(
+            "advertised.listeners",
+            "CLIENT://localhost:9123".to_string(),
+        );
+        coordinator_confs.insert("internal.listener.name", "INTERNAL".to_string());
         GenericImage::new("fluss/fluss", FLUSS_VERSION)
-            .with_container_name("coordinator-server")
+            .with_container_name(self.coordinator_server_container_name())
             .with_mapped_port(9123, ContainerPort::Tcp(9123))
             .with_network(self.network)
             .with_cmd(vec!["coordinatorServer"])
@@ -104,26 +128,30 @@ impl FlussTestingClusterBuilder {
             .unwrap()
     }
 
-    async fn start_tablet_server(&self, server_id: usize) -> ContainerAsync<GenericImage> {
+    async fn start_tablet_server(&self, server_id: i32) -> ContainerAsync<GenericImage> {
         let mut tablet_server_confs = HashMap::new();
         let bind_listeners = format!(
-            "INTERNAL://tablet-server-{}:0, CLIENT://tablet-server-{}:9123",
-            server_id, server_id
+            "INTERNAL://{}:0, CLIENT://{}:9123",
+            self.tablet_server_container_name(server_id),
+            self.tablet_server_container_name(server_id),
         );
         let expose_host_port = 9124 + server_id;
         let advertised_listeners = format!("CLIENT://localhost:{}", expose_host_port);
         let tablet_server_id = format!("{}", server_id);
-        tablet_server_confs.insert("zookeeper.address", "zookeeper:2181");
-        tablet_server_confs.insert("bind.listeners", bind_listeners.as_str());
-        tablet_server_confs.insert("advertised.listeners", advertised_listeners.as_str());
-        tablet_server_confs.insert("internal.listener.name", "INTERNAL");
-        tablet_server_confs.insert("tablet-server.id", tablet_server_id.as_str());
+        tablet_server_confs.insert(
+            "zookeeper.address",
+            format!("{}:2181", self.zookeeper_container_name()),
+        );
+        tablet_server_confs.insert("bind.listeners", bind_listeners);
+        tablet_server_confs.insert("advertised.listeners", advertised_listeners);
+        tablet_server_confs.insert("internal.listener.name", "INTERNAL".to_string());
+        tablet_server_confs.insert("tablet-server.id", tablet_server_id);
 
         GenericImage::new("fluss/fluss", FLUSS_VERSION)
             .with_cmd(vec!["tabletServer"])
             .with_mapped_port(expose_host_port as u16, ContainerPort::Tcp(9123))
             .with_network(self.network)
-            .with_container_name(format!("tablet-server-{}", server_id))
+            .with_container_name(self.tablet_server_container_name(server_id))
             .with_env_var(
                 "FLUSS_PROPERTIES",
                 self.to_fluss_properties_with(tablet_server_confs),
@@ -133,7 +161,7 @@ impl FlussTestingClusterBuilder {
             .unwrap()
     }
 
-    fn to_fluss_properties_with(&self, extra_properties: HashMap<&str, &str>) -> String {
+    fn to_fluss_properties_with(&self, extra_properties: HashMap<&str, String>) -> String {
         let mut fluss_properties = Vec::new();
         for (k, v) in self.cluster_conf.iter() {
             fluss_properties.push(format!("{}: {}", k, v));
@@ -150,7 +178,7 @@ impl FlussTestingClusterBuilder {
 pub struct FlussTestingCluster {
     zookeeper: Arc<ContainerAsync<GenericImage>>,
     coordinator_server: Arc<ContainerAsync<GenericImage>>,
-    tablet_servers: HashMap<usize, Arc<ContainerAsync<GenericImage>>>,
+    tablet_servers: HashMap<i32, Arc<ContainerAsync<GenericImage>>>,
     bootstrap_servers: String,
 }
 
@@ -165,6 +193,7 @@ impl FlussTestingCluster {
 
     pub async fn get_fluss_connection(&self) -> FlussConnection {
         let mut config = Config::default();
+        config.writer_acks = "all".to_string();
         config.bootstrap_server = Some(self.bootstrap_servers.clone());
 
         // Retry mechanism: retry for up to 1 minute
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
new file mode 100644
index 0000000000..a1a6cb288a
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -0,0 +1,132 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+use crate::integration::fluss_cluster::FlussTestingCluster;
+use once_cell::sync::Lazy;
+use parking_lot::RwLock;
+use std::sync::Arc;
+
+#[cfg(test)]
+use test_env_helpers::*;
+
+// Module-level shared cluster instance (only for this test file)
+static SHARED_FLUSS_CLUSTER: Lazy<Arc<RwLock<Option<FlussTestingCluster>>>> =
+    Lazy::new(|| Arc::new(RwLock::new(None)));
+
+#[cfg(test)]
+#[before_all]
+#[after_all]
+mod table_test {
+    use super::SHARED_FLUSS_CLUSTER;
+    use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
+    use crate::integration::utils::create_table;
+    use arrow::array::record_batch;
+    use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+    use std::sync::Arc;
+    use std::sync::atomic::AtomicUsize;
+    use std::thread;
+    fn before_all() {
+        // Create a new tokio runtime in a separate thread
+        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
+        std::thread::spawn(move || {
+            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
+            rt.block_on(async {
+                let cluster = FlussTestingClusterBuilder::new("test_table").build().await;
+                let mut guard = cluster_guard.write();
+                *guard = Some(cluster);
+            });
+        })
+        .join()
+        .expect("Failed to create cluster");
+        // wait for 20 seconds to avoid the error like
+        // CoordinatorEventProcessor is not initialized yet
+        thread::sleep(std::time::Duration::from_secs(20));
+    }
+
+    fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
+        let cluster_guard = SHARED_FLUSS_CLUSTER.read();
+        if cluster_guard.is_none() {
+            panic!("Fluss cluster not initialized. Make sure before_all() was called.");
+        }
+        Arc::new(cluster_guard.as_ref().unwrap().clone())
+    }
+
+    fn after_all() {
+        // Create a new tokio runtime in a separate thread
+        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
+        std::thread::spawn(move || {
+            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
+            rt.block_on(async {
+                let mut guard = cluster_guard.write();
+                if let Some(cluster) = guard.take() {
+                    cluster.stop().await;
+                }
+            });
+        })
+        .join()
+        .expect("Failed to cleanup cluster");
+    }
+
+    #[tokio::test]
+    async fn append_record_batch() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path =
+            TablePath::new("fluss".to_string(), "test_append_record_batch".to_string());
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("c1", DataTypes::int())
+                    .column("c2", DataTypes::string())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let append_writer = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table")
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer();
+
+        let batch1 =
+            record_batch!(("c1", Int32, [1, 2, 3]), ("c2", Utf8, ["a1", "a2", "a3"])).unwrap();
+        append_writer
+            .append_arrow_batch(batch1)
+            .await
+            .expect("Failed to append batch");
+
+        let batch2 =
+            record_batch!(("c1", Int32, [4, 5, 6]), ("c2", Utf8, ["a4", "a5", "a6"])).unwrap();
+        append_writer
+            .append_arrow_batch(batch2)
+            .await
+            .expect("Failed to append batch");
+
+        // todo: add scan code to verify the records appended in #30
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
new file mode 100644
index 0000000000..cd1f6ccb2d
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -0,0 +1,30 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+use fluss::client::FlussAdmin;
+use fluss::metadata::{TableDescriptor, TablePath};
+
+pub async fn create_table(
+    admin: &FlussAdmin,
+    table_path: &TablePath,
+    table_descriptor: &TableDescriptor,
+) {
+    admin
+        .create_table(table_path, table_descriptor, false)
+        .await
+        .expect("Failed to create table");
+}
diff --git a/fluss-rust/crates/fluss/tests/test_fluss.rs b/fluss-rust/crates/fluss/tests/test_fluss.rs
index 28b9bef7d9..a15ca2395a 100644
--- a/fluss-rust/crates/fluss/tests/test_fluss.rs
+++ b/fluss-rust/crates/fluss/tests/test_fluss.rs
@@ -22,4 +22,7 @@ extern crate fluss;
 mod integration {
     mod admin;
     mod fluss_cluster;
+    mod table;
+
+    mod utils;
 }

From 073d41ba8ff0a1a07172d84138047ee98a9edbd7 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Mon, 24 Nov 2025 10:40:02 +0800
Subject: [PATCH 017/287] [chore] Bump arrow version to 57 (#58)

---
 fluss-rust/Cargo.toml                        |  2 +-
 fluss-rust/bindings/python/Cargo.toml        |  8 ++++--
 fluss-rust/bindings/python/src/admin.rs      |  6 ++--
 fluss-rust/bindings/python/src/connection.rs | 12 ++++----
 fluss-rust/bindings/python/src/metadata.rs   |  6 ++--
 fluss-rust/bindings/python/src/table.rs      | 18 ++++++------
 fluss-rust/bindings/python/src/utils.rs      | 30 ++++++++++++--------
 fluss-rust/crates/fluss/Cargo.toml           |  2 +-
 8 files changed, 46 insertions(+), 38 deletions(-)

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 54436ac17d..e745d95e07 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -34,5 +34,5 @@ members = ["crates/fluss", "crates/examples", "bindings/python"]
 fluss = { version = "0.1.0", path = "./crates/fluss" }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
-arrow = "55.1.0"
+arrow = "57.0.0"
 chrono = { version = "0.4", features = ["clock", "std", "wasmbind"] }
diff --git a/fluss-rust/bindings/python/Cargo.toml b/fluss-rust/bindings/python/Cargo.toml
index 04826fb289..9ecc6299cd 100644
--- a/fluss-rust/bindings/python/Cargo.toml
+++ b/fluss-rust/bindings/python/Cargo.toml
@@ -27,11 +27,13 @@ name = "fluss"
 crate-type = ["cdylib"]
 
 [dependencies]
-pyo3 = { version = "0.24", features = ["extension-module"] }
+pyo3 = { version = "0.26.0", features = ["extension-module"] }
 fluss = { path = "../../crates/fluss" }
 tokio = { workspace = true }
 arrow = { workspace = true }
-arrow-pyarrow = "55.1.0"
-pyo3-async-runtimes = { version = "0.24.0", features = ["tokio-runtime"] }
+arrow-pyarrow = "57.0.0"
+arrow-schema = "57.0.0"
+arrow-array = "57.0.0"
+pyo3-async-runtimes = { version = "0.26.0", features = ["tokio-runtime"] }
 chrono = { workspace = true }
 once_cell = "1.21.3"
diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
index 73b2dd3af0..fa189eb80d 100644
--- a/fluss-rust/bindings/python/src/admin.rs
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -48,7 +48,7 @@ impl FlussAdmin {
                 .await
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
 
-            Python::with_gil(|py| Ok(py.None()))
+            Python::attach(|py| Ok(py.None()))
         })
     }
 
@@ -67,7 +67,7 @@ impl FlussAdmin {
                 .await
                 .map_err(|e| FlussError::new_err(format!("Failed to get table: {e}")))?;
 
-            Python::with_gil(|py| {
+            Python::attach(|py| {
                 let table_info = TableInfo::from_core(core_table_info);
                 Py::new(py, table_info)
             })
@@ -89,7 +89,7 @@ impl FlussAdmin {
                 .await
                 .map_err(|e| FlussError::new_err(format!("Failed to get lake snapshot: {e}")))?;
 
-            Python::with_gil(|py| {
+            Python::attach(|py| {
                 let lake_snapshot = LakeSnapshot::from_core(core_lake_snapshot);
                 Py::new(py, lake_snapshot)
             })
diff --git a/fluss-rust/bindings/python/src/connection.rs b/fluss-rust/bindings/python/src/connection.rs
index aeb8410ddf..a7559cec57 100644
--- a/fluss-rust/bindings/python/src/connection.rs
+++ b/fluss-rust/bindings/python/src/connection.rs
@@ -41,7 +41,7 @@ impl FlussConnection {
                 inner: Arc::new(connection),
             };
 
-            Python::with_gil(|py| Py::new(py, py_connection))
+            Python::attach(|py| Py::new(py, py_connection))
         })
     }
 
@@ -57,7 +57,7 @@ impl FlussConnection {
 
             let py_admin = FlussAdmin::from_core(admin);
 
-            Python::with_gil(|py| Py::new(py, py_admin))
+            Python::attach(|py| Py::new(py, py_admin))
         })
     }
 
@@ -84,7 +84,7 @@ impl FlussConnection {
                 core_table.has_primary_key(),
             );
 
-            Python::with_gil(|py| Py::new(py, py_table))
+            Python::attach(|py| Py::new(py, py_table))
         })
     }
 
@@ -102,9 +102,9 @@ impl FlussConnection {
     #[pyo3(signature = (_exc_type=None, _exc_value=None, _traceback=None))]
     fn __exit__(
         &mut self,
-        _exc_type: Option<PyObject>,
-        _exc_value: Option<PyObject>,
-        _traceback: Option<PyObject>,
+        _exc_type: Option<Bound<'_, PyAny>>,
+        _exc_value: Option<Bound<'_, PyAny>>,
+        _traceback: Option<Bound<'_, PyAny>>,
     ) -> PyResult<bool> {
         self.close()?;
         Ok(false)
diff --git a/fluss-rust/bindings/python/src/metadata.rs b/fluss-rust/bindings/python/src/metadata.rs
index 66748ab316..bc5f288071 100644
--- a/fluss-rust/bindings/python/src/metadata.rs
+++ b/fluss-rust/bindings/python/src/metadata.rs
@@ -106,7 +106,7 @@ impl Schema {
     #[new]
     #[pyo3(signature = (schema, primary_keys=None))]
     pub fn new(
-        schema: PyObject, // PyArrow schema
+        schema: Py<PyAny>, // PyArrow schema
         primary_keys: Option<Vec<String>>,
     ) -> PyResult<Self> {
         let arrow_schema = crate::utils::Utils::pyarrow_to_arrow_schema(&schema)?;
@@ -553,7 +553,7 @@ impl LakeSnapshot {
 
     /// Get table bucket offsets as a Python dictionary with TableBucket keys
     #[getter]
-    pub fn table_buckets_offset(&self, py: Python) -> PyResult<PyObject> {
+    pub fn table_buckets_offset(&self, py: Python) -> PyResult<Py<PyAny>> {
         let dict = PyDict::new(py);
         for (bucket, offset) in &self.table_buckets_offset {
             let py_bucket = TableBucket::from_core(bucket.clone());
@@ -569,7 +569,7 @@ impl LakeSnapshot {
     }
 
     /// Get all table buckets
-    pub fn get_table_buckets(&self, py: Python) -> PyResult<Vec<PyObject>> {
+    pub fn get_table_buckets(&self, py: Python) -> PyResult<Vec<Py<PyAny>>> {
         let mut buckets = Vec::new();
         for bucket in self.table_buckets_offset.keys() {
             let py_bucket = TableBucket::from_core(bucket.clone());
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index c255fa6f8a..2a8df25c9d 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -51,7 +51,7 @@ impl FlussTable {
 
             let py_writer = AppendWriter::from_core(rust_writer);
 
-            Python::with_gil(|py| Py::new(py, py_writer))
+            Python::attach(|py| Py::new(py, py_writer))
         })
     }
 
@@ -75,7 +75,7 @@ impl FlussTable {
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
 
             let py_scanner = LogScanner::from_core(rust_scanner, admin, table_info.clone());
-            Python::with_gil(|py| Py::new(py, py_scanner))
+            Python::attach(|py| Py::new(py, py_scanner))
         })
     }
 
@@ -131,10 +131,10 @@ pub struct AppendWriter {
 #[pymethods]
 impl AppendWriter {
     /// Write Arrow table data
-    pub fn write_arrow(&mut self, py: Python, table: PyObject) -> PyResult<()> {
+    pub fn write_arrow(&mut self, py: Python, table: Py<PyAny>) -> PyResult<()> {
         // Convert Arrow Table to batches and write each batch
         let batches = table.call_method0(py, "to_batches")?;
-        let batch_list: Vec<PyObject> = batches.extract(py)?;
+        let batch_list: Vec<Py<PyAny>> = batches.extract(py)?;
 
         for batch in batch_list {
             self.write_arrow_batch(py, batch)?;
@@ -143,7 +143,7 @@ impl AppendWriter {
     }
 
     /// Write Arrow batch data
-    pub fn write_arrow_batch(&mut self, py: Python, batch: PyObject) -> PyResult<()> {
+    pub fn write_arrow_batch(&mut self, py: Python, batch: Py<PyAny>) -> PyResult<()> {
         // Extract number of rows and columns from the Arrow batch
         let num_rows: usize = batch.getattr(py, "num_rows")?.extract(py)?;
         let num_columns: usize = batch.getattr(py, "num_columns")?.extract(py)?;
@@ -175,7 +175,7 @@ impl AppendWriter {
     }
 
     /// Write Pandas DataFrame data
-    pub fn write_pandas(&mut self, py: Python, df: PyObject) -> PyResult<()> {
+    pub fn write_pandas(&mut self, py: Python, df: Py<PyAny>) -> PyResult<()> {
         // Import pyarrow module
         let pyarrow = py.import("pyarrow")?;
 
@@ -213,7 +213,7 @@ impl AppendWriter {
     fn convert_python_value_to_datum(
         &self,
         py: Python,
-        value: PyObject,
+        value: Py<PyAny>,
     ) -> PyResult<fcore::row::Datum<'static>> {
         use fcore::row::{Blob, Datum, F32, F64};
 
@@ -321,7 +321,7 @@ impl LogScanner {
     }
 
     /// Convert all data to Arrow Table
-    fn to_arrow(&self, py: Python) -> PyResult<PyObject> {
+    fn to_arrow(&self, py: Python) -> PyResult<Py<PyAny>> {
         use std::collections::HashMap;
         use std::time::Duration;
 
@@ -387,7 +387,7 @@ impl LogScanner {
     }
 
     /// Convert all data to Pandas DataFrame
-    fn to_pandas(&self, py: Python) -> PyResult<PyObject> {
+    fn to_pandas(&self, py: Python) -> PyResult<Py<PyAny>> {
         let arrow_table = self.to_arrow(py)?;
 
         // Convert Arrow Table to Pandas DataFrame using pyarrow
diff --git a/fluss-rust/bindings/python/src/utils.rs b/fluss-rust/bindings/python/src/utils.rs
index 93933b3774..09e6b5f589 100644
--- a/fluss-rust/bindings/python/src/utils.rs
+++ b/fluss-rust/bindings/python/src/utils.rs
@@ -16,8 +16,8 @@
 // under the License.
 
 use crate::*;
-use arrow::datatypes::{Schema as ArrowSchema, SchemaRef};
-use arrow_pyarrow::ToPyArrow;
+use arrow_pyarrow::{FromPyArrow, ToPyArrow};
+use arrow_schema::SchemaRef;
 use std::sync::Arc;
 
 /// Utilities for schema conversion between PyArrow, Arrow, and Fluss
@@ -25,11 +25,10 @@ pub struct Utils;
 
 impl Utils {
     /// Convert PyArrow schema to Rust Arrow schema
-    pub fn pyarrow_to_arrow_schema(py_schema: &PyObject) -> PyResult<SchemaRef> {
-        Python::with_gil(|py| {
+    pub fn pyarrow_to_arrow_schema(py_schema: &Py<PyAny>) -> PyResult<SchemaRef> {
+        Python::attach(|py| {
             let schema_bound = py_schema.bind(py);
-
-            let schema: ArrowSchema = arrow_pyarrow::FromPyArrow::from_pyarrow_bound(schema_bound)
+            let schema: arrow_schema::Schema = FromPyArrow::from_pyarrow_bound(schema_bound)
                 .map_err(|e| {
                     FlussError::new_err(format!("Failed to convert PyArrow schema: {e}"))
                 })?;
@@ -172,14 +171,21 @@ impl Utils {
     pub fn combine_batches_to_table(
         py: Python,
         batches: Vec<Arc<arrow::record_batch::RecordBatch>>,
-    ) -> PyResult<PyObject> {
-        // Convert Rust Arrow RecordBatch to PyObject
-        let py_batches: Result<Vec<PyObject>, _> = batches
+    ) -> PyResult<Py<PyAny>> {
+        use arrow_array::RecordBatch as ArrowArrayRecordBatch;
+
+        let py_batches: Result<Vec<Py<PyAny>>, _> = batches
             .iter()
             .map(|batch| {
-                batch.as_ref().to_pyarrow(py).map_err(|e| {
-                    FlussError::new_err(format!("Failed to convert RecordBatch to PyObject: {e}"))
-                })
+                ArrowArrayRecordBatch::try_new(batch.schema().clone(), batch.columns().to_vec())
+                    .map_err(|e| FlussError::new_err(format!("Failed to convert RecordBatch: {e}")))
+                    .and_then(|b| {
+                        ToPyArrow::to_pyarrow(&b, py)
+                            .map(|x| x.into())
+                            .map_err(|e| {
+                                FlussError::new_err(format!("Failed to convert to PyObject: {e}"))
+                            })
+                    })
             })
             .collect();
 
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index ab1efc26d2..af770377ce 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -24,7 +24,7 @@ build = "src/build.rs"
 
 [dependencies]
 arrow = { workspace = true }
-arrow-schema = "55.1.0"
+arrow-schema = "57.0.0"
 byteorder = "1.5"
 futures = "0.3"
 clap = { workspace = true }

From 6ea79746e39bf80443fe9e590cee067d3df795b7 Mon Sep 17 00:00:00 2001
From: Pavlos-Petros Tournaris <p.tournaris@gmail.com>
Date: Mon, 24 Nov 2025 04:48:37 +0200
Subject: [PATCH 018/287] chore: add integration test for scan records after
 append (#51)

---
 .../crates/fluss/tests/integration/table.rs   | 50 ++++++++++++++++++-
 1 file changed, 48 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index a1a6cb288a..aa02724715 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -36,7 +36,8 @@ mod table_test {
     use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
     use crate::integration::utils::create_table;
     use arrow::array::record_batch;
-    use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+    use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
+    use fluss::row::InternalRow;
     use std::sync::Arc;
     use std::sync::atomic::AtomicUsize;
     use std::thread;
@@ -127,6 +128,51 @@ mod table_test {
             .await
             .expect("Failed to append batch");
 
-        // todo: add scan code to verify the records appended in #30
+        // Create scanner to verify appended records
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let table_scan = table.new_scan();
+        let log_scanner = table_scan.create_log_scanner();
+
+        // Subscribe to bucket 0 starting from offset 0
+        log_scanner
+            .subscribe(0, 0)
+            .await
+            .expect("Failed to subscribe to bucket");
+
+        // Poll for records
+        let scan_records = log_scanner
+            .poll(tokio::time::Duration::from_secs(5))
+            .await
+            .expect("Failed to poll records");
+
+        // Verify the scanned records
+        let table_bucket = TableBucket::new(table.table_info().table_id, 0);
+        let records = scan_records.records(&table_bucket);
+
+        assert_eq!(records.len(), 6, "Expected 6 records");
+
+        // Verify record contents match what was appended
+        let expected_c1_values = vec![1, 2, 3, 4, 5, 6];
+        let expected_c2_values = vec!["a1", "a2", "a3", "a4", "a5", "a6"];
+
+        for (i, record) in records.iter().enumerate() {
+            let row = record.row();
+            assert_eq!(
+                row.get_int(0),
+                expected_c1_values[i],
+                "c1 value mismatch at row {}",
+                i
+            );
+            assert_eq!(
+                row.get_string(1),
+                expected_c2_values[i],
+                "c2 value mismatch at row {}",
+                i
+            );
+        }
     }
 }

From fdbe7f4acab5dceb0369365214fbdc4194c57fa2 Mon Sep 17 00:00:00 2001
From: Evan <binary-signal@users.noreply.github.com>
Date: Tue, 25 Nov 2025 02:39:23 +0100
Subject: [PATCH 019/287] [chore] Add ipc_compression feature to arrow
 dependency (#59)

---
 fluss-rust/Cargo.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index e745d95e07..15bcb796fd 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -34,5 +34,5 @@ members = ["crates/fluss", "crates/examples", "bindings/python"]
 fluss = { version = "0.1.0", path = "./crates/fluss" }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
-arrow = "57.0.0"
+arrow = { version = "57.0.0", features = ["ipc_compression"] }
 chrono = { version = "0.4", features = ["clock", "std", "wasmbind"] }

From a62d9fe428ae72b2b6fc465e9fb2f6790e6cbe22 Mon Sep 17 00:00:00 2001
From: Evan <binary-signal@users.noreply.github.com>
Date: Tue, 25 Nov 2025 13:21:59 +0100
Subject: [PATCH 020/287] [chore] Fix build fail on mac os (#61)

---
 fluss-rust/.github/.DS_Store        | Bin 6148 -> 0 bytes
 fluss-rust/.github/workflows/ci.yml |  55 ++++++++++++++++++++++------
 2 files changed, 44 insertions(+), 11 deletions(-)
 delete mode 100644 fluss-rust/.github/.DS_Store

diff --git a/fluss-rust/.github/.DS_Store b/fluss-rust/.github/.DS_Store
deleted file mode 100644
index 7adc49df07876bc71be2a10c09a4f4452106ddaf..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 6148
zcmeHKQA+|r5S~@b6DfQs@bREmAuAK2m+R7ppddP{hYGtxsiW&w^vnkl?z#R@zog&O
z%<fu<)k_c|Gcx<l&d%(z-^$J{00?*3*#am5fQ3q!DPZ%3&^YOwWQ>PUs5zR@h88s8
z1WxCo+3_D4ptD<rBk=Hdjwknde#dY?XBmtJy&#eS#=Qo;C>$i!>YK=9b4$y4D{mF8
z8}D9@yu?q21K00gQLiOs6ijVDxCpzWc4_TU#)%)s-M&f)J6#O9z6|4z9Jz8BcLplg
z(*st)Dzr=G@p!jdt=P4CZBntvd)s91)F+dIwZ5^rf7X789%K2ei52)CRI*}l3NL8<
zxW^~2A4f92!?@`j(_BVofEi#07LfsS*IC6y+#K(T8DIu}#Q@z8HY%ZGFx9B84s7W2
zk;Zd`BxuuHg3vbT7)&+d2#V0Dh&ol6Cx+1J=(kOrV=&dI(?O_}aUQd>FfSCLR!6_B
z!a+D1xn%~JfmsH!x?7_9-~9glKbyooW`G%3C<a8X;Wb>`lBun8o1<E5qu!#DP+Y3<
lBLxjriZPZ-aT!$!`fV~09fPSx^q}yEfTDpLX5dd5cn5ScO<w>2

diff --git a/fluss-rust/.github/workflows/ci.yml b/fluss-rust/.github/workflows/ci.yml
index 69625f8f2e..cf7a126486 100644
--- a/fluss-rust/.github/workflows/ci.yml
+++ b/fluss-rust/.github/workflows/ci.yml
@@ -54,17 +54,34 @@ jobs:
         os:
           - ubuntu-latest
           - macos-latest
+        python: ["3.11", "3.12", "3.13"]
     steps:
       - uses: actions/checkout@v4
+
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python }}
+
       - name: Install protoc
         run: |
-          if [ "$RUNNER_OS" == "Linux" ]; then
+          if [ "$RUNNER_OS" = "Linux" ]; then
             sudo apt-get update && sudo apt-get install -y protobuf-compiler
-          elif [ "$RUNNER_OS" == "macOS" ]; then
+          elif [ "$RUNNER_OS" = "macOS" ]; then
             brew install protobuf
           fi
+
+      - name: Rust Cache
+        uses: actions/cache@v4
+        with:
+          path: |
+            ~/.cargo/registry
+            ~/.cargo/git
+            target
+          key: build-${{ runner.os }}-${{ matrix.python }}-${{ hashFiles('**/Cargo.lock') }}
+
       - name: Build
-        run: cargo build
+        run: cargo build --workspace --all-targets
 
   test:
     runs-on: ${{ matrix.os }}
@@ -73,26 +90,42 @@ jobs:
         os:
           - ubuntu-latest
           - macos-latest
+        python: ["3.11", "3.12", "3.13"]
     steps:
       - uses: actions/checkout@v4
+
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python }}
+
       - name: Install protoc
         run: |
-          if [ "$RUNNER_OS" == "Linux" ]; then
+          if [ "$RUNNER_OS" = "Linux" ]; then
             sudo apt-get update && sudo apt-get install -y protobuf-compiler
-          elif [ "$RUNNER_OS" == "macOS" ]; then
+          elif [ "$RUNNER_OS" = "macOS" ]; then
             brew install protobuf
           fi
+
+      - name: Rust Cache
+        uses: actions/cache@v4
+        with:
+          path: |
+            ~/.cargo/registry
+            ~/.cargo/git
+            target
+          key: test-${{ runner.os }}-${{ matrix.python }}-${{ hashFiles('**/Cargo.lock') }}
+
       - name: Unit Test
         run: cargo test --all-targets --workspace
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
-      - name: Integration Test
-        # only run IT in linux since no docker in macos by default
+
+      - name: Integration Test (Linux only)
+        if: runner.os == 'Linux'
         run: |
-          if [ "$RUNNER_OS" == "Linux" ]; then
-            RUST_TEST_THREADS=1 cargo test --features integration_tests --all-targets --workspace  -- --nocapture
-          fi
+          RUST_TEST_THREADS=1 cargo test --features integration_tests --all-targets --workspace -- --nocapture
         env:
           RUST_LOG: DEBUG
-          RUST_BACKTRACE: full
\ No newline at end of file
+          RUST_BACKTRACE: full

From 121a03606f7acb8cbd3a61b8a65f4d9eb55caf62 Mon Sep 17 00:00:00 2001
From: Yang Guo <100583615+gyang94@users.noreply.github.com>
Date: Sun, 30 Nov 2025 00:15:25 +0800
Subject: [PATCH 021/287] feat: implement get_long for GenericRow (#49)

---
 .../crates/examples/src/example_table.rs      | 10 +++++++---
 fluss-rust/crates/fluss/src/row/datum.rs      | 19 +++++++++++++++++++
 fluss-rust/crates/fluss/src/row/mod.rs        |  2 +-
 3 files changed, 27 insertions(+), 4 deletions(-)

diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index 3eb8dd867f..deab3639da 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -27,7 +27,7 @@ use tokio::try_join;
 #[tokio::main]
 pub async fn main() -> Result<()> {
     let mut config = Config::parse();
-    config.bootstrap_server = Some("127.0.0.1:56405".to_string());
+    config.bootstrap_server = Some("127.0.0.1:9123".to_string());
 
     let conn = FlussConnection::new(config).await?;
 
@@ -36,11 +36,12 @@ pub async fn main() -> Result<()> {
             Schema::builder()
                 .column("c1", DataTypes::int())
                 .column("c2", DataTypes::string())
+                .column("c3", DataTypes::bigint())
                 .build()?,
         )
         .build()?;
 
-    let table_path = TablePath::new("fluss".to_owned(), "rust_test".to_owned());
+    let table_path = TablePath::new("fluss".to_owned(), "rust_test_long".to_owned());
 
     let admin = conn.get_admin().await?;
 
@@ -56,6 +57,7 @@ pub async fn main() -> Result<()> {
     let mut row = GenericRow::new();
     row.set_field(0, 22222);
     row.set_field(1, "t2t");
+    row.set_field(2, 123_456_789_123i64);
 
     let table = conn.get_table(&table_path).await?;
     let append_writer = table.new_append()?.create_writer();
@@ -63,6 +65,7 @@ pub async fn main() -> Result<()> {
     row = GenericRow::new();
     row.set_field(0, 233333);
     row.set_field(1, "tt44");
+    row.set_field(2, 987_654_321_987i64);
     let f2 = append_writer.append(row);
     try_join!(f1, f2, append_writer.flush())?;
 
@@ -76,9 +79,10 @@ pub async fn main() -> Result<()> {
         for record in scan_records {
             let row = record.row();
             println!(
-                "{{{}, {}}}@{}",
+                "{{{}, {}, {}}}@{}",
                 row.get_int(0),
                 row.get_string(1),
+                row.get_long(2),
                 record.offset()
             );
         }
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index d8c4f748ca..ed33b8badf 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -88,6 +88,13 @@ impl<'a> From<i32> for Datum<'a> {
     }
 }
 
+impl<'a> From<i64> for Datum<'a> {
+    #[inline]
+    fn from(i: i64) -> Datum<'a> {
+        Datum::Int64(i)
+    }
+}
+
 impl<'a> From<&'a str> for Datum<'a> {
     #[inline]
     fn from(s: &'a str) -> Datum<'a> {
@@ -127,6 +134,18 @@ impl TryFrom<&Datum<'_>> for i32 {
     }
 }
 
+impl TryFrom<&Datum<'_>> for i64 {
+    type Error = ();
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::Int64(i) => Ok(*i),
+            _ => Err(()),
+        }
+    }
+}
+
 impl<'a> TryFrom<&Datum<'a>> for &'a str {
     type Error = ();
 
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index b900cb51d5..aa2c41159e 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -102,7 +102,7 @@ impl<'a> InternalRow for GenericRow<'a> {
     }
 
     fn get_long(&self, _pos: usize) -> i64 {
-        todo!()
+        self.values.get(_pos).unwrap().try_into().unwrap()
     }
 
     fn get_float(&self, _pos: usize) -> f32 {

From 236ae5af44f6f58ff3f9a4a4a19863c9516f0b80 Mon Sep 17 00:00:00 2001
From: Pavlos-Petros Tournaris <p.tournaris@gmail.com>
Date: Sat, 29 Nov 2025 18:16:27 +0200
Subject: [PATCH 022/287] feat: implement Display trait for DataType and
 related types (#50)

Fixes #38
---
 .../crates/fluss/src/metadata/datatype.rs     | 474 +++++++++++++++++-
 fluss-rust/rust-toolchain.toml                |   2 +-
 2 files changed, 474 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 09ca0c2c57..c7f93264df 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -93,6 +93,32 @@ impl DataType {
     }
 }
 
+impl Display for DataType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        match self {
+            DataType::Boolean(v) => write!(f, "{}", v),
+            DataType::TinyInt(v) => write!(f, "{}", v),
+            DataType::SmallInt(v) => write!(f, "{}", v),
+            DataType::Int(v) => write!(f, "{}", v),
+            DataType::BigInt(v) => write!(f, "{}", v),
+            DataType::Float(v) => write!(f, "{}", v),
+            DataType::Double(v) => write!(f, "{}", v),
+            DataType::Char(v) => write!(f, "{}", v),
+            DataType::String(v) => write!(f, "{}", v),
+            DataType::Decimal(v) => write!(f, "{}", v),
+            DataType::Date(v) => write!(f, "{}", v),
+            DataType::Time(v) => write!(f, "{}", v),
+            DataType::Timestamp(v) => write!(f, "{}", v),
+            DataType::TimestampLTz(v) => write!(f, "{}", v),
+            DataType::Bytes(v) => write!(f, "{}", v),
+            DataType::Binary(v) => write!(f, "{}", v),
+            DataType::Array(v) => write!(f, "{}", v),
+            DataType::Map(v) => write!(f, "{}", v),
+            DataType::Row(v) => write!(f, "{}", v),
+        }
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct BooleanType {
     nullable: bool,
@@ -118,6 +144,16 @@ impl BooleanType {
     }
 }
 
+impl Display for BooleanType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "BOOLEAN")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct TinyIntType {
     nullable: bool,
@@ -143,6 +179,16 @@ impl TinyIntType {
     }
 }
 
+impl Display for TinyIntType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "TINYINT")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct SmallIntType {
     nullable: bool,
@@ -168,6 +214,16 @@ impl SmallIntType {
     }
 }
 
+impl Display for SmallIntType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "SMALLINT")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct IntType {
     nullable: bool,
@@ -193,6 +249,16 @@ impl IntType {
     }
 }
 
+impl Display for IntType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "INT")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct BigIntType {
     nullable: bool,
@@ -218,6 +284,16 @@ impl BigIntType {
     }
 }
 
+impl Display for BigIntType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "BIGINT")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct FloatType {
     nullable: bool,
@@ -243,6 +319,16 @@ impl FloatType {
     }
 }
 
+impl Display for FloatType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "FLOAT")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct DoubleType {
     nullable: bool,
@@ -268,6 +354,16 @@ impl DoubleType {
     }
 }
 
+impl Display for DoubleType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "DOUBLE")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct CharType {
     nullable: bool,
@@ -327,6 +423,16 @@ impl StringType {
     }
 }
 
+impl Display for StringType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "STRING")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct DecimalType {
     nullable: bool,
@@ -370,6 +476,16 @@ impl DecimalType {
     }
 }
 
+impl Display for DecimalType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "DECIMAL({}, {})", self.precision, self.scale)?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct DateType {
     nullable: bool,
@@ -395,6 +511,16 @@ impl DateType {
     }
 }
 
+impl Display for DateType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "DATE")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Default, Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct TimeType {
     nullable: bool,
@@ -434,6 +560,16 @@ impl TimeType {
     }
 }
 
+impl Display for TimeType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "TIME({})", self.precision)?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct TimestampType {
     nullable: bool,
@@ -473,6 +609,16 @@ impl TimestampType {
     }
 }
 
+impl Display for TimestampType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "TIMESTAMP({})", self.precision)?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct TimestampLTzType {
     nullable: bool,
@@ -512,6 +658,16 @@ impl TimestampLTzType {
     }
 }
 
+impl Display for TimestampLTzType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "TIMESTAMP_LTZ({})", self.precision)?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct BytesType {
     nullable: bool,
@@ -537,6 +693,16 @@ impl BytesType {
     }
 }
 
+impl Display for BytesType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "BYTES")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct BinaryType {
     nullable: bool,
@@ -567,6 +733,16 @@ impl BinaryType {
     }
 }
 
+impl Display for BinaryType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "BINARY({})", self.length)?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, Hash, Serialize, Deserialize)]
 pub struct ArrayType {
     nullable: bool,
@@ -597,6 +773,16 @@ impl ArrayType {
     }
 }
 
+impl Display for ArrayType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "ARRAY<{}>", self.element_type)?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, Deserialize, Serialize, Hash)]
 pub struct MapType {
     nullable: bool,
@@ -634,6 +820,16 @@ impl MapType {
     }
 }
 
+impl Display for MapType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "MAP<{}, {}>", self.key_type, self.value_type)?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, Deserialize, Serialize, Hash)]
 pub struct RowType {
     nullable: bool,
@@ -658,6 +854,23 @@ impl RowType {
     }
 }
 
+impl Display for RowType {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "ROW<")?;
+        for (i, field) in self.fields.iter().enumerate() {
+            if i > 0 {
+                write!(f, ", ")?;
+            }
+            write!(f, "{}", field)?;
+        }
+        write!(f, ">")?;
+        if !self.nullable {
+            write!(f, " NOT NULL")?;
+        }
+        Ok(())
+    }
+}
+
 pub struct DataTypes;
 
 impl DataTypes {
@@ -823,4 +1036,263 @@ impl DataField {
     }
 }
 
-// todo: implement display for datatype
+impl Display for DataField {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "{} {}", self.name, self.data_type)
+    }
+}
+
+#[test]
+fn test_boolean_display() {
+    assert_eq!(BooleanType::new().to_string(), "BOOLEAN");
+    assert_eq!(
+        BooleanType::with_nullable(false).to_string(),
+        "BOOLEAN NOT NULL"
+    );
+}
+
+#[test]
+fn test_tinyint_display() {
+    assert_eq!(TinyIntType::new().to_string(), "TINYINT");
+    assert_eq!(
+        TinyIntType::with_nullable(false).to_string(),
+        "TINYINT NOT NULL"
+    );
+}
+
+#[test]
+fn test_smallint_display() {
+    assert_eq!(SmallIntType::new().to_string(), "SMALLINT");
+    assert_eq!(
+        SmallIntType::with_nullable(false).to_string(),
+        "SMALLINT NOT NULL"
+    );
+}
+
+#[test]
+fn test_int_display() {
+    assert_eq!(IntType::new().to_string(), "INT");
+    assert_eq!(IntType::with_nullable(false).to_string(), "INT NOT NULL");
+}
+
+#[test]
+fn test_bigint_display() {
+    assert_eq!(BigIntType::new().to_string(), "BIGINT");
+    assert_eq!(
+        BigIntType::with_nullable(false).to_string(),
+        "BIGINT NOT NULL"
+    );
+}
+
+#[test]
+fn test_float_display() {
+    assert_eq!(FloatType::new().to_string(), "FLOAT");
+    assert_eq!(
+        FloatType::with_nullable(false).to_string(),
+        "FLOAT NOT NULL"
+    );
+}
+
+#[test]
+fn test_double_display() {
+    assert_eq!(DoubleType::new().to_string(), "DOUBLE");
+    assert_eq!(
+        DoubleType::with_nullable(false).to_string(),
+        "DOUBLE NOT NULL"
+    );
+}
+
+#[test]
+fn test_string_display() {
+    assert_eq!(StringType::new().to_string(), "STRING");
+    assert_eq!(
+        StringType::with_nullable(false).to_string(),
+        "STRING NOT NULL"
+    );
+}
+
+#[test]
+fn test_date_display() {
+    assert_eq!(DateType::new().to_string(), "DATE");
+    assert_eq!(DateType::with_nullable(false).to_string(), "DATE NOT NULL");
+}
+
+#[test]
+fn test_bytes_display() {
+    assert_eq!(BytesType::new().to_string(), "BYTES");
+    assert_eq!(
+        BytesType::with_nullable(false).to_string(),
+        "BYTES NOT NULL"
+    );
+}
+
+#[test]
+fn test_char_display() {
+    assert_eq!(CharType::new(10).to_string(), "CHAR(10)");
+    assert_eq!(
+        CharType::with_nullable(20, false).to_string(),
+        "CHAR(20) NOT NULL"
+    );
+}
+
+#[test]
+fn test_decimal_display() {
+    assert_eq!(DecimalType::new(10, 2).to_string(), "DECIMAL(10, 2)");
+    assert_eq!(
+        DecimalType::with_nullable(false, 38, 10).to_string(),
+        "DECIMAL(38, 10) NOT NULL"
+    );
+}
+
+#[test]
+fn test_time_display() {
+    assert_eq!(TimeType::new(0).to_string(), "TIME(0)");
+    assert_eq!(TimeType::new(3).to_string(), "TIME(3)");
+    assert_eq!(
+        TimeType::with_nullable(false, 9).to_string(),
+        "TIME(9) NOT NULL"
+    );
+}
+
+#[test]
+fn test_timestamp_display() {
+    assert_eq!(TimestampType::new(6).to_string(), "TIMESTAMP(6)");
+    assert_eq!(TimestampType::new(0).to_string(), "TIMESTAMP(0)");
+    assert_eq!(
+        TimestampType::with_nullable(false, 9).to_string(),
+        "TIMESTAMP(9) NOT NULL"
+    );
+}
+
+#[test]
+fn test_timestamp_ltz_display() {
+    assert_eq!(TimestampLTzType::new(6).to_string(), "TIMESTAMP_LTZ(6)");
+    assert_eq!(TimestampLTzType::new(3).to_string(), "TIMESTAMP_LTZ(3)");
+    assert_eq!(
+        TimestampLTzType::with_nullable(false, 9).to_string(),
+        "TIMESTAMP_LTZ(9) NOT NULL"
+    );
+}
+
+#[test]
+fn test_binary_display() {
+    assert_eq!(BinaryType::new(100).to_string(), "BINARY(100)");
+    assert_eq!(
+        BinaryType::with_nullable(false, 256).to_string(),
+        "BINARY(256) NOT NULL"
+    );
+}
+
+#[test]
+fn test_array_display() {
+    let array_type = ArrayType::new(DataTypes::int());
+    assert_eq!(array_type.to_string(), "ARRAY<INT>");
+
+    let array_type_non_null = ArrayType::with_nullable(false, DataTypes::string());
+    assert_eq!(array_type_non_null.to_string(), "ARRAY<STRING> NOT NULL");
+
+    let nested_array = ArrayType::new(DataTypes::array(DataTypes::int()));
+    assert_eq!(nested_array.to_string(), "ARRAY<ARRAY<INT>>");
+}
+
+#[test]
+fn test_map_display() {
+    let map_type = MapType::new(DataTypes::string(), DataTypes::int());
+    assert_eq!(map_type.to_string(), "MAP<STRING, INT>");
+
+    let map_type_non_null =
+        MapType::with_nullable(false, DataTypes::int(), DataTypes::string());
+    assert_eq!(map_type_non_null.to_string(), "MAP<INT, STRING> NOT NULL");
+
+    let nested_map = MapType::new(
+        DataTypes::string(),
+        DataTypes::map(DataTypes::int(), DataTypes::boolean()),
+    );
+    assert_eq!(nested_map.to_string(), "MAP<STRING, MAP<INT, BOOLEAN>>");
+}
+
+#[test]
+fn test_row_display() {
+    let fields = vec![
+        DataTypes::field("id".to_string(), DataTypes::int()),
+        DataTypes::field("name".to_string(), DataTypes::string()),
+    ];
+    let row_type = RowType::new(fields);
+    assert_eq!(row_type.to_string(), "ROW<id INT, name STRING>");
+
+    let fields_non_null = vec![DataTypes::field("age".to_string(), DataTypes::bigint())];
+    let row_type_non_null = RowType::with_nullable(false, fields_non_null);
+    assert_eq!(row_type_non_null.to_string(), "ROW<age BIGINT> NOT NULL");
+}
+
+#[test]
+fn test_datatype_display() {
+    assert_eq!(DataTypes::boolean().to_string(), "BOOLEAN");
+    assert_eq!(DataTypes::int().to_string(), "INT");
+    assert_eq!(DataTypes::string().to_string(), "STRING");
+    assert_eq!(DataTypes::char(50).to_string(), "CHAR(50)");
+    assert_eq!(DataTypes::decimal(10, 2).to_string(), "DECIMAL(10, 2)");
+    assert_eq!(DataTypes::time_with_precision(3).to_string(), "TIME(3)");
+    assert_eq!(
+        DataTypes::timestamp_with_precision(6).to_string(),
+        "TIMESTAMP(6)"
+    );
+    assert_eq!(
+        DataTypes::timestamp_ltz_with_precision(9).to_string(),
+        "TIMESTAMP_LTZ(9)"
+    );
+    assert_eq!(DataTypes::array(DataTypes::int()).to_string(), "ARRAY<INT>");
+    assert_eq!(
+        DataTypes::map(DataTypes::string(), DataTypes::int()).to_string(),
+        "MAP<STRING, INT>"
+    );
+}
+
+#[test]
+fn test_datafield_display() {
+    let field = DataTypes::field("user_id".to_string(), DataTypes::bigint());
+    assert_eq!(field.to_string(), "user_id BIGINT");
+
+    let field2 = DataTypes::field("email".to_string(), DataTypes::string());
+    assert_eq!(field2.to_string(), "email STRING");
+
+    let field3 = DataTypes::field("score".to_string(), DataTypes::decimal(10, 2));
+    assert_eq!(field3.to_string(), "score DECIMAL(10, 2)");
+}
+
+#[test]
+fn test_complex_nested_display() {
+    let row_type = DataTypes::row(vec![
+        DataTypes::field("id".to_string(), DataTypes::int()),
+        DataTypes::field("tags".to_string(), DataTypes::array(DataTypes::string())),
+        DataTypes::field(
+            "metadata".to_string(),
+            DataTypes::map(DataTypes::string(), DataTypes::string()),
+        ),
+    ]);
+    assert_eq!(
+        row_type.to_string(),
+        "ROW<id INT, tags ARRAY<STRING>, metadata MAP<STRING, STRING>>"
+    );
+}
+
+#[test]
+fn test_non_nullable_datatype() {
+    let nullable_int = DataTypes::int();
+    assert_eq!(nullable_int.to_string(), "INT");
+
+    let non_nullable_int = nullable_int.as_non_nullable();
+    assert_eq!(non_nullable_int.to_string(), "INT NOT NULL");
+}
+
+#[test]
+fn test_deeply_nested_types() {
+    let nested = DataTypes::array(DataTypes::map(
+        DataTypes::string(),
+        DataTypes::row(vec![
+            DataTypes::field("x".to_string(), DataTypes::int()),
+            DataTypes::field("y".to_string(), DataTypes::int()),
+        ]),
+    ));
+    assert_eq!(nested.to_string(), "ARRAY<MAP<STRING, ROW<x INT, y INT>>>");
+}
diff --git a/fluss-rust/rust-toolchain.toml b/fluss-rust/rust-toolchain.toml
index 56c3bf5df8..870d7eb7af 100644
--- a/fluss-rust/rust-toolchain.toml
+++ b/fluss-rust/rust-toolchain.toml
@@ -17,4 +17,4 @@
 
 [toolchain]
 channel = "stable"
-components = ["rustfmt", "clippy"]
\ No newline at end of file
+components = ["rustfmt", "clippy"]

From 3d3de438e20b1cc19dc84c2227d91e7dda05ed0f Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 30 Nov 2025 00:27:38 +0800
Subject: [PATCH 023/287] chore: fix ci (#69)

---
 fluss-rust/crates/fluss/src/metadata/datatype.rs | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index c7f93264df..4deed2bce0 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -1200,8 +1200,7 @@ fn test_map_display() {
     let map_type = MapType::new(DataTypes::string(), DataTypes::int());
     assert_eq!(map_type.to_string(), "MAP<STRING, INT>");
 
-    let map_type_non_null =
-        MapType::with_nullable(false, DataTypes::int(), DataTypes::string());
+    let map_type_non_null = MapType::with_nullable(false, DataTypes::int(), DataTypes::string());
     assert_eq!(map_type_non_null.to_string(), "MAP<INT, STRING> NOT NULL");
 
     let nested_map = MapType::new(

From 0f8ff0b50db49be897bca90785fe6f14c2683995 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Thu, 4 Dec 2025 10:58:56 +0800
Subject: [PATCH 024/287] feat: support ColumnPruning (#57)

---
 fluss-rust/crates/examples/Cargo.toml         |   2 -
 .../crates/fluss/src/client/table/scanner.rs  | 115 ++++++++-
 fluss-rust/crates/fluss/src/record/arrow.rs   | 239 +++++++++++++++---
 .../crates/fluss/tests/integration/table.rs   |  87 ++++++-
 4 files changed, 390 insertions(+), 53 deletions(-)

diff --git a/fluss-rust/crates/examples/Cargo.toml b/fluss-rust/crates/examples/Cargo.toml
index 82d864f818..dab85b66ed 100644
--- a/fluss-rust/crates/examples/Cargo.toml
+++ b/fluss-rust/crates/examples/Cargo.toml
@@ -27,8 +27,6 @@ version = { workspace = true }
 fluss = { workspace = true }
 tokio = { workspace = true }
 clap = { workspace = true}
-
-
 [[example]]
 name = "example-table"
 path = "src/example_table.rs"
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index e1ab59ffbb..13372efecf 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -17,12 +17,13 @@
 
 use crate::client::connection::FlussConnection;
 use crate::client::metadata::Metadata;
-use crate::error::Result;
+use crate::error::{Error, Result};
 use crate::metadata::{TableBucket, TableInfo, TablePath};
 use crate::proto::{FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
 use crate::record::{LogRecordsBatchs, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
 use crate::rpc::RpcClient;
 use crate::util::FairBucketStatusMap;
+use arrow_schema::SchemaRef;
 use parking_lot::RwLock;
 use std::collections::HashMap;
 use std::slice::from_ref;
@@ -39,6 +40,8 @@ pub struct TableScan<'a> {
     conn: &'a FlussConnection,
     table_info: TableInfo,
     metadata: Arc<Metadata>,
+    /// Column indices to project. None means all columns, Some(vec) means only the specified columns (non-empty).
+    projected_fields: Option<Vec<usize>>,
 }
 
 impl<'a> TableScan<'a> {
@@ -47,14 +50,82 @@ impl<'a> TableScan<'a> {
             conn,
             table_info,
             metadata,
+            projected_fields: None,
         }
     }
 
-    pub fn create_log_scanner(&self) -> LogScanner {
+    /// Projects the scan to only include specified columns by their indices.
+    ///
+    /// # Arguments
+    /// * `column_indices` - Zero-based indices of columns to include in the scan
+    ///
+    /// # Errors
+    /// Returns an error if `column_indices` is empty or if any column index is out of range.
+    ///
+    /// # Example
+    /// ```
+    /// let scanner = table.new_scan().project(&[0, 2, 3])?.create_log_scanner();
+    /// ```
+    pub fn project(mut self, column_indices: &[usize]) -> Result<Self> {
+        if column_indices.is_empty() {
+            return Err(Error::IllegalArgument(
+                "Column indices cannot be empty".to_string(),
+            ));
+        }
+        let field_count = self.table_info.row_type().fields().len();
+        for &idx in column_indices {
+            if idx >= field_count {
+                return Err(Error::IllegalArgument(format!(
+                    "Column index {} out of range (max: {})",
+                    idx,
+                    field_count - 1
+                )));
+            }
+        }
+        self.projected_fields = Some(column_indices.to_vec());
+        Ok(self)
+    }
+
+    /// Projects the scan to only include specified columns by their names.
+    ///
+    /// # Arguments
+    /// * `column_names` - Names of columns to include in the scan
+    ///
+    /// # Errors
+    /// Returns an error if `column_names` is empty or if any column name is not found in the table schema.
+    ///
+    /// # Example
+    /// ```
+    /// let scanner = table.new_scan().project_by_name(&["col1", "col3"])?.create_log_scanner();
+    /// ```
+    pub fn project_by_name(mut self, column_names: &[&str]) -> Result<Self> {
+        if column_names.is_empty() {
+            return Err(Error::IllegalArgument(
+                "Column names cannot be empty".to_string(),
+            ));
+        }
+        let row_type = self.table_info.row_type();
+        let mut indices = Vec::new();
+
+        for name in column_names {
+            let idx = row_type
+                .fields()
+                .iter()
+                .position(|f| f.name() == *name)
+                .ok_or_else(|| Error::IllegalArgument(format!("Column '{name}' not found")))?;
+            indices.push(idx);
+        }
+
+        self.projected_fields = Some(indices);
+        Ok(self)
+    }
+
+    pub fn create_log_scanner(self) -> LogScanner {
         LogScanner::new(
             &self.table_info,
             self.metadata.clone(),
             self.conn.get_connections(),
+            self.projected_fields,
         )
     }
 }
@@ -72,6 +143,7 @@ impl LogScanner {
         table_info: &TableInfo,
         metadata: Arc<Metadata>,
         connections: Arc<RpcClient>,
+        projected_fields: Option<Vec<usize>>,
     ) -> Self {
         let log_scanner_status = Arc::new(LogScannerStatus::new());
         Self {
@@ -84,6 +156,7 @@ impl LogScanner {
                 connections.clone(),
                 metadata.clone(),
                 log_scanner_status.clone(),
+                projected_fields,
             ),
         }
     }
@@ -114,6 +187,7 @@ struct LogFetcher {
     table_info: TableInfo,
     metadata: Arc<Metadata>,
     log_scanner_status: Arc<LogScannerStatus>,
+    read_context: ReadContext,
 }
 
 impl LogFetcher {
@@ -122,13 +196,27 @@ impl LogFetcher {
         conns: Arc<RpcClient>,
         metadata: Arc<Metadata>,
         log_scanner_status: Arc<LogScannerStatus>,
+        projected_fields: Option<Vec<usize>>,
     ) -> Self {
+        let full_arrow_schema = to_arrow_schema(table_info.get_row_type());
+        let read_context = Self::create_read_context(full_arrow_schema, projected_fields);
         LogFetcher {
             table_path: table_info.table_path.clone(),
-            conns: conns.clone(),
-            table_info: table_info.clone(),
-            metadata: metadata.clone(),
-            log_scanner_status: log_scanner_status.clone(),
+            conns,
+            table_info,
+            metadata,
+            log_scanner_status,
+            read_context,
+        }
+    }
+
+    fn create_read_context(
+        full_arrow_schema: SchemaRef,
+        projected_fields: Option<Vec<usize>>,
+    ) -> ReadContext {
+        match projected_fields {
+            None => ReadContext::new(full_arrow_schema),
+            Some(fields) => ReadContext::with_projection_pushdown(full_arrow_schema, fields),
         }
     }
 
@@ -149,7 +237,7 @@ impl LogFetcher {
             for pb_fetch_log_resp in fetch_response.tables_resp {
                 let table_id = pb_fetch_log_resp.table_id;
                 let fetch_log_for_buckets = pb_fetch_log_resp.buckets_resp;
-                let arrow_schema = to_arrow_schema(self.table_info.get_row_type());
+
                 for fetch_log_for_bucket in fetch_log_for_buckets {
                     let mut fetch_records = vec![];
                     let bucket: i32 = fetch_log_for_bucket.bucket_id;
@@ -158,8 +246,7 @@ impl LogFetcher {
                         let data = fetch_log_for_bucket.records.unwrap();
                         for log_record in &mut LogRecordsBatchs::new(&data) {
                             let last_offset = log_record.last_log_offset();
-                            fetch_records
-                                .extend(log_record.records(ReadContext::new(arrow_schema.clone())));
+                            fetch_records.extend(log_record.records(&self.read_context)?);
                             self.log_scanner_status
                                 .update_offset(&table_bucket, last_offset + 1);
                         }
@@ -209,13 +296,19 @@ impl LogFetcher {
         if ready_for_fetch_count == 0 {
             HashMap::new()
         } else {
+            let (projection_enabled, projected_fields) =
+                match self.read_context.project_fields_in_order() {
+                    None => (false, vec![]),
+                    Some(fields) => (true, fields.iter().map(|&i| i as i32).collect()),
+                };
+
             fetch_log_req_for_buckets
                 .into_iter()
                 .map(|(leader_id, feq_for_buckets)| {
                     let req_for_table = PbFetchLogReqForTable {
                         table_id: table_id.unwrap(),
-                        projection_pushdown_enabled: false,
-                        projected_fields: vec![],
+                        projection_pushdown_enabled: projection_enabled,
+                        projected_fields: projected_fields.clone(),
                         buckets_req: feq_for_buckets,
                     };
 
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 487f50c348..29bfe41a21 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -27,7 +27,12 @@ use arrow::array::{
 };
 use arrow::{
     array::RecordBatch,
-    ipc::{reader::StreamReader, writer::StreamWriter},
+    buffer::Buffer,
+    ipc::{
+        reader::{StreamReader, read_record_batch},
+        root_as_message,
+        writer::StreamWriter,
+    },
 };
 use arrow_schema::SchemaRef;
 use arrow_schema::{DataType as ArrowDataType, Field};
@@ -472,41 +477,84 @@ impl<'a> LogRecordBatch<'a> {
         LittleEndian::read_i32(&self.data[offset..offset + RECORDS_COUNT_LENGTH])
     }
 
-    pub fn records(&self, read_context: ReadContext) -> LogRecordIterator {
-        let count = self.record_count();
-        if count == 0 {
-            return LogRecordIterator::empty();
+    pub fn records(&self, read_context: &ReadContext) -> Result<LogRecordIterator> {
+        if self.record_count() == 0 {
+            return Ok(LogRecordIterator::empty());
         }
 
-        // get arrow_metadata
-        let arrow_metadata_bytes = read_context.to_arrow_metadata().unwrap();
-        // arrow_batch_data
         let data = &self.data[RECORDS_OFFSET..];
 
-        // need to combine arrow_metadata_bytes + arrow_batch_data
-        let cursor = Cursor::new([&arrow_metadata_bytes, data].concat());
-        let mut stream_reader = StreamReader::try_new(cursor, None).unwrap();
-
-        let mut record_batch = None;
-        if let Some(bath) = stream_reader.next() {
-            record_batch = Some(bath.unwrap());
-        }
-
-        if record_batch.is_none() {
-            return LogRecordIterator::empty();
-        }
-
-        let arrow_reader = ArrowReader::new(Arc::new(record_batch.unwrap()));
-        LogRecordIterator::Arrow(ArrowLogRecordIterator {
-            reader: arrow_reader,
-            base_offset: self.base_log_offset(),
-            timestamp: self.commit_timestamp(),
-            row_id: 0,
-            change_type: ChangeType::AppendOnly,
-        })
+        let record_batch = read_context.record_batch(data)?;
+        let log_record_iterator = match record_batch {
+            None => LogRecordIterator::empty(),
+            Some(record_batch) => {
+                let arrow_reader = ArrowReader::new(Arc::new(record_batch));
+                LogRecordIterator::Arrow(ArrowLogRecordIterator {
+                    reader: arrow_reader,
+                    base_offset: self.base_log_offset(),
+                    timestamp: self.commit_timestamp(),
+                    row_id: 0,
+                    change_type: ChangeType::AppendOnly,
+                })
+            }
+        };
+        Ok(log_record_iterator)
     }
 }
 
+/// Parse an Arrow IPC message from a byte slice.
+///
+/// Server returns RecordBatch message (without Schema message) in the encapsulated message format.
+/// Format: [continuation: 4 bytes (0xFFFFFFFF)][metadata_size: 4 bytes][RecordBatch metadata][body]
+///
+/// This format is documented at:
+/// https://arrow.apache.org/docs/format/Columnar.html#encapsulated-message-format
+///
+/// # Arguments
+/// * `data` - The byte slice containing the IPC message.
+///
+/// # Returns
+/// Returns `Some((batch_metadata, body_buffer, version))` on success:
+/// - `batch_metadata`: The RecordBatch metadata from the IPC message.
+/// - `body_buffer`: The buffer containing the record batch body data.
+/// - `version`: The Arrow IPC metadata version.
+///
+/// Returns `None` if the data is malformed or too short.
+fn parse_ipc_message(
+    data: &[u8],
+) -> Option<(
+    arrow::ipc::RecordBatch<'_>,
+    Buffer,
+    arrow::ipc::MetadataVersion,
+)> {
+    const CONTINUATION_MARKER: u32 = 0xFFFFFFFF;
+
+    if data.len() < 8 {
+        return None;
+    }
+
+    let continuation = LittleEndian::read_u32(&data[0..4]);
+    let metadata_size = LittleEndian::read_u32(&data[4..8]) as usize;
+
+    if continuation != CONTINUATION_MARKER {
+        return None;
+    }
+
+    if data.len() < 8 + metadata_size {
+        return None;
+    }
+
+    let metadata_bytes = &data[8..8 + metadata_size];
+    let message = root_as_message(metadata_bytes).ok()?;
+    let batch_metadata = message.header_as_record_batch()?;
+
+    let body_start = 8 + metadata_size;
+    let body_data = &data[body_start..];
+    let body_buffer = Buffer::from(body_data);
+
+    Some((batch_metadata, body_buffer, message.version()))
+}
+
 pub fn to_arrow_schema(fluss_schema: &DataType) -> SchemaRef {
     match &fluss_schema {
         DataType::Row(row_type) => {
@@ -554,19 +602,140 @@ pub fn to_arrow_type(fluss_type: &DataType) -> ArrowDataType {
     }
 }
 
+#[derive(Clone)]
 pub struct ReadContext {
-    arrow_schema: SchemaRef,
+    target_schema: SchemaRef,
+
+    projection: Option<Projection>,
+}
+
+#[derive(Clone)]
+struct Projection {
+    ordered_schema: SchemaRef,
+    projected_fields: Vec<usize>,
+    ordered_fields: Vec<usize>,
+
+    reordering_indexes: Vec<usize>,
+    reordering_needed: bool,
 }
 
 impl ReadContext {
     pub fn new(arrow_schema: SchemaRef) -> ReadContext {
-        ReadContext { arrow_schema }
+        ReadContext {
+            target_schema: arrow_schema,
+            projection: None,
+        }
     }
 
-    pub fn to_arrow_metadata(&self) -> Result<Vec<u8>> {
-        let mut arrow_schema_bytes = vec![];
-        let _writer = StreamWriter::try_new(&mut arrow_schema_bytes, &self.arrow_schema)?;
-        Ok(arrow_schema_bytes)
+    pub fn with_projection_pushdown(
+        arrow_schema: SchemaRef,
+        projected_fields: Vec<usize>,
+    ) -> ReadContext {
+        let target_schema = Self::project_schema(arrow_schema.clone(), projected_fields.as_slice());
+        let mut sorted_fields = projected_fields.clone();
+        sorted_fields.sort_unstable();
+
+        let project = {
+            if !sorted_fields.eq(&projected_fields) {
+                // reordering is required
+                // Calculate reordering indexes to transform from sorted order to user-requested order
+                let mut reordering_indexes = Vec::with_capacity(projected_fields.len());
+                for &original_idx in &projected_fields {
+                    let pos = sorted_fields
+                        .binary_search(&original_idx)
+                        .expect("projection index should exist in sorted list");
+                    reordering_indexes.push(pos);
+                }
+                Projection {
+                    ordered_schema: Self::project_schema(
+                        arrow_schema.clone(),
+                        sorted_fields.as_slice(),
+                    ),
+                    projected_fields,
+                    ordered_fields: sorted_fields,
+                    reordering_indexes,
+                    reordering_needed: true,
+                }
+            } else {
+                Projection {
+                    ordered_schema: Self::project_schema(arrow_schema, projected_fields.as_slice()),
+                    ordered_fields: projected_fields.clone(),
+                    projected_fields,
+                    reordering_indexes: vec![],
+                    reordering_needed: false,
+                }
+            }
+        };
+
+        ReadContext {
+            target_schema,
+            projection: Some(project),
+        }
+    }
+
+    pub fn project_schema(schema: SchemaRef, projected_fields: &[usize]) -> SchemaRef {
+        // todo: handle the exception
+        SchemaRef::new(
+            schema
+                .project(projected_fields)
+                .expect("can't project schema"),
+        )
+    }
+
+    pub fn project_fields(&self) -> Option<&[usize]> {
+        self.projection
+            .as_ref()
+            .map(|p| p.projected_fields.as_slice())
+    }
+
+    pub fn project_fields_in_order(&self) -> Option<&[usize]> {
+        self.projection
+            .as_ref()
+            .map(|p| p.ordered_fields.as_slice())
+    }
+
+    pub fn record_batch(&self, data: &[u8]) -> Result<Option<RecordBatch>> {
+        let (batch_metadata, body_buffer, version) = match parse_ipc_message(data) {
+            Some(result) => result,
+            None => return Ok(None),
+        };
+
+        // the record batch from server must be ordered by field pos,
+        // according to project to decide what arrow schema to use
+        // to parse the record batch
+        let resolve_schema = match self.projection {
+            Some(ref projection) => {
+                // projection, should use ordered schema by project field pos
+                projection.ordered_schema.clone()
+            }
+            None => {
+                // no projection, use target output schema
+                self.target_schema.clone()
+            }
+        };
+
+        let record_batch = read_record_batch(
+            &body_buffer,
+            batch_metadata,
+            resolve_schema,
+            &std::collections::HashMap::new(),
+            None,
+            &version,
+        )?;
+
+        let record_batch = match &self.projection {
+            Some(projection) if projection.reordering_needed => {
+                // Reorder columns if needed (when projection pushdown with non-sorted order)
+                let reordered_columns: Vec<_> = projection
+                    .reordering_indexes
+                    .iter()
+                    .map(|&idx| record_batch.column(idx).clone())
+                    .collect();
+                RecordBatch::try_new(self.target_schema.clone(), reordered_columns)?
+            }
+            _ => record_batch,
+        };
+        Ok(Some(record_batch))
     }
 }
 
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index aa02724715..e14b852648 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -54,6 +54,7 @@ mod table_test {
         })
         .join()
         .expect("Failed to create cluster");
+
         // wait for 20 seconds to avoid the error like
         // CoordinatorEventProcessor is not initialized yet
         thread::sleep(std::time::Duration::from_secs(20));
@@ -84,14 +85,16 @@ mod table_test {
     }
 
     #[tokio::test]
-    async fn append_record_batch() {
+    async fn append_record_batch_and_scan() {
         let cluster = get_fluss_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path =
-            TablePath::new("fluss".to_string(), "test_append_record_batch".to_string());
+        let table_path = TablePath::new(
+            "fluss".to_string(),
+            "test_append_record_batch_and_scan".to_string(),
+        );
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
@@ -101,15 +104,18 @@ mod table_test {
                     .build()
                     .expect("Failed to build schema"),
             )
+            .property("table.log.arrow.compression.type", "NONE")
             .build()
             .expect("Failed to build table");
 
         create_table(&admin, &table_path, &table_descriptor).await;
 
-        let append_writer = connection
+        let table = connection
             .get_table(&table_path)
             .await
-            .expect("Failed to get table")
+            .expect("Failed to get table");
+
+        let append_writer = table
             .new_append()
             .expect("Failed to create append")
             .create_writer();
@@ -128,6 +134,77 @@ mod table_test {
             .await
             .expect("Failed to append batch");
 
+        append_writer.flush().await.expect("Failed to flush");
+
+        let num_buckets = table.table_info().get_num_buckets();
+        let log_scanner = table.new_scan().create_log_scanner();
+        for bucket_id in 0..num_buckets {
+            log_scanner
+                .subscribe(bucket_id, 0)
+                .await
+                .expect("Failed to subscribe");
+        }
+
+        let scan_records = log_scanner
+            .poll(std::time::Duration::from_secs(5))
+            .await
+            .expect("Failed to poll");
+
+        let mut records: Vec<_> = scan_records.into_iter().collect();
+        records.sort_by_key(|r| r.offset());
+
+        assert_eq!(records.len(), 6, "Should have 6 records");
+        for (i, record) in records.iter().enumerate() {
+            let row = record.row();
+            let expected_c1 = (i + 1) as i32;
+            let expected_c2 = format!("a{}", i + 1);
+            assert_eq!(row.get_int(0), expected_c1, "c1 mismatch at index {}", i);
+            assert_eq!(row.get_string(1), expected_c2, "c2 mismatch at index {}", i);
+        }
+
+        let log_scanner_projected = table
+            .new_scan()
+            .project(&[1, 0])
+            .expect("Failed to project")
+            .create_log_scanner();
+        for bucket_id in 0..num_buckets {
+            log_scanner_projected
+                .subscribe(bucket_id, 0)
+                .await
+                .expect("Failed to subscribe");
+        }
+
+        let scan_records_projected = log_scanner_projected
+            .poll(std::time::Duration::from_secs(5))
+            .await
+            .expect("Failed to poll");
+
+        let mut records_projected: Vec<_> = scan_records_projected.into_iter().collect();
+        records_projected.sort_by_key(|r| r.offset());
+
+        assert_eq!(
+            records_projected.len(),
+            6,
+            "Should have 6 records with projection"
+        );
+        for (i, record) in records_projected.iter().enumerate() {
+            let row = record.row();
+            let expected_c2 = format!("a{}", i + 1);
+            let expected_c1 = (i + 1) as i32;
+            assert_eq!(
+                row.get_string(0),
+                expected_c2,
+                "Projected c2 (first column) mismatch at index {}",
+                i
+            );
+            assert_eq!(
+                row.get_int(1),
+                expected_c1,
+                "Projected c1 (second column) mismatch at index {}",
+                i
+            );
+        }
+
         // Create scanner to verify appended records
         let table = connection
             .get_table(&table_path)

From de9022e7030323e81c10ea6ed4844010dbaa36e1 Mon Sep 17 00:00:00 2001
From: Pavlos-Petros Tournaris <p.tournaris@gmail.com>
Date: Fri, 5 Dec 2025 06:26:24 +0200
Subject: [PATCH 025/287] feat: Implement JsonSerde for all datatypes (#53)

---
 .../crates/fluss/src/metadata/json_serde.rs   | 285 +++++++++++++++---
 1 file changed, 251 insertions(+), 34 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/metadata/json_serde.rs b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
index 1c7604c98a..447b0f9ff3 100644
--- a/fluss-rust/crates/fluss/src/metadata/json_serde.rs
+++ b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
@@ -17,7 +17,7 @@
 
 use crate::error::Error::{InvalidTableError, JsonSerdeError};
 use crate::error::Result;
-use crate::metadata::datatype::{DataType, DataTypes};
+use crate::metadata::datatype::{DataField, DataType, DataTypes};
 use crate::metadata::table::{Column, Schema, TableDescriptor};
 use serde_json::{Value, json};
 use std::collections::HashMap;
@@ -58,10 +58,8 @@ impl DataType {
     const FIELD_NAME_TYPE_NAME: &'static str = "type";
     const FIELD_NAME_NULLABLE: &'static str = "nullable";
     const FIELD_NAME_LENGTH: &'static str = "length";
-    #[allow(dead_code)]
     const FIELD_NAME_PRECISION: &'static str = "precision";
-    #[allow(dead_code)]
-    const FILED_NAME_SCALE: &'static str = "scale";
+    const FIELD_NAME_SCALE: &'static str = "scale";
     #[allow(dead_code)]
     const FIELD_NAME_ELEMENT_TYPE: &'static str = "element_type";
     #[allow(dead_code)]
@@ -111,21 +109,54 @@ impl JsonSerde for DataType {
                 obj.insert(Self::FIELD_NAME_LENGTH.to_string(), json!(_type.length()));
             }
             DataType::Decimal(_type) => {
-                todo!()
+                obj.insert(
+                    Self::FIELD_NAME_PRECISION.to_string(),
+                    json!(_type.precision()),
+                );
+                obj.insert(Self::FIELD_NAME_SCALE.to_string(), json!(_type.scale()));
             }
-
             DataType::Time(_type) => {
-                todo!()
+                obj.insert(
+                    Self::FIELD_NAME_PRECISION.to_string(),
+                    json!(_type.precision()),
+                );
             }
             DataType::Timestamp(_type) => {
-                todo!()
+                obj.insert(
+                    Self::FIELD_NAME_PRECISION.to_string(),
+                    json!(_type.precision()),
+                );
             }
             DataType::TimestampLTz(_type) => {
-                todo!()
+                obj.insert(
+                    Self::FIELD_NAME_PRECISION.to_string(),
+                    json!(_type.precision()),
+                );
+            }
+            DataType::Array(_type) => {
+                obj.insert(
+                    Self::FIELD_NAME_ELEMENT_TYPE.to_string(),
+                    _type.get_element_type().serialize_json()?,
+                );
+            }
+            DataType::Map(_type) => {
+                obj.insert(
+                    Self::FIELD_NAME_KEY_TYPE.to_string(),
+                    _type.key_type().serialize_json()?,
+                );
+                obj.insert(
+                    Self::FIELD_NAME_VALUE_TYPE.to_string(),
+                    _type.value_type().serialize_json()?,
+                );
+            }
+            DataType::Row(_type) => {
+                let fields: Vec<Value> = _type
+                    .fields()
+                    .iter()
+                    .map(|field| field.serialize_json())
+                    .collect::<Result<_>>()?;
+                obj.insert(Self::FIELD_NAME_FIELDS.to_string(), json!(fields));
             }
-            DataType::Array(_type) => todo!(),
-            DataType::Map(_type) => todo!(),
-            DataType::Row(_type) => todo!(),
         }
         Ok(Value::Object(obj))
     }
@@ -150,18 +181,112 @@ impl JsonSerde for DataType {
             "BIGINT" => DataTypes::bigint(),
             "FLOAT" => DataTypes::float(),
             "DOUBLE" => DataTypes::double(),
-            "CHAR" => todo!(),
+            "CHAR" => {
+                let length = node
+                    .get(Self::FIELD_NAME_LENGTH)
+                    .and_then(|v| v.as_u64())
+                    .ok_or_else(|| {
+                        JsonSerdeError(format!(
+                            "Missing required field: {}",
+                            Self::FIELD_NAME_LENGTH
+                        ))
+                    })? as u32;
+                DataTypes::char(length)
+            }
             "STRING" => DataTypes::string(),
-            "DECIMAL" => todo!(),
+            "DECIMAL" => {
+                let precision = node
+                    .get(Self::FIELD_NAME_PRECISION)
+                    .and_then(|v| v.as_u64())
+                    .ok_or_else(|| {
+                        JsonSerdeError(format!(
+                            "Missing required field: {}",
+                            Self::FIELD_NAME_PRECISION
+                        ))
+                    })? as u32;
+                let scale = node
+                    .get(Self::FIELD_NAME_SCALE)
+                    .and_then(|v| v.as_u64())
+                    .unwrap_or(0) as u32;
+                DataTypes::decimal(precision, scale)
+            }
             "DATE" => DataTypes::date(),
-            "TIME_WITHOUT_TIME_ZONE" => todo!(), // Precision set separately
-            "TIMESTAMP_WITHOUT_TIME_ZONE" => todo!(), // Precision set separately
-            "TIMESTAMP_WITH_LOCAL_TIME_ZONE" => todo!(), // Precision set separately
+            "TIME_WITHOUT_TIME_ZONE" => {
+                let precision = node
+                    .get(Self::FIELD_NAME_PRECISION)
+                    .and_then(|v| v.as_u64())
+                    .unwrap_or(0) as u32;
+                DataTypes::time_with_precision(precision)
+            }
+            "TIMESTAMP_WITHOUT_TIME_ZONE" => {
+                let precision = node
+                    .get(Self::FIELD_NAME_PRECISION)
+                    .and_then(|v| v.as_u64())
+                    .unwrap_or(6) as u32;
+                DataTypes::timestamp_with_precision(precision)
+            }
+            "TIMESTAMP_WITH_LOCAL_TIME_ZONE" => {
+                let precision = node
+                    .get(Self::FIELD_NAME_PRECISION)
+                    .and_then(|v| v.as_u64())
+                    .unwrap_or(6) as u32;
+                DataTypes::timestamp_ltz_with_precision(precision)
+            }
             "BYTES" => DataTypes::bytes(),
-            "BINARY" => todo!(),
-            "ARRAY" => todo!(),
-            "MAP" => todo!(),
-            "ROW" => todo!(),
+            "BINARY" => {
+                let length = node
+                    .get(Self::FIELD_NAME_LENGTH)
+                    .and_then(|v| v.as_u64())
+                    .unwrap_or(1) as usize;
+                DataTypes::binary(length)
+            }
+            "ARRAY" => {
+                let element_type_node =
+                    node.get(Self::FIELD_NAME_ELEMENT_TYPE).ok_or_else(|| {
+                        JsonSerdeError(format!(
+                            "Missing required field: {}",
+                            Self::FIELD_NAME_ELEMENT_TYPE
+                        ))
+                    })?;
+                let element_type = DataType::deserialize_json(element_type_node)?;
+                DataTypes::array(element_type)
+            }
+            "MAP" => {
+                let key_type_node = node.get(Self::FIELD_NAME_KEY_TYPE).ok_or_else(|| {
+                    JsonSerdeError(format!(
+                        "Missing required field: {}",
+                        Self::FIELD_NAME_KEY_TYPE
+                    ))
+                })?;
+                let key_type = DataType::deserialize_json(key_type_node)?;
+                let value_type_node = node.get(Self::FIELD_NAME_VALUE_TYPE).ok_or_else(|| {
+                    JsonSerdeError(format!(
+                        "Missing required field: {}",
+                        Self::FIELD_NAME_VALUE_TYPE
+                    ))
+                })?;
+                let value_type = DataType::deserialize_json(value_type_node)?;
+                DataTypes::map(key_type, value_type)
+            }
+            "ROW" => {
+                let fields_node = node
+                    .get(Self::FIELD_NAME_FIELDS)
+                    .ok_or_else(|| {
+                        JsonSerdeError(format!(
+                            "Missing required field: {}",
+                            Self::FIELD_NAME_FIELDS
+                        ))
+                    })?
+                    .as_array()
+                    .ok_or_else(|| {
+                        JsonSerdeError(format!("{} must be an array", Self::FIELD_NAME_FIELDS))
+                    })?;
+                let mut fields = Vec::with_capacity(fields_node.len());
+                for field_node in fields_node {
+                    fields.push(DataField::deserialize_json(field_node)?);
+                }
+                DataTypes::row(fields)
+            }
             _ => return Err(JsonSerdeError(format!("Unknown type root: {type_root}"))),
         };
 
@@ -175,6 +300,51 @@ impl JsonSerde for DataType {
     }
 }
 
+impl DataField {
+    const NAME: &'static str = "name";
+    const FIELD_TYPE: &'static str = "field_type";
+    const DESCRIPTION: &'static str = "description";
+}
+
+impl JsonSerde for DataField {
+    fn serialize_json(&self) -> Result<Value> {
+        let mut obj = serde_json::Map::new();
+
+        obj.insert(Self::NAME.to_string(), json!(self.name()));
+        obj.insert(
+            Self::FIELD_TYPE.to_string(),
+            self.data_type.serialize_json()?,
+        );
+
+        if let Some(description) = &self.description {
+            obj.insert(Self::DESCRIPTION.to_string(), json!(description));
+        }
+
+        Ok(Value::Object(obj))
+    }
+
+    fn deserialize_json(node: &Value) -> Result<DataField> {
+        let name = node
+            .get(Self::NAME)
+            .and_then(|v| v.as_str())
+            .ok_or_else(|| JsonSerdeError(format!("Missing required field: {}", Self::NAME)))?
+            .to_string();
+
+        let field_type_node = node.get(Self::FIELD_TYPE).ok_or_else(|| {
+            JsonSerdeError(format!("Missing required field: {}", Self::FIELD_TYPE))
+        })?;
+
+        let data_type = DataType::deserialize_json(field_type_node)?;
+
+        let description = node
+            .get(Self::DESCRIPTION)
+            .and_then(|v| v.as_str())
+            .map(|s| s.to_string());
+
+        Ok(DataField::new(name, data_type, description))
+    }
+}
+
 impl Column {
     const NAME: &'static str = "name";
     const DATA_TYPE: &'static str = "data_type";
@@ -203,7 +373,7 @@ impl JsonSerde for Column {
         let name = node
             .get(Self::NAME)
             .and_then(|v| v.as_str())
-            .unwrap_or_else(|| panic!("{}", format!("Missing required field: {}", Self::NAME)))
+            .ok_or_else(|| JsonSerdeError(format!("Missing required field: {}", Self::NAME)))?
             .to_string();
 
         let data_type_node = node.get(Self::DATA_TYPE).ok_or_else(|| {
@@ -263,7 +433,7 @@ impl JsonSerde for Schema {
                 JsonSerdeError(format!("Missing required field: {}", Self::COLUMNS_NAME))
             })?
             .as_array()
-            .ok_or_else(|| JsonSerdeError(format!("{} should be an array", Self::COLUMNS_NAME)))?;
+            .ok_or_else(|| JsonSerdeError(format!("{} must be an array", Self::COLUMNS_NAME)))?;
 
         let mut columns = Vec::with_capacity(columns_node.len());
         for col_node in columns_node {
@@ -275,14 +445,16 @@ impl JsonSerde for Schema {
         if let Some(pk_node) = node.get(Self::PRIMARY_KEY_NAME) {
             let pk_array = pk_node
                 .as_array()
-                .ok_or_else(|| InvalidTableError("Primary key is not an array".to_string()))?;
+                .ok_or_else(|| InvalidTableError("Primary key must be an array".to_string()))?;
 
             let mut primary_keys = Vec::with_capacity(pk_array.len());
             for name_node in pk_array {
                 primary_keys.push(
                     name_node
                         .as_str()
-                        .ok_or_else(|| InvalidTableError("Primary key is not string".to_string()))?
+                        .ok_or_else(|| {
+                            InvalidTableError("Primary key element must be a string".to_string())
+                        })?
                         .to_string(),
                 );
             }
@@ -308,7 +480,7 @@ impl TableDescriptor {
     fn deserialize_properties(node: &Value) -> Result<HashMap<String, String>> {
         let obj = node
             .as_object()
-            .ok_or_else(|| JsonSerdeError("Properties should be an object".to_string()))?;
+            .ok_or_else(|| JsonSerdeError("Properties must be an object".to_string()))?;
 
         let mut properties = HashMap::with_capacity(obj.len());
         for (key, value) in obj {
@@ -316,7 +488,7 @@ impl TableDescriptor {
                 key.clone(),
                 value
                     .as_str()
-                    .ok_or_else(|| JsonSerdeError("Properties should be an object".to_string()))?
+                    .ok_or_else(|| JsonSerdeError("Property value must be a string".to_string()))?
                     .to_owned(),
             );
         }
@@ -383,9 +555,7 @@ impl JsonSerde for TableDescriptor {
         if let Some(comment_node) = node.get(Self::COMMENT_NAME) {
             let comment = comment_node
                 .as_str()
-                .ok_or_else(|| {
-                    JsonSerdeError(format!("{} should be a string", Self::COMMENT_NAME))
-                })?
+                .ok_or_else(|| JsonSerdeError(format!("{} must be a string", Self::COMMENT_NAME)))?
                 .to_owned();
             builder = builder.comment(comment.as_str());
         }
@@ -400,7 +570,7 @@ impl JsonSerde for TableDescriptor {
             })?
             .as_array()
             .ok_or_else(|| {
-                JsonSerdeError(format!("{} should be an array", Self::PARTITION_KEY_NAME))
+                JsonSerdeError(format!("{} must be an array", Self::PARTITION_KEY_NAME))
             })?;
 
         let mut partition_keys = Vec::with_capacity(partition_node.len());
@@ -409,7 +579,10 @@ impl JsonSerde for TableDescriptor {
                 key_node
                     .as_str()
                     .ok_or_else(|| {
-                        JsonSerdeError(format!("{} should be a string", Self::PARTITION_KEY_NAME))
+                        JsonSerdeError(format!(
+                            "{} element must be a string",
+                            Self::PARTITION_KEY_NAME
+                        ))
                     })?
                     .to_owned(),
             );
@@ -420,14 +593,14 @@ impl JsonSerde for TableDescriptor {
         let mut bucket_keys = vec![];
         if let Some(bucket_key_node) = node.get(Self::BUCKET_KEY_NAME) {
             let bucket_key_node = bucket_key_node.as_array().ok_or_else(|| {
-                JsonSerdeError(format!("{} should be an array", Self::BUCKET_COUNT_NAME))
+                JsonSerdeError(format!("{} must be an array", Self::BUCKET_KEY_NAME))
             })?;
 
             for key_node in bucket_key_node {
                 bucket_keys.push(
                     key_node
                         .as_str()
-                        .ok_or_else(|| JsonSerdeError("Bucket key should be a string".to_string()))?
+                        .ok_or_else(|| JsonSerdeError("Bucket key must be a string".to_string()))?
                         .to_owned(),
                 );
             }
@@ -462,3 +635,47 @@ impl JsonSerde for TableDescriptor {
         builder.build()
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::DataTypes;
+
+    #[test]
+    fn test_datatype_json_serde() {
+        let data_types = vec![
+            DataTypes::boolean(),
+            DataTypes::tinyint(),
+            DataTypes::smallint(),
+            DataTypes::int().as_non_nullable(),
+            DataTypes::bigint(),
+            DataTypes::float(),
+            DataTypes::double(),
+            DataTypes::char(10),
+            DataTypes::string(),
+            DataTypes::decimal(10, 2),
+            DataTypes::date(),
+            DataTypes::time(),
+            DataTypes::timestamp(),
+            DataTypes::timestamp_ltz(),
+            DataTypes::bytes(),
+            DataTypes::binary(100),
+            DataTypes::array(DataTypes::int()),
+            DataTypes::map(DataTypes::string(), DataTypes::int()),
+            DataTypes::row(vec![
+                DataField::new("f1".to_string(), DataTypes::int(), None),
+                DataField::new(
+                    "f2".to_string(),
+                    DataTypes::string(),
+                    Some("desc".to_string()),
+                ),
+            ]),
+        ];
+
+        for dt in data_types {
+            let json = dt.serialize_json().unwrap();
+            let deserialized = DataType::deserialize_json(&json).unwrap();
+            assert_eq!(dt, deserialized);
+        }
+    }
+}

From f98f49fcf00f2507be6148f24a239b066a2abd3f Mon Sep 17 00:00:00 2001
From: Karan Pradhan <78605930+KaranPradhan266@users.noreply.github.com>
Date: Thu, 11 Dec 2025 06:29:30 -0800
Subject: [PATCH 026/287] chore: implemented all get methods for GenericRow
 (#82)

---
 fluss-rust/crates/fluss/src/row/datum.rs | 92 ++++++++++++++++++++++++
 fluss-rust/crates/fluss/src/row/mod.rs   | 40 ++++++-----
 2 files changed, 116 insertions(+), 16 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index ed33b8badf..3e487039b3 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -44,6 +44,8 @@ pub enum Datum<'a> {
     #[display("{0}")]
     Bool(bool),
     #[display("{0}")]
+    Int8(i8),
+    #[display("{0}")]
     Int16(i16),
     #[display("{0}")]
     Int32(i32),
@@ -78,6 +80,13 @@ impl Datum<'_> {
             _ => panic!("not a string: {self:?}"),
         }
     }
+
+    pub fn as_blob(&self) -> &[u8] {
+        match self {
+            Self::Blob(blob) => blob.as_ref(),
+            _ => panic!("not a blob: {self:?}"),
+        }
+    }
 }
 
 // ----------- implement from
@@ -95,6 +104,20 @@ impl<'a> From<i64> for Datum<'a> {
     }
 }
 
+impl<'a> From<i8> for Datum<'a> {
+    #[inline]
+    fn from(i: i8) -> Datum<'a> {
+        Datum::Int8(i)
+    }
+}
+
+impl<'a> From<i16> for Datum<'a> {
+    #[inline]
+    fn from(i: i16) -> Datum<'a> {
+        Datum::Int16(i)
+    }
+}
+
 impl<'a> From<&'a str> for Datum<'a> {
     #[inline]
     fn from(s: &'a str) -> Datum<'a> {
@@ -134,6 +157,18 @@ impl TryFrom<&Datum<'_>> for i32 {
     }
 }
 
+impl TryFrom<&Datum<'_>> for i16 {
+    type Error = ();
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::Int16(i) => Ok(*i),
+            _ => Err(()),
+        }
+    }
+}
+
 impl TryFrom<&Datum<'_>> for i64 {
     type Error = ();
 
@@ -146,6 +181,42 @@ impl TryFrom<&Datum<'_>> for i64 {
     }
 }
 
+impl TryFrom<&Datum<'_>> for f32 {
+    type Error = ();
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::Float32(f) => Ok(f.into_inner()),
+            _ => Err(()),
+        }
+    }
+}
+
+impl TryFrom<&Datum<'_>> for f64 {
+    type Error = ();
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::Float64(f) => Ok(f.into_inner()),
+            _ => Err(()),
+        }
+    }
+}
+
+impl TryFrom<&Datum<'_>> for bool {
+    type Error = ();
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::Bool(b) => Ok(*b),
+            _ => Err(()),
+        }
+    }
+}
+
 impl<'a> TryFrom<&Datum<'a>> for &'a str {
     type Error = ();
 
@@ -158,6 +229,25 @@ impl<'a> TryFrom<&Datum<'a>> for &'a str {
     }
 }
 
+impl TryFrom<&Datum<'_>> for i8 {
+    type Error = ();
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::Int8(i) => Ok(*i),
+            _ => Err(()),
+        }
+    }
+}
+
+impl<'a> From<bool> for Datum<'a> {
+    #[inline]
+    fn from(b: bool) -> Datum<'a> {
+        Datum::Bool(b)
+    }
+}
+
 pub trait ToArrow {
     fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()>;
 }
@@ -184,6 +274,7 @@ impl Datum<'_> {
 
         match self {
             Datum::Null => {
+                append_null_to_arrow!(Int8Builder);
                 append_null_to_arrow!(BooleanBuilder);
                 append_null_to_arrow!(Int16Builder);
                 append_null_to_arrow!(Int32Builder);
@@ -194,6 +285,7 @@ impl Datum<'_> {
                 append_null_to_arrow!(BinaryBuilder);
             }
             Datum::Bool(v) => append_value_to_arrow!(BooleanBuilder, *v),
+            Datum::Int8(v) => append_value_to_arrow!(Int8Builder, *v),
             Datum::Int16(v) => append_value_to_arrow!(Int16Builder, *v),
             Datum::Int32(v) => append_value_to_arrow!(Int32Builder, *v),
             Datum::Int64(v) => append_value_to_arrow!(Int64Builder, *v),
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index aa2c41159e..a3b8885254 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -85,16 +85,16 @@ impl<'a> InternalRow for GenericRow<'a> {
         false
     }
 
-    fn get_boolean(&self, _pos: usize) -> bool {
-        todo!()
+    fn get_boolean(&self, pos: usize) -> bool {
+        self.values.get(pos).unwrap().try_into().unwrap()
     }
 
-    fn get_byte(&self, _pos: usize) -> i8 {
-        todo!()
+    fn get_byte(&self, pos: usize) -> i8 {
+        self.values.get(pos).unwrap().try_into().unwrap()
     }
 
-    fn get_short(&self, _pos: usize) -> i16 {
-        todo!()
+    fn get_short(&self, pos: usize) -> i16 {
+        self.values.get(pos).unwrap().try_into().unwrap()
     }
 
     fn get_int(&self, pos: usize) -> i32 {
@@ -105,28 +105,36 @@ impl<'a> InternalRow for GenericRow<'a> {
         self.values.get(_pos).unwrap().try_into().unwrap()
     }
 
-    fn get_float(&self, _pos: usize) -> f32 {
-        todo!()
+    fn get_float(&self, pos: usize) -> f32 {
+        self.values.get(pos).unwrap().try_into().unwrap()
     }
 
-    fn get_double(&self, _pos: usize) -> f64 {
-        todo!()
+    fn get_double(&self, pos: usize) -> f64 {
+        self.values.get(pos).unwrap().try_into().unwrap()
     }
 
-    fn get_char(&self, _pos: usize, _length: usize) -> String {
-        todo!()
+    fn get_char(&self, pos: usize, length: usize) -> String {
+        let value = self.get_string(pos);
+        if value.len() != length {
+            panic!(
+                "Length mismatch for fixed-size char: expected {}, got {}",
+                length,
+                value.len()
+            );
+        }
+        value.to_string()
     }
 
     fn get_string(&self, pos: usize) -> &str {
         self.values.get(pos).unwrap().try_into().unwrap()
     }
 
-    fn get_binary(&self, _pos: usize, _length: usize) -> Vec<u8> {
-        todo!()
+    fn get_binary(&self, pos: usize, _length: usize) -> Vec<u8> {
+        self.values.get(pos).unwrap().as_blob().to_vec()
     }
 
-    fn get_bytes(&self, _pos: usize) -> Vec<u8> {
-        todo!()
+    fn get_bytes(&self, pos: usize) -> Vec<u8> {
+        self.values.get(pos).unwrap().as_blob().to_vec()
     }
 }
 

From 1239980006b0155c44179b278fa1432ede2384e7 Mon Sep 17 00:00:00 2001
From: Chase Naples <cnaples79@gmail.com>
Date: Thu, 11 Dec 2025 20:34:59 -0500
Subject: [PATCH 027/287] chore: fix GenericRow null detection (#86)

---
 fluss-rust/crates/fluss/src/row/mod.rs | 22 ++++++++++++++++++++--
 1 file changed, 20 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index a3b8885254..909f3b136f 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -81,8 +81,11 @@ impl<'a> InternalRow for GenericRow<'a> {
         self.values.len()
     }
 
-    fn is_null_at(&self, _pos: usize) -> bool {
-        false
+    fn is_null_at(&self, pos: usize) -> bool {
+        self.values
+            .get(pos)
+            .expect("position out of bounds")
+            .is_null()
     }
 
     fn get_boolean(&self, pos: usize) -> bool {
@@ -153,3 +156,18 @@ impl<'a> GenericRow<'a> {
         self.values.insert(pos, value.into());
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn is_null_at_checks_datum_nullity() {
+        let mut row = GenericRow::new();
+        row.set_field(0, Datum::Null);
+        row.set_field(1, 42_i32);
+
+        assert!(row.is_null_at(0));
+        assert!(!row.is_null_at(1));
+    }
+}

From 5ed475e9ffd6da7756115d317f210c1a83990375 Mon Sep 17 00:00:00 2001
From: Junbo Wang <beryllwang@gmail.com>
Date: Fri, 12 Dec 2025 19:58:59 +0800
Subject: [PATCH 028/287] chore: Implement datatype conversion for all types in
 arrow.rs (#81)

---
 .../crates/fluss/src/metadata/datatype.rs     |  40 ++--
 fluss-rust/crates/fluss/src/record/arrow.rs   | 212 +++++++++++++++++-
 2 files changed, 223 insertions(+), 29 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 4deed2bce0..8ad4f7e569 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -96,25 +96,25 @@ impl DataType {
 impl Display for DataType {
     fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
         match self {
-            DataType::Boolean(v) => write!(f, "{}", v),
-            DataType::TinyInt(v) => write!(f, "{}", v),
-            DataType::SmallInt(v) => write!(f, "{}", v),
-            DataType::Int(v) => write!(f, "{}", v),
-            DataType::BigInt(v) => write!(f, "{}", v),
-            DataType::Float(v) => write!(f, "{}", v),
-            DataType::Double(v) => write!(f, "{}", v),
-            DataType::Char(v) => write!(f, "{}", v),
-            DataType::String(v) => write!(f, "{}", v),
-            DataType::Decimal(v) => write!(f, "{}", v),
-            DataType::Date(v) => write!(f, "{}", v),
-            DataType::Time(v) => write!(f, "{}", v),
-            DataType::Timestamp(v) => write!(f, "{}", v),
-            DataType::TimestampLTz(v) => write!(f, "{}", v),
-            DataType::Bytes(v) => write!(f, "{}", v),
-            DataType::Binary(v) => write!(f, "{}", v),
-            DataType::Array(v) => write!(f, "{}", v),
-            DataType::Map(v) => write!(f, "{}", v),
-            DataType::Row(v) => write!(f, "{}", v),
+            DataType::Boolean(v) => write!(f, "{v}"),
+            DataType::TinyInt(v) => write!(f, "{v}"),
+            DataType::SmallInt(v) => write!(f, "{v}"),
+            DataType::Int(v) => write!(f, "{v}"),
+            DataType::BigInt(v) => write!(f, "{v}"),
+            DataType::Float(v) => write!(f, "{v}"),
+            DataType::Double(v) => write!(f, "{v}"),
+            DataType::Char(v) => write!(f, "{v}"),
+            DataType::String(v) => write!(f, "{v}"),
+            DataType::Decimal(v) => write!(f, "{v}"),
+            DataType::Date(v) => write!(f, "{v}"),
+            DataType::Time(v) => write!(f, "{v}"),
+            DataType::Timestamp(v) => write!(f, "{v}"),
+            DataType::TimestampLTz(v) => write!(f, "{v}"),
+            DataType::Bytes(v) => write!(f, "{v}"),
+            DataType::Binary(v) => write!(f, "{v}"),
+            DataType::Array(v) => write!(f, "{v}"),
+            DataType::Map(v) => write!(f, "{v}"),
+            DataType::Row(v) => write!(f, "{v}"),
         }
     }
 }
@@ -861,7 +861,7 @@ impl Display for RowType {
             if i > 0 {
                 write!(f, ", ")?;
             }
-            write!(f, "{}", field)?;
+            write!(f, "{field}")?;
         }
         write!(f, ">")?;
         if !self.nullable {
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 29bfe41a21..e46093dd14 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -589,16 +589,84 @@ pub fn to_arrow_type(fluss_type: &DataType) -> ArrowDataType {
         DataType::Double(_) => ArrowDataType::Float64,
         DataType::Char(_) => ArrowDataType::Utf8,
         DataType::String(_) => ArrowDataType::Utf8,
-        DataType::Decimal(_) => todo!(),
+        DataType::Decimal(decimal_type) => ArrowDataType::Decimal128(
+            decimal_type
+                .precision()
+                .try_into()
+                .expect("precision exceeds u8::MAX"),
+            decimal_type
+                .scale()
+                .try_into()
+                .expect("scale exceeds i8::MAX"),
+        ),
         DataType::Date(_) => ArrowDataType::Date32,
-        DataType::Time(_) => todo!(),
-        DataType::Timestamp(_) => todo!(),
-        DataType::TimestampLTz(_) => todo!(),
-        DataType::Bytes(_) => todo!(),
-        DataType::Binary(_) => todo!(),
-        DataType::Array(_data_type) => todo!(),
-        DataType::Map(_data_type) => todo!(),
-        DataType::Row(_data_fields) => todo!(),
+        DataType::Time(time_type) => match time_type.precision() {
+            0 => ArrowDataType::Time32(arrow_schema::TimeUnit::Second),
+            1..=3 => ArrowDataType::Time32(arrow_schema::TimeUnit::Millisecond),
+            4..=6 => ArrowDataType::Time64(arrow_schema::TimeUnit::Microsecond),
+            7..=9 => ArrowDataType::Time64(arrow_schema::TimeUnit::Nanosecond),
+            // This arm should never be reached due to validation in TimeType.
+            invalid => panic!("Invalid precision value for TimeType: {invalid}"),
+        },
+        DataType::Timestamp(timestamp_type) => match timestamp_type.precision() {
+            0 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, None),
+            1..=3 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, None),
+            4..=6 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, None),
+            7..=9 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, None),
+            // This arm should never be reached due to validation in Timestamp.
+            invalid => panic!("Invalid precision value for TimestampType: {invalid}"),
+        },
+        DataType::TimestampLTz(timestamp_ltz_type) => match timestamp_ltz_type.precision() {
+            0 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, None),
+            1..=3 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, None),
+            4..=6 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, None),
+            7..=9 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, None),
+            // This arm should never be reached due to validation in TimestampLTz.
+            invalid => panic!("Invalid precision value for TimestampLTzType: {invalid}"),
+        },
+        DataType::Bytes(_) => ArrowDataType::Binary,
+        DataType::Binary(binary_type) => ArrowDataType::FixedSizeBinary(
+            binary_type
+                .length()
+                .try_into()
+                .expect("length exceeds i32::MAX"),
+        ),
+        DataType::Array(array_type) => ArrowDataType::List(
+            Field::new_list_field(
+                to_arrow_type(array_type.get_element_type()),
+                fluss_type.is_nullable(),
+            )
+            .into(),
+        ),
+        DataType::Map(map_type) => {
+            let key_type = to_arrow_type(map_type.key_type());
+            let value_type = to_arrow_type(map_type.value_type());
+            let entry_fields = vec![
+                Field::new("key", key_type, map_type.key_type().is_nullable()),
+                Field::new("value", value_type, map_type.value_type().is_nullable()),
+            ];
+            ArrowDataType::Map(
+                Arc::new(Field::new(
+                    "entries",
+                    ArrowDataType::Struct(arrow_schema::Fields::from(entry_fields)),
+                    fluss_type.is_nullable(),
+                )),
+                false,
+            )
+        }
+        DataType::Row(row_type) => ArrowDataType::Struct(arrow_schema::Fields::from(
+            row_type
+                .fields()
+                .iter()
+                .map(|f| {
+                    Field::new(
+                        f.name(),
+                        to_arrow_type(f.data_type()),
+                        f.data_type().is_nullable(),
+                    )
+                })
+                .collect::<Vec<Field>>(),
+        )),
     }
 }
 
@@ -820,3 +888,129 @@ impl ArrowReader {
     }
 }
 pub struct MyVec<T>(pub StreamReader<T>);
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::DataTypes;
+    // Pins the Arrow type produced for each Fluss type, including the precision breakpoints.
+    #[test]
+    fn test_to_arrow_type() {
+        assert_eq!(to_arrow_type(&DataTypes::boolean()), ArrowDataType::Boolean);
+        assert_eq!(to_arrow_type(&DataTypes::tinyint()), ArrowDataType::Int8);
+        assert_eq!(to_arrow_type(&DataTypes::smallint()), ArrowDataType::Int16);
+        assert_eq!(to_arrow_type(&DataTypes::int()), ArrowDataType::Int32);
+        assert_eq!(to_arrow_type(&DataTypes::bigint()), ArrowDataType::Int64);
+        assert_eq!(to_arrow_type(&DataTypes::float()), ArrowDataType::Float32);
+        assert_eq!(to_arrow_type(&DataTypes::double()), ArrowDataType::Float64);
+        assert_eq!(to_arrow_type(&DataTypes::char(16)), ArrowDataType::Utf8);
+        assert_eq!(to_arrow_type(&DataTypes::string()), ArrowDataType::Utf8);
+        assert_eq!(
+            to_arrow_type(&DataTypes::decimal(10, 2)),
+            ArrowDataType::Decimal128(10, 2)
+        );
+        assert_eq!(to_arrow_type(&DataTypes::date()), ArrowDataType::Date32);
+        assert_eq!(
+            to_arrow_type(&DataTypes::time()),
+            ArrowDataType::Time32(arrow_schema::TimeUnit::Second)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::time_with_precision(3)),
+            ArrowDataType::Time32(arrow_schema::TimeUnit::Millisecond)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::time_with_precision(6)),
+            ArrowDataType::Time64(arrow_schema::TimeUnit::Microsecond)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::time_with_precision(9)),
+            ArrowDataType::Time64(arrow_schema::TimeUnit::Nanosecond)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::timestamp_with_precision(0)),
+            ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, None)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::timestamp_with_precision(3)),
+            ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, None)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::timestamp_with_precision(6)),
+            ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, None)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::timestamp_with_precision(9)),
+            ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, None)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(0)),
+            ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, None)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(3)),
+            ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, None)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(6)),
+            ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, None)
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(9)),
+            ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, None)
+        );
+        assert_eq!(to_arrow_type(&DataTypes::bytes()), ArrowDataType::Binary);
+        assert_eq!(
+            to_arrow_type(&DataTypes::binary(16)),
+            ArrowDataType::FixedSizeBinary(16)
+        );
+        // Nested types: ARRAY, MAP and ROW.
+        assert_eq!(
+            to_arrow_type(&DataTypes::array(DataTypes::int())),
+            ArrowDataType::List(Field::new_list_field(ArrowDataType::Int32, true).into())
+        );
+
+        assert_eq!(
+            to_arrow_type(&DataTypes::map(DataTypes::string(), DataTypes::int())),
+            ArrowDataType::Map(
+                Arc::new(Field::new(
+                    "entries",
+                    ArrowDataType::Struct(arrow_schema::Fields::from(vec![
+                        Field::new("key", ArrowDataType::Utf8, true),
+                        Field::new("value", ArrowDataType::Int32, true),
+                    ])),
+                    true,
+                )),
+                false,
+            )
+        );
+
+        assert_eq!(
+            to_arrow_type(&DataTypes::row(vec![
+                DataTypes::field("f1".to_string(), DataTypes::int()),
+                DataTypes::field("f2".to_string(), DataTypes::string()),
+            ])),
+            ArrowDataType::Struct(arrow_schema::Fields::from(vec![
+                Field::new("f1", ArrowDataType::Int32, true),
+                Field::new("f2", ArrowDataType::Utf8, true),
+            ]))
+        );
+    }
+
+    #[test]
+    #[should_panic(expected = "Invalid precision value for TimeType: 10")]
+    fn test_time_invalid_precision() {
+        to_arrow_type(&DataTypes::time_with_precision(10));
+    }
+
+    #[test]
+    #[should_panic(expected = "Invalid precision value for TimestampType: 10")]
+    fn test_timestamp_invalid_precision() {
+        to_arrow_type(&DataTypes::timestamp_with_precision(10));
+    }
+
+    #[test]
+    #[should_panic(expected = "Invalid precision value for TimestampLTzType: 10")]
+    fn test_timestamp_ltz_invalid_precision() {
+        to_arrow_type(&DataTypes::timestamp_ltz_with_precision(10));
+    }
+}

From c3f110436b0be4dc107981571cef45c65425dd57 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Sat, 13 Dec 2025 15:14:05 +0800
Subject: [PATCH 029/287] feat: introduce cpp bindings (#83)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---------

Co-authored-by: 赵海源 <zhaohaiyuan@xiaohongshu.com>
---
 fluss-rust/Cargo.toml                         |   2 +-
 fluss-rust/bindings/cpp/.clang-format         |  21 +
 fluss-rust/bindings/cpp/.gitignore            |   7 +
 fluss-rust/bindings/cpp/CMakeLists.txt        | 107 ++++
 fluss-rust/bindings/cpp/Cargo.toml            |  36 ++
 fluss-rust/bindings/cpp/build.rs              |  24 +
 fluss-rust/bindings/cpp/examples/example.cpp  | 166 ++++++
 fluss-rust/bindings/cpp/include/fluss.hpp     | 461 +++++++++++++++
 fluss-rust/bindings/cpp/src/admin.cpp         | 101 ++++
 fluss-rust/bindings/cpp/src/connection.cpp    |  95 ++++
 fluss-rust/bindings/cpp/src/ffi_converter.hpp | 256 +++++++++
 fluss-rust/bindings/cpp/src/lib.rs            | 523 ++++++++++++++++++
 fluss-rust/bindings/cpp/src/table.cpp         | 228 ++++++++
 fluss-rust/bindings/cpp/src/types.rs          | 485 ++++++++++++++++
 fluss-rust/crates/fluss/src/config.rs         |  14 +-
 15 files changed, 2524 insertions(+), 2 deletions(-)
 create mode 100644 fluss-rust/bindings/cpp/.clang-format
 create mode 100644 fluss-rust/bindings/cpp/.gitignore
 create mode 100644 fluss-rust/bindings/cpp/CMakeLists.txt
 create mode 100644 fluss-rust/bindings/cpp/Cargo.toml
 create mode 100644 fluss-rust/bindings/cpp/build.rs
 create mode 100644 fluss-rust/bindings/cpp/examples/example.cpp
 create mode 100644 fluss-rust/bindings/cpp/include/fluss.hpp
 create mode 100644 fluss-rust/bindings/cpp/src/admin.cpp
 create mode 100644 fluss-rust/bindings/cpp/src/connection.cpp
 create mode 100644 fluss-rust/bindings/cpp/src/ffi_converter.hpp
 create mode 100644 fluss-rust/bindings/cpp/src/lib.rs
 create mode 100644 fluss-rust/bindings/cpp/src/table.cpp
 create mode 100644 fluss-rust/bindings/cpp/src/types.rs

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 15bcb796fd..b4ac03b7be 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -28,7 +28,7 @@ rust-version = "1.85"
 
 [workspace]
 resolver = "2"
-members = ["crates/fluss", "crates/examples", "bindings/python"]
+members = ["crates/fluss", "crates/examples", "bindings/python", "bindings/cpp"]
 
 [workspace.dependencies]
 fluss = { version = "0.1.0", path = "./crates/fluss" }
diff --git a/fluss-rust/bindings/cpp/.clang-format b/fluss-rust/bindings/cpp/.clang-format
new file mode 100644
index 0000000000..1c31900ec4
--- /dev/null
+++ b/fluss-rust/bindings/cpp/.clang-format
@@ -0,0 +1,21 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+---
+BasedOnStyle: Google
+ColumnLimit: 100
+IndentWidth: 4
diff --git a/fluss-rust/bindings/cpp/.gitignore b/fluss-rust/bindings/cpp/.gitignore
new file mode 100644
index 0000000000..6836e70c06
--- /dev/null
+++ b/fluss-rust/bindings/cpp/.gitignore
@@ -0,0 +1,7 @@
+build/
+cmake-build-*/
+.idea/
+*.o
+*.a
+*.so
+*.dylib
diff --git a/fluss-rust/bindings/cpp/CMakeLists.txt b/fluss-rust/bindings/cpp/CMakeLists.txt
new file mode 100644
index 0000000000..629f3f076d
--- /dev/null
+++ b/fluss-rust/bindings/cpp/CMakeLists.txt
@@ -0,0 +1,107 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+cmake_minimum_required(VERSION 3.22)
+
+if (POLICY CMP0135)
+    cmake_policy(SET CMP0135 NEW)
+endif()
+
+project(fluss-cpp LANGUAGES CXX)
+
+include(FetchContent)
+set(FLUSS_GOOGLETEST_VERSION 1.15.2 CACHE STRING "version of GoogleTest")
+set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
+
+find_package(Threads REQUIRED)
+
+if (NOT CMAKE_BUILD_TYPE)
+    set(CMAKE_BUILD_TYPE Debug)
+endif()
+
+set(CMAKE_CXX_STANDARD 17)
+set(CMAKE_CXX_STANDARD_REQUIRED ON)
+
+option(FLUSS_ENABLE_ADDRESS_SANITIZER "Enable address sanitizer" OFF)
+option(FLUSS_ENABLE_TESTING "Enable building test binary for fluss" OFF)
+option(FLUSS_DEV "Enable dev mode" OFF)
+
+if (FLUSS_DEV)
+    set(FLUSS_ENABLE_ADDRESS_SANITIZER ON)
+    set(FLUSS_ENABLE_TESTING ON)
+endif()
+
+# Get cargo target dir
+execute_process(COMMAND cargo locate-project --workspace --message-format plain
+    OUTPUT_VARIABLE CARGO_TARGET_DIR
+    WORKING_DIRECTORY ${PROJECT_SOURCE_DIR})
+string(REGEX REPLACE "/Cargo.toml\n$" "/target" CARGO_TARGET_DIR "${CARGO_TARGET_DIR}")
+
+set(CARGO_MANIFEST ${PROJECT_SOURCE_DIR}/Cargo.toml)
+set(RUST_SOURCE_FILE ${PROJECT_SOURCE_DIR}/src/lib.rs)
+set(RUST_BRIDGE_CPP ${CARGO_TARGET_DIR}/cxxbridge/fluss-cpp/src/lib.rs.cc)
+set(RUST_HEADER_FILE ${CARGO_TARGET_DIR}/cxxbridge/fluss-cpp/src/lib.rs.h)
+
+if (CMAKE_BUILD_TYPE STREQUAL "Debug")
+    set(RUST_LIB ${CARGO_TARGET_DIR}/debug/${CMAKE_STATIC_LIBRARY_PREFIX}fluss_cpp${CMAKE_STATIC_LIBRARY_SUFFIX})
+else()
+    set(RUST_LIB ${CARGO_TARGET_DIR}/release/${CMAKE_STATIC_LIBRARY_PREFIX}fluss_cpp${CMAKE_STATIC_LIBRARY_SUFFIX})
+endif()
+
+set(CPP_INCLUDE_DIR ${PROJECT_SOURCE_DIR}/include
+                    ${PROJECT_SOURCE_DIR}/src
+                    ${CARGO_TARGET_DIR}/cxxbridge
+                    ${CARGO_TARGET_DIR}/cxxbridge/fluss-cpp/src)
+
+file(GLOB CPP_SOURCE_FILE "src/*.cpp")
+file(GLOB CPP_HEADER_FILE "include/*.hpp")
+
+if (NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
+    list(APPEND CARGO_BUILD_FLAGS "--release")
+endif()
+
+add_custom_target(cargo_build
+    COMMAND cargo build --manifest-path ${CARGO_MANIFEST} ${CARGO_BUILD_FLAGS}
+    BYPRODUCTS ${RUST_BRIDGE_CPP} ${RUST_LIB} ${RUST_HEADER_FILE}
+    DEPENDS ${RUST_SOURCE_FILE}
+    USES_TERMINAL
+    COMMENT "Running cargo..."
+)
+
+add_library(fluss_cpp STATIC ${CPP_SOURCE_FILE} ${RUST_BRIDGE_CPP})
+target_sources(fluss_cpp PUBLIC ${CPP_HEADER_FILE})
+target_sources(fluss_cpp PRIVATE ${RUST_HEADER_FILE})
+target_include_directories(fluss_cpp PUBLIC ${CPP_INCLUDE_DIR})
+target_link_libraries(fluss_cpp PUBLIC ${RUST_LIB})
+target_link_libraries(fluss_cpp PRIVATE ${CMAKE_DL_LIBS} Threads::Threads)
+if(APPLE)
+    target_link_libraries(fluss_cpp PUBLIC "-framework CoreFoundation" "-framework Security")
+endif()
+
+add_executable(fluss_cpp_example examples/example.cpp)
+target_link_libraries(fluss_cpp_example fluss_cpp)
+target_include_directories(fluss_cpp_example PUBLIC ${CPP_INCLUDE_DIR})
+
+set_target_properties(fluss_cpp PROPERTIES ADDITIONAL_CLEAN_FILES ${CARGO_TARGET_DIR})
+add_dependencies(fluss_cpp cargo_build)
+
+if (FLUSS_ENABLE_ADDRESS_SANITIZER)
+    # fluss_cpp is a static library and is never linked itself, so the sanitizer link flags
+    # must be PUBLIC to reach the executables that link against it.
+    target_compile_options(fluss_cpp PRIVATE -fsanitize=leak,address,undefined -fno-omit-frame-pointer -fno-common -O1)
+    target_link_options(fluss_cpp PUBLIC -fsanitize=leak,address,undefined)
+endif()
\ No newline at end of file
diff --git a/fluss-rust/bindings/cpp/Cargo.toml b/fluss-rust/bindings/cpp/Cargo.toml
new file mode 100644
index 0000000000..2d3d913550
--- /dev/null
+++ b/fluss-rust/bindings/cpp/Cargo.toml
@@ -0,0 +1,36 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[package]
+name = "fluss-cpp"
+version = "0.1.0"
+edition.workspace = true
+rust-version.workspace = true
+publish = false
+
+[lib]
+crate-type = ["staticlib"]
+
+[dependencies]
+anyhow = "1.0"
+arrow = { workspace = true }
+cxx = "1.0"
+fluss = { path = "../../crates/fluss" }
+tokio = { version = "1.27", features = ["rt-multi-thread", "macros"] }
+
+[build-dependencies]
+cxx-build = "1.0"
diff --git a/fluss-rust/bindings/cpp/build.rs b/fluss-rust/bindings/cpp/build.rs
new file mode 100644
index 0000000000..ec75e24aeb
--- /dev/null
+++ b/fluss-rust/bindings/cpp/build.rs
@@ -0,0 +1,24 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+// Generates and compiles the cxx bridge declared in src/lib.rs as C++17.
+fn main() {
+    const BRIDGE_SOURCE: &str = "src/lib.rs";
+    let mut bridge = cxx_build::bridge(BRIDGE_SOURCE);
+    bridge.std("c++17").compile("fluss-cpp-bridge");
+    println!("cargo:rerun-if-changed={BRIDGE_SOURCE}");
+}
diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
new file mode 100644
index 0000000000..5146f28216
--- /dev/null
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -0,0 +1,166 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#include "fluss.hpp"
+
+#include <iostream>
+#include <vector>
+
+// Prints the failure for `step` to stderr and exits with status 1 unless `r` is Ok.
+static void check(const char* step, const fluss::Result& r) {
+    if (r.Ok()) return;
+    std::cerr << step << " failed: code=" << r.error_code << " msg=" << r.error_message
+              << std::endl;
+    std::exit(1);
+}
+
+int main() {
+    // 1) Connect
+    fluss::Connection conn;
+    check("connect", fluss::Connection::Connect("127.0.0.1:9123", conn));
+
+    // 2) Admin
+    fluss::Admin admin;
+    check("get_admin", conn.GetAdmin(admin));
+
+    // 3) Schema & descriptor
+    auto schema = fluss::Schema::NewBuilder()
+                        .AddColumn("id", fluss::DataType::Int)
+                        .AddColumn("name", fluss::DataType::String)
+                        .AddColumn("score", fluss::DataType::Float)
+                        .AddColumn("age", fluss::DataType::Int)
+                        .Build();
+
+    auto descriptor = fluss::TableDescriptor::NewBuilder()
+                          .SetSchema(schema)
+                          .SetBucketCount(1)
+                          .SetProperty("table.log.arrow.compression.type", "NONE")
+                          .SetComment("cpp example table")
+                          .Build();
+
+    fluss::TablePath table_path("fluss", "sample_table_cpp_v1");
+    // ignore_if_exists=true to allow re-run
+    check("create_table", admin.CreateTable(table_path, descriptor, true));
+
+    // 4) Get table
+    fluss::Table table;
+    check("get_table", conn.GetTable(table_path, table));
+
+    // 5) Writer
+    fluss::AppendWriter writer;
+    check("new_append_writer", table.NewAppendWriter(writer));
+
+    struct RowData {
+        int id;
+        const char* name;
+        float score;
+        int age;
+    };
+
+    std::vector<RowData> rows = {
+        {1, "Alice", 95.2f, 25},
+        {2, "Bob", 87.2f, 30},
+        {3, "Charlie", 92.1f, 35},
+    };
+
+    for (const auto& r : rows) {
+        fluss::GenericRow row;
+        row.SetInt32(0, r.id);
+        row.SetString(1, r.name);
+        row.SetFloat32(2, r.score);
+        row.SetInt32(3, r.age);
+        check("append", writer.Append(row));
+    }
+    check("flush", writer.Flush());
+    std::cout << "Wrote " << rows.size() << " rows" << std::endl;
+
+    // 6) Scan
+    fluss::LogScanner scanner;
+    check("new_log_scanner", table.NewLogScanner(scanner));
+
+    auto info = table.GetTableInfo();
+    int buckets = info.num_buckets;
+    for (int b = 0; b < buckets; ++b) {
+        check("subscribe", scanner.Subscribe(b, 0));
+    }
+
+    fluss::ScanRecords records;
+    check("poll", scanner.Poll(5000, records));
+
+    std::cout << "Scanned records: " << records.records.size() << std::endl;
+    for (const auto& rec : records.records) {
+        std::cout << " offset=" << rec.offset << " id=" << rec.row.fields[0].i32_val
+                  << " name=" << rec.row.fields[1].string_val
+                  << " score=" << rec.row.fields[2].f32_val << " age=" << rec.row.fields[3].i32_val
+                  << " ts=" << rec.timestamp << std::endl;
+    }
+
+    // 7) Project only id (0) and name (1) columns
+    std::vector<size_t> projected_columns = {0, 1};
+    fluss::LogScanner projected_scanner;
+    check("new_log_scanner_with_projection",
+          table.NewLogScannerWithProjection(projected_columns, projected_scanner));
+
+    for (int b = 0; b < buckets; ++b) {
+        check("subscribe_projected", projected_scanner.Subscribe(b, 0));
+    }
+
+    fluss::ScanRecords projected_records;
+    check("poll_projected", projected_scanner.Poll(5000, projected_records));
+
+    std::cout << "Projected records: " << projected_records.records.size() << std::endl;
+    // Every projected record must have exactly the projected field count and types.
+    bool projection_verified = true;
+    for (size_t i = 0; i < projected_records.records.size(); ++i) {
+        const auto& rec = projected_records.records[i];
+        const auto& row = rec.row;
+
+        if (row.fields.size() != projected_columns.size()) {
+            std::cerr << "ERROR: Record " << i << " has " << row.fields.size()
+                      << " fields, expected " << projected_columns.size() << std::endl;
+            projection_verified = false;
+            continue;
+        }
+
+        // Verify field types match expected columns
+        // Column 0 (id) should be Int32, Column 1 (name) should be String
+        if (row.fields[0].type != fluss::DatumType::Int32) {
+            std::cerr << "ERROR: Record " << i << " field 0 type mismatch, expected Int32" << std::endl;
+            projection_verified = false;
+        }
+        if (row.fields[1].type != fluss::DatumType::String) {
+            std::cerr << "ERROR: Record " << i << " field 1 type mismatch, expected String" << std::endl;
+            projection_verified = false;
+        }
+
+        // Print projected data
+        if (row.fields[0].type == fluss::DatumType::Int32 &&
+            row.fields[1].type == fluss::DatumType::String) {
+            std::cout << "  Record " << i << ": id=" << row.fields[0].i32_val
+                      << ", name=" << row.fields[1].string_val << std::endl;
+        }
+    }
+
+    if (projection_verified) {
+        std::cout << "Column pruning verification passed!" << std::endl;
+    } else {
+        std::cerr << "Column pruning verification failed!" << std::endl;
+        std::exit(1);
+    }
+
+    return 0;
+}
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
new file mode 100644
index 0000000000..002f80694a
--- /dev/null
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -0,0 +1,461 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#pragma once
+
+#include <cstdint>
+#include <memory>
+#include <optional>
+#include <string>
+#include <unordered_map>
+#include <vector>
+
+namespace fluss {
+
+namespace ffi {  // Forward declarations only; presumably defined by the FFI bridge (confirm).
+    struct Connection;
+    struct Admin;
+    struct Table;
+    struct AppendWriter;
+    struct LogScanner;
+}  // namespace ffi
+
+enum class DataType {  // Column data types accepted by Schema::Builder::AddColumn.
+    Boolean = 1,
+    TinyInt = 2,
+    SmallInt = 3,
+    Int = 4,
+    BigInt = 5,
+    Float = 6,
+    Double = 7,
+    String = 8,
+    Bytes = 9,
+    Date = 10,
+    Time = 11,
+    Timestamp = 12,
+    TimestampLtz = 13,
+};  // NOTE(review): explicit values presumably mirror the Rust side of the FFI; confirm.
+
+enum class DatumType {  // Tag stored in Datum::type; Null is the default for a new Datum.
+    Null = 0,
+    Bool = 1,
+    Int32 = 2,
+    Int64 = 3,
+    Float32 = 4,
+    Float64 = 5,
+    String = 6,
+    Bytes = 7,
+};
+
+struct Result {  // Status of a call: an error code plus a message.
+    int32_t error_code = 0;
+    std::string error_message;
+    // True when error_code is zero.
+    bool Ok() const { return 0 == error_code; }
+};
+
+struct TablePath {  // Names a table by database name and table name.
+    std::string database_name;
+    std::string table_name;
+
+    TablePath() = default;
+    TablePath(std::string db, std::string tbl)
+        : database_name(std::move(db)), table_name(std::move(tbl)) {}
+    // Renders the path as "<database_name>.<table_name>".
+    std::string ToString() const { return std::string(database_name) + '.' + table_name; }
+};
+
+struct Column {  // One schema column, as appended by Schema::Builder::AddColumn.
+    std::string name;
+    DataType data_type;  // NOTE(review): no initializer; indeterminate if default-constructed.
+    std::string comment;
+};
+
+// A table schema: the column list plus the primary key list.
+struct Schema {
+    std::vector<Column> columns;
+    std::vector<std::string> primary_keys;
+
+    // Fluent builder; every setter returns *this so calls can be chained.
+    class Builder {
+    public:
+        // Appends one column; `comment` defaults to the empty string.
+        Builder& AddColumn(std::string name, DataType type, std::string comment = "") {
+            Column column{std::move(name), type, std::move(comment)};
+            columns_.emplace_back(std::move(column));
+            return *this;
+        }
+        // Replaces any previously configured primary keys.
+        Builder& SetPrimaryKeys(std::vector<std::string> keys) {
+            primary_keys_.swap(keys);
+            return *this;
+        }
+        // Moves the collected state into a Schema; the builder's members are left moved-from.
+        Schema Build() { return Schema{std::move(columns_), std::move(primary_keys_)}; }
+
+    private:
+        std::vector<Column> columns_;
+        std::vector<std::string> primary_keys_;
+    };
+    static Builder NewBuilder() { return Builder(); }
+};
+
+// Describes a table: schema, partition keys, bucket count, bucket keys, properties and comment.
+struct TableDescriptor {
+    Schema schema;
+    std::vector<std::string> partition_keys;
+    int32_t bucket_count{0};
+    std::vector<std::string> bucket_keys;
+    std::unordered_map<std::string, std::string> properties;
+    std::string comment;
+
+    class Builder {  // Fluent builder: each setter returns *this for chaining.
+    public:
+        Builder& SetSchema(Schema s) {
+            schema_ = std::move(s);
+            return *this;
+        }
+
+        Builder& SetPartitionKeys(std::vector<std::string> keys) {
+            partition_keys_.swap(keys);
+            return *this;
+        }
+
+        Builder& SetBucketCount(int32_t count) {
+            bucket_count_ = count;
+            return *this;
+        }
+
+        Builder& SetBucketKeys(std::vector<std::string> keys) {
+            bucket_keys_.swap(keys);
+            return *this;
+        }
+
+        // Adds the property, overwriting the value of an existing key.
+        Builder& SetProperty(std::string key, std::string value) {
+            properties_.insert_or_assign(std::move(key), std::move(value));
+            return *this;
+        }
+
+        Builder& SetComment(std::string comment) {
+            comment_ = std::move(comment);
+            return *this;
+        }
+
+        // Moves the collected values into a TableDescriptor; the members are left moved-from.
+        TableDescriptor Build() {
+            return TableDescriptor{std::move(schema_),     std::move(partition_keys_),
+                                   bucket_count_,          std::move(bucket_keys_),
+                                   std::move(properties_), std::move(comment_)};
+        }
+
+    private:
+        Schema schema_;
+        std::vector<std::string> partition_keys_;
+        int32_t bucket_count_{0};
+        std::vector<std::string> bucket_keys_;
+        std::unordered_map<std::string, std::string> properties_;
+        std::string comment_;
+    };
+
+    static Builder NewBuilder() { return Builder(); }
+};
+
+struct TableInfo {  // Table metadata as filled in by utils::from_ffi_table_info.
+    int64_t table_id;  // scalars have no default initializer: indeterminate until assigned
+    int32_t schema_id;
+    TablePath table_path;
+    int64_t created_time;   // NOTE(review): time unit is not visible here — confirm
+    int64_t modified_time;  // NOTE(review): same unit as created_time — confirm
+    std::vector<std::string> primary_keys;
+    std::vector<std::string> bucket_keys;
+    std::vector<std::string> partition_keys;
+    int32_t num_buckets;
+    bool has_primary_key;
+    bool is_partitioned;
+    std::unordered_map<std::string, std::string> properties;
+    std::string comment;
+    Schema schema;
+};
+
+struct Datum {  // Tagged value: `type` names the one payload member that is meaningful.
+    DatumType type{DatumType::Null};
+    bool bool_val{false};
+    int32_t i32_val{0};
+    int64_t i64_val{0};
+    float f32_val{0.0F};
+    double f64_val{0.0};
+    std::string string_val;
+    std::vector<uint8_t> bytes_val;
+
+    static Datum Null() { return Datum{}; }  // all defaults, tag stays DatumType::Null
+    static Datum Bool(bool v) {
+        Datum out;
+        out.bool_val = v;
+        out.type = DatumType::Bool;
+        return out;
+    }
+    static Datum Int32(int32_t v) {
+        Datum out;
+        out.i32_val = v;
+        out.type = DatumType::Int32;
+        return out;
+    }
+    static Datum Int64(int64_t v) {
+        Datum out;
+        out.i64_val = v;
+        out.type = DatumType::Int64;
+        return out;
+    }
+    static Datum Float32(float v) {
+        Datum out;
+        out.f32_val = v;
+        out.type = DatumType::Float32;
+        return out;
+    }
+    static Datum Float64(double v) {
+        Datum out;
+        out.f64_val = v;
+        out.type = DatumType::Float64;
+        return out;
+    }
+    static Datum String(std::string v) {
+        Datum out;
+        out.string_val = std::move(v);  // takes ownership of the caller's string
+        out.type = DatumType::String;
+        return out;
+    }
+    static Datum Bytes(std::vector<uint8_t> v) {
+        Datum out;
+        out.bytes_val = std::move(v);  // takes ownership of the caller's buffer
+        out.type = DatumType::Bytes;
+        return out;
+    }
+};
+
+struct GenericRow {  // Positional row of datums; setters grow the row on demand.
+    std::vector<Datum> fields;
+
+    void SetNull(size_t idx) {
+        Datum& slot = SlotAt(idx);
+        slot = Datum::Null();
+    }
+
+    void SetBool(size_t idx, bool v) {
+        Datum& slot = SlotAt(idx);
+        slot = Datum::Bool(v);
+    }
+
+    void SetInt32(size_t idx, int32_t v) {
+        Datum& slot = SlotAt(idx);
+        slot = Datum::Int32(v);
+    }
+
+    void SetInt64(size_t idx, int64_t v) {
+        Datum& slot = SlotAt(idx);
+        slot = Datum::Int64(v);
+    }
+
+    void SetFloat32(size_t idx, float v) {
+        Datum& slot = SlotAt(idx);
+        slot = Datum::Float32(v);
+    }
+
+    void SetFloat64(size_t idx, double v) {
+        Datum& slot = SlotAt(idx);
+        slot = Datum::Float64(v);
+    }
+
+    void SetString(size_t idx, std::string v) {
+        Datum& slot = SlotAt(idx);
+        slot = Datum::String(std::move(v));
+    }
+
+    void SetBytes(size_t idx, std::vector<uint8_t> v) {
+        Datum& slot = SlotAt(idx);
+        slot = Datum::Bytes(std::move(v));
+    }
+
+private:
+    // Grows `fields` until `idx` is valid (new slots are Null datums) and returns that slot.
+    Datum& SlotAt(size_t idx) {
+        if (idx >= fields.size()) fields.resize(idx + 1);
+        return fields[idx];
+    }
+};
+
+struct ScanRecord {  // One scanned log entry, built by utils::from_ffi_scan_record.
+    int64_t offset;     // no default initializer: indeterminate until assigned
+    int64_t timestamp;  // NOTE(review): unit not visible here — confirm
+    GenericRow row;
+};
+
+struct ScanRecords {  // Batch of records written by LogScanner::Poll into its `out` argument.
+    std::vector<ScanRecord> records;
+
+    size_t Size() const { return records.size(); }
+    bool Empty() const { return records.empty(); }
+    const ScanRecord& operator[](size_t idx) const { return records[idx]; }  // unchecked access
+
+    auto begin() const { return records.begin(); }  // begin()/end() allow range-for over the batch
+    auto end() const { return records.end(); }
+};
+
+struct BucketOffset {  // One entry of LakeSnapshot::bucket_offsets; field order is relied on by brace-init.
+    int64_t table_id;  // no default initializers: indeterminate until assigned
+    int64_t partition_id;
+    int32_t bucket_id;
+    int64_t offset;
+};
+
+struct LakeSnapshot {  // Result payload of Admin::GetLatestLakeSnapshot.
+    int64_t snapshot_id;  // no default initializer: indeterminate until assigned
+    std::vector<BucketOffset> bucket_offsets;
+};
+
+class AppendWriter;
+class LogScanner;
+class Admin;
+class Table;
+
+class Connection {  // Move-only owner of an ffi::Connection handle.
+public:
+    Connection() noexcept;   // starts without a handle (conn_ == nullptr)
+    ~Connection() noexcept;  // releases the handle through Destroy()
+
+    Connection(const Connection&) = delete;
+    Connection& operator=(const Connection&) = delete;
+    Connection(Connection&& other) noexcept;  // takes other's handle; other becomes unavailable
+    Connection& operator=(Connection&& other) noexcept;
+
+    static Result Connect(const std::string& bootstrap_server, Connection& out);  // handle is stored into `out`
+
+    bool Available() const;  // true while a handle is held
+
+    Result GetAdmin(Admin& out);  // fails with "Connection not available" when no handle is held
+    Result GetTable(const TablePath& table_path, Table& out);
+
+private:
+    void Destroy() noexcept;  // frees the handle, if any, and resets conn_ to nullptr
+    ffi::Connection* conn_{nullptr};
+};
+
+class Admin {  // Move-only owner of an ffi::Admin handle; populated by Connection::GetAdmin.
+public:
+    Admin() noexcept;   // starts without a handle (admin_ == nullptr)
+    ~Admin() noexcept;  // releases the handle through Destroy()
+
+    Admin(const Admin&) = delete;
+    Admin& operator=(const Admin&) = delete;
+    Admin(Admin&& other) noexcept;  // takes other's handle; other becomes unavailable
+    Admin& operator=(Admin&& other) noexcept;
+
+    bool Available() const;  // true while a handle is held
+
+    Result CreateTable(const TablePath& table_path,
+                       const TableDescriptor& descriptor,
+                       bool ignore_if_exists = false);
+
+    Result GetTable(const TablePath& table_path, TableInfo& out);  // `out` is written only on success
+
+    Result GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& out);  // `out` written only on success
+
+private:
+    friend class Connection;  // Connection::GetAdmin writes admin_ directly
+    Admin(ffi::Admin* admin) noexcept;  // adopts ownership of `admin`
+
+    void Destroy() noexcept;  // frees the handle, if any, and resets admin_ to nullptr
+    ffi::Admin* admin_{nullptr};
+};
+
+class Table {  // Move-only owner of an ffi::Table handle; populated by Connection::GetTable.
+public:
+    Table() noexcept;
+    ~Table() noexcept;
+
+    Table(const Table&) = delete;
+    Table& operator=(const Table&) = delete;
+    Table(Table&& other) noexcept;
+    Table& operator=(Table&& other) noexcept;
+
+    bool Available() const;  // presumably "handle is non-null", as in Connection/Admin — confirm in table.cpp
+
+    Result NewAppendWriter(AppendWriter& out);
+    Result NewLogScanner(LogScanner& out);
+    Result NewLogScannerWithProjection(const std::vector<size_t>& column_indices, LogScanner& out);
+
+    TableInfo GetTableInfo() const;
+    TablePath GetTablePath() const;
+    bool HasPrimaryKey() const;
+
+private:
+    friend class Connection;  // Connection::GetTable writes table_ directly
+    Table(ffi::Table* table) noexcept;
+
+    void Destroy() noexcept;
+    ffi::Table* table_{nullptr};  // nullptr until a handle is assigned
+};
+
+class AppendWriter {  // Move-only owner of an ffi::AppendWriter handle; obtained via Table::NewAppendWriter.
+public:
+    AppendWriter() noexcept;
+    ~AppendWriter() noexcept;
+
+    AppendWriter(const AppendWriter&) = delete;
+    AppendWriter& operator=(const AppendWriter&) = delete;
+    AppendWriter(AppendWriter&& other) noexcept;
+    AppendWriter& operator=(AppendWriter&& other) noexcept;
+
+    bool Available() const;  // presumably "handle is non-null" — confirm in the implementation file
+
+    Result Append(const GenericRow& row);
+    Result Flush();
+
+private:
+    friend class Table;  // Table is the only class allowed to create a live writer
+    AppendWriter(ffi::AppendWriter* writer) noexcept;
+
+    void Destroy() noexcept;
+    ffi::AppendWriter* writer_{nullptr};  // nullptr until a handle is assigned
+};
+
+class LogScanner {  // Move-only owner of an ffi::LogScanner handle; obtained via Table::NewLogScanner*.
+public:
+    LogScanner() noexcept;
+    ~LogScanner() noexcept;
+
+    LogScanner(const LogScanner&) = delete;
+    LogScanner& operator=(const LogScanner&) = delete;
+    LogScanner(LogScanner&& other) noexcept;
+    LogScanner& operator=(LogScanner&& other) noexcept;
+
+    bool Available() const;  // presumably "handle is non-null" — confirm in the implementation file
+
+    Result Subscribe(int32_t bucket_id, int64_t start_offset);
+    Result Poll(int64_t timeout_ms, ScanRecords& out);  // timeout is expressed in milliseconds
+
+private:
+    friend class Table;  // Table is the only class allowed to create a live scanner
+    LogScanner(ffi::LogScanner* scanner) noexcept;
+
+    void Destroy() noexcept;
+    ffi::LogScanner* scanner_{nullptr};  // nullptr until a handle is assigned
+};
+
+}  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
new file mode 100644
index 0000000000..f6997a640a
--- /dev/null
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -0,0 +1,101 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "fluss.hpp"
+#include "lib.rs.h"
+#include "ffi_converter.hpp"
+#include "rust/cxx.h"
+
+namespace fluss {
+
+Admin::Admin() noexcept = default;  // admin_ starts as nullptr via its member initializer
+
+Admin::Admin(ffi::Admin* admin) noexcept : admin_(admin) {}  // adopts ownership of `admin`
+
+Admin::~Admin() noexcept { Destroy(); }
+
+void Admin::Destroy() noexcept {
+    // Nothing to free for a default-constructed or moved-from wrapper.
+    if (admin_ == nullptr) return;
+    ffi::delete_admin(admin_);
+    admin_ = nullptr;
+}
+
+Admin::Admin(Admin&& other) noexcept : admin_(other.admin_) {
+    other.admin_ = nullptr;  // the source must not free the handle it just gave away
+}
+
+Admin& Admin::operator=(Admin&& other) noexcept {
+    // Self-move keeps the current handle; otherwise free ours, then take theirs.
+    if (this == &other) return *this;
+    Destroy();
+    admin_ = other.admin_;
+    other.admin_ = nullptr;
+    return *this;
+}
+
+bool Admin::Available() const { return admin_ != nullptr; }
+
+Result Admin::CreateTable(const TablePath& table_path,
+                          const TableDescriptor& descriptor, bool ignore_if_exists) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+    try {  // the converters build rust::String values, which throw on non-UTF-8 input
+        auto ffi_path = utils::to_ffi_table_path(table_path);
+        auto ffi_desc = utils::to_ffi_table_descriptor(descriptor);
+        return utils::from_ffi_result(admin_->create_table(ffi_path, ffi_desc, ignore_if_exists));
+    } catch (const std::exception& e) {  // report as a Result, as the Connection methods do
+        return utils::make_error(1, e.what());
+    }
+}
+
+Result Admin::GetTable(const TablePath& table_path, TableInfo& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+    try {  // the path converter builds rust::String values, which throw on non-UTF-8 input
+        auto ffi_result = admin_->get_table_info(utils::to_ffi_table_path(table_path));
+        auto result = utils::from_ffi_result(ffi_result.result);
+        if (result.Ok()) {
+            out = utils::from_ffi_table_info(ffi_result.table_info);  // `out` is untouched on failure
+        }
+        return result;
+    } catch (const std::exception& e) {  // report as a Result, as the Connection methods do
+        return utils::make_error(1, e.what());
+    }
+}
+
+Result Admin::GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+    try {  // the path converter builds rust::String values, which throw on non-UTF-8 input
+        auto ffi_result = admin_->get_latest_lake_snapshot(utils::to_ffi_table_path(table_path));
+        auto result = utils::from_ffi_result(ffi_result.result);
+        if (result.Ok()) {
+            out = utils::from_ffi_lake_snapshot(ffi_result.lake_snapshot);  // `out` untouched on failure
+        }
+        return result;
+    } catch (const std::exception& e) {  // report as a Result, as the Connection methods do
+        return utils::make_error(1, e.what());
+    }
+}
+
+}  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/connection.cpp b/fluss-rust/bindings/cpp/src/connection.cpp
new file mode 100644
index 0000000000..ea884cdb1f
--- /dev/null
+++ b/fluss-rust/bindings/cpp/src/connection.cpp
@@ -0,0 +1,95 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "fluss.hpp"
+#include "lib.rs.h"
+#include "ffi_converter.hpp"
+#include "rust/cxx.h"
+
+namespace fluss {
+
+Connection::Connection() noexcept = default;  // conn_ starts as nullptr via its member initializer
+
+Connection::~Connection() noexcept { Destroy(); }
+
+void Connection::Destroy() noexcept {
+    // Nothing to free for a default-constructed or moved-from wrapper.
+    if (conn_ == nullptr) return;
+    ffi::delete_connection(conn_);
+    conn_ = nullptr;
+}
+
+Connection::Connection(Connection&& other) noexcept : conn_(other.conn_) {
+    other.conn_ = nullptr;  // the source must not free the handle it just gave away
+}
+
+Connection& Connection::operator=(Connection&& other) noexcept {
+    // Self-move keeps the current handle; otherwise free ours, then take theirs.
+    if (this == &other) return *this;
+    Destroy();
+    conn_ = other.conn_;
+    other.conn_ = nullptr;
+    return *this;
+}
+
+Result Connection::Connect(const std::string& bootstrap_server, Connection& out) {
+    try {  // connect first: if this throws, `out` keeps whatever handle it already had
+        auto* conn = ffi::new_connection(bootstrap_server);
+        out.Destroy();  // release a previously held handle instead of leaking it
+        out.conn_ = conn;
+        return utils::make_ok();
+    } catch (const std::exception& e) {  // also covers rust::Error, which derives from it
+        return utils::make_error(1, e.what());
+    }
+}
+
+bool Connection::Available() const { return conn_ != nullptr; }  // true while a handle is held
+
+Result Connection::GetAdmin(Admin& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Connection not available");
+    }
+
+    try {  // fetch first: if this throws, `out` keeps whatever handle it already had
+        auto* admin = conn_->get_admin();
+        out.Destroy();  // release a previously held handle instead of leaking it
+        out.admin_ = admin;
+        return utils::make_ok();
+    } catch (const std::exception& e) {  // also covers rust::Error, which derives from it
+        return utils::make_error(1, e.what());
+    }
+}
+
+Result Connection::GetTable(const TablePath& table_path, Table& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Connection not available");
+    }
+
+    try {  // fetch first: if anything throws, `out` keeps whatever handle it already had
+        auto ffi_path = utils::to_ffi_table_path(table_path);
+        auto* table = conn_->get_table(ffi_path);
+        out.Destroy();  // release a previously held handle instead of leaking it
+        out.table_ = table;
+        return utils::make_ok();
+    } catch (const std::exception& e) {  // also covers rust::Error, which derives from it
+        return utils::make_error(1, e.what());
+    }
+}
+
+}  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
new file mode 100644
index 0000000000..52dd7fe5d4
--- /dev/null
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -0,0 +1,256 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#pragma once
+
+#include "fluss.hpp"
+#include "lib.rs.h"
+
+namespace fluss {
+namespace utils {
+
+inline Result make_error(int32_t code, std::string msg) {  // failure Result carrying `code` and `msg`
+    return Result{code, std::move(msg)};
+}
+
+inline Result make_ok() {  // success Result: code 0 with an empty message
+    return Result{0, {}};
+}
+
+inline Result from_ffi_result(const ffi::FfiResult& ffi_result) {  // copies code and message across the FFI
+    return Result{ffi_result.error_code, std::string(ffi_result.error_message)};
+}
+
+inline ffi::FfiTablePath to_ffi_table_path(const TablePath& path) {
+    ffi::FfiTablePath out;  // both names are copied into Rust-owned strings
+    out.database_name = rust::String(path.database_name);
+    out.table_name = rust::String(path.table_name);
+    return out;
+}
+
+inline ffi::FfiColumn to_ffi_column(const Column& col) {
+    ffi::FfiColumn out;
+    out.name = rust::String(col.name);
+    out.data_type = static_cast<int32_t>(col.data_type);  // the type crosses the FFI as a plain int32
+    out.comment = rust::String(col.comment);
+    return out;
+}
+
+inline ffi::FfiSchema to_ffi_schema(const Schema& schema) {
+    ffi::FfiSchema out;
+
+    // Fill the Rust-side vectors in place; a default-constructed
+    // ffi::FfiSchema starts with both of them empty.
+    for (const auto& column : schema.columns) {
+        out.columns.push_back(to_ffi_column(column));
+    }
+
+    // Primary-key names are appended in the order the schema lists them,
+    // each one copied into a Rust-owned string.
+    for (const auto& key : schema.primary_keys) {
+        out.primary_keys.push_back(rust::String(key));
+    }
+
+    return out;
+}
+
+// Flattens a TableDescriptor into the FFI struct consumed by the Rust side.
+// Every string member is copied into a Rust-owned rust::String and every
+// list is appended element by element, preserving its order.
+inline ffi::FfiTableDescriptor to_ffi_table_descriptor(const TableDescriptor& desc) {
+    ffi::FfiTableDescriptor out;
+
+    // Nested schema, scalar and comment first.
+    out.schema = to_ffi_schema(desc.schema);
+    out.bucket_count = desc.bucket_count;
+    out.comment = rust::String(desc.comment);
+
+    // Key lists go straight into the (initially empty) Rust vectors.
+    for (const auto& key : desc.partition_keys) {
+        out.partition_keys.push_back(rust::String(key));
+    }
+
+    for (const auto& key : desc.bucket_keys) {
+        out.bucket_keys.push_back(rust::String(key));
+    }
+
+    // The unordered_map is flattened into key/value pairs. Its iteration
+    // order is unspecified, so the order of the pairs is unspecified too.
+    for (const auto& [name, value] : desc.properties) {
+        ffi::HashMapValue entry;
+        entry.key = rust::String(name);
+        entry.value = rust::String(value);
+        out.properties.push_back(std::move(entry));
+    }
+
+    // All members are populated at this point.
+    return out;
+}
+
+// Mirrors a Datum into its FFI form; every payload slot is copied, whatever `datum.type` is.
+inline ffi::FfiDatum to_ffi_datum(const Datum& datum) {
+    ffi::FfiDatum out;
+    out.datum_type = static_cast<int32_t>(datum.type);
+    out.bool_val = datum.bool_val;
+    out.i32_val = datum.i32_val;
+    out.i64_val = datum.i64_val;
+    out.f32_val = datum.f32_val;
+    out.f64_val = datum.f64_val;
+    out.string_val = rust::String(datum.string_val);
+
+    // Reserve once so a large byte payload is not reallocated repeatedly while copying.
+    out.bytes_val.reserve(datum.bytes_val.size());
+    for (auto b : datum.bytes_val) {
+        out.bytes_val.push_back(b);
+    }
+    return out;
+}
+
+inline ffi::FfiGenericRow to_ffi_generic_row(const GenericRow& row) {
+    ffi::FfiGenericRow out;
+
+    // Convert field by field, preserving positions. The default-constructed
+    // out.fields starts empty, so it can be appended to directly.
+    for (const auto& datum : row.fields) {
+        out.fields.push_back(to_ffi_datum(datum));
+    }
+
+    return out;
+}
+
+inline Column from_ffi_column(const ffi::FfiColumn& ffi_col) {
+    // The type arrives as a plain int32 and is cast back without range checking.
+    const DataType type = static_cast<DataType>(ffi_col.data_type);
+    return Column{std::string(ffi_col.name), type, std::string(ffi_col.comment)};
+}
+
+
+inline Schema from_ffi_schema(const ffi::FfiSchema& ffi_schema) {
+    Schema out;
+
+    for (const auto& ffi_col : ffi_schema.columns) {  // column order is preserved
+        out.columns.emplace_back(from_ffi_column(ffi_col));
+    }
+
+    for (const auto& key : ffi_schema.primary_keys) {  // rust::String -> std::string copy
+        out.primary_keys.emplace_back(std::string(key));
+    }
+
+    return out;
+}
+
+inline TableInfo from_ffi_table_info(const ffi::FfiTableInfo& ffi_info) {
+    TableInfo out;
+
+    // Plain scalars and flags are copied verbatim.
+    out.table_id = ffi_info.table_id;
+    out.schema_id = ffi_info.schema_id;
+    out.created_time = ffi_info.created_time;
+    out.modified_time = ffi_info.modified_time;
+    out.num_buckets = ffi_info.num_buckets;
+    out.has_primary_key = ffi_info.has_primary_key;
+    out.is_partitioned = ffi_info.is_partitioned;
+
+    // String-bearing members are converted from rust::String to std::string.
+    out.table_path = TablePath{
+        std::string(ffi_info.table_path.database_name),
+        std::string(ffi_info.table_path.table_name)};
+    out.comment = std::string(ffi_info.comment);
+    out.schema = from_ffi_schema(ffi_info.schema);
+
+    for (const auto& key : ffi_info.primary_keys) {
+        out.primary_keys.emplace_back(std::string(key));
+    }
+    for (const auto& key : ffi_info.bucket_keys) {
+        out.bucket_keys.emplace_back(std::string(key));
+    }
+    for (const auto& key : ffi_info.partition_keys) {
+        out.partition_keys.emplace_back(std::string(key));
+    }
+
+    // If a property key appears more than once, the last value wins.
+    for (const auto& entry : ffi_info.properties) {
+        out.properties[std::string(entry.key)] = std::string(entry.value);
+    }
+
+    return out;
+}
+
+// Converts an FFI datum back into a C++ Datum; every payload slot is copied.
+inline Datum from_ffi_datum(const ffi::FfiDatum& ffi_datum) {
+    Datum datum;
+    datum.type = static_cast<DatumType>(ffi_datum.datum_type);
+    datum.bool_val = ffi_datum.bool_val;
+    datum.i32_val = ffi_datum.i32_val;
+    datum.i64_val = ffi_datum.i64_val;
+    datum.f32_val = ffi_datum.f32_val;
+    datum.f64_val = ffi_datum.f64_val;
+    // todo: avoid copy string
+    datum.string_val = std::string(ffi_datum.string_val);
+
+    // One range copy instead of a push_back (and possible reallocation) per byte.
+    datum.bytes_val.assign(ffi_datum.bytes_val.begin(), ffi_datum.bytes_val.end());
+
+    return datum;
+}
+
+inline GenericRow from_ffi_generic_row(const ffi::FfiGenericRow& ffi_row) {
+    GenericRow out;
+
+    for (const auto& ffi_datum : ffi_row.fields) {  // positions are preserved
+        out.fields.emplace_back(from_ffi_datum(ffi_datum));
+    }
+
+    return out;
+}
+
+inline ScanRecord from_ffi_scan_record(const ffi::FfiScanRecord& ffi_record) {
+    // Convert the nested row first, then bundle it with the record's
+    // offset and timestamp, which are copied verbatim.
+    GenericRow row = from_ffi_generic_row(ffi_record.row);
+    return ScanRecord{ffi_record.offset, ffi_record.timestamp, std::move(row)};
+}
+
+inline ScanRecords from_ffi_scan_records(const ffi::FfiScanRecords& ffi_records) {
+    ScanRecords records;
+    // Size the destination once so appending a whole batch never reallocates.
+    records.records.reserve(ffi_records.records.size());
+    for (const auto& record : ffi_records.records) {  // batch order is preserved
+        records.records.push_back(from_ffi_scan_record(record));
+    }
+    return records;
+}
+
+inline LakeSnapshot from_ffi_lake_snapshot(const ffi::FfiLakeSnapshot& ffi_snapshot) {
+    LakeSnapshot out;
+    out.snapshot_id = ffi_snapshot.snapshot_id;
+    for (const auto& ffi_offset : ffi_snapshot.bucket_offsets) {  // one entry per FFI offset, same order
+        BucketOffset entry;
+        entry.table_id = ffi_offset.table_id;
+        entry.partition_id = ffi_offset.partition_id;
+        entry.bucket_id = ffi_offset.bucket_id;
+        entry.offset = ffi_offset.offset;
+        out.bucket_offsets.push_back(entry);
+    }
+
+    return out;
+}
+
+}  // namespace utils
+}  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
new file mode 100644
index 0000000000..3e883e29c6
--- /dev/null
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -0,0 +1,523 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+mod types;
+
+use std::sync::{Arc, LazyLock};
+use std::time::Duration;
+
+use fluss as fcore;
+
+static RUNTIME: LazyLock<tokio::runtime::Runtime> = LazyLock::new(|| {
+    tokio::runtime::Builder::new_multi_thread() // shared by every blocking FFI entry point below
+        .enable_all()
+        .build()
+        .expect("failed to build the tokio runtime for the fluss C++ bindings")
+});
+
+#[cxx::bridge(namespace = "fluss::ffi")]
+mod ffi {
+    struct HashMapValue { // one key/value pair; maps cross the bridge as Vec<HashMapValue>
+        key: String,
+        value: String,
+    }
+
+    struct FfiResult { // error_code 0 means success (see ok_result)
+        error_code: i32,
+        error_message: String,
+    }
+
+    struct FfiTablePath {
+        database_name: String,
+        table_name: String,
+    }
+
+    struct FfiColumn {
+        name: String,
+        data_type: i32, // integer form of the C++ DataType enum
+        comment: String,
+    }
+
+    struct FfiSchema {
+        columns: Vec<FfiColumn>,
+        primary_keys: Vec<String>,
+    }
+
+    struct FfiTableDescriptor {
+        schema: FfiSchema,
+        partition_keys: Vec<String>,
+        bucket_count: i32,
+        bucket_keys: Vec<String>,
+        properties: Vec<HashMapValue>,
+        comment: String,
+    }
+
+    struct FfiTableInfo {
+        table_id: i64,
+        schema_id: i32,
+        table_path: FfiTablePath,
+        created_time: i64,
+        modified_time: i64,
+        primary_keys: Vec<String>,
+        bucket_keys: Vec<String>,
+        partition_keys: Vec<String>,
+        num_buckets: i32,
+        has_primary_key: bool,
+        is_partitioned: bool,
+        properties: Vec<HashMapValue>,
+        comment: String,
+        schema: FfiSchema,
+    }
+
+    struct FfiTableInfoResult { // `table_info` is a placeholder when `result` reports an error
+        result: FfiResult,
+        table_info: FfiTableInfo,
+    }
+
+    struct FfiDatum { // tagged value: `datum_type` is the integer form of the C++ DatumType enum
+        datum_type: i32,
+        bool_val: bool,
+        i32_val: i32,
+        i64_val: i64,
+        f32_val: f32,
+        f64_val: f64,
+        string_val: String,
+        bytes_val: Vec<u8>,
+    }
+
+    struct FfiGenericRow {
+        fields: Vec<FfiDatum>,
+    }
+
+    struct FfiScanRecord {
+        offset: i64,
+        timestamp: i64,
+        row: FfiGenericRow,
+    }
+
+    struct FfiScanRecords {
+        records: Vec<FfiScanRecord>,
+    }
+
+    struct FfiScanRecordsResult {
+        result: FfiResult,
+        scan_records: FfiScanRecords,
+    }
+
+    struct FfiLakeSnapshot {
+        snapshot_id: i64, // set to -1 in the error placeholder built by get_latest_lake_snapshot
+        bucket_offsets: Vec<FfiBucketOffset>,
+    }
+
+    struct FfiBucketOffset {
+        table_id: i64,
+        partition_id: i64,
+        bucket_id: i32,
+        offset: i64,
+    }
+
+    struct FfiLakeSnapshotResult {
+        result: FfiResult,
+        lake_snapshot: FfiLakeSnapshot,
+    }
+
+    extern "Rust" {
+        type Connection;
+        type Admin;
+        type Table;
+        type AppendWriter;
+        type LogScanner;
+
+        // Connection: constructors return raw pointers that C++ must pass to the matching delete_*
+        fn new_connection(bootstrap_server: &str) -> Result<*mut Connection>;
+        unsafe fn delete_connection(conn: *mut Connection);
+        fn get_admin(self: &Connection) -> Result<*mut Admin>;
+        fn get_table(self: &Connection, table_path: &FfiTablePath) -> Result<*mut Table>;
+
+        // Admin: operations report failures through FfiResult values instead of Result
+        unsafe fn delete_admin(admin: *mut Admin);
+        fn create_table(
+            self: &Admin,
+            table_path: &FfiTablePath,
+            descriptor: &FfiTableDescriptor,
+            ignore_if_exists: bool,
+        ) -> FfiResult;
+        fn get_table_info(self: &Admin, table_path: &FfiTablePath) -> FfiTableInfoResult;
+        fn get_latest_lake_snapshot(
+            self: &Admin,
+            table_path: &FfiTablePath,
+        ) -> FfiLakeSnapshotResult;
+
+        // Table: factories for writers/scanners plus read-only metadata accessors
+        unsafe fn delete_table(table: *mut Table);
+        fn new_append_writer(self: &Table) -> Result<*mut AppendWriter>;
+        fn new_log_scanner(self: &Table) -> Result<*mut LogScanner>;
+        fn new_log_scanner_with_projection(
+            self: &Table,
+            column_indices: Vec<usize>,
+        ) -> Result<*mut LogScanner>;
+        fn get_table_info_from_table(self: &Table) -> FfiTableInfo;
+        fn get_table_path(self: &Table) -> FfiTablePath;
+        fn has_primary_key(self: &Table) -> bool;
+
+        // AppendWriter: both operations take the writer by mutable reference
+        unsafe fn delete_append_writer(writer: *mut AppendWriter);
+        fn append(self: &mut AppendWriter, row: &FfiGenericRow) -> FfiResult;
+        fn flush(self: &mut AppendWriter) -> FfiResult;
+
+        // LogScanner: subscribe to a bucket at an offset, then poll with a millisecond timeout
+        unsafe fn delete_log_scanner(scanner: *mut LogScanner);
+        fn subscribe(self: &LogScanner, bucket_id: i32, start_offset: i64) -> FfiResult;
+        fn poll(self: &LogScanner, timeout_ms: i64) -> FfiScanRecordsResult;
+    }
+}
+
+pub struct Connection { // opaque handle boxed by new_connection and freed by delete_connection
+    inner: Arc<fcore::client::FlussConnection>, // cloned into every Table created by get_table
+    #[allow(dead_code)]
+    metadata: Option<Arc<fcore::client::Metadata>>, // new_connection always stores None here
+}
+
+pub struct Admin { // opaque handle boxed by Connection::get_admin and freed by delete_admin
+    inner: fcore::client::FlussAdmin,
+}
+
+pub struct Table { // snapshot taken by Connection::get_table; freed by delete_table
+    connection: Arc<fcore::client::FlussConnection>, // shared with the originating Connection
+    metadata: Arc<fcore::client::Metadata>,
+    table_info: fcore::metadata::TableInfo,
+    table_path: fcore::metadata::TablePath,
+    has_pk: bool, // captured from has_primary_key() when the table was looked up
+}
+
+pub struct AppendWriter { // opaque handle boxed by Table::new_append_writer
+    inner: fcore::client::AppendWriter,
+}
+
+pub struct LogScanner { // opaque handle exposed to C++ through the bridge's LogScanner type
+    inner: fcore::client::LogScanner,
+}
+
+fn ok_result() -> ffi::FfiResult {
+    // Success is encoded as code 0 with an empty message.
+    let error_code = 0;
+    let error_message = String::new();
+    ffi::FfiResult { error_code, error_message }
+}
+
+fn err_result(code: i32, msg: String) -> ffi::FfiResult {
+    // Failure result: the code and message are passed through unchanged.
+    // Rebinding to the field names lets the struct use init shorthand.
+    let (error_code, error_message) = (code, msg);
+    ffi::FfiResult { error_code, error_message }
+}
+
+// Connection implementation
+fn new_connection(bootstrap_server: &str) -> Result<*mut Connection, String> {
+    let config = fcore::config::Config {
+        bootstrap_server: Some(bootstrap_server.to_owned()),
+        ..Default::default()
+    };
+
+    // Block the calling (C++) thread on the shared runtime until the
+    // connection attempt has finished one way or the other.
+    let connected = RUNTIME.block_on(async { fcore::client::FlussConnection::new(config).await });
+
+    connected
+        .map(|c| {
+            Box::into_raw(Box::new(Connection {
+                inner: Arc::new(c),
+                metadata: None,
+            }))
+        })
+        .map_err(|e| format!("Failed to connect: {}", e))
+}
+
+unsafe fn delete_connection(conn: *mut Connection) {
+    if conn.is_null() {
+        return;
+    }
+    // SAFETY: the caller must pass a pointer obtained from new_connection that was not freed yet.
+    drop(unsafe { Box::from_raw(conn) });
+}
+
+impl Connection {
+    // Creates an Admin on the shared runtime and hands it to C++ as a raw
+    // pointer; that pointer must eventually be released through delete_admin.
+    fn get_admin(&self) -> Result<*mut Admin, String> {
+        let admin = RUNTIME
+            .block_on(async { self.inner.get_admin().await })
+            .map_err(|e| format!("Failed to get admin: {}", e))?;
+
+        Ok(Box::into_raw(Box::new(Admin { inner: admin })))
+    }
+
+    // Looks the table up once and copies its metadata, info, path and
+    // primary-key flag into a boxed Table handed to C++ as a raw pointer;
+    // that pointer must eventually be released through delete_table.
+    fn get_table(&self, table_path: &ffi::FfiTablePath) -> Result<*mut Table, String> {
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+
+        let found = RUNTIME
+            .block_on(async { self.inner.get_table(&path).await })
+            .map_err(|e| format!("Failed to get table: {}", e))?;
+
+        // The handle keeps its own Arc to the connection, so it does not
+        // borrow from this Connection wrapper.
+        let handle = Table {
+            connection: self.inner.clone(),
+            metadata: found.metadata().clone(),
+            table_info: found.table_info().clone(),
+            table_path: found.table_path().clone(),
+            has_pk: found.has_primary_key(),
+        };
+        Ok(Box::into_raw(Box::new(handle)))
+    }
+}
+
+// Admin implementation
+unsafe fn delete_admin(admin: *mut Admin) {
+    if admin.is_null() {
+        return;
+    }
+    // SAFETY: the caller must pass a pointer obtained from get_admin that was not freed yet.
+    drop(unsafe { Box::from_raw(admin) });
+}
+
+impl Admin {
+    fn create_table( // blocks on the shared runtime; never panics on RPC failure, returns an FfiResult
+        &self,
+        table_path: &ffi::FfiTablePath,
+        descriptor: &ffi::FfiTableDescriptor,
+        ignore_if_exists: bool,
+    ) -> ffi::FfiResult {
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+
+        let core_descriptor = match types::ffi_descriptor_to_core(descriptor) {
+            Ok(d) => d,
+            Err(e) => return err_result(1, e.to_string()), // code 1: descriptor conversion failed
+        };
+
+        let result = RUNTIME.block_on(async {
+            self.inner
+                .create_table(&path, &core_descriptor, ignore_if_exists)
+                .await
+        });
+
+        match result {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(2, e.to_string()), // code 2: the create_table call itself failed
+        }
+    }
+
+    fn get_table_info(&self, table_path: &ffi::FfiTablePath) -> ffi::FfiTableInfoResult {
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+
+        let result = RUNTIME.block_on(async { self.inner.get_table(&path).await });
+
+        match result {
+            Ok(info) => ffi::FfiTableInfoResult {
+                result: ok_result(),
+                table_info: types::core_table_info_to_ffi(&info),
+            },
+            Err(e) => ffi::FfiTableInfoResult {
+                result: err_result(1, e.to_string()),
+                table_info: types::empty_table_info(), // placeholder so the struct is fully populated
+            },
+        }
+    }
+
+    fn get_latest_lake_snapshot(
+        &self,
+        table_path: &ffi::FfiTablePath,
+    ) -> ffi::FfiLakeSnapshotResult {
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+
+        let result = RUNTIME.block_on(async { self.inner.get_latest_lake_snapshot(&path).await });
+
+        match result {
+            Ok(snapshot) => ffi::FfiLakeSnapshotResult {
+                result: ok_result(),
+                lake_snapshot: types::core_lake_snapshot_to_ffi(&snapshot),
+            },
+            Err(e) => ffi::FfiLakeSnapshotResult {
+                result: err_result(1, e.to_string()),
+                lake_snapshot: ffi::FfiLakeSnapshot {
+                    snapshot_id: -1, // placeholder id accompanying the error result
+                    bucket_offsets: vec![],
+                },
+            },
+        }
+    }
+}
+
+// Table implementation
+unsafe fn delete_table(table: *mut Table) {
+    if !table.is_null() {
+        unsafe {
+            drop(Box::from_raw(table));
+        }
+    }
+}
+
+impl Table {
+    fn new_append_writer(&self) -> Result<*mut AppendWriter, String> {
+        let _enter = RUNTIME.enter();
+
+        let fluss_table = fcore::client::FlussTable::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        );
+
+        let table_append = match fluss_table.new_append() {
+            Ok(a) => a,
+            Err(e) => return Err(format!("Failed to create append: {}", e)),
+        };
+
+        let writer = table_append.create_writer();
+        let writer = Box::into_raw(Box::new(AppendWriter { inner: writer }));
+        Ok(writer)
+    }
+
+    fn new_log_scanner(&self) -> Result<*mut LogScanner, String> {
+        let fluss_table = fcore::client::FlussTable::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        );
+        // NOTE(review): new_append_writer enters RUNTIME first; confirm it is not needed here.
+        let scanner = fluss_table.new_scan().create_log_scanner();
+        let scanner = Box::into_raw(Box::new(LogScanner { inner: scanner })); // freed by delete_log_scanner
+        Ok(scanner)
+    }
+
+    fn new_log_scanner_with_projection(
+        &self,
+        column_indices: Vec<usize>,
+    ) -> Result<*mut LogScanner, String> {
+        let fluss_table = fcore::client::FlussTable::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        );
+
+        let scan = fluss_table.new_scan();
+        let scan = match scan.project(&column_indices) {
+            Ok(s) => s,
+            Err(e) => return Err(format!("Failed to project columns: {}", e)),
+        };
+        let scanner = scan.create_log_scanner();
+        let scanner = Box::into_raw(Box::new(LogScanner { inner: scanner }));
+        Ok(scanner)
+    }
+
+    fn get_table_info_from_table(&self) -> ffi::FfiTableInfo {
+        types::core_table_info_to_ffi(&self.table_info)
+    }
+
+    fn get_table_path(&self) -> ffi::FfiTablePath {
+        ffi::FfiTablePath {
+            database_name: self.table_path.database().to_string(),
+            table_name: self.table_path.table().to_string(),
+        }
+    }
+
+    fn has_primary_key(&self) -> bool {
+        self.has_pk
+    }
+}
+
+// AppendWriter implementation
+unsafe fn delete_append_writer(writer: *mut AppendWriter) {
+    if !writer.is_null() {
+        unsafe {
+            drop(Box::from_raw(writer));
+        }
+    }
+}
+
+impl AppendWriter {
+    fn append(&mut self, row: &ffi::FfiGenericRow) -> ffi::FfiResult {
+        let generic_row = types::ffi_row_to_core(row);
+
+        let result = RUNTIME.block_on(async { self.inner.append(generic_row).await });
+
+        match result {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
+
+    fn flush(&mut self) -> ffi::FfiResult {
+        let result = RUNTIME.block_on(async { self.inner.flush().await });
+
+        match result {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
+}
+
+// LogScanner implementation
+unsafe fn delete_log_scanner(scanner: *mut LogScanner) {
+    if !scanner.is_null() {
+        unsafe {
+            drop(Box::from_raw(scanner));
+        }
+    }
+}
+
+impl LogScanner {
+    fn subscribe(&self, bucket_id: i32, start_offset: i64) -> ffi::FfiResult {
+        let result =
+            RUNTIME.block_on(async { self.inner.subscribe(bucket_id, start_offset).await });
+
+        match result {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
+
+    fn poll(&self, timeout_ms: i64) -> ffi::FfiScanRecordsResult {
+        let timeout = Duration::from_millis(timeout_ms as u64);
+        let result = RUNTIME.block_on(async { self.inner.poll(timeout).await });
+
+        match result {
+            Ok(records) => ffi::FfiScanRecordsResult {
+                result: ok_result(),
+                scan_records: types::core_scan_records_to_ffi(&records),
+            },
+            Err(e) => ffi::FfiScanRecordsResult {
+                result: err_result(1, e.to_string()),
+                scan_records: ffi::FfiScanRecords { records: vec![] },
+            },
+        }
+    }
+}
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
new file mode 100644
index 0000000000..b28b783ee8
--- /dev/null
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -0,0 +1,228 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include "fluss.hpp"
+#include "lib.rs.h"
+#include "ffi_converter.hpp"
+#include "rust/cxx.h"
+
+namespace fluss {
+
+Table::Table() noexcept = default;
+
+Table::Table(ffi::Table* table) noexcept : table_(table) {}
+
+Table::~Table() noexcept { Destroy(); }
+
+void Table::Destroy() noexcept {
+    if (table_) {
+        ffi::delete_table(table_);
+        table_ = nullptr;
+    }
+}
+
+Table::Table(Table&& other) noexcept : table_(other.table_) {
+    other.table_ = nullptr;
+}
+
+Table& Table::operator=(Table&& other) noexcept {
+    if (this != &other) {
+        Destroy();
+        table_ = other.table_;
+        other.table_ = nullptr;
+    }
+    return *this;
+}
+
+bool Table::Available() const { return table_ != nullptr; }
+
+// Creates an append writer for this table and stores it in `out`.
+// Returns error code 1 if the table is unavailable or creation fails.
+Result Table::NewAppendWriter(AppendWriter& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Table not available");
+    }
+    try {
+        // Move-assign so a writer already held by `out` is destroyed, not leaked.
+        out = AppendWriter(table_->new_append_writer());
+        return utils::make_ok();
+    } catch (const std::exception& e) {  // also covers rust::Error
+        return utils::make_error(1, e.what());
+    }
+}
+
+// Creates a log scanner for this table and stores it in `out`.
+// Returns error code 1 if the table is unavailable or creation fails.
+Result Table::NewLogScanner(LogScanner& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Table not available");
+    }
+    try {
+        // Move-assign so a scanner already held by `out` is destroyed, not leaked.
+        out = LogScanner(table_->new_log_scanner());
+        return utils::make_ok();
+    } catch (const std::exception& e) {  // also covers rust::Error
+        return utils::make_error(1, e.what());
+    }
+}
+
+// Creates a log scanner restricted to `column_indices` and stores it in `out`.
+// Returns error code 1 if the table is unavailable or creation fails.
+Result Table::NewLogScannerWithProjection(const std::vector<size_t>& column_indices, LogScanner& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Table not available");
+    }
+    try {
+        rust::Vec<size_t> rust_indices;
+        for (size_t idx : column_indices) {
+            rust_indices.push_back(idx);
+        }
+        // Move-assign so a scanner already held by `out` is destroyed, not leaked.
+        out = LogScanner(table_->new_log_scanner_with_projection(std::move(rust_indices)));
+        return utils::make_ok();
+    } catch (const std::exception& e) {  // also covers rust::Error
+        return utils::make_error(1, e.what());
+    }
+}
+
+TableInfo Table::GetTableInfo() const {
+    if (!Available()) {
+        return TableInfo{};
+    }
+    auto ffi_info = table_->get_table_info_from_table();
+    return utils::from_ffi_table_info(ffi_info);
+}
+
+TablePath Table::GetTablePath() const {
+    if (!Available()) {
+        return TablePath{};
+    }
+    auto ffi_path = table_->get_table_path();
+    return TablePath{std::string(ffi_path.database_name), std::string(ffi_path.table_name)};
+}
+
+bool Table::HasPrimaryKey() const {
+    if (!Available()) {
+        return false;
+    }
+    return table_->has_primary_key();
+}
+
+// AppendWriter implementation
+AppendWriter::AppendWriter() noexcept = default;
+
+AppendWriter::AppendWriter(ffi::AppendWriter* writer) noexcept : writer_(writer) {}
+
+AppendWriter::~AppendWriter() noexcept { Destroy(); }
+
+void AppendWriter::Destroy() noexcept {
+    if (writer_) {
+        ffi::delete_append_writer(writer_);
+        writer_ = nullptr;
+    }
+}
+
+AppendWriter::AppendWriter(AppendWriter&& other) noexcept : writer_(other.writer_) {
+    other.writer_ = nullptr;
+}
+
+AppendWriter& AppendWriter::operator=(AppendWriter&& other) noexcept {
+    if (this != &other) {
+        Destroy();
+        writer_ = other.writer_;
+        other.writer_ = nullptr;
+    }
+    return *this;
+}
+
+bool AppendWriter::Available() const { return writer_ != nullptr; }
+
+Result AppendWriter::Append(const GenericRow& row) {
+    if (!Available()) {
+        return utils::make_error(1, "AppendWriter not available");
+    }
+
+    auto ffi_row = utils::to_ffi_generic_row(row);
+    auto ffi_result = writer_->append(ffi_row);
+    return utils::from_ffi_result(ffi_result);
+}
+
+Result AppendWriter::Flush() {
+    if (!Available()) {
+        return utils::make_error(1, "AppendWriter not available");
+    }
+
+    auto ffi_result = writer_->flush();
+    return utils::from_ffi_result(ffi_result);
+}
+
+// LogScanner implementation
+LogScanner::LogScanner() noexcept = default;
+
+LogScanner::LogScanner(ffi::LogScanner* scanner) noexcept : scanner_(scanner) {}
+
+LogScanner::~LogScanner() noexcept { Destroy(); }
+
+void LogScanner::Destroy() noexcept {
+    if (scanner_) {
+        ffi::delete_log_scanner(scanner_);
+        scanner_ = nullptr;
+    }
+}
+
+LogScanner::LogScanner(LogScanner&& other) noexcept : scanner_(other.scanner_) {
+    other.scanner_ = nullptr;
+}
+
+LogScanner& LogScanner::operator=(LogScanner&& other) noexcept {
+    if (this != &other) {
+        Destroy();
+        scanner_ = other.scanner_;
+        other.scanner_ = nullptr;
+    }
+    return *this;
+}
+
+bool LogScanner::Available() const { return scanner_ != nullptr; }
+
+Result LogScanner::Subscribe(int32_t bucket_id, int64_t start_offset) {
+    if (!Available()) {
+        return utils::make_error(1, "LogScanner not available");
+    }
+
+    auto ffi_result = scanner_->subscribe(bucket_id, start_offset);
+    return utils::from_ffi_result(ffi_result);
+}
+
+Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
+    if (!Available()) {
+        return utils::make_error(1, "LogScanner not available");
+    }
+
+    auto ffi_result = scanner_->poll(timeout_ms);
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (!result.Ok()) {
+        return result;
+    }
+
+    out = utils::from_ffi_scan_records(ffi_result.scan_records);
+    return utils::make_ok();
+}
+
+}  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
new file mode 100644
index 0000000000..d3bab38abe
--- /dev/null
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -0,0 +1,485 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::ffi;
+use anyhow::{Result, anyhow};
+use arrow::array::{
+    Date32Array, LargeBinaryArray, LargeStringArray, Time32MillisecondArray, Time32SecondArray,
+    Time64MicrosecondArray, Time64NanosecondArray, TimestampMicrosecondArray,
+    TimestampMillisecondArray, TimestampNanosecondArray, TimestampSecondArray,
+};
+use arrow::datatypes::{DataType as ArrowDataType, TimeUnit};
+use fcore::row::InternalRow;
+use fluss as fcore;
+
+pub const DATA_TYPE_BOOLEAN: i32 = 1;
+pub const DATA_TYPE_TINYINT: i32 = 2;
+pub const DATA_TYPE_SMALLINT: i32 = 3;
+pub const DATA_TYPE_INT: i32 = 4;
+pub const DATA_TYPE_BIGINT: i32 = 5;
+pub const DATA_TYPE_FLOAT: i32 = 6;
+pub const DATA_TYPE_DOUBLE: i32 = 7;
+pub const DATA_TYPE_STRING: i32 = 8;
+pub const DATA_TYPE_BYTES: i32 = 9;
+pub const DATA_TYPE_DATE: i32 = 10;
+pub const DATA_TYPE_TIME: i32 = 11;
+pub const DATA_TYPE_TIMESTAMP: i32 = 12;
+pub const DATA_TYPE_TIMESTAMP_LTZ: i32 = 13;
+
+pub const DATUM_TYPE_NULL: i32 = 0;
+pub const DATUM_TYPE_BOOL: i32 = 1;
+pub const DATUM_TYPE_INT32: i32 = 2;
+pub const DATUM_TYPE_INT64: i32 = 3;
+pub const DATUM_TYPE_FLOAT32: i32 = 4;
+pub const DATUM_TYPE_FLOAT64: i32 = 5;
+pub const DATUM_TYPE_STRING: i32 = 6;
+pub const DATUM_TYPE_BYTES: i32 = 7;
+
+fn ffi_data_type_to_core(dt: i32) -> Result<fcore::metadata::DataType> {
+    match dt {
+        DATA_TYPE_BOOLEAN => Ok(fcore::metadata::DataTypes::boolean()),
+        DATA_TYPE_TINYINT => Ok(fcore::metadata::DataTypes::tinyint()),
+        DATA_TYPE_SMALLINT => Ok(fcore::metadata::DataTypes::smallint()),
+        DATA_TYPE_INT => Ok(fcore::metadata::DataTypes::int()),
+        DATA_TYPE_BIGINT => Ok(fcore::metadata::DataTypes::bigint()),
+        DATA_TYPE_FLOAT => Ok(fcore::metadata::DataTypes::float()),
+        DATA_TYPE_DOUBLE => Ok(fcore::metadata::DataTypes::double()),
+        DATA_TYPE_STRING => Ok(fcore::metadata::DataTypes::string()),
+        DATA_TYPE_BYTES => Ok(fcore::metadata::DataTypes::bytes()),
+        DATA_TYPE_DATE => Ok(fcore::metadata::DataTypes::date()),
+        DATA_TYPE_TIME => Ok(fcore::metadata::DataTypes::time()),
+        DATA_TYPE_TIMESTAMP => Ok(fcore::metadata::DataTypes::timestamp()),
+        DATA_TYPE_TIMESTAMP_LTZ => Ok(fcore::metadata::DataTypes::timestamp_ltz()),
+        _ => Err(anyhow!("Unknown data type: {}", dt)),
+    }
+}
+
+fn core_data_type_to_ffi(dt: &fcore::metadata::DataType) -> i32 {
+    match dt {
+        fcore::metadata::DataType::Boolean(_) => DATA_TYPE_BOOLEAN,
+        fcore::metadata::DataType::TinyInt(_) => DATA_TYPE_TINYINT,
+        fcore::metadata::DataType::SmallInt(_) => DATA_TYPE_SMALLINT,
+        fcore::metadata::DataType::Int(_) => DATA_TYPE_INT,
+        fcore::metadata::DataType::BigInt(_) => DATA_TYPE_BIGINT,
+        fcore::metadata::DataType::Float(_) => DATA_TYPE_FLOAT,
+        fcore::metadata::DataType::Double(_) => DATA_TYPE_DOUBLE,
+        fcore::metadata::DataType::String(_) => DATA_TYPE_STRING,
+        fcore::metadata::DataType::Bytes(_) => DATA_TYPE_BYTES,
+        fcore::metadata::DataType::Date(_) => DATA_TYPE_DATE,
+        fcore::metadata::DataType::Time(_) => DATA_TYPE_TIME,
+        fcore::metadata::DataType::Timestamp(_) => DATA_TYPE_TIMESTAMP,
+        fcore::metadata::DataType::TimestampLTz(_) => DATA_TYPE_TIMESTAMP_LTZ,
+        _ => 0, // NOTE(review): 0 matches no DATA_TYPE_* constant; ffi_data_type_to_core rejects it
+    }
+}
+
+pub fn ffi_descriptor_to_core(
+    descriptor: &ffi::FfiTableDescriptor,
+) -> Result<fcore::metadata::TableDescriptor> {
+    let mut schema_builder = fcore::metadata::Schema::builder();
+
+    for col in &descriptor.schema.columns {
+        let dt = ffi_data_type_to_core(col.data_type)?;
+        schema_builder = schema_builder.column(&col.name, dt);
+        if !col.comment.is_empty() {
+            schema_builder = schema_builder.with_comment(&col.comment);
+        }
+    }
+
+    if !descriptor.schema.primary_keys.is_empty() {
+        schema_builder = schema_builder.primary_key(descriptor.schema.primary_keys.clone());
+    }
+
+    let schema = schema_builder.build()?;
+
+    let mut builder = fcore::metadata::TableDescriptor::builder()
+        .schema(schema)
+        .partitioned_by(descriptor.partition_keys.clone());
+
+    if descriptor.bucket_count > 0 {
+        builder = builder.distributed_by(
+            Some(descriptor.bucket_count),
+            descriptor.bucket_keys.clone(),
+        );
+    } else {
+        builder = builder.distributed_by(None, descriptor.bucket_keys.clone());
+    }
+
+    for prop in &descriptor.properties {
+        builder = builder.property(&prop.key, &prop.value);
+    }
+
+    if !descriptor.comment.is_empty() {
+        builder = builder.comment(&descriptor.comment);
+    }
+
+    Ok(builder.build()?)
+}
+
+pub fn core_table_info_to_ffi(info: &fcore::metadata::TableInfo) -> ffi::FfiTableInfo {
+    let schema = info.get_schema();
+    let columns: Vec<ffi::FfiColumn> = schema
+        .columns()
+        .iter()
+        .map(|col| ffi::FfiColumn {
+            name: col.name().to_string(),
+            data_type: core_data_type_to_ffi(col.data_type()),
+            comment: col.comment().unwrap_or("").to_string(),
+        })
+        .collect();
+
+    let primary_keys: Vec<String> = schema
+        .primary_key()
+        .map(|pk| pk.column_names().to_vec())
+        .unwrap_or_default();
+
+    let properties: Vec<ffi::HashMapValue> = info
+        .get_properties()
+        .iter()
+        .map(|(k, v)| ffi::HashMapValue {
+            key: k.clone(),
+            value: v.clone(),
+        })
+        .collect();
+
+    ffi::FfiTableInfo {
+        table_id: info.get_table_id(),
+        schema_id: info.get_schema_id(),
+        table_path: ffi::FfiTablePath {
+            database_name: info.get_table_path().database().to_string(),
+            table_name: info.get_table_path().table().to_string(),
+        },
+        created_time: info.get_created_time(),
+        modified_time: info.get_modified_time(),
+        primary_keys: info.get_primary_keys().clone(),
+        bucket_keys: info.get_bucket_keys().to_vec(),
+        partition_keys: info.get_partition_keys().to_vec(),
+        num_buckets: info.get_num_buckets(),
+        has_primary_key: info.has_primary_key(),
+        is_partitioned: info.is_partitioned(),
+        properties,
+        comment: info.get_comment().unwrap_or("").to_string(),
+        schema: ffi::FfiSchema {
+            columns,
+            primary_keys,
+        },
+    }
+}
+
+pub fn empty_table_info() -> ffi::FfiTableInfo {
+    ffi::FfiTableInfo {
+        table_id: 0,
+        schema_id: 0,
+        table_path: ffi::FfiTablePath {
+            database_name: String::new(),
+            table_name: String::new(),
+        },
+        created_time: 0,
+        modified_time: 0,
+        primary_keys: vec![],
+        bucket_keys: vec![],
+        partition_keys: vec![],
+        num_buckets: 0,
+        has_primary_key: false,
+        is_partitioned: false,
+        properties: vec![],
+        comment: String::new(),
+        schema: ffi::FfiSchema {
+            columns: vec![],
+            primary_keys: vec![],
+        },
+    }
+}
+
+pub fn ffi_row_to_core(row: &ffi::FfiGenericRow) -> fcore::row::GenericRow<'_> {
+    use fcore::row::Datum;
+
+    let mut generic_row = fcore::row::GenericRow::new();
+
+    for (idx, field) in row.fields.iter().enumerate() {
+        let datum = match field.datum_type {
+            DATUM_TYPE_NULL => Datum::Null,
+            DATUM_TYPE_BOOL => Datum::Bool(field.bool_val),
+            DATUM_TYPE_INT32 => Datum::Int32(field.i32_val),
+            DATUM_TYPE_INT64 => Datum::Int64(field.i64_val),
+            DATUM_TYPE_FLOAT32 => Datum::Float32(field.f32_val.into()),
+            DATUM_TYPE_FLOAT64 => Datum::Float64(field.f64_val.into()),
+            DATUM_TYPE_STRING => Datum::String(field.string_val.as_str()), // borrows from `row`
+            // todo: avoid copy bytes for blob
+            DATUM_TYPE_BYTES => Datum::Blob(field.bytes_val.clone().into()),
+            _ => Datum::Null, // NOTE(review): an unknown datum_type is silently written as Null
+        };
+        generic_row.set_field(idx, datum);
+    }
+
+    generic_row
+}
+
+pub fn core_scan_records_to_ffi(records: &fcore::record::ScanRecords) -> ffi::FfiScanRecords {
+    let mut ffi_records = Vec::new();
+
+    // Iterate over all buckets and their records
+    for bucket_records in records.records_by_buckets().values() {
+        for record in bucket_records {
+            let row = record.row();
+            let fields = core_row_to_ffi_fields(row);
+
+            ffi_records.push(ffi::FfiScanRecord {
+                offset: record.offset(),
+                timestamp: record.timestamp(),
+                row: ffi::FfiGenericRow { fields },
+            });
+        }
+    }
+
+    ffi::FfiScanRecords {
+        records: ffi_records,
+    }
+}
+
+fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
+    fn new_datum(datum_type: i32) -> ffi::FfiDatum {
+        ffi::FfiDatum {
+            datum_type,
+            bool_val: false,
+            i32_val: 0,
+            i64_val: 0,
+            f32_val: 0.0,
+            f64_val: 0.0,
+            string_val: String::new(),
+            bytes_val: vec![],
+        }
+    }
+
+    let record_batch = row.get_record_batch();
+    let schema = record_batch.schema();
+    let row_id = row.get_row_id();
+
+    let mut fields = Vec::with_capacity(schema.fields().len());
+
+    for (i, field) in schema.fields().iter().enumerate() {
+        if row.is_null_at(i) {
+            fields.push(new_datum(DATUM_TYPE_NULL));
+            continue;
+        }
+
+        let datum = match field.data_type() {
+            ArrowDataType::Boolean => {
+                let mut datum = new_datum(DATUM_TYPE_BOOL);
+                datum.bool_val = row.get_boolean(i);
+                datum
+            }
+            ArrowDataType::Int8 => {
+                let mut datum = new_datum(DATUM_TYPE_INT32);
+                datum.i32_val = row.get_byte(i) as i32;
+                datum
+            }
+            ArrowDataType::Int16 => {
+                let mut datum = new_datum(DATUM_TYPE_INT32);
+                datum.i32_val = row.get_short(i) as i32;
+                datum
+            }
+            ArrowDataType::Int32 => {
+                let mut datum = new_datum(DATUM_TYPE_INT32);
+                datum.i32_val = row.get_int(i);
+                datum
+            }
+            ArrowDataType::Int64 => {
+                let mut datum = new_datum(DATUM_TYPE_INT64);
+                datum.i64_val = row.get_long(i);
+                datum
+            }
+            ArrowDataType::Float32 => {
+                let mut datum = new_datum(DATUM_TYPE_FLOAT32);
+                datum.f32_val = row.get_float(i);
+                datum
+            }
+            ArrowDataType::Float64 => {
+                let mut datum = new_datum(DATUM_TYPE_FLOAT64);
+                datum.f64_val = row.get_double(i);
+                datum
+            }
+            ArrowDataType::Utf8 => {
+                let mut datum = new_datum(DATUM_TYPE_STRING);
+                // todo: avoid copy string
+                datum.string_val = row.get_string(i).to_string();
+                datum
+            }
+            ArrowDataType::LargeUtf8 => {
+                let array = record_batch
+                    .column(i)
+                    .as_any()
+                    .downcast_ref::<LargeStringArray>()
+                    .expect("LargeUtf8 column expected");
+                let mut datum = new_datum(DATUM_TYPE_STRING);
+                datum.string_val = array.value(row_id).to_string();
+                datum
+            }
+            ArrowDataType::Binary => {
+                let mut datum = new_datum(DATUM_TYPE_BYTES);
+                // todo: avoid copy bytes for blob
+                datum.bytes_val = row.get_bytes(i);
+                datum
+            }
+            ArrowDataType::FixedSizeBinary(len) => {
+                let mut datum = new_datum(DATUM_TYPE_BYTES);
+                datum.bytes_val = row.get_binary(i, *len as usize);
+                datum
+            }
+            ArrowDataType::LargeBinary => {
+                let array = record_batch
+                    .column(i)
+                    .as_any()
+                    .downcast_ref::<LargeBinaryArray>()
+                    .expect("LargeBinary column expected");
+                let mut datum = new_datum(DATUM_TYPE_BYTES);
+                datum.bytes_val = array.value(row_id).to_vec();
+                datum
+            }
+            ArrowDataType::Date32 => {
+                let array = record_batch
+                    .column(i)
+                    .as_any()
+                    .downcast_ref::<Date32Array>()
+                    .expect("Date32 column expected");
+                let mut datum = new_datum(DATUM_TYPE_INT32);
+                datum.i32_val = array.value(row_id);
+                datum
+            }
+            ArrowDataType::Timestamp(unit, _) => match unit {
+                TimeUnit::Second => {
+                    let array = record_batch
+                        .column(i)
+                        .as_any()
+                        .downcast_ref::<TimestampSecondArray>()
+                        .expect("Timestamp(second) column expected");
+                    let mut datum = new_datum(DATUM_TYPE_INT64);
+                    datum.i64_val = array.value(row_id);
+                    datum
+                }
+                TimeUnit::Millisecond => {
+                    let array = record_batch
+                        .column(i)
+                        .as_any()
+                        .downcast_ref::<TimestampMillisecondArray>()
+                        .expect("Timestamp(millisecond) column expected");
+                    let mut datum = new_datum(DATUM_TYPE_INT64);
+                    datum.i64_val = array.value(row_id);
+                    datum
+                }
+                TimeUnit::Microsecond => {
+                    let array = record_batch
+                        .column(i)
+                        .as_any()
+                        .downcast_ref::<TimestampMicrosecondArray>()
+                        .expect("Timestamp(microsecond) column expected");
+                    let mut datum = new_datum(DATUM_TYPE_INT64);
+                    datum.i64_val = array.value(row_id);
+                    datum
+                }
+                TimeUnit::Nanosecond => {
+                    let array = record_batch
+                        .column(i)
+                        .as_any()
+                        .downcast_ref::<TimestampNanosecondArray>()
+                        .expect("Timestamp(nanosecond) column expected");
+                    let mut datum = new_datum(DATUM_TYPE_INT64);
+                    datum.i64_val = array.value(row_id);
+                    datum
+                }
+            },
+            ArrowDataType::Time32(unit) => match unit {
+                TimeUnit::Second => {
+                    let array = record_batch
+                        .column(i)
+                        .as_any()
+                        .downcast_ref::<Time32SecondArray>()
+                        .expect("Time32(second) column expected");
+                    let mut datum = new_datum(DATUM_TYPE_INT32);
+                    datum.i32_val = array.value(row_id);
+                    datum
+                }
+                TimeUnit::Millisecond => {
+                    let array = record_batch
+                        .column(i)
+                        .as_any()
+                        .downcast_ref::<Time32MillisecondArray>()
+                        .expect("Time32(millisecond) column expected");
+                    let mut datum = new_datum(DATUM_TYPE_INT32);
+                    datum.i32_val = array.value(row_id);
+                    datum
+                }
+                _ => panic!(
+                    "Will never come here. Unsupported Time32 unit for column {}",
+                    i
+                ),
+            },
+            ArrowDataType::Time64(unit) => match unit {
+                TimeUnit::Microsecond => {
+                    let array = record_batch
+                        .column(i)
+                        .as_any()
+                        .downcast_ref::<Time64MicrosecondArray>()
+                        .expect("Time64(microsecond) column expected");
+                    let mut datum = new_datum(DATUM_TYPE_INT64);
+                    datum.i64_val = array.value(row_id);
+                    datum
+                }
+                TimeUnit::Nanosecond => {
+                    let array = record_batch
+                        .column(i)
+                        .as_any()
+                        .downcast_ref::<Time64NanosecondArray>()
+                        .expect("Time64(nanosecond) column expected");
+                    let mut datum = new_datum(DATUM_TYPE_INT64);
+                    datum.i64_val = array.value(row_id);
+                    datum
+                }
+                _ => panic!(
+                    "Will never come here. Unsupported Time64 unit for column {}",
+                    i
+                ),
+            },
+            other => panic!(
+                "Will never come here. Unsupported Arrow data type for column {}: {:?}",
+                i, other
+            ),
+        };
+
+        fields.push(datum);
+    }
+
+    fields
+}
+
+pub fn core_lake_snapshot_to_ffi(snapshot: &fcore::metadata::LakeSnapshot) -> ffi::FfiLakeSnapshot {
+    let bucket_offsets: Vec<ffi::FfiBucketOffset> = snapshot
+        .table_buckets_offset
+        .iter()
+        .map(|(bucket, offset)| ffi::FfiBucketOffset {
+            table_id: bucket.table_id(),
+            partition_id: bucket.partition_id().unwrap_or(-1), // -1 when the bucket has no partition id
+            bucket_id: bucket.bucket_id(),
+            offset: *offset,
+        })
+        .collect();
+
+    ffi::FfiLakeSnapshot {
+        snapshot_id: snapshot.snapshot_id,
+        bucket_offsets,
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 08574965f4..92f600e62a 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -18,7 +18,7 @@
 use clap::Parser;
 use serde::{Deserialize, Serialize};
 
-#[derive(Parser, Debug, Clone, Deserialize, Serialize, Default)]
+#[derive(Parser, Debug, Clone, Deserialize, Serialize)]
 #[command(author, version, about, long_about = None)]
 pub struct Config {
     #[arg(long)]
@@ -37,3 +37,15 @@ pub struct Config {
     #[arg(long, default_value_t = 2 * 1024 * 1024)]
     pub writer_batch_size: i32,
 }
+
+impl Default for Config { // hand-written: a derived Default would zero/empty the fields below
+    fn default() -> Self {
+        Self {
+            bootstrap_server: None,
+            request_max_size: 10 * 1024 * 1024, // 10 * 2^20 = 10_485_760
+            writer_acks: String::from("all"),
+            writer_retries: i32::MAX,
+            writer_batch_size: 2 * 1024 * 1024, // matches the clap default_value_t on this field
+        }
+    }
+}

From 8e273a801b9f157102b64a0e1910a03b058673e1 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sat, 13 Dec 2025 15:17:44 +0800
Subject: [PATCH 030/287] chore: update readme to mark it as official rust
 client (#88)

---
 fluss-rust/README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fluss-rust/README.md b/fluss-rust/README.md
index 6caaebb154..ee9478c6a5 100644
--- a/fluss-rust/README.md
+++ b/fluss-rust/README.md
@@ -28,7 +28,7 @@ Rust implementation of [Apache Fluss™](https://fluss.apache.org/).
 It bridges the gap between streaming data and the data Lakehouse by enabling low-latency, high-throughput data ingestion and processing while seamlessly integrating with popular compute engines.
 
 ## Why Fluss Rust Client
-It's an unofficial experimental Rust client for interacting with Fluss. This client provides foundational capabilities for table management and log streaming operations, enabling developers to explore Fluss within Rust ecosystems.
+It's an official Rust client for interacting with Fluss. This client provides foundational capabilities for table management and log streaming operations, enabling developers to explore Fluss within Rust ecosystems.
 
 ## Quick-Start
 

From bf42412bb92b89f690ae864dde04755fb6abe331 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Sat, 13 Dec 2025 17:10:03 +0800
Subject: [PATCH 031/287] chore: abort last not complete batch (#91)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-authored-by: 赵海源 <zhaohaiyuan@xiaohongshu.com>
---
 fluss-rust/crates/fluss/src/record/arrow.rs | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index e46093dd14..806c9a5824 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -369,7 +369,11 @@ impl<'a> LogRecordsBatchs<'a> {
 
         let batch_size_bytes =
             LittleEndian::read_i32(self.data.get(self.current_pos + LENGTH_OFFSET..).unwrap());
-        Some(batch_size_bytes as usize + LOG_OVERHEAD)
+        let batch_size = batch_size_bytes as usize + LOG_OVERHEAD;
+        if batch_size > self.remaining_bytes {
+            return None;
+        }
+        Some(batch_size)
     }
 }
 

From d5586643db49eb07cbf35b0ef42f93c33ea7f6c1 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sat, 13 Dec 2025 17:11:28 +0800
Subject: [PATCH 032/287] feat: support subscribe from remote (#76)

---
 fluss-rust/bindings/cpp/src/lib.rs            |  20 +-
 fluss-rust/bindings/cpp/src/types.rs          |  15 +-
 fluss-rust/bindings/python/src/table.rs       |   6 +-
 .../crates/examples/src/example_table.rs      |   2 +-
 fluss-rust/crates/fluss/Cargo.toml            |  17 +-
 .../crates/fluss/src/client/table/mod.rs      |   1 +
 .../fluss/src/client/table/remote_log.rs      | 267 ++++++++++++++++++
 .../crates/fluss/src/client/table/scanner.rs  |  90 +++++-
 fluss-rust/crates/fluss/src/error.rs          |  12 +
 fluss-rust/crates/fluss/src/io/file_io.rs     | 158 +++++++++++
 fluss-rust/crates/fluss/src/io/mod.rs         |  34 +++
 fluss-rust/crates/fluss/src/io/storage.rs     |  79 ++++++
 fluss-rust/crates/fluss/src/io/storage_fs.rs  |  30 ++
 .../crates/fluss/src/io/storage_memory.rs     |  24 ++
 fluss-rust/crates/fluss/src/lib.rs            |   1 +
 fluss-rust/crates/fluss/src/util/mod.rs       |   8 +
 .../fluss/tests/integration/fluss_cluster.rs  |  60 +++-
 .../crates/fluss/tests/integration/table.rs   |  19 +-
 .../tests/integration/table_remote_scan.rs    | 223 +++++++++++++++
 fluss-rust/crates/fluss/tests/test_fluss.rs   |   2 +
 20 files changed, 1019 insertions(+), 49 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/table/remote_log.rs
 create mode 100644 fluss-rust/crates/fluss/src/io/file_io.rs
 create mode 100644 fluss-rust/crates/fluss/src/io/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/io/storage.rs
 create mode 100644 fluss-rust/crates/fluss/src/io/storage_fs.rs
 create mode 100644 fluss-rust/crates/fluss/src/io/storage_memory.rs
 create mode 100644 fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 3e883e29c6..54d6941379 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -243,7 +243,7 @@ fn new_connection(bootstrap_server: &str) -> Result<*mut Connection, String> {
             }));
             Ok(conn)
         }
-        Err(e) => Err(format!("Failed to connect: {}", e)),
+        Err(e) => Err(format!("Failed to connect: {e}")),
     }
 }
 
@@ -264,7 +264,7 @@ impl Connection {
                 let admin = Box::into_raw(Box::new(Admin { inner: admin }));
                 Ok(admin)
             }
-            Err(e) => Err(format!("Failed to get admin: {}", e)),
+            Err(e) => Err(format!("Failed to get admin: {e}")),
         }
     }
 
@@ -287,7 +287,7 @@ impl Connection {
                 }));
                 Ok(table)
             }
-            Err(e) => Err(format!("Failed to get table: {}", e)),
+            Err(e) => Err(format!("Failed to get table: {e}")),
         }
     }
 }
@@ -398,7 +398,7 @@ impl Table {
 
         let table_append = match fluss_table.new_append() {
             Ok(a) => a,
-            Err(e) => return Err(format!("Failed to create append: {}", e)),
+            Err(e) => return Err(format!("Failed to create append: {e}")),
         };
 
         let writer = table_append.create_writer();
@@ -413,7 +413,10 @@ impl Table {
             self.table_info.clone(),
         );
 
-        let scanner = fluss_table.new_scan().create_log_scanner();
+        let scanner = match fluss_table.new_scan().create_log_scanner() {
+            Ok(a) => a,
+            Err(e) => return Err(format!("Failed to create log scanner: {e}")),
+        };
         let scanner = Box::into_raw(Box::new(LogScanner { inner: scanner }));
         Ok(scanner)
     }
@@ -431,9 +434,12 @@ impl Table {
         let scan = fluss_table.new_scan();
         let scan = match scan.project(&column_indices) {
             Ok(s) => s,
-            Err(e) => return Err(format!("Failed to project columns: {}", e)),
+            Err(e) => return Err(format!("Failed to project columns: {e}")),
+        };
+        let scanner = match scan.create_log_scanner() {
+            Ok(a) => a,
+            Err(e) => return Err(format!("Failed to create log scanner: {e}")),
         };
-        let scanner = scan.create_log_scanner();
         let scanner = Box::into_raw(Box::new(LogScanner { inner: scanner }));
         Ok(scanner)
     }
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index d3bab38abe..f9404ac633 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -64,7 +64,7 @@ fn ffi_data_type_to_core(dt: i32) -> Result<fcore::metadata::DataType> {
         DATA_TYPE_TIME => Ok(fcore::metadata::DataTypes::time()),
         DATA_TYPE_TIMESTAMP => Ok(fcore::metadata::DataTypes::timestamp()),
         DATA_TYPE_TIMESTAMP_LTZ => Ok(fcore::metadata::DataTypes::timestamp_ltz()),
-        _ => Err(anyhow!("Unknown data type: {}", dt)),
+        _ => Err(anyhow!("Unknown data type: {dt}")),
     }
 }
 
@@ -423,10 +423,7 @@ fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
                     datum.i32_val = array.value(row_id);
                     datum
                 }
-                _ => panic!(
-                    "Will never come here. Unsupported Time32 unit for column {}",
-                    i
-                ),
+                _ => panic!("Will never come here. Unsupported Time32 unit for column {i}"),
             },
             ArrowDataType::Time64(unit) => match unit {
                 TimeUnit::Microsecond => {
@@ -449,14 +446,10 @@ fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
                     datum.i64_val = array.value(row_id);
                     datum
                 }
-                _ => panic!(
-                    "Will never come here. Unsupported Time64 unit for column {}",
-                    i
-                ),
+                _ => panic!("Will never come here. Unsupported Time64 unit for column {i}"),
             },
             other => panic!(
-                "Will never come here. Unsupported Arrow data type for column {}: {:?}",
-                i, other
+                "Will never come here. Unsupported Arrow data type for column {i}: {other:?}"
             ),
         };
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 2a8df25c9d..71759d7505 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -67,7 +67,11 @@ impl FlussTable {
 
             let table_scan = fluss_table.new_scan();
 
-            let rust_scanner = table_scan.create_log_scanner();
+            let rust_scanner = table_scan.create_log_scanner().map_err(|e| {
+                PyErr::new::<pyo3::exceptions::PyRuntimeError, _>(format!(
+                    "Failed to create log scanner: {e:?}"
+                ))
+            })?;
 
             let admin = conn
                 .get_admin()
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index deab3639da..2d6ac53d8f 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -70,7 +70,7 @@ pub async fn main() -> Result<()> {
     try_join!(f1, f2, append_writer.flush())?;
 
     // scan rows
-    let log_scanner = table.new_scan().create_log_scanner();
+    let log_scanner = table.new_scan().create_log_scanner()?;
     log_scanner.subscribe(0, 0).await?;
 
     loop {
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index af770377ce..4547b9c327 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -22,6 +22,14 @@ version = { workspace = true }
 name = "fluss"
 build = "src/build.rs"
 
+[features]
+default = ["storage-memory", "storage-fs"]
+storage-all = ["storage-memory", "storage-fs"]
+
+storage-memory = ["opendal/services-memory"]
+storage-fs = ["opendal/services-fs"]
+integration_tests = []
+
 [dependencies]
 arrow = { workspace = true }
 arrow-schema = "57.0.0"
@@ -45,16 +53,17 @@ ordered-float = { version = "4", features = ["serde"] }
 parse-display = "0.10"
 ref-cast = "1.0"
 chrono = { workspace = true }
-oneshot = "0.1.11"
+opendal = "0.53.3"
+url = "2.5.7"
+async-trait = "0.1.89"
+uuid = { version = "1.10", features = ["v4"] }
+tempfile= "3.23.0"
 
 [dev-dependencies]
 testcontainers = "0.25.0"
 once_cell = "1.19"
 test-env-helpers = "0.2.2"
 
-[features]
-integration_tests = []
-
 
 [build-dependencies]
 prost-build = {  version = "0.13.5"  }
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 52ae700fc6..99722477c5 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -26,6 +26,7 @@ pub const EARLIEST_OFFSET: i64 = -2;
 
 mod append;
 
+mod remote_log;
 mod scanner;
 mod writer;
 
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
new file mode 100644
index 0000000000..65805d069b
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -0,0 +1,267 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing, software
+// distributed under the License is distributed on an "AS IS" BASIS,
+// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+// See the License for the specific language governing permissions and
+// limitations under the License.
+
+use crate::error::{Error, Result};
+use crate::io::{FileIO, Storage};
+use crate::metadata::TableBucket;
+use crate::proto::{PbRemoteLogFetchInfo, PbRemoteLogSegment};
+use crate::record::{LogRecordsBatchs, ReadContext, ScanRecord};
+use crate::util::delete_file;
+use std::collections::HashMap;
+use std::io;
+use std::path::{Path, PathBuf};
+use tempfile::TempDir;
+use tokio::io::AsyncWriteExt;
+use tokio::sync::oneshot;
+
+/// A log segment stored in remote storage that the client has to download.
+#[derive(Debug, Clone)]
+pub struct RemoteLogSegment {
+    pub segment_id: String,
+    pub start_offset: i64,
+    #[allow(dead_code)]
+    pub end_offset: i64,
+    #[allow(dead_code)]
+    pub size_in_bytes: i32,
+    pub table_bucket: TableBucket,
+}
+
+impl RemoteLogSegment {
+    /// Builds a segment from its protobuf message, attaching the given `table_bucket`.
+    pub fn from_proto(segment: &PbRemoteLogSegment, table_bucket: TableBucket) -> Self {
+        let segment_id = segment.remote_log_segment_id.clone();
+        Self {
+            segment_id,
+            start_offset: segment.remote_log_start_offset,
+            end_offset: segment.remote_log_end_offset,
+            size_in_bytes: segment.segment_size_in_bytes,
+            table_bucket,
+        }
+    }
+
+    /// Local file name: `${segment_id}_${start_offset zero-padded to width 20}.log`.
+    pub fn local_file_name(&self) -> String {
+        format!("{}_{:020}.log", self.segment_id, self.start_offset)
+    }
+}
+
+/// Remote-log part of a fetch response: the tablet directory and the segments to read.
+#[derive(Debug, Clone)]
+pub struct RemoteLogFetchInfo {
+    pub remote_log_tablet_dir: String,
+    #[allow(dead_code)]
+    pub partition_name: Option<String>,
+    pub remote_log_segments: Vec<RemoteLogSegment>,
+    pub first_start_pos: i32,
+}
+
+impl RemoteLogFetchInfo {
+    /// Builds the fetch info from protobuf; an absent `first_start_pos` becomes 0.
+    pub fn from_proto(info: &PbRemoteLogFetchInfo, table_bucket: TableBucket) -> Result<Self> {
+        let mut segments = Vec::with_capacity(info.remote_log_segments.len());
+        for pb in &info.remote_log_segments {
+            segments.push(RemoteLogSegment::from_proto(pb, table_bucket.clone()));
+        }
+
+        Ok(Self {
+            remote_log_tablet_dir: info.remote_log_tablet_dir.clone(),
+            partition_name: info.partition_name.clone(),
+            remote_log_segments: segments,
+            first_start_pos: info.first_start_pos.unwrap_or(0),
+        })
+    }
+}
+
+/// Handle to the result of one remote log download; the result can be taken only once.
+pub struct RemoteLogDownloadFuture {
+    receiver: Option<oneshot::Receiver<Result<PathBuf>>>,
+}
+
+impl RemoteLogDownloadFuture {
+    pub fn new(receiver: oneshot::Receiver<Result<PathBuf>>) -> Self {
+        // `Some` until `get_file_path` takes the receiver out.
+        let receiver = Some(receiver);
+        Self { receiver }
+    }
+
+    /// Waits for the download to finish and yields the local path; fails on a repeated call.
+    pub async fn get_file_path(&mut self) -> Result<PathBuf> {
+        let Some(pending) = self.receiver.take() else {
+            return Err(Error::Io(io::Error::other("Download future already consumed")));
+        };
+        match pending.await {
+            Ok(download_result) => download_result,
+            Err(e) => {
+                let cancelled = io::Error::other(format!("Download future cancelled: {e:?}"));
+                Err(Error::Io(cancelled))
+            }
+        }
+    }
+}
+
+/// Downloads remote log segment files into a local temporary directory
+pub struct RemoteLogDownloader {
+    local_log_dir: TempDir,
+}
+
+impl RemoteLogDownloader {
+    pub fn new(local_log_dir: TempDir) -> Result<Self> {
+        Ok(Self { local_log_dir })
+    }
+
+    /// Starts fetching a remote log segment to local in a spawned Tokio task; does not block.
+    pub fn request_remote_log(
+        &self,
+        remote_log_tablet_dir: &str,
+        segment: &RemoteLogSegment,
+    ) -> Result<RemoteLogDownloadFuture> {
+        let (sender, receiver) = oneshot::channel();
+        let local_file_name = segment.local_file_name();
+        let local_file_path = self.local_log_dir.path().join(&local_file_name);
+        let remote_path = self.build_remote_path(remote_log_tablet_dir, segment);
+        let remote_log_tablet_dir = remote_log_tablet_dir.to_string();
+        // Spawn the download task; its outcome is delivered through the oneshot channel
+        tokio::spawn(async move {
+            let result =
+                Self::download_file(&remote_log_tablet_dir, &remote_path, &local_file_path).await;
+            let _ = sender.send(result); // a send error is explicitly discarded
+        });
+        Ok(RemoteLogDownloadFuture::new(receiver))
+    }
+
+    /// Build the remote path for a log segment
+    fn build_remote_path(&self, remote_log_tablet_dir: &str, segment: &RemoteLogSegment) -> String {
+        // Format: ${remote_log_tablet_dir}/${segment_id}/${offset_prefix}.log
+        let offset_prefix = format!("{:020}", segment.start_offset);
+        format!(
+            "{}/{}/{}.log",
+            remote_log_tablet_dir, segment.segment_id, offset_prefix
+        )
+    }
+
+    /// Copy a remote file to `local_path` chunk by chunk and return `local_path` on success
+    async fn download_file(
+        remote_log_tablet_dir: &str,
+        remote_path: &str,
+        local_path: &Path,
+    ) -> Result<PathBuf> {
+        // Handle both URL (e.g., "s3://bucket/path") and local file paths
+        // If the path doesn't contain "://", treat it as a local file path
+        let remote_log_tablet_dir_url = if remote_log_tablet_dir.contains("://") {
+            remote_log_tablet_dir.to_string()
+        } else {
+            format!("file://{remote_log_tablet_dir}")
+        };
+
+        // Create a FileIO builder from the tablet dir URL (only its scheme is used by from_url)
+        let file_io_builder = FileIO::from_url(&remote_log_tablet_dir_url)?;
+
+        // Build storage and create operator directly
+        let storage = Storage::build(file_io_builder)?;
+        let (op, relative_path) = storage.create(remote_path)?;
+
+        // Get file metadata to know the size
+        let meta = op.stat(relative_path).await?;
+        let file_size = meta.content_length();
+
+        // Create local file for writing
+        let mut local_file = tokio::fs::File::create(local_path).await?;
+
+        // Stream data from remote to local file in chunks
+        // Each iteration issues one ranged read (`read_with(..).range(..)`) of at most CHUNK_SIZE
+        const CHUNK_SIZE: u64 = 8 * 1024 * 1024; // 8 MiB per ranged read
+        let mut offset = 0u64;
+
+        while offset < file_size {
+            let end = std::cmp::min(offset + CHUNK_SIZE, file_size);
+            let range = offset..end;
+
+            // Read chunk from remote storage
+            let chunk = op.read_with(relative_path).range(range.clone()).await?;
+            let bytes = chunk.to_bytes();
+
+            // Write chunk to local file
+            local_file.write_all(&bytes).await?;
+
+            offset = end;
+        }
+
+        // Ensure all data is flushed to disk
+        local_file.sync_all().await?;
+
+        Ok(local_path.to_path_buf())
+    }
+}
+
+/// Pending fetch that waits for remote log file to be downloaded
+pub struct RemotePendingFetch {
+    segment: RemoteLogSegment,
+    download_future: RemoteLogDownloadFuture,
+    pos_in_log_segment: i32,
+    #[allow(dead_code)]
+    fetch_offset: i64,
+    #[allow(dead_code)]
+    high_watermark: i64,
+    read_context: ReadContext,
+}
+
+impl RemotePendingFetch {
+    pub fn new(
+        segment: RemoteLogSegment,
+        download_future: RemoteLogDownloadFuture,
+        pos_in_log_segment: i32,
+        fetch_offset: i64,
+        high_watermark: i64,
+        read_context: ReadContext,
+    ) -> Self {
+        Self {
+            segment,
+            download_future,
+            pos_in_log_segment,
+            fetch_offset,
+            high_watermark,
+            read_context,
+        }
+    }
+
+    /// Waits for the download, then parses the file from `pos_in_log_segment` into scan records.
+    pub async fn convert_to_completed_fetch(
+        mut self,
+    ) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
+        let file_path = self.download_future.get_file_path().await?;
+        let read_result = tokio::fs::read(&file_path).await;
+        // Delete the local copy before inspecting the read result so a failed read cannot leak it.
+        delete_file(file_path).await;
+        let file_data = read_result?;
+
+        // Skip the bytes before the start position; return an error instead of panicking when
+        // the position lies beyond the downloaded file. Non-positive positions read everything.
+        let start = usize::try_from(self.pos_in_log_segment).unwrap_or(0);
+        let data = file_data.get(start..).ok_or_else(|| {
+            Error::Io(io::Error::other("Start position is past the end of the remote log segment"))
+        })?;
+
+        // Parse log records
+        let mut fetch_records = vec![];
+        for log_record in &mut LogRecordsBatchs::new(data) {
+            fetch_records.extend(log_record.records(&self.read_context)?);
+        }
+
+        let mut result = HashMap::new();
+        result.insert(self.segment.table_bucket.clone(), fetch_records);
+        Ok(result)
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 13372efecf..f6780d715c 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -29,6 +29,11 @@ use std::collections::HashMap;
 use std::slice::from_ref;
 use std::sync::Arc;
 use std::time::Duration;
+use tempfile::TempDir;
+
+use crate::client::table::remote_log::{
+    RemoteLogDownloader, RemoteLogFetchInfo, RemotePendingFetch,
+};
 
 const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
 #[allow(dead_code)]
@@ -120,7 +125,7 @@ impl<'a> TableScan<'a> {
         Ok(self)
     }
 
-    pub fn create_log_scanner(self) -> LogScanner {
+    pub fn create_log_scanner(self) -> Result<LogScanner> {
         LogScanner::new(
             &self.table_info,
             self.metadata.clone(),
@@ -144,9 +149,9 @@ impl LogScanner {
         metadata: Arc<Metadata>,
         connections: Arc<RpcClient>,
         projected_fields: Option<Vec<usize>>,
-    ) -> Self {
+    ) -> Result<Self> {
         let log_scanner_status = Arc::new(LogScannerStatus::new());
-        Self {
+        Ok(Self {
             table_path: table_info.table_path.clone(),
             table_id: table_info.table_id,
             metadata: metadata.clone(),
@@ -157,8 +162,8 @@ impl LogScanner {
                 metadata.clone(),
                 log_scanner_status.clone(),
                 projected_fields,
-            ),
-        }
+            )?,
+        })
     }
 
     pub async fn poll(&self, _timeout: Duration) -> Result<ScanRecords> {
@@ -188,6 +193,7 @@ struct LogFetcher {
     metadata: Arc<Metadata>,
     log_scanner_status: Arc<LogScannerStatus>,
     read_context: ReadContext,
+    remote_log_downloader: RemoteLogDownloader,
 }
 
 impl LogFetcher {
@@ -197,17 +203,21 @@ impl LogFetcher {
         metadata: Arc<Metadata>,
         log_scanner_status: Arc<LogScannerStatus>,
         projected_fields: Option<Vec<usize>>,
-    ) -> Self {
+    ) -> Result<Self> {
         let full_arrow_schema = to_arrow_schema(table_info.get_row_type());
-        let read_context = Self::create_read_context(full_arrow_schema, projected_fields);
-        LogFetcher {
+        let read_context = Self::create_read_context(full_arrow_schema, projected_fields.clone());
+
+        let tmp_dir = TempDir::with_prefix("fluss-remote-logs")?;
+
+        Ok(LogFetcher {
             table_path: table_info.table_path.clone(),
             conns,
             table_info,
             metadata,
             log_scanner_status,
             read_context,
-        }
+            remote_log_downloader: RemoteLogDownloader::new(tmp_dir)?,
+        })
     }
 
     fn create_read_context(
@@ -239,10 +249,66 @@ impl LogFetcher {
                 let fetch_log_for_buckets = pb_fetch_log_resp.buckets_resp;
 
                 for fetch_log_for_bucket in fetch_log_for_buckets {
-                    let mut fetch_records = vec![];
                     let bucket: i32 = fetch_log_for_bucket.bucket_id;
                     let table_bucket = TableBucket::new(table_id, bucket);
-                    if fetch_log_for_bucket.records.is_some() {
+
+                    // Check if this is a remote log fetch
+                    if let Some(ref remote_log_fetch_info) =
+                        fetch_log_for_bucket.remote_log_fetch_info
+                    {
+                        let remote_fetch_info = RemoteLogFetchInfo::from_proto(
+                            remote_log_fetch_info,
+                            table_bucket.clone(),
+                        )?;
+
+                        if let Some(fetch_offset) =
+                            self.log_scanner_status.get_bucket_offset(&table_bucket)
+                        {
+                            let high_watermark = fetch_log_for_bucket.high_watermark.unwrap_or(-1);
+                            // Download and process remote log segments
+                            let mut pos_in_log_segment = remote_fetch_info.first_start_pos;
+                            let mut current_fetch_offset = fetch_offset;
+                            // todo: make segment download parallelly
+                            for (i, segment) in
+                                remote_fetch_info.remote_log_segments.iter().enumerate()
+                            {
+                                if i > 0 {
+                                    pos_in_log_segment = 0;
+                                    current_fetch_offset = segment.start_offset;
+                                }
+
+                                let download_future =
+                                    self.remote_log_downloader.request_remote_log(
+                                        &remote_fetch_info.remote_log_tablet_dir,
+                                        segment,
+                                    )?;
+                                let pending_fetch = RemotePendingFetch::new(
+                                    segment.clone(),
+                                    download_future,
+                                    pos_in_log_segment,
+                                    current_fetch_offset,
+                                    high_watermark,
+                                    self.read_context.clone(),
+                                );
+                                let remote_records =
+                                    pending_fetch.convert_to_completed_fetch().await?;
+                                // Update offset and merge results
+                                for (tb, records) in remote_records {
+                                    if let Some(last_record) = records.last() {
+                                        self.log_scanner_status
+                                            .update_offset(&tb, last_record.offset() + 1);
+                                    }
+                                    result.entry(tb).or_default().extend(records);
+                                }
+                            }
+                        } else {
+                            // if the offset is null, it means the bucket has been unsubscribed,
+                            // skip processing and continue to the next bucket.
+                            continue;
+                        }
+                    } else if fetch_log_for_bucket.records.is_some() {
+                        // Handle regular in-memory records
+                        let mut fetch_records = vec![];
                         let data = fetch_log_for_bucket.records.unwrap();
                         for log_record in &mut LogRecordsBatchs::new(&data) {
                             let last_offset = log_record.last_log_offset();
@@ -250,8 +316,8 @@ impl LogFetcher {
                             self.log_scanner_status
                                 .update_offset(&table_bucket, last_offset + 1);
                         }
+                        result.insert(table_bucket, fetch_records);
                     }
-                    result.insert(table_bucket, fetch_records);
                 }
             }
         }
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index 58b88a4786..b1d5d13b6e 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -47,4 +47,16 @@ pub enum Error {
 
     #[error("Illegal argument error: {0}")]
     IllegalArgument(String),
+
+    #[error("IO not supported error: {0}")]
+    IoUnsupported(String),
+
+    #[error("IO operation failed on underlying storage: {0}")]
+    IoUnexpected(Box<opendal::Error>),
+}
+
+impl From<opendal::Error> for Error {
+    fn from(err: opendal::Error) -> Self {
+        Error::IoUnexpected(Box::new(err))
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/io/file_io.rs b/fluss-rust/crates/fluss/src/io/file_io.rs
new file mode 100644
index 0000000000..69a4c9707f
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/io/file_io.rs
@@ -0,0 +1,158 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+use crate::error::*;
+use std::collections::HashMap;
+use std::ops::Range;
+use std::sync::Arc;
+
+use bytes::Bytes;
+use chrono::{DateTime, Utc};
+use opendal::Operator;
+
+use url::Url;
+
+use super::Storage;
+
+use crate::error::Result;
+
+#[derive(Clone, Debug)]
+pub struct FileIO {
+    storage: Arc<Storage>,
+}
+
+impl FileIO {
+    /// Parse `path` as a URL and return a [`FileIOBuilder`] for that URL's scheme.
+    pub fn from_url(path: &str) -> Result<FileIOBuilder> {
+        let url =
+            Url::parse(path).map_err(|_| Error::IllegalArgument(format!("Invalid URL: {path}")))?;
+        Ok(FileIOBuilder::new(url.scheme()))
+    }
+
+    /// Create an [`InputFile`] handle for `path`, backed by an operator from the storage.
+    pub fn new_input(&self, path: &str) -> Result<InputFile> {
+        let (op, relative_path) = self.storage.create(path)?;
+        let path = path.to_string();
+        let relative_path_pos = path.len() - relative_path.len();
+        Ok(InputFile {
+            op,
+            path,
+            relative_path_pos,
+        })
+    }
+}
+
+#[derive(Debug)]
+pub struct FileIOBuilder {
+    scheme_str: Option<String>,
+    props: HashMap<String, String>,
+}
+
+impl FileIOBuilder {
+    pub fn new(scheme_str: impl ToString) -> Self {
+        Self {
+            scheme_str: Some(scheme_str.to_string()),
+            props: HashMap::default(),
+        }
+    }
+
+    pub(crate) fn into_parts(self) -> (String, HashMap<String, String>) {
+        (self.scheme_str.unwrap_or_default(), self.props)
+    }
+
+    pub fn with_prop(mut self, key: impl ToString, value: impl ToString) -> Self {
+        self.props.insert(key.to_string(), value.to_string());
+        self
+    }
+
+    pub fn with_props(
+        mut self,
+        args: impl IntoIterator<Item = (impl ToString, impl ToString)>,
+    ) -> Self {
+        self.props
+            .extend(args.into_iter().map(|e| (e.0.to_string(), e.1.to_string())));
+        self
+    }
+
+    pub fn build(self) -> Result<FileIO> {
+        let storage = Storage::build(self)?;
+        Ok(FileIO {
+            storage: Arc::new(storage),
+        })
+    }
+}
+
+#[async_trait::async_trait]
+pub trait FileRead: Send + Unpin + 'static {
+    async fn read(&self, range: Range<u64>) -> Result<Bytes>;
+}
+
+#[async_trait::async_trait]
+impl FileRead for opendal::Reader {
+    async fn read(&self, range: Range<u64>) -> Result<Bytes> {
+        Ok(opendal::Reader::read(self, range).await?.to_bytes())
+    }
+}
+
+#[derive(Debug)]
+pub struct InputFile {
+    op: Operator,
+    path: String,
+    relative_path_pos: usize,
+}
+
+impl InputFile {
+    pub fn location(&self) -> &str {
+        &self.path
+    }
+
+    pub async fn exists(&self) -> Result<bool> {
+        Ok(self.op.exists(&self.path[self.relative_path_pos..]).await?)
+    }
+
+    pub async fn metadata(&self) -> Result<FileStatus> {
+        let meta = self.op.stat(&self.path[self.relative_path_pos..]).await?;
+
+        Ok(FileStatus {
+            size: meta.content_length(),
+            is_dir: meta.is_dir(),
+            path: self.path.clone(),
+            last_modified: meta.last_modified(),
+        })
+    }
+
+    pub async fn read(&self) -> Result<Bytes> {
+        Ok(self
+            .op
+            .read(&self.path[self.relative_path_pos..])
+            .await?
+            .to_bytes())
+    }
+
+    pub async fn reader(&self) -> Result<impl FileRead> {
+        Ok(self.op.reader(&self.path[self.relative_path_pos..]).await?)
+    }
+}
+
+#[derive(Clone, Debug)]
+pub struct FileStatus {
+    pub size: u64,
+    pub is_dir: bool,
+    pub path: String,
+    pub last_modified: Option<DateTime<Utc>>,
+}
diff --git a/fluss-rust/crates/fluss/src/io/mod.rs b/fluss-rust/crates/fluss/src/io/mod.rs
new file mode 100644
index 0000000000..3c9a1659e4
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/io/mod.rs
@@ -0,0 +1,34 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+mod file_io;
+
+pub use file_io::*;
+
+mod storage;
+pub use storage::*;
+
+#[cfg(feature = "storage-fs")]
+mod storage_fs;
+#[cfg(feature = "storage-fs")]
+use storage_fs::*;
+#[cfg(feature = "storage-memory")]
+mod storage_memory;
+
+#[cfg(feature = "storage-memory")]
+use storage_memory::*;
diff --git a/fluss-rust/crates/fluss/src/io/storage.rs b/fluss-rust/crates/fluss/src/io/storage.rs
new file mode 100644
index 0000000000..361da7ee80
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/io/storage.rs
@@ -0,0 +1,79 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+use crate::error;
+use crate::error::Result;
+use crate::io::FileIOBuilder;
+use opendal::{Operator, Scheme};
+
+/// The storage carries all supported storage services in fluss
+#[derive(Debug)]
+pub enum Storage {
+    #[cfg(feature = "storage-memory")]
+    Memory,
+    #[cfg(feature = "storage-fs")]
+    LocalFs,
+}
+
+impl Storage {
+    pub(crate) fn build(file_io_builder: FileIOBuilder) -> Result<Self> {
+        let (scheme_str, _) = file_io_builder.into_parts();
+        let scheme = Self::parse_scheme(&scheme_str)?;
+
+        match scheme {
+            #[cfg(feature = "storage-memory")]
+            Scheme::Memory => Ok(Self::Memory),
+            #[cfg(feature = "storage-fs")]
+            Scheme::Fs => Ok(Self::LocalFs),
+            _ => Err(error::Error::IoUnsupported(
+                "Unsupported storage feature".to_string(),
+            )),
+        }
+    }
+
+    pub(crate) fn create<'a>(&self, path: &'a str) -> Result<(Operator, &'a str)> {
+        match self {
+            #[cfg(feature = "storage-memory")]
+            Storage::Memory => {
+                let op = super::memory_config_build()?;
+                // Drop the `memory:/` prefix, or else one leading `/`. Using
+                // `strip_prefix` rather than slicing means an empty path cannot
+                // panic and a path with no leading `/` is kept intact.
+                let relative = path.strip_prefix("memory:/");
+                let relative = relative.or_else(|| path.strip_prefix('/'));
+                Ok((op, relative.unwrap_or(path)))
+            }
+            #[cfg(feature = "storage-fs")]
+            Storage::LocalFs => {
+                let op = super::fs_config_build()?;
+                // Drop the `file:/` prefix, or else one leading `/`; a path with
+                // neither is returned unchanged instead of losing its first byte.
+                let relative = path.strip_prefix("file:/");
+                let relative = relative.or_else(|| path.strip_prefix('/'));
+                Ok((op, relative.unwrap_or(path)))
+            }
+        }
+    }
+
+    fn parse_scheme(scheme: &str) -> Result<Scheme> {
+        match scheme {
+            "memory" => Ok(Scheme::Memory),
+            "file" | "" => Ok(Scheme::Fs),
+            s => Ok(s.parse::<Scheme>()?),
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/io/storage_fs.rs b/fluss-rust/crates/fluss/src/io/storage_fs.rs
new file mode 100644
index 0000000000..95ca6fa95f
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/io/storage_fs.rs
@@ -0,0 +1,30 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+use opendal::Operator;
+use opendal::services::FsConfig;
+
+use crate::error::Result;
+
+/// Build a new opendal operator for the local filesystem with its root set to `/`.
+pub(crate) fn fs_config_build() -> Result<Operator> {
+    let mut cfg = FsConfig::default();
+    cfg.root = Some("/".to_string());
+
+    Ok(Operator::from_config(cfg)?.finish())
+}
diff --git a/fluss-rust/crates/fluss/src/io/storage_memory.rs b/fluss-rust/crates/fluss/src/io/storage_memory.rs
new file mode 100644
index 0000000000..af73a90174
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/io/storage_memory.rs
@@ -0,0 +1,24 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+use crate::error::Result;
+use opendal::Operator;
+use opendal::services::MemoryConfig;
+
+pub(crate) fn memory_config_build() -> Result<Operator> {
+    Ok(Operator::from_config(MemoryConfig::default())?.finish())
+}
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index e63b5edfd8..366edfc60a 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -26,6 +26,7 @@ mod cluster;
 pub mod config;
 pub mod error;
 
+pub mod io;
 mod util;
 
 pub type TableId = u64;
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
index c26b4ec43a..f93abf967b 100644
--- a/fluss-rust/crates/fluss/src/util/mod.rs
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -19,8 +19,10 @@ use crate::metadata::TableBucket;
 use linked_hash_map::LinkedHashMap;
 use std::collections::{HashMap, HashSet};
 use std::hash::Hash;
+use std::path::PathBuf;
 use std::sync::Arc;
 use std::time::{SystemTime, UNIX_EPOCH};
+use tracing::warn;
 
 pub fn current_time_ms() -> i64 {
     SystemTime::now()
@@ -29,6 +31,12 @@ pub fn current_time_ms() -> i64 {
         .as_millis() as i64
 }
 
+pub async fn delete_file(file_path: PathBuf) {
+    tokio::fs::remove_file(&file_path)
+        .await
+        .unwrap_or_else(|e| warn!("Could not delete file: {:?}, error: {:?}", &file_path, e));
+}
+
 pub struct FairBucketStatusMap<S> {
     map: LinkedHashMap<TableBucket, Arc<S>>,
     size: usize,
diff --git a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
index e827e14932..21422df6a0 100644
--- a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
+++ b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
@@ -32,12 +32,27 @@ pub struct FlussTestingClusterBuilder {
     network: &'static str,
     cluster_conf: HashMap<String, String>,
     testing_name: String,
+    remote_data_dir: Option<std::path::PathBuf>,
 }
 
 impl FlussTestingClusterBuilder {
     pub fn new(testing_name: impl Into<String>) -> Self {
+        Self::new_with_cluster_conf(testing_name.into(), &HashMap::default())
+    }
+
+    pub fn with_remote_data_dir(mut self, dir: std::path::PathBuf) -> Self {
+        // Ensure the directory exists before mounting
+        std::fs::create_dir_all(&dir).expect("Failed to create remote data directory");
+        self.remote_data_dir = Some(dir);
+        self
+    }
+
+    pub fn new_with_cluster_conf(
+        testing_name: impl Into<String>,
+        conf: &HashMap<String, String>,
+    ) -> Self {
         // reduce testing resources
-        let mut cluster_conf = HashMap::new();
+        let mut cluster_conf = conf.clone();
         cluster_conf.insert(
             "netty.server.num-network-threads".to_string(),
             "1".to_string(),
@@ -52,6 +67,7 @@ impl FlussTestingClusterBuilder {
             cluster_conf,
             network: "fluss-cluster-network",
             testing_name: testing_name.into(),
+            remote_data_dir: None,
         }
     }
 
@@ -92,6 +108,7 @@ impl FlussTestingClusterBuilder {
             coordinator_server,
             tablet_servers,
             bootstrap_servers: "127.0.0.1:9123".to_string(),
+            remote_data_dir: self.remote_data_dir.clone(),
         }
     }
 
@@ -147,7 +164,15 @@ impl FlussTestingClusterBuilder {
         tablet_server_confs.insert("internal.listener.name", "INTERNAL".to_string());
         tablet_server_confs.insert("tablet-server.id", tablet_server_id);
 
-        GenericImage::new("fluss/fluss", FLUSS_VERSION)
+        // Set remote.data.dir to use the same path as host when volume mount is provided
+        // This ensures the path is consistent between host and container
+        if let Some(remote_data_dir) = &self.remote_data_dir {
+            tablet_server_confs.insert(
+                "remote.data.dir",
+                remote_data_dir.to_string_lossy().to_string(),
+            );
+        }
+        let mut image = GenericImage::new("fluss/fluss", FLUSS_VERSION)
             .with_cmd(vec!["tabletServer"])
             .with_mapped_port(expose_host_port as u16, ContainerPort::Tcp(9123))
             .with_network(self.network)
@@ -155,10 +180,20 @@ impl FlussTestingClusterBuilder {
             .with_env_var(
                 "FLUSS_PROPERTIES",
                 self.to_fluss_properties_with(tablet_server_confs),
-            )
-            .start()
-            .await
-            .unwrap()
+            );
+
+        // Add volume mount if remote_data_dir is provided
+        if let Some(ref remote_data_dir) = self.remote_data_dir {
+            use testcontainers::core::Mount;
+            // Ensure directory exists before mounting (double check)
+            std::fs::create_dir_all(remote_data_dir)
+                .expect("Failed to create remote data directory for mount");
+            let host_path = remote_data_dir.to_string_lossy().to_string();
+            let container_path = remote_data_dir.to_string_lossy().to_string();
+            image = image.with_mount(Mount::bind_mount(host_path, container_path));
+        }
+
+        image.start().await.unwrap()
     }
 
     fn to_fluss_properties_with(&self, extra_properties: HashMap<&str, String>) -> String {
@@ -180,6 +215,7 @@ pub struct FlussTestingCluster {
     coordinator_server: Arc<ContainerAsync<GenericImage>>,
     tablet_servers: HashMap<i32, Arc<ContainerAsync<GenericImage>>>,
     bootstrap_servers: String,
+    remote_data_dir: Option<std::path::PathBuf>,
 }
 
 impl FlussTestingCluster {
@@ -189,6 +225,18 @@ impl FlussTestingCluster {
         }
         self.coordinator_server.stop().await.unwrap();
         self.zookeeper.stop().await.unwrap();
+        if let Some(remote_data_dir) = &self.remote_data_dir {
+            // Try to clean up the remote data directory, but don't fail if it can't be deleted.
+            // This can happen in CI environments or if Docker containers are still using the directory.
+            // The directory will be cleaned up by the CI system or OS eventually.
+            if let Err(e) = tokio::fs::remove_dir_all(remote_data_dir).await {
+                eprintln!(
+                    "Warning: Failed to delete remote data directory: {:?}, error: {:?}. \
+                     This is non-fatal and the directory may be cleaned up later.",
+                    remote_data_dir, e
+                );
+            }
+        }
     }
 
     pub async fn get_fluss_connection(&self) -> FlussConnection {
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index e14b852648..b23fd793cd 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -16,11 +16,11 @@
  * limitations under the License.
  */
 
-use crate::integration::fluss_cluster::FlussTestingCluster;
 use once_cell::sync::Lazy;
 use parking_lot::RwLock;
 use std::sync::Arc;
 
+use crate::integration::fluss_cluster::FlussTestingCluster;
 #[cfg(test)]
 use test_env_helpers::*;
 
@@ -39,12 +39,11 @@ mod table_test {
     use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
     use fluss::row::InternalRow;
     use std::sync::Arc;
-    use std::sync::atomic::AtomicUsize;
     use std::thread;
     fn before_all() {
         // Create a new tokio runtime in a separate thread
         let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
-        std::thread::spawn(move || {
+        thread::spawn(move || {
             let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
             rt.block_on(async {
                 let cluster = FlussTestingClusterBuilder::new("test_table").build().await;
@@ -71,7 +70,7 @@ mod table_test {
     fn after_all() {
         // Create a new tokio runtime in a separate thread
         let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
-        std::thread::spawn(move || {
+        thread::spawn(move || {
             let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
             rt.block_on(async {
                 let mut guard = cluster_guard.write();
@@ -137,7 +136,10 @@ mod table_test {
         append_writer.flush().await.expect("Failed to flush");
 
         let num_buckets = table.table_info().get_num_buckets();
-        let log_scanner = table.new_scan().create_log_scanner();
+        let log_scanner = table
+            .new_scan()
+            .create_log_scanner()
+            .expect("Failed to create log scanner");
         for bucket_id in 0..num_buckets {
             log_scanner
                 .subscribe(bucket_id, 0)
@@ -166,7 +168,8 @@ mod table_test {
             .new_scan()
             .project(&[1, 0])
             .expect("Failed to project")
-            .create_log_scanner();
+            .create_log_scanner()
+            .expect("Failed to create log scanner");
         for bucket_id in 0..num_buckets {
             log_scanner_projected
                 .subscribe(bucket_id, 0)
@@ -212,7 +215,9 @@ mod table_test {
             .expect("Failed to get table");
 
         let table_scan = table.new_scan();
-        let log_scanner = table_scan.create_log_scanner();
+        let log_scanner = table_scan
+            .create_log_scanner()
+            .expect("Failed to create log scanner");
 
         // Subscribe to bucket 0 starting from offset 0
         log_scanner
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
new file mode 100644
index 0000000000..f33d440f40
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -0,0 +1,223 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+use crate::integration::fluss_cluster::FlussTestingCluster;
+use once_cell::sync::Lazy;
+use parking_lot::RwLock;
+use std::sync::Arc;
+
+#[cfg(test)]
+use test_env_helpers::*;
+
+// Module-level shared cluster instance (only for this test file)
+static SHARED_FLUSS_CLUSTER: Lazy<Arc<RwLock<Option<FlussTestingCluster>>>> =
+    Lazy::new(|| Arc::new(RwLock::new(None)));
+
+#[cfg(test)]
+#[before_all]
+#[after_all]
+mod table_remote_scan_test {
+    use super::SHARED_FLUSS_CLUSTER;
+    use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
+    use crate::integration::utils::create_table;
+    use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+    use fluss::row::{GenericRow, InternalRow};
+    use std::collections::HashMap;
+    use std::sync::Arc;
+    use std::sync::atomic::AtomicUsize;
+    use std::sync::atomic::Ordering;
+    use std::thread;
+    use std::thread::sleep;
+    use std::time::Duration;
+    use uuid::Uuid;
+
+    fn before_all() {
+        // Create a new tokio runtime in a separate thread
+        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
+        thread::spawn(move || {
+            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
+            rt.block_on(async {
+                // Create a per-run directory for remote data that is reachable from both the
+                // host and the container; the same path string is used on both sides.
+                // On macOS, Docker Desktop may have issues with /tmp, so the directory is placed
+                // under `target/` in the current working directory, with a random UUID suffix.
+                let temp_dir = std::env::current_dir()
+                    .unwrap_or_else(|_| std::path::PathBuf::from("."))
+                    .join("target")
+                    .join(format!("test-remote-data-{}", Uuid::new_v4()));
+
+                // Remove existing directory if it exists to start fresh
+                let _ = std::fs::remove_dir_all(&temp_dir);
+                std::fs::create_dir_all(&temp_dir)
+                    .expect("Failed to create temporary directory for remote data");
+                println!("temp_dir: {:?}", temp_dir);
+
+                // Verify directory was created and is accessible
+                if !temp_dir.exists() {
+                    panic!("Remote data directory was not created: {:?}", temp_dir);
+                }
+
+                // Get absolute path for Docker mount
+                let temp_dir = temp_dir
+                    .canonicalize()
+                    .expect("Failed to canonicalize remote data directory path");
+
+                let mut cluster_conf = HashMap::new();
+                // use a tiny segment size so that log data gets tiered to remote storage
+                cluster_conf.insert("log.segment.file-size".to_string(), "120b".to_string());
+                cluster_conf.insert(
+                    "remote.log.task-interval-duration".to_string(),
+                    "1s".to_string(),
+                );
+                // remote.data.dir uses the same path in container and host
+                cluster_conf.insert(
+                    "remote.data.dir".to_string(),
+                    temp_dir.to_string_lossy().to_string(),
+                );
+
+                let cluster =
+                    FlussTestingClusterBuilder::new_with_cluster_conf("test_table", &cluster_conf)
+                        .with_remote_data_dir(temp_dir)
+                        .build()
+                        .await;
+                let mut guard = cluster_guard.write();
+                *guard = Some(cluster);
+            });
+        })
+        .join()
+        .expect("Failed to create cluster");
+
+        // Wait 20 seconds after startup to avoid errors such as
+        // "CoordinatorEventProcessor is not initialized yet".
+        sleep(Duration::from_secs(20));
+    }
+
+    fn after_all() {
+        // Create a new tokio runtime in a separate thread
+        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
+        thread::spawn(move || {
+            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
+            rt.block_on(async {
+                let mut guard = cluster_guard.write();
+                if let Some(cluster) = guard.take() {
+                    cluster.stop().await;
+                }
+            });
+        })
+        .join()
+        .expect("Failed to cleanup cluster");
+    }
+
+    #[tokio::test]
+    async fn test_scan_remote_log() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new(
+            "fluss".to_string(),
+            "test_append_record_batch_and_scan".to_string(),
+        );
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("c1", DataTypes::int())
+                    .column("c2", DataTypes::string())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .property("table.log.arrow.compression.type", "NONE")
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer();
+
+        // append 20 rows, there must be some tiered to remote
+        let record_count = 20;
+        for i in 0..record_count {
+            let mut row = GenericRow::new();
+            row.set_field(0, i as i32);
+            let v = format!("v{}", i);
+            row.set_field(1, v.as_str());
+            append_writer
+                .append(row)
+                .await
+                .expect("Failed to append row");
+        }
+
+        // Create a log scanner and subscribe to all buckets to read appended records
+        let num_buckets = table.table_info().get_num_buckets();
+        let log_scanner = table
+            .new_scan()
+            .create_log_scanner()
+            .expect("Failed to create log scanner");
+        for bucket_id in 0..num_buckets {
+            log_scanner
+                .subscribe(bucket_id, 0)
+                .await
+                .expect("Failed to subscribe");
+        }
+
+        let mut records = Vec::with_capacity(record_count);
+        let start = std::time::Instant::now();
+        const MAX_WAIT_DURATION: Duration = Duration::from_secs(30);
+        while records.len() < record_count {
+            if start.elapsed() > MAX_WAIT_DURATION {
+                panic!(
+                    "Timed out waiting for {} records; only got {} after {:?}",
+                    record_count,
+                    records.len(),
+                    start.elapsed()
+                );
+            }
+            let scan_records = log_scanner
+                .poll(Duration::from_secs(1))
+                .await
+                .expect("Failed to poll log scanner");
+            records.extend(scan_records);
+        }
+
+        // then, check the data
+        for (i, record) in records.iter().enumerate() {
+            let row = record.row();
+            let expected_c1 = i as i32;
+            let expected_c2 = format!("v{}", i);
+            assert_eq!(row.get_int(0), expected_c1, "c1 mismatch at index {}", i);
+            assert_eq!(row.get_string(1), expected_c2, "c2 mismatch at index {}", i);
+        }
+    }
+
+    fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
+        let cluster_guard = SHARED_FLUSS_CLUSTER.read();
+        if cluster_guard.is_none() {
+            panic!("Fluss cluster not initialized. Make sure before_all() was called.");
+        }
+        Arc::new(cluster_guard.as_ref().unwrap().clone())
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/test_fluss.rs b/fluss-rust/crates/fluss/tests/test_fluss.rs
index a15ca2395a..65111af218 100644
--- a/fluss-rust/crates/fluss/tests/test_fluss.rs
+++ b/fluss-rust/crates/fluss/tests/test_fluss.rs
@@ -25,4 +25,6 @@ mod integration {
     mod table;
 
     mod utils;
+
+    mod table_remote_scan;
 }

From 5b31e28a9f3c68393db11ed51f32a6e4752fe2b2 Mon Sep 17 00:00:00 2001
From: tison <wander4096@gmail.com>
Date: Mon, 15 Dec 2025 10:41:45 +0800
Subject: [PATCH 033/287] chore: upgrade opendal and adopt jiff (#95)

Signed-off-by: tison <wander4096@gmail.com>
---
 fluss-rust/Cargo.toml                         |  4 +--
 fluss-rust/bindings/python/Cargo.toml         |  3 +--
 fluss-rust/bindings/python/src/lib.rs         |  5 ++--
 fluss-rust/crates/fluss/Cargo.toml            | 13 +++++-----
 fluss-rust/crates/fluss/{src => }/build.rs    |  0
 fluss-rust/crates/fluss/src/io/file_io.rs     |  6 ++---
 fluss-rust/crates/fluss/src/row/datum.rs      | 25 +++++++++----------
 .../crates/fluss/tests/integration/admin.rs   |  7 +++---
 .../crates/fluss/tests/integration/table.rs   |  6 ++---
 .../tests/integration/table_remote_scan.rs    |  6 ++---
 10 files changed, 37 insertions(+), 38 deletions(-)
 rename fluss-rust/crates/fluss/{src => }/build.rs (100%)

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index b4ac03b7be..284a836349 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -19,13 +19,11 @@
 categories = ["command-line-utilities"]
 description = "The rust implementation of fluss"
 repository = "https://github.com/apache/fluss-rust"
-name = "fluss"
 edition = "2024"
 version = "0.1.0"
 license = "Apache-2.0"
 rust-version = "1.85"
 
-
 [workspace]
 resolver = "2"
 members = ["crates/fluss", "crates/examples", "bindings/python", "bindings/cpp"]
@@ -35,4 +33,4 @@ fluss = { version = "0.1.0", path = "./crates/fluss" }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
 arrow = { version = "57.0.0", features = ["ipc_compression"] }
-chrono = { version = "0.4", features = ["clock", "std", "wasmbind"] }
+jiff = { version = "0.2" }
diff --git a/fluss-rust/bindings/python/Cargo.toml b/fluss-rust/bindings/python/Cargo.toml
index 9ecc6299cd..4da8bf835e 100644
--- a/fluss-rust/bindings/python/Cargo.toml
+++ b/fluss-rust/bindings/python/Cargo.toml
@@ -35,5 +35,4 @@ arrow-pyarrow = "57.0.0"
 arrow-schema = "57.0.0"
 arrow-array = "57.0.0"
 pyo3-async-runtimes = { version = "0.26.0", features = ["tokio-runtime"] }
-chrono = { workspace = true }
-once_cell = "1.21.3"
+jiff = { workspace = true }
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 63e84b1f86..49d51794ca 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -15,8 +15,9 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use std::sync::LazyLock;
+
 pub use ::fluss as fcore;
-use once_cell::sync::Lazy;
 use pyo3::prelude::*;
 use tokio::runtime::Runtime;
 
@@ -36,7 +37,7 @@ pub use metadata::*;
 pub use table::*;
 pub use utils::*;
 
-static TOKIO_RUNTIME: Lazy<Runtime> = Lazy::new(|| {
+static TOKIO_RUNTIME: LazyLock<Runtime> = LazyLock::new(|| {
     tokio::runtime::Builder::new_multi_thread()
         .enable_all()
         .build()
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 4547b9c327..54235c4107 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -20,7 +20,6 @@ edition = { workspace = true }
 rust-version = { workspace = true }
 version = { workspace = true }
 name = "fluss"
-build = "src/build.rs"
 
 [features]
 default = ["storage-memory", "storage-fs"]
@@ -52,18 +51,20 @@ rust_decimal = "1"
 ordered-float = { version = "4", features = ["serde"] }
 parse-display = "0.10"
 ref-cast = "1.0"
-chrono = { workspace = true }
-opendal = "0.53.3"
+jiff = { workspace = true }
+opendal = "0.55.0"
 url = "2.5.7"
 async-trait = "0.1.89"
 uuid = { version = "1.10", features = ["v4"] }
-tempfile= "3.23.0"
+tempfile = "3.23.0"
+
+[target.'cfg(target_arch = "wasm32")'.dependencies]
+jiff = { workspace = true, features = ["js"] }
 
 [dev-dependencies]
 testcontainers = "0.25.0"
-once_cell = "1.19"
 test-env-helpers = "0.2.2"
 
 
 [build-dependencies]
-prost-build = {  version = "0.13.5"  }
+prost-build = { version = "0.13.5" }
diff --git a/fluss-rust/crates/fluss/src/build.rs b/fluss-rust/crates/fluss/build.rs
similarity index 100%
rename from fluss-rust/crates/fluss/src/build.rs
rename to fluss-rust/crates/fluss/build.rs
diff --git a/fluss-rust/crates/fluss/src/io/file_io.rs b/fluss-rust/crates/fluss/src/io/file_io.rs
index 69a4c9707f..96be06f019 100644
--- a/fluss-rust/crates/fluss/src/io/file_io.rs
+++ b/fluss-rust/crates/fluss/src/io/file_io.rs
@@ -22,7 +22,7 @@ use std::ops::Range;
 use std::sync::Arc;
 
 use bytes::Bytes;
-use chrono::{DateTime, Utc};
+use jiff::Timestamp;
 use opendal::Operator;
 
 use url::Url;
@@ -132,7 +132,7 @@ impl InputFile {
             size: meta.content_length(),
             is_dir: meta.is_dir(),
             path: self.path.clone(),
-            last_modified: meta.last_modified(),
+            last_modified: meta.last_modified().map(Into::into),
         })
     }
 
@@ -154,5 +154,5 @@ pub struct FileStatus {
     pub size: u64,
     pub is_dir: bool,
     pub path: String,
-    pub last_modified: Option<DateTime<Utc>>,
+    pub last_modified: Option<Timestamp>,
 }
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 3e487039b3..6929b57c5c 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -15,15 +15,13 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use chrono::Datelike;
-
 use crate::error::Error::RowConvertError;
 use crate::error::Result;
 use arrow::array::{
     ArrayBuilder, BinaryBuilder, BooleanBuilder, Float32Builder, Float64Builder, Int8Builder,
     Int16Builder, Int32Builder, Int64Builder, StringBuilder,
 };
-use chrono::NaiveDate;
+use jiff::ToSpan;
 use ordered_float::OrderedFloat;
 use parse_display::Display;
 use ref_cast::RefCast;
@@ -35,8 +33,6 @@ use std::ops::Deref;
 #[allow(dead_code)]
 const THIRTY_YEARS_MICROSECONDS: i64 = 946_684_800_000_000;
 
-pub const UNIX_EPOCH_DAYS: i32 = 719_163;
-
 #[derive(Debug, Clone, Display, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize)]
 pub enum Datum<'a> {
     #[display("null")]
@@ -404,6 +400,8 @@ impl From<Vec<u8>> for Blob {
     }
 }
 
+const UNIX_EPOCH_DAY: jiff::civil::Date = jiff::civil::date(1970, 1, 1);
+
 impl Date {
     pub const fn new(inner: i32) -> Self {
         Date(inner)
@@ -414,16 +412,17 @@ impl Date {
         self.0
     }
 
-    pub fn year(&self) -> i32 {
-        let date = NaiveDate::from_num_days_from_ce_opt(self.0 + UNIX_EPOCH_DAYS).unwrap();
+    pub fn year(&self) -> i16 {
+        let date = UNIX_EPOCH_DAY + self.0.days();
         date.year()
     }
-    pub fn month(&self) -> i32 {
-        let date = NaiveDate::from_num_days_from_ce_opt(self.0 + UNIX_EPOCH_DAYS).unwrap();
-        date.month() as i32
+    pub fn month(&self) -> i8 {
+        let date = UNIX_EPOCH_DAY + self.0.days();
+        date.month()
     }
-    pub fn day(&self) -> i32 {
-        let date = NaiveDate::from_num_days_from_ce_opt(self.0 + UNIX_EPOCH_DAYS).unwrap();
-        date.day() as i32
+
+    pub fn day(&self) -> i8 {
+        let date = UNIX_EPOCH_DAY + self.0.days();
+        date.day()
     }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index c51373d2cb..0086d9c03e 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -16,16 +16,17 @@
 // under the License.
 
 use crate::integration::fluss_cluster::FlussTestingCluster;
-use once_cell::sync::Lazy;
 use parking_lot::RwLock;
+
 use std::sync::Arc;
+use std::sync::LazyLock;
 
 #[cfg(test)]
 use test_env_helpers::*;
 
 // Module-level shared cluster instance (only for this test file)
-static SHARED_FLUSS_CLUSTER: Lazy<Arc<RwLock<Option<FlussTestingCluster>>>> =
-    Lazy::new(|| Arc::new(RwLock::new(None)));
+static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>> =
+    LazyLock::new(|| Arc::new(RwLock::new(None)));
 
 #[cfg(test)]
 #[before_all]
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index b23fd793cd..a058bfe0bc 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -16,17 +16,17 @@
  * limitations under the License.
  */
 
-use once_cell::sync::Lazy;
 use parking_lot::RwLock;
 use std::sync::Arc;
+use std::sync::LazyLock;
 
 use crate::integration::fluss_cluster::FlussTestingCluster;
 #[cfg(test)]
 use test_env_helpers::*;
 
 // Module-level shared cluster instance (only for this test file)
-static SHARED_FLUSS_CLUSTER: Lazy<Arc<RwLock<Option<FlussTestingCluster>>>> =
-    Lazy::new(|| Arc::new(RwLock::new(None)));
+static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>> =
+    LazyLock::new(|| Arc::new(RwLock::new(None)));
 
 #[cfg(test)]
 #[before_all]
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index f33d440f40..f52d526e37 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -16,16 +16,16 @@
  * limitations under the License.
  */
 use crate::integration::fluss_cluster::FlussTestingCluster;
-use once_cell::sync::Lazy;
 use parking_lot::RwLock;
 use std::sync::Arc;
+use std::sync::LazyLock;
 
 #[cfg(test)]
 use test_env_helpers::*;
 
 // Module-level shared cluster instance (only for this test file)
-static SHARED_FLUSS_CLUSTER: Lazy<Arc<RwLock<Option<FlussTestingCluster>>>> =
-    Lazy::new(|| Arc::new(RwLock::new(None)));
+static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>> =
+    LazyLock::new(|| Arc::new(RwLock::new(None)));
 
 #[cfg(test)]
 #[before_all]

From d634a7083c5f10efe718cd00151f7ed472164b0a Mon Sep 17 00:00:00 2001
From: tison <wander4096@gmail.com>
Date: Mon, 15 Dec 2025 14:31:17 +0800
Subject: [PATCH 034/287] chore: use log over tracing (#96)

Signed-off-by: tison <wander4096@gmail.com>
---
 fluss-rust/crates/fluss/Cargo.toml                    | 11 +++++------
 fluss-rust/crates/fluss/src/client/write/broadcast.rs |  3 +--
 fluss-rust/crates/fluss/src/io/file_io.rs             |  4 +---
 fluss-rust/crates/fluss/src/rpc/server_connection.rs  | 11 ++++++-----
 fluss-rust/crates/fluss/src/util/mod.rs               |  3 +--
 5 files changed, 14 insertions(+), 18 deletions(-)

diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 54235c4107..aa763d584e 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -37,24 +37,23 @@ futures = "0.3"
 clap = { workspace = true }
 crc32c = "0.6.8"
 linked-hash-map = "0.5.6"
-prost = "0.13.5"
+prost = "0.14"
 rand = "0.9.1"
 serde = { version = "1.0.219", features = ["derive", "rc"] }
 serde_json = "1.0.140"
-thiserror = "1.0"
-tracing = "0.1"
+thiserror = "2"
+log = { version = "0.4", features = ["kv_std"] }
 tokio = { workspace = true }
 parking_lot = "0.12"
 bytes = "1.10.1"
 dashmap = "6.1.0"
 rust_decimal = "1"
-ordered-float = { version = "4", features = ["serde"] }
+ordered-float = { version = "5", features = ["serde"] }
 parse-display = "0.10"
 ref-cast = "1.0"
 jiff = { workspace = true }
 opendal = "0.55.0"
 url = "2.5.7"
-async-trait = "0.1.89"
 uuid = { version = "1.10", features = ["v4"] }
 tempfile = "3.23.0"
 
@@ -67,4 +66,4 @@ test-env-helpers = "0.2.2"
 
 
 [build-dependencies]
-prost-build = { version = "0.13.5" }
+prost-build = { version = "0.14" }
diff --git a/fluss-rust/crates/fluss/src/client/write/broadcast.rs b/fluss-rust/crates/fluss/src/client/write/broadcast.rs
index 2dcc34cbc4..d2e7f0c91c 100644
--- a/fluss-rust/crates/fluss/src/client/write/broadcast.rs
+++ b/fluss-rust/crates/fluss/src/client/write/broadcast.rs
@@ -19,7 +19,6 @@ use parking_lot::RwLock;
 use std::sync::Arc;
 use thiserror::Error;
 use tokio::sync::Notify;
-use tracing::warn;
 
 pub type Result<T, E = Error> = std::result::Result<T, E>;
 
@@ -111,7 +110,7 @@ where
     fn drop(&mut self) {
         let mut data = self.shared.data.write();
         if data.is_none() {
-            warn!("BroadcastOnce dropped without producing");
+            log::warn!("BroadcastOnce dropped without producing");
             *data = Some(Err(Error::Dropped));
             self.shared.notify.notify_waiters();
         }
diff --git a/fluss-rust/crates/fluss/src/io/file_io.rs b/fluss-rust/crates/fluss/src/io/file_io.rs
index 96be06f019..ec3b87ec5b 100644
--- a/fluss-rust/crates/fluss/src/io/file_io.rs
+++ b/fluss-rust/crates/fluss/src/io/file_io.rs
@@ -97,12 +97,10 @@ impl FileIOBuilder {
     }
 }
 
-#[async_trait::async_trait]
 pub trait FileRead: Send + Unpin + 'static {
-    async fn read(&self, range: Range<u64>) -> Result<Bytes>;
+    fn read(&self, range: Range<u64>) -> impl Future<Output = Result<Bytes>> + Send;
 }
 
-#[async_trait::async_trait]
 impl FileRead for opendal::Reader {
     async fn read(&self, range: Range<u64>) -> Result<Bytes> {
         Ok(opendal::Reader::read(self, range).await?.to_bytes())
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index 4eeda46063..c474534b61 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -37,7 +37,6 @@ use tokio::io::{AsyncRead, AsyncWrite, AsyncWriteExt, BufStream, WriteHalf};
 use tokio::sync::Mutex as AsyncMutex;
 use tokio::sync::oneshot::{Sender, channel};
 use tokio::task::JoinHandle;
-use tracing::warn;
 
 pub type MessengerTransport = ServerConnectionInner<BufStream<Transport>>;
 
@@ -178,8 +177,10 @@ where
                         let header =
                             match ResponseHeader::read_versioned(&mut cursor, ApiVersion(0)) {
                                 Ok(header) => header,
-                                Err(e) => {
-                                    warn!(%e, "Cannot read message header, ignoring message");
+                                Err(err) => {
+                                    log::warn!(
+                                        "Cannot read message header, ignoring message: {err:?}"
+                                    );
                                     continue;
                                 }
                             };
@@ -189,8 +190,8 @@ where
                                 match map.remove(&header.request_id) {
                                     Some(active_request) => active_request,
                                     _ => {
-                                        warn!(
-                                            request_id = header.request_id,
+                                        log::warn!(
+                                            request_id:% = header.request_id;
                                             "Got response for unknown request",
                                         );
                                         continue;
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
index f93abf967b..d8c0db59d8 100644
--- a/fluss-rust/crates/fluss/src/util/mod.rs
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -22,7 +22,6 @@ use std::hash::Hash;
 use std::path::PathBuf;
 use std::sync::Arc;
 use std::time::{SystemTime, UNIX_EPOCH};
-use tracing::warn;
 
 pub fn current_time_ms() -> i64 {
     SystemTime::now()
@@ -34,7 +33,7 @@ pub fn current_time_ms() -> i64 {
 pub async fn delete_file(file_path: PathBuf) {
     tokio::fs::remove_file(&file_path)
         .await
-        .unwrap_or_else(|e| warn!("Could not delete file: {:?}, error: {:?}", &file_path, e));
+        .unwrap_or_else(|err| log::warn!("Could not delete file: {file_path:?}, error: {err:?}"));
 }
 
 pub struct FairBucketStatusMap<S> {

From 746f948837878b2c42b8b5f4394c29f4ac56fcb2 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Sat, 20 Dec 2025 11:32:10 +0800
Subject: [PATCH 035/287] feat: support s3 as remote segment (#93)

---------
Co-authored-by: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
---
 fluss-rust/Cargo.toml                         |   5 +
 fluss-rust/crates/examples/Cargo.toml         |   2 +-
 fluss-rust/crates/fluss/Cargo.toml            |  11 +-
 .../crates/fluss/src/client/credentials.rs    | 165 ++++++++++++++++++
 fluss-rust/crates/fluss/src/client/mod.rs     |   2 +
 .../fluss/src/client/table/remote_log.rs      |  69 +++++++-
 .../crates/fluss/src/client/table/scanner.rs  |   9 +
 fluss-rust/crates/fluss/src/io/mod.rs         |   7 +-
 fluss-rust/crates/fluss/src/io/storage.rs     |  16 +-
 fluss-rust/crates/fluss/src/io/storage_s3.rs  |  48 +++++
 .../crates/fluss/src/proto/fluss_api.proto    |  15 ++
 fluss-rust/crates/fluss/src/record/arrow.rs   |  67 ++++++-
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |   3 +
 .../src/rpc/message/get_security_token.rs     |  53 ++++++
 .../crates/fluss/src/rpc/message/mod.rs       |   2 +
 15 files changed, 453 insertions(+), 21 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/credentials.rs
 create mode 100644 fluss-rust/crates/fluss/src/io/storage_s3.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/get_security_token.rs

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 284a836349..4155ea84b9 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -33,4 +33,9 @@ fluss = { version = "0.1.0", path = "./crates/fluss" }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
 arrow = { version = "57.0.0", features = ["ipc_compression"] }
+chrono = { version = "0.4", features = ["clock", "std", "wasmbind"] }
+
+serde = { version = "1.0", features = ["derive"] }
+serde_json = "1.0"
+opendal = "0.53"
 jiff = { version = "0.2" }
diff --git a/fluss-rust/crates/examples/Cargo.toml b/fluss-rust/crates/examples/Cargo.toml
index dab85b66ed..e1fa531764 100644
--- a/fluss-rust/crates/examples/Cargo.toml
+++ b/fluss-rust/crates/examples/Cargo.toml
@@ -26,7 +26,7 @@ version = { workspace = true }
 [dependencies]
 fluss = { workspace = true }
 tokio = { workspace = true }
-clap = { workspace = true}
+clap = { workspace = true }
 [[example]]
 name = "example-table"
 path = "src/example_table.rs"
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index aa763d584e..0cf0364773 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -22,11 +22,12 @@ version = { workspace = true }
 name = "fluss"
 
 [features]
-default = ["storage-memory", "storage-fs"]
-storage-all = ["storage-memory", "storage-fs"]
+default = ["storage-memory", "storage-fs", "storage-s3"]
+storage-all = ["storage-memory", "storage-fs", "storage-s3"]
 
 storage-memory = ["opendal/services-memory"]
 storage-fs = ["opendal/services-fs"]
+storage-s3 = ["opendal/services-s3"]
 integration_tests = []
 
 [dependencies]
@@ -39,9 +40,9 @@ crc32c = "0.6.8"
 linked-hash-map = "0.5.6"
 prost = "0.14"
 rand = "0.9.1"
-serde = { version = "1.0.219", features = ["derive", "rc"] }
-serde_json = "1.0.140"
-thiserror = "2"
+serde = { workspace = true, features = ["rc"] }
+serde_json = { workspace = true }
+thiserror = "1.0"
 log = { version = "0.4", features = ["kv_std"] }
 tokio = { workspace = true }
 parking_lot = "0.12"
diff --git a/fluss-rust/crates/fluss/src/client/credentials.rs b/fluss-rust/crates/fluss/src/client/credentials.rs
new file mode 100644
index 0000000000..bd2a477a85
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/credentials.rs
@@ -0,0 +1,165 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::metadata::Metadata;
+use crate::error::{Error, Result};
+use crate::rpc::RpcClient;
+use crate::rpc::message::GetSecurityTokenRequest;
+use parking_lot::RwLock;
+use serde::Deserialize;
+use std::collections::HashMap;
+use std::sync::Arc;
+use std::time::{Duration, Instant};
+
+const CACHE_TTL: Duration = Duration::from_secs(3600); // max age (1 hour) of a cached token
+
+#[derive(Debug, Deserialize)] // deserialized from the JSON token bytes sent by the server
+struct Credentials {
+    access_key_id: String,
+    access_key_secret: String, // copied into CachedToken::secret_access_key
+    security_token: Option<String>, // may be absent from the JSON payload
+}
+
+struct CachedToken {
+    access_key_id: String,
+    secret_access_key: String,
+    security_token: Option<String>, // only exported to the props when present
+    addition_infos: HashMap<String, String>, // key/value pairs from the token response
+    cached_at: Instant, // compared against CACHE_TTL to decide on a refresh
+}
+
+impl CachedToken {
+    /// Flattens the cached token into the key/value properties used for remote
+    /// filesystem access: both key fields always, `security_token` only when set.
+    ///
+    /// Entries of `addition_infos` are renamed via `convert_hadoop_key_to_opendal`;
+    /// keys it does not recognise are dropped.
+    fn to_remote_fs_props(&self) -> HashMap<String, String> {
+        let mut props = HashMap::from([
+            ("access_key_id".to_string(), self.access_key_id.clone()),
+            ("secret_access_key".to_string(), self.secret_access_key.clone()),
+        ]);
+
+        if let Some(token) = self.security_token.as_ref() {
+            props.insert("security_token".to_string(), token.clone());
+        }
+
+        for (hadoop_key, raw_value) in &self.addition_infos {
+            let Some((opendal_key, invert)) = convert_hadoop_key_to_opendal(hadoop_key) else {
+                continue;
+            };
+            // An inverted flag maps "true" to "false" and any other text to "true"
+            // (path_style_access -> enable_virtual_host_style).
+            let value = if invert {
+                (raw_value != "true").to_string()
+            } else {
+                raw_value.clone()
+            };
+            props.insert(opendal_key, value);
+        }
+
+        props
+    }
+}
+
+/// Translates a Hadoop S3A option name into `(opendal_key, needs_inversion)`.
+/// `needs_inversion` is set for path_style_access -> enable_virtual_host_style.
+fn convert_hadoop_key_to_opendal(hadoop_key: &str) -> Option<(String, bool)> {
+    let (opendal_key, needs_inversion) = match hadoop_key {
+        "fs.s3a.endpoint" => ("endpoint", false),
+        "fs.s3a.endpoint.region" => ("region", false),
+        "fs.s3a.path.style.access" => ("enable_virtual_host_style", true),
+        _ => return None, // "fs.s3a.connection.ssl.enabled" and every other key are ignored
+    };
+    Some((opendal_key.to_string(), needs_inversion))
+}
+
+pub struct CredentialsCache {
+    inner: RwLock<Option<CachedToken>>, // None until a non-empty token has been fetched
+}
+
+impl CredentialsCache {
+    pub fn new() -> Self {
+        Self {
+            inner: RwLock::new(None), // nothing cached yet
+        }
+    }
+
+    pub async fn get_or_refresh(
+        &self,
+        rpc_client: &Arc<RpcClient>,
+        metadata: &Arc<Metadata>,
+    ) -> Result<HashMap<String, String>> {
+        {
+            let guard = self.inner.read(); // released at block end, before the await
+            if let Some(cached) = guard.as_ref() {
+                if cached.cached_at.elapsed() < CACHE_TTL {
+                    return Ok(cached.to_remote_fs_props()); // entry is younger than CACHE_TTL
+                }
+            }
+        }
+
+        self.refresh_from_server(rpc_client, metadata).await // nothing cached, or entry too old
+    }
+
+    async fn refresh_from_server(
+        &self,
+        rpc_client: &Arc<RpcClient>,
+        metadata: &Arc<Metadata>,
+    ) -> Result<HashMap<String, String>> {
+        let cluster = metadata.get_cluster();
+        let server_node = cluster.get_one_available_server();
+        let conn = rpc_client.get_connection(server_node).await?;
+
+        let request = GetSecurityTokenRequest::new();
+        let response = conn.request(request).await?;
+
+        // An empty token means the remote filesystem needs no credentials. This
+        // result is not stored in the cache, so the next call asks the server again.
+        if response.token.is_empty() {
+            return Ok(HashMap::new());
+        }
+
+        let credentials: Credentials = serde_json::from_slice(&response.token).map_err(|e| {
+            Error::JsonSerdeError(format!("Error when parse token from server: {e}"))
+        })?;
+
+        let mut addition_infos = HashMap::new();
+        for kv in &response.addition_info {
+            addition_infos.insert(kv.key.clone(), kv.value.clone()); // server-provided extras
+        }
+
+        let cached = CachedToken {
+            access_key_id: credentials.access_key_id,
+            secret_access_key: credentials.access_key_secret,
+            security_token: credentials.security_token,
+            addition_infos,
+            cached_at: Instant::now(), // cache age is measured from here
+        };
+
+        let props = cached.to_remote_fs_props(); // built before `cached` is moved below
+        *self.inner.write() = Some(cached); // replaces any previously cached token
+
+        Ok(props)
+    }
+}
+
+impl Default for CredentialsCache {
+    fn default() -> Self {
+        CredentialsCache::new() // same as an explicitly constructed, empty cache
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/mod.rs b/fluss-rust/crates/fluss/src/client/mod.rs
index a971439258..cff218b345 100644
--- a/fluss-rust/crates/fluss/src/client/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/mod.rs
@@ -17,12 +17,14 @@
 
 mod admin;
 mod connection;
+mod credentials;
 mod metadata;
 mod table;
 mod write;
 
 pub use admin::*;
 pub use connection::*;
+pub use credentials::*;
 pub use metadata::*;
 pub use table::*;
 pub use write::*;
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index 65805d069b..a2561f3925 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -20,6 +20,7 @@ use crate::metadata::TableBucket;
 use crate::proto::{PbRemoteLogFetchInfo, PbRemoteLogSegment};
 use crate::record::{LogRecordsBatchs, ReadContext, ScanRecord};
 use crate::util::delete_file;
+use parking_lot::RwLock;
 use std::collections::HashMap;
 use std::io;
 use std::path::{Path, PathBuf};
@@ -115,11 +116,19 @@ impl RemoteLogDownloadFuture {
 /// Downloader for remote log segment files
 pub struct RemoteLogDownloader {
     local_log_dir: TempDir,
+    remote_fs_props: RwLock<HashMap<String, String>>,
 }
 
 impl RemoteLogDownloader {
     pub fn new(local_log_dir: TempDir) -> Result<Self> {
-        Ok(Self { local_log_dir })
+        Ok(Self {
+            local_log_dir,
+            remote_fs_props: RwLock::new(HashMap::new()),
+        })
+    }
+
+    pub fn set_remote_fs_props(&self, props: HashMap<String, String>) {
+        *self.remote_fs_props.write() = props;
     }
 
     /// Request to fetch a remote log segment to local. This method is non-blocking.
@@ -133,10 +142,16 @@ impl RemoteLogDownloader {
         let local_file_path = self.local_log_dir.path().join(&local_file_name);
         let remote_path = self.build_remote_path(remote_log_tablet_dir, segment);
         let remote_log_tablet_dir = remote_log_tablet_dir.to_string();
+        let remote_fs_props = self.remote_fs_props.read().clone();
         // Spawn async download task
         tokio::spawn(async move {
-            let result =
-                Self::download_file(&remote_log_tablet_dir, &remote_path, &local_file_path).await;
+            let result = Self::download_file(
+                &remote_log_tablet_dir,
+                &remote_path,
+                &local_file_path,
+                &remote_fs_props,
+            )
+            .await;
             let _ = sender.send(result);
         });
         Ok(RemoteLogDownloadFuture::new(receiver))
@@ -157,6 +172,7 @@ impl RemoteLogDownloader {
         remote_log_tablet_dir: &str,
         remote_path: &str,
         local_path: &Path,
+        remote_fs_props: &HashMap<String, String>,
     ) -> Result<PathBuf> {
         // Handle both URL (e.g., "s3://bucket/path") and local file paths
         // If the path doesn't contain "://", treat it as a local file path
@@ -169,11 +185,27 @@ impl RemoteLogDownloader {
         // Create FileIO from the remote log tablet dir URL to get the storage
         let file_io_builder = FileIO::from_url(&remote_log_tablet_dir_url)?;
 
+        // For S3/S3A URLs, inject S3 credentials from props
+        let file_io_builder = if remote_log_tablet_dir.starts_with("s3://")
+            || remote_log_tablet_dir.starts_with("s3a://")
+        {
+            file_io_builder.with_props(
+                remote_fs_props
+                    .iter()
+                    .map(|(k, v)| (k.as_str(), v.as_str())),
+            )
+        } else {
+            file_io_builder
+        };
+
         // Build storage and create operator directly
         let storage = Storage::build(file_io_builder)?;
         let (op, relative_path) = storage.create(remote_path)?;
 
-        // Get file metadata to know the size
+        // Timeout for remote storage operations (30 seconds)
+        const REMOTE_OP_TIMEOUT: std::time::Duration = std::time::Duration::from_secs(30);
+
+        // Get file metadata to know the size (NOTE: no timeout is applied to this call yet)
         let meta = op.stat(relative_path).await?;
         let file_size = meta.content_length();
 
@@ -184,13 +216,32 @@ impl RemoteLogDownloader {
         // opendal::Reader::read accepts a range, so we read in chunks
         const CHUNK_SIZE: u64 = 8 * 1024 * 1024; // 8MB chunks for efficient reading
         let mut offset = 0u64;
+        let mut chunk_count = 0u64;
+        let total_chunks = file_size.div_ceil(CHUNK_SIZE);
 
         while offset < file_size {
             let end = std::cmp::min(offset + CHUNK_SIZE, file_size);
             let range = offset..end;
-
-            // Read chunk from remote storage
-            let chunk = op.read_with(relative_path).range(range.clone()).await?;
+            chunk_count += 1;
+
+            if chunk_count <= 3 || chunk_count % 10 == 0 {
+                log::debug!(
+                    "Remote log download: reading chunk {chunk_count}/{total_chunks} (offset {offset})"
+                );
+            }
+
+            // Read chunk from remote storage with timeout
+            let read_future = op.read_with(relative_path).range(range.clone());
+            let chunk = tokio::time::timeout(REMOTE_OP_TIMEOUT, read_future)
+                .await
+                .map_err(|_| {
+                    Error::Io(io::Error::new(
+                        io::ErrorKind::TimedOut,
+                        format!(
+                            "Timeout reading chunk from remote storage: {remote_path} at offset {offset}"
+                        ),
+                    ))
+                })??;
             let bytes = chunk.to_bytes();
 
             // Write chunk to local file
@@ -254,10 +305,10 @@ impl RemotePendingFetch {
         // delete the downloaded local file to free disk
         delete_file(file_path).await;
 
-        // Parse log records
+        // Parse log records (remote log contains full data, need client-side projection)
         let mut fetch_records = vec![];
         for log_record in &mut LogRecordsBatchs::new(data) {
-            fetch_records.extend(log_record.records(&self.read_context)?);
+            fetch_records.extend(log_record.records_for_remote_log(&self.read_context)?);
         }
 
         let mut result = HashMap::new();
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index f6780d715c..f66d7d7a14 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 use crate::client::connection::FlussConnection;
+use crate::client::credentials::CredentialsCache;
 use crate::client::metadata::Metadata;
 use crate::error::{Error, Result};
 use crate::metadata::{TableBucket, TableInfo, TablePath};
@@ -194,6 +195,7 @@ struct LogFetcher {
     log_scanner_status: Arc<LogScannerStatus>,
     read_context: ReadContext,
     remote_log_downloader: RemoteLogDownloader,
+    credentials_cache: CredentialsCache,
 }
 
 impl LogFetcher {
@@ -217,6 +219,7 @@ impl LogFetcher {
             log_scanner_status,
             read_context,
             remote_log_downloader: RemoteLogDownloader::new(tmp_dir)?,
+            credentials_cache: CredentialsCache::new(),
         })
     }
 
@@ -256,6 +259,12 @@ impl LogFetcher {
                     if let Some(ref remote_log_fetch_info) =
                         fetch_log_for_bucket.remote_log_fetch_info
                     {
+                        let remote_fs_props = self
+                            .credentials_cache
+                            .get_or_refresh(&self.conns, &self.metadata)
+                            .await?;
+                        self.remote_log_downloader
+                            .set_remote_fs_props(remote_fs_props);
                         let remote_fetch_info = RemoteLogFetchInfo::from_proto(
                             remote_log_fetch_info,
                             table_bucket.clone(),
diff --git a/fluss-rust/crates/fluss/src/io/mod.rs b/fluss-rust/crates/fluss/src/io/mod.rs
index 3c9a1659e4..a03a394529 100644
--- a/fluss-rust/crates/fluss/src/io/mod.rs
+++ b/fluss-rust/crates/fluss/src/io/mod.rs
@@ -27,8 +27,13 @@ pub use storage::*;
 mod storage_fs;
 #[cfg(feature = "storage-fs")]
 use storage_fs::*;
+
 #[cfg(feature = "storage-memory")]
 mod storage_memory;
-
 #[cfg(feature = "storage-memory")]
 use storage_memory::*;
+
+#[cfg(feature = "storage-s3")]
+mod storage_s3;
+#[cfg(feature = "storage-s3")]
+use storage_s3::*;
diff --git a/fluss-rust/crates/fluss/src/io/storage.rs b/fluss-rust/crates/fluss/src/io/storage.rs
index 361da7ee80..089670e24c 100644
--- a/fluss-rust/crates/fluss/src/io/storage.rs
+++ b/fluss-rust/crates/fluss/src/io/storage.rs
@@ -19,6 +19,7 @@ use crate::error;
 use crate::error::Result;
 use crate::io::FileIOBuilder;
 use opendal::{Operator, Scheme};
+use std::collections::HashMap;
 
 /// The storage carries all supported storage services in fluss
 #[derive(Debug)]
@@ -27,11 +28,13 @@ pub enum Storage {
     Memory,
     #[cfg(feature = "storage-fs")]
     LocalFs,
+    #[cfg(feature = "storage-s3")]
+    S3 { props: HashMap<String, String> },
 }
 
 impl Storage {
     pub(crate) fn build(file_io_builder: FileIOBuilder) -> Result<Self> {
-        let (scheme_str, _) = file_io_builder.into_parts();
+        let (scheme_str, props) = file_io_builder.into_parts();
         let scheme = Self::parse_scheme(&scheme_str)?;
 
         match scheme {
@@ -39,6 +42,8 @@ impl Storage {
             Scheme::Memory => Ok(Self::Memory),
             #[cfg(feature = "storage-fs")]
             Scheme::Fs => Ok(Self::LocalFs),
+            #[cfg(feature = "storage-s3")]
+            Scheme::S3 => Ok(Self::S3 { props }),
             _ => Err(error::Error::IoUnsupported(
                 "Unsupported storage feature".to_string(),
             )),
@@ -66,6 +71,14 @@ impl Storage {
                     Ok((op, &path[1..]))
                 }
             }
+            #[cfg(feature = "storage-s3")]
+            Storage::S3 { props } => {
+                let (bucket, key) = super::parse_s3_path(path);
+                let mut s3_props = props.clone();
+                s3_props.insert("bucket".to_string(), bucket.to_string());
+                let op = super::s3_config_build(&s3_props)?;
+                Ok((op, key))
+            }
         }
     }
 
@@ -73,6 +86,7 @@ impl Storage {
         match scheme {
             "memory" => Ok(Scheme::Memory),
             "file" | "" => Ok(Scheme::Fs),
+            "s3" | "s3a" => Ok(Scheme::S3),
             s => Ok(s.parse::<Scheme>()?),
         }
     }
diff --git a/fluss-rust/crates/fluss/src/io/storage_s3.rs b/fluss-rust/crates/fluss/src/io/storage_s3.rs
new file mode 100644
index 0000000000..8000d091dd
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/io/storage_s3.rs
@@ -0,0 +1,48 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Result;
+use opendal::Configurator;
+use opendal::Operator;
+use opendal::layers::TimeoutLayer;
+use opendal::services::S3Config;
+use std::collections::HashMap;
+use std::time::Duration;
+
+pub(crate) fn s3_config_build(props: &HashMap<String, String>) -> Result<Operator> {
+    let config = S3Config::from_iter(props.clone())?;
+    let op = Operator::from_config(config)?.finish();
+
+    // Add timeout layer to prevent hanging on S3 operations
+    let timeout_layer = TimeoutLayer::new()
+        .with_timeout(Duration::from_secs(10))
+        .with_io_timeout(Duration::from_secs(30));
+
+    Ok(op.layer(timeout_layer))
+}
+
+pub(crate) fn parse_s3_path(path: &str) -> (&str, &str) {
+    let path = path
+        .strip_prefix("s3a://")
+        .or_else(|| path.strip_prefix("s3://"))
+        .unwrap_or(path);
+
+    match path.find('/') {
+        Some(idx) => (&path[..idx], &path[idx + 1..]),
+        None => (path, ""),
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index ef460fc559..e59c2d9dd6 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -297,4 +297,19 @@ message PbLakeSnapshotForBucket {
   optional int64 partition_id = 1;
   required int32 bucket_id = 2;
   optional int64 log_offset = 3;
+}
+
+message PbKeyValue {
+  required string key = 1;
+  required string value = 2;
+}
+
+message GetFileSystemSecurityTokenRequest {
+}
+
+message GetFileSystemSecurityTokenResponse {
+  required string schema = 1;
+  required bytes token = 2;
+  optional int64 expiration_time = 3;
+  repeated PbKeyValue addition_info = 4;
 }
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 806c9a5824..f079f09dfb 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -504,6 +504,30 @@ impl<'a> LogRecordBatch<'a> {
         };
         Ok(log_record_iterator)
     }
+
+    pub fn records_for_remote_log(&self, read_context: &ReadContext) -> Result<LogRecordIterator> {
+        if self.record_count() == 0 {
+            return Ok(LogRecordIterator::empty());
+        }
+
+        let data = &self.data[RECORDS_OFFSET..];
+
+        let record_batch = read_context.record_batch_for_remote_log(data)?;
+        let log_record_iterator = match record_batch {
+            None => LogRecordIterator::empty(),
+            Some(record_batch) => {
+                let arrow_reader = ArrowReader::new(Arc::new(record_batch));
+                LogRecordIterator::Arrow(ArrowLogRecordIterator {
+                    reader: arrow_reader,
+                    base_offset: self.base_log_offset(),
+                    timestamp: self.commit_timestamp(),
+                    row_id: 0,
+                    change_type: ChangeType::AppendOnly,
+                })
+            }
+        };
+        Ok(log_record_iterator)
+    }
 }
 
 /// Parse an Arrow IPC message from a byte slice.
@@ -552,7 +576,8 @@ fn parse_ipc_message(
     let message = root_as_message(metadata_bytes).ok()?;
     let batch_metadata = message.header_as_record_batch()?;
 
-    let body_start = 8 + metadata_size;
+    let metadata_padded_size = (metadata_size + 7) & !7;
+    let body_start = 8 + metadata_padded_size;
     let body_data = &data[body_start..];
     let body_buffer = Buffer::from(body_data);
 
@@ -677,7 +702,7 @@ pub fn to_arrow_type(fluss_type: &DataType) -> ArrowDataType {
 #[derive(Clone)]
 pub struct ReadContext {
     target_schema: SchemaRef,
-
+    full_schema: SchemaRef,
     projection: Option<Projection>,
 }
 
@@ -694,7 +719,8 @@ struct Projection {
 impl ReadContext {
     pub fn new(arrow_schema: SchemaRef) -> ReadContext {
         ReadContext {
-            target_schema: arrow_schema,
+            target_schema: arrow_schema.clone(),
+            full_schema: arrow_schema,
             projection: None,
         }
     }
@@ -730,7 +756,10 @@ impl ReadContext {
                 }
             } else {
                 Projection {
-                    ordered_schema: Self::project_schema(arrow_schema, projected_fields.as_slice()),
+                    ordered_schema: Self::project_schema(
+                        arrow_schema.clone(),
+                        projected_fields.as_slice(),
+                    ),
                     ordered_fields: projected_fields.clone(),
                     projected_fields,
                     reordering_indexes: vec![],
@@ -741,6 +770,7 @@ impl ReadContext {
 
         ReadContext {
             target_schema,
+            full_schema: arrow_schema,
             projection: Some(project),
         }
     }
@@ -809,6 +839,35 @@ impl ReadContext {
         };
         Ok(Some(record_batch))
     }
+
+    pub fn record_batch_for_remote_log(&self, data: &[u8]) -> Result<Option<RecordBatch>> {
+        let (batch_metadata, body_buffer, version) = match parse_ipc_message(data) {
+            Some(result) => result,
+            None => return Ok(None),
+        };
+
+        let record_batch = read_record_batch(
+            &body_buffer,
+            batch_metadata,
+            self.full_schema.clone(),
+            &std::collections::HashMap::new(),
+            None,
+            &version,
+        )?;
+
+        let record_batch = match &self.projection {
+            Some(projection) => {
+                let projected_columns: Vec<_> = projection
+                    .projected_fields
+                    .iter()
+                    .map(|&idx| record_batch.column(idx).clone())
+                    .collect();
+                RecordBatch::try_new(self.target_schema.clone(), projected_columns)?
+            }
+            None => record_batch,
+        };
+        Ok(Some(record_batch))
+    }
 }
 
 pub enum LogRecordIterator {
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index 215bb39389..b11647f960 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -32,6 +32,7 @@ pub enum ApiKey {
     ProduceLog,
     FetchLog,
     ListOffsets,
+    GetFileSystemSecurityToken,
     GetDatabaseInfo,
     GetLatestLakeSnapshot,
     Unknown(i16),
@@ -53,6 +54,7 @@ impl From<i16> for ApiKey {
             1014 => ApiKey::ProduceLog,
             1015 => ApiKey::FetchLog,
             1021 => ApiKey::ListOffsets,
+            1025 => ApiKey::GetFileSystemSecurityToken,
             1032 => ApiKey::GetLatestLakeSnapshot,
             1035 => ApiKey::GetDatabaseInfo,
             _ => Unknown(key),
@@ -76,6 +78,7 @@ impl From<ApiKey> for i16 {
             ApiKey::ProduceLog => 1014,
             ApiKey::FetchLog => 1015,
             ApiKey::ListOffsets => 1021,
+            ApiKey::GetFileSystemSecurityToken => 1025,
             ApiKey::GetLatestLakeSnapshot => 1032,
             ApiKey::GetDatabaseInfo => 1035,
             Unknown(x) => x,
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_security_token.rs b/fluss-rust/crates/fluss/src/rpc/message/get_security_token.rs
new file mode 100644
index 0000000000..7995232d1a
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_security_token.rs
@@ -0,0 +1,53 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::{GetFileSystemSecurityTokenRequest, GetFileSystemSecurityTokenResponse};
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug)]
+pub struct GetSecurityTokenRequest {
+    pub inner_request: GetFileSystemSecurityTokenRequest,
+}
+
+impl GetSecurityTokenRequest {
+    pub fn new() -> Self {
+        Self {
+            inner_request: GetFileSystemSecurityTokenRequest {},
+        }
+    }
+}
+
+impl Default for GetSecurityTokenRequest {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+impl RequestBody for GetSecurityTokenRequest {
+    type ResponseBody = GetFileSystemSecurityTokenResponse;
+    const API_KEY: ApiKey = ApiKey::GetFileSystemSecurityToken;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(GetSecurityTokenRequest);
+impl_read_version_type!(GetFileSystemSecurityTokenResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 230d971a49..0ed5b7c0e6 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -28,6 +28,7 @@ mod drop_table;
 mod fetch;
 mod get_database_info;
 mod get_latest_lake_snapshot;
+mod get_security_token;
 mod get_table;
 mod header;
 mod list_databases;
@@ -45,6 +46,7 @@ pub use drop_table::*;
 pub use fetch::*;
 pub use get_database_info::*;
 pub use get_latest_lake_snapshot::*;
+pub use get_security_token::*;
 pub use get_table::*;
 pub use header::*;
 pub use list_databases::*;

From 57ebe0c49e70f4a1fd63631c9010d4f93079d81d Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sat, 20 Dec 2025 03:37:01 +0000
Subject: [PATCH 036/287] chore: parse_ipc_message should return an error
 instead of None when parsing fails (#97)

---------

Co-authored-by: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
---
 fluss-rust/crates/fluss/src/error.rs        |   2 +-
 fluss-rust/crates/fluss/src/record/arrow.rs | 112 +++++++++++++++-----
 2 files changed, 84 insertions(+), 30 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index b1d5d13b6e..63438b1966 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -39,7 +39,7 @@ pub enum Error {
     #[error("Row convert error")]
     RowConvertError(String),
 
-    #[error("arrow error")]
+    #[error("Arrow error: {0}")]
     ArrowError(#[from] ArrowError),
 
     #[error("Write error: {0}")]
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index f079f09dfb..6e8cb55962 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -34,6 +34,7 @@ use arrow::{
         writer::StreamWriter,
     },
 };
+use arrow_schema::ArrowError::ParseError;
 use arrow_schema::SchemaRef;
 use arrow_schema::{DataType as ArrowDataType, Field};
 use byteorder::WriteBytesExt;
@@ -489,19 +490,15 @@ impl<'a> LogRecordBatch<'a> {
         let data = &self.data[RECORDS_OFFSET..];
 
         let record_batch = read_context.record_batch(data)?;
-        let log_record_iterator = match record_batch {
-            None => LogRecordIterator::empty(),
-            Some(record_batch) => {
-                let arrow_reader = ArrowReader::new(Arc::new(record_batch));
-                LogRecordIterator::Arrow(ArrowLogRecordIterator {
-                    reader: arrow_reader,
-                    base_offset: self.base_log_offset(),
-                    timestamp: self.commit_timestamp(),
-                    row_id: 0,
-                    change_type: ChangeType::AppendOnly,
-                })
-            }
-        };
+        let arrow_reader = ArrowReader::new(Arc::new(record_batch));
+        let log_record_iterator = LogRecordIterator::Arrow(ArrowLogRecordIterator {
+            reader: arrow_reader,
+            base_offset: self.base_log_offset(),
+            timestamp: self.commit_timestamp(),
+            row_id: 0,
+            change_type: ChangeType::AppendOnly,
+        });
+
         Ok(log_record_iterator)
     }
 
@@ -542,15 +539,16 @@ impl<'a> LogRecordBatch<'a> {
 /// * `data` - The byte slice containing the IPC message.
 ///
 /// # Returns
-/// Returns `Some((batch_metadata, body_buffer, version))` on success:
+/// Returns `Ok((batch_metadata, body_buffer, version))` on success:
 /// - `batch_metadata`: The RecordBatch metadata from the IPC message.
 /// - `body_buffer`: The buffer containing the record batch body data.
 /// - `version`: The Arrow IPC metadata version.
 ///
-/// Returns `None` if the data is malformed or too short.
+/// Returns `Err(arrow_error)` on errors
+/// - `arrow_error`: Error details e.g. malformed, too short or bad continuation marker.
 fn parse_ipc_message(
     data: &[u8],
-) -> Option<(
+) -> Result<(
     arrow::ipc::RecordBatch<'_>,
     Buffer,
     arrow::ipc::MetadataVersion,
@@ -558,30 +556,38 @@ fn parse_ipc_message(
     const CONTINUATION_MARKER: u32 = 0xFFFFFFFF;
 
     if data.len() < 8 {
-        return None;
+        Err(ParseError(format!("Invalid data length: {}", data.len())))?
     }
 
     let continuation = LittleEndian::read_u32(&data[0..4]);
     let metadata_size = LittleEndian::read_u32(&data[4..8]) as usize;
 
     if continuation != CONTINUATION_MARKER {
-        return None;
+        Err(ParseError(format!(
+            "Invalid continuation marker: {continuation}"
+        )))?
     }
 
     if data.len() < 8 + metadata_size {
-        return None;
+        Err(ParseError(format!(
+            "Invalid data length. Remaining data length {} is shorter than specified size {}",
+            data.len() - 8,
+            metadata_size
+        )))?
     }
 
     let metadata_bytes = &data[8..8 + metadata_size];
-    let message = root_as_message(metadata_bytes).ok()?;
-    let batch_metadata = message.header_as_record_batch()?;
+    let message = root_as_message(metadata_bytes).map_err(|err| ParseError(err.to_string()))?;
+    let batch_metadata = message
+        .header_as_record_batch()
+        .ok_or(ParseError(String::from("Not a record batch")))?;
 
     let metadata_padded_size = (metadata_size + 7) & !7;
     let body_start = 8 + metadata_padded_size;
     let body_data = &data[body_start..];
     let body_buffer = Buffer::from(body_data);
 
-    Some((batch_metadata, body_buffer, message.version()))
+    Ok((batch_metadata, body_buffer, message.version()))
 }
 
 pub fn to_arrow_schema(fluss_schema: &DataType) -> SchemaRef {
@@ -602,7 +608,7 @@ pub fn to_arrow_schema(fluss_schema: &DataType) -> SchemaRef {
             SchemaRef::new(arrow_schema::Schema::new(fields))
         }
         _ => {
-            panic!("must be row data tyoe.")
+            panic!("must be row data type.")
         }
     }
 }
@@ -796,11 +802,8 @@ impl ReadContext {
             .map(|p| p.ordered_fields.as_slice())
     }
 
-    pub fn record_batch(&self, data: &[u8]) -> Result<Option<RecordBatch>> {
-        let (batch_metadata, body_buffer, version) = match parse_ipc_message(data) {
-            Some(result) => result,
-            None => return Ok(None),
-        };
+    pub fn record_batch(&self, data: &[u8]) -> Result<RecordBatch> {
+        let (batch_metadata, body_buffer, version) = parse_ipc_message(data)?;
 
         // the record batch from server must be ordered by field pos,
         // according to project to decide what arrow schema to use
@@ -837,7 +840,7 @@ impl ReadContext {
             }
             _ => record_batch,
         };
-        Ok(Some(record_batch))
+        Ok(record_batch)
     }
 
     pub fn record_batch_for_remote_log(&self, data: &[u8]) -> Result<Option<RecordBatch>> {
@@ -1076,4 +1079,55 @@ mod tests {
     fn test_timestamp_ltz_invalid_precision() {
         to_arrow_type(&DataTypes::timestamp_ltz_with_precision(10));
     }
+
+    #[test]
+    fn test_parse_ipc_message() {
+        let empty_body: &[u8] = &le_bytes(&[0xFFFFFFFF, 0x00000000]);
+        let result = parse_ipc_message(empty_body);
+        assert_eq!(
+            result.unwrap_err().to_string(),
+            String::from("Arrow error: Parser error: Range [0, 4) is out of bounds.\n\n")
+        );
+
+        let invalid_data = &[];
+        assert_eq!(
+            parse_ipc_message(invalid_data).unwrap_err().to_string(),
+            String::from("Arrow error: Parser error: Invalid data length: 0")
+        );
+
+        let data_with_invalid_continuation: &[u8] = &le_bytes(&[0x00000001, 0x00000000]);
+        assert_eq!(
+            parse_ipc_message(data_with_invalid_continuation)
+                .unwrap_err()
+                .to_string(),
+            String::from("Arrow error: Parser error: Invalid continuation marker: 1")
+        );
+
+        let data_with_invalid_length: &[u8] = &le_bytes(&[0xFFFFFFFF, 0x00000001]);
+        assert_eq!(
+            parse_ipc_message(data_with_invalid_length)
+                .unwrap_err()
+                .to_string(),
+            String::from(
+                "Arrow error: Parser error: Invalid data length. \
+                   Remaining data length 0 is shorter than specified size 1"
+            )
+        );
+
+        let data_with_invalid_length = &le_bytes(&[0xFFFFFFFF, 0x00000004, 0x00000000]);
+        assert_eq!(
+            parse_ipc_message(data_with_invalid_length)
+                .unwrap_err()
+                .to_string(),
+            String::from("Arrow error: Parser error: Not a record batch")
+        );
+    }
+
+    fn le_bytes(vals: &[u32]) -> Vec<u8> {
+        let mut out = Vec::with_capacity(vals.len() * 4);
+        for &v in vals {
+            out.extend_from_slice(&v.to_le_bytes());
+        }
+        out
+    }
 }

From e585d1f0aafa890f74ffb1da8aab09908345fb02 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sat, 20 Dec 2025 12:04:20 +0800
Subject: [PATCH 037/287] chore: Improve error (#77)

---
 fluss-rust/crates/fluss/Cargo.toml            |   1 +
 fluss-rust/crates/fluss/src/client/admin.rs   |  28 +-
 .../crates/fluss/src/client/credentials.rs    |   7 +-
 .../fluss/src/client/table/remote_log.rs      |  29 +-
 .../crates/fluss/src/client/table/scanner.rs  |  30 +-
 .../crates/fluss/src/client/write/mod.rs      |  10 +-
 .../crates/fluss/src/client/write/sender.rs   |  11 +-
 .../fluss/src/client/write/writer_client.rs   |  17 +-
 fluss-rust/crates/fluss/src/error.rs          | 139 +++++--
 fluss-rust/crates/fluss/src/io/file_io.rs     |   5 +-
 fluss-rust/crates/fluss/src/io/storage.rs     |   6 +-
 .../crates/fluss/src/metadata/database.rs     |  22 +-
 .../crates/fluss/src/metadata/json_serde.rs   | 179 +++++----
 fluss-rust/crates/fluss/src/metadata/table.rs |  88 +++--
 .../crates/fluss/src/proto/fluss_api.proto    |   5 +
 fluss-rust/crates/fluss/src/record/arrow.rs   |  24 +-
 fluss-rust/crates/fluss/src/row/datum.rs      |  34 +-
 fluss-rust/crates/fluss/src/rpc/error.rs      |   4 +
 .../crates/fluss/src/rpc/fluss_api_error.rs   | 371 ++++++++++++++++++
 fluss-rust/crates/fluss/src/rpc/frame.rs      |   4 +
 .../fluss/src/rpc/message/create_database.rs  |   3 +-
 .../fluss/src/rpc/message/create_table.rs     |   3 +-
 .../fluss/src/rpc/message/database_exists.rs  |   4 +-
 .../fluss/src/rpc/message/drop_database.rs    |   4 +-
 .../fluss/src/rpc/message/drop_table.rs       |   4 +-
 .../crates/fluss/src/rpc/message/fetch.rs     |   4 +-
 .../src/rpc/message/get_database_info.rs      |   4 +-
 .../rpc/message/get_latest_lake_snapshot.rs   |   4 +-
 .../crates/fluss/src/rpc/message/get_table.rs |   4 +-
 .../crates/fluss/src/rpc/message/header.rs    |  18 +-
 .../fluss/src/rpc/message/list_databases.rs   |   4 +-
 .../fluss/src/rpc/message/list_offsets.rs     |  19 +-
 .../fluss/src/rpc/message/list_tables.rs      |   4 +-
 .../crates/fluss/src/rpc/message/mod.rs       |   1 +
 .../fluss/src/rpc/message/produce_log.rs      |   4 +-
 .../fluss/src/rpc/message/table_exists.rs     |   5 +-
 .../fluss/src/rpc/message/update_metadata.rs  |   4 +-
 fluss-rust/crates/fluss/src/rpc/mod.rs        |   4 +-
 .../crates/fluss/src/rpc/server_connection.rs |  24 +-
 .../crates/fluss/tests/integration/admin.rs   |  32 ++
 .../tests/integration/table_remote_scan.rs    |  14 +-
 41 files changed, 908 insertions(+), 273 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs

diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 0cf0364773..cdba9de5a4 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -57,6 +57,7 @@ opendal = "0.55.0"
 url = "2.5.7"
 uuid = { version = "1.10", features = ["v4"] }
 tempfile = "3.23.0"
+snafu = "0.8.3"
 
 [target.'cfg(target_arch = "wasm32")'.dependencies]
 jiff = { workspace = true, features = ["js"] }
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index fefab43520..e185af84ac 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -29,7 +29,7 @@ use crate::rpc::message::{ListOffsetsRequest, OffsetSpec};
 use crate::rpc::{RpcClient, ServerConnection};
 
 use crate::BucketId;
-use crate::error::Result;
+use crate::error::{Error, Result};
 use crate::proto::GetTableInfoResponse;
 use std::collections::HashMap;
 use std::slice::from_ref;
@@ -245,10 +245,10 @@ impl FlussAdmin {
         let mut results = HashMap::new();
 
         for response_future in response_futures {
-            let offsets = response_future.await.map_err(
-                // todo: consider use suitable error
-                |e| crate::error::Error::WriteError(format!("Fail to get result: {e}")),
-            )?;
+            let offsets = response_future.await.map_err(|e| Error::UnexpectedError {
+                message: "Fail to get result for list offsets.".to_string(),
+                source: Some(Box::new(e)),
+            })?;
             results.extend(offsets?);
         }
         Ok(results)
@@ -267,10 +267,11 @@ impl FlussAdmin {
         for bucket_id in buckets {
             let table_bucket = TableBucket::new(table_id, *bucket_id);
             let leader = cluster.leader_for(&table_bucket).ok_or_else(|| {
-                // todo: consider use another suitable error
-                crate::error::Error::InvalidTableError(format!(
-                    "No leader found for table bucket: table_id={table_id}, bucket_id={bucket_id}"
-                ))
+                // todo: consider retry?
+                Error::UnexpectedError {
+                    message: format!("No leader found for table bucket: {table_bucket}."),
+                    source: None,
+                }
             })?;
 
             node_for_bucket_list
@@ -301,10 +302,11 @@ impl FlussAdmin {
             let task = tokio::spawn(async move {
                 let cluster = metadata.get_cluster();
                 let tablet_server = cluster.get_tablet_server(leader_id).ok_or_else(|| {
-                    // todo: consider use more suitable error
-                    crate::error::Error::InvalidTableError(format!(
-                        "Tablet server {leader_id} not found"
-                    ))
+                    Error::LeaderNotAvailable {
+                        message: format!(
+                            "Tablet server {leader_id} is not found in metadata cache."
+                        ),
+                    }
                 })?;
                 let connection = rpc_client.get_connection(tablet_server).await?;
                 let list_offsets_response = connection.request(request).await?;
diff --git a/fluss-rust/crates/fluss/src/client/credentials.rs b/fluss-rust/crates/fluss/src/client/credentials.rs
index bd2a477a85..6b07d08eb1 100644
--- a/fluss-rust/crates/fluss/src/client/credentials.rs
+++ b/fluss-rust/crates/fluss/src/client/credentials.rs
@@ -134,9 +134,10 @@ impl CredentialsCache {
             return Ok(HashMap::new());
         }
 
-        let credentials: Credentials = serde_json::from_slice(&response.token).map_err(|e| {
-            Error::JsonSerdeError(format!("Error when parse token from server: {e}"))
-        })?;
+        let credentials: Credentials =
+            serde_json::from_slice(&response.token).map_err(|e| Error::JsonSerdeError {
+                message: format!("Error when parse token from server: {e}"),
+            })?;
 
         let mut addition_infos = HashMap::new();
         for kv in &response.addition_info {
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index a2561f3925..10273dde2e 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -100,15 +100,14 @@ impl RemoteLogDownloadFuture {
 
     /// Get the downloaded file path
     pub async fn get_file_path(&mut self) -> Result<PathBuf> {
-        let receiver = self
-            .receiver
-            .take()
-            .ok_or_else(|| Error::Io(io::Error::other("Download future already consumed")))?;
-
-        receiver.await.map_err(|e| {
-            Error::Io(io::Error::other(format!(
-                "Download future cancelled: {e:?}"
-            )))
+        let receiver = self.receiver.take().ok_or_else(|| Error::UnexpectedError {
+            message: "Downloaded file already consumed".to_string(),
+            source: None,
+        })?;
+
+        receiver.await.map_err(|e| Error::UnexpectedError {
+            message: format!("Download future cancelled: {e:?}"),
+            source: None,
         })?
     }
 }
@@ -234,13 +233,13 @@ impl RemoteLogDownloader {
             let read_future = op.read_with(relative_path).range(range.clone());
             let chunk = tokio::time::timeout(REMOTE_OP_TIMEOUT, read_future)
                 .await
-                .map_err(|_| {
-                    Error::Io(io::Error::new(
-                        io::ErrorKind::TimedOut,
-                        format!(
-                            "Timeout reading chunk from remote storage: {remote_path} at offset {offset}"
+                .map_err(|e| {
+                    Error::IoUnexpectedError {
+                        message: format!(
+                            "Timeout reading chunk from remote storage: {remote_path} at offset {offset}, exception: {e}."
                         ),
-                    ))
+                        source: io::ErrorKind::TimedOut.into(),
+                    }
                 })??;
             let bytes = chunk.to_bytes();
 
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index f66d7d7a14..1e70649e0b 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -74,18 +74,20 @@ impl<'a> TableScan<'a> {
     /// ```
     pub fn project(mut self, column_indices: &[usize]) -> Result<Self> {
         if column_indices.is_empty() {
-            return Err(Error::IllegalArgument(
-                "Column indices cannot be empty".to_string(),
-            ));
+            return Err(Error::IllegalArgument {
+                message: "Column indices cannot be empty".to_string(),
+            });
         }
         let field_count = self.table_info.row_type().fields().len();
         for &idx in column_indices {
             if idx >= field_count {
-                return Err(Error::IllegalArgument(format!(
-                    "Column index {} out of range (max: {})",
-                    idx,
-                    field_count - 1
-                )));
+                return Err(Error::IllegalArgument {
+                    message: format!(
+                        "Column index {} out of range (max: {})",
+                        idx,
+                        field_count - 1
+                    ),
+                });
             }
         }
         self.projected_fields = Some(column_indices.to_vec());
@@ -106,9 +108,9 @@ impl<'a> TableScan<'a> {
     /// ```
     pub fn project_by_name(mut self, column_names: &[&str]) -> Result<Self> {
         if column_names.is_empty() {
-            return Err(Error::IllegalArgument(
-                "Column names cannot be empty".to_string(),
-            ));
+            return Err(Error::IllegalArgument {
+                message: "Column names cannot be empty".to_string(),
+            });
         }
         let row_type = self.table_info.row_type();
         let mut indices = Vec::new();
@@ -118,7 +120,9 @@ impl<'a> TableScan<'a> {
                 .fields()
                 .iter()
                 .position(|f| f.name() == *name)
-                .ok_or_else(|| Error::IllegalArgument(format!("Column '{name}' not found")))?;
+                .ok_or_else(|| Error::IllegalArgument {
+                    message: format!("Column '{name}' not found"),
+                })?;
             indices.push(idx);
         }
 
@@ -277,7 +281,7 @@ impl LogFetcher {
                             // Download and process remote log segments
                             let mut pos_in_log_segment = remote_fetch_info.first_start_pos;
                             let mut current_fetch_offset = fetch_offset;
-                            // todo: make segment download parallelly
+                            // todo: make segment download in parallel
                             for (i, segment) in
                                 remote_fetch_info.remote_log_segments.iter().enumerate()
                             {
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index e632cde451..cd33586c89 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -74,11 +74,17 @@ impl ResultHandle {
         self.receiver
             .receive()
             .await
-            .map_err(|e| Error::WriteError(e.to_string()))
+            .map_err(|e| Error::UnexpectedError {
+                message: format!("Fail to wait write result {e:?}"),
+                source: None,
+            })
     }
 
     pub fn result(&self, batch_result: BatchWriteResult) -> Result<(), Error> {
         // do nothing, just return empty result
-        batch_result.map_err(|e| Error::WriteError(e.to_string()))
+        batch_result.map_err(|e| Error::UnexpectedError {
+            message: format!("Fail to get write result {e:?}"),
+            source: None,
+        })
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index 27460e3863..462a846d6c 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -17,7 +17,7 @@
 
 use crate::client::metadata::Metadata;
 use crate::client::{ReadyWriteBatch, RecordAccumulator};
-use crate::error::Error::WriteError;
+use crate::error::Error;
 use crate::error::Result;
 use crate::metadata::TableBucket;
 use crate::proto::ProduceLogResponse;
@@ -150,9 +150,12 @@ impl Sender {
 
         let cluster = self.metadata.get_cluster();
 
-        let destination_node = cluster
-            .get_tablet_server(destination)
-            .ok_or(WriteError(String::from("destination node not found")))?;
+        let destination_node =
+            cluster
+                .get_tablet_server(destination)
+                .ok_or(Error::LeaderNotAvailable {
+                    message: format!("destination node not found in metadata cache {destination}."),
+                })?;
         let connection = self.metadata.get_connection(destination_node).await?;
 
         for (table_id, write_batches) in write_batch_by_table {
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index 28f5371e8d..042859afb4 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -78,11 +78,12 @@ impl WriterClient {
 
     fn get_ack(config: &Config) -> Result<i16> {
         let acks = config.writer_acks.as_str();
-        if acks.eq("all") {
+        if acks.eq_ignore_ascii_case("all") {
             Ok(-1)
         } else {
-            acks.parse::<i16>()
-                .map_err(|e| Error::IllegalArgument(e.to_string()))
+            acks.parse::<i16>().map_err(|e| Error::IllegalArgument {
+                message: format!("invalid writer ack '{acks}': {e}"),
+            })
         }
     }
 
@@ -133,11 +134,17 @@ impl WriterClient {
         self.shutdown_tx
             .send(())
             .await
-            .map_err(|e| Error::WriteError(e.to_string()))?;
+            .map_err(|e| Error::UnexpectedError {
+                message: format!("Failed to close write client: {e:?}"),
+                source: None,
+            })?;
 
         self.sender_join_handle
             .await
-            .map_err(|e| Error::WriteError(e.to_string()))?;
+            .map_err(|e| Error::UnexpectedError {
+                message: format!("Failed to close write client: {e:?}"),
+                source: None,
+            })?;
         Ok(())
     }
 
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index 63438b1966..0f4b1b6d11 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -15,48 +15,137 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::rpc::RpcError;
+pub use crate::rpc::RpcError;
+pub use crate::rpc::{ApiError, FlussError};
+
 use arrow_schema::ArrowError;
+use snafu::Snafu;
 use std::{io, result};
-use thiserror::Error;
 
 pub type Result<T> = result::Result<T, Error>;
 
-#[derive(Debug, Error)]
+#[derive(Debug, Snafu)]
 pub enum Error {
-    #[error(transparent)]
-    Io(#[from] io::Error),
+    #[snafu(
+        whatever,
+        display("Fluss hitting unexpected error {}: {:?}", message, source)
+    )]
+    UnexpectedError {
+        message: String,
+        /// see https://github.com/shepmaster/snafu/issues/446
+        #[snafu(source(from(Box<dyn std::error::Error + Send + Sync + 'static>, Some)))]
+        source: Option<Box<dyn std::error::Error + Send + Sync + 'static>>,
+    },
+
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting unexpected io error {}: {:?}", message, source)
+    )]
+    IoUnexpectedError { message: String, source: io::Error },
+
+    #[snafu(
+        visibility(pub(crate)),
+        display(
+            "Fluss hitting remote storage unexpected error {}: {:?}",
+            message,
+            source
+        )
+    )]
+    RemoteStorageUnexpectedError {
+        message: String,
+        source: opendal::Error,
+    },
+
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting invalid table error {}.", message)
+    )]
+    InvalidTableError { message: String },
 
-    #[error("Invalid table")]
-    InvalidTableError(String),
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting json serde error {}.", message)
+    )]
+    JsonSerdeError { message: String },
 
-    #[error("Json serde error")]
-    JsonSerdeError(String),
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting unexpected rpc error {}: {:?}", message, source)
+    )]
+    RpcError { message: String, source: RpcError },
 
-    #[error("Rpc error")]
-    RpcError(#[from] RpcError),
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting row convert error {}.", message)
+    )]
+    RowConvertError { message: String },
 
-    #[error("Row convert error")]
-    RowConvertError(String),
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting Arrow error {}: {:?}.", message, source)
+    )]
+    ArrowError { message: String, source: ArrowError },
 
-    #[error("Arrow error: {0}")]
-    ArrowError(#[from] ArrowError),
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting illegal argument error {}.", message)
+    )]
+    IllegalArgument { message: String },
 
-    #[error("Write error: {0}")]
-    WriteError(String),
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting IO not supported error {}.", message)
+    )]
+    IoUnsupported { message: String },
 
-    #[error("Illegal argument error: {0}")]
-    IllegalArgument(String),
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting leader not available error {}.", message)
+    )]
+    LeaderNotAvailable { message: String },
 
-    #[error("IO not supported error: {0}")]
-    IoUnsupported(String),
+    #[snafu(visibility(pub(crate)), display("Fluss API Error: {}.", api_error))]
+    FlussAPIError { api_error: ApiError },
+}
 
-    #[error("IO operation failed on underlying storage: {0}")]
-    IoUnexpected(Box<opendal::Error>),
+impl From<ArrowError> for Error {
+    fn from(value: ArrowError) -> Self {
+        Error::ArrowError {
+            message: format!("{value}"),
+            source: value,
+        }
+    }
+}
+
+impl From<RpcError> for Error {
+    fn from(value: RpcError) -> Self {
+        Error::RpcError {
+            message: format!("{value}"),
+            source: value,
+        }
+    }
+}
+
+impl From<io::Error> for Error {
+    fn from(value: io::Error) -> Self {
+        Error::IoUnexpectedError {
+            message: format!("{value}"),
+            source: value,
+        }
+    }
 }
 
 impl From<opendal::Error> for Error {
-    fn from(err: opendal::Error) -> Self {
-        Error::IoUnexpected(Box::new(err))
+    fn from(value: opendal::Error) -> Self {
+        Error::RemoteStorageUnexpectedError {
+            message: format!("{value}"),
+            source: value,
+        }
+    }
+}
+
+impl From<ApiError> for Error {
+    fn from(value: ApiError) -> Self {
+        Error::FlussAPIError { api_error: value }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/io/file_io.rs b/fluss-rust/crates/fluss/src/io/file_io.rs
index ec3b87ec5b..e7b026df55 100644
--- a/fluss-rust/crates/fluss/src/io/file_io.rs
+++ b/fluss-rust/crates/fluss/src/io/file_io.rs
@@ -39,8 +39,9 @@ pub struct FileIO {
 impl FileIO {
     /// Try to infer file io scheme from path.
     pub fn from_url(path: &str) -> Result<FileIOBuilder> {
-        let url =
-            Url::parse(path).map_err(|_| Error::IllegalArgument(format!("Invalid URL: {path}")))?;
+        let url = Url::parse(path).map_err(|_| Error::IllegalArgument {
+            message: format!("Invalid URL: {path}"),
+        })?;
         Ok(FileIOBuilder::new(url.scheme()))
     }
 
diff --git a/fluss-rust/crates/fluss/src/io/storage.rs b/fluss-rust/crates/fluss/src/io/storage.rs
index 089670e24c..d90eaa5711 100644
--- a/fluss-rust/crates/fluss/src/io/storage.rs
+++ b/fluss-rust/crates/fluss/src/io/storage.rs
@@ -44,9 +44,9 @@ impl Storage {
             Scheme::Fs => Ok(Self::LocalFs),
             #[cfg(feature = "storage-s3")]
             Scheme::S3 => Ok(Self::S3 { props }),
-            _ => Err(error::Error::IoUnsupported(
-                "Unsupported storage feature".to_string(),
-            )),
+            _ => Err(error::Error::IoUnsupported {
+                message: format!("Unsupported storage feature {scheme_str}"),
+            }),
         }
     }
 
diff --git a/fluss-rust/crates/fluss/src/metadata/database.rs b/fluss-rust/crates/fluss/src/metadata/database.rs
index 8eaa4d3eb0..fad1498f58 100644
--- a/fluss-rust/crates/fluss/src/metadata/database.rs
+++ b/fluss-rust/crates/fluss/src/metadata/database.rs
@@ -148,8 +148,8 @@ impl JsonSerde for DatabaseDescriptor {
         if let Some(comment_node) = node.get(Self::COMMENT_NAME) {
             let comment = comment_node
                 .as_str()
-                .ok_or_else(|| {
-                    JsonSerdeError(format!("{} should be a string", Self::COMMENT_NAME))
+                .ok_or_else(|| JsonSerdeError {
+                    message: format!("{} should be a string", Self::COMMENT_NAME),
                 })?
                 .to_owned();
             builder = builder.comment(&comment);
@@ -157,8 +157,8 @@ impl JsonSerde for DatabaseDescriptor {
 
         // Deserialize custom properties directly
         let custom_properties = if let Some(props_node) = node.get(Self::CUSTOM_PROPERTIES_NAME) {
-            let obj = props_node.as_object().ok_or_else(|| {
-                JsonSerdeError("Custom properties should be an object".to_string())
+            let obj = props_node.as_object().ok_or_else(|| JsonSerdeError {
+                message: "Custom properties should be an object".to_string(),
             })?;
 
             let mut properties = HashMap::with_capacity(obj.len());
@@ -167,8 +167,8 @@ impl JsonSerde for DatabaseDescriptor {
                     key.clone(),
                     value
                         .as_str()
-                        .ok_or_else(|| {
-                            JsonSerdeError("Property value should be a string".to_string())
+                        .ok_or_else(|| JsonSerdeError {
+                            message: "Property value should be a string".to_string(),
                         })?
                         .to_owned(),
                 );
@@ -186,16 +186,18 @@ impl JsonSerde for DatabaseDescriptor {
 impl DatabaseDescriptor {
     /// Create DatabaseDescriptor from JSON bytes (equivalent to Java's fromJsonBytes)
     pub fn from_json_bytes(bytes: &[u8]) -> Result<Self> {
-        let json_value: Value = serde_json::from_slice(bytes)
-            .map_err(|e| JsonSerdeError(format!("Failed to parse JSON: {e}")))?;
+        let json_value: Value = serde_json::from_slice(bytes).map_err(|e| JsonSerdeError {
+            message: format!("Failed to parse JSON: {e}"),
+        })?;
         Self::deserialize_json(&json_value)
     }
 
     /// Convert DatabaseDescriptor to JSON bytes
     pub fn to_json_bytes(&self) -> Result<Vec<u8>> {
         let json_value = self.serialize_json()?;
-        serde_json::to_vec(&json_value)
-            .map_err(|e| JsonSerdeError(format!("Failed to serialize to JSON: {e}")))
+        serde_json::to_vec(&json_value).map_err(|e| JsonSerdeError {
+            message: format!("Failed to serialize to JSON: {e}"),
+        })
     }
 }
 
diff --git a/fluss-rust/crates/fluss/src/metadata/json_serde.rs b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
index 447b0f9ff3..7d94e194e2 100644
--- a/fluss-rust/crates/fluss/src/metadata/json_serde.rs
+++ b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
@@ -15,8 +15,8 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::error::Error::{InvalidTableError, JsonSerdeError};
-use crate::error::Result;
+use crate::error::Error::JsonSerdeError;
+use crate::error::{Error, Result};
 use crate::metadata::datatype::{DataField, DataType, DataTypes};
 use crate::metadata::table::{Column, Schema, TableDescriptor};
 use serde_json::{Value, json};
@@ -166,11 +166,11 @@ impl JsonSerde for DataType {
         let type_root = node
             .get(Self::FIELD_NAME_TYPE_NAME)
             .and_then(|v| v.as_str())
-            .ok_or_else(|| {
-                JsonSerdeError(format!(
+            .ok_or_else(|| Error::JsonSerdeError {
+                message: format!(
                     "Couldn't find field {} while deserializing datatype.",
                     Self::FIELD_NAME_TYPE_NAME
-                ))
+                ),
             })?;
 
         let mut data_type = match type_root {
@@ -185,11 +185,8 @@ impl JsonSerde for DataType {
                 let length = node
                     .get(Self::FIELD_NAME_LENGTH)
                     .and_then(|v| v.as_u64())
-                    .ok_or_else(|| {
-                        JsonSerdeError(format!(
-                            "Missing required field: {}",
-                            Self::FIELD_NAME_LENGTH
-                        ))
+                    .ok_or_else(|| Error::JsonSerdeError {
+                        message: format!("Missing required field: {}", Self::FIELD_NAME_LENGTH),
                     })? as u32;
                 DataTypes::char(length)
             }
@@ -198,11 +195,8 @@ impl JsonSerde for DataType {
                 let precision = node
                     .get(Self::FIELD_NAME_PRECISION)
                     .and_then(|v| v.as_u64())
-                    .ok_or_else(|| {
-                        JsonSerdeError(format!(
-                            "Missing required field: {}",
-                            Self::FIELD_NAME_PRECISION
-                        ))
+                    .ok_or_else(|| Error::JsonSerdeError {
+                        message: format!("Missing required field: {}", Self::FIELD_NAME_PRECISION),
                     })? as u32;
                 let scale = node
                     .get(Self::FIELD_NAME_SCALE)
@@ -243,43 +237,46 @@ impl JsonSerde for DataType {
             "ARRAY" => {
                 let element_type_node =
                     node.get(Self::FIELD_NAME_ELEMENT_TYPE).ok_or_else(|| {
-                        JsonSerdeError(format!(
-                            "Missing required field: {}",
-                            Self::FIELD_NAME_ELEMENT_TYPE
-                        ))
+                        Error::JsonSerdeError {
+                            message: format!(
+                                "Missing required field: {}",
+                                Self::FIELD_NAME_ELEMENT_TYPE
+                            ),
+                        }
                     })?;
                 let element_type = DataType::deserialize_json(element_type_node)?;
                 DataTypes::array(element_type)
             }
             "MAP" => {
-                let key_type_node = node.get(Self::FIELD_NAME_KEY_TYPE).ok_or_else(|| {
-                    JsonSerdeError(format!(
-                        "Missing required field: {}",
-                        Self::FIELD_NAME_KEY_TYPE
-                    ))
-                })?;
+                let key_type_node =
+                    node.get(Self::FIELD_NAME_KEY_TYPE)
+                        .ok_or_else(|| Error::JsonSerdeError {
+                            message: format!(
+                                "Missing required field: {}",
+                                Self::FIELD_NAME_KEY_TYPE
+                            ),
+                        })?;
                 let key_type = DataType::deserialize_json(key_type_node)?;
-                let value_type_node = node.get(Self::FIELD_NAME_VALUE_TYPE).ok_or_else(|| {
-                    JsonSerdeError(format!(
-                        "Missing required field: {}",
-                        Self::FIELD_NAME_VALUE_TYPE
-                    ))
-                })?;
+                let value_type_node =
+                    node.get(Self::FIELD_NAME_VALUE_TYPE)
+                        .ok_or_else(|| Error::JsonSerdeError {
+                            message: format!(
+                                "Missing required field: {}",
+                                Self::FIELD_NAME_VALUE_TYPE
+                            ),
+                        })?;
                 let value_type = DataType::deserialize_json(value_type_node)?;
                 DataTypes::map(key_type, value_type)
             }
             "ROW" => {
                 let fields_node = node
                     .get(Self::FIELD_NAME_FIELDS)
-                    .ok_or_else(|| {
-                        JsonSerdeError(format!(
-                            "Missing required field: {}",
-                            Self::FIELD_NAME_FIELDS
-                        ))
+                    .ok_or_else(|| Error::JsonSerdeError {
+                        message: format!("Missing required field: {}", Self::FIELD_NAME_FIELDS),
                     })?
                     .as_array()
-                    .ok_or_else(|| {
-                        JsonSerdeError(format!("{} must be an array", Self::FIELD_NAME_FIELDS))
+                    .ok_or_else(|| Error::JsonSerdeError {
+                        message: format!("{} must be an array", Self::FIELD_NAME_FIELDS),
                     })?;
                 let mut fields = Vec::with_capacity(fields_node.len());
                 for field_node in fields_node {
@@ -287,7 +284,11 @@ impl JsonSerde for DataType {
                 }
                 DataTypes::row(fields)
             }
-            _ => return Err(JsonSerdeError(format!("Unknown type root: {type_root}"))),
+            _ => {
+                return Err(Error::JsonSerdeError {
+                    message: format!("Unknown type root: {type_root}"),
+                });
+            }
         };
 
         if let Some(nullable) = node.get(Self::FIELD_NAME_NULLABLE) {
@@ -327,12 +328,16 @@ impl JsonSerde for DataField {
         let name = node
             .get(Self::NAME)
             .and_then(|v| v.as_str())
-            .ok_or_else(|| JsonSerdeError(format!("Missing required field: {}", Self::NAME)))?
+            .ok_or_else(|| Error::JsonSerdeError {
+                message: format!("Missing required field: {}", Self::NAME),
+            })?
             .to_string();
 
-        let field_type_node = node.get(Self::FIELD_TYPE).ok_or_else(|| {
-            JsonSerdeError(format!("Missing required field: {}", Self::FIELD_TYPE))
-        })?;
+        let field_type_node = node
+            .get(Self::FIELD_TYPE)
+            .ok_or_else(|| Error::JsonSerdeError {
+                message: format!("Missing required field: {}", Self::FIELD_TYPE),
+            })?;
 
         let data_type = DataType::deserialize_json(field_type_node)?;
 
@@ -373,12 +378,16 @@ impl JsonSerde for Column {
         let name = node
             .get(Self::NAME)
             .and_then(|v| v.as_str())
-            .ok_or_else(|| JsonSerdeError(format!("Missing required field: {}", Self::NAME)))?
+            .ok_or_else(|| Error::JsonSerdeError {
+                message: format!("Missing required field: {}", Self::NAME),
+            })?
             .to_string();
 
-        let data_type_node = node.get(Self::DATA_TYPE).ok_or_else(|| {
-            JsonSerdeError(format!("Missing required field: {}", Self::DATA_TYPE))
-        })?;
+        let data_type_node = node
+            .get(Self::DATA_TYPE)
+            .ok_or_else(|| Error::JsonSerdeError {
+                message: format!("Missing required field: {}", Self::DATA_TYPE),
+            })?;
 
         let data_type = DataType::deserialize_json(data_type_node)?;
 
@@ -429,11 +438,13 @@ impl JsonSerde for Schema {
     fn deserialize_json(node: &Value) -> Result<Schema> {
         let columns_node = node
             .get(Self::COLUMNS_NAME)
-            .ok_or_else(|| {
-                JsonSerdeError(format!("Missing required field: {}", Self::COLUMNS_NAME))
+            .ok_or_else(|| Error::JsonSerdeError {
+                message: format!("Missing required field: {}", Self::COLUMNS_NAME),
             })?
             .as_array()
-            .ok_or_else(|| JsonSerdeError(format!("{} must be an array", Self::COLUMNS_NAME)))?;
+            .ok_or_else(|| Error::JsonSerdeError {
+                message: format!("{} must be an array", Self::COLUMNS_NAME),
+            })?;
 
         let mut columns = Vec::with_capacity(columns_node.len());
         for col_node in columns_node {
@@ -443,17 +454,17 @@ impl JsonSerde for Schema {
         let mut schema_builder = Schema::builder().with_columns(columns);
 
         if let Some(pk_node) = node.get(Self::PRIMARY_KEY_NAME) {
-            let pk_array = pk_node
-                .as_array()
-                .ok_or_else(|| InvalidTableError("Primary key must be an array".to_string()))?;
+            let pk_array = pk_node.as_array().ok_or_else(|| Error::InvalidTableError {
+                message: "Primary key must be an array".to_string(),
+            })?;
 
             let mut primary_keys = Vec::with_capacity(pk_array.len());
             for name_node in pk_array {
                 primary_keys.push(
                     name_node
                         .as_str()
-                        .ok_or_else(|| {
-                            InvalidTableError("Primary key element must be a string".to_string())
+                        .ok_or_else(|| Error::InvalidTableError {
+                            message: "Primary key element must be a string".to_string(),
                         })?
                         .to_string(),
                 );
@@ -478,9 +489,9 @@ impl TableDescriptor {
     const VERSION: u32 = 1;
 
     fn deserialize_properties(node: &Value) -> Result<HashMap<String, String>> {
-        let obj = node
-            .as_object()
-            .ok_or_else(|| JsonSerdeError("Properties must be an object".to_string()))?;
+        let obj = node.as_object().ok_or_else(|| Error::JsonSerdeError {
+            message: "Properties must be an object".to_string(),
+        })?;
 
         let mut properties = HashMap::with_capacity(obj.len());
         for (key, value) in obj {
@@ -488,7 +499,9 @@ impl TableDescriptor {
                 key.clone(),
                 value
                     .as_str()
-                    .ok_or_else(|| JsonSerdeError("Property value must be a string".to_string()))?
+                    .ok_or_else(|| Error::JsonSerdeError {
+                        message: "Property value must be a string".to_string(),
+                    })?
                     .to_owned(),
             );
         }
@@ -545,8 +558,8 @@ impl JsonSerde for TableDescriptor {
         let mut builder = TableDescriptor::builder();
 
         // Deserialize schema
-        let schema_node = node.get(Self::SCHEMA_NAME).ok_or_else(|| {
-            JsonSerdeError(format!("Missing required field: {}", Self::SCHEMA_NAME))
+        let schema_node = node.get(Self::SCHEMA_NAME).ok_or_else(|| JsonSerdeError {
+            message: format!("Missing required field: {}", Self::SCHEMA_NAME),
         })?;
         let schema = Schema::deserialize_json(schema_node)?;
         builder = builder.schema(schema);
@@ -555,22 +568,21 @@ impl JsonSerde for TableDescriptor {
         if let Some(comment_node) = node.get(Self::COMMENT_NAME) {
             let comment = comment_node
                 .as_str()
-                .ok_or_else(|| JsonSerdeError(format!("{} must be a string", Self::COMMENT_NAME)))?
+                .ok_or_else(|| JsonSerdeError {
+                    message: format!("{} must be a string", Self::COMMENT_NAME),
+                })?
                 .to_owned();
             builder = builder.comment(comment.as_str());
         }
 
         let partition_node = node
             .get(Self::PARTITION_KEY_NAME)
-            .ok_or_else(|| {
-                JsonSerdeError(format!(
-                    "Missing required field: {}",
-                    Self::PARTITION_KEY_NAME
-                ))
+            .ok_or_else(|| JsonSerdeError {
+                message: format!("Missing required field: {}", Self::PARTITION_KEY_NAME),
             })?
             .as_array()
-            .ok_or_else(|| {
-                JsonSerdeError(format!("{} must be an array", Self::PARTITION_KEY_NAME))
+            .ok_or_else(|| JsonSerdeError {
+                message: format!("{} must be an array", Self::PARTITION_KEY_NAME),
             })?;
 
         let mut partition_keys = Vec::with_capacity(partition_node.len());
@@ -578,11 +590,8 @@ impl JsonSerde for TableDescriptor {
             partition_keys.push(
                 key_node
                     .as_str()
-                    .ok_or_else(|| {
-                        JsonSerdeError(format!(
-                            "{} element must be a string",
-                            Self::PARTITION_KEY_NAME
-                        ))
+                    .ok_or_else(|| JsonSerdeError {
+                        message: format!("{} element must be a string", Self::PARTITION_KEY_NAME),
                     })?
                     .to_owned(),
             );
@@ -592,15 +601,17 @@ impl JsonSerde for TableDescriptor {
         let mut bucket_count = None;
         let mut bucket_keys = vec![];
         if let Some(bucket_key_node) = node.get(Self::BUCKET_KEY_NAME) {
-            let bucket_key_node = bucket_key_node.as_array().ok_or_else(|| {
-                JsonSerdeError(format!("{} must be an array", Self::BUCKET_KEY_NAME))
+            let bucket_key_node = bucket_key_node.as_array().ok_or_else(|| JsonSerdeError {
+                message: format!("{} must be an array", Self::BUCKET_KEY_NAME),
             })?;
 
             for key_node in bucket_key_node {
                 bucket_keys.push(
                     key_node
                         .as_str()
-                        .ok_or_else(|| JsonSerdeError("Bucket key must be a string".to_string()))?
+                        .ok_or_else(|| JsonSerdeError {
+                            message: "Bucket key must be a string".to_string(),
+                        })?
                         .to_owned(),
                 );
             }
@@ -617,18 +628,18 @@ impl JsonSerde for TableDescriptor {
         // Deserialize properties
         let properties =
             Self::deserialize_properties(node.get(Self::PROPERTIES_NAME).ok_or_else(|| {
-                JsonSerdeError(format!("Missing required field: {}", Self::PROPERTIES_NAME))
+                JsonSerdeError {
+                    message: format!("Missing required field: {}", Self::PROPERTIES_NAME),
+                }
             })?)?;
         builder = builder.properties(properties);
 
         // Deserialize custom properties
         let custom_properties = Self::deserialize_properties(
-            node.get(Self::CUSTOM_PROPERTIES_NAME).ok_or_else(|| {
-                JsonSerdeError(format!(
-                    "Missing required field: {}",
-                    Self::CUSTOM_PROPERTIES_NAME
-                ))
-            })?,
+            node.get(Self::CUSTOM_PROPERTIES_NAME)
+                .ok_or_else(|| JsonSerdeError {
+                    message: format!("Missing required field: {}", Self::CUSTOM_PROPERTIES_NAME),
+                })?,
         )?;
         builder = builder.custom_properties(custom_properties);
 
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 751dd6da02..770c4f2cfe 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -16,7 +16,7 @@
 // under the License.
 
 use crate::error::Error::InvalidTableError;
-use crate::error::Result;
+use crate::error::{Error, Result};
 use crate::metadata::datatype::{DataField, DataType, RowType};
 use core::fmt;
 use serde::{Deserialize, Serialize};
@@ -220,9 +220,9 @@ impl SchemaBuilder {
     ) -> Result<Vec<Column>> {
         let names: Vec<_> = columns.iter().map(|c| &c.name).collect();
         if let Some(duplicates) = Self::find_duplicates(&names) {
-            return Err(InvalidTableError(format!(
-                "Duplicate column names found: {duplicates:?}"
-            )));
+            return Err(InvalidTableError {
+                message: format!("Duplicate column names found: {duplicates:?}"),
+            });
         }
 
         let Some(pk) = primary_key else {
@@ -232,9 +232,9 @@ impl SchemaBuilder {
         let pk_set: HashSet<_> = pk.column_names.iter().collect();
         let all_columns: HashSet<_> = columns.iter().map(|c| &c.name).collect();
         if !pk_set.is_subset(&all_columns) {
-            return Err(InvalidTableError(format!(
-                "Primary key columns {pk_set:?} not found in schema"
-            )));
+            return Err(InvalidTableError {
+                message: format!("Primary key columns {pk_set:?} not found in schema"),
+            });
         }
 
         Ok(columns
@@ -441,12 +441,12 @@ impl TableDescriptor {
     pub fn replication_factor(&self) -> Result<i32> {
         self.properties
             .get("table.replication.factor")
-            .ok_or(InvalidTableError(
-                "Replication factor is not set".to_string(),
-            ))?
+            .ok_or_else(|| InvalidTableError {
+                message: "Replication factor is not set".to_string(),
+            })?
             .parse()
-            .map_err(|_e| {
-                InvalidTableError("Replication factor can't be convert into int".to_string())
+            .map_err(|_e| InvalidTableError {
+                message: "Replication factor can't be convert into int".to_string(),
             })
     }
 
@@ -497,11 +497,13 @@ impl TableDescriptor {
         bucket_keys.retain(|k| !partition_keys.contains(k));
 
         if bucket_keys.is_empty() {
-            return Err(InvalidTableError(format!(
-                "Primary Key constraint {:?} should not be same with partition fields {:?}.",
-                schema.primary_key().unwrap().column_names(),
-                partition_keys
-            )));
+            return Err(Error::InvalidTableError {
+                message: format!(
+                    "Primary Key constraint {:?} should not be same with partition fields {:?}.",
+                    schema.primary_key().unwrap().column_names(),
+                    partition_keys
+                ),
+            });
         }
 
         Ok(bucket_keys)
@@ -518,10 +520,12 @@ impl TableDescriptor {
                 .iter()
                 .any(|k| partition_keys.contains(k))
             {
-                return Err(InvalidTableError(format!(
-                    "Bucket key {:?} shouldn't include any column in partition keys {:?}.",
-                    distribution.bucket_keys, partition_keys
-                )));
+                return Err(InvalidTableError {
+                    message: format!(
+                        "Bucket key {:?} shouldn't include any column in partition keys {:?}.",
+                        distribution.bucket_keys, partition_keys
+                    ),
+                });
             }
 
             return if let Some(pk) = schema.primary_key() {
@@ -540,13 +544,15 @@ impl TableDescriptor {
                         .iter()
                         .all(|k| pk_columns.contains(k))
                     {
-                        return Err(InvalidTableError(format!(
-                            "Bucket keys must be a subset of primary keys excluding partition keys for primary-key tables. \
-                            The primary keys are {:?}, the partition keys are {:?}, but the user-defined bucket keys are {:?}.",
-                            pk.column_names(),
-                            partition_keys,
-                            distribution.bucket_keys
-                        )));
+                        return Err(InvalidTableError {
+                            message: format!(
+                                "Bucket keys must be a subset of primary keys excluding partition keys for primary-key tables. \
+                                The primary keys are {:?}, the partition keys are {:?}, but the user-defined bucket keys are {:?}.",
+                                pk.column_names(),
+                                partition_keys,
+                                distribution.bucket_keys
+                            ),
+                        });
                     }
                     Ok(Some(distribution))
                 }
@@ -589,7 +595,9 @@ impl LogFormat {
         match s.to_uppercase().as_str() {
             "ARROW" => Ok(LogFormat::ARROW),
             "INDEXED" => Ok(LogFormat::INDEXED),
-            _ => Err(InvalidTableError(format!("Unknown log format: {s}"))),
+            _ => Err(InvalidTableError {
+                message: format!("Unknown log format: {s}"),
+            }),
         }
     }
 }
@@ -615,7 +623,9 @@ impl KvFormat {
         match s.to_uppercase().as_str() {
             "INDEXED" => Ok(KvFormat::INDEXED),
             "COMPACTED" => Ok(KvFormat::COMPACTED),
-            _ => Err(InvalidTableError(format!("Unknown kv format: {s}"))),
+            _ => Err(Error::InvalidTableError {
+                message: format!("Unknown kv format: {s}"),
+            }),
         }
     }
 }
@@ -961,6 +971,24 @@ impl TableBucket {
     }
 }
 
+impl Display for TableBucket {
+    /// Renders the bucket identity, including `partition_id` only when one is set.
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        match self.partition_id {
+            Some(partition_id) => write!(
+                f,
+                "TableBucket(table_id={}, partition_id={}, bucket={})",
+                self.table_id, partition_id, self.bucket
+            ),
+            None => write!(
+                f,
+                "TableBucket(table_id={}, bucket={})",
+                self.table_id, self.bucket
+            ),
+        }
+    }
+}
+
 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct LakeSnapshot {
     pub snapshot_id: i64,
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index e59c2d9dd6..dbbb45daea 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -19,6 +19,11 @@ syntax = "proto2";
 
 package proto;
 
+message ErrorResponse {
+  required int32 error_code = 1;
+  optional string error_message = 2;
+}
+
 // metadata request and response, request send from client to each server.
 message MetadataRequest {
   repeated PbTablePath table_path = 1;
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 6e8cb55962..9295713cc2 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -844,10 +844,7 @@ impl ReadContext {
     }
 
     pub fn record_batch_for_remote_log(&self, data: &[u8]) -> Result<Option<RecordBatch>> {
-        let (batch_metadata, body_buffer, version) = match parse_ipc_message(data) {
-            Some(result) => result,
-            None => return Ok(None),
-        };
+        let (batch_metadata, body_buffer, version) = parse_ipc_message(data)?;
 
         let record_batch = read_record_batch(
             &body_buffer,
@@ -1086,13 +1083,17 @@ mod tests {
         let result = parse_ipc_message(empty_body);
         assert_eq!(
             result.unwrap_err().to_string(),
-            String::from("Arrow error: Parser error: Range [0, 4) is out of bounds.\n\n")
+            String::from(
+                "Fluss hitting Arrow error Parser error: Range [0, 4) is out of bounds.\n\n: ParseError(\"Range [0, 4) is out of bounds.\\n\\n\")."
+            )
         );
 
         let invalid_data = &[];
         assert_eq!(
             parse_ipc_message(invalid_data).unwrap_err().to_string(),
-            String::from("Arrow error: Parser error: Invalid data length: 0")
+            String::from(
+                "Fluss hitting Arrow error Parser error: Invalid data length: 0: ParseError(\"Invalid data length: 0\")."
+            )
         );
 
         let data_with_invalid_continuation: &[u8] = &le_bytes(&[0x00000001, 0x00000000]);
@@ -1100,7 +1101,9 @@ mod tests {
             parse_ipc_message(data_with_invalid_continuation)
                 .unwrap_err()
                 .to_string(),
-            String::from("Arrow error: Parser error: Invalid continuation marker: 1")
+            String::from(
+                "Fluss hitting Arrow error Parser error: Invalid continuation marker: 1: ParseError(\"Invalid continuation marker: 1\")."
+            )
         );
 
         let data_with_invalid_length: &[u8] = &le_bytes(&[0xFFFFFFFF, 0x00000001]);
@@ -1109,8 +1112,7 @@ mod tests {
                 .unwrap_err()
                 .to_string(),
             String::from(
-                "Arrow error: Parser error: Invalid data length. \
-                   Remaining data length 0 is shorter than specified size 1"
+                "Fluss hitting Arrow error Parser error: Invalid data length. Remaining data length 0 is shorter than specified size 1: ParseError(\"Invalid data length. Remaining data length 0 is shorter than specified size 1\")."
             )
         );
 
@@ -1119,7 +1121,9 @@ mod tests {
             parse_ipc_message(data_with_invalid_length)
                 .unwrap_err()
                 .to_string(),
-            String::from("Arrow error: Parser error: Not a record batch")
+            String::from(
+                "Fluss hitting Arrow error Parser error: Not a record batch: ParseError(\"Not a record batch\")."
+            )
         );
     }
 
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 6929b57c5c..1ea393349e 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -290,18 +290,22 @@ impl Datum<'_> {
             Datum::String(v) => append_value_to_arrow!(StringBuilder, *v),
             Datum::Blob(v) => append_value_to_arrow!(BinaryBuilder, v.as_ref()),
             Datum::Decimal(_) | Datum::Date(_) | Datum::Timestamp(_) | Datum::TimestampTz(_) => {
-                return Err(RowConvertError(format!(
-                    "Type {:?} is not yet supported for Arrow conversion",
-                    std::mem::discriminant(self)
-                )));
+                return Err(RowConvertError {
+                    message: format!(
+                        "Type {:?} is not yet supported for Arrow conversion",
+                        std::mem::discriminant(self)
+                    ),
+                });
             }
         }
 
-        Err(RowConvertError(format!(
-            "Cannot append {:?} to builder of type {}",
-            self,
-            std::any::type_name_of_val(builder)
-        )))
+        Err(RowConvertError {
+            message: format!(
+                "Cannot append {:?} to builder of type {}",
+                self,
+                std::any::type_name_of_val(builder)
+            ),
+        })
     }
 }
 
@@ -313,11 +317,13 @@ macro_rules! impl_to_arrow {
                     b.append_value(*self);
                     Ok(())
                 } else {
-                    Err(RowConvertError(format!(
-                        "Cannot cast {} to {} builder",
-                        stringify!($ty),
-                        stringify!($variant)
-                    )))
+                    Err(RowConvertError {
+                        message: format!(
+                            "Cannot cast {} to {} builder",
+                            stringify!($ty),
+                            stringify!($variant)
+                        ),
+                    })
                 }
             }
         }
diff --git a/fluss-rust/crates/fluss/src/rpc/error.rs b/fluss-rust/crates/fluss/src/rpc/error.rs
index 84b20b102e..da3a11e295 100644
--- a/fluss-rust/crates/fluss/src/rpc/error.rs
+++ b/fluss-rust/crates/fluss/src/rpc/error.rs
@@ -17,6 +17,7 @@
 
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
+use prost::DecodeError;
 use std::sync::Arc;
 use thiserror::Error;
 
@@ -29,6 +30,9 @@ pub enum RpcError {
     #[error("Cannot read framed message: {0}")]
     ReadMessageError(#[from] crate::rpc::frame::ReadError),
 
+    #[error("Rpc Decode Error: {0}")]
+    RpcDecodeError(#[from] DecodeError),
+
     #[error("connection error")]
     ConnectionError(String),
 
diff --git a/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs b/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
new file mode 100644
index 0000000000..b26eb72f61
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
@@ -0,0 +1,371 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::ErrorResponse;
+use std::fmt::{Debug, Display, Formatter};
+
+/// API error response from Fluss server
+pub struct ApiError {
+    pub code: i32,
+    pub message: String,
+}
+
+impl Debug for ApiError {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        f.debug_struct("ApiError")
+            .field("code", &self.code)
+            .field("message", &self.message)
+            .finish()
+    }
+}
+
+impl Display for ApiError {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        Debug::fmt(self, f)
+    }
+}
+
+/// Fluss protocol errors. These errors are part of the client-server protocol.
+/// The error codes cannot be changed, but the names can be.
+///
+/// Do not add exceptions that occur only on the client or only on the server here.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+#[repr(i32)]
+pub enum FlussError {
+    /// The server experienced an unexpected error when processing the request.
+    UnknownServerError = -1,
+    /// No error occurred.
+    None = 0,
+    /// The server disconnected before a response was received.
+    NetworkException = 1,
+    /// The version of API is not supported.
+    UnsupportedVersion = 2,
+    /// This message has failed its CRC checksum, exceeds the valid size, has a null key for a primary key table, or is otherwise corrupt.
+    CorruptMessage = 3,
+    /// The database does not exist.
+    DatabaseNotExist = 4,
+    /// The database is not empty.
+    DatabaseNotEmpty = 5,
+    /// The database already exists.
+    DatabaseAlreadyExist = 6,
+    /// The table does not exist.
+    TableNotExist = 7,
+    /// The table already exists.
+    TableAlreadyExist = 8,
+    /// The schema does not exist.
+    SchemaNotExist = 9,
+    /// Exception occur while storage data for log in server.
+    LogStorageException = 10,
+    /// Exception occur while storage data for kv in server.
+    KvStorageException = 11,
+    /// Not leader or follower.
+    NotLeaderOrFollower = 12,
+    /// The record is too large.
+    RecordTooLargeException = 13,
+    /// The record is corrupt.
+    CorruptRecordException = 14,
+    /// The client has attempted to perform an operation on an invalid table.
+    InvalidTableException = 15,
+    /// The client has attempted to perform an operation on an invalid database.
+    InvalidDatabaseException = 16,
+    /// The replication factor is larger than the number of available tablet servers.
+    InvalidReplicationFactor = 17,
+    /// Produce request specified an invalid value for required acks.
+    InvalidRequiredAcks = 18,
+    /// The log offset is out of range.
+    LogOffsetOutOfRangeException = 19,
+    /// The table is not primary key table.
+    NonPrimaryKeyTableException = 20,
+    /// The table or bucket does not exist.
+    UnknownTableOrBucketException = 21,
+    /// The update version is invalid.
+    InvalidUpdateVersionException = 22,
+    /// The coordinator is invalid.
+    InvalidCoordinatorException = 23,
+    /// The leader epoch is invalid.
+    FencedLeaderEpochException = 24,
+    /// The request time out.
+    RequestTimeOut = 25,
+    /// The general storage exception.
+    StorageException = 26,
+    /// The server did not attempt to execute this operation.
+    OperationNotAttemptedException = 27,
+    /// Records are written to the server already, but to fewer in-sync replicas than required.
+    NotEnoughReplicasAfterAppendException = 28,
+    /// Messages are rejected since there are fewer in-sync replicas than required.
+    NotEnoughReplicasException = 29,
+    /// Get file access security token exception.
+    SecurityTokenException = 30,
+    /// The tablet server received an out of order sequence batch.
+    OutOfOrderSequenceException = 31,
+    /// The tablet server received a duplicate sequence batch.
+    DuplicateSequenceException = 32,
+    /// This exception is raised by the tablet server if it could not locate the writer metadata.
+    UnknownWriterIdException = 33,
+    /// The requested column projection is invalid.
+    InvalidColumnProjection = 34,
+    /// The requested target column to write is invalid.
+    InvalidTargetColumn = 35,
+    /// The partition does not exist.
+    PartitionNotExists = 36,
+    /// The table is not partitioned.
+    TableNotPartitionedException = 37,
+    /// The timestamp is invalid.
+    InvalidTimestampException = 38,
+    /// The config is invalid.
+    InvalidConfigException = 39,
+    /// The lake storage is not configured.
+    LakeStorageNotConfiguredException = 40,
+    /// The kv snapshot does not exist.
+    KvSnapshotNotExist = 41,
+    /// The partition already exists.
+    PartitionAlreadyExists = 42,
+    /// The partition spec is invalid.
+    PartitionSpecInvalidException = 43,
+    /// There is no currently available leader for the given partition.
+    LeaderNotAvailableException = 44,
+    /// Exceed the maximum number of partitions.
+    PartitionMaxNumException = 45,
+    /// Authentication failed.
+    AuthenticateException = 46,
+    /// Security is disabled.
+    SecurityDisabledException = 47,
+    /// Authorization failed.
+    AuthorizationException = 48,
+    /// Exceed the maximum number of buckets.
+    BucketMaxNumException = 49,
+    /// The tiering epoch is invalid.
+    FencedTieringEpochException = 50,
+    /// Authentication failed with retriable exception.
+    RetriableAuthenticateException = 51,
+    /// The server rack info is invalid.
+    InvalidServerRackInfoException = 52,
+    /// The lake snapshot does not exist.
+    LakeSnapshotNotExist = 53,
+    /// The lake table already exists.
+    LakeTableAlreadyExist = 54,
+    /// The new ISR contains at least one ineligible replica.
+    IneligibleReplicaException = 55,
+    /// The alter table is invalid.
+    InvalidAlterTableException = 56,
+    /// Deletion operations are disabled on this table.
+    DeletionDisabledException = 57,
+}
+
+impl FlussError {
+    /// Returns the error code for this error.
+    pub fn code(&self) -> i32 {
+        *self as i32
+    }
+
+    /// Returns a friendly description of the error.
+    pub fn message(&self) -> &'static str {
+        match self {
+            FlussError::UnknownServerError => {
+                "The server experienced an unexpected error when processing the request."
+            }
+            FlussError::None => "No error",
+            FlussError::NetworkException => {
+                "The server disconnected before a response was received."
+            }
+            FlussError::UnsupportedVersion => "The version of API is not supported.",
+            FlussError::CorruptMessage => {
+                "This message has failed its CRC checksum, exceeds the valid size, has a null key for a primary key table, or is otherwise corrupt."
+            }
+            FlussError::DatabaseNotExist => "The database does not exist.",
+            FlussError::DatabaseNotEmpty => "The database is not empty.",
+            FlussError::DatabaseAlreadyExist => "The database already exists.",
+            FlussError::TableNotExist => "The table does not exist.",
+            FlussError::TableAlreadyExist => "The table already exists.",
+            FlussError::SchemaNotExist => "The schema does not exist.",
+            FlussError::LogStorageException => {
+                "Exception occur while storage data for log in server."
+            }
+            FlussError::KvStorageException => {
+                "Exception occur while storage data for kv in server."
+            }
+            FlussError::NotLeaderOrFollower => "Not leader or follower.",
+            FlussError::RecordTooLargeException => "The record is too large.",
+            FlussError::CorruptRecordException => "The record is corrupt.",
+            FlussError::InvalidTableException => {
+                "The client has attempted to perform an operation on an invalid table."
+            }
+            FlussError::InvalidDatabaseException => {
+                "The client has attempted to perform an operation on an invalid database."
+            }
+            FlussError::InvalidReplicationFactor => {
+                "The replication factor is larger then the number of available tablet servers."
+            }
+            FlussError::InvalidRequiredAcks => {
+                "Produce request specified an invalid value for required acks."
+            }
+            FlussError::LogOffsetOutOfRangeException => "The log offset is out of range.",
+            FlussError::NonPrimaryKeyTableException => "The table is not primary key table.",
+            FlussError::UnknownTableOrBucketException => "The table or bucket does not exist.",
+            FlussError::InvalidUpdateVersionException => "The update version is invalid.",
+            FlussError::InvalidCoordinatorException => "The coordinator is invalid.",
+            FlussError::FencedLeaderEpochException => "The leader epoch is invalid.",
+            FlussError::RequestTimeOut => "The request time out.",
+            FlussError::StorageException => "The general storage exception.",
+            FlussError::OperationNotAttemptedException => {
+                "The server did not attempt to execute this operation."
+            }
+            FlussError::NotEnoughReplicasAfterAppendException => {
+                "Records are written to the server already, but to fewer in-sync replicas than required."
+            }
+            FlussError::NotEnoughReplicasException => {
+                "Messages are rejected since there are fewer in-sync replicas than required."
+            }
+            FlussError::SecurityTokenException => "Get file access security token exception.",
+            FlussError::OutOfOrderSequenceException => {
+                "The tablet server received an out of order sequence batch."
+            }
+            FlussError::DuplicateSequenceException => {
+                "The tablet server received a duplicate sequence batch."
+            }
+            FlussError::UnknownWriterIdException => {
+                "This exception is raised by the tablet server if it could not locate the writer metadata."
+            }
+            FlussError::InvalidColumnProjection => "The requested column projection is invalid.",
+            FlussError::InvalidTargetColumn => "The requested target column to write is invalid.",
+            FlussError::PartitionNotExists => "The partition does not exist.",
+            FlussError::TableNotPartitionedException => "The table is not partitioned.",
+            FlussError::InvalidTimestampException => "The timestamp is invalid.",
+            FlussError::InvalidConfigException => "The config is invalid.",
+            FlussError::LakeStorageNotConfiguredException => "The lake storage is not configured.",
+            FlussError::KvSnapshotNotExist => "The kv snapshot does not exist.",
+            FlussError::PartitionAlreadyExists => "The partition already exists.",
+            FlussError::PartitionSpecInvalidException => "The partition spec is invalid.",
+            FlussError::LeaderNotAvailableException => {
+                "There is no currently available leader for the given partition."
+            }
+            FlussError::PartitionMaxNumException => "Exceed the maximum number of partitions.",
+            FlussError::AuthenticateException => "Authentication failed.",
+            FlussError::SecurityDisabledException => "Security is disabled.",
+            FlussError::AuthorizationException => "Authorization failed.",
+            FlussError::BucketMaxNumException => "Exceed the maximum number of buckets.",
+            FlussError::FencedTieringEpochException => "The tiering epoch is invalid.",
+            FlussError::RetriableAuthenticateException => {
+                "Authentication failed with retriable exception."
+            }
+            FlussError::InvalidServerRackInfoException => "The server rack info is invalid.",
+            FlussError::LakeSnapshotNotExist => "The lake snapshot does not exist.",
+            FlussError::LakeTableAlreadyExist => "The lake table already exists.",
+            FlussError::IneligibleReplicaException => {
+                "The new ISR contains at least one ineligible replica."
+            }
+            FlussError::InvalidAlterTableException => "The alter table is invalid.",
+            FlussError::DeletionDisabledException => {
+                "Deletion operations are disabled on this table."
+            }
+        }
+    }
+
+    /// Builds an `ApiError` with this error's code and `message`, or the default text if `None`.
+    pub fn to_api_error(&self, message: Option<String>) -> ApiError {
+        ApiError {
+            code: self.code(),
+            message: message.unwrap_or_else(|| self.message().to_string()),
+        }
+    }
+
+    /// Get the FlussError for the given error code.
+    /// Returns `UnknownServerError` if the code is not recognized.
+    pub fn for_code(code: i32) -> Self {
+        match code {
+            -1 => FlussError::UnknownServerError,
+            0 => FlussError::None,
+            1 => FlussError::NetworkException,
+            2 => FlussError::UnsupportedVersion,
+            3 => FlussError::CorruptMessage,
+            4 => FlussError::DatabaseNotExist,
+            5 => FlussError::DatabaseNotEmpty,
+            6 => FlussError::DatabaseAlreadyExist,
+            7 => FlussError::TableNotExist,
+            8 => FlussError::TableAlreadyExist,
+            9 => FlussError::SchemaNotExist,
+            10 => FlussError::LogStorageException,
+            11 => FlussError::KvStorageException,
+            12 => FlussError::NotLeaderOrFollower,
+            13 => FlussError::RecordTooLargeException,
+            14 => FlussError::CorruptRecordException,
+            15 => FlussError::InvalidTableException,
+            16 => FlussError::InvalidDatabaseException,
+            17 => FlussError::InvalidReplicationFactor,
+            18 => FlussError::InvalidRequiredAcks,
+            19 => FlussError::LogOffsetOutOfRangeException,
+            20 => FlussError::NonPrimaryKeyTableException,
+            21 => FlussError::UnknownTableOrBucketException,
+            22 => FlussError::InvalidUpdateVersionException,
+            23 => FlussError::InvalidCoordinatorException,
+            24 => FlussError::FencedLeaderEpochException,
+            25 => FlussError::RequestTimeOut,
+            26 => FlussError::StorageException,
+            27 => FlussError::OperationNotAttemptedException,
+            28 => FlussError::NotEnoughReplicasAfterAppendException,
+            29 => FlussError::NotEnoughReplicasException,
+            30 => FlussError::SecurityTokenException,
+            31 => FlussError::OutOfOrderSequenceException,
+            32 => FlussError::DuplicateSequenceException,
+            33 => FlussError::UnknownWriterIdException,
+            34 => FlussError::InvalidColumnProjection,
+            35 => FlussError::InvalidTargetColumn,
+            36 => FlussError::PartitionNotExists,
+            37 => FlussError::TableNotPartitionedException,
+            38 => FlussError::InvalidTimestampException,
+            39 => FlussError::InvalidConfigException,
+            40 => FlussError::LakeStorageNotConfiguredException,
+            41 => FlussError::KvSnapshotNotExist,
+            42 => FlussError::PartitionAlreadyExists,
+            43 => FlussError::PartitionSpecInvalidException,
+            44 => FlussError::LeaderNotAvailableException,
+            45 => FlussError::PartitionMaxNumException,
+            46 => FlussError::AuthenticateException,
+            47 => FlussError::SecurityDisabledException,
+            48 => FlussError::AuthorizationException,
+            49 => FlussError::BucketMaxNumException,
+            50 => FlussError::FencedTieringEpochException,
+            51 => FlussError::RetriableAuthenticateException,
+            52 => FlussError::InvalidServerRackInfoException,
+            53 => FlussError::LakeSnapshotNotExist,
+            54 => FlussError::LakeTableAlreadyExist,
+            55 => FlussError::IneligibleReplicaException,
+            56 => FlussError::InvalidAlterTableException,
+            57 => FlussError::DeletionDisabledException,
+            _ => FlussError::UnknownServerError,
+        }
+    }
+}
+
+impl Display for FlussError {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        f.write_str(self.message())
+    }
+}
+
+impl From<ErrorResponse> for ApiError {
+    fn from(error_response: ErrorResponse) -> Self {
+        FlussError::for_code(error_response.error_code)
+            .to_api_error(error_response.error_message)
+    }
+}
+
+impl From<ApiError> for FlussError {
+    fn from(api_error: ApiError) -> Self {
+        Self::for_code(api_error.code)
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/frame.rs b/fluss-rust/crates/fluss/src/rpc/frame.rs
index 44dadc9408..81cc0946d7 100644
--- a/fluss-rust/crates/fluss/src/rpc/frame.rs
+++ b/fluss-rust/crates/fluss/src/rpc/frame.rs
@@ -15,6 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use prost::DecodeError;
 use thiserror::Error;
 use tokio::io::{AsyncRead, AsyncReadExt, AsyncWrite, AsyncWriteExt};
 
@@ -29,6 +30,9 @@ pub enum ReadError {
 
     #[error("Message too large, limit is {limit} bytes but got {actual} bytes")]
     MessageTooLarge { limit: usize, actual: usize },
+
+    #[error("Fail to decode error response: {0}")]
+    ProtoErrorResponseDecodeError(#[from] DecodeError),
 }
 
 pub trait AsyncMessageRead {
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_database.rs b/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
index e4052ef361..7d24235a57 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
@@ -22,7 +22,8 @@ use crate::error::Result as FlussResult;
 use crate::proto::CreateDatabaseResponse;
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::ReadError;
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 
 use bytes::{Buf, BufMut};
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_table.rs b/fluss-rust/crates/fluss/src/rpc/message/create_table.rs
index 5802e71797..69865b8902 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/create_table.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_table.rs
@@ -23,7 +23,8 @@ use crate::proto::CreateTableResponse;
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::convert::to_table_path;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::ReadError;
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 
 use bytes::{Buf, BufMut};
diff --git a/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs b/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs
index 795eea1260..7e717a4e7a 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs
@@ -15,9 +15,11 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::rpc::frame::ReadError;
+
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 use bytes::{Buf, BufMut};
diff --git a/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs b/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs
index 49cbfaf8d4..663e970a91 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs
@@ -15,9 +15,11 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::rpc::frame::ReadError;
+
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 use bytes::{Buf, BufMut};
diff --git a/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs b/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs
index 0dbc21bbbe..a2b3f2d129 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs
@@ -19,10 +19,12 @@ use crate::metadata::TablePath;
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 
 use crate::proto::DropTableResponse;
+use crate::rpc::frame::ReadError;
+
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::convert::to_table_path;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 
 use bytes::{Buf, BufMut};
diff --git a/fluss-rust/crates/fluss/src/rpc/message/fetch.rs b/fluss-rust/crates/fluss/src/rpc/message/fetch.rs
index 6ebc5a2b33..15876069d7 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/fetch.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/fetch.rs
@@ -16,9 +16,11 @@
 // under the License.
 
 use crate::proto::FetchLogResponse;
+use crate::rpc::frame::ReadError;
+
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 use prost::Message;
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs b/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs
index 85492a8bf0..6468bebd5f 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs
@@ -15,9 +15,11 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::rpc::frame::ReadError;
+
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 use bytes::{Buf, BufMut};
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs b/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
index a0e186efd2..a632a1596d 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
@@ -19,10 +19,12 @@ use crate::proto;
 use crate::proto::PbTablePath;
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 
 use crate::metadata::TablePath;
+use crate::rpc::frame::ReadError;
+
 use crate::{impl_read_version_type, impl_write_version_type};
 use bytes::{Buf, BufMut};
 use prost::Message;
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_table.rs b/fluss-rust/crates/fluss/src/rpc/message/get_table.rs
index 4f4d6c7a41..61657f7a7c 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/get_table.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_table.rs
@@ -18,10 +18,12 @@
 use crate::proto::{GetTableInfoRequest, GetTableInfoResponse, PbTablePath};
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 
 use crate::metadata::TablePath;
+use crate::rpc::frame::ReadError;
+
 use crate::{impl_read_version_type, impl_write_version_type};
 use bytes::{Buf, BufMut};
 use prost::Message;
diff --git a/fluss-rust/crates/fluss/src/rpc/message/header.rs b/fluss-rust/crates/fluss/src/rpc/message/header.rs
index fe60f8c997..77bda7c78c 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/header.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/header.rs
@@ -15,11 +15,13 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::proto::ErrorResponse;
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::{ReadError, WriteError};
 use crate::rpc::message::{ReadVersionedType, WriteVersionedType};
 use bytes::{Buf, BufMut};
+use prost::Message;
 
 #[allow(dead_code)]
 const REQUEST_HEADER_LENGTH: i32 = 8;
@@ -53,9 +55,10 @@ where
     }
 }
 
-#[derive(Debug, PartialEq, Eq)]
+#[derive(Debug, PartialEq)]
 pub struct ResponseHeader {
     pub request_id: i32,
+    pub error_response: Option<ErrorResponse>,
 }
 
 impl<R> ReadVersionedType<R> for ResponseHeader
@@ -64,10 +67,17 @@ where
 {
     fn read_versioned(reader: &mut R, _version: ApiVersion) -> Result<Self, ReadError> {
         let resp_type = reader.get_u8();
+        let request_id = reader.get_i32();
         if resp_type != SUCCESS_RESPONSE {
-            todo!("handle unsuccess response type");
+            let error_response = ErrorResponse::decode(reader)?;
+            return Ok(ResponseHeader {
+                request_id,
+                error_response: Some(error_response),
+            });
         }
-        let request_id = reader.get_i32();
-        Ok(ResponseHeader { request_id })
+        Ok(ResponseHeader {
+            request_id,
+            error_response: None,
+        })
     }
 }
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs b/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
index ce5a091540..83226ab1a9 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
@@ -15,9 +15,11 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::rpc::frame::ReadError;
+
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 use bytes::{Buf, BufMut};
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
index 500db33e8c..9ab1f143f3 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
@@ -20,9 +20,11 @@ use crate::{impl_read_version_type, impl_write_version_type, proto};
 use crate::error::Error;
 use crate::error::Result as FlussResult;
 use crate::proto::ListOffsetsResponse;
+use crate::rpc::frame::ReadError;
+
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 use std::collections::HashMap;
 
@@ -108,12 +110,15 @@ impl ListOffsetsResponse {
             .map(|resp| {
                 if resp.error_code.is_some() {
                     // todo: consider use another suitable error
-                    Err(Error::WriteError(format!(
-                        "Missing offset, error message: {}",
-                        resp.error_message
-                            .as_deref()
-                            .unwrap_or("unknown server exception")
-                    )))
+                    Err(Error::UnexpectedError {
+                        message: format!(
+                            "Missing offset, error message: {}",
+                            resp.error_message
+                                .as_deref()
+                                .unwrap_or("unknown server exception")
+                        ),
+                        source: None,
+                    })
                 } else {
                     // if no error msg, offset must exists
                     Ok((resp.bucket_id, resp.offset.unwrap()))
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs b/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs
index daf57ea6b5..ff2497a063 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs
@@ -18,9 +18,11 @@
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 
 use crate::proto::ListTablesResponse;
+use crate::rpc::frame::ReadError;
+
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 
 use bytes::{Buf, BufMut};
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 0ed5b7c0e6..b619ee4023 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -38,6 +38,7 @@ mod produce_log;
 mod table_exists;
 mod update_metadata;
 
+pub use crate::rpc::RpcError;
 pub use create_database::*;
 pub use create_table::*;
 pub use database_exists::*;
diff --git a/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
index 7da2b59a2d..39bfb3f205 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
@@ -17,9 +17,11 @@
 
 use crate::error::Result as FlussResult;
 use crate::proto::{PbProduceLogReqForBucket, ProduceLogResponse};
+use crate::rpc::frame::ReadError;
+
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 use std::sync::Arc;
diff --git a/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs b/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs
index 3b71f471ac..ec982116b4 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs
@@ -22,12 +22,13 @@ use crate::proto::TableExistsResponse;
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::convert::to_table_path;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 
+use crate::rpc::frame::ReadError;
+
 use bytes::{Buf, BufMut};
 use prost::Message;
-
 #[derive(Debug)]
 pub struct TableExistsRequest {
     pub inner_request: proto::TableExistsRequest,
diff --git a/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs b/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
index 0d8ad6464a..a6e6288609 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
@@ -18,10 +18,12 @@
 use crate::proto::{MetadataResponse, PbTablePath};
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
-use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 
 use crate::metadata::TablePath;
+use crate::rpc::frame::ReadError;
+
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
diff --git a/fluss-rust/crates/fluss/src/rpc/mod.rs b/fluss-rust/crates/fluss/src/rpc/mod.rs
index b8705a3f65..86e13b1c4c 100644
--- a/fluss-rust/crates/fluss/src/rpc/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/mod.rs
@@ -17,7 +17,9 @@
 
 mod api_key;
 mod api_version;
-mod error;
+pub mod error;
+mod fluss_api_error;
+pub use fluss_api_error::{ApiError, FlussError};
 mod frame;
 pub mod message;
 pub use error::*;
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index c474534b61..fdeb56fbbe 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 use crate::cluster::ServerNode;
+use crate::error::Error;
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::error::RpcError;
 use crate::rpc::error::RpcError::ConnectionError;
@@ -230,7 +231,7 @@ where
         }
     }
 
-    pub async fn request<R>(&self, msg: R) -> Result<R::ResponseBody, RpcError>
+    pub async fn request<R>(&self, msg: R) -> Result<R::ResponseBody, Error>
     where
         R: RequestBody + Send + WriteVersionedType<Vec<u8>>,
         R::ResponseBody: ReadVersionedType<Cursor<Vec<u8>>>,
@@ -249,9 +250,12 @@ where
 
         let mut buf = Vec::new();
         // write header
-        header.write_versioned(&mut buf, header_version)?;
+        header
+            .write_versioned(&mut buf, header_version)
+            .map_err(RpcError::WriteMessageError)?;
         // write message body
-        msg.write_versioned(&mut buf, body_api_version)?;
+        msg.write_versioned(&mut buf, body_api_version)
+            .map_err(RpcError::WriteMessageError)?;
 
         let (tx, rx) = channel();
 
@@ -264,14 +268,21 @@ where
             ConnectionState::RequestMap(map) => {
                 map.insert(request_id, ActiveRequest { channel: tx });
             }
-            ConnectionState::Poison(e) => return Err(RpcError::Poisoned(Arc::clone(e))),
+            ConnectionState::Poison(e) => return Err(RpcError::Poisoned(Arc::clone(e)).into()),
         }
 
         self.send_message(buf).await?;
         _cleanup_on_cancel.message_sent();
         let mut response = rx.await.expect("Who closed this channel?!")?;
 
-        let body = R::ResponseBody::read_versioned(&mut response.data, body_api_version)?;
+        if let Some(error_response) = response.header.error_response {
+            return Err(Error::FlussAPIError {
+                api_error: crate::rpc::ApiError::from(error_response),
+            });
+        }
+
+        let body = R::ResponseBody::read_versioned(&mut response.data, body_api_version)
+            .map_err(RpcError::ReadMessageError)?;
 
         let read_bytes = response.data.position();
         let message_bytes = response.data.into_inner().len() as u64;
@@ -281,7 +292,8 @@ where
                 read: read_bytes,
                 api_key: R::API_KEY,
                 api_version: body_api_version,
-            });
+            }
+            .into());
         }
         Ok(body)
     }
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index 0086d9c03e..ccb717228e 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -34,6 +34,7 @@ static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>>
 mod admin_test {
     use super::SHARED_FLUSS_CLUSTER;
     use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
+    use fluss::error::FlussError;
     use fluss::metadata::{
         DataTypes, DatabaseDescriptorBuilder, KvFormat, LogFormat, Schema, TableDescriptor,
         TablePath,
@@ -251,4 +252,35 @@ mod admin_test {
         // database shouldn't exist now
         assert_eq!(admin.database_exists(test_db_name).await.unwrap(), false);
     }
+
+    #[tokio::test]
+    async fn test_fluss_error_response() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection
+            .get_admin()
+            .await
+            .expect("Failed to get admin client");
+
+        let table_path = TablePath::new("fluss".to_string(), "not_exist".to_string());
+
+        let result = admin.get_table(&table_path).await;
+        assert!(result.is_err(), "Expected error but got Ok");
+
+        let error = result.unwrap_err();
+        match error {
+            fluss::error::Error::FlussAPIError { api_error } => {
+                assert_eq!(
+                    api_error.code,
+                    FlussError::TableNotExist.code(),
+                    "Expected error code 7 (TableNotExist)"
+                );
+                assert_eq!(
+                    api_error.message, "Table 'fluss.not_exist' does not exist.",
+                    "Expected specific error message"
+                );
+            }
+            other => panic!("Expected FlussAPIError, got {:?}", other),
+        }
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index f52d526e37..ca61ff8502 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -38,8 +38,6 @@ mod table_remote_scan_test {
     use fluss::row::{GenericRow, InternalRow};
     use std::collections::HashMap;
     use std::sync::Arc;
-    use std::sync::atomic::AtomicUsize;
-    use std::sync::atomic::Ordering;
     use std::thread;
     use std::thread::sleep;
     use std::time::Duration;
@@ -89,11 +87,13 @@ mod table_remote_scan_test {
                     temp_dir.to_string_lossy().to_string(),
                 );
 
-                let cluster =
-                    FlussTestingClusterBuilder::new_with_cluster_conf("test_table", &cluster_conf)
-                        .with_remote_data_dir(temp_dir)
-                        .build()
-                        .await;
+                let cluster = FlussTestingClusterBuilder::new_with_cluster_conf(
+                    "test_table_remote",
+                    &cluster_conf,
+                )
+                .with_remote_data_dir(temp_dir)
+                .build()
+                .await;
                 let mut guard = cluster_guard.write();
                 *guard = Some(cluster);
             });

From 7772f15e8b1348549b2aa22cd3f63cc4a0e34b6f Mon Sep 17 00:00:00 2001
From: Kelvin Wu <kelvinyu1117@gmail.com>
Date: Sun, 21 Dec 2025 12:44:26 +0800
Subject: [PATCH 038/287] chore: Update the InternalRow Trait: get_binary,
 get_bytes to return &[u8] (#104)

---
 fluss-rust/bindings/cpp/src/types.rs      |  4 ++--
 fluss-rust/crates/fluss/src/row/column.rs |  6 ++----
 fluss-rust/crates/fluss/src/row/mod.rs    | 12 ++++++------
 3 files changed, 10 insertions(+), 12 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index f9404ac633..8221f22c9f 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -332,12 +332,12 @@ fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
             ArrowDataType::Binary => {
                 let mut datum = new_datum(DATUM_TYPE_BYTES);
                 // todo: avoid copy bytes for blob
-                datum.bytes_val = row.get_bytes(i);
+                datum.bytes_val = row.get_bytes(i).to_vec();
                 datum
             }
             ArrowDataType::FixedSizeBinary(len) => {
                 let mut datum = new_datum(DATUM_TYPE_BYTES);
-                datum.bytes_val = row.get_binary(i, *len as usize);
+                datum.bytes_val = row.get_binary(i, *len as usize).to_vec();
                 datum
             }
             ArrowDataType::LargeBinary => {
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 6d47836d9b..20d86c0297 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -156,23 +156,21 @@ impl InternalRow for ColumnarRow {
             .value(self.row_id)
     }
 
-    fn get_binary(&self, pos: usize, _length: usize) -> Vec<u8> {
+    fn get_binary(&self, pos: usize, _length: usize) -> &[u8] {
         self.record_batch
             .column(pos)
             .as_any()
             .downcast_ref::<FixedSizeBinaryArray>()
             .expect("Expected binary array.")
             .value(self.row_id)
-            .to_vec()
     }
 
-    fn get_bytes(&self, pos: usize) -> Vec<u8> {
+    fn get_bytes(&self, pos: usize) -> &[u8] {
         self.record_batch
             .column(pos)
             .as_any()
             .downcast_ref::<BinaryArray>()
             .expect("Expected bytes array.")
             .value(self.row_id)
-            .to_vec()
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 909f3b136f..dd1dedfeac 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -66,10 +66,10 @@ pub trait InternalRow {
     // fn get_timestamp_ltz(&self, pos: usize, precision: usize) -> TimestampLtz;
 
     /// Returns the binary value at the given position with fixed length
-    fn get_binary(&self, pos: usize, length: usize) -> Vec<u8>;
+    fn get_binary(&self, pos: usize, length: usize) -> &[u8];
 
     /// Returns the binary value at the given position
-    fn get_bytes(&self, pos: usize) -> Vec<u8>;
+    fn get_bytes(&self, pos: usize) -> &[u8];
 }
 
 pub struct GenericRow<'a> {
@@ -132,12 +132,12 @@ impl<'a> InternalRow for GenericRow<'a> {
         self.values.get(pos).unwrap().try_into().unwrap()
     }
 
-    fn get_binary(&self, pos: usize, _length: usize) -> Vec<u8> {
-        self.values.get(pos).unwrap().as_blob().to_vec()
+    fn get_binary(&self, pos: usize, _length: usize) -> &[u8] {
+        self.values.get(pos).unwrap().as_blob()
     }
 
-    fn get_bytes(&self, pos: usize) -> Vec<u8> {
-        self.values.get(pos).unwrap().as_blob().to_vec()
+    fn get_bytes(&self, pos: usize) -> &[u8] {
+        self.values.get(pos).unwrap().as_blob()
     }
 }
 

From f4b0628b21feb290a30b320c5c72d10b0da2a004 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 21 Dec 2025 13:06:02 +0800
Subject: [PATCH 039/287] chore: optimize get_char method (#105)

---
 fluss-rust/crates/fluss/src/row/column.rs | 14 +++-----------
 fluss-rust/crates/fluss/src/row/mod.rs    | 15 ++++-----------
 2 files changed, 7 insertions(+), 22 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 20d86c0297..31f0fdf298 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -126,7 +126,7 @@ impl InternalRow for ColumnarRow {
             .value(self.row_id)
     }
 
-    fn get_char(&self, pos: usize, length: usize) -> String {
+    fn get_char(&self, pos: usize, _length: usize) -> &str {
         let array = self
             .record_batch
             .column(pos)
@@ -135,16 +135,8 @@ impl InternalRow for ColumnarRow {
             .expect("Expected fixed-size binary array for char type");
 
         let bytes = array.value(self.row_id);
-        if bytes.len() != length {
-            panic!(
-                "Length mismatch for fixed-size char: expected {}, got {}",
-                length,
-                bytes.len()
-            );
-        }
-
-        String::from_utf8(bytes.to_vec())
-            .unwrap_or_else(|_| String::from_utf8_lossy(bytes).into_owned())
+        // don't check length, following java client
+        std::str::from_utf8(bytes).expect("Invalid UTF-8 in char field")
     }
 
     fn get_string(&self, pos: usize) -> &str {
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index dd1dedfeac..01b89fc9f4 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -51,7 +51,7 @@ pub trait InternalRow {
     fn get_double(&self, pos: usize) -> f64;
 
     /// Returns the string value at the given position with fixed length
-    fn get_char(&self, pos: usize, length: usize) -> String;
+    fn get_char(&self, pos: usize, length: usize) -> &str;
 
     /// Returns the string value at the given position
     fn get_string(&self, pos: usize) -> &str;
@@ -116,16 +116,9 @@ impl<'a> InternalRow for GenericRow<'a> {
         self.values.get(pos).unwrap().try_into().unwrap()
     }
 
-    fn get_char(&self, pos: usize, length: usize) -> String {
-        let value = self.get_string(pos);
-        if value.len() != length {
-            panic!(
-                "Length mismatch for fixed-size char: expected {}, got {}",
-                length,
-                value.len()
-            );
-        }
-        value.to_string()
+    fn get_char(&self, pos: usize, _length: usize) -> &str {
+        // don't check length, following java client
+        self.get_string(pos)
     }
 
     fn get_string(&self, pos: usize) -> &str {

From f55375905c42bc6e3d9e2a526928a950d0d190b2 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Sun, 21 Dec 2025 15:19:56 +0800
Subject: [PATCH 040/287] feat: support ListOffset/SubscribeBatch/DropTable for
 cpp bindings (#100)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---------

Co-authored-by: 赵海源 <zhaohaiyuan@xiaohongshu.com>
---
 fluss-rust/bindings/cpp/examples/example.cpp  |  99 +++++++++++++-
 fluss-rust/bindings/cpp/include/fluss.hpp     |  32 +++++
 fluss-rust/bindings/cpp/src/admin.cpp         |  42 ++++++
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |   1 +
 fluss-rust/bindings/cpp/src/lib.rs            | 122 ++++++++++++++++++
 fluss-rust/bindings/cpp/src/table.cpp         |  17 +++
 fluss-rust/bindings/cpp/src/types.rs          |   4 +-
 fluss-rust/crates/fluss/src/client/admin.rs   |   7 +
 .../crates/fluss/src/client/table/scanner.rs  |  22 ++++
 9 files changed, 340 insertions(+), 6 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 5146f28216..04f9ac64f5 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -19,6 +19,8 @@
 
 #include <iostream>
 #include <vector>
+#include <unordered_map>
+#include <chrono>
 
 static void check(const char* step, const fluss::Result& r) {
     if (!r.Ok()) {
@@ -37,6 +39,17 @@ int main() {
     fluss::Admin admin;
     check("get_admin", conn.GetAdmin(admin));
 
+    fluss::TablePath table_path("fluss", "sample_table_cpp_v1");
+    
+    // 2.1) Drop table if exists
+    std::cout << "Dropping table if exists..." << std::endl;
+    auto drop_result = admin.DropTable(table_path, true);
+    if (drop_result.Ok()) {
+        std::cout << "Table dropped successfully" << std::endl;
+    } else {
+        std::cout << "Table drop result: " << drop_result.error_message << std::endl;
+    }
+
     // 3) Schema & descriptor
     auto schema = fluss::Schema::NewBuilder()
                         .AddColumn("id", fluss::DataType::Int)
@@ -47,14 +60,14 @@ int main() {
 
     auto descriptor = fluss::TableDescriptor::NewBuilder()
                           .SetSchema(schema)
-                          .SetBucketCount(1)
+                          .SetBucketCount(3)
                           .SetProperty("table.log.arrow.compression.type", "NONE")
-                          .SetComment("cpp example table")
+                          .SetComment("cpp example table with 3 buckets")
                           .Build();
 
-    fluss::TablePath table_path("fluss", "sample_table_cpp_v1");
-    // ignore_if_exists=true to allow re-run
-    check("create_table", admin.CreateTable(table_path, descriptor, true));
+    // 3.1) Create table with 3 buckets
+    std::cout << "Creating table with 3 buckets..." << std::endl;
+    check("create_table", admin.CreateTable(table_path, descriptor, false));
 
     // 4) Get table
     fluss::Table table;
@@ -162,5 +175,81 @@ int main() {
         std::exit(1);
     }
 
+    // 8) List offsets examples
+    std::cout << "\n=== List Offsets Examples ===" << std::endl;
+    
+    // 8.1) Query earliest offsets for all buckets
+    std::vector<int32_t> all_bucket_ids;
+    for (int b = 0; b < buckets; ++b) {
+        all_bucket_ids.push_back(b);
+    }
+    
+    std::unordered_map<int32_t, int64_t> earliest_offsets;
+    check("list_earliest_offsets", 
+          admin.ListOffsets(table_path, all_bucket_ids, 
+                           fluss::OffsetQuery::Earliest(), 
+                           earliest_offsets));
+    std::cout << "Earliest offsets:" << std::endl;
+    for (const auto& [bucket_id, offset] : earliest_offsets) {
+        std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
+    }
+    
+    // 8.2) Query latest offsets for all buckets
+    std::unordered_map<int32_t, int64_t> latest_offsets;
+    check("list_latest_offsets", 
+          admin.ListOffsets(table_path, all_bucket_ids, 
+                           fluss::OffsetQuery::Latest(), 
+                           latest_offsets));
+    std::cout << "Latest offsets:" << std::endl;
+    for (const auto& [bucket_id, offset] : latest_offsets) {
+        std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
+    }
+    
+    // 8.3) Query offsets for a specific timestamp (current time - 1 hour)
+    auto now = std::chrono::system_clock::now();
+    auto one_hour_ago = now - std::chrono::hours(1);
+    auto timestamp_ms = std::chrono::duration_cast<std::chrono::milliseconds>(
+        one_hour_ago.time_since_epoch()).count();
+    
+    std::unordered_map<int32_t, int64_t> timestamp_offsets;
+    check("list_timestamp_offsets", 
+          admin.ListOffsets(table_path, all_bucket_ids, 
+                           fluss::OffsetQuery::FromTimestamp(timestamp_ms), 
+                           timestamp_offsets));
+    std::cout << "Offsets for timestamp " << timestamp_ms << " (1 hour ago):" << std::endl;
+    for (const auto& [bucket_id, offset] : timestamp_offsets) {
+        std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
+    }
+    
+    // 8.4) Use batch subscribe with offsets from list_offsets
+    std::cout << "\n=== Batch Subscribe Example ===" << std::endl;
+    fluss::LogScanner batch_scanner;
+    check("new_log_scanner_for_batch", table.NewLogScanner(batch_scanner));
+    
+    std::vector<fluss::BucketSubscription> subscriptions;
+    for (const auto& [bucket_id, offset] : earliest_offsets) {
+        subscriptions.push_back({bucket_id, offset});
+        std::cout << "Preparing subscription: bucket=" << bucket_id 
+                  << ", offset=" << offset << std::endl;
+    }
+    
+    check("subscribe_batch", batch_scanner.Subscribe(subscriptions));
+    std::cout << "Batch subscribed to " << subscriptions.size() << " buckets" << std::endl;
+    
+    // 8.5) Poll and verify bucket_id in records
+    fluss::ScanRecords batch_records;
+    check("poll_batch", batch_scanner.Poll(5000, batch_records));
+    
+    std::cout << "Scanned " << batch_records.Size() << " records from batch subscription" << std::endl;
+    for (size_t i = 0; i < batch_records.Size() && i < 5; ++i) {
+        const auto& rec = batch_records[i];
+        std::cout << "  Record " << i << ": bucket_id=" << rec.bucket_id 
+                  << ", offset=" << rec.offset 
+                  << ", timestamp=" << rec.timestamp << std::endl;
+    }
+    if (batch_records.Size() > 5) {
+        std::cout << "  ... and " << (batch_records.Size() - 5) << " more records" << std::endl;
+    }
+
     return 0;
 }
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 002f80694a..479adf97a9 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -63,6 +63,24 @@ enum class DatumType {
     Bytes = 7,
 };
 
+constexpr int64_t EARLIEST_OFFSET = -2;
+constexpr int64_t LATEST_OFFSET = -1;
+
+// Selects which offset Admin::ListOffsets resolves for each bucket.
+//
+// The numeric values cross the FFI boundary as FfiOffsetQuery::offset_type
+// and are matched as 0 / 1 / 2 on the Rust side, so they must stay in sync
+// with that mapping.
+enum class OffsetSpec {
+    Earliest = 0,
+    Latest = 1,
+    Timestamp = 2,
+};
+
+// Describes an offset lookup: the kind of offset to resolve plus the
+// timestamp that accompanies OffsetSpec::Timestamp.
+struct OffsetQuery {
+    OffsetSpec spec;
+    // Set to 0 by the Earliest()/Latest() factories. The bundled example
+    // passes a millisecond timestamp here — NOTE(review): confirm the unit
+    // expected by the server.
+    int64_t timestamp{0};
+
+    // Factory helpers so callers do not have to spell out both fields.
+    static OffsetQuery Earliest() { return {OffsetSpec::Earliest, 0}; }
+    static OffsetQuery Latest() { return {OffsetSpec::Latest, 0}; }
+    static OffsetQuery FromTimestamp(int64_t ts) { return {OffsetSpec::Timestamp, ts}; }
+};
+
 struct Result {
     int32_t error_code{0};
     std::string error_message;
@@ -301,6 +319,7 @@ struct GenericRow {
 };
 
 struct ScanRecord {
+    int32_t bucket_id;
     int64_t offset;
     int64_t timestamp;
     GenericRow row;
@@ -324,6 +343,11 @@ struct BucketOffset {
     int64_t offset;
 };
 
+// One entry of a batch subscription: the bucket to read and the offset to
+// start from. Consumed by LogScanner::Subscribe(const std::vector<...>&).
+struct BucketSubscription {
+    int32_t bucket_id;
+    int64_t offset;
+};
+
 struct LakeSnapshot {
     int64_t snapshot_id;
     std::vector<BucketOffset> bucket_offsets;
@@ -372,10 +396,17 @@ class Admin {
                        const TableDescriptor& descriptor,
                        bool ignore_if_exists = false);
 
+    Result DropTable(const TablePath& table_path, bool ignore_if_not_exists = false);
+
     Result GetTable(const TablePath& table_path, TableInfo& out);
 
     Result GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& out);
 
+    Result ListOffsets(const TablePath& table_path,
+                       const std::vector<int32_t>& bucket_ids,
+                       const OffsetQuery& offset_query,
+                       std::unordered_map<int32_t, int64_t>& out);
+
 private:
     friend class Connection;
     Admin(ffi::Admin* admin) noexcept;
@@ -448,6 +479,7 @@ class LogScanner {
     bool Available() const;
 
     Result Subscribe(int32_t bucket_id, int64_t start_offset);
+    Result Subscribe(const std::vector<BucketSubscription>& bucket_offsets);
     Result Poll(int64_t timeout_ms, ScanRecords& out);
 
 private:
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index f6997a640a..bf9c712f4e 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -66,6 +66,16 @@ Result Admin::CreateTable(const TablePath& table_path,
     return utils::from_ffi_result(ffi_result);
 }
 
+// Drops the table at `table_path` through the FFI admin handle.
+// `ignore_if_not_exists` is forwarded unchanged to the Rust side.
+// Returns an error Result (code 1) when Available() is false.
+Result Admin::DropTable(const TablePath& table_path, bool ignore_if_not_exists) {
+    if (Available()) {
+        auto path_arg = utils::to_ffi_table_path(table_path);
+        auto outcome = admin_->drop_table(path_arg, ignore_if_not_exists);
+        return utils::from_ffi_result(outcome);
+    }
+
+    return utils::make_error(1, "Admin not available");
+}
+
 Result Admin::GetTable(const TablePath& table_path, TableInfo& out) {
     if (!Available()) {
         return utils::make_error(1, "Admin not available");
@@ -98,4 +108,36 @@ Result Admin::GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& o
     return result;
 }
 
+// Queries offsets for `bucket_ids` of `table_path` according to `offset_query`.
+// On success `out` is cleared and refilled with bucket_id -> offset; on
+// failure `out` is left untouched and the error Result is returned.
+Result Admin::ListOffsets(const TablePath& table_path,
+                          const std::vector<int32_t>& bucket_ids,
+                          const OffsetQuery& offset_query,
+                          std::unordered_map<int32_t, int64_t>& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_path = utils::to_ffi_table_path(table_path);
+
+    // The enum value travels across the FFI boundary as a plain int32.
+    ffi::FfiOffsetQuery query_arg;
+    query_arg.offset_type = static_cast<int32_t>(offset_query.spec);
+    query_arg.timestamp = offset_query.timestamp;
+
+    // Copy the ids into a rust::Vec, which is what the Rust side takes by value.
+    rust::Vec<int32_t> ids_arg;
+    for (const int32_t bucket : bucket_ids) {
+        ids_arg.push_back(bucket);
+    }
+
+    auto response = admin_->list_offsets(ffi_path, std::move(ids_arg), query_arg);
+
+    auto status = utils::from_ffi_result(response.result);
+    if (!status.Ok()) {
+        return status;
+    }
+
+    out.clear();
+    for (const auto& entry : response.bucket_offsets) {
+        out[entry.bucket_id] = entry.offset;
+    }
+    return status;
+}
+
 }  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 52dd7fe5d4..63a2e91a7b 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -222,6 +222,7 @@ inline GenericRow from_ffi_generic_row(const ffi::FfiGenericRow& ffi_row) {
 
 inline ScanRecord from_ffi_scan_record(const ffi::FfiScanRecord& ffi_record) {
     return ScanRecord{
+        ffi_record.bucket_id,
         ffi_record.offset,
         ffi_record.timestamp,
         from_ffi_generic_row(ffi_record.row)};
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 54d6941379..cd1803b888 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -104,6 +104,7 @@ mod ffi {
     }
 
     struct FfiScanRecord {
+        bucket_id: i32,
         offset: i64,
         timestamp: i64,
         row: FfiGenericRow,
@@ -130,6 +131,26 @@ mod ffi {
         offset: i64,
     }
 
+    struct FfiOffsetQuery {
+        offset_type: i32,
+        timestamp: i64,
+    }
+
+    struct FfiBucketSubscription {
+        bucket_id: i32,
+        offset: i64,
+    }
+
+    struct FfiBucketOffsetPair {
+        bucket_id: i32,
+        offset: i64,
+    }
+
+    struct FfiListOffsetsResult {
+        result: FfiResult,
+        bucket_offsets: Vec<FfiBucketOffsetPair>,
+    }
+
     struct FfiLakeSnapshotResult {
         result: FfiResult,
         lake_snapshot: FfiLakeSnapshot,
@@ -156,11 +177,22 @@ mod ffi {
             descriptor: &FfiTableDescriptor,
             ignore_if_exists: bool,
         ) -> FfiResult;
+        fn drop_table(
+            self: &Admin,
+            table_path: &FfiTablePath,
+            ignore_if_not_exists: bool,
+        ) -> FfiResult;
         fn get_table_info(self: &Admin, table_path: &FfiTablePath) -> FfiTableInfoResult;
         fn get_latest_lake_snapshot(
             self: &Admin,
             table_path: &FfiTablePath,
         ) -> FfiLakeSnapshotResult;
+        fn list_offsets(
+            self: &Admin,
+            table_path: &FfiTablePath,
+            bucket_ids: Vec<i32>,
+            offset_query: &FfiOffsetQuery,
+        ) -> FfiListOffsetsResult;
 
         // Table
         unsafe fn delete_table(table: *mut Table);
@@ -182,6 +214,10 @@ mod ffi {
         // LogScanner
         unsafe fn delete_log_scanner(scanner: *mut LogScanner);
         fn subscribe(self: &LogScanner, bucket_id: i32, start_offset: i64) -> FfiResult;
+        fn subscribe_batch(
+            self: &LogScanner,
+            subscriptions: Vec<FfiBucketSubscription>,
+        ) -> FfiResult;
         fn poll(self: &LogScanner, timeout_ms: i64) -> FfiScanRecordsResult;
     }
 }
@@ -330,6 +366,25 @@ impl Admin {
         }
     }
 
+    /// Drops the table identified by `table_path`, blocking on the shared runtime.
+    ///
+    /// Any error from the core client is reported as an `FfiResult` with code 1
+    /// and the error's display text.
+    fn drop_table(
+        &self,
+        table_path: &ffi::FfiTablePath,
+        ignore_if_not_exists: bool,
+    ) -> ffi::FfiResult {
+        let database = table_path.database_name.clone();
+        let table = table_path.table_name.clone();
+        let path = fcore::metadata::TablePath::new(database, table);
+
+        match RUNTIME.block_on(async { self.inner.drop_table(&path, ignore_if_not_exists).await }) {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
+
     fn get_table_info(&self, table_path: &ffi::FfiTablePath) -> ffi::FfiTableInfoResult {
         let path = fcore::metadata::TablePath::new(
             table_path.database_name.clone(),
@@ -375,6 +430,58 @@ impl Admin {
             },
         }
     }
+
+    /// Resolves offsets for `bucket_ids` of `table_path`, blocking on the shared runtime.
+    ///
+    /// `offset_query.offset_type` is decoded as 0 = earliest, 1 = latest,
+    /// 2 = timestamp (using `offset_query.timestamp`); any other value yields an
+    /// error result. Every failure carries code 1 and an empty `bucket_offsets`.
+    fn list_offsets(
+        &self,
+        table_path: &ffi::FfiTablePath,
+        bucket_ids: Vec<i32>,
+        offset_query: &ffi::FfiOffsetQuery,
+    ) -> ffi::FfiListOffsetsResult {
+        use fcore::rpc::message::OffsetSpec;
+
+        // All failure paths share one shape: an error result and no offsets.
+        let failure = |message: String| ffi::FfiListOffsetsResult {
+            result: err_result(1, message),
+            bucket_offsets: vec![],
+        };
+
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+
+        let offset_spec = match offset_query.offset_type {
+            0 => OffsetSpec::Earliest,
+            1 => OffsetSpec::Latest,
+            2 => OffsetSpec::Timestamp(offset_query.timestamp),
+            other => return failure(format!("Invalid offset_type: {other}")),
+        };
+
+        let outcome = RUNTIME.block_on(async {
+            self.inner
+                .list_offsets(&path, &bucket_ids, offset_spec)
+                .await
+        });
+
+        let offsets = match outcome {
+            Ok(offsets) => offsets,
+            Err(e) => return failure(e.to_string()),
+        };
+
+        let mut bucket_offsets = Vec::new();
+        for (bucket_id, offset) in offsets {
+            bucket_offsets.push(ffi::FfiBucketOffsetPair { bucket_id, offset });
+        }
+
+        ffi::FfiListOffsetsResult {
+            result: ok_result(),
+            bucket_offsets,
+        }
+    }
 }
 
 // Table implementation
@@ -511,6 +618,21 @@ impl LogScanner {
         }
     }
 
+    /// Subscribes to several buckets in one call, blocking on the shared runtime.
+    ///
+    /// The subscriptions are folded into a `bucket_id -> offset` map, so when a
+    /// bucket id appears more than once the last entry wins.
+    fn subscribe_batch(&self, subscriptions: Vec<ffi::FfiBucketSubscription>) -> ffi::FfiResult {
+        use std::collections::HashMap;
+
+        let bucket_offsets: HashMap<i32, i64> = subscriptions
+            .into_iter()
+            .map(|sub| (sub.bucket_id, sub.offset))
+            .collect();
+
+        match RUNTIME.block_on(async { self.inner.subscribe_batch(bucket_offsets).await }) {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
+
     fn poll(&self, timeout_ms: i64) -> ffi::FfiScanRecordsResult {
         let timeout = Duration::from_millis(timeout_ms as u64);
         let result = RUNTIME.block_on(async { self.inner.poll(timeout).await });
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index b28b783ee8..d42e1a2299 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -210,6 +210,23 @@ Result LogScanner::Subscribe(int32_t bucket_id, int64_t start_offset) {
     return utils::from_ffi_result(ffi_result);
 }
 
+// Batch variant of Subscribe: converts every BucketSubscription into its FFI
+// counterpart and hands the whole list to the Rust scanner in one call.
+// Returns an error Result (code 1) when Available() is false.
+Result LogScanner::Subscribe(const std::vector<BucketSubscription>& bucket_offsets) {
+    if (!Available()) {
+        return utils::make_error(1, "LogScanner not available");
+    }
+
+    rust::Vec<ffi::FfiBucketSubscription> ffi_subs;
+    for (const auto& entry : bucket_offsets) {
+        // Field order is (bucket_id, offset), matching the FFI struct declaration.
+        ffi_subs.push_back(ffi::FfiBucketSubscription{entry.bucket_id, entry.offset});
+    }
+
+    auto outcome = scanner_->subscribe_batch(std::move(ffi_subs));
+    return utils::from_ffi_result(outcome);
+}
+
 Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
     if (!Available()) {
         return utils::make_error(1, "LogScanner not available");
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 8221f22c9f..d95da14212 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -233,12 +233,14 @@ pub fn core_scan_records_to_ffi(records: &fcore::record::ScanRecords) -> ffi::Ff
     let mut ffi_records = Vec::new();
 
     // Iterate over all buckets and their records
-    for bucket_records in records.records_by_buckets().values() {
+    for (table_bucket, bucket_records) in records.records_by_buckets() {
+        let bucket_id = table_bucket.bucket_id();
         for record in bucket_records {
             let row = record.row();
             let fields = core_row_to_ffi_fields(row);
 
             ffi_records.push(ffi::FfiScanRecord {
+                bucket_id,
                 offset: record.offset(),
                 timestamp: record.timestamp(),
                 row: ffi::FfiGenericRow { fields },
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index e185af84ac..6646f97cf8 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -232,6 +232,13 @@ impl FlussAdmin {
             .check_and_update_table_metadata(from_ref(table_path))
             .await?;
 
+        if buckets_id.is_empty() {
+            return Err(Error::UnexpectedError {
+                message: "Buckets are empty.".to_string(),
+                source: None,
+            });
+        }
+
         let cluster = self.metadata.get_cluster();
         let table_id = cluster.get_table(table_path).table_id;
 
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 1e70649e0b..a9384d905a 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -185,6 +185,28 @@ impl LogScanner {
         Ok(())
     }
 
+    /// Subscribes this scanner to several buckets in one call.
+    ///
+    /// Table metadata is refreshed first; an empty `bucket_offsets` map is then
+    /// rejected with `Error::UnexpectedError`. Each `bucket_id -> offset` entry is
+    /// re-keyed by a `TableBucket` of this scanner's table and handed to the
+    /// scanner status.
+    pub async fn subscribe_batch(&self, bucket_offsets: HashMap<i32, i64>) -> Result<()> {
+        self.metadata
+            .check_and_update_table_metadata(from_ref(&self.table_path))
+            .await?;
+
+        if bucket_offsets.is_empty() {
+            return Err(Error::UnexpectedError {
+                message: "Bucket offsets are empty.".to_string(),
+                source: None,
+            });
+        }
+
+        let scan_bucket_offsets: HashMap<TableBucket, i64> = bucket_offsets
+            .into_iter()
+            .map(|(bucket_id, offset)| (TableBucket::new(self.table_id, bucket_id), offset))
+            .collect();
+
+        self.log_scanner_status
+            .assign_scan_buckets(scan_bucket_offsets);
+        Ok(())
+    }
+
     async fn poll_for_fetches(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
         self.log_fetcher.send_fetches_and_collect().await
     }

From 39189175320e7453e8ad80537d61541741a82d54 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 21 Dec 2025 15:22:05 +0800
Subject: [PATCH 041/287] chore: introduce prefetch to improve log poll
 performance (#103)

---
 fluss-rust/crates/fluss/Cargo.toml            |   1 +
 .../crates/fluss/src/client/credentials.rs    |  30 +-
 .../src/client/table/log_fetch_buffer.rs      | 376 +++++++++++
 .../crates/fluss/src/client/table/mod.rs      |   1 +
 .../fluss/src/client/table/remote_log.rs      | 195 ++++--
 .../crates/fluss/src/client/table/scanner.rs  | 586 ++++++++++++++----
 fluss-rust/crates/fluss/src/record/arrow.rs   | 113 ++--
 .../crates/fluss/tests/integration/table.rs   |   6 +-
 .../tests/integration/table_remote_scan.rs    |   8 +-
 9 files changed, 1077 insertions(+), 239 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs

diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index cdba9de5a4..27604eecd8 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -58,6 +58,7 @@ url = "2.5.7"
 uuid = { version = "1.10", features = ["v4"] }
 tempfile = "3.23.0"
 snafu = "0.8.3"
+scopeguard = "1.2.0"
 
 [target.'cfg(target_arch = "wasm32")'.dependencies]
 jiff = { workspace = true, features = ["js"] }
diff --git a/fluss-rust/crates/fluss/src/client/credentials.rs b/fluss-rust/crates/fluss/src/client/credentials.rs
index 6b07d08eb1..8adfe48b99 100644
--- a/fluss-rust/crates/fluss/src/client/credentials.rs
+++ b/fluss-rust/crates/fluss/src/client/credentials.rs
@@ -90,20 +90,20 @@ fn convert_hadoop_key_to_opendal(hadoop_key: &str) -> Option<(String, bool)> {
 
 pub struct CredentialsCache {
     inner: RwLock<Option<CachedToken>>,
+    rpc_client: Arc<RpcClient>,
+    metadata: Arc<Metadata>,
 }
 
 impl CredentialsCache {
-    pub fn new() -> Self {
+    pub fn new(rpc_client: Arc<RpcClient>, metadata: Arc<Metadata>) -> Self {
         Self {
             inner: RwLock::new(None),
+            rpc_client,
+            metadata,
         }
     }
 
-    pub async fn get_or_refresh(
-        &self,
-        rpc_client: &Arc<RpcClient>,
-        metadata: &Arc<Metadata>,
-    ) -> Result<HashMap<String, String>> {
+    pub async fn get_or_refresh(&self) -> Result<HashMap<String, String>> {
         {
             let guard = self.inner.read();
             if let Some(cached) = guard.as_ref() {
@@ -113,17 +113,13 @@ impl CredentialsCache {
             }
         }
 
-        self.refresh_from_server(rpc_client, metadata).await
+        self.refresh_from_server().await
     }
 
-    async fn refresh_from_server(
-        &self,
-        rpc_client: &Arc<RpcClient>,
-        metadata: &Arc<Metadata>,
-    ) -> Result<HashMap<String, String>> {
-        let cluster = metadata.get_cluster();
+    async fn refresh_from_server(&self) -> Result<HashMap<String, String>> {
+        let cluster = self.metadata.get_cluster();
         let server_node = cluster.get_one_available_server();
-        let conn = rpc_client.get_connection(server_node).await?;
+        let conn = self.rpc_client.get_connection(server_node).await?;
 
         let request = GetSecurityTokenRequest::new();
         let response = conn.request(request).await?;
@@ -158,9 +154,3 @@ impl CredentialsCache {
         Ok(props)
     }
 }
-
-impl Default for CredentialsCache {
-    fn default() -> Self {
-        Self::new()
-    }
-}
diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
new file mode 100644
index 0000000000..cee104e020
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -0,0 +1,376 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Result;
+use crate::metadata::TableBucket;
+use crate::record::{
+    LogRecordBatch, LogRecordIterator, LogRecordsBatches, ReadContext, ScanRecord,
+};
+use parking_lot::Mutex;
+use std::collections::{HashMap, VecDeque};
+use std::sync::Arc;
+use std::sync::atomic::{AtomicBool, Ordering};
+use std::time::Duration;
+use tokio::sync::Notify;
+
+/// Represents a completed fetch that can be consumed
+///
+/// A completed fetch belongs to a single bucket and hands its records out in
+/// chunks through `fetch_records`. The per-method notes below describe what
+/// `DefaultCompletedFetch` does; other implementations are presumably expected
+/// to behave the same way.
+pub trait CompletedFetch: Send + Sync {
+    /// The bucket this fetch belongs to.
+    fn table_bucket(&self) -> &TableBucket;
+    /// Returns up to `max_records` further records; empty once the fetch is consumed.
+    fn fetch_records(&mut self, max_records: usize) -> Result<Vec<ScanRecord>>;
+    /// Whether the fetch has been marked consumed (see `drain`).
+    fn is_consumed(&self) -> bool;
+    /// Marks the fetch as consumed so later `fetch_records` calls return nothing.
+    fn drain(&mut self);
+    /// Size in bytes associated with this fetch, as supplied at construction.
+    fn size_in_bytes(&self) -> usize;
+    /// High watermark associated with this fetch, as supplied at construction.
+    fn high_watermark(&self) -> i64;
+    /// Whether `set_initialized` has been called.
+    /// NOTE(review): what "initialized" implies is decided by the caller — confirm in the scanner.
+    fn is_initialized(&self) -> bool;
+    /// Flags the fetch as initialized.
+    fn set_initialized(&mut self);
+    /// Offset the next fetch for this bucket should start from, given what has been consumed.
+    fn next_fetch_offset(&self) -> i64;
+}
+
+/// Represents a pending fetch that is waiting to be completed
+///
+/// Pending fetches are queued per bucket in `LogFetchBuffer` and are converted,
+/// front to back, once they report completion.
+pub trait PendingFetch: Send + Sync {
+    /// The bucket this fetch belongs to; used as the queue key in the buffer.
+    fn table_bucket(&self) -> &TableBucket;
+    /// Whether the fetch can be converted with `to_completed_fetch` now.
+    fn is_completed(&self) -> bool;
+    /// Consumes the pending fetch and produces the completed fetch, or an error.
+    fn to_completed_fetch(self: Box<Self>) -> Result<Box<dyn CompletedFetch>>;
+}
+
+/// Thread-safe buffer for completed fetches
+///
+/// Each collection sits behind its own mutex; `Notify` is used to wake tasks
+/// waiting in `await_not_empty`.
+pub struct LogFetchBuffer {
+    /// FIFO of fetches ready to be consumed via `poll`.
+    completed_fetches: Mutex<VecDeque<Box<dyn CompletedFetch>>>,
+    /// Per-bucket FIFO of fetches that are not (or not yet known to be) completed.
+    pending_fetches: Mutex<HashMap<TableBucket, VecDeque<Box<dyn PendingFetch>>>>,
+    /// Single slot for a fetch the consumer parked via `set_next_in_line_fetch`.
+    next_in_line_fetch: Mutex<Option<Box<dyn CompletedFetch>>>,
+    /// Signalled when a completed fetch is queued or `wakeup` is called.
+    not_empty_notify: Notify,
+    /// Set by `wakeup`, cleared by `await_not_empty` when it observes it.
+    woken_up: Arc<AtomicBool>,
+}
+
+impl LogFetchBuffer {
+    /// Creates an empty buffer: no completed or pending fetches, no
+    /// next-in-line fetch, and the wake-up flag cleared.
+    pub fn new() -> Self {
+        Self {
+            completed_fetches: Mutex::new(VecDeque::new()),
+            pending_fetches: Mutex::new(HashMap::new()),
+            next_in_line_fetch: Mutex::new(None),
+            not_empty_notify: Notify::new(),
+            woken_up: Arc::new(AtomicBool::new(false)),
+        }
+    }
+
+    /// Check if the buffer is empty
+    ///
+    /// Only the completed-fetch queue is consulted; pending fetches and the
+    /// next-in-line slot are not taken into account.
+    pub fn is_empty(&self) -> bool {
+        self.completed_fetches.lock().is_empty()
+    }
+
+    /// Wait for the buffer to become non-empty, with timeout
+    ///
+    /// Returns `true` if a completed fetch is available or `wakeup` was called
+    /// (the wake-up flag is cleared when it is observed here), and `false` once
+    /// `timeout` has elapsed without either.
+    pub async fn await_not_empty(&self, timeout: Duration) -> bool {
+        let deadline = std::time::Instant::now() + timeout;
+
+        loop {
+            // Register interest *before* inspecting the state. `notify_waiters`
+            // stores no permit, so a notification sent between the checks below
+            // and the creation of this future would otherwise be lost and the
+            // caller would sleep for the whole timeout although data is ready.
+            let notified = self.not_empty_notify.notified();
+
+            // Check if buffer is not empty
+            if !self.is_empty() {
+                return true;
+            }
+
+            // Check if woken up
+            if self.woken_up.swap(false, Ordering::Acquire) {
+                return true;
+            }
+
+            // Check if timeout
+            let now = std::time::Instant::now();
+            if now >= deadline {
+                return false;
+            }
+
+            // Wait for notification with remaining time
+            let remaining = deadline - now;
+            tokio::select! {
+                _ = tokio::time::sleep(remaining) => {
+                    return false; // Timeout
+                }
+                _ = notified => {
+                    // Got notification, check again
+                    continue;
+                }
+            }
+        }
+    }
+
+    #[allow(dead_code)]
+    /// Wake up any tasks waiting in `await_not_empty`
+    ///
+    /// The flag is stored before notifying so that a woken waiter observes it
+    /// and returns `true` even though no fetch was added.
+    pub fn wakeup(&self) {
+        self.woken_up.store(true, Ordering::Release);
+        self.not_empty_notify.notify_waiters();
+    }
+
+    /// Add a pending fetch to the buffer
+    ///
+    /// The fetch is appended to the FIFO of its bucket; the queue is created on
+    /// first use. No waiter is notified here.
+    pub fn pend(&self, pending_fetch: Box<dyn PendingFetch>) {
+        let table_bucket = pending_fetch.table_bucket().clone();
+        self.pending_fetches
+            .lock()
+            .entry(table_bucket)
+            .or_default()
+            .push_back(pending_fetch);
+    }
+
+    /// Try to complete pending fetches in order, converting them to completed fetches
+    ///
+    /// Walks the pending queue of `table_bucket` from the front and stops at the
+    /// first fetch that is not completed yet. Fetches whose conversion fails are
+    /// logged and dropped. Waiters are notified only if at least one fetch was
+    /// moved to the completed queue.
+    pub fn try_complete(&self, table_bucket: &TableBucket) {
+        // Collect completed fetches while holding the pending_fetches lock,
+        // then push them to completed_fetches after releasing it to avoid
+        // holding both locks simultaneously.
+        let mut completed_to_push: Vec<Box<dyn CompletedFetch>> = Vec::new();
+        {
+            let mut pending_map = self.pending_fetches.lock();
+            if let Some(pendings) = pending_map.get_mut(table_bucket) {
+                while pendings.front().is_some_and(|front| front.is_completed()) {
+                    let Some(pending) = pendings.pop_front() else {
+                        break;
+                    };
+                    match pending.to_completed_fetch() {
+                        Ok(completed) => completed_to_push.push(completed),
+                        Err(e) => {
+                            // todo: handle exception?
+                            log::error!("Error when completing: {e}");
+                        }
+                    }
+                }
+                // Drop the queue whenever it is empty, including when every
+                // popped fetch failed to convert. A leftover empty queue would
+                // keep the bucket listed by `buffered_buckets` indefinitely.
+                if pendings.is_empty() {
+                    pending_map.remove(table_bucket);
+                }
+            }
+        }
+
+        if completed_to_push.is_empty() {
+            return;
+        }
+
+        self.completed_fetches.lock().extend(completed_to_push);
+        // Signal that buffer is not empty
+        self.not_empty_notify.notify_waiters();
+    }
+
+    /// Add a completed fetch to the buffer
+    ///
+    /// If the bucket still has pending fetches queued, the completed fetch is
+    /// wrapped as an already-completed pending fetch and appended behind them,
+    /// so it is delivered in queue order by a later `try_complete`; no waiter is
+    /// notified in that case. Otherwise it goes straight to the completed queue
+    /// and waiters are notified.
+    pub fn add(&self, completed_fetch: Box<dyn CompletedFetch>) {
+        let table_bucket = completed_fetch.table_bucket();
+        let mut pending_map = self.pending_fetches.lock();
+
+        if let Some(pendings) = pending_map.get_mut(table_bucket)
+            && !pendings.is_empty()
+        {
+            pendings.push_back(Box::new(CompletedPendingFetch::new(completed_fetch)));
+            return;
+        }
+        // If there's no pending fetch for this table_bucket,
+        // directly add to completed_fetches
+        // Note: completed_fetches is locked while pending_fetches is still held
+        // (order: pending, then completed). Any other code that takes both locks
+        // must use the same order.
+        self.completed_fetches.lock().push_back(completed_fetch);
+        self.not_empty_notify.notify_waiters();
+    }
+
+    /// Poll the next completed fetch
+    ///
+    /// Removes and returns the front of the completed queue, or `None` if the
+    /// queue is empty. Never blocks waiting for data.
+    pub fn poll(&self) -> Option<Box<dyn CompletedFetch>> {
+        self.completed_fetches.lock().pop_front()
+    }
+
+    /// Take the next in line fetch
+    ///
+    /// The slot is left empty afterwards; callers that want to keep the fetch
+    /// buffered must hand it back through `set_next_in_line_fetch`.
+    pub fn next_in_line_fetch(&self) -> Option<Box<dyn CompletedFetch>> {
+        self.next_in_line_fetch.lock().take()
+    }
+
+    /// Set the next in line fetch
+    ///
+    /// Overwrites whatever was stored before; passing `None` clears the slot.
+    pub fn set_next_in_line_fetch(&self, fetch: Option<Box<dyn CompletedFetch>>) {
+        *self.next_in_line_fetch.lock() = fetch;
+    }
+
+    /// Get the set of buckets that have buffered data
+    ///
+    /// The result lists, in this order: the bucket of the next-in-line fetch (if
+    /// present and not consumed), the bucket of every completed fetch, and every
+    /// bucket that has a pending queue. A bucket may appear more than once.
+    pub fn buffered_buckets(&self) -> Vec<TableBucket> {
+        // Take the locks in the same order as `add` (pending_fetches before
+        // completed_fetches). Acquiring them the other way round can deadlock
+        // against a concurrent `add`. All three are held together so the result
+        // is a single consistent snapshot.
+        let pending = self.pending_fetches.lock();
+        let completed = self.completed_fetches.lock();
+        let next_in_line_fetch = self.next_in_line_fetch.lock();
+
+        let mut buckets = Vec::with_capacity(1 + completed.len() + pending.len());
+
+        if let Some(complete_fetch) = next_in_line_fetch.as_ref() {
+            if !complete_fetch.is_consumed() {
+                buckets.push(complete_fetch.table_bucket().clone());
+            }
+        }
+
+        buckets.extend(completed.iter().map(|fetch| fetch.table_bucket().clone()));
+        buckets.extend(pending.keys().cloned());
+        buckets
+    }
+}
+
+/// `Default` yields the same empty buffer as `LogFetchBuffer::new`.
+impl Default for LogFetchBuffer {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+/// A wrapper that makes a completed fetch look like a pending fetch
+///
+/// `LogFetchBuffer::add` uses it to queue a completed fetch behind pending
+/// fetches of the same bucket.
+struct CompletedPendingFetch {
+    completed_fetch: Box<dyn CompletedFetch>,
+}
+
+impl CompletedPendingFetch {
+    /// Wraps `completed_fetch` without inspecting or modifying it.
+    fn new(completed_fetch: Box<dyn CompletedFetch>) -> Self {
+        Self { completed_fetch }
+    }
+}
+
+impl PendingFetch for CompletedPendingFetch {
+    /// Delegates to the wrapped completed fetch.
+    fn table_bucket(&self) -> &TableBucket {
+        self.completed_fetch.table_bucket()
+    }
+
+    /// Always `true`: the wrapped fetch is already complete.
+    fn is_completed(&self) -> bool {
+        true
+    }
+
+    /// Unwraps the completed fetch; this conversion cannot fail.
+    fn to_completed_fetch(self: Box<Self>) -> Result<Box<dyn CompletedFetch>> {
+        Ok(self.completed_fetch)
+    }
+}
+
+/// Default implementation of CompletedFetch for in-memory log records
+pub struct DefaultCompletedFetch {
+    /// Bucket the records were fetched from.
+    table_bucket: TableBucket,
+    /// Source of the remaining record batches; advanced with `next()`.
+    log_record_batch: LogRecordsBatches,
+    /// Passed to `LogRecordBatch::records` when a batch is opened.
+    read_context: ReadContext,
+    /// Records with a lower offset are skipped. Moves to `offset + 1` after each
+    /// returned record and to the last batch's `next_log_offset()` on exhaustion.
+    next_fetch_offset: i64,
+    /// Value returned by `high_watermark()`.
+    high_watermark: i64,
+    /// Value returned by `size_in_bytes()`.
+    size_in_bytes: usize,
+    /// Set by `drain`; once set, `fetch_records` returns no more records.
+    consumed: bool,
+    /// Set by `set_initialized`.
+    initialized: bool,
+    /// Number of records handed out so far; only incremented in this file.
+    records_read: usize,
+    /// Iterator over the batch currently being read, if any.
+    current_record_iterator: Option<LogRecordIterator>,
+    /// The batch `current_record_iterator` was created from.
+    current_record_batch: Option<LogRecordBatch>,
+}
+
+impl DefaultCompletedFetch {
+    /// Builds a fetch over `log_record_batch` for `table_bucket`.
+    ///
+    /// `fetch_offset` becomes the initial `next_fetch_offset`; records below it
+    /// are skipped when reading. The fetch starts unconsumed and uninitialized.
+    /// This constructor currently always returns `Ok`.
+    pub fn new(
+        table_bucket: TableBucket,
+        log_record_batch: LogRecordsBatches,
+        size_in_bytes: usize,
+        read_context: ReadContext,
+        fetch_offset: i64,
+        high_watermark: i64,
+    ) -> Result<Self> {
+        let fetch = Self {
+            table_bucket,
+            log_record_batch,
+            read_context,
+            next_fetch_offset: fetch_offset,
+            high_watermark,
+            size_in_bytes,
+            consumed: false,
+            initialized: false,
+            records_read: 0,
+            current_record_iterator: None,
+            current_record_batch: None,
+        };
+        Ok(fetch)
+    }
+
+    /// Get the next fetched record, handling batch iteration and record skipping
+    ///
+    /// Returns `Ok(None)` once all batches are exhausted; at that point the
+    /// fetch offset moves to the last batch's `next_log_offset()` and the fetch
+    /// is drained.
+    fn next_fetched_record(&mut self) -> Result<Option<ScanRecord>> {
+        loop {
+            let candidate = self
+                .current_record_iterator
+                .as_mut()
+                .and_then(Iterator::next);
+
+            match candidate {
+                Some(record) if record.offset() >= self.next_fetch_offset => {
+                    return Ok(Some(record));
+                }
+                // Record lies before the requested offset: skip it.
+                Some(_) => continue,
+                // No open batch, or the open batch is exhausted: open the next one.
+                None => {}
+            }
+
+            let Some(batch) = self.log_record_batch.next() else {
+                if let Some(last_batch) = self.current_record_batch.take() {
+                    self.next_fetch_offset = last_batch.next_log_offset();
+                }
+                self.drain();
+                return Ok(None);
+            };
+            self.current_record_iterator = Some(batch.records(&self.read_context)?);
+            self.current_record_batch = Some(batch);
+        }
+    }
+}
+
+impl CompletedFetch for DefaultCompletedFetch {
+    fn table_bucket(&self) -> &TableBucket {
+        &self.table_bucket
+    }
+
+    /// Returns at most `max_records` records, advancing `next_fetch_offset`
+    /// past each one. Yields an empty vector once the fetch is consumed.
+    fn fetch_records(&mut self, max_records: usize) -> Result<Vec<ScanRecord>> {
+        // todo: handle corrupt_last_record
+        let mut scan_records = Vec::new();
+        if self.consumed {
+            return Ok(scan_records);
+        }
+
+        while scan_records.len() < max_records {
+            let Some(record) = self.next_fetched_record()? else {
+                break;
+            };
+            self.next_fetch_offset = record.offset() + 1;
+            self.records_read += 1;
+            scan_records.push(record);
+        }
+
+        Ok(scan_records)
+    }
+
+    fn is_consumed(&self) -> bool {
+        self.consumed
+    }
+
+    /// Marks the fetch consumed; the remaining data is not touched.
+    fn drain(&mut self) {
+        self.consumed = true;
+    }
+
+    fn size_in_bytes(&self) -> usize {
+        self.size_in_bytes
+    }
+
+    fn high_watermark(&self) -> i64 {
+        self.high_watermark
+    }
+
+    fn is_initialized(&self) -> bool {
+        self.initialized
+    }
+
+    fn set_initialized(&mut self) {
+        self.initialized = true;
+    }
+
+    fn next_fetch_offset(&self) -> i64 {
+        self.next_fetch_offset
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 99722477c5..e2cf9e6d5e 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -26,6 +26,7 @@ pub const EARLIEST_OFFSET: i64 = -2;
 
 mod append;
 
+mod log_fetch_buffer;
 mod remote_log;
 mod scanner;
 mod writer;
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index 10273dde2e..d9abd19c29 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -14,16 +14,18 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
+use crate::client::table::log_fetch_buffer::{CompletedFetch, DefaultCompletedFetch, PendingFetch};
 use crate::error::{Error, Result};
 use crate::io::{FileIO, Storage};
 use crate::metadata::TableBucket;
 use crate::proto::{PbRemoteLogFetchInfo, PbRemoteLogSegment};
-use crate::record::{LogRecordsBatchs, ReadContext, ScanRecord};
+use crate::record::{LogRecordsBatches, ReadContext};
 use crate::util::delete_file;
-use parking_lot::RwLock;
+use parking_lot::{Mutex, RwLock};
 use std::collections::HashMap;
 use std::io;
 use std::path::{Path, PathBuf};
+use std::sync::Arc;
 use tempfile::TempDir;
 use tokio::io::AsyncWriteExt;
 use tokio::sync::oneshot;
@@ -70,45 +72,121 @@ pub struct RemoteLogFetchInfo {
 }
 
 impl RemoteLogFetchInfo {
-    pub fn from_proto(info: &PbRemoteLogFetchInfo, table_bucket: TableBucket) -> Result<Self> {
+    pub fn from_proto(info: &PbRemoteLogFetchInfo, table_bucket: TableBucket) -> Self {
         let segments = info
             .remote_log_segments
             .iter()
             .map(|s| RemoteLogSegment::from_proto(s, table_bucket.clone()))
             .collect();
 
-        Ok(Self {
+        Self {
             remote_log_tablet_dir: info.remote_log_tablet_dir.clone(),
             partition_name: info.partition_name.clone(),
             remote_log_segments: segments,
             first_start_pos: info.first_start_pos.unwrap_or(0),
-        })
+        }
     }
 }
 
+type CompletionCallback = Box<dyn Fn() + Send + Sync>;
+
 /// Future for a remote log download request
 pub struct RemoteLogDownloadFuture {
-    receiver: Option<oneshot::Receiver<Result<PathBuf>>>,
+    result: Arc<Mutex<Option<Result<Vec<u8>>>>>,
+    completion_callbacks: Arc<Mutex<Vec<CompletionCallback>>>,
+    // todo: add recycleCallback
 }
 
 impl RemoteLogDownloadFuture {
-    pub fn new(receiver: oneshot::Receiver<Result<PathBuf>>) -> Self {
+    pub fn new(receiver: oneshot::Receiver<Result<Vec<u8>>>) -> Self {
+        let result = Arc::new(Mutex::new(None));
+        let result_clone = Arc::clone(&result);
+        let completion_callbacks: Arc<Mutex<Vec<CompletionCallback>>> =
+            Arc::new(Mutex::new(Vec::new()));
+        let callbacks_clone = Arc::clone(&completion_callbacks);
+
+        // Spawn a task to wait for the download and update result, then call callbacks
+        tokio::spawn(async move {
+            let download_result = match receiver.await {
+                Ok(Ok(path)) => Ok(path),
+                Ok(Err(e)) => Err(e),
+                Err(e) => Err(Error::UnexpectedError {
+                    message: format!("Download & Read future cancelled: {e:?}"),
+                    source: None,
+                }),
+            };
+
+            *result_clone.lock() = Some(download_result);
+
+            // Call all registered callbacks
+            // We need to take the callbacks to avoid holding the lock while calling them
+            // This also ensures that any callbacks registered after this point will be called immediately
+            let callbacks: Vec<CompletionCallback> = {
+                let mut callbacks_guard = callbacks_clone.lock();
+                std::mem::take(&mut *callbacks_guard)
+            };
+            for callback in callbacks {
+                callback();
+            }
+
+            // After calling callbacks, any new callbacks registered will see is_done() == true
+            // and will be called immediately in on_complete()
+        });
+
         Self {
-            receiver: Some(receiver),
+            result,
+            completion_callbacks,
         }
     }
 
-    /// Get the downloaded file path
-    pub async fn get_file_path(&mut self) -> Result<PathBuf> {
-        let receiver = self.receiver.take().ok_or_else(|| Error::UnexpectedError {
-            message: "Downloaded file already consumed".to_string(),
-            source: None,
-        })?;
-
-        receiver.await.map_err(|e| Error::UnexpectedError {
-            message: format!("Download future cancelled: {e:?}"),
-            source: None,
-        })?
+    /// Register a callback to be called when download completes (similar to Java's onComplete)
+    pub fn on_complete<F>(&self, callback: F)
+    where
+        F: Fn() + Send + Sync + 'static,
+    {
+        // Acquire callbacks lock first to ensure atomicity of the check-and-register operation
+        let mut callbacks_guard = self.completion_callbacks.lock();
+
+        // Check completion status while holding the callbacks lock.
+        // This ensures that:
+        // 1. If the task completes between checking is_done() and registering the callback,
+        //    we'll see the completion state correctly
+        // 2. The background task cannot clear the callbacks list while we're checking/registering
+        let is_done = self.result.lock().is_some();
+
+        if is_done {
+            // If already completed, call immediately (drop lock first to avoid deadlock)
+            drop(callbacks_guard);
+            callback();
+        } else {
+            // Register the callback while holding the callbacks lock.
+            // This ensures that even if the background task completes right after we check
+            // is_done(), it will wait for us to release the lock before taking callbacks.
+            // When it does take callbacks, it will see our callback in the list and execute it.
+            callbacks_guard.push(Box::new(callback));
+            // Lock is automatically released here
+        }
+    }
+
+    pub fn is_done(&self) -> bool {
+        self.result.lock().is_some()
+    }
+
+    /// Get the downloaded remote log bytes (synchronous, only works after is_done() returns true)
+    pub fn get_remote_log_bytes(&self) -> Result<Vec<u8>> {
+        // todo: handle download fail
+        let guard = self.result.lock();
+        match guard.as_ref() {
+            Some(Ok(path)) => Ok(path.clone()),
+            Some(Err(e)) => Err(Error::IoUnexpectedError {
+                message: format!("Fail to get remote log bytes: {e}"),
+                source: io::Error::other(format!("{e:?}")),
+            }),
+            None => Err(Error::IoUnexpectedError {
+                message: "Get remote log bytes not completed yet".to_string(),
+                source: io::Error::other("Get remote log bytes not completed yet"),
+            }),
+        }
     }
 }
 
@@ -135,25 +213,38 @@ impl RemoteLogDownloader {
         &self,
         remote_log_tablet_dir: &str,
         segment: &RemoteLogSegment,
-    ) -> Result<RemoteLogDownloadFuture> {
+    ) -> RemoteLogDownloadFuture {
         let (sender, receiver) = oneshot::channel();
         let local_file_name = segment.local_file_name();
         let local_file_path = self.local_log_dir.path().join(&local_file_name);
         let remote_path = self.build_remote_path(remote_log_tablet_dir, segment);
         let remote_log_tablet_dir = remote_log_tablet_dir.to_string();
         let remote_fs_props = self.remote_fs_props.read().clone();
-        // Spawn async download task
+        // Spawn async download & read task
         tokio::spawn(async move {
-            let result = Self::download_file(
-                &remote_log_tablet_dir,
-                &remote_path,
-                &local_file_path,
-                &remote_fs_props,
-            )
+            let result = async {
+                let file_path = Self::download_file(
+                    &remote_log_tablet_dir,
+                    &remote_path,
+                    &local_file_path,
+                    &remote_fs_props,
+                )
+                .await?;
+                let bytes = tokio::fs::read(&file_path).await?;
+
+                // Delete the downloaded local file to free disk (async, but we'll do it in background)
+                let file_path_clone = file_path.clone();
+                tokio::spawn(async move {
+                    let _ = delete_file(file_path_clone).await;
+                });
+
+                Ok(bytes)
+            }
             .await;
+
             let _ = sender.send(result);
         });
-        Ok(RemoteLogDownloadFuture::new(receiver))
+        RemoteLogDownloadFuture::new(receiver)
     }
 
     /// Build the remote path for a log segment
@@ -261,9 +352,7 @@ pub struct RemotePendingFetch {
     segment: RemoteLogSegment,
     download_future: RemoteLogDownloadFuture,
     pos_in_log_segment: i32,
-    #[allow(dead_code)]
     fetch_offset: i64,
-    #[allow(dead_code)]
     high_watermark: i64,
     read_context: ReadContext,
 }
@@ -286,32 +375,42 @@ impl RemotePendingFetch {
             read_context,
         }
     }
+}
+
+impl PendingFetch for RemotePendingFetch {
+    fn table_bucket(&self) -> &TableBucket {
+        &self.segment.table_bucket
+    }
 
-    /// Convert to completed fetch by reading the downloaded file
-    pub async fn convert_to_completed_fetch(
-        mut self,
-    ) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
-        let file_path = self.download_future.get_file_path().await?;
-        let file_data = tokio::fs::read(&file_path).await?;
+    fn is_completed(&self) -> bool {
+        self.download_future.is_done()
+    }
+
+    fn to_completed_fetch(self: Box<Self>) -> Result<Box<dyn CompletedFetch>> {
+        // Get the downloaded bytes (this should only be called when is_completed() returns true)
+        let mut data = self.download_future.get_remote_log_bytes()?;
 
         // Slice the data if needed
         let data = if self.pos_in_log_segment > 0 {
-            &file_data[self.pos_in_log_segment as usize..]
+            data.split_off(self.pos_in_log_segment as usize)
         } else {
-            &file_data
+            data
         };
 
-        // delete the downloaded local file to free disk
-        delete_file(file_path).await;
+        let size_in_bytes = data.len();
 
-        // Parse log records (remote log contains full data, need client-side projection)
-        let mut fetch_records = vec![];
-        for log_record in &mut LogRecordsBatchs::new(data) {
-            fetch_records.extend(log_record.records_for_remote_log(&self.read_context)?);
-        }
+        let log_record_batch = LogRecordsBatches::new(data);
+
+        // Create DefaultCompletedFetch from the data
+        let completed_fetch = DefaultCompletedFetch::new(
+            self.segment.table_bucket,
+            log_record_batch,
+            size_in_bytes,
+            self.read_context,
+            self.fetch_offset,
+            self.high_watermark,
+        )?;
 
-        let mut result = HashMap::new();
-        result.insert(self.segment.table_bucket.clone(), fetch_records);
-        Ok(result)
+        Ok(Box::new(completed_fetch))
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index a9384d905a..2246e2cbae 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -18,24 +18,27 @@
 use crate::client::connection::FlussConnection;
 use crate::client::credentials::CredentialsCache;
 use crate::client::metadata::Metadata;
+use crate::client::table::log_fetch_buffer::{
+    CompletedFetch, DefaultCompletedFetch, LogFetchBuffer,
+};
+use crate::client::table::remote_log::{
+    RemoteLogDownloader, RemoteLogFetchInfo, RemotePendingFetch,
+};
 use crate::error::{Error, Result};
 use crate::metadata::{TableBucket, TableInfo, TablePath};
 use crate::proto::{FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
-use crate::record::{LogRecordsBatchs, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
-use crate::rpc::RpcClient;
+use crate::record::{LogRecordsBatches, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
+use crate::rpc::{RpcClient, message};
 use crate::util::FairBucketStatusMap;
 use arrow_schema::SchemaRef;
-use parking_lot::RwLock;
-use std::collections::HashMap;
+use log::{debug, error, warn};
+use parking_lot::{Mutex, RwLock};
+use std::collections::{HashMap, HashSet};
 use std::slice::from_ref;
 use std::sync::Arc;
 use std::time::Duration;
 use tempfile::TempDir;
 
-use crate::client::table::remote_log::{
-    RemoteLogDownloader, RemoteLogFetchInfo, RemotePendingFetch,
-};
-
 const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
 #[allow(dead_code)]
 const LOG_FETCH_MAX_BYTES_FOR_BUCKET: i32 = 1024;
@@ -171,8 +174,43 @@ impl LogScanner {
         })
     }
 
-    pub async fn poll(&self, _timeout: Duration) -> Result<ScanRecords> {
-        Ok(ScanRecords::new(self.poll_for_fetches().await?))
+    pub async fn poll(&self, timeout: Duration) -> Result<ScanRecords> {
+        let start = std::time::Instant::now();
+        let deadline = start + timeout;
+
+        loop {
+            // Try to collect fetches
+            let fetch_result = self.poll_for_fetches().await?;
+
+            if !fetch_result.is_empty() {
+                // We have data, send next round of fetches and return
+                // This enables pipelining while user processes the data
+                self.log_fetcher.send_fetches().await?;
+                return Ok(ScanRecords::new(fetch_result));
+            }
+
+            // No data available, check if we should wait
+            let now = std::time::Instant::now();
+            if now >= deadline {
+                // Timeout reached, return empty result
+                return Ok(ScanRecords::new(HashMap::new()));
+            }
+
+            // Wait for buffer to become non-empty with remaining time
+            let remaining = deadline - now;
+            let has_data = self
+                .log_fetcher
+                .log_fetch_buffer
+                .await_not_empty(remaining)
+                .await;
+
+            if !has_data {
+                // Timeout while waiting
+                return Ok(ScanRecords::new(HashMap::new()));
+            }
+
+            // Buffer became non-empty, try again
+        }
     }
 
     pub async fn subscribe(&self, bucket: i32, offset: i64) -> Result<()> {
@@ -208,20 +246,31 @@ impl LogScanner {
     }
 
     async fn poll_for_fetches(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
-        self.log_fetcher.send_fetches_and_collect().await
+        let result = self.log_fetcher.collect_fetches()?;
+        if !result.is_empty() {
+            return Ok(result);
+        }
+
+        // send any new fetches (won't resend pending fetches).
+        self.log_fetcher.send_fetches().await?;
+
+        // Collect completed fetches from buffer
+        self.log_fetcher.collect_fetches()
     }
 }
 
-#[allow(dead_code)]
 struct LogFetcher {
-    table_path: TablePath,
     conns: Arc<RpcClient>,
-    table_info: TableInfo,
     metadata: Arc<Metadata>,
     log_scanner_status: Arc<LogScannerStatus>,
     read_context: ReadContext,
-    remote_log_downloader: RemoteLogDownloader,
-    credentials_cache: CredentialsCache,
+    remote_read_context: ReadContext,
+    remote_log_downloader: Arc<RemoteLogDownloader>,
+    // todo: consider schedule a background thread to update
+    // token instead of update in fetch phase
+    credentials_cache: Arc<CredentialsCache>,
+    log_fetch_buffer: Arc<LogFetchBuffer>,
+    nodes_with_pending_fetch_requests: Arc<Mutex<HashSet<i32>>>,
 }
 
 impl LogFetcher {
@@ -233,126 +282,306 @@ impl LogFetcher {
         projected_fields: Option<Vec<usize>>,
     ) -> Result<Self> {
         let full_arrow_schema = to_arrow_schema(table_info.get_row_type());
-        let read_context = Self::create_read_context(full_arrow_schema, projected_fields.clone());
+        let read_context =
+            Self::create_read_context(full_arrow_schema.clone(), projected_fields.clone(), false);
+        let remote_read_context =
+            Self::create_read_context(full_arrow_schema, projected_fields.clone(), true);
 
         let tmp_dir = TempDir::with_prefix("fluss-remote-logs")?;
 
         Ok(LogFetcher {
-            table_path: table_info.table_path.clone(),
-            conns,
-            table_info,
-            metadata,
+            conns: conns.clone(),
+            metadata: metadata.clone(),
             log_scanner_status,
             read_context,
-            remote_log_downloader: RemoteLogDownloader::new(tmp_dir)?,
-            credentials_cache: CredentialsCache::new(),
+            remote_read_context,
+            remote_log_downloader: Arc::new(RemoteLogDownloader::new(tmp_dir)?),
+            credentials_cache: Arc::new(CredentialsCache::new(conns.clone(), metadata.clone())),
+            log_fetch_buffer: Arc::new(LogFetchBuffer::new()),
+            nodes_with_pending_fetch_requests: Arc::new(Mutex::new(HashSet::new())),
         })
     }
 
     fn create_read_context(
         full_arrow_schema: SchemaRef,
         projected_fields: Option<Vec<usize>>,
+        is_from_remote: bool,
     ) -> ReadContext {
         match projected_fields {
-            None => ReadContext::new(full_arrow_schema),
-            Some(fields) => ReadContext::with_projection_pushdown(full_arrow_schema, fields),
+            None => ReadContext::new(full_arrow_schema, is_from_remote),
+            Some(fields) => {
+                ReadContext::with_projection_pushdown(full_arrow_schema, fields, is_from_remote)
+            }
         }
     }
 
-    async fn send_fetches_and_collect(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
+    /// Send fetch requests asynchronously without waiting for responses
+    async fn send_fetches(&self) -> Result<()> {
+        // todo: check update metadata like fluss-java in case leader changes
         let fetch_request = self.prepare_fetch_log_requests().await;
-        let mut result: HashMap<TableBucket, Vec<ScanRecord>> = HashMap::new();
+
         for (leader, fetch_request) in fetch_request {
-            let cluster = self.metadata.get_cluster();
-            let server_node = cluster
-                .get_tablet_server(leader)
-                .expect("todo: handle leader not exist.");
-            let con = self.conns.get_connection(server_node).await?;
-
-            let fetch_response = con
-                .request(crate::rpc::message::FetchLogRequest::new(fetch_request))
-                .await?;
-
-            for pb_fetch_log_resp in fetch_response.tables_resp {
-                let table_id = pb_fetch_log_resp.table_id;
-                let fetch_log_for_buckets = pb_fetch_log_resp.buckets_resp;
-
-                for fetch_log_for_bucket in fetch_log_for_buckets {
-                    let bucket: i32 = fetch_log_for_bucket.bucket_id;
-                    let table_bucket = TableBucket::new(table_id, bucket);
-
-                    // Check if this is a remote log fetch
-                    if let Some(ref remote_log_fetch_info) =
-                        fetch_log_for_bucket.remote_log_fetch_info
-                    {
-                        let remote_fs_props = self
-                            .credentials_cache
-                            .get_or_refresh(&self.conns, &self.metadata)
-                            .await?;
-                        self.remote_log_downloader
-                            .set_remote_fs_props(remote_fs_props);
-                        let remote_fetch_info = RemoteLogFetchInfo::from_proto(
-                            remote_log_fetch_info,
-                            table_bucket.clone(),
-                        )?;
-
-                        if let Some(fetch_offset) =
-                            self.log_scanner_status.get_bucket_offset(&table_bucket)
-                        {
-                            let high_watermark = fetch_log_for_bucket.high_watermark.unwrap_or(-1);
-                            // Download and process remote log segments
-                            let mut pos_in_log_segment = remote_fetch_info.first_start_pos;
-                            let mut current_fetch_offset = fetch_offset;
-                            // todo: make segment download in parallel
-                            for (i, segment) in
-                                remote_fetch_info.remote_log_segments.iter().enumerate()
-                            {
-                                if i > 0 {
-                                    pos_in_log_segment = 0;
-                                    current_fetch_offset = segment.start_offset;
-                                }
+            debug!("Adding pending request for node id {leader}");
+            // Record that this node now has a pending fetch request
+            {
+                self.nodes_with_pending_fetch_requests.lock().insert(leader);
+            }
+
+            let cluster = self.metadata.get_cluster().clone();
+
+            let conns = Arc::clone(&self.conns);
+            let log_fetch_buffer = self.log_fetch_buffer.clone();
+            let log_scanner_status = self.log_scanner_status.clone();
+            let read_context = self.read_context.clone();
+            let remote_read_context = self.remote_read_context.clone();
+            let remote_log_downloader = Arc::clone(&self.remote_log_downloader);
+            let creds_cache = self.credentials_cache.clone();
+            let nodes_with_pending = self.nodes_with_pending_fetch_requests.clone();
+
+            // Spawn async task to handle the fetch request
+            // Note: These tasks are not explicitly tracked or cancelled when LogFetcher is dropped.
+            // This is acceptable because:
+            // 1. Tasks will naturally complete (network requests will return or timeout)
+            // 2. Tasks use Arc references, so resources are properly shared
+            // 3. When the program exits, tokio runtime will clean up all tasks
+            // 4. Tasks are short-lived (network I/O operations)
+            tokio::spawn(async move {
+                // make sure it will always remove leader from pending nodes
+                let _guard = scopeguard::guard((), |_| {
+                    nodes_with_pending.lock().remove(&leader);
+                });
+
+                let server_node = cluster
+                    .get_tablet_server(leader)
+                    .expect("todo: handle leader not exist.");
+
+                let con = match conns.get_connection(server_node).await {
+                    Ok(con) => con,
+                    Err(e) => {
+                        // todo: handle failed to get connection
+                        warn!("Failed to get connection to destination node: {e:?}");
+                        return;
+                    }
+                };
+
+                let fetch_response = match con
+                    .request(message::FetchLogRequest::new(fetch_request))
+                    .await
+                {
+                    Ok(resp) => resp,
+                    Err(e) => {
+                        // todo: handle failure to fetch log from destination node
+                        warn!("Failed to fetch log from destination node {server_node:?}: {e:?}");
+                        return;
+                    }
+                };
+
+                if let Err(e) = Self::handle_fetch_response(
+                    fetch_response,
+                    &log_fetch_buffer,
+                    &log_scanner_status,
+                    &read_context,
+                    &remote_read_context,
+                    &remote_log_downloader,
+                    &creds_cache,
+                )
+                .await
+                {
+                    // todo: handle fail to handle fetch response
+                    error!("Fail to handle fetch response: {e:?}");
+                }
+            });
+        }
+
+        Ok(())
+    }
 
-                                let download_future =
-                                    self.remote_log_downloader.request_remote_log(
-                                        &remote_fetch_info.remote_log_tablet_dir,
-                                        segment,
-                                    )?;
-                                let pending_fetch = RemotePendingFetch::new(
-                                    segment.clone(),
-                                    download_future,
-                                    pos_in_log_segment,
-                                    current_fetch_offset,
-                                    high_watermark,
-                                    self.read_context.clone(),
-                                );
-                                let remote_records =
-                                    pending_fetch.convert_to_completed_fetch().await?;
-                                // Update offset and merge results
-                                for (tb, records) in remote_records {
-                                    if let Some(last_record) = records.last() {
-                                        self.log_scanner_status
-                                            .update_offset(&tb, last_record.offset() + 1);
-                                    }
-                                    result.entry(tb).or_default().extend(records);
+    /// Handle fetch response and add completed fetches to buffer
+    async fn handle_fetch_response(
+        fetch_response: crate::proto::FetchLogResponse,
+        log_fetch_buffer: &Arc<LogFetchBuffer>,
+        log_scanner_status: &Arc<LogScannerStatus>,
+        read_context: &ReadContext,
+        remote_read_context: &ReadContext,
+        remote_log_downloader: &Arc<RemoteLogDownloader>,
+        credentials_cache: &Arc<CredentialsCache>,
+    ) -> Result<()> {
+        for pb_fetch_log_resp in fetch_response.tables_resp {
+            let table_id = pb_fetch_log_resp.table_id;
+            let fetch_log_for_buckets = pb_fetch_log_resp.buckets_resp;
+
+            for fetch_log_for_bucket in fetch_log_for_buckets {
+                let bucket: i32 = fetch_log_for_bucket.bucket_id;
+                let table_bucket = TableBucket::new(table_id, bucket);
+
+                // todo: check fetch result code for per-bucket
+                let Some(fetch_offset) = log_scanner_status.get_bucket_offset(&table_bucket) else {
+                    debug!(
+                        "Ignoring fetch log response for bucket {table_bucket} because the bucket has been unsubscribed."
+                    );
+                    continue;
+                };
+
+                // Check if this is a remote log fetch
+                if let Some(ref remote_log_fetch_info) = fetch_log_for_bucket.remote_log_fetch_info
+                {
+                    // set remote fs props
+                    let remote_fs_props = credentials_cache.get_or_refresh().await?;
+                    remote_log_downloader.set_remote_fs_props(remote_fs_props);
+
+                    let remote_fetch_info =
+                        RemoteLogFetchInfo::from_proto(remote_log_fetch_info, table_bucket.clone());
+
+                    let high_watermark = fetch_log_for_bucket.high_watermark.unwrap_or(-1);
+                    Self::pending_remote_fetches(
+                        remote_log_downloader.clone(),
+                        log_fetch_buffer.clone(),
+                        remote_read_context.clone(),
+                        &table_bucket,
+                        remote_fetch_info,
+                        fetch_offset,
+                        high_watermark,
+                    );
+                } else if fetch_log_for_bucket.records.is_some() {
+                    // Handle regular in-memory records - create completed fetch directly
+                    let high_watermark = fetch_log_for_bucket.high_watermark.unwrap_or(-1);
+                    let records = fetch_log_for_bucket.records.unwrap_or(vec![]);
+                    let size_in_bytes = records.len();
+                    let log_record_batch = LogRecordsBatches::new(records);
+
+                    match DefaultCompletedFetch::new(
+                        table_bucket.clone(),
+                        log_record_batch,
+                        size_in_bytes,
+                        read_context.clone(),
+                        fetch_offset,
+                        high_watermark,
+                    ) {
+                        Ok(completed_fetch) => {
+                            log_fetch_buffer.add(Box::new(completed_fetch));
+                        }
+                        Err(e) => {
+                            // todo: handle error
+                            log::warn!("Failed to create completed fetch: {e:?}");
+                        }
+                    }
+                }
+            }
+        }
+        Ok(())
+    }
+
+    fn pending_remote_fetches(
+        remote_log_downloader: Arc<RemoteLogDownloader>,
+        log_fetch_buffer: Arc<LogFetchBuffer>,
+        read_context: ReadContext,
+        table_bucket: &TableBucket,
+        remote_fetch_info: RemoteLogFetchInfo,
+        fetch_offset: i64,
+        high_watermark: i64,
+    ) {
+        // Download and process remote log segments
+        let mut pos_in_log_segment = remote_fetch_info.first_start_pos;
+        let mut current_fetch_offset = fetch_offset;
+        for (i, segment) in remote_fetch_info.remote_log_segments.iter().enumerate() {
+            if i > 0 {
+                pos_in_log_segment = 0;
+                current_fetch_offset = segment.start_offset;
+            }
+
+            // todo:
+            // 1: control the max threads to download remote segment
+            // 2: introduce a priority queue that gives the earliest segment the highest priority
+            let download_future = remote_log_downloader
+                .request_remote_log(&remote_fetch_info.remote_log_tablet_dir, segment);
+
+            // Register callback to be called when download completes
+            // (similar to Java's downloadFuture.onComplete)
+            // This must be done before creating RemotePendingFetch to avoid move issues
+            let table_bucket = table_bucket.clone();
+            let log_fetch_buffer_clone = log_fetch_buffer.clone();
+            download_future.on_complete(move || {
+                log_fetch_buffer_clone.try_complete(&table_bucket);
+            });
+
+            let pending_fetch = RemotePendingFetch::new(
+                segment.clone(),
+                download_future,
+                pos_in_log_segment,
+                current_fetch_offset,
+                high_watermark,
+                read_context.clone(),
+            );
+            // Add to pending fetches in buffer (similar to Java's logFetchBuffer.pend)
+            log_fetch_buffer.pend(Box::new(pending_fetch));
+        }
+    }
+
+    /// Collect completed fetches from buffer
+    /// Reference: LogFetchCollector.collectFetch in Java
+    fn collect_fetches(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
+        const MAX_POLL_RECORDS: usize = 500; // Default max poll records
+        let mut result: HashMap<TableBucket, Vec<ScanRecord>> = HashMap::new();
+        let mut records_remaining = MAX_POLL_RECORDS;
+
+        while records_remaining > 0 {
+            // Get the next in line fetch, or get a new one from buffer
+            let next_in_line = self.log_fetch_buffer.next_in_line_fetch();
+
+            if next_in_line.is_none() || next_in_line.as_ref().unwrap().is_consumed() {
+                // Get a new fetch from buffer
+                if let Some(completed_fetch) = self.log_fetch_buffer.poll() {
+                    // Initialize the fetch if not already initialized
+                    if !completed_fetch.is_initialized() {
+                        let size_in_bytes = completed_fetch.size_in_bytes();
+                        match self.initialize_fetch(completed_fetch) {
+                            Ok(initialized) => {
+                                self.log_fetch_buffer.set_next_in_line_fetch(initialized);
+                                continue;
+                            }
+                            Err(e) => {
+                                // Remove a completedFetch upon a parse with exception if
+                                // (1) it contains no records, and
+                                // (2) there are no fetched records with actual content preceding this
+                                // exception.
+                                if result.is_empty() && size_in_bytes == 0 {
+                                    // todo: do we need to consider it like java ?
+                                    // self.log_fetch_buffer.poll();
                                 }
+                                return Err(e);
                             }
-                        } else {
-                            // if the offset is null, it means the bucket has been unsubscribed,
-                            // skip processing and continue to the next bucket.
-                            continue;
                         }
-                    } else if fetch_log_for_bucket.records.is_some() {
-                        // Handle regular in-memory records
-                        let mut fetch_records = vec![];
-                        let data = fetch_log_for_bucket.records.unwrap();
-                        for log_record in &mut LogRecordsBatchs::new(&data) {
-                            let last_offset = log_record.last_log_offset();
-                            fetch_records.extend(log_record.records(&self.read_context)?);
-                            self.log_scanner_status
-                                .update_offset(&table_bucket, last_offset + 1);
-                        }
-                        result.insert(table_bucket, fetch_records);
+                    } else {
+                        self.log_fetch_buffer
+                            .set_next_in_line_fetch(Some(completed_fetch));
+                    }
+                    // Note: poll() already removed the fetch from buffer, so no need to call poll()
+                } else {
+                    // No more fetches available
+                    break;
+                }
+            } else {
+                // Fetch records from next_in_line
+                if let Some(mut next_fetch) = next_in_line {
+                    let records =
+                        self.fetch_records_from_fetch(&mut next_fetch, records_remaining)?;
+
+                    if !records.is_empty() {
+                        let table_bucket = next_fetch.table_bucket().clone();
+                        // Merge with existing records for this bucket
+                        let existing = result.entry(table_bucket).or_default();
+                        let records_count = records.len();
+                        existing.extend(records);
+
+                        records_remaining = records_remaining.saturating_sub(records_count);
                     }
+
+                    // If the fetch is not fully consumed, put it back for the next round
+                    if !next_fetch.is_consumed() {
+                        self.log_fetch_buffer
+                            .set_next_in_line_fetch(Some(next_fetch));
+                    }
+                    // If consumed, next_fetch will be dropped here (which is correct)
                 }
             }
         }
@@ -360,6 +589,83 @@ impl LogFetcher {
         Ok(result)
     }
 
+    /// Initialize a completed fetch, checking offset match and updating high watermark
+    fn initialize_fetch(
+        &self,
+        mut completed_fetch: Box<dyn CompletedFetch>,
+    ) -> Result<Option<Box<dyn CompletedFetch>>> {
+        // todo: handle error in initialize fetch
+        let table_bucket = completed_fetch.table_bucket();
+        let fetch_offset = completed_fetch.next_fetch_offset();
+
+        // Check if bucket is still subscribed
+        let Some(current_offset) = self.log_scanner_status.get_bucket_offset(table_bucket) else {
+            warn!(
+                "Discarding stale fetch response for bucket {table_bucket:?} since the bucket has been unsubscribed"
+            );
+            return Ok(None);
+        };
+
+        // Check if offset matches
+        if fetch_offset != current_offset {
+            warn!(
+                "Discarding stale fetch response for bucket {table_bucket:?} since its offset {fetch_offset} does not match the expected offset {current_offset}"
+            );
+            return Ok(None);
+        }
+
+        // Update high watermark
+        let high_watermark = completed_fetch.high_watermark();
+        if high_watermark >= 0 {
+            self.log_scanner_status
+                .update_high_watermark(table_bucket, high_watermark);
+        }
+
+        completed_fetch.set_initialized();
+        Ok(Some(completed_fetch))
+    }
+
+    /// Fetch records from a completed fetch, checking offset match
+    fn fetch_records_from_fetch(
+        &self,
+        next_in_line_fetch: &mut Box<dyn CompletedFetch>,
+        max_records: usize,
+    ) -> Result<Vec<ScanRecord>> {
+        let table_bucket = next_in_line_fetch.table_bucket().clone();
+        let current_offset = self.log_scanner_status.get_bucket_offset(&table_bucket);
+
+        if current_offset.is_none() {
+            warn!(
+                "Ignoring fetched records for {table_bucket:?} since the bucket has been unsubscribed"
+            );
+            next_in_line_fetch.drain();
+            return Ok(Vec::new());
+        }
+
+        let current_offset = current_offset.unwrap();
+        let fetch_offset = next_in_line_fetch.next_fetch_offset();
+
+        // Check if this fetch is next in line
+        if fetch_offset == current_offset {
+            let records = next_in_line_fetch.fetch_records(max_records)?;
+            let next_fetch_offset = next_in_line_fetch.next_fetch_offset();
+
+            if next_fetch_offset > current_offset {
+                self.log_scanner_status
+                    .update_offset(&table_bucket, next_fetch_offset);
+            }
+
+            Ok(records)
+        } else {
+            // These records aren't next in line, ignore them
+            warn!(
+                "Ignoring fetched records for {table_bucket:?} at offset {fetch_offset} since the current offset is {current_offset}"
+            );
+            next_in_line_fetch.drain();
+            Ok(Vec::new())
+        }
+    }
+
     async fn prepare_fetch_log_requests(&self) -> HashMap<i32, FetchLogRequest> {
         let mut fetch_log_req_for_buckets = HashMap::new();
         let mut table_id = None;
@@ -372,25 +678,44 @@ impl LogFetcher {
             let offset = match self.log_scanner_status.get_bucket_offset(&bucket) {
                 Some(offset) => offset,
                 None => {
-                    // todo: debug
+                    debug!(
+                        "Skipping fetch request for bucket {bucket} because the bucket has been unsubscribed."
+                    );
                     continue;
                 }
             };
 
-            if let Some(leader) = self.get_table_bucket_leader(&bucket) {
-                let fetch_log_req_for_bucket = PbFetchLogReqForBucket {
-                    partition_id: None,
-                    bucket_id: bucket.bucket_id(),
-                    fetch_offset: offset,
-                    // 1M
-                    max_fetch_bytes: 1024 * 1024,
-                };
-
-                fetch_log_req_for_buckets
-                    .entry(leader)
-                    .or_insert_with(Vec::new)
-                    .push(fetch_log_req_for_bucket);
-                ready_for_fetch_count += 1;
+            match self.get_table_bucket_leader(&bucket) {
+                None => {
+                    log::trace!(
+                        "Skipping fetch request for bucket {bucket} because leader is not available."
+                    )
+                }
+                Some(leader) => {
+                    if self
+                        .nodes_with_pending_fetch_requests
+                        .lock()
+                        .contains(&leader)
+                    {
+                        log::trace!(
+                            "Skipping fetch request for bucket {bucket} because previous request to server {leader} has not been processed."
+                        )
+                    } else {
+                        let fetch_log_req_for_bucket = PbFetchLogReqForBucket {
+                            partition_id: None,
+                            bucket_id: bucket.bucket_id(),
+                            fetch_offset: offset,
+                            // 1M
+                            max_fetch_bytes: 1024 * 1024,
+                        };
+
+                        fetch_log_req_for_buckets
+                            .entry(leader)
+                            .or_insert_with(Vec::new)
+                            .push(fetch_log_req_for_bucket);
+                        ready_for_fetch_count += 1;
+                    }
+                }
             }
         }
 
@@ -427,8 +752,11 @@ impl LogFetcher {
     }
 
     fn fetchable_buckets(&self) -> Vec<TableBucket> {
-        // always available now
-        self.log_scanner_status.fetchable_buckets(|_| true)
+        // Get buckets that are not already in the buffer
+        let buffered = self.log_fetch_buffer.buffered_buckets();
+        let buffered_set: HashSet<TableBucket> = buffered.into_iter().collect();
+        self.log_scanner_status
+            .fetchable_buckets(|tb| !buffered_set.contains(tb))
     }
 
     fn get_table_bucket_leader(&self, tb: &TableBucket) -> Option<i32> {
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 9295713cc2..0a803aec6d 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -39,6 +39,7 @@ use arrow_schema::SchemaRef;
 use arrow_schema::{DataType as ArrowDataType, Field};
 use byteorder::WriteBytesExt;
 use byteorder::{ByteOrder, LittleEndian};
+use bytes::Bytes;
 use crc32c::crc32c;
 use parking_lot::Mutex;
 use std::{
@@ -347,17 +348,17 @@ pub trait ToArrow {
     fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()>;
 }
 
-pub struct LogRecordsBatchs<'a> {
-    data: &'a [u8],
+pub struct LogRecordsBatches {
+    data: Bytes,
     current_pos: usize,
     remaining_bytes: usize,
 }
 
-impl<'a> LogRecordsBatchs<'a> {
-    pub fn new(data: &'a [u8]) -> Self {
+impl LogRecordsBatches {
+    pub fn new(data: Vec<u8>) -> Self {
         let remaining_bytes: usize = data.len();
         Self {
-            data,
+            data: Bytes::from(data),
             current_pos: 0,
             remaining_bytes,
         }
@@ -378,14 +379,17 @@ impl<'a> LogRecordsBatchs<'a> {
     }
 }
 
-impl<'a> Iterator for &'a mut LogRecordsBatchs<'a> {
-    type Item = LogRecordBatch<'a>;
+impl Iterator for LogRecordsBatches {
+    type Item = LogRecordBatch;
 
     fn next(&mut self) -> Option<Self::Item> {
         match self.next_batch_size() {
             Some(batch_size) => {
-                let data_slice = &self.data[self.current_pos..self.current_pos + batch_size];
-                let record_batch = LogRecordBatch::new(data_slice);
+                let start = self.current_pos;
+                let end = start + batch_size;
+                // `data` is a `Bytes` buffer, so `slice` hands the batch its own handle
+                // to this byte range; no borrow of `self` (and no lifetime) is needed
+                let record_batch = LogRecordBatch::new(self.data.slice(start..end));
                 self.current_pos += batch_size;
                 self.remaining_bytes -= batch_size;
                 Some(record_batch)
@@ -395,13 +399,13 @@ impl<'a> Iterator for &'a mut LogRecordsBatchs<'a> {
     }
 }
 
-pub struct LogRecordBatch<'a> {
-    data: &'a [u8],
+pub struct LogRecordBatch {
+    data: Bytes,
 }
 
 #[allow(dead_code)]
-impl<'a> LogRecordBatch<'a> {
-    pub fn new(data: &'a [u8]) -> Self {
+impl LogRecordBatch {
+    pub fn new(data: Bytes) -> Self {
         LogRecordBatch { data }
     }
 
@@ -710,6 +714,7 @@ pub struct ReadContext {
     target_schema: SchemaRef,
     full_schema: SchemaRef,
     projection: Option<Projection>,
+    is_from_remote: bool,
 }
 
 #[derive(Clone)]
@@ -723,24 +728,39 @@ struct Projection {
 }
 
 impl ReadContext {
-    pub fn new(arrow_schema: SchemaRef) -> ReadContext {
+    pub fn new(arrow_schema: SchemaRef, is_from_remote: bool) -> ReadContext {
         ReadContext {
             target_schema: arrow_schema.clone(),
             full_schema: arrow_schema,
             projection: None,
+            is_from_remote,
         }
     }
 
     pub fn with_projection_pushdown(
         arrow_schema: SchemaRef,
         projected_fields: Vec<usize>,
+        is_from_remote: bool,
     ) -> ReadContext {
         let target_schema = Self::project_schema(arrow_schema.clone(), projected_fields.as_slice());
-        let mut sorted_fields = projected_fields.clone();
-        sorted_fields.sort_unstable();
+        // TODO: this logic is a bit hard to follow; refactor it to mirror the
+        // Java implementation
+        let (need_do_reorder, sorted_fields) = {
+            // currently, projection pushdown isn't supported for remote reads of arrow logs,
+            // so reordering is only needed when the data is not from remote
+            if !is_from_remote {
+                let mut sorted_fields = projected_fields.clone();
+                sorted_fields.sort_unstable();
+                (!sorted_fields.eq(&projected_fields), sorted_fields)
+            } else {
+                // sorted_fields won't be used when need_do_reorder is false,
+                // let's use an empty vec directly
+                (false, vec![])
+            }
+        };
 
         let project = {
-            if !sorted_fields.eq(&projected_fields) {
+            if need_do_reorder {
                 // reordering is required
                 // Calculate reordering indexes to transform from sorted order to user-requested order
                 let mut reordering_indexes = Vec::with_capacity(projected_fields.len());
@@ -778,6 +798,7 @@ impl ReadContext {
             target_schema,
             full_schema: arrow_schema,
             projection: Some(project),
+            is_from_remote,
         }
     }
 
@@ -805,17 +826,24 @@ impl ReadContext {
     pub fn record_batch(&self, data: &[u8]) -> Result<RecordBatch> {
         let (batch_metadata, body_buffer, version) = parse_ipc_message(data)?;
 
-        // the record batch from server must be ordered by field pos,
-        // according to project to decide what arrow schema to use
-        // to parse the record batch
-        let resolve_schema = match self.projection {
-            Some(ref projection) => {
-                // projection, should use ordered schema by project field pos
-                projection.ordered_schema.clone()
-            }
-            None => {
-                // no projection, use target output schema
-                self.target_schema.clone()
+        let resolve_schema = {
+            // if from remote, no projection, need to use full schema
+            if self.is_from_remote {
+                self.full_schema.clone()
+            } else {
+                // the record batch from server must be ordered by field pos,
+                // according to project to decide what arrow schema to use
+                // to parse the record batch
+                match self.projection {
+                    Some(ref projection) => {
+                        // projection, should use ordered schema by project field pos
+                        projection.ordered_schema.clone()
+                    }
+                    None => {
+                        // no projection, use target output schema
+                        self.target_schema.clone()
+                    }
+                }
             }
         };
 
@@ -829,14 +857,27 @@ impl ReadContext {
         )?;
 
         let record_batch = match &self.projection {
-            Some(projection) if projection.reordering_needed => {
-                // Reorder columns if needed (when projection pushdown with non-sorted order)
-                let reordered_columns: Vec<_> = projection
-                    .reordering_indexes
-                    .iter()
-                    .map(|&idx| record_batch.column(idx).clone())
-                    .collect();
-                RecordBatch::try_new(self.target_schema.clone(), reordered_columns)?
+            Some(projection) => {
+                let reordered_columns = {
+                    // pick the column indexes (if any) used to rebuild the output batch
+                    if self.is_from_remote {
+                        Some(&projection.projected_fields)
+                    } else if projection.reordering_needed {
+                        Some(&projection.reordering_indexes)
+                    } else {
+                        None
+                    }
+                };
+                match reordered_columns {
+                    Some(reordered_columns) => {
+                        let arrow_columns = reordered_columns
+                            .iter()
+                            .map(|&idx| record_batch.column(idx).clone())
+                            .collect();
+                        RecordBatch::try_new(self.target_schema.clone(), arrow_columns)?
+                    }
+                    _ => record_batch,
+                }
             }
             _ => record_batch,
         };
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index a058bfe0bc..9eec98eaaf 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -148,7 +148,7 @@ mod table_test {
         }
 
         let scan_records = log_scanner
-            .poll(std::time::Duration::from_secs(5))
+            .poll(std::time::Duration::from_secs(60))
             .await
             .expect("Failed to poll");
 
@@ -178,7 +178,7 @@ mod table_test {
         }
 
         let scan_records_projected = log_scanner_projected
-            .poll(std::time::Duration::from_secs(5))
+            .poll(std::time::Duration::from_secs(10))
             .await
             .expect("Failed to poll");
 
@@ -227,7 +227,7 @@ mod table_test {
 
         // Poll for records
         let scan_records = log_scanner
-            .poll(tokio::time::Duration::from_secs(5))
+            .poll(tokio::time::Duration::from_secs(10))
             .await
             .expect("Failed to poll records");
 
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index ca61ff8502..bdbced95c4 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -175,6 +175,8 @@ mod table_remote_scan_test {
         let num_buckets = table.table_info().get_num_buckets();
         let log_scanner = table
             .new_scan()
+            .project(&[1, 0])
+            .unwrap()
             .create_log_scanner()
             .expect("Failed to create log scanner");
         for bucket_id in 0..num_buckets {
@@ -186,7 +188,7 @@ mod table_remote_scan_test {
 
         let mut records = Vec::with_capacity(record_count);
         let start = std::time::Instant::now();
-        const MAX_WAIT_DURATION: Duration = Duration::from_secs(30);
+        const MAX_WAIT_DURATION: Duration = Duration::from_secs(60);
         while records.len() < record_count {
             if start.elapsed() > MAX_WAIT_DURATION {
                 panic!(
@@ -208,8 +210,8 @@ mod table_remote_scan_test {
             let row = record.row();
             let expected_c1 = i as i32;
             let expected_c2 = format!("v{}", i);
-            assert_eq!(row.get_int(0), expected_c1, "c1 mismatch at index {}", i);
-            assert_eq!(row.get_string(1), expected_c2, "c2 mismatch at index {}", i);
+            assert_eq!(row.get_int(1), expected_c1, "c1 mismatch at index {}", i);
+            assert_eq!(row.get_string(0), expected_c2, "c2 mismatch at index {}", i);
         }
     }
 

From 7515f71591a94be910d4bb220bb81c4dea4ad250 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Mon, 22 Dec 2025 09:43:43 +0000
Subject: [PATCH 042/287] chore: fix bug where column prune won't work when
 compression is enabled (#108)

---
 fluss-rust/bindings/cpp/examples/example.cpp  |   1 -
 .../fluss/src/client/write/accumulator.rs     |   2 +
 .../crates/fluss/src/client/write/batch.rs    |   4 +
 .../src/compression/arrow_compression.rs      | 245 ++++++++++++++++++
 .../crates/fluss/src/compression/mod.rs       |  20 ++
 fluss-rust/crates/fluss/src/lib.rs            |   1 +
 fluss-rust/crates/fluss/src/metadata/table.rs |   5 +
 fluss-rust/crates/fluss/src/record/arrow.rs   |  21 +-
 .../crates/fluss/tests/integration/table.rs   |   1 -
 .../tests/integration/table_remote_scan.rs    |   1 -
 10 files changed, 296 insertions(+), 5 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/compression/arrow_compression.rs
 create mode 100644 fluss-rust/crates/fluss/src/compression/mod.rs

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 04f9ac64f5..6ff2b9b7e3 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -61,7 +61,6 @@ int main() {
     auto descriptor = fluss::TableDescriptor::NewBuilder()
                           .SetSchema(schema)
                           .SetBucketCount(3)
-                          .SetProperty("table.log.arrow.compression.type", "NONE")
                           .SetComment("cpp example table with 3 buckets")
                           .Build();
 
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index e4ca957827..215adbe695 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -94,6 +94,7 @@ impl RecordAccumulator {
 
         let table_path = &record.table_path;
         let table_info = cluster.get_table(table_path);
+        let arrow_compression_info = table_info.get_table_config().get_arrow_compression_info()?;
         let row_type = &cluster.get_table(table_path).row_type;
 
         let schema_id = table_info.schema_id;
@@ -102,6 +103,7 @@ impl RecordAccumulator {
             self.batch_id.fetch_add(1, Ordering::Relaxed),
             table_path.as_ref().clone(),
             schema_id,
+            arrow_compression_info,
             row_type,
             bucket_id,
             current_time_ms(),
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index 13b3d36402..ba04db4ac6 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -18,6 +18,7 @@
 use crate::BucketId;
 use crate::client::broadcast::{BatchWriteResult, BroadcastOnce};
 use crate::client::{ResultHandle, WriteRecord};
+use crate::compression::ArrowCompressionInfo;
 use crate::error::Result;
 use crate::metadata::{DataType, TablePath};
 use crate::record::MemoryLogRecordsArrowBuilder;
@@ -132,10 +133,12 @@ pub struct ArrowLogWriteBatch {
 }
 
 impl ArrowLogWriteBatch {
+    #[allow(clippy::too_many_arguments)]
     pub fn new(
         batch_id: i64,
         table_path: TablePath,
         schema_id: i32,
+        arrow_compression_info: ArrowCompressionInfo,
         row_type: &DataType,
         bucket_id: BucketId,
         create_ms: i64,
@@ -148,6 +151,7 @@ impl ArrowLogWriteBatch {
                 schema_id,
                 row_type,
                 to_append_record_batch,
+                arrow_compression_info,
             ),
         }
     }
diff --git a/fluss-rust/crates/fluss/src/compression/arrow_compression.rs b/fluss-rust/crates/fluss/src/compression/arrow_compression.rs
new file mode 100644
index 0000000000..32dfadb48c
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/compression/arrow_compression.rs
@@ -0,0 +1,245 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::{Error, Result};
+use arrow::ipc::CompressionType;
+use std::collections::HashMap;
+
+pub const TABLE_LOG_ARROW_COMPRESSION_ZSTD_LEVEL: &str = "table.log.arrow.compression.zstd.level";
+pub const TABLE_LOG_ARROW_COMPRESSION_TYPE: &str = "table.log.arrow.compression.type";
+pub const DEFAULT_NON_ZSTD_COMPRESSION_LEVEL: i32 = -1;
+pub const DEFAULT_ZSTD_COMPRESSION_LEVEL: i32 = 3;
+
+#[derive(Clone, Debug, PartialEq)]
+pub enum ArrowCompressionType {
+    None,
+    Lz4Frame,
+    Zstd,
+}
+
+impl ArrowCompressionType {
+    fn from_conf(properties: &HashMap<String, String>) -> Result<Self> {
+        match properties
+            .get(TABLE_LOG_ARROW_COMPRESSION_TYPE)
+            .map(|s| s.as_str())
+        {
+            Some("NONE") => Ok(Self::None),
+            Some("LZ4_FRAME") => Ok(Self::Lz4Frame),
+            Some("ZSTD") => Ok(Self::Zstd),
+            Some(other) => Err(Error::IllegalArgument {
+                message: format!("Unsupported compression type: {other}"),
+            }),
+            None => Ok(Self::Zstd),
+        }
+    }
+}
+
+#[derive(Clone, Debug)]
+pub struct ArrowCompressionInfo {
+    pub compression_type: ArrowCompressionType,
+    pub compression_level: i32,
+}
+
+impl ArrowCompressionInfo {
+    pub fn from_conf(properties: &HashMap<String, String>) -> Result<Self> {
+        let compression_type = ArrowCompressionType::from_conf(properties)?;
+
+        if compression_type != ArrowCompressionType::Zstd {
+            return Ok(Self {
+                compression_type,
+                compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+            });
+        }
+
+        match properties
+            .get(TABLE_LOG_ARROW_COMPRESSION_ZSTD_LEVEL)
+            .map(|s| s.as_str().parse::<i32>())
+        {
+            Some(Ok(level)) if !(1..=22).contains(&level) => Err(Error::IllegalArgument {
+                message: format!(
+                    "Invalid ZSTD compression level: {}. Expected a value between 1 and 22.",
+                    level
+                ),
+            }),
+            Some(Err(e)) => Err(Error::IllegalArgument {
+                message: format!(
+                    "Invalid ZSTD compression level. Expected a value between 1 and 22. {}",
+                    e
+                ),
+            }),
+
+            Some(Ok(level)) => Ok(Self {
+                compression_type,
+                compression_level: level,
+            }),
+            None => Ok(Self {
+                compression_type,
+                compression_level: DEFAULT_ZSTD_COMPRESSION_LEVEL,
+            }),
+        }
+    }
+
+    #[cfg(test)]
+    fn new(compression_type: ArrowCompressionType, compression_level: i32) -> ArrowCompressionInfo {
+        Self {
+            compression_type,
+            compression_level,
+        }
+    }
+
+    pub fn get_compression_type(&self) -> Option<CompressionType> {
+        match self.compression_type {
+            ArrowCompressionType::Zstd => Some(CompressionType::ZSTD),
+            ArrowCompressionType::Lz4Frame => Some(CompressionType::LZ4_FRAME),
+            ArrowCompressionType::None => None,
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use std::collections::HashMap;
+
+    #[test]
+    fn test_from_conf() {
+        assert_eq!(
+            ArrowCompressionType::from_conf(&HashMap::new()).unwrap(),
+            ArrowCompressionType::Zstd
+        );
+
+        assert_eq!(
+            ArrowCompressionType::from_conf(&mk_map(&[(
+                "table.log.arrow.compression.type",
+                "NONE"
+            )]))
+            .unwrap(),
+            ArrowCompressionType::None
+        );
+
+        assert_eq!(
+            ArrowCompressionType::from_conf(&mk_map(&[(
+                "table.log.arrow.compression.type",
+                "LZ4_FRAME"
+            )]))
+            .unwrap(),
+            ArrowCompressionType::Lz4Frame
+        );
+
+        assert_eq!(
+            ArrowCompressionType::from_conf(&mk_map(&[(
+                "table.log.arrow.compression.type",
+                "ZSTD"
+            )]))
+            .unwrap(),
+            ArrowCompressionType::Zstd
+        );
+    }
+
+    #[test]
+    fn test_from_conf_invalid_compression_type() {
+        let props = mk_map(&[("table.log.arrow.compression.type", "FOO")]);
+
+        assert!(
+            ArrowCompressionInfo::from_conf(&props)
+                .unwrap_err()
+                .to_string()
+                .contains(
+                    "Fluss hitting illegal argument error Unsupported compression type: FOO."
+                )
+        );
+    }
+
+    #[test]
+    fn test_from_conf_zstd_compression_level() {
+        let compression_info = ArrowCompressionInfo::from_conf(&mk_map(&[(
+            "table.log.arrow.compression.type",
+            "ZSTD",
+        )]));
+        assert_eq!(compression_info.unwrap().compression_level, 3);
+        let compression_info = ArrowCompressionInfo::from_conf(&mk_map(&[
+            ("table.log.arrow.compression.type", "ZSTD"),
+            ("table.log.arrow.compression.zstd.level", "1"),
+        ]));
+        assert_eq!(compression_info.unwrap().compression_level, 1);
+    }
+
+    #[test]
+    fn test_from_conf_compression_level_out_of_range() {
+        let props = mk_map(&[
+            ("table.log.arrow.compression.type", "ZSTD"),
+            ("table.log.arrow.compression.zstd.level", "0"),
+        ]);
+
+        assert!(
+            ArrowCompressionInfo::from_conf(&props)
+                .unwrap_err()
+                .to_string()
+                .contains("Expected a value between 1 and 22.")
+        );
+
+        let props = mk_map(&[
+            ("table.log.arrow.compression.type", "ZSTD"),
+            ("table.log.arrow.compression.zstd.level", "23"),
+        ]);
+
+        assert!(
+            ArrowCompressionInfo::from_conf(&props)
+                .unwrap_err()
+                .to_string()
+                .contains("Expected a value between 1 and 22.")
+        );
+    }
+
+    #[test]
+    fn test_from_conf_compression_level_parse_error() {
+        let props = mk_map(&[
+            ("table.log.arrow.compression.type", "ZSTD"),
+            ("table.log.arrow.compression.zstd.level", "not-a-number"),
+        ]);
+
+        assert!(
+            ArrowCompressionInfo::from_conf(&props)
+                .unwrap_err()
+                .to_string()
+                .contains("Expected a value between 1 and 22.")
+        );
+    }
+
+    #[test]
+    fn get_compression_type_maps_correctly() {
+        assert_eq!(
+            ArrowCompressionInfo::new(ArrowCompressionType::None, -1).get_compression_type(),
+            None
+        );
+        assert_eq!(
+            ArrowCompressionInfo::new(ArrowCompressionType::Lz4Frame, -1).get_compression_type(),
+            Some(CompressionType::LZ4_FRAME)
+        );
+        assert_eq!(
+            ArrowCompressionInfo::new(ArrowCompressionType::Zstd, -1).get_compression_type(),
+            Some(CompressionType::ZSTD)
+        );
+    }
+
+    fn mk_map(pairs: &[(&str, &str)]) -> HashMap<String, String> {
+        pairs
+            .iter()
+            .map(|(k, v)| (k.to_string(), v.to_string()))
+            .collect()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/compression/mod.rs b/fluss-rust/crates/fluss/src/compression/mod.rs
new file mode 100644
index 0000000000..2b86dba77d
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/compression/mod.rs
@@ -0,0 +1,20 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+mod arrow_compression;
+
+pub use arrow_compression::*;
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index 366edfc60a..25978ce0bb 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -26,6 +26,7 @@ mod cluster;
 pub mod config;
 pub mod error;
 
+mod compression;
 pub mod io;
 mod util;
 
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 770c4f2cfe..4f6c04bc61 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -15,6 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::compression::ArrowCompressionInfo;
 use crate::error::Error::InvalidTableError;
 use crate::error::{Error, Result};
 use crate::metadata::datatype::{DataField, DataType, RowType};
@@ -721,6 +722,10 @@ impl TableConfig {
     pub fn from_properties(properties: HashMap<String, String>) -> Self {
         TableConfig { properties }
     }
+
+    pub fn get_arrow_compression_info(&self) -> Result<ArrowCompressionInfo> {
+        ArrowCompressionInfo::from_conf(&self.properties)
+    }
 }
 
 impl TableInfo {
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 0a803aec6d..5a5115edfa 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 use crate::client::{Record, WriteRecord};
+use crate::compression::ArrowCompressionInfo;
 use crate::error::Result;
 use crate::metadata::DataType;
 use crate::record::{ChangeType, ScanRecord};
@@ -47,6 +48,7 @@ use std::{
     sync::Arc,
 };
 
+use arrow::ipc::writer::IpcWriteOptions;
 /// const for record batch
 pub const BASE_OFFSET_LENGTH: usize = 8;
 pub const LENGTH_LENGTH: usize = 4;
@@ -104,6 +106,7 @@ pub struct MemoryLogRecordsArrowBuilder {
     batch_sequence: i32,
     arrow_record_batch_builder: Box<dyn ArrowRecordBatchInnerBuilder>,
     is_closed: bool,
+    arrow_compression_info: ArrowCompressionInfo,
 }
 
 pub trait ArrowRecordBatchInnerBuilder: Send + Sync {
@@ -244,7 +247,12 @@ impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
 }
 
 impl MemoryLogRecordsArrowBuilder {
-    pub fn new(schema_id: i32, row_type: &DataType, to_append_record_batch: bool) -> Self {
+    pub fn new(
+        schema_id: i32,
+        row_type: &DataType,
+        to_append_record_batch: bool,
+        arrow_compression_info: ArrowCompressionInfo,
+    ) -> Self {
         let arrow_batch_builder: Box<dyn ArrowRecordBatchInnerBuilder> = {
             if to_append_record_batch {
                 Box::new(PrebuiltRecordBatchBuilder::default())
@@ -260,6 +268,7 @@ impl MemoryLogRecordsArrowBuilder {
             batch_sequence: NO_BATCH_SEQUENCE,
             is_closed: false,
             arrow_record_batch_builder: arrow_batch_builder,
+            arrow_compression_info,
         }
     }
 
@@ -289,7 +298,15 @@ impl MemoryLogRecordsArrowBuilder {
         // serialize arrow batch
         let mut arrow_batch_bytes = vec![];
         let table_schema = self.arrow_record_batch_builder.schema();
-        let mut writer = StreamWriter::try_new(&mut arrow_batch_bytes, &table_schema)?;
+        let compression_type = self.arrow_compression_info.get_compression_type();
+        let write_option =
+            IpcWriteOptions::try_with_compression(IpcWriteOptions::default(), compression_type);
+        let mut writer = StreamWriter::try_new_with_options(
+            &mut arrow_batch_bytes,
+            &table_schema,
+            write_option?,
+        )?;
+
         // get header len
         let header = writer.get_ref().len();
         let record_batch = self.arrow_record_batch_builder.build_arrow_record_batch()?;
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index 9eec98eaaf..3f7946ee9f 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -103,7 +103,6 @@ mod table_test {
                     .build()
                     .expect("Failed to build schema"),
             )
-            .property("table.log.arrow.compression.type", "NONE")
             .build()
             .expect("Failed to build table");
 
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index bdbced95c4..43c89b5468 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -142,7 +142,6 @@ mod table_remote_scan_test {
                     .build()
                     .expect("Failed to build schema"),
             )
-            .property("table.log.arrow.compression.type", "NONE")
             .build()
             .expect("Failed to build table");
 

From 2bf3701aaca36aef16767097644cecb0bf56149a Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Thu, 25 Dec 2025 14:02:50 +0000
Subject: [PATCH 043/287] chore: scanner should retry when bucket leader is not
 available (#102)

---
 .../crates/fluss/src/client/credentials.rs    |  4 +-
 .../crates/fluss/src/client/metadata.rs       | 51 +++++++++---
 .../crates/fluss/src/client/table/scanner.rs  | 78 ++++++++++++++++---
 .../crates/fluss/src/cluster/cluster.rs       | 52 ++++++++++---
 .../crates/fluss/src/rpc/server_connection.rs | 25 +++++-
 5 files changed, 175 insertions(+), 35 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/credentials.rs b/fluss-rust/crates/fluss/src/client/credentials.rs
index 8adfe48b99..ffb682ed7d 100644
--- a/fluss-rust/crates/fluss/src/client/credentials.rs
+++ b/fluss-rust/crates/fluss/src/client/credentials.rs
@@ -118,7 +118,9 @@ impl CredentialsCache {
 
     async fn refresh_from_server(&self) -> Result<HashMap<String, String>> {
         let cluster = self.metadata.get_cluster();
-        let server_node = cluster.get_one_available_server();
+        let server_node = cluster
+            .get_one_available_server()
+            .expect("no tablet server available");
         let conn = self.rpc_client.get_connection(server_node).await?;
 
         let request = GetSecurityTokenRequest::new();
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index 3c3ba4bd2e..a51442254c 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -16,38 +16,40 @@
 // under the License.
 
 use crate::cluster::{Cluster, ServerNode, ServerType};
+use crate::error::Result;
 use crate::metadata::{TableBucket, TablePath};
+use crate::proto::MetadataResponse;
 use crate::rpc::message::UpdateMetadataRequest;
 use crate::rpc::{RpcClient, ServerConnection};
+use log::info;
 use parking_lot::RwLock;
 use std::collections::HashSet;
 use std::net::SocketAddr;
 use std::sync::Arc;
 
-use crate::error::Result;
-use crate::proto::MetadataResponse;
-
 #[derive(Default)]
 pub struct Metadata {
     cluster: RwLock<Arc<Cluster>>,
     connections: Arc<RpcClient>,
+    bootstrap: Arc<str>,
 }
 
 impl Metadata {
-    pub async fn new(boot_strap: &str, connections: Arc<RpcClient>) -> Result<Self> {
-        let custer = Self::init_cluster(boot_strap, connections.clone()).await?;
+    pub async fn new(bootstrap: &str, connections: Arc<RpcClient>) -> Result<Self> {
+        let cluster = Self::init_cluster(bootstrap, connections.clone()).await?;
         Ok(Metadata {
-            cluster: RwLock::new(Arc::new(custer)),
+            cluster: RwLock::new(Arc::new(cluster)),
             connections,
+            bootstrap: bootstrap.into(),
         })
     }
 
     async fn init_cluster(boot_strap: &str, connections: Arc<RpcClient>) -> Result<Cluster> {
-        let socker_addrss = boot_strap.parse::<SocketAddr>().unwrap();
+        let socket_address = boot_strap.parse::<SocketAddr>().unwrap();
         let server_node = ServerNode::new(
             -1,
-            socker_addrss.ip().to_string(),
-            socker_addrss.port() as u32,
+            socket_address.ip().to_string(),
+            socket_address.port() as u32,
             ServerType::CoordinatorServer,
         );
         let con = connections.get_connection(&server_node).await?;
@@ -55,6 +57,20 @@ impl Metadata {
         Cluster::from_metadata_response(response, None)
     }
 
+    async fn reinit_cluster(&self) -> Result<()> {
+        let cluster = Self::init_cluster(&self.bootstrap, self.connections.clone()).await?;
+        *self.cluster.write() = cluster.into();
+        Ok(())
+    }
+
+    pub fn invalidate_server(&self, server_id: &i32, table_ids: Vec<i64>) {
+        // The write lock is held across both the read of the current snapshot and
+        // the store of its replacement, so no concurrent update can slip in between.
+        let mut current = self.cluster.write();
+        let pruned = Arc::new(current.invalidate_server(server_id, table_ids));
+        *current = pruned;
+    }
+
     pub async fn update(&self, metadata_response: MetadataResponse) -> Result<()> {
         let origin_cluster = self.cluster.read().clone();
         let new_cluster =
@@ -65,7 +81,22 @@ impl Metadata {
     }
 
     pub async fn update_tables_metadata(&self, table_paths: &HashSet<&TablePath>) -> Result<()> {
-        let server = self.cluster.read().get_one_available_server().clone();
+        let maybe_server = {
+            let guard = self.cluster.read();
+            guard.get_one_available_server().cloned()
+        };
+
+        let server = match maybe_server {
+            Some(s) => s,
+            None => {
+                info!(
+                    "No available tablet server to update metadata, attempting to re-initialize cluster using bootstrap server."
+                );
+                self.reinit_cluster().await?;
+                return Ok(());
+            }
+        };
+
         let conn = self.connections.get_connection(&server).await?;
 
         let update_table_paths: Vec<&TablePath> = table_paths.iter().copied().collect();
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 2246e2cbae..11bdfa3148 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -24,7 +24,7 @@ use crate::client::table::log_fetch_buffer::{
 use crate::client::table::remote_log::{
     RemoteLogDownloader, RemoteLogFetchInfo, RemotePendingFetch,
 };
-use crate::error::{Error, Result};
+use crate::error::{Error, Result, RpcError};
 use crate::metadata::{TableBucket, TableInfo, TablePath};
 use crate::proto::{FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
 use crate::record::{LogRecordsBatches, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
@@ -271,6 +271,8 @@ struct LogFetcher {
     credentials_cache: Arc<CredentialsCache>,
     log_fetch_buffer: Arc<LogFetchBuffer>,
     nodes_with_pending_fetch_requests: Arc<Mutex<HashSet<i32>>>,
+    table_path: TablePath,
+    is_partitioned: bool,
 }
 
 impl LogFetcher {
@@ -299,6 +301,8 @@ impl LogFetcher {
             credentials_cache: Arc::new(CredentialsCache::new(conns.clone(), metadata.clone())),
             log_fetch_buffer: Arc::new(LogFetchBuffer::new()),
             nodes_with_pending_fetch_requests: Arc::new(Mutex::new(HashSet::new())),
+            table_path: table_info.table_path.clone(),
+            is_partitioned: table_info.is_partitioned(),
         })
     }
 
@@ -315,9 +319,45 @@ impl LogFetcher {
         }
     }
 
+    async fn check_and_update_metadata(&self) -> Result<()> {
+        if self.is_partitioned {
+            // TODO: Implement partition-aware metadata refresh for buckets whose leaders are unknown.
+            // The implementation will likely need to collect partition IDs for such buckets and
+            // perform targeted metadata updates. Until then, we avoid computing unused partition_ids.
+            return Ok(());
+        }
+
+        let need_update = self
+            .fetchable_buckets()
+            .iter()
+            .any(|bucket| self.get_table_bucket_leader(bucket).is_none());
+
+        if !need_update {
+            return Ok(());
+        }
+
+        // TODO: Handle PartitionNotExist error
+        self.metadata
+            .update_tables_metadata(&HashSet::from([&self.table_path]))
+            .await
+            .or_else(|e| {
+                if let Error::RpcError { source, .. } = &e
+                    && matches!(source, RpcError::ConnectionError(_) | RpcError::Poisoned(_))
+                {
+                    warn!(
+                        "Retrying after encountering error while updating table metadata: {}",
+                        e
+                    );
+                    Ok(())
+                } else {
+                    Err(e)
+                }
+            })
+    }
+
     /// Send fetch requests asynchronously without waiting for responses
     async fn send_fetches(&self) -> Result<()> {
-        // todo: check update metadata like fluss-java in case leader changes
+        self.check_and_update_metadata().await?;
         let fetch_request = self.prepare_fetch_log_requests().await;
 
         for (leader, fetch_request) in fetch_request {
@@ -337,6 +377,7 @@ impl LogFetcher {
             let remote_log_downloader = Arc::clone(&self.remote_log_downloader);
             let creds_cache = self.credentials_cache.clone();
             let nodes_with_pending = self.nodes_with_pending_fetch_requests.clone();
+            let metadata = self.metadata.clone();
 
             // Spawn async task to handle the fetch request
             // Note: These tasks are not explicitly tracked or cancelled when LogFetcher is dropped.
@@ -351,27 +392,34 @@ impl LogFetcher {
                     nodes_with_pending.lock().remove(&leader);
                 });
 
-                let server_node = cluster
-                    .get_tablet_server(leader)
-                    .expect("todo: handle leader not exist.");
+                let server_node = match cluster.get_tablet_server(leader) {
+                    Some(node) => node,
+                    None => {
+                        warn!("No server node found for leader {}, retrying", leader);
+                        Self::handle_fetch_failure(metadata, &leader, &fetch_request).await;
+                        return;
+                    }
+                };
 
                 let con = match conns.get_connection(server_node).await {
                     Ok(con) => con,
                     Err(e) => {
-                        // todo: handle failed to get connection
-                        warn!("Failed to get connection to destination node: {e:?}");
+                        warn!("Retrying after error getting connection to destination node: {e:?}");
+                        Self::handle_fetch_failure(metadata, &leader, &fetch_request).await;
                         return;
                     }
                 };
 
                 let fetch_response = match con
-                    .request(message::FetchLogRequest::new(fetch_request))
+                    .request(message::FetchLogRequest::new(fetch_request.clone()))
                     .await
                 {
                     Ok(resp) => resp,
                     Err(e) => {
-                        // todo: handle fetch log from destination node
-                        warn!("Failed to fetch log from destination node {server_node:?}: {e:?}");
+                        warn!(
+                            "Retrying after error fetching log from destination node {server_node:?}: {e:?}"
+                        );
+                        Self::handle_fetch_failure(metadata, &leader, &fetch_request).await;
                         return;
                     }
                 };
@@ -387,7 +435,6 @@ impl LogFetcher {
                 )
                 .await
                 {
-                    // todo: handle fail to handle fetch response
                     error!("Fail to handle fetch response: {e:?}");
                 }
             });
@@ -396,6 +443,15 @@ impl LogFetcher {
         Ok(())
     }
 
+    async fn handle_fetch_failure(
+        metadata: Arc<Metadata>,
+        server_id: &i32,
+        request: &FetchLogRequest,
+    ) {
+        let table_ids = request.tables_req.iter().map(|r| r.table_id).collect();
+        metadata.invalidate_server(server_id, table_ids);
+    }
+
     /// Handle fetch response and add completed fetches to buffer
     async fn handle_fetch_response(
         fetch_response: crate::proto::FetchLogResponse,
diff --git a/fluss-rust/crates/fluss/src/cluster/cluster.rs b/fluss-rust/crates/fluss/src/cluster/cluster.rs
index a6f20a8262..f14d055f9b 100644
--- a/fluss-rust/crates/fluss/src/cluster/cluster.rs
+++ b/fluss-rust/crates/fluss/src/cluster/cluster.rs
@@ -22,7 +22,7 @@ use crate::metadata::{JsonSerde, TableBucket, TableDescriptor, TableInfo, TableP
 use crate::proto::MetadataResponse;
 use crate::rpc::{from_pb_server_node, from_pb_table_path};
 use rand::random_range;
-use std::collections::HashMap;
+use std::collections::{HashMap, HashSet};
 
 static EMPTY: Vec<BucketLocation> = Vec::new();
 
@@ -64,6 +64,43 @@ impl Cluster {
         }
     }
 
+    pub fn invalidate_server(&self, server_id: &i32, table_ids: Vec<i64>) -> Self {
+        let alive_tablet_servers_by_id = self
+            .alive_tablet_servers_by_id
+            .iter()
+            .filter(|&(id, _)| id != server_id)
+            .map(|(id, ts)| (*id, ts.clone()))
+            .collect();
+        // Map the given table ids to paths; ids this cluster does not know are skipped.
+        let table_paths: HashSet<&TablePath> = table_ids
+            .iter()
+            .filter_map(|id| self.table_path_by_id.get(id))
+            .collect();
+        // Drop the per-table bucket locations of every affected table.
+        let available_locations_by_path = self
+            .available_locations_by_path
+            .iter()
+            .filter(|&(path, _)| !table_paths.contains(path))
+            .map(|(path, locations)| (path.clone(), locations.clone()))
+            .collect();
+        // Likewise drop the per-bucket locations that belong to an affected table.
+        let available_locations_by_bucket = self
+            .available_locations_by_bucket
+            .iter()
+            .filter(|&(_bucket, location)| !table_paths.contains(&location.table_path))
+            .map(|(bucket, location)| (bucket.clone(), location.clone()))
+            .collect();
+        // Build the new snapshot; coordinator and table id/info maps are carried over as-is.
+        Cluster::new(
+            self.coordinator_server.clone(),
+            alive_tablet_servers_by_id,
+            available_locations_by_path,
+            available_locations_by_bucket,
+            self.table_id_by_path.clone(),
+            self.table_info_by_path.clone(),
+        )
+    }
+
     pub fn update(&mut self, cluster: Cluster) {
         let Cluster {
             coordinator_server,
@@ -214,15 +251,12 @@ impl Cluster {
             .unwrap_or(&EMPTY)
     }
 
-    pub fn get_one_available_server(&self) -> &ServerNode {
-        assert!(
-            !self.alive_tablet_servers.is_empty(),
-            "no alive tablet server in cluster"
-        );
+    pub fn get_one_available_server(&self) -> Option<&ServerNode> {
+        if self.alive_tablet_servers.is_empty() {
+            return None;
+        }
         let offset = random_range(0..self.alive_tablet_servers.len());
-        self.alive_tablet_servers
-            .get(offset)
-            .unwrap_or_else(|| panic!("can't find alive tab server by offset {offset}"))
+        self.alive_tablet_servers.get(offset)
     }
 
     pub fn get_bucket_count(&self, table_path: &TablePath) -> i32 {
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index fdeb56fbbe..441b175a24 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -66,13 +66,25 @@ impl RpcClient {
         server_node: &ServerNode,
     ) -> Result<ServerConnection, RpcError> {
         let server_id = server_node.uid();
-        {
+        let connection = {
             let connections = self.connections.read();
-            if let Some(connection) = connections.get(server_id) {
-                return Ok(connection.clone());
+            connections.get(server_id).cloned()
+        };
+
+        if let Some(conn) = connection {
+            if !conn.is_poisoned() {
+                return Ok(conn);
             }
         }
-        let new_server = self.connect(server_node).await?;
+
+        let new_server = match self.connect(server_node).await {
+            Ok(new_server) => new_server,
+            Err(e) => {
+                self.connections.write().remove(server_id);
+                return Err(e);
+            }
+        };
+
         self.connections
             .write()
             .insert(server_id.clone(), new_server.clone());
@@ -231,6 +243,11 @@ where
         }
     }
 
+    fn is_poisoned(&self) -> bool {
+        // The state lock is taken only for the duration of this check.
+        matches!(*self.state.lock(), ConnectionState::Poison(_))
+    }
+
     pub async fn request<R>(&self, msg: R) -> Result<R::ResponseBody, Error>
     where
         R: RequestBody + Send + WriteVersionedType<Vec<u8>>,

From 02ca3eb4f410017f9c72e482cc5605b59c13b41b Mon Sep 17 00:00:00 2001
From: Pavlos-Petros Tournaris <p.tournaris@gmail.com>
Date: Thu, 25 Dec 2025 16:47:42 +0200
Subject: [PATCH 044/287] chore: add integration test for list offsets (#52)

---------

Co-authored-by: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
---
 .../crates/fluss/tests/integration/table.rs   | 126 ++++++++++++++++++
 1 file changed, 126 insertions(+)

diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index 3f7946ee9f..006adcc45b 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -38,8 +38,11 @@ mod table_test {
     use arrow::array::record_batch;
     use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
     use fluss::row::InternalRow;
+    use fluss::rpc::message::OffsetSpec;
+    use jiff::Timestamp;
     use std::sync::Arc;
     use std::thread;
+
     fn before_all() {
         // Create a new tokio runtime in a separate thread
         let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
@@ -256,4 +259,127 @@ mod table_test {
             );
         }
     }
+
+    #[tokio::test]
+    async fn list_offsets() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss".to_string(), "test_list_offsets".to_string());
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        // Wait for table to be fully initialized
+        tokio::time::sleep(tokio::time::Duration::from_secs(2)).await;
+
+        // Test earliest offset (should be 0 for empty table)
+        let earliest_offsets = admin
+            .list_offsets(&table_path, &[0], OffsetSpec::Earliest)
+            .await
+            .expect("Failed to list earliest offsets");
+
+        assert_eq!(
+            earliest_offsets.get(&0),
+            Some(&0),
+            "Earliest offset should be 0 for bucket 0"
+        );
+
+        // Test latest offset (should be 0 for empty table)
+        let latest_offsets = admin
+            .list_offsets(&table_path, &[0], OffsetSpec::Latest)
+            .await
+            .expect("Failed to list latest offsets");
+
+        assert_eq!(
+            latest_offsets.get(&0),
+            Some(&0),
+            "Latest offset should be 0 for empty table"
+        );
+
+        let before_append_ms = Timestamp::now().as_millisecond();
+
+        // Append some records
+        let append_writer = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table")
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer();
+
+        let batch = record_batch!(
+            ("id", Int32, [1, 2, 3]),
+            ("name", Utf8, ["alice", "bob", "charlie"])
+        )
+        .unwrap();
+        append_writer
+            .append_arrow_batch(batch)
+            .await
+            .expect("Failed to append batch");
+
+        tokio::time::sleep(tokio::time::Duration::from_secs(1)).await;
+
+        let after_append_ms = Timestamp::now().as_millisecond();
+
+        // Test latest offset after appending (should be 3)
+        let latest_offsets_after = admin
+            .list_offsets(&table_path, &[0], OffsetSpec::Latest)
+            .await
+            .expect("Failed to list latest offsets after append");
+
+        assert_eq!(
+            latest_offsets_after.get(&0),
+            Some(&3),
+            "Latest offset should be 3 after appending 3 records"
+        );
+
+        // Test earliest offset after appending (should still be 0)
+        let earliest_offsets_after = admin
+            .list_offsets(&table_path, &[0], OffsetSpec::Earliest)
+            .await
+            .expect("Failed to list earliest offsets after append");
+
+        assert_eq!(
+            earliest_offsets_after.get(&0),
+            Some(&0),
+            "Earliest offset should still be 0"
+        );
+
+        // Test timestamp-based lookup: a timestamp taken before the append must map to
+        // offset 0, and one taken after the append must map to the end offset 3.
+        let timestamp_offsets = admin
+            .list_offsets(&table_path, &[0], OffsetSpec::Timestamp(before_append_ms))
+            .await
+            .expect("Failed to list offsets by timestamp");
+
+        assert_eq!(
+            timestamp_offsets.get(&0),
+            Some(&0),
+            "Timestamp before append should resolve to offset 0 (start of new data)"
+        );
+
+        let timestamp_offsets = admin
+            .list_offsets(&table_path, &[0], OffsetSpec::Timestamp(after_append_ms))
+            .await
+            .expect("Failed to list offsets by timestamp");
+
+        assert_eq!(
+            timestamp_offsets.get(&0),
+            Some(&3),
+            "Timestamp after append should resolve to offset 3 (no newer records)"
+        );
+    }
 }

From 4a225d501ce5219f7e96cc031bfbbe7561e43022 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Mon, 29 Dec 2025 11:14:01 +0000
Subject: [PATCH 045/287] feat: Introduce HashBucketAssigner (#117)

---
 fluss-rust/crates/fluss/src/bucketing/mod.rs  | 266 ++++++++++++++++++
 .../fluss/src/client/write/bucket_assigner.rs |  54 +++-
 .../fluss/src/client/write/writer_client.rs   |  13 +-
 fluss-rust/crates/fluss/src/lib.rs            |   1 +
 .../fluss/src/metadata/data_lake_format.rs    |  30 ++
 fluss-rust/crates/fluss/src/metadata/mod.rs   |   2 +
 fluss-rust/crates/fluss/src/util/mod.rs       |   2 +
 .../crates/fluss/src/util/murmur_hash.rs      | 222 +++++++++++++++
 8 files changed, 581 insertions(+), 9 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/bucketing/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
 create mode 100644 fluss-rust/crates/fluss/src/util/murmur_hash.rs

diff --git a/fluss-rust/crates/fluss/src/bucketing/mod.rs b/fluss-rust/crates/fluss/src/bucketing/mod.rs
new file mode 100644
index 0000000000..2611ac7ecf
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/bucketing/mod.rs
@@ -0,0 +1,266 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::DataLakeFormat;
+use crate::util::murmur_hash;
+
+pub trait BucketingFunction: Sync + Send {
+    fn bucketing(&self, bucket_key: &[u8], num_buckets: i32) -> Result<i32>;
+}
+
+#[allow(dead_code)]
+impl dyn BucketingFunction {
+    /// Provides the bucketing function for a given [DataLakeFormat]
+    ///
+    /// # Arguments
+    /// * `lake_format` - Data lake format or none
+    ///
+    /// # Returns
+    /// * BucketingFunction
+    pub fn of(lake_format: Option<&DataLakeFormat>) -> Box<dyn BucketingFunction> {
+        match lake_format {
+            None => Box::new(FlussBucketingFunction),
+            Some(DataLakeFormat::Paimon) => Box::new(PaimonBucketingFunction),
+            Some(DataLakeFormat::Lance) => Box::new(FlussBucketingFunction),
+            Some(DataLakeFormat::Iceberg) => Box::new(IcebergBucketingFunction),
+        }
+    }
+}
+
+struct FlussBucketingFunction;
+impl BucketingFunction for FlussBucketingFunction {
+    fn bucketing(&self, bucket_key: &[u8], num_buckets: i32) -> Result<i32> {
+        if bucket_key.is_empty() {
+            return Err(IllegalArgument {
+                message: "bucket_key must not be empty!".to_string(),
+            });
+        }
+
+        if num_buckets <= 0 {
+            return Err(IllegalArgument {
+                message: "num_buckets must be positive!".to_string(),
+            });
+        }
+
+        let key_hash = murmur_hash::fluss_hash_bytes(bucket_key)?;
+
+        Ok(murmur_hash::fluss_hash_i32(key_hash) % num_buckets)
+    }
+}
+
+struct PaimonBucketingFunction;
+impl BucketingFunction for PaimonBucketingFunction {
+    fn bucketing(&self, bucket_key: &[u8], num_buckets: i32) -> Result<i32> {
+        if bucket_key.is_empty() {
+            return Err(IllegalArgument {
+                message: "bucket_key must not be empty!".to_string(),
+            });
+        }
+
+        if num_buckets <= 0 {
+            return Err(IllegalArgument {
+                message: "num_buckets must be positive!".to_string(),
+            });
+        }
+
+        let key_hash = murmur_hash::fluss_hash_bytes(bucket_key)?;
+
+        Ok((key_hash % num_buckets).abs())
+    }
+}
+
+struct IcebergBucketingFunction;
+impl BucketingFunction for IcebergBucketingFunction {
+    fn bucketing(&self, bucket_key: &[u8], num_buckets: i32) -> Result<i32> {
+        if bucket_key.is_empty() {
+            return Err(IllegalArgument {
+                message: "bucket_key must not be empty!".to_string(),
+            });
+        }
+
+        if num_buckets <= 0 {
+            return Err(IllegalArgument {
+                message: "num_buckets must be positive!".to_string(),
+            });
+        }
+        // Clear the sign bit before the modulo so the bucket index is never negative.
+        Ok((murmur_hash::hash_bytes(bucket_key) as i32 & i32::MAX) % num_buckets)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_default_bucketing() {
+        let default_bucketing = <dyn BucketingFunction>::of(None);
+
+        let expected = 1;
+        let actual = default_bucketing.bucketing(&[00u8, 10u8], 7).unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 0;
+        let actual = default_bucketing
+            .bucketing(&[00u8, 10u8, 10u8, 10u8], 12)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 6;
+        let actual = default_bucketing
+            .bucketing("2bb87d68-baf9-4e64-90f9-f80910419fa6".as_bytes(), 16)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 6;
+        let actual = default_bucketing
+            .bucketing("The quick brown fox jumps over the lazy dog".as_bytes(), 8)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+    }
+
+    #[test]
+    fn test_paimon_bucketing() {
+        let paimon_bucketing = <dyn BucketingFunction>::of(Some(&DataLakeFormat::Paimon));
+
+        let expected = 1;
+        let actual = paimon_bucketing.bucketing(&[00u8, 10u8], 7).unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 11;
+        let actual = paimon_bucketing
+            .bucketing(&[00u8, 10u8, 10u8, 10u8], 12)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 12;
+        let actual = paimon_bucketing
+            .bucketing("2bb87d68-baf9-4e64-90f9-f80910419fa6".as_bytes(), 16)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 0;
+        let actual = paimon_bucketing
+            .bucketing("The quick brown fox jumps over the lazy dog".as_bytes(), 8)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+    }
+
+    #[test]
+    fn test_lance_bucketing() {
+        let lance_bucketing = <dyn BucketingFunction>::of(Some(&DataLakeFormat::Lance));
+
+        let expected = 1;
+        let actual = lance_bucketing.bucketing(&[00u8, 10u8], 7).unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 0;
+        let actual = lance_bucketing
+            .bucketing(&[00u8, 10u8, 10u8, 10u8], 12)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 6;
+        let actual = lance_bucketing
+            .bucketing("2bb87d68-baf9-4e64-90f9-f80910419fa6".as_bytes(), 16)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 6;
+        let actual = lance_bucketing
+            .bucketing("The quick brown fox jumps over the lazy dog".as_bytes(), 8)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+    }
+
+    #[test]
+    fn test_iceberg_bucketing() {
+        let iceberg_bucketing = <dyn BucketingFunction>::of(Some(&DataLakeFormat::Iceberg));
+
+        let expected = 3;
+        let actual = iceberg_bucketing.bucketing(&[00u8, 10u8], 7).unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 4;
+        let actual = iceberg_bucketing
+            .bucketing(&[00u8, 10u8, 10u8, 10u8], 12)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 12;
+        let actual = iceberg_bucketing
+            .bucketing("2bb87d68-baf9-4e64-90f9-f80910419fa6".as_bytes(), 16)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+
+        let expected = 3;
+        let actual = iceberg_bucketing
+            .bucketing("The quick brown fox jumps over the lazy dog".as_bytes(), 8)
+            .unwrap();
+        assert_eq!(
+            expected, actual,
+            "Expecting bucket to be {expected} but got {actual}"
+        );
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
index 991c5f9197..44b2673697 100644
--- a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
+++ b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
@@ -15,7 +15,10 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::bucketing::BucketingFunction;
 use crate::cluster::Cluster;
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
 use crate::metadata::TablePath;
 use rand::Rng;
 use std::sync::atomic::{AtomicI32, Ordering};
@@ -25,7 +28,7 @@ pub trait BucketAssigner: Sync + Send {
 
     fn on_new_batch(&self, cluster: &Cluster, prev_bucket_id: i32);
 
-    fn assign_bucket(&self, bucket_key: Option<&[u8]>, cluster: &Cluster) -> i32;
+    fn assign_bucket(&self, bucket_key: Option<&[u8]>, cluster: &Cluster) -> Result<i32>;
 }
 
 #[derive(Debug)]
@@ -91,12 +94,55 @@ impl BucketAssigner for StickyBucketAssigner {
         self.next_bucket(cluster, prev_bucket_id);
     }
 
-    fn assign_bucket(&self, _bucket_key: Option<&[u8]>, cluster: &Cluster) -> i32 {
+    fn assign_bucket(&self, _bucket_key: Option<&[u8]>, cluster: &Cluster) -> Result<i32> {
         let bucket_id = self.current_bucket_id.load(Ordering::Relaxed);
         if bucket_id < 0 {
-            self.next_bucket(cluster, bucket_id)
+            Ok(self.next_bucket(cluster, bucket_id))
         } else {
-            bucket_id
+            Ok(bucket_id)
         }
     }
 }
+
+/// A [BucketAssigner] which assigns based on a modulo hashing function
+pub struct HashBucketAssigner {
+    num_buckets: i32,
+    bucketing_function: Box<dyn BucketingFunction>,
+}
+
+#[allow(dead_code)]
+impl HashBucketAssigner {
+    /// Creates a new [HashBucketAssigner] based on the given [BucketingFunction].
+    /// See [BucketingFunction.of(Option<&DataLakeFormat>)] for bucketing functions.
+    ///
+    ///
+    /// # Arguments
+    /// * `num_buckets` - The number of buckets
+    /// * `bucketing_function` - The bucketing function
+    ///
+    /// # Returns
+    /// * [HashBucketAssigner] - The hash bucket assigner
+    pub fn new(num_buckets: i32, bucketing_function: Box<dyn BucketingFunction>) -> Self {
+        HashBucketAssigner {
+            num_buckets,
+            bucketing_function,
+        }
+    }
+}
+
+impl BucketAssigner for HashBucketAssigner {
+    fn abort_if_batch_full(&self) -> bool {
+        false
+    }
+
+    fn on_new_batch(&self, _: &Cluster, _: i32) {
+        // do nothing
+    }
+
+    fn assign_bucket(&self, bucket_key: Option<&[u8]>, _: &Cluster) -> Result<i32> {
+        let key = bucket_key.ok_or_else(|| IllegalArgument {
+            message: "no bucket key provided".to_string(),
+        })?;
+        self.bucketing_function.bucketing(key, self.num_buckets)
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index 042859afb4..22e0397212 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -91,7 +91,7 @@ impl WriterClient {
         let table_path = &record.table_path;
         let cluster = self.metadata.get_cluster();
 
-        let (bucket_assigner, bucket_id) = self.assign_bucket(table_path);
+        let (bucket_assigner, bucket_id) = self.assign_bucket(table_path)?;
 
         let mut result = self
             .accumulate
@@ -101,7 +101,7 @@ impl WriterClient {
         if result.abort_record_for_new_batch {
             let prev_bucket_id = bucket_id;
             bucket_assigner.on_new_batch(&cluster, prev_bucket_id);
-            let bucket_id = bucket_assigner.assign_bucket(None, &cluster);
+            let bucket_id = bucket_assigner.assign_bucket(None, &cluster)?;
             result = self
                 .accumulate
                 .append(record, bucket_id, &cluster, false)
@@ -114,7 +114,10 @@ impl WriterClient {
 
         Ok(result.result_handle.expect("result_handle should exist"))
     }
-    fn assign_bucket(&self, table_path: &Arc<TablePath>) -> (Arc<Box<dyn BucketAssigner>>, i32) {
+    fn assign_bucket(
+        &self,
+        table_path: &Arc<TablePath>,
+    ) -> Result<(Arc<Box<dyn BucketAssigner>>, i32)> {
         let cluster = self.metadata.get_cluster();
         let bucket_assigner = {
             if let Some(assigner) = self.bucket_assigners.get(table_path) {
@@ -126,8 +129,8 @@ impl WriterClient {
                 assigner
             }
         };
-        let bucket_id = bucket_assigner.assign_bucket(None, &cluster);
-        (bucket_assigner, bucket_id)
+        let bucket_id = bucket_assigner.assign_bucket(None, &cluster)?;
+        Ok((bucket_assigner, bucket_id))
     }
 
     pub async fn close(self) -> Result<()> {
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index 25978ce0bb..1bd72a4aac 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -26,6 +26,7 @@ mod cluster;
 pub mod config;
 pub mod error;
 
+mod bucketing;
 mod compression;
 pub mod io;
 mod util;
diff --git a/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs b/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
new file mode 100644
index 0000000000..76a23f8d96
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
@@ -0,0 +1,30 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+/// Identifies the logical format of a data lake table supported by Fluss.
+///
+/// This enum is typically used in metadata and configuration to distinguish
+/// between different table formats so that the appropriate integration and
+/// semantics can be applied.
+pub enum DataLakeFormat {
+    /// Apache Paimon data lake table format.
+    Paimon,
+    /// Lance columnar data format / lakehouse table format.
+    Lance,
+    /// Apache Iceberg data lake table format.
+    Iceberg,
+}
diff --git a/fluss-rust/crates/fluss/src/metadata/mod.rs b/fluss-rust/crates/fluss/src/metadata/mod.rs
index 87540071f3..9c0b1b472c 100644
--- a/fluss-rust/crates/fluss/src/metadata/mod.rs
+++ b/fluss-rust/crates/fluss/src/metadata/mod.rs
@@ -15,11 +15,13 @@
 // specific language governing permissions and limitations
 // under the License.
 
+mod data_lake_format;
 mod database;
 mod datatype;
 mod json_serde;
 mod table;
 
+pub use data_lake_format::*;
 pub use database::*;
 pub use datatype::*;
 pub use json_serde::*;
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
index d8c0db59d8..5f67290e43 100644
--- a/fluss-rust/crates/fluss/src/util/mod.rs
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -15,6 +15,8 @@
 // specific language governing permissions and limitations
 // under the License.
 
+pub mod murmur_hash;
+
 use crate::metadata::TableBucket;
 use linked_hash_map::LinkedHashMap;
 use std::collections::{HashMap, HashSet};
diff --git a/fluss-rust/crates/fluss/src/util/murmur_hash.rs b/fluss-rust/crates/fluss/src/util/murmur_hash.rs
new file mode 100644
index 0000000000..12229c717d
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/util/murmur_hash.rs
@@ -0,0 +1,222 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+/* This file is based on source code of Apache Flink Project (https://flink.apache.org/), licensed by the Apache
+ * Software Foundation (ASF) under the Apache License, Version 2.0. See the NOTICE file distributed with this work for
+ * additional information regarding copyright ownership. */
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+
+pub const MURMUR3_DEFAULT_SEED: u32 = 0;
+pub const FLINK_MURMUR3_DEFAULT_SEED: i32 = 42;
+
+const C1: u32 = 0xCC9E_2D51;
+const C2: u32 = 0x1B87_3593;
+const R1: u32 = 15;
+const R2: u32 = 13;
+const M: u32 = 5;
+const N: u32 = 0xE654_6B64;
+const CHUNK_SIZE: usize = 4;
+
+/// Hashes the data using 32-bit Murmur3 hash with 0 as seed
+///
+/// # Arguments
+/// * `data` - byte array containing data to be hashed
+///
+/// # Returns
+/// Returns hash value
+pub fn hash_bytes(data: &[u8]) -> u32 {
+    hash_bytes_with_seed(data, MURMUR3_DEFAULT_SEED)
+}
+
+#[inline(always)]
+fn hash_bytes_with_seed(data: &[u8], seed: u32) -> u32 {
+    let length = data.len();
+    let chunks = length / CHUNK_SIZE;
+    let length_aligned = chunks * CHUNK_SIZE;
+
+    let mut h1 = hash_full_chunks(data, seed);
+    let mut k1 = 0u32;
+
+    for (shift, &b) in data[length_aligned..].iter().enumerate() {
+        k1 |= (b as u32) << (8 * shift);
+    }
+
+    h1 ^= k1.wrapping_mul(C1).rotate_left(R1).wrapping_mul(C2);
+
+    fmix(h1, length)
+}
+
+/// Hashes the data using Fluss'/Flink's variant of 32-bit Murmur hash with 42 as seed and tail bytes mixed into hash byte-by-byte
+/// Maximum data array size supported is 2GB
+///
+/// # Arguments
+/// * `data` - byte array containing data to be hashed
+///
+/// # Returns
+/// * result of hashing, `Ok(hash_value)`
+///
+/// # Error
+/// Returns `Err(IllegalArgument)` if byte array is larger than 2GB
+pub fn fluss_hash_bytes(data: &[u8]) -> Result<i32> {
+    fluss_hash_bytes_with_seed(data, FLINK_MURMUR3_DEFAULT_SEED)
+}
+#[inline(always)]
+fn fluss_hash_bytes_with_seed(data: &[u8], seed: i32) -> Result<i32> {
+    let length = data.len();
+
+    if length >= i32::MAX as usize {
+        return Err(IllegalArgument {
+            message: format!("data array size {length} is bigger than supported"),
+        });
+    }
+
+    let chunks = length / CHUNK_SIZE;
+    let length_aligned = chunks * CHUNK_SIZE;
+
+    let mut h1 = hash_full_chunks(data, seed as u32);
+    // Fluss/Flink variant: every trailing byte goes through the full k1/h1 mix on its own.
+    for byte in &data[length_aligned..] {
+        let k1 = mix_k1(*byte as u32);
+        h1 = mix_h1(h1, k1);
+    }
+
+    Ok(fmix(h1, length) as i32)
+}
+
+#[inline(always)]
+fn hash_full_chunks(data: &[u8], seed: u32) -> u32 {
+    data.chunks_exact(CHUNK_SIZE).fold(seed, |h1, chunk| {
+        let block = u32::from_le_bytes(chunk.try_into().unwrap());
+        let k1 = mix_k1(block);
+        mix_h1(h1, k1)
+    })
+}
+
+#[inline(always)]
+fn mix_k1(k1: u32) -> u32 {
+    k1.wrapping_mul(C1).rotate_left(R1).wrapping_mul(C2)
+}
+
+#[inline(always)]
+fn mix_h1(h1: u32, k1: u32) -> u32 {
+    (h1 ^ k1).rotate_left(R2).wrapping_mul(M).wrapping_add(N)
+}
+
+// Finalization mix - force all bits of a hash block to avalanche
+#[inline(always)]
+fn fmix(mut h1: u32, length: usize) -> u32 {
+    h1 ^= length as u32;
+    bit_mix(h1)
+}
+
+/// Hashes an i32 using Fluss'/Flink's variant of Murmur
+///
+/// # Arguments
+/// * `input` - i32 value to be hashed
+///
+/// # Returns
+/// Returns hash value
+pub fn fluss_hash_i32(input: i32) -> i32 {
+    let mut input = input as u32;
+    input = input.wrapping_mul(C1);
+    input = input.rotate_left(R1);
+    input = input.wrapping_mul(C2);
+    input = input.rotate_left(R2);
+
+    input = input.wrapping_mul(M).wrapping_add(N);
+    input ^= CHUNK_SIZE as u32;
+    let output = bit_mix(input) as i32;
+
+    if output >= 0 {
+        output
+    } else if output != i32::MIN {
+        -output
+    } else {
+        0
+    }
+}
+
+const BIT_MIX_A: u32 = 0x85EB_CA6B;
+const BIT_MIX_B: u32 = 0xC2B2_AE35;
+
+#[inline(always)]
+fn bit_mix(mut input: u32) -> u32 {
+    input = input ^ (input >> 16);
+    input = input.wrapping_mul(BIT_MIX_A);
+    input = input ^ (input >> 13);
+    input = input.wrapping_mul(BIT_MIX_B);
+    input = input ^ (input >> 16);
+    input
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    #[test]
+    fn test_murmur3() {
+        // Empty input: the default seed (0) hashes to 0; other seeds give fixed non-zero values.
+        let empty_data_hash = hash_bytes(&[]);
+        assert_eq!(empty_data_hash, 0);
+
+        let empty_data_hash = hash_bytes_with_seed(&[], 1);
+        assert_eq!(0x514E_28B7, empty_data_hash);
+
+        let empty_data_hash = hash_bytes_with_seed(&[], 0xFFFF_FFFF);
+        assert_eq!(0x81F1_6F39, empty_data_hash);
+
+        let hash = hash_bytes("The quick brown fox jumps over the lazy dog".as_bytes());
+        assert_eq!(0x2E4F_F723, hash);
+
+        let hash = hash_bytes_with_seed(
+            "The quick brown fox jumps over the lazy dog".as_bytes(),
+            0x9747_B28C,
+        );
+        assert_eq!(0x2FA8_26CD, hash);
+    }
+
+    #[test]
+    fn test_flink_murmur() {
+        let empty_data_hash = fluss_hash_bytes_with_seed(&[], 0).expect("Failed to hash");
+        assert_eq!(empty_data_hash, 0);
+
+        let empty_data_hash = fluss_hash_bytes(&[]).expect("Failed to hash");
+        assert_eq!(0x087F_CD5C, empty_data_hash);
+
+        let empty_data_hash =
+            fluss_hash_bytes_with_seed(&[], 0xFFFF_FFFFu32 as i32).expect("Failed to hash");
+        assert_eq!(0x81F1_6F39u32 as i32, empty_data_hash);
+
+        let hash =
+            fluss_hash_bytes_with_seed("The quick brown fox jumps over the lazy dog".as_bytes(), 0)
+                .expect("Failed to hash");
+        assert_eq!(0x5FD2_0A20, hash);
+
+        let hash = fluss_hash_bytes("The quick brown fox jumps over the lazy dog".as_bytes())
+            .expect("Failed to hash");
+        assert_eq!(0x1BC6_F880, hash);
+
+        let hash = fluss_hash_i32(0);
+        assert_eq!(0x2362_F9DE, hash);
+
+        let hash = fluss_hash_i32(42);
+        assert_eq!(0x43A4_6E1D, hash);
+
+        let hash = fluss_hash_i32(-77);
+        assert_eq!(0x2EEB_27DE, hash);
+    }
+}

From eea8da1fd2fca46435f30d4f741cdd7b58c40a61 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Fri, 2 Jan 2026 08:35:43 +0000
Subject: [PATCH 046/287] chore: rust client to return error when currently
 unimplemented non-default ZSTD compression is configured (#120)

---------

Co-authored-by: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
---
 .../crates/fluss/src/client/table/scanner.rs  |  7 +---
 .../src/compression/arrow_compression.rs      | 41 ++++++++++++++-----
 2 files changed, 32 insertions(+), 16 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 11bdfa3148..bf3983917d 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -344,10 +344,7 @@ impl LogFetcher {
                 if let Error::RpcError { source, .. } = &e
                     && matches!(source, RpcError::ConnectionError(_) | RpcError::Poisoned(_))
                 {
-                    warn!(
-                        "Retrying after encountering error while updating table metadata: {}",
-                        e
-                    );
+                    warn!("Retrying after encountering error while updating table metadata: {e}");
                     Ok(())
                 } else {
                     Err(e)
@@ -395,7 +392,7 @@ impl LogFetcher {
                 let server_node = match cluster.get_tablet_server(leader) {
                     Some(node) => node,
                     None => {
-                        warn!("No server node found for leader {}, retrying", leader);
+                        warn!("No server node found for leader {leader}, retrying");
                         Self::handle_fetch_failure(metadata, &leader, &fetch_request).await;
                         return;
                     }
diff --git a/fluss-rust/crates/fluss/src/compression/arrow_compression.rs b/fluss-rust/crates/fluss/src/compression/arrow_compression.rs
index 32dfadb48c..8121a512b1 100644
--- a/fluss-rust/crates/fluss/src/compression/arrow_compression.rs
+++ b/fluss-rust/crates/fluss/src/compression/arrow_compression.rs
@@ -17,6 +17,7 @@
 
 use crate::error::{Error, Result};
 use arrow::ipc::CompressionType;
+use arrow_schema::ArrowError;
 use std::collections::HashMap;
 
 pub const TABLE_LOG_ARROW_COMPRESSION_ZSTD_LEVEL: &str = "table.log.arrow.compression.zstd.level";
@@ -71,21 +72,31 @@ impl ArrowCompressionInfo {
         {
             Some(Ok(level)) if !(1..=22).contains(&level) => Err(Error::IllegalArgument {
                 message: format!(
-                    "Invalid ZSTD compression level: {}. Expected a value between 1 and 22.",
-                    level
+                    "Invalid ZSTD compression level: {level}. Expected a value between 1 and 22."
                 ),
             }),
             Some(Err(e)) => Err(Error::IllegalArgument {
                 message: format!(
-                    "Invalid ZSTD compression level. Expected a value between 1 and 22. {}",
-                    e
+                    "Invalid ZSTD compression level. Expected a value between 1 and 22. {e}"
                 ),
             }),
-
-            Some(Ok(level)) => Ok(Self {
-                compression_type,
-                compression_level: level,
-            }),
+            Some(Ok(level)) => {
+                // TODO Remove once non-default ZSTD compression level is implemented https://github.com/apache/fluss-rust/issues/109
+                if level != DEFAULT_ZSTD_COMPRESSION_LEVEL {
+                    return Err(Error::ArrowError {
+                        message: format!(
+                            "Rust client currently only implements default ZSTD compression level {DEFAULT_ZSTD_COMPRESSION_LEVEL}. Got: {level}."
+                        ),
+                        source: ArrowError::NotYetImplemented(format!(
+                            "zstd compression level {level}."
+                        )),
+                    });
+                }
+                Ok(Self {
+                    compression_type,
+                    compression_level: level,
+                })
+            }
             None => Ok(Self {
                 compression_type,
                 compression_level: DEFAULT_ZSTD_COMPRESSION_LEVEL,
@@ -171,11 +182,19 @@ mod tests {
             "ZSTD",
         )]));
         assert_eq!(compression_info.unwrap().compression_level, 3);
-        let compression_info = ArrowCompressionInfo::from_conf(&mk_map(&[
+    }
+
+    // TODO Remove once non-default ZSTD compression level is implemented https://github.com/apache/fluss-rust/issues/109
+    #[test]
+    fn test_from_conf_zstd_compression_level_error_when_non_default() {
+        let result = ArrowCompressionInfo::from_conf(&mk_map(&[
             ("table.log.arrow.compression.type", "ZSTD"),
             ("table.log.arrow.compression.zstd.level", "1"),
         ]));
-        assert_eq!(compression_info.unwrap().compression_level, 1);
+        assert!(result.is_err());
+        assert!(result.unwrap_err().to_string().contains(
+            "Rust client currently only implements default ZSTD compression level 3. Got: 1."
+        ));
     }
 
     #[test]

From 3d8483ef53338a9c67fa7f157990d3c283d5e7c7 Mon Sep 17 00:00:00 2001
From: Andrea Bozzo <andreabozzo92@gmail.com>
Date: Fri, 2 Jan 2026 09:54:09 +0100
Subject: [PATCH 047/287] chore: add integration tests for subscribe_batch and
 project_by_name (#116)

---------

Co-authored-by: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
---
 fluss-rust/bindings/cpp/src/lib.rs            |   2 +-
 .../crates/fluss/src/client/table/scanner.rs  |   6 +-
 .../crates/fluss/tests/integration/table.rs   | 243 ++++++++++++------
 3 files changed, 169 insertions(+), 82 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index cd1803b888..2d37763673 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -625,7 +625,7 @@ impl LogScanner {
             bucket_offsets.insert(sub.bucket_id, sub.offset);
         }
 
-        let result = RUNTIME.block_on(async { self.inner.subscribe_batch(bucket_offsets).await });
+        let result = RUNTIME.block_on(async { self.inner.subscribe_batch(&bucket_offsets).await });
 
         match result {
             Ok(_) => ok_result(),
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index bf3983917d..0acaac890f 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -223,7 +223,7 @@ impl LogScanner {
         Ok(())
     }
 
-    pub async fn subscribe_batch(&self, bucket_offsets: HashMap<i32, i64>) -> Result<()> {
+    pub async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
         self.metadata
             .check_and_update_table_metadata(from_ref(&self.table_path))
             .await?;
@@ -236,8 +236,8 @@ impl LogScanner {
 
         let mut scan_bucket_offsets = HashMap::new();
         for (bucket_id, offset) in bucket_offsets {
-            let table_bucket = TableBucket::new(self.table_id, bucket_id);
-            scan_bucket_offsets.insert(table_bucket, offset);
+            let table_bucket = TableBucket::new(self.table_id, *bucket_id);
+            scan_bucket_offsets.insert(table_bucket, *offset);
         }
 
         self.log_scanner_status
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index 006adcc45b..0ac34c7635 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -36,12 +36,16 @@ mod table_test {
     use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
     use crate::integration::utils::create_table;
     use arrow::array::record_batch;
+    use fluss::client::{FlussTable, TableScan};
     use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
+    use fluss::record::ScanRecord;
     use fluss::row::InternalRow;
     use fluss::rpc::message::OffsetSpec;
     use jiff::Timestamp;
+    use std::collections::HashMap;
     use std::sync::Arc;
     use std::thread;
+    use std::time::Duration;
 
     fn before_all() {
         // Create a new tokio runtime in a separate thread
@@ -137,6 +141,11 @@ mod table_test {
 
         append_writer.flush().await.expect("Failed to flush");
 
+        // Create scanner to verify appended records
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
         let num_buckets = table.table_info().get_num_buckets();
         let log_scanner = table
             .new_scan()
@@ -149,84 +158,6 @@ mod table_test {
                 .expect("Failed to subscribe");
         }
 
-        let scan_records = log_scanner
-            .poll(std::time::Duration::from_secs(60))
-            .await
-            .expect("Failed to poll");
-
-        let mut records: Vec<_> = scan_records.into_iter().collect();
-        records.sort_by_key(|r| r.offset());
-
-        assert_eq!(records.len(), 6, "Should have 6 records");
-        for (i, record) in records.iter().enumerate() {
-            let row = record.row();
-            let expected_c1 = (i + 1) as i32;
-            let expected_c2 = format!("a{}", i + 1);
-            assert_eq!(row.get_int(0), expected_c1, "c1 mismatch at index {}", i);
-            assert_eq!(row.get_string(1), expected_c2, "c2 mismatch at index {}", i);
-        }
-
-        let log_scanner_projected = table
-            .new_scan()
-            .project(&[1, 0])
-            .expect("Failed to project")
-            .create_log_scanner()
-            .expect("Failed to create log scanner");
-        for bucket_id in 0..num_buckets {
-            log_scanner_projected
-                .subscribe(bucket_id, 0)
-                .await
-                .expect("Failed to subscribe");
-        }
-
-        let scan_records_projected = log_scanner_projected
-            .poll(std::time::Duration::from_secs(10))
-            .await
-            .expect("Failed to poll");
-
-        let mut records_projected: Vec<_> = scan_records_projected.into_iter().collect();
-        records_projected.sort_by_key(|r| r.offset());
-
-        assert_eq!(
-            records_projected.len(),
-            6,
-            "Should have 6 records with projection"
-        );
-        for (i, record) in records_projected.iter().enumerate() {
-            let row = record.row();
-            let expected_c2 = format!("a{}", i + 1);
-            let expected_c1 = (i + 1) as i32;
-            assert_eq!(
-                row.get_string(0),
-                expected_c2,
-                "Projected c2 (first column) mismatch at index {}",
-                i
-            );
-            assert_eq!(
-                row.get_int(1),
-                expected_c1,
-                "Projected c1 (second column) mismatch at index {}",
-                i
-            );
-        }
-
-        // Create scanner to verify appended records
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let table_scan = table.new_scan();
-        let log_scanner = table_scan
-            .create_log_scanner()
-            .expect("Failed to create log scanner");
-
-        // Subscribe to bucket 0 starting from offset 0
-        log_scanner
-            .subscribe(0, 0)
-            .await
-            .expect("Failed to subscribe to bucket");
-
         // Poll for records
         let scan_records = log_scanner
             .poll(tokio::time::Duration::from_secs(10))
@@ -382,4 +313,160 @@ mod table_test {
             "Timestamp after append should resolve to offset 0 (no newer records)"
         );
     }
+
+    #[tokio::test]
+    async fn test_project() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss".to_string(), "test_project".to_string());
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("col_a", DataTypes::int())
+                    .column("col_b", DataTypes::string())
+                    .column("col_c", DataTypes::int())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        // Append 3 records
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer();
+
+        let batch = record_batch!(
+            ("col_a", Int32, [1, 2, 3]),
+            ("col_b", Utf8, ["x", "y", "z"]),
+            ("col_c", Int32, [10, 20, 30])
+        )
+        .unwrap();
+        append_writer
+            .append_arrow_batch(batch)
+            .await
+            .expect("Failed to append batch");
+        append_writer.flush().await.expect("Failed to flush");
+
+        // Test project_by_name: select col_b and col_c only
+        let records = scan_table(&table, |scan| {
+            scan.project_by_name(&["col_b", "col_c"])
+                .expect("Failed to project by name")
+        })
+        .await;
+
+        assert_eq!(
+            records.len(),
+            3,
+            "Should have 3 records with project_by_name"
+        );
+
+        // Verify projected columns are in the correct order (col_b, col_c)
+        let expected_col_b = ["x", "y", "z"];
+        let expected_col_c = [10, 20, 30];
+
+        for (i, record) in records.iter().enumerate() {
+            let row = record.row();
+            // col_b is now at index 0, col_c is at index 1
+            assert_eq!(
+                row.get_string(0),
+                expected_col_b[i],
+                "col_b mismatch at index {}",
+                i
+            );
+            assert_eq!(
+                row.get_int(1),
+                expected_col_c[i],
+                "col_c mismatch at index {}",
+                i
+            );
+        }
+
+        // test project by column indices
+        let records = scan_table(&table, |scan| {
+            scan.project(&[1, 0]).expect("Failed to project by indices")
+        })
+        .await;
+
+        assert_eq!(
+            records.len(),
+            3,
+            "Should have 3 records with project by indices"
+        );
+        // Verify projected columns are in the correct order (col_b, col_a)
+        let expected_col_b = ["x", "y", "z"];
+        let expected_col_a = [1, 2, 3];
+
+        for (i, record) in records.iter().enumerate() {
+            let row = record.row();
+            // col_b is now at index 0, col_a is at index 1
+            assert_eq!(
+                row.get_string(0),
+                expected_col_b[i],
+                "col_b mismatch at index {}",
+                i
+            );
+            assert_eq!(
+                row.get_int(1),
+                expected_col_a[i],
+                "col_a mismatch at index {}",
+                i
+            );
+        }
+
+        // Test error case: empty column names should fail
+        let result = table.new_scan().project_by_name(&[]);
+        assert!(
+            result.is_err(),
+            "project_by_name with empty names should fail"
+        );
+
+        // Test error case: non-existent column should fail
+        let result = table.new_scan().project_by_name(&["nonexistent_column"]);
+        assert!(
+            result.is_err(),
+            "project_by_name with non-existent column should fail"
+        );
+    }
+
+    async fn scan_table<'a>(
+        table: &FlussTable<'a>,
+        setup_scan: impl FnOnce(TableScan) -> TableScan,
+    ) -> Vec<ScanRecord> {
+        // 1. build log scanner
+        let log_scanner = setup_scan(table.new_scan())
+            .create_log_scanner()
+            .expect("Failed to create log scanner");
+
+        // 2. subscribe
+        let mut bucket_offsets = HashMap::new();
+        bucket_offsets.insert(0, 0);
+        log_scanner
+            .subscribe_batch(&bucket_offsets)
+            .await
+            .expect("Failed to subscribe");
+
+        // 3. poll records
+        let scan_records = log_scanner
+            .poll(Duration::from_secs(10))
+            .await
+            .expect("Failed to poll");
+
+        // 4. collect and sort
+        let mut records: Vec<_> = scan_records.into_iter().collect();
+        records.sort_by_key(|r| r.offset());
+        records
+    }
 }

From 2fc00e2c13fad60b9efeb9fb7c6fa2317bdbde47 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Fri, 2 Jan 2026 19:37:56 +0800
Subject: [PATCH 048/287] feat: support bazel build for cpp bindings (#107)

---
 fluss-rust/bindings/cpp/.bazelrc     |  37 +++
 fluss-rust/bindings/cpp/.gitignore   |   9 +
 fluss-rust/bindings/cpp/BUILD.bazel  | 342 +++++++++++++++++++++++++++
 fluss-rust/bindings/cpp/MODULE.bazel |  23 ++
 fluss-rust/bindings/cpp/ci.sh        | 100 ++++++++
 5 files changed, 511 insertions(+)
 create mode 100644 fluss-rust/bindings/cpp/.bazelrc
 create mode 100644 fluss-rust/bindings/cpp/BUILD.bazel
 create mode 100644 fluss-rust/bindings/cpp/MODULE.bazel
 create mode 100755 fluss-rust/bindings/cpp/ci.sh

diff --git a/fluss-rust/bindings/cpp/.bazelrc b/fluss-rust/bindings/cpp/.bazelrc
new file mode 100644
index 0000000000..ce7d81f82a
--- /dev/null
+++ b/fluss-rust/bindings/cpp/.bazelrc
@@ -0,0 +1,37 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+# Bazel configuration for fluss-rust C++ bindings
+
+# Enable BzlMod
+common --enable_bzlmod
+
+# Debug configuration (matches BUILD.bazel settings)
+build:debug --compilation_mode=dbg
+build:debug --copt=-g3
+build:debug --copt=-ggdb
+build:debug --copt=-O0
+build:debug --copt=-fno-omit-frame-pointer
+build:debug --copt=-DDEBUG
+build:debug --strip=never
+build:debug --linkopt=-g
+
+# Release configuration
+build:release --compilation_mode=opt
+build:release --copt=-O2
+build:release --copt=-DNDEBUG
+build:release --strip=always
diff --git a/fluss-rust/bindings/cpp/.gitignore b/fluss-rust/bindings/cpp/.gitignore
index 6836e70c06..43f761c951 100644
--- a/fluss-rust/bindings/cpp/.gitignore
+++ b/fluss-rust/bindings/cpp/.gitignore
@@ -5,3 +5,12 @@ cmake-build-*/
 *.a
 *.so
 *.dylib
+
+# Bazel build outputs
+bazel-build/
+bazel-bin
+bazel-out
+bazel-testlogs
+bazel-cpp
+bazel-*
+MODULE.bazel.lock
diff --git a/fluss-rust/bindings/cpp/BUILD.bazel b/fluss-rust/bindings/cpp/BUILD.bazel
new file mode 100644
index 0000000000..81d483cb72
--- /dev/null
+++ b/fluss-rust/bindings/cpp/BUILD.bazel
@@ -0,0 +1,342 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+licenses(["notice"])
+
+load("@rules_cc//cc:defs.bzl", "cc_binary", "cc_import", "cc_library")
+
+config_setting(
+    name = "debug_mode",
+    values = {"compilation_mode": "dbg"},
+)
+
+config_setting(
+    name = "fastbuild_mode",
+    values = {"compilation_mode": "fastbuild"},
+)
+
+config_setting(
+    name = "release_mode",
+    values = {"compilation_mode": "opt"},
+)
+
+genrule(
+    name = "cargo_build_debug",
+    srcs = glob([
+        "src/**/*.rs",
+        "Cargo.toml",
+    ]),
+    outs = [
+        "rust_lib_debug.a",
+        "rust_bridge_cc_debug.cc",
+        "rust_bridge_h_debug.h",
+        "src/lib.rs_debug.h",
+        "cxxbridge/rust/cxx_debug.h",
+    ],
+    cmd = """
+        set -e
+        EXECROOT=$$(pwd)
+        OUTPUT_LIB=$(location rust_lib_debug.a)
+        OUTPUT_CC=$(location rust_bridge_cc_debug.cc)
+        OUTPUT_H=$(location rust_bridge_h_debug.h)
+        OUTPUT_SRC_H=$(location src/lib.rs_debug.h)
+        OUTPUT_CXX_H=$(location cxxbridge/rust/cxx_debug.h)
+        # Resolve real source path from sandbox symlink
+        SANDBOX_CARGO=$(location Cargo.toml)
+        REAL_CARGO=$$(readlink -f $$SANDBOX_CARGO 2>/dev/null || python3 -c "import os; print(os.path.realpath('$$SANDBOX_CARGO'))")
+        CARGO_DIR=$$(dirname $$REAL_CARGO)
+        # Find Cargo workspace root (fluss-rust directory, 2 levels up from bindings/cpp)
+        WORKSPACE_ROOT=$$(cd $$CARGO_DIR/../.. && pwd)
+        if [ ! -f $$WORKSPACE_ROOT/Cargo.toml ]; then
+            echo "Error: Cannot find workspace root Cargo.toml at $$WORKSPACE_ROOT" >&2
+            exit 1
+        fi
+        cd $$WORKSPACE_ROOT
+        cargo build --manifest-path $$CARGO_DIR/Cargo.toml
+        CARGO_TARGET_DIR=$$WORKSPACE_ROOT/target
+        # cxxbridge uses the Cargo package name (with hyphen): fluss-cpp
+        RUST_BRIDGE_DIR=$$CARGO_TARGET_DIR/cxxbridge/fluss-cpp/src
+        # Cargo converts hyphens to underscores in library file names: libfluss_cpp.a
+        RUST_LIB=$$CARGO_TARGET_DIR/debug/libfluss_cpp.a
+        if [ ! -f $$RUST_LIB ]; then
+            echo "Error: Rust library not found at $$RUST_LIB" >&2
+            exit 1
+        fi
+        if [ ! -f $$RUST_BRIDGE_DIR/lib.rs.cc ]; then
+            echo "Error: cxxbridge CC file not found at $$RUST_BRIDGE_DIR/lib.rs.cc" >&2
+            exit 1
+        fi
+        if [ ! -f $$RUST_BRIDGE_DIR/lib.rs.h ]; then
+            echo "Error: cxxbridge header file not found at $$RUST_BRIDGE_DIR/lib.rs.h" >&2
+            exit 1
+        fi
+        cd $$EXECROOT
+        mkdir -p $$(dirname $$OUTPUT_SRC_H) $$(dirname $$OUTPUT_CXX_H)
+        cp $$RUST_LIB $$OUTPUT_LIB || (echo "Failed to copy $$RUST_LIB to $$OUTPUT_LIB" >&2; exit 1)
+        cp $$RUST_BRIDGE_DIR/lib.rs.cc $$OUTPUT_CC || (echo "Failed to copy $$RUST_BRIDGE_DIR/lib.rs.cc to $$OUTPUT_CC" >&2; exit 1)
+        cp $$RUST_BRIDGE_DIR/lib.rs.h $$OUTPUT_H || (echo "Failed to copy $$RUST_BRIDGE_DIR/lib.rs.h to $$OUTPUT_H" >&2; exit 1)
+        cp $$RUST_BRIDGE_DIR/lib.rs.h $$OUTPUT_SRC_H || (echo "Failed to copy $$RUST_BRIDGE_DIR/lib.rs.h to $$OUTPUT_SRC_H" >&2; exit 1)
+        CXX_H_SOURCE=$$CARGO_TARGET_DIR/cxxbridge/rust/cxx.h
+        if [ ! -f $$CXX_H_SOURCE ] && [ ! -L $$CXX_H_SOURCE ]; then
+            echo "Error: cxx.h not found at $$CXX_H_SOURCE" >&2
+            exit 1
+        fi
+        cp -L $$CXX_H_SOURCE $$OUTPUT_CXX_H || (echo "Failed to copy $$CXX_H_SOURCE to $$OUTPUT_CXX_H" >&2; exit 1)
+    """,
+    message = "Building Rust library (debug) with cargo...",
+    local = 1,
+)
+
+genrule(
+    name = "cargo_build_release",
+    srcs = glob([
+        "src/**/*.rs",
+        "Cargo.toml",
+    ]),
+    outs = [
+        "rust_lib_release.a",
+        "rust_bridge_cc_release.cc",
+        "rust_bridge_h_release.h",
+        "src/lib.rs_release.h",
+        "cxxbridge/rust/cxx_release.h",
+    ],
+    cmd = """
+        set -e
+        EXECROOT=$$(pwd)
+        OUTPUT_LIB=$(location rust_lib_release.a)
+        OUTPUT_CC=$(location rust_bridge_cc_release.cc)
+        OUTPUT_H=$(location rust_bridge_h_release.h)
+        OUTPUT_SRC_H=$(location src/lib.rs_release.h)
+        OUTPUT_CXX_H=$(location cxxbridge/rust/cxx_release.h)
+        # Resolve real source path from sandbox symlink
+        SANDBOX_CARGO=$(location Cargo.toml)
+        REAL_CARGO=$$(readlink -f $$SANDBOX_CARGO 2>/dev/null || python3 -c "import os; print(os.path.realpath('$$SANDBOX_CARGO'))")
+        CARGO_DIR=$$(dirname $$REAL_CARGO)
+        # Find Cargo workspace root (fluss-rust directory, 2 levels up from bindings/cpp)
+        WORKSPACE_ROOT=$$(cd $$CARGO_DIR/../.. && pwd)
+        if [ ! -f $$WORKSPACE_ROOT/Cargo.toml ]; then
+            echo "Error: Cannot find workspace root Cargo.toml at $$WORKSPACE_ROOT" >&2
+            exit 1
+        fi
+        cd $$WORKSPACE_ROOT
+        cargo build --release --manifest-path $$CARGO_DIR/Cargo.toml
+        CARGO_TARGET_DIR=$$WORKSPACE_ROOT/target
+        # cxxbridge uses the Cargo package name (with hyphen): fluss-cpp
+        RUST_BRIDGE_DIR=$$CARGO_TARGET_DIR/cxxbridge/fluss-cpp/src
+        # Cargo converts hyphens to underscores in library file names: libfluss_cpp.a
+        RUST_LIB=$$CARGO_TARGET_DIR/release/libfluss_cpp.a
+        if [ ! -f $$RUST_LIB ]; then
+            echo "Error: Rust library not found at $$RUST_LIB" >&2
+            exit 1
+        fi
+        if [ ! -f $$RUST_BRIDGE_DIR/lib.rs.cc ]; then
+            echo "Error: cxxbridge CC file not found at $$RUST_BRIDGE_DIR/lib.rs.cc" >&2
+            exit 1
+        fi
+        if [ ! -f $$RUST_BRIDGE_DIR/lib.rs.h ]; then
+            echo "Error: cxxbridge header file not found at $$RUST_BRIDGE_DIR/lib.rs.h" >&2
+            exit 1
+        fi
+        cd $$EXECROOT
+        mkdir -p $$(dirname $$OUTPUT_SRC_H) $$(dirname $$OUTPUT_CXX_H)
+        cp $$RUST_LIB $$OUTPUT_LIB || (echo "Failed to copy $$RUST_LIB to $$OUTPUT_LIB" >&2; exit 1)
+        cp $$RUST_BRIDGE_DIR/lib.rs.cc $$OUTPUT_CC || (echo "Failed to copy $$RUST_BRIDGE_DIR/lib.rs.cc to $$OUTPUT_CC" >&2; exit 1)
+        cp $$RUST_BRIDGE_DIR/lib.rs.h $$OUTPUT_H || (echo "Failed to copy $$RUST_BRIDGE_DIR/lib.rs.h to $$OUTPUT_H" >&2; exit 1)
+        cp $$RUST_BRIDGE_DIR/lib.rs.h $$OUTPUT_SRC_H || (echo "Failed to copy $$RUST_BRIDGE_DIR/lib.rs.h to $$OUTPUT_SRC_H" >&2; exit 1)
+        CXX_H_SOURCE=$$CARGO_TARGET_DIR/cxxbridge/rust/cxx.h
+        if [ ! -f $$CXX_H_SOURCE ] && [ ! -L $$CXX_H_SOURCE ]; then
+            echo "Error: cxx.h not found at $$CXX_H_SOURCE" >&2
+            exit 1
+        fi
+        cp -L $$CXX_H_SOURCE $$OUTPUT_CXX_H || (echo "Failed to copy $$CXX_H_SOURCE to $$OUTPUT_CXX_H" >&2; exit 1)
+    """,
+    message = "Building Rust library (release) with cargo...",
+    local = 1,
+)
+
+filegroup(
+    name = "lib_rs_h_selected",
+    srcs = select({
+        ":debug_mode": [":src/lib.rs_debug.h"],
+        ":fastbuild_mode": [":src/lib.rs_debug.h"],
+        ":release_mode": [":src/lib.rs_release.h"],
+    }),
+)
+
+genrule(
+    name = "lib_rs_h_unified",
+    srcs = [":lib_rs_h_selected"],
+    outs = ["src/lib.rs.h"],
+    cmd = "cp $(location :lib_rs_h_selected) $(location src/lib.rs.h)",
+    message = "Unifying lib.rs.h for C++ includes",
+)
+
+filegroup(
+    name = "rust_bridge_cc_selected",
+    srcs = select({
+        ":debug_mode": [":rust_bridge_cc_debug.cc"],
+        ":fastbuild_mode": [":rust_bridge_cc_debug.cc"],
+        ":release_mode": [":rust_bridge_cc_release.cc"],
+    }),
+)
+
+genrule(
+    name = "rust_bridge_cc_unified",
+    srcs = [":rust_bridge_cc_selected"],
+    outs = ["rust_bridge_cc.cc"],
+    cmd = "cp $(location :rust_bridge_cc_selected) $(location rust_bridge_cc.cc)",
+    message = "Unifying rust_bridge_cc.cc for C++ compilation",
+)
+
+filegroup(
+    name = "rust_bridge_h_selected",
+    srcs = select({
+        ":debug_mode": [":rust_bridge_h_debug.h"],
+        ":fastbuild_mode": [":rust_bridge_h_debug.h"],
+        ":release_mode": [":rust_bridge_h_release.h"],
+    }),
+)
+
+genrule(
+    name = "rust_bridge_h_unified",
+    srcs = [":rust_bridge_h_selected"],
+    outs = ["rust_bridge_h.h"],
+    cmd = "cp $(location :rust_bridge_h_selected) $(location rust_bridge_h.h)",
+    message = "Unifying rust_bridge_h.h for C++ includes",
+)
+
+filegroup(
+    name = "cxx_h_selected",
+    srcs = select({
+        ":debug_mode": [":cxxbridge/rust/cxx_debug.h"],
+        ":fastbuild_mode": [":cxxbridge/rust/cxx_debug.h"],
+        ":release_mode": [":cxxbridge/rust/cxx_release.h"],
+    }),
+)
+
+genrule(
+    name = "cxx_h_unified",
+    srcs = [":cxx_h_selected"],
+    outs = ["cxxbridge/rust/cxx.h"],
+    cmd = "mkdir -p $$(dirname $(location cxxbridge/rust/cxx.h)) && cp $(location :cxx_h_selected) $(location cxxbridge/rust/cxx.h)",
+    message = "Unifying cxx.h for C++ includes",
+)
+
+cc_import(
+    name = "rust_lib",
+    static_library = select({
+        ":debug_mode": ":rust_lib_debug.a",
+        ":fastbuild_mode": ":rust_lib_debug.a",
+        ":release_mode": ":rust_lib_release.a",
+    }),
+    alwayslink = True,
+)
+
+cc_library(
+    name = "fluss_cpp",
+    srcs = [
+        "src/admin.cpp",
+        "src/connection.cpp",
+        "src/table.cpp",
+        ":rust_bridge_cc_unified",
+    ],
+    hdrs = [
+        "include/fluss.hpp",
+    ],
+    textual_hdrs = [
+        "src/ffi_converter.hpp",
+        ":rust_bridge_h_unified",
+        ":lib_rs_h_unified",
+        ":cxx_h_unified",
+    ],
+    strip_include_prefix = "include",
+    copts = [
+        "-std=c++17",
+    ] + select({
+        ":debug_mode": [
+            "-g3",
+            "-O0",
+            "-ggdb",
+            "-fno-omit-frame-pointer",
+            "-DDEBUG",
+        ],
+        ":fastbuild_mode": [
+            "-g",
+            "-O0",
+        ],
+        ":release_mode": [
+            "-O2",
+            "-DNDEBUG",
+        ],
+    }),
+    includes = [
+        "src",
+        "cxxbridge",
+    ],
+    linkopts = [
+        "-ldl",
+        "-lpthread",
+    ] + select({
+        ":debug_mode": ["-g"],
+        ":fastbuild_mode": ["-g"],
+        ":release_mode": [],
+    }) + select({
+        "@platforms//os:macos": [
+            "-framework", "CoreFoundation",
+            "-framework", "Security",
+        ],
+        "//conditions:default": [],
+    }),
+    deps = [
+        ":rust_lib",
+    ],
+    visibility = ["//visibility:public"],
+)
+
+cc_binary(
+    name = "fluss_cpp_example",
+    srcs = [
+        "examples/example.cpp",
+    ],
+    deps = [":fluss_cpp"],
+    copts = [
+        "-std=c++17",
+    ] + select({
+        ":debug_mode": [
+            "-g3",
+            "-O0",
+            "-ggdb",
+            "-fno-omit-frame-pointer",
+            "-DDEBUG",
+        ],
+        ":fastbuild_mode": [
+            "-g",
+            "-O0",
+        ],
+        ":release_mode": [
+            "-O2",
+            "-DNDEBUG",
+        ],
+    }),
+    linkopts = select({
+        ":debug_mode": ["-g"],
+        ":fastbuild_mode": ["-g"],
+        ":release_mode": [],
+    }),
+    visibility = ["//visibility:public"],
+)
+
diff --git a/fluss-rust/bindings/cpp/MODULE.bazel b/fluss-rust/bindings/cpp/MODULE.bazel
new file mode 100644
index 0000000000..f75d3e6f69
--- /dev/null
+++ b/fluss-rust/bindings/cpp/MODULE.bazel
@@ -0,0 +1,23 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+module(
+    name = "fluss_cpp",
+)
+
+bazel_dep(name = "rules_cc", version = "0.0.17")
+bazel_dep(name = "platforms", version = "0.0.10")
diff --git a/fluss-rust/bindings/cpp/ci.sh b/fluss-rust/bindings/cpp/ci.sh
new file mode 100755
index 0000000000..b5eb9676b6
--- /dev/null
+++ b/fluss-rust/bindings/cpp/ci.sh
@@ -0,0 +1,100 @@
+#!/bin/bash
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+set -xe 
+
+DIR="$(cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd)"
+
+# Set Bazel output base to bazel-build directory
+# This ensures all Bazel outputs are in bazel-build/.bazel-output-base
+BAZEL_OUTPUT_BASE="$DIR/bazel-build/.bazel-output-base"
+
+# Create output base directory if it doesn't exist
+mkdir -p "$BAZEL_OUTPUT_BASE"
+
+# Wrapper function to run bazel with --output_base
+bazel() {
+    command bazel --output_base="$BAZEL_OUTPUT_BASE" "$@"
+}
+
+compile() {
+    bazel build //:fluss_cpp
+}
+
+build_example() {
+    bazel build //:fluss_cpp_example
+}
+
+run_example() {
+    build_example
+    bazel run //:fluss_cpp_example
+}
+
+clean() {
+    bazel clean
+    # Remove bazel-* symlinks (Bazel automatically creates these)
+    rm -f "$DIR"/bazel-*
+    # Also remove the bazel-build directory if it exists
+    if [ -d "$DIR/bazel-build" ]; then
+        rm -rf "$DIR/bazel-build"
+    fi
+    echo "Cleaned all Bazel outputs and symlinks"
+}
+
+show_outputs() {
+    echo "=== Library outputs ==="
+    bazel cquery //:fluss_cpp --output=files 2>/dev/null || echo "Run 'bazel build //:fluss_cpp' first"
+    echo ""
+    echo "=== Example binary outputs ==="
+    bazel cquery //:fluss_cpp_example --output=files 2>/dev/null || echo "Run 'bazel build //:fluss_cpp_example' first"
+    echo ""
+    echo "=== To run the example ==="
+    echo "  bazel run //:fluss_cpp_example"
+    echo ""
+    echo "=== To find outputs manually ==="
+    echo "  bazel info bazel-bin"
+}
+
+case $1 in 
+    compile )
+        compile
+        ;;
+    example )
+        build_example
+        ;;
+    run )
+        run_example
+        ;;
+    outputs )
+        show_outputs
+        ;;
+    clean )
+        clean
+        ;;
+    * )
+        echo "Usage: $0 {compile|example|run|outputs|clean}"
+        echo ""
+        echo "Commands:"
+        echo "  compile  - Build the fluss_cpp library"
+        echo "  example  - Build the example binary"
+        echo "  run      - Build and run the example binary"
+        echo "  outputs  - Show the location of build outputs"
+        echo "  clean    - Clean all Bazel outputs"
+        exit 1
+        ;;
+esac

From 9f834df90aa76b01849063ff302504e13ebea824 Mon Sep 17 00:00:00 2001
From: Kelvin Wu <kelvinyu1117@gmail.com>
Date: Sat, 3 Jan 2026 14:45:54 +0800
Subject: [PATCH 049/287] feat: implement CompactedRowWriter (#121)

---
 .../src/row/compacted/compacted_row_writer.rs | 153 ++++++++++++++++++
 .../crates/fluss/src/row/compacted/mod.rs     |   1 +
 fluss-rust/crates/fluss/src/row/mod.rs        |   2 +
 3 files changed, 156 insertions(+)
 create mode 100644 fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/compacted/mod.rs

diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
new file mode 100644
index 0000000000..7c0addef34
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -0,0 +1,153 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use bytes::{Bytes, BytesMut};
+use std::cmp;
+
+// Writer for CompactedRow
+// Reference implementation:
+// https://github.com/apache/fluss/blob/d4a72fad240d4b81563aaf83fa3b09b5058674ed/fluss-common/src/main/java/org/apache/fluss/row/compacted/CompactedRowWriter.java#L71
+pub struct CompactedRowWriter {
+    header_size_in_bytes: usize,
+    position: usize,
+    buffer: BytesMut,
+}
+
+impl CompactedRowWriter {
+    pub const MAX_INT_SIZE: usize = 5;
+    pub const MAX_LONG_SIZE: usize = 10;
+
+    pub fn new(field_count: usize) -> Self {
+        // bitset width in bytes, it should be in CompactedRow
+        let header_size = (field_count + 7) / 8;
+        let cap = cmp::max(64, header_size);
+
+        let mut buffer = BytesMut::with_capacity(cap);
+        buffer.resize(cap, 0);
+
+        Self {
+            header_size_in_bytes: header_size,
+            position: header_size,
+            buffer,
+        }
+    }
+
+    pub fn reset(&mut self) {
+        self.position = self.header_size_in_bytes;
+        self.buffer[..self.header_size_in_bytes].fill(0);
+    }
+
+    pub fn position(&self) -> usize {
+        self.position
+    }
+
+    pub fn buffer(&self) -> &[u8] {
+        &self.buffer[..self.position]
+    }
+
+    pub fn to_bytes(&self) -> Bytes {
+        Bytes::copy_from_slice(&self.buffer[..self.position])
+    }
+
+    fn ensure_capacity(&mut self, need_len: usize) {
+        if (self.buffer.len() - self.position) < need_len {
+            let new_len = cmp::max(self.buffer.len() * 2, self.buffer.len() + need_len);
+            self.buffer.resize(new_len, 0);
+        }
+    }
+
+    fn write_raw(&mut self, src: &[u8]) {
+        let end = self.position + src.len();
+        self.ensure_capacity(src.len());
+        self.buffer[self.position..end].copy_from_slice(src);
+        self.position = end;
+    }
+
+    pub fn set_null_at(&mut self, pos: usize) {
+        let byte_index = pos >> 3;
+        let bit = pos & 7;
+        debug_assert!(byte_index < self.header_size_in_bytes);
+        self.buffer[byte_index] |= 1u8 << bit;
+    }
+
+    pub fn write_boolean(&mut self, value: bool) {
+        let b = if value { 1u8 } else { 0u8 };
+        self.write_raw(&[b]);
+    }
+
+    pub fn write_byte(&mut self, value: u8) {
+        self.write_raw(&[value as u8]);
+    }
+
+    pub fn write_binary(&mut self, bytes: &[u8], length: usize) {
+        // TODO: currently, we encoding BINARY(length) as the same with BYTES, the length info can
+        //  be omitted and the bytes length should be enforced in the future.
+        self.write_bytes(&bytes[..length.min(bytes.len())]);
+    }
+
+    pub fn write_bytes(&mut self, value: &[u8]) {
+        let len_i32 =
+            i32::try_from(value.len()).expect("byte slice too large to encode length as i32");
+        self.write_int(len_i32);
+        self.write_raw(value);
+    }
+
+    pub fn write_char(&mut self, value: &str, length: usize) {
+        // TODO: currently, we encoding CHAR(length) as the same with STRING, the length info can be
+        //  omitted and the bytes length should be enforced in the future.
+        self.write_string(value);
+    }
+
+    pub fn write_string(&mut self, value: &str) {
+        self.write_bytes(value.as_ref());
+    }
+
+    pub fn write_short(&mut self, value: i16) {
+        self.write_raw(&value.to_ne_bytes());
+    }
+
+    pub fn write_int(&mut self, value: i32) {
+        self.ensure_capacity(Self::MAX_INT_SIZE);
+        let mut v = value as u32;
+        while (v & !0x7F) != 0 {
+            self.buffer[self.position] = ((v as u8) & 0x7F) | 0x80;
+            self.position += 1;
+            v >>= 7;
+        }
+        self.buffer[self.position] = v as u8;
+        self.position += 1;
+    }
+    pub fn write_long(&mut self, value: i64) {
+        self.ensure_capacity(Self::MAX_LONG_SIZE);
+        let mut v = value as u64;
+        while (v & !0x7F) != 0 {
+            self.buffer[self.position] = ((v as u8) & 0x7F) | 0x80;
+            self.position += 1;
+            v >>= 7;
+        }
+        self.buffer[self.position] = v as u8;
+        self.position += 1;
+    }
+
+    pub fn write_float(&mut self, value: f32) {
+        self.write_raw(&value.to_ne_bytes());
+    }
+
+    pub fn write_double(&mut self, value: f64) {
+        self.write_raw(&value.to_ne_bytes());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/compacted/mod.rs b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
new file mode 100644
index 0000000000..b9bc66b5cb
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
@@ -0,0 +1 @@
+mod compacted_row_writer;
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 01b89fc9f4..86fdf90c98 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -19,6 +19,8 @@ mod column;
 
 mod datum;
 
+mod compacted;
+
 pub use column::*;
 pub use datum::*;
 

From 83c452563fabe07f53b596ecadd353fed1136ab7 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sat, 3 Jan 2026 15:07:55 +0800
Subject: [PATCH 050/287] chore: add license header to fix ci (#123)

---
 .../src/row/compacted/compacted_row_writer.rs   |  8 +++++---
 .../crates/fluss/src/row/compacted/mod.rs       | 17 +++++++++++++++++
 2 files changed, 22 insertions(+), 3 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
index 7c0addef34..2debab19ae 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -21,19 +21,21 @@ use std::cmp;
 // Writer for CompactedRow
 // Reference implementation:
 // https://github.com/apache/fluss/blob/d4a72fad240d4b81563aaf83fa3b09b5058674ed/fluss-common/src/main/java/org/apache/fluss/row/compacted/CompactedRowWriter.java#L71
+#[allow(dead_code)]
 pub struct CompactedRowWriter {
     header_size_in_bytes: usize,
     position: usize,
     buffer: BytesMut,
 }
 
+#[allow(dead_code)]
 impl CompactedRowWriter {
     pub const MAX_INT_SIZE: usize = 5;
     pub const MAX_LONG_SIZE: usize = 10;
 
     pub fn new(field_count: usize) -> Self {
         // bitset width in bytes, it should be in CompactedRow
-        let header_size = (field_count + 7) / 8;
+        let header_size = field_count.div_ceil(8);
         let cap = cmp::max(64, header_size);
 
         let mut buffer = BytesMut::with_capacity(cap);
@@ -90,7 +92,7 @@ impl CompactedRowWriter {
     }
 
     pub fn write_byte(&mut self, value: u8) {
-        self.write_raw(&[value as u8]);
+        self.write_raw(&[value]);
     }
 
     pub fn write_binary(&mut self, bytes: &[u8], length: usize) {
@@ -106,7 +108,7 @@ impl CompactedRowWriter {
         self.write_raw(value);
     }
 
-    pub fn write_char(&mut self, value: &str, length: usize) {
+    pub fn write_char(&mut self, value: &str, _length: usize) {
         // TODO: currently, we encoding CHAR(length) as the same with STRING, the length info can be
         //  omitted and the bytes length should be enforced in the future.
         self.write_string(value);
diff --git a/fluss-rust/crates/fluss/src/row/compacted/mod.rs b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
index b9bc66b5cb..695cdad988 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
@@ -1 +1,18 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
 mod compacted_row_writer;

From 526d360f4420151ee99e78d7f5965c58c86c9345 Mon Sep 17 00:00:00 2001
From: Arnav_Panjla <146819303+Arnav-panjla@users.noreply.github.com>
Date: Tue, 6 Jan 2026 11:38:02 +0530
Subject: [PATCH 051/287] feat: return error for partitioned tables in
 FlussConnection#get_table (#115)

---
 fluss-rust/crates/fluss/src/client/connection.rs | 5 +++++
 fluss-rust/crates/fluss/src/error.rs             | 6 ++++++
 2 files changed, 11 insertions(+)

diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 899ad597c1..595daf55f5 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -77,6 +77,11 @@ impl FlussConnection {
     pub async fn get_table(&self, table_path: &TablePath) -> Result<FlussTable<'_>> {
         self.metadata.update_table_metadata(table_path).await?;
         let table_info = self.metadata.get_cluster().get_table(table_path).clone();
+        if table_info.is_partitioned() {
+            return Err(crate::error::Error::UnsupportedOperation {
+                message: "Partitioned tables are not supported".to_string(),
+            });
+        }
         Ok(FlussTable::new(self, self.metadata.clone(), table_info))
     }
 }
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index 0f4b1b6d11..e04fde14d7 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -98,6 +98,12 @@ pub enum Error {
     )]
     IoUnsupported { message: String },
 
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting unsupported operation error {}.", message)
+    )]
+    UnsupportedOperation { message: String },
+
     #[snafu(
         visibility(pub(crate)),
         display("Fluss hitting leader not available error {}.", message)

From 49c3043329c74eec947dc6602688b28b30557517 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Wed, 7 Jan 2026 13:50:27 +0800
Subject: [PATCH 052/287] chore: fix append hang issue (#126)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

---------

Co-authored-by: 赵海源 <zhaohaiyuan@xiaohongshu.com>
---
 .../fluss/src/client/write/accumulator.rs     | 50 ++++++++++---------
 1 file changed, 26 insertions(+), 24 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 215adbe695..beae0caacc 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -299,34 +299,36 @@ impl RecordAccumulator {
                     .batches
                     .get(&table_bucket.bucket_id())
                 {
-                    let mut batch = {
+                    let mut maybe_batch = None;
+                    {
                         let mut batch_lock = deque.lock().await;
-                        if batch_lock.is_empty() {
-                            continue;
+                        if !batch_lock.is_empty() {
+                            let first_batch = batch_lock.front().unwrap();
+
+                            if size + first_batch.estimated_size_in_bytes() > max_size as i64
+                                && !ready.is_empty()
+                            {
+                                // there is a rare case that a single batch size is larger than the request size
+                                // due to compression; in this case we will still eventually send this batch in
+                                // a single request.
+                                break;
+                            }
+
+                            maybe_batch = Some(batch_lock.pop_front().unwrap());
                         }
-                        let first_batch = batch_lock.front().unwrap();
-
-                        if size + first_batch.estimated_size_in_bytes() > max_size as i64
-                            && !ready.is_empty()
-                        {
-                            // there is a rare case that a single batch size is larger than the request size
-                            // due to compression; in this case we will still eventually send this batch in
-                            // a single request.
-                            break;
-                        }
-
-                        batch_lock.pop_front().unwrap()
-                    };
+                    }
 
-                    let current_batch_size = batch.estimated_size_in_bytes();
-                    size += current_batch_size;
+                    if let Some(mut batch) = maybe_batch {
+                        let current_batch_size = batch.estimated_size_in_bytes();
+                        size += current_batch_size;
 
-                    // mark the batch as drained.
-                    batch.drained(current_time_ms());
-                    ready.push(Arc::new(ReadyWriteBatch {
-                        table_bucket,
-                        write_batch: batch,
-                    }));
+                        // mark the batch as drained.
+                        batch.drained(current_time_ms());
+                        ready.push(Arc::new(ReadyWriteBatch {
+                            table_bucket,
+                            write_batch: batch,
+                        }));
+                    }
                 }
             }
             if current_index == start {

From 6459f2cdbda3079ed75db1e3f9094655a43c84fb Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Fri, 9 Jan 2026 12:16:17 +0000
Subject: [PATCH 053/287] chore: Fix scanner's example documentation test to
 allow `cargo test --release` to complete (#129)

---
 .../crates/fluss/src/client/table/scanner.rs  | 86 ++++++++++++++++++-
 1 file changed, 84 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 0acaac890f..4255bb6841 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -73,7 +73,49 @@ impl<'a> TableScan<'a> {
     ///
     /// # Example
     /// ```
-    /// let scanner = table.new_scan().project(&[0, 2, 3])?.create_log_scanner();
+    /// # use fluss::client::FlussConnection;
+    /// # use fluss::config::Config;
+    /// # use fluss::error::Result;
+    /// # use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+    /// # use fluss::row::InternalRow;
+    /// # use std::time::Duration;
+    ///
+    /// # pub async fn example() -> Result<()> {
+    ///     let mut config = Config::default();
+    ///     config.bootstrap_server = Some("127.0.0.1:9123".to_string());
+    ///     let conn = FlussConnection::new(config).await?;
+    ///
+    ///     let table_descriptor = TableDescriptor::builder()
+    ///         .schema(
+    ///             Schema::builder()
+    ///                 .column("col1", DataTypes::int())
+    ///                 .column("col2", DataTypes::string())
+    ///                 .column("col3", DataTypes::string())
+    ///                 .column("col4", DataTypes::string())
+    ///             .build()?,
+    ///         ).build()?;
+    ///     let table_path = TablePath::new("fluss".to_owned(), "rust_test_long".to_owned());
+    ///     let admin = conn.get_admin().await?;
+    ///     admin.create_table(&table_path, &table_descriptor, true)
+    ///         .await?;
+    ///     let table_info = admin.get_table(&table_path).await?;
+    ///     let table = conn.get_table(&table_path).await?;
+    ///
+    ///     // Project columns by indices
+    ///     let scanner = table.new_scan().project(&[0, 2, 3])?.create_log_scanner()?;
+    ///     let scan_records = scanner.poll(Duration::from_secs(10)).await?;
+    ///     for record in scan_records {
+    ///         let row = record.row();
+    ///         println!(
+    ///             "{{{}, {}, {}}}@{}",
+    ///             row.get_int(0),
+    ///             row.get_string(2),
+    ///             row.get_string(3),
+    ///             record.offset()
+    ///         );
+    ///     }
+    ///     # Ok(())
+    /// # }
     /// ```
     pub fn project(mut self, column_indices: &[usize]) -> Result<Self> {
         if column_indices.is_empty() {
@@ -107,7 +149,47 @@ impl<'a> TableScan<'a> {
     ///
     /// # Example
     /// ```
-    /// let scanner = table.new_scan().project_by_name(&["col1", "col3"])?.create_log_scanner();
+    /// # use fluss::client::FlussConnection;
+    /// # use fluss::config::Config;
+    /// # use fluss::error::Result;
+    /// # use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+    /// # use fluss::row::InternalRow;
+    /// # use std::time::Duration;
+    ///
+    /// # pub async fn example() -> Result<()> {
+    ///     let mut config = Config::default();
+    ///     config.bootstrap_server = Some("127.0.0.1:9123".to_string());
+    ///     let conn = FlussConnection::new(config).await?;
+    ///
+    ///     let table_descriptor = TableDescriptor::builder()
+    ///         .schema(
+    ///             Schema::builder()
+    ///                 .column("col1", DataTypes::int())
+    ///                 .column("col2", DataTypes::string())
+    ///                 .column("col3", DataTypes::string())
+    ///             .build()?,
+    ///         ).build()?;
+    ///     let table_path = TablePath::new("fluss".to_owned(), "rust_test_long".to_owned());
+    ///     let admin = conn.get_admin().await?;
+    ///     admin.create_table(&table_path, &table_descriptor, true)
+    ///         .await?;
+    ///     let table_info = admin.get_table(&table_path).await?;
+    ///     let table = conn.get_table(&table_path).await?;
+    ///
+    ///     // Project columns by column names
+    ///     let scanner = table.new_scan().project_by_name(&["col1", "col3"])?.create_log_scanner()?;
+    ///     let scan_records = scanner.poll(Duration::from_secs(10)).await?;
+    ///     for record in scan_records {
+    ///         let row = record.row();
+    ///         println!(
+    ///             "{{{}, {}}}@{}",
+    ///             row.get_int(0),
+    ///             row.get_string(1),
+    ///             record.offset()
+    ///         );
+    ///     }
+    ///     # Ok(())
+    /// # }
     /// ```
     pub fn project_by_name(mut self, column_names: &[&str]) -> Result<Self> {
         if column_names.is_empty() {

From 305a448736a6121a50b7855893de2d5c89f1e873 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Fri, 9 Jan 2026 12:56:59 +0000
Subject: [PATCH 054/287] feat:  introduce CompactedKeyEncoder (#124)

---
 fluss-rust/crates/fluss/Cargo.toml            |   1 +
 .../crates/fluss/src/metadata/datatype.rs     |  30 ++
 .../fluss/src/row/binary/binary_writer.rs     | 210 +++++++++++
 fluss-rust/crates/fluss/src/row/binary/mod.rs |  28 ++
 .../src/row/compacted/compacted_key_writer.rs |  97 ++++++
 .../crates/fluss/src/row/compacted/mod.rs     |   3 +
 fluss-rust/crates/fluss/src/row/datum.rs      |  10 +
 .../src/row/encode/compacted_key_encoder.rs   | 329 ++++++++++++++++++
 fluss-rust/crates/fluss/src/row/encode/mod.rs |  64 ++++
 .../crates/fluss/src/row/field_getter.rs      | 116 ++++++
 fluss-rust/crates/fluss/src/row/mod.rs        |   9 +
 11 files changed, 897 insertions(+)
 create mode 100644 fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/binary/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/encode/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/field_getter.rs

diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 27604eecd8..e8c851f7b7 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -59,6 +59,7 @@ uuid = { version = "1.10", features = ["v4"] }
 tempfile = "3.23.0"
 snafu = "0.8.3"
 scopeguard = "1.2.0"
+delegate = "0.13.5"
 
 [target.'cfg(target_arch = "wasm32")'.dependencies]
 jiff = { workspace = true, features = ["js"] }
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 8ad4f7e569..e5ccb9a8e9 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -852,6 +852,36 @@ impl RowType {
     pub fn fields(&self) -> &Vec<DataField> {
         &self.fields
     }
+
+    pub fn get_field_index(&self, field_name: &str) -> Option<usize> {
+        self.fields.iter().position(|f| f.name == field_name)
+    }
+
+    #[cfg(test)]
+    pub fn with_data_types(data_types: Vec<DataType>) -> Self {
+        let mut fields: Vec<DataField> = Vec::new();
+        data_types.iter().enumerate().for_each(|(idx, data_type)| {
+            fields.push(DataField::new(format!("f{}", idx), data_type.clone(), None));
+        });
+
+        Self::with_nullable(true, fields)
+    }
+
+    #[cfg(test)]
+    pub fn with_data_types_and_field_names(
+        data_types: Vec<DataType>,
+        field_names: Vec<&str>,
+    ) -> Self {
+        let fields = data_types
+            .into_iter()
+            .zip(field_names)
+            .map(|(data_type, field_name)| {
+                DataField::new(field_name.to_string(), data_type.clone(), None)
+            })
+            .collect::<Vec<_>>();
+
+        Self::with_nullable(true, fields)
+    }
 }
 
 impl Display for RowType {
diff --git a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
new file mode 100644
index 0000000000..a296777a30
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
@@ -0,0 +1,210 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::DataType;
+use crate::row::Datum;
+use crate::row::binary::BinaryRowFormat;
+
+/// Writer to write a composite data format, such as a row or an array.
+#[allow(dead_code)]
+pub trait BinaryWriter {
+    /// Reset writer to prepare next write
+    fn reset(&mut self);
+
+    /// Set null to this field
+    fn set_null_at(&mut self, pos: usize);
+
+    fn write_boolean(&mut self, value: bool);
+
+    fn write_byte(&mut self, value: u8);
+
+    fn write_bytes(&mut self, value: &[u8]);
+
+    fn write_char(&mut self, value: &str, length: usize);
+
+    fn write_string(&mut self, value: &str);
+
+    fn write_short(&mut self, value: i16);
+
+    fn write_int(&mut self, value: i32);
+
+    fn write_long(&mut self, value: i64);
+
+    fn write_float(&mut self, value: f32);
+
+    fn write_double(&mut self, value: f64);
+
+    fn write_binary(&mut self, bytes: &[u8], length: usize);
+
+    // TODO Decimal type
+    // fn write_decimal(&mut self, pos: i32, value: f64);
+
+    // TODO Timestamp type
+    // fn write_timestamp_ntz(&mut self, pos: i32, value: i64);
+
+    // TODO Timestamp type
+    // fn write_timestamp_ltz(&mut self, pos: i32, value: i64);
+
+    // TODO InternalArray, ArraySerializer
+    // fn write_array(&mut self, pos: i32, value: i64);
+
+    // TODO Row serializer
+    // fn write_row(&mut self, pos: i32, value: &InternalRow);
+
+    /// Finally, complete write to set real size to binary.
+    fn complete(&mut self);
+}
+
+pub enum ValueWriter {
+    Nullable(InnerValueWriter),
+    NonNullable(InnerValueWriter),
+}
+
+impl ValueWriter {
+    pub fn create_value_writer(
+        element_type: &DataType,
+        binary_row_format: Option<&BinaryRowFormat>,
+    ) -> Result<ValueWriter> {
+        let value_writer =
+            InnerValueWriter::create_inner_value_writer(element_type, binary_row_format)?;
+        if element_type.is_nullable() {
+            Ok(Self::Nullable(value_writer))
+        } else {
+            Ok(Self::NonNullable(value_writer))
+        }
+    }
+
+    pub fn write_value<W: BinaryWriter>(
+        &self,
+        writer: &mut W,
+        pos: usize,
+        value: &Datum,
+    ) -> Result<()> {
+        match self {
+            Self::Nullable(inner_value_writer) => {
+                if let Datum::Null = value {
+                    writer.set_null_at(pos);
+                    Ok(())
+                } else {
+                    inner_value_writer.write_value(writer, pos, value)
+                }
+            }
+            Self::NonNullable(inner_value_writer) => {
+                inner_value_writer.write_value(writer, pos, value)
+            }
+        }
+    }
+}
+
+#[derive(Debug)]
+pub enum InnerValueWriter {
+    Char,
+    String,
+    Boolean,
+    Binary,
+    Bytes,
+    TinyInt,
+    SmallInt,
+    Int,
+    BigInt,
+    Float,
+    Double,
+    // TODO Decimal, Date, TimeWithoutTimeZone, TimestampWithoutTimeZone, TimestampWithLocalTimeZone, Array, Row
+}
+
+/// Accessor for writing the fields/elements of a binary writer at runtime; the
+/// fields/elements must be written in order.
+impl InnerValueWriter {
+    pub fn create_inner_value_writer(
+        data_type: &DataType,
+        _: Option<&BinaryRowFormat>,
+    ) -> Result<InnerValueWriter> {
+        match data_type {
+            DataType::Char(_) => Ok(InnerValueWriter::Char),
+            DataType::String(_) => Ok(InnerValueWriter::String),
+            DataType::Boolean(_) => Ok(InnerValueWriter::Boolean),
+            DataType::Binary(_) => Ok(InnerValueWriter::Binary),
+            DataType::Bytes(_) => Ok(InnerValueWriter::Bytes),
+            DataType::TinyInt(_) => Ok(InnerValueWriter::TinyInt),
+            DataType::SmallInt(_) => Ok(InnerValueWriter::SmallInt),
+            DataType::Int(_) => Ok(InnerValueWriter::Int),
+            DataType::BigInt(_) => Ok(InnerValueWriter::BigInt),
+            DataType::Float(_) => Ok(InnerValueWriter::Float),
+            DataType::Double(_) => Ok(InnerValueWriter::Double),
+            _ => unimplemented!(
+                "ValueWriter for DataType {:?} is currently not implemented",
+                data_type
+            ),
+        }
+    }
+    pub fn write_value<W: BinaryWriter>(
+        &self,
+        writer: &mut W,
+        _pos: usize,
+        value: &Datum,
+    ) -> Result<()> {
+        match (self, value) {
+            (InnerValueWriter::Char, Datum::String(v)) => {
+                writer.write_char(v, v.len());
+            }
+            (InnerValueWriter::String, Datum::String(v)) => {
+                writer.write_string(v);
+            }
+            (InnerValueWriter::Boolean, Datum::Bool(v)) => {
+                writer.write_boolean(*v);
+            }
+            (InnerValueWriter::Binary, Datum::Blob(v)) => {
+                writer.write_binary(v.as_ref(), v.len());
+            }
+            (InnerValueWriter::Binary, Datum::BorrowedBlob(v)) => {
+                writer.write_binary(v.as_ref(), v.len());
+            }
+            (InnerValueWriter::Bytes, Datum::Blob(v)) => {
+                writer.write_bytes(v.as_ref());
+            }
+            (InnerValueWriter::Bytes, Datum::BorrowedBlob(v)) => {
+                writer.write_bytes(v.as_ref());
+            }
+            (InnerValueWriter::TinyInt, Datum::Int8(v)) => {
+                writer.write_byte(*v as u8);
+            }
+            (InnerValueWriter::SmallInt, Datum::Int16(v)) => {
+                writer.write_short(*v);
+            }
+            (InnerValueWriter::Int, Datum::Int32(v)) => {
+                writer.write_int(*v);
+            }
+            (InnerValueWriter::BigInt, Datum::Int64(v)) => {
+                writer.write_long(*v);
+            }
+            (InnerValueWriter::Float, Datum::Float32(v)) => {
+                writer.write_float(v.into_inner());
+            }
+            (InnerValueWriter::Double, Datum::Float64(v)) => {
+                writer.write_double(v.into_inner());
+            }
+            _ => {
+                return Err(IllegalArgument {
+                    message: format!("{:?} used to write value {:?}", self, value),
+                });
+            }
+        }
+        Ok(())
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/binary/mod.rs b/fluss-rust/crates/fluss/src/row/binary/mod.rs
new file mode 100644
index 0000000000..c31cbd59c1
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/binary/mod.rs
@@ -0,0 +1,28 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+mod binary_writer;
+
+pub use binary_writer::*;
+
+/// The binary row format types; each indicates the kind of [`BinaryRow`] generated by the [`BinaryWriter`].
+#[allow(dead_code)]
+pub enum BinaryRowFormat {
+    Compacted,
+    Aligned,
+    Indexed,
+}
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
new file mode 100644
index 0000000000..84a6b22724
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
@@ -0,0 +1,97 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
+use bytes::Bytes;
+
+use crate::error::Result;
+use crate::metadata::DataType;
+use crate::row::binary::{BinaryRowFormat, BinaryWriter, ValueWriter};
+use delegate::delegate;
+
+/// A wrapper around [`CompactedRowWriter`] used to encode key columns.
+/// The encoding is the same as [`CompactedRowWriter`], but without the header of null bits that
+/// indicates whether each field value is null, since key columns must not be null.
+pub struct CompactedKeyWriter {
+    delegate: CompactedRowWriter,
+}
+
+impl CompactedKeyWriter {
+    pub fn new() -> CompactedKeyWriter {
+        CompactedKeyWriter {
+            // in the compacted key encoder, we don't need to set null bits because key columns must
+            // not be null, so we init with field count 0 to make the null bits 0
+            delegate: CompactedRowWriter::new(0),
+        }
+    }
+
+    pub fn create_value_writer(field_type: &DataType) -> Result<ValueWriter> {
+        ValueWriter::create_value_writer(field_type, Some(&BinaryRowFormat::Compacted))
+    }
+
+    delegate! {
+        to self.delegate {
+            pub fn reset(&mut self);
+
+            #[allow(dead_code)]
+            pub fn position(&self) -> usize;
+
+            #[allow(dead_code)]
+            pub fn buffer(&self) -> &[u8];
+
+            pub fn to_bytes(&self) -> Bytes;
+        }
+    }
+}
+
+impl BinaryWriter for CompactedKeyWriter {
+    delegate! {
+        to self.delegate {
+            fn reset(&mut self);
+
+            fn set_null_at(&mut self, pos: usize);
+
+            fn write_boolean(&mut self, value: bool);
+
+            fn write_byte(&mut self, value: u8);
+
+            fn write_binary(&mut self, bytes: &[u8], length: usize);
+
+            fn write_bytes(&mut self, value: &[u8]);
+
+            fn write_char(&mut self, value: &str, _length: usize);
+
+            fn write_string(&mut self, value: &str);
+
+            fn write_short(&mut self, value: i16);
+
+            fn write_int(&mut self, value: i32);
+
+            fn write_long(&mut self, value: i64);
+
+            fn write_float(&mut self, value: f32);
+
+            fn write_double(&mut self, value: f64);
+
+
+        }
+    }
+
+    fn complete(&mut self) {
+        // do nothing
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/compacted/mod.rs b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
index 695cdad988..c81eb5a50b 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
@@ -15,4 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
+mod compacted_key_writer;
 mod compacted_row_writer;
+
+pub use compacted_key_writer::CompactedKeyWriter;
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 1ea393349e..28a378fd56 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -55,6 +55,8 @@ pub enum Datum<'a> {
     String(&'a str),
     #[display("{0}")]
     Blob(Blob),
+    #[display("{:?}")]
+    BorrowedBlob(&'a [u8]),
     #[display("{0}")]
     Decimal(Decimal),
     #[display("{0}")]
@@ -80,6 +82,7 @@ impl Datum<'_> {
     pub fn as_blob(&self) -> &[u8] {
         match self {
             Self::Blob(blob) => blob.as_ref(),
+            Self::BorrowedBlob(blob) => blob,
             _ => panic!("not a blob: {self:?}"),
         }
     }
@@ -289,6 +292,7 @@ impl Datum<'_> {
             Datum::Float64(v) => append_value_to_arrow!(Float64Builder, v.into_inner()),
             Datum::String(v) => append_value_to_arrow!(StringBuilder, *v),
             Datum::Blob(v) => append_value_to_arrow!(BinaryBuilder, v.as_ref()),
+            Datum::BorrowedBlob(v) => append_value_to_arrow!(BinaryBuilder, *v),
             Datum::Decimal(_) | Datum::Date(_) | Datum::Timestamp(_) | Datum::TimestampTz(_) => {
                 return Err(RowConvertError {
                     message: format!(
@@ -406,6 +410,12 @@ impl From<Vec<u8>> for Blob {
     }
 }
 
+impl<'a> From<&'a [u8]> for Datum<'a> {
+    fn from(bytes: &'a [u8]) -> Datum<'a> {
+        Datum::BorrowedBlob(bytes)
+    }
+}
+
 const UNIX_EPOCH_DAY: jiff::civil::Date = jiff::civil::date(1970, 1, 1);
 
 impl Date {
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
new file mode 100644
index 0000000000..b9335a3c13
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
@@ -0,0 +1,329 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::RowType;
+use crate::row::binary::ValueWriter;
+use crate::row::compacted::CompactedKeyWriter;
+use crate::row::encode::KeyEncoder;
+use crate::row::field_getter::FieldGetter;
+use crate::row::{Datum, InternalRow};
+use bytes::Bytes;
+
+#[allow(dead_code)]
+pub struct CompactedKeyEncoder {
+    field_getters: Vec<FieldGetter>,
+    field_encoders: Vec<ValueWriter>,
+    compacted_encoder: CompactedKeyWriter,
+}
+
+impl CompactedKeyEncoder {
+    /// Create a key encoder to encode the key of the input row.
+    ///
+    /// # Arguments
+    /// * `row_type` - the row type of the input row
+    /// * `keys` - the key fields to encode
+    ///
+    /// # Returns
+    /// * key_encoder - the [`KeyEncoder`]
+    pub fn create_key_encoder(row_type: &RowType, keys: &[String]) -> Result<CompactedKeyEncoder> {
+        let mut encode_col_indexes = Vec::with_capacity(keys.len());
+
+        for key in keys {
+            match row_type.get_field_index(key) {
+                Some(idx) => encode_col_indexes.push(idx),
+                None => {
+                    return Err(IllegalArgument {
+                        message: format!(
+                            "Field {:?} not found in input row type {:?}",
+                            key, row_type
+                        ),
+                    });
+                }
+            }
+        }
+
+        Self::new(row_type, encode_col_indexes)
+    }
+
+    pub fn new(row_type: &RowType, encode_field_pos: Vec<usize>) -> Result<CompactedKeyEncoder> {
+        let mut field_getters: Vec<FieldGetter> = Vec::with_capacity(encode_field_pos.len());
+        let mut field_encoders: Vec<ValueWriter> = Vec::with_capacity(encode_field_pos.len());
+
+        for pos in &encode_field_pos {
+            let data_type = row_type.fields().get(*pos).unwrap().data_type();
+            field_getters.push(FieldGetter::create(data_type, *pos));
+            field_encoders.push(CompactedKeyWriter::create_value_writer(data_type)?);
+        }
+
+        Ok(CompactedKeyEncoder {
+            field_encoders,
+            field_getters,
+            compacted_encoder: CompactedKeyWriter::new(),
+        })
+    }
+}
+
+#[allow(dead_code)]
+impl KeyEncoder for CompactedKeyEncoder {
+    fn encode_key(&mut self, row: &dyn InternalRow) -> Result<Bytes> {
+        self.compacted_encoder.reset();
+
+        // iterate over the key fields of the row, and encode each one
+        for (pos, field_getter) in self.field_getters.iter().enumerate() {
+            match &field_getter.get_field(row) {
+                Datum::Null => {
+                    return Err(IllegalArgument {
+                        message: format!(
+                            "Cannot encode key with null value at position: {:?}",
+                            pos
+                        ),
+                    });
+                }
+                value => self.field_encoders.get(pos).unwrap().write_value(
+                    &mut self.compacted_encoder,
+                    pos,
+                    value,
+                )?,
+            }
+        }
+
+        Ok(self.compacted_encoder.to_bytes())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::DataTypes;
+    use crate::row::{Datum, GenericRow};
+
+    pub fn for_test_row_type(row_type: &RowType) -> CompactedKeyEncoder {
+        CompactedKeyEncoder::new(row_type, (0..row_type.fields().len()).collect())
+            .expect("CompactedKeyEncoder initialization failed")
+    }
+
+    #[test]
+    fn test_encode_key() {
+        let row_type = RowType::with_data_types(vec![
+            DataTypes::int(),
+            DataTypes::bigint(),
+            DataTypes::int(),
+        ]);
+        let row = GenericRow::from_data(vec![
+            Datum::from(1i32),
+            Datum::from(3i64),
+            Datum::from(2i32),
+        ]);
+
+        let mut encoder = for_test_row_type(&row_type);
+
+        assert_eq!(
+            encoder.encode_key(&row).unwrap().iter().as_slice(),
+            [1u8, 3u8, 2u8]
+        );
+
+        let row = GenericRow::from_data(vec![
+            Datum::from(2i32),
+            Datum::from(5i64),
+            Datum::from(6i32),
+        ]);
+
+        assert_eq!(
+            encoder.encode_key(&row).unwrap().iter().as_slice(),
+            [2u8, 5u8, 6u8]
+        );
+    }
+
+    #[test]
+    fn test_encode_key_with_key_names() {
+        let data_types = vec![
+            DataTypes::string(),
+            DataTypes::bigint(),
+            DataTypes::string(),
+        ];
+        let field_names = vec!["partition", "f1", "f2"];
+
+        let row_type = RowType::with_data_types_and_field_names(data_types, field_names);
+
+        let primary_keys = &["f2".to_string()];
+
+        let mut encoder = CompactedKeyEncoder::create_key_encoder(&row_type, primary_keys).unwrap();
+
+        let row = GenericRow::from_data(vec![
+            Datum::from("p1"),
+            Datum::from(1i64),
+            Datum::from("a2"),
+        ]);
+
+        // should only get the ASCII representation of "a2"
+        assert_eq!(
+            encoder.encode_key(&row).unwrap().iter().as_slice(),
+            //  2 (presumably the string's length prefix -- confirm against CompactedRowWriter), 97 (the letter a), 50 (the digit 2)
+            [2u8, 97u8, 50u8]
+        );
+    }
+
+    #[test]
+    #[should_panic(expected = "Cannot encode key with null value at position: 2")]
+    fn test_null_primary_key() {
+        // The first three of the four columns form the primary key.
+        let row_type = RowType::with_data_types(vec![
+            DataTypes::int(),
+            DataTypes::bigint(),
+            DataTypes::int(),
+            DataTypes::string(),
+        ]);
+
+        let mut encoder = CompactedKeyEncoder::new(&row_type, vec![0, 1, 2])
+            .expect("CompactedKeyEncoder initialization failed");
+
+        // Sanity check: a row whose key columns are all set encodes normally.
+        let complete_row = GenericRow::from_data(vec![
+            Datum::from(1i32),
+            Datum::from(3i64),
+            Datum::from(2i32),
+            Datum::from("a2"),
+        ]);
+
+        let complete_key = encoder.encode_key(&complete_row).unwrap();
+        assert_eq!(complete_key.iter().as_slice(), [1u8, 3u8, 2u8]);
+
+        // A null at key position 2 makes the final `unwrap` panic with the
+        // message expected by `should_panic`.
+        let row_with_null_key = GenericRow::from_data(vec![
+            Datum::from(1i32),
+            Datum::from(3i64),
+            Datum::Null,
+            Datum::from("a2"),
+        ]);
+
+        encoder.encode_key(&row_with_null_key).unwrap();
+    }
+
+    #[test]
+    fn test_int_string_as_primary_key() {
+        let row_type = RowType::with_data_types(vec![
+            DataTypes::string(),
+            DataTypes::int(),
+            DataTypes::string(),
+            DataTypes::string(),
+        ]);
+        // key columns are positions 1 (INT) and 2 (STRING)
+        let primary_key_indices = vec![1, 2];
+        let mut encoder = CompactedKeyEncoder::new(&row_type, primary_key_indices)
+            .expect("CompactedKeyEncoder initialization failed");
+
+        let row = GenericRow::from_data(vec![
+            Datum::from("a1"),
+            Datum::from(1i32),
+            Datum::from("a2"),
+            Datum::from("a3"),
+        ]);
+
+        assert_eq!(
+            encoder.encode_key(&row).unwrap().iter().as_slice(),
+            // 1 (1i32), 2 (byte length of "a2"), 97 (ASCII 'a'), 50 (ASCII '2')
+            [1u8, 2u8, 97u8, 50u8]
+        );
+    }
+
+    #[test]
+    fn test_all_data_types() {
+        let row_type = RowType::with_data_types(vec![
+            DataTypes::boolean(),
+            DataTypes::tinyint(),
+            DataTypes::smallint(),
+            DataTypes::int(),
+            DataTypes::bigint(),
+            DataTypes::float(),
+            DataTypes::double(),
+            // TODO Date
+            // TODO Time
+            DataTypes::binary(20),
+            DataTypes::bytes(),
+            DataTypes::char(2),
+            DataTypes::string(),
+            // TODO Decimal
+            // TODO Timestamp
+            // TODO Timestamp LTZ
+            // TODO Array of Int
+            // TODO Array of Float
+            // TODO Array of String
+            // TODO: Add Map and Row fields in Issue #1973
+        ]);
+
+        let row = GenericRow::from_data(vec![
+            Datum::from(true),
+            Datum::from(2i8),
+            Datum::from(10i16),
+            Datum::from(100i32),
+            Datum::from(-6101065172474983726i64), // from Java test case: new BigInteger("12345678901234567890").longValue()
+            Datum::from(13.2f32),
+            Datum::from(15.21f64),
+            // TODO Date
+            // TODO Time
+            Datum::from("1234567890".as_bytes()),
+            Datum::from("20".as_bytes()),
+            Datum::from("1"),
+            Datum::from("hello"),
+            // TODO Decimal
+            // TODO Timestamp
+            // TODO Timestamp LTZ
+            // TODO Array of Int
+            // TODO Array of Float
+            // TODO Array of String
+            // TODO: Add Map and Row fields in Issue #1973
+        ]);
+
+        let mut encoder = for_test_row_type(&row_type);
+        // Expected key: the per-field encodings below, concatenated in field order.
+        let mut expected: Vec<u8> = Vec::new();
+        // BOOLEAN: true
+        expected.extend_from_slice(&[0x01]);
+        // TINYINT: 2
+        expected.extend_from_slice(&[0x02]);
+        // SMALLINT: 10 (two bytes, low byte first; NOTE(review): confirm against the writer)
+        expected.extend_from_slice(&[0x0A, 0x00]);
+        // INT: 100 (a single byte, like the one-byte INT keys in test_encode_key)
+        expected.extend_from_slice(&[0x64]);
+        // BIGINT: -6101065172474983726
+        expected.extend_from_slice(&[
+            0xD2, 0x95, 0xFC, 0xD8, 0xCE, 0xB1, 0xAA, 0xAA, 0xAB, 0x01,
+        ]);
+        // FLOAT: 13.2
+        expected.extend_from_slice(&[0x33, 0x33, 0x53, 0x41]);
+        // DOUBLE: 15.21
+        expected.extend_from_slice(&[0xEC, 0x51, 0xB8, 0x1E, 0x85, 0x6B, 0x2E, 0x40]);
+        // BINARY(20): "1234567890".getBytes(), preceded by its byte length (10)
+        expected.extend_from_slice(&[
+            0x0A, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37, 0x38, 0x39, 0x30,
+        ]);
+
+        // BYTES: "20".getBytes(), preceded by its byte length (2)
+        expected.extend_from_slice(&[0x02, 0x32, 0x30]);
+        // CHAR(2): "1", preceded by its byte length (1)
+        expected.extend_from_slice(&[0x01, 0x31]);
+        // STRING: "hello", preceded by its byte length (5)
+        expected.extend_from_slice(&[0x05, 0x68, 0x65, 0x6C, 0x6C, 0x6F]);
+        assert_eq!(
+            encoder.encode_key(&row).unwrap().iter().as_slice(),
+            expected.as_slice()
+        );
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/encode/mod.rs b/fluss-rust/crates/fluss/src/row/encode/mod.rs
new file mode 100644
index 0000000000..6c6eed9936
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/encode/mod.rs
@@ -0,0 +1,64 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+mod compacted_key_encoder;
+
+use crate::error::Result;
+use crate::metadata::{DataLakeFormat, RowType};
+use crate::row::InternalRow;
+use crate::row::encode::compacted_key_encoder::CompactedKeyEncoder;
+use bytes::Bytes;
+
+/// An interface for encoding the key of a row into bytes.
+#[allow(dead_code)]
+pub trait KeyEncoder {
+    fn encode_key(&mut self, row: &dyn InternalRow) -> Result<Bytes>;
+}
+
+#[allow(dead_code)]
+impl dyn KeyEncoder {
+    /// Creates the key encoder that matches a table's data lake format.
+    ///
+    /// # Arguments
+    /// * `row_type` - the row type of the input row
+    /// * `key_fields` - the key fields to encode
+    /// * `data_lake_format` - the data lake format, if any
+    ///
+    /// # Returns
+    /// A boxed `CompactedKeyEncoder` for `Lance` and for `None`; errors from
+    /// `CompactedKeyEncoder::create_key_encoder` are propagated.
+    ///
+    /// # Panics
+    /// Panics via `unimplemented!` for the `Paimon` and `Iceberg` formats.
+    pub fn of(
+        row_type: &RowType,
+        key_fields: Vec<String>,
+        data_lake_format: Option<DataLakeFormat>,
+    ) -> Result<Box<dyn KeyEncoder>> {
+        match data_lake_format {
+            Some(DataLakeFormat::Paimon) => {
+                unimplemented!("KeyEncoder for Paimon format is currently unimplemented")
+            }
+            Some(DataLakeFormat::Iceberg) => {
+                unimplemented!("KeyEncoder for Iceberg format is currently unimplemented")
+            }
+            Some(DataLakeFormat::Lance) | None => Ok(Box::new(
+                CompactedKeyEncoder::create_key_encoder(row_type, key_fields.as_slice())?,
+            )),
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/field_getter.rs b/fluss-rust/crates/fluss/src/row/field_getter.rs
new file mode 100644
index 0000000000..3a9cf0fa81
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/field_getter.rs
@@ -0,0 +1,116 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::DataType;
+use crate::row::{Datum, InternalRow};
+
+/// Reads one field of a row as a `Datum`, with an optional null check.
+pub enum FieldGetter {
+    Nullable(InnerFieldGetter),
+    NonNullable(InnerFieldGetter),
+}
+impl FieldGetter {
+    /// Returns the field of `row`; a `Nullable` getter yields `Datum::Null`
+    /// when `row.is_null_at` reports the position as null.
+    pub fn get_field<'a>(&self, row: &'a dyn InternalRow) -> Datum<'a> {
+        match self {
+            FieldGetter::Nullable(getter) if row.is_null_at(getter.pos()) => Datum::Null,
+            FieldGetter::Nullable(getter) | FieldGetter::NonNullable(getter) => {
+                getter.get_field(row)
+            }
+        }
+    }
+
+    /// Builds the getter for the field at `pos` from its `data_type`.
+    /// Panics via `unimplemented!` for data types not matched below.
+    pub fn create(data_type: &DataType, pos: usize) -> FieldGetter {
+        let accessor = match data_type {
+            DataType::Char(t) => InnerFieldGetter::Char {
+                pos,
+                len: t.length() as usize,
+            },
+            DataType::String(_) => InnerFieldGetter::String { pos },
+            DataType::Boolean(_) => InnerFieldGetter::Bool { pos },
+            DataType::Binary(t) => InnerFieldGetter::Binary {
+                pos,
+                len: t.length(),
+            },
+            DataType::Bytes(_) => InnerFieldGetter::Bytes { pos },
+            DataType::TinyInt(_) => InnerFieldGetter::TinyInt { pos },
+            DataType::SmallInt(_) => InnerFieldGetter::SmallInt { pos },
+            DataType::Int(_) => InnerFieldGetter::Int { pos },
+            DataType::BigInt(_) => InnerFieldGetter::BigInt { pos },
+            DataType::Float(_) => InnerFieldGetter::Float { pos },
+            DataType::Double(_) => InnerFieldGetter::Double { pos },
+            _ => unimplemented!("DataType {:?} is currently unimplemented", data_type),
+        };
+        if data_type.is_nullable() {
+            FieldGetter::Nullable(accessor)
+        } else {
+            FieldGetter::NonNullable(accessor)
+        }
+    }
+}
+
+/// Typed accessor for the field at position `pos` of a row.
+pub enum InnerFieldGetter {
+    Char { pos: usize, len: usize },
+    String { pos: usize },
+    Bool { pos: usize },
+    Binary { pos: usize, len: usize },
+    Bytes { pos: usize },
+    TinyInt { pos: usize },
+    SmallInt { pos: usize },
+    Int { pos: usize },
+    BigInt { pos: usize },
+    Float { pos: usize },
+    Double { pos: usize },
+}
+impl InnerFieldGetter {
+    /// Reads the field at this getter's position from `row` as a `Datum`.
+    pub fn get_field<'a>(&self, row: &'a dyn InternalRow) -> Datum<'a> {
+        match *self {
+            Self::Char { pos, len } => Datum::String(row.get_char(pos, len)),
+            Self::String { pos } => Datum::from(row.get_string(pos)),
+            Self::Bool { pos } => Datum::from(row.get_boolean(pos)),
+            Self::Binary { pos, len } => Datum::from(row.get_binary(pos, len)),
+            Self::Bytes { pos } => Datum::from(row.get_bytes(pos)),
+            Self::TinyInt { pos } => Datum::from(row.get_byte(pos)),
+            Self::SmallInt { pos } => Datum::from(row.get_short(pos)),
+            Self::Int { pos } => Datum::from(row.get_int(pos)),
+            Self::BigInt { pos } => Datum::from(row.get_long(pos)),
+            Self::Float { pos } => Datum::from(row.get_float(pos)),
+            Self::Double { pos } => Datum::from(row.get_double(pos)),
+            // TODO Decimal, Date, Time, Timestamp, TimestampLTZ, Array, Map, Row
+        }
+    }
+
+    pub fn pos(&self) -> usize {
+        match *self {
+            Self::Char { pos, .. } | Self::Binary { pos, .. } => pos,
+            Self::String { pos }
+            | Self::Bool { pos }
+            | Self::Bytes { pos }
+            | Self::TinyInt { pos }
+            | Self::SmallInt { pos }
+            | Self::Int { pos }
+            | Self::BigInt { pos }
+            | Self::Float { pos }
+            | Self::Double { pos } => pos,
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 86fdf90c98..c321ab9d6b 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -19,11 +19,15 @@ mod column;
 
 mod datum;
 
+mod binary;
 mod compacted;
+mod encode;
+mod field_getter;
 
 pub use column::*;
 pub use datum::*;
 
+// TODO make functions return Result<?> for better error handling
 pub trait InternalRow {
     /// Returns the number of fields in this row
     fn get_field_count(&self) -> usize;
@@ -143,6 +147,11 @@ impl<'a> Default for GenericRow<'a> {
 }
 
 impl<'a> GenericRow<'a> {
+    /// Builds a row by converting every element of `data` into a `Datum`.
+    pub fn from_data(data: Vec<impl Into<Datum<'a>>>) -> GenericRow<'a> {
+        let values = data.into_iter().map(Into::into).collect();
+        GenericRow { values }
+    }
     pub fn new() -> GenericRow<'a> {
         GenericRow { values: vec![] }
     }

From 1f547950559a6be6ae26393f7ba16389f0ed9ff8 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 10 Jan 2026 02:00:12 +0000
Subject: [PATCH 055/287] feat: log scanner support poll record batch directly

---
 .../src/client/table/log_fetch_buffer.rs      |  54 +++-
 .../crates/fluss/src/client/table/mod.rs      |   2 +-
 .../crates/fluss/src/client/table/scanner.rs  | 236 ++++++++++++++++--
 fluss-rust/crates/fluss/src/record/arrow.rs   |  22 ++
 .../crates/fluss/tests/integration/table.rs   | 133 ++++++++++
 5 files changed, 430 insertions(+), 17 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index cee104e020..e9bac53f1a 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -15,12 +15,14 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use arrow::array::RecordBatch;
+use parking_lot::Mutex;
+
 use crate::error::Result;
 use crate::metadata::TableBucket;
 use crate::record::{
     LogRecordBatch, LogRecordIterator, LogRecordsBatches, ReadContext, ScanRecord,
 };
-use parking_lot::Mutex;
 use std::collections::{HashMap, VecDeque};
 use std::sync::Arc;
 use std::sync::atomic::{AtomicBool, Ordering};
@@ -31,6 +33,7 @@ use tokio::sync::Notify;
 pub trait CompletedFetch: Send + Sync {
     fn table_bucket(&self) -> &TableBucket;
     fn fetch_records(&mut self, max_records: usize) -> Result<Vec<ScanRecord>>;
+    fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<RecordBatch>>;
     fn is_consumed(&self) -> bool;
     fn drain(&mut self);
     fn size_in_bytes(&self) -> usize;
@@ -318,6 +321,38 @@ impl DefaultCompletedFetch {
             }
         }
     }
+
+    /// Get the next non-empty batch without row iteration (`None` once exhausted)
+    fn next_fetched_batch(&mut self) -> Result<Option<RecordBatch>> {
+        loop {
+            let Some(log_batch) = self.log_record_batch.next() else {
+                self.drain();
+                return Ok(None);
+            };
+            let decoded = log_batch.record_batch(&self.read_context)?;
+            let total_rows = decoded.num_rows();
+            if total_rows == 0 {
+                continue;
+            }
+            // Rows located before `next_fetch_offset` are cut off the front.
+            let base_offset = log_batch.base_log_offset();
+            let skip_count = if self.next_fetch_offset > base_offset {
+                (self.next_fetch_offset - base_offset) as usize
+            } else {
+                0
+            };
+            if skip_count >= total_rows {
+                continue;
+            }
+            let batch = match skip_count {
+                0 => decoded,
+                n => decoded.slice(n, total_rows - n),
+            };
+            self.next_fetch_offset = log_batch.next_log_offset();
+            self.records_read += batch.num_rows();
+            return Ok(Some(batch));
+        }
+    }
 }
 
 impl CompletedFetch for DefaultCompletedFetch {
@@ -346,6 +381,23 @@ impl CompletedFetch for DefaultCompletedFetch {
         Ok(scan_records)
     }
 
+    fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<RecordBatch>> {
+        // A consumed fetch has nothing left to hand out.
+        if self.consumed {
+            return Ok(Vec::new());
+        }
+
+        // The initial capacity is capped at 16 regardless of `max_batches`.
+        let mut collected = Vec::with_capacity(max_batches.min(16));
+        while collected.len() < max_batches {
+            let Some(batch) = self.next_fetched_batch()? else {
+                break;
+            };
+            collected.push(batch);
+        }
+        Ok(collected)
+    }
+
     fn is_consumed(&self) -> bool {
         self.consumed
     }
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index e2cf9e6d5e..26341d70a6 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -32,7 +32,7 @@ mod scanner;
 mod writer;
 
 pub use append::{AppendWriter, TableAppend};
-pub use scanner::{LogScanner, TableScan};
+pub use scanner::{LogScanner, RecordBatchLogScanner, TableScan};
 
 #[allow(dead_code)]
 pub struct FlussTable<'a> {
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 4255bb6841..7d22324d6b 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -15,6 +15,16 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use arrow::array::RecordBatch;
+use arrow_schema::SchemaRef;
+use log::{debug, error, warn};
+use parking_lot::{Mutex, RwLock};
+use std::collections::{HashMap, HashSet};
+use std::slice::from_ref;
+use std::sync::Arc;
+use std::time::Duration;
+use tempfile::TempDir;
+
 use crate::client::connection::FlussConnection;
 use crate::client::credentials::CredentialsCache;
 use crate::client::metadata::Metadata;
@@ -30,14 +40,6 @@ use crate::proto::{FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTabl
 use crate::record::{LogRecordsBatches, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
 use crate::rpc::{RpcClient, message};
 use crate::util::FairBucketStatusMap;
-use arrow_schema::SchemaRef;
-use log::{debug, error, warn};
-use parking_lot::{Mutex, RwLock};
-use std::collections::{HashMap, HashSet};
-use std::slice::from_ref;
-use std::sync::Arc;
-use std::time::Duration;
-use tempfile::TempDir;
 
 const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
 #[allow(dead_code)]
@@ -216,16 +218,48 @@ impl<'a> TableScan<'a> {
     }
 
     pub fn create_log_scanner(self) -> Result<LogScanner> {
-        LogScanner::new(
+        let inner = LogScannerInner::new(
             &self.table_info,
             self.metadata.clone(),
             self.conn.get_connections(),
             self.projected_fields,
-        )
+        )?;
+        Ok(LogScanner {
+            inner: Arc::new(inner),
+        })
+    }
+
+    /// Consumes this scan and builds a scanner that polls Arrow `RecordBatch`es.
+    pub fn create_record_batch_log_scanner(self) -> Result<RecordBatchLogScanner> {
+        LogScannerInner::new(
+            &self.table_info,
+            self.metadata.clone(),
+            self.conn.get_connections(),
+            self.projected_fields,
+        )
+        .map(Arc::new)
+        .map(|inner| RecordBatchLogScanner { inner })
+    }
 }
 
+/// Scanner for reading log records one at a time with per-record metadata.
+///
+/// Use this scanner when you need access to individual record offsets and timestamps.
+/// For batch-level access, use [`RecordBatchLogScanner`] instead.
 pub struct LogScanner {
+    inner: Arc<LogScannerInner>,
+}
+
+/// Scanner for reading log data as Arrow RecordBatches.
+///
+/// More efficient than [`LogScanner`] for batch-level analytics where per-record
+/// metadata (offsets, timestamps) is not needed.
+pub struct RecordBatchLogScanner {
+    inner: Arc<LogScannerInner>,
+}
+
+/// Private shared implementation for both scanner types
+struct LogScannerInner {
     table_path: TablePath,
     table_id: i64,
     metadata: Arc<Metadata>,
@@ -233,8 +267,8 @@ pub struct LogScanner {
     log_fetcher: LogFetcher,
 }
 
-impl LogScanner {
-    pub fn new(
+impl LogScannerInner {
+    fn new(
         table_info: &TableInfo,
         metadata: Arc<Metadata>,
         connections: Arc<RpcClient>,
@@ -256,7 +290,7 @@ impl LogScanner {
         })
     }
 
-    pub async fn poll(&self, timeout: Duration) -> Result<ScanRecords> {
+    async fn poll_records(&self, timeout: Duration) -> Result<ScanRecords> {
         let start = std::time::Instant::now();
         let deadline = start + timeout;
 
@@ -295,7 +329,7 @@ impl LogScanner {
         }
     }
 
-    pub async fn subscribe(&self, bucket: i32, offset: i64) -> Result<()> {
+    async fn subscribe(&self, bucket: i32, offset: i64) -> Result<()> {
         let table_bucket = TableBucket::new(self.table_id, bucket);
         self.metadata
             .check_and_update_table_metadata(from_ref(&self.table_path))
@@ -305,7 +339,7 @@ impl LogScanner {
         Ok(())
     }
 
-    pub async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
+    async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
         self.metadata
             .check_and_update_table_metadata(from_ref(&self.table_path))
             .await?;
@@ -339,6 +373,76 @@ impl LogScanner {
         // Collect completed fetches from buffer
         self.log_fetcher.collect_fetches()
     }
+
+    /// Polls for Arrow batches until some are available or `timeout` elapses.
+    async fn poll_batches(&self, timeout: Duration) -> Result<Vec<RecordBatch>> {
+        let start = std::time::Instant::now();
+        let deadline = start + timeout;
+        loop {
+            let batches = self.poll_for_batches().await?;
+            // Data is available: call `send_fetches` again before handing it back.
+            if !batches.is_empty() {
+                self.log_fetcher.send_fetches().await?;
+                return Ok(batches);
+            }
+            // No data yet: give up with an empty result once the deadline has passed.
+            let now = std::time::Instant::now();
+            if now >= deadline {
+                return Ok(Vec::new());
+            }
+            // Otherwise wait on the fetch buffer for at most the remaining time.
+            let remaining = deadline - now;
+            let has_data = self
+                .log_fetcher
+                .log_fetch_buffer
+                .await_not_empty(remaining)
+                .await;
+            // A `false` result from the wait ends the poll with an empty result.
+            if !has_data {
+                return Ok(Vec::new());
+            }
+        }
+    }
+
+    /// Returns collected batches, sending fetches first if none were collected.
+    async fn poll_for_batches(&self) -> Result<Vec<RecordBatch>> {
+        let buffered = self.log_fetcher.collect_batches()?;
+        if buffered.is_empty() {
+            self.log_fetcher.send_fetches().await?;
+            return self.log_fetcher.collect_batches();
+        }
+        Ok(buffered)
+    }
+}
+
+// Implementation for LogScanner (records mode); every method delegates to `inner`.
+impl LogScanner {
+    pub async fn poll(&self, timeout: Duration) -> Result<ScanRecords> {
+        self.inner.poll_records(timeout).await
+    }
+    /// Forwards `bucket` and `offset` to the inner scanner's `subscribe`.
+    pub async fn subscribe(&self, bucket: i32, offset: i64) -> Result<()> {
+        self.inner.subscribe(bucket, offset).await
+    }
+    /// Forwards the bucket-to-offset map to the inner scanner's `subscribe_batch`.
+    pub async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
+        self.inner.subscribe_batch(bucket_offsets).await
+    }
+}
+
+// Implementation for RecordBatchLogScanner (batches mode); every method delegates to `inner`.
+impl RecordBatchLogScanner {
+    pub async fn poll(&self, timeout: Duration) -> Result<Vec<RecordBatch>> {
+        self.inner.poll_batches(timeout).await
+    }
+    /// Forwards `bucket` and `offset` to the inner scanner's `subscribe`.
+    pub async fn subscribe(&self, bucket: i32, offset: i64) -> Result<()> {
+        self.inner.subscribe(bucket, offset).await
+    }
+    /// Forwards the bucket-to-offset map to the inner scanner's `subscribe_batch`.
+    pub async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
+        self.inner.subscribe_batch(bucket_offsets).await
+    }
 }
 
 struct LogFetcher {
@@ -801,6 +905,108 @@ impl LogFetcher {
         }
     }
 
+    /// Collect completed fetches as RecordBatches
+    fn collect_batches(&self) -> Result<Vec<RecordBatch>> {
+        // Limit memory usage with both batch count and byte size constraints.
+        // Max 100 batches per poll, but also check total bytes (soft cap ~64MB).
+        const MAX_BATCHES: usize = 100;
+        const MAX_BYTES: usize = 64 * 1024 * 1024; // 64MB soft cap
+        let mut result: Vec<RecordBatch> = Vec::new();
+        let mut batches_remaining = MAX_BATCHES;
+        let mut bytes_consumed: usize = 0;
+
+        while batches_remaining > 0 && bytes_consumed < MAX_BYTES {
+            let next_in_line = self.log_fetch_buffer.next_in_line_fetch();
+            // Read from the in-line fetch first; otherwise poll the buffer for the next one.
+            match next_in_line {
+                Some(mut next_fetch) if !next_fetch.is_consumed() => {
+                    let batches =
+                        self.fetch_batches_from_fetch(&mut next_fetch, batches_remaining)?;
+                    let batch_count = batches.len();
+                    if !batches.is_empty() {
+                        // Track bytes consumed (soft cap - may exceed by one fetch)
+                        let batch_bytes: usize =
+                            batches.iter().map(|b| b.get_array_memory_size()).sum();
+                        bytes_consumed += batch_bytes;
+                        result.extend(batches);
+                        batches_remaining = batches_remaining.saturating_sub(batch_count);
+                    }
+                    // Put a fetch that is not yet consumed back in line for later reads.
+                    if !next_fetch.is_consumed() {
+                        self.log_fetch_buffer
+                            .set_next_in_line_fetch(Some(next_fetch));
+                    }
+                }
+                _ => {
+                    if let Some(completed_fetch) = self.log_fetch_buffer.poll() {
+                        if !completed_fetch.is_initialized() {
+                            let size_in_bytes = completed_fetch.size_in_bytes();
+                            match self.initialize_fetch(completed_fetch) {
+                                Ok(initialized) => {
+                                    self.log_fetch_buffer.set_next_in_line_fetch(initialized);
+                                    continue;
+                                }
+                                Err(e) => {
+                                    if result.is_empty() && size_in_bytes == 0 {
+                                        continue;
+                                    }
+                                    // NOTE(review): batches already collected in `result` are dropped
+                                    // here although their bucket offsets were advanced - confirm intended.
+                                    return Err(e);
+                                }
+                            }
+                        } else {
+                            self.log_fetch_buffer
+                                .set_next_in_line_fetch(Some(completed_fetch));
+                        }
+                    } else {
+                        break;
+                    }
+                }
+            }
+        }
+
+        Ok(result)
+    }
+
+    /// Pulls up to `max_batches` batches from `next_in_line_fetch` when its offset
+    /// matches the tracked offset of its bucket; otherwise drains the fetch.
+    fn fetch_batches_from_fetch(
+        &self,
+        next_in_line_fetch: &mut Box<dyn CompletedFetch>,
+        max_batches: usize,
+    ) -> Result<Vec<RecordBatch>> {
+        let table_bucket = next_in_line_fetch.table_bucket().clone();
+        // Without a tracked offset the bucket is treated as unsubscribed.
+        let Some(current_offset) = self.log_scanner_status.get_bucket_offset(&table_bucket) else {
+            warn!(
+                "Ignoring fetched batches for {table_bucket:?} since the bucket has been unsubscribed"
+            );
+            next_in_line_fetch.drain();
+            return Ok(Vec::new());
+        };
+
+        // A fetch that does not start at the tracked offset is discarded.
+        let fetch_offset = next_in_line_fetch.next_fetch_offset();
+        if fetch_offset != current_offset {
+            warn!(
+                "Ignoring fetched batches for {table_bucket:?} at offset {fetch_offset} since the current offset is {current_offset}"
+            );
+            next_in_line_fetch.drain();
+            return Ok(Vec::new());
+        }
+
+        let batches = next_in_line_fetch.fetch_batches(max_batches)?;
+        // Record the fetch's new position for the bucket if it moved forward.
+        let next_fetch_offset = next_in_line_fetch.next_fetch_offset();
+        if next_fetch_offset > current_offset {
+            self.log_scanner_status
+                .update_offset(&table_bucket, next_fetch_offset);
+        }
+
+        Ok(batches)
+    }
+
     async fn prepare_fetch_log_requests(&self) -> HashMap<i32, FetchLogRequest> {
         let mut fetch_log_req_for_buckets = HashMap::new();
         let mut table_id = None;
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 5a5115edfa..89fb7b9c94 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -546,6 +546,28 @@ impl LogRecordBatch {
         };
         Ok(log_record_iterator)
     }
+
+    /// Returns the record batch directly without creating an iterator; a record
+    /// count of zero yields an empty batch with the read context's target schema.
+    pub fn record_batch(&self, read_context: &ReadContext) -> Result<RecordBatch> {
+        if self.record_count() == 0 {
+            let schema = read_context.target_schema.clone();
+            return Ok(RecordBatch::new_empty(schema));
+        }
+
+        // Everything from RECORDS_OFFSET onward is handed to the read context.
+        match self.data.get(RECORDS_OFFSET..) {
+            Some(payload) => read_context.record_batch(payload),
+            None => Err(crate::error::Error::UnexpectedError {
+                message: format!(
+                    "Corrupt log record batch: data length {} is less than RECORDS_OFFSET {}",
+                    self.data.len(),
+                    RECORDS_OFFSET
+                ),
+                source: None,
+            }),
+        }
+    }
 }
 
 /// Parse an Arrow IPC message from a byte slice.
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index 0ac34c7635..4cba46993f 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -469,4 +469,137 @@ mod table_test {
         records.sort_by_key(|r| r.offset());
         records
     }
+
+    #[tokio::test]
+    async fn test_poll_batches() { // integration test for the record-batch log scanner's poll()
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss".to_string(), "test_poll_batches".to_string());
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .build()
+            .unwrap();
+
+        create_table(
+            &admin,
+            &table_path,
+            &TableDescriptor::builder().schema(schema).build().unwrap(),
+        )
+        .await;
+        tokio::time::sleep(Duration::from_secs(1)).await; // presumably lets table creation settle
+
+        let table = connection.get_table(&table_path).await.unwrap();
+        let scanner = table.new_scan().create_record_batch_log_scanner().unwrap();
+        scanner.subscribe(0, 0).await.unwrap();
+
+        // Test 1: Empty table should return empty result
+        assert!(
+            scanner
+                .poll(Duration::from_millis(500))
+                .await
+                .unwrap()
+                .is_empty()
+        );
+
+        let writer = table.new_append().unwrap().create_writer();
+        writer
+            .append_arrow_batch(
+                record_batch!(("id", Int32, [1, 2]), ("name", Utf8, ["a", "b"])).unwrap(),
+            )
+            .await
+            .unwrap();
+        writer
+            .append_arrow_batch(
+                record_batch!(("id", Int32, [3, 4]), ("name", Utf8, ["c", "d"])).unwrap(),
+            )
+            .await
+            .unwrap();
+        writer
+            .append_arrow_batch(
+                record_batch!(("id", Int32, [5, 6]), ("name", Utf8, ["e", "f"])).unwrap(),
+            )
+            .await
+            .unwrap();
+        writer.flush().await.unwrap();
+
+        use arrow::array::Int32Array;
+        let batches = scanner.poll(Duration::from_secs(10)).await.unwrap();
+        let all_ids: Vec<i32> = batches
+            .iter()
+            .flat_map(|b| {
+                (0..b.num_rows()).map(|i| {
+                    b.column(0)
+                        .as_any()
+                        .downcast_ref::<Int32Array>()
+                        .unwrap()
+                        .value(i)
+                })
+            })
+            .collect();
+
+        // Test 2: Order should be preserved across multiple batches
+        assert_eq!(all_ids, vec![1, 2, 3, 4, 5, 6]);
+
+        writer
+            .append_arrow_batch(
+                record_batch!(("id", Int32, [7, 8]), ("name", Utf8, ["g", "h"])).unwrap(),
+            )
+            .await
+            .unwrap();
+        writer.flush().await.unwrap();
+
+        let more = scanner.poll(Duration::from_secs(10)).await.unwrap();
+        let new_ids: Vec<i32> = more
+            .iter()
+            .flat_map(|b| {
+                (0..b.num_rows()).map(|i| {
+                    b.column(0)
+                        .as_any()
+                        .downcast_ref::<Int32Array>()
+                        .unwrap()
+                        .value(i)
+                })
+            })
+            .collect();
+
+        // Test 3: Subsequent polls should not return duplicate data (offset continuation)
+        assert_eq!(new_ids, vec![7, 8]);
+
+        // Test 4: Subscribing from mid-offset should truncate batch (Arrow batch slicing)
+        // Server returns all records from start of batch, but client truncates to subscription offset
+        let trunc_scanner = table.new_scan().create_record_batch_log_scanner().unwrap();
+        trunc_scanner.subscribe(0, 3).await.unwrap();
+        let trunc_batches = trunc_scanner.poll(Duration::from_secs(10)).await.unwrap();
+        let trunc_ids: Vec<i32> = trunc_batches
+            .iter()
+            .flat_map(|b| {
+                (0..b.num_rows()).map(|i| {
+                    b.column(0)
+                        .as_any()
+                        .downcast_ref::<Int32Array>()
+                        .unwrap()
+                        .value(i)
+                })
+            })
+            .collect();
+
+        // Subscribing from offset 3 should return [4,5,6,7,8], not [1,2,3,4,5,6,7,8]
+        assert_eq!(trunc_ids, vec![4, 5, 6, 7, 8]);
+
+        // Test 5: Projection should only return requested columns
+        let proj = table
+            .new_scan()
+            .project_by_name(&["id"])
+            .unwrap()
+            .create_record_batch_log_scanner()
+            .unwrap();
+        proj.subscribe(0, 0).await.unwrap();
+        let proj_batches = proj.poll(Duration::from_secs(10)).await.unwrap();
+
+        // Projected batch should have 1 column (id), not 2 (id, name)
+        assert_eq!(proj_batches[0].num_columns(), 1);
+    }
 }

From d61086fa8457e521dd949f4648ddbbc9c4ad6c88 Mon Sep 17 00:00:00 2001
From: Kelvin Wu <kelvinyu1117@gmail.com>
Date: Sat, 10 Jan 2026 22:01:24 +0800
Subject: [PATCH 056/287] feat: introduce CompactedRowReader, CompactedRow,
 CompactedRowDeserializer (#131)

---
 .../crates/fluss/src/metadata/datatype.rs     |   2 +-
 .../fluss/src/row/binary/binary_writer.rs     |   2 +-
 .../fluss/src/row/compacted/compacted_row.rs  | 260 ++++++++++++++++++
 .../src/row/compacted/compacted_row_reader.rs | 218 +++++++++++++++
 .../src/row/compacted/compacted_row_writer.rs |   5 +-
 .../crates/fluss/src/row/compacted/mod.rs     |   9 +
 fluss-rust/crates/fluss/src/row/datum.rs      |  10 +-
 .../src/row/encode/compacted_key_encoder.rs   |  10 +-
 8 files changed, 502 insertions(+), 14 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs

diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index e5ccb9a8e9..c53cd273cb 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -861,7 +861,7 @@ impl RowType {
     pub fn with_data_types(data_types: Vec<DataType>) -> Self {
         let mut fields: Vec<DataField> = Vec::new();
         data_types.iter().enumerate().for_each(|(idx, data_type)| {
-            fields.push(DataField::new(format!("f{}", idx), data_type.clone(), None));
+            fields.push(DataField::new(format!("f{idx}"), data_type.clone(), None));
         });
 
         Self::with_nullable(true, fields)
diff --git a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
index a296777a30..44f10b6309 100644
--- a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
@@ -201,7 +201,7 @@ impl InnerValueWriter {
             }
             _ => {
                 return Err(IllegalArgument {
-                    message: format!("{:?} used to write value {:?}", self, value),
+                    message: format!("{self:?} used to write value {value:?}"),
                 });
             }
         }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
new file mode 100644
index 0000000000..fca41c655f
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -0,0 +1,260 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use bytes::Bytes;
+
+use crate::metadata::DataType;
+use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
+use crate::row::{GenericRow, InternalRow};
+
+// Row kept in its encoded byte form and decoded into a GenericRow on first field access. Reference implementation:
+// https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/row/compacted/CompactedRow.java
+#[allow(dead_code)]
+pub struct CompactedRow {
+    arity: usize, // number of fields (length of the type list given at construction)
+    segment: Bytes, // buffer holding the encoded row
+    offset: usize, // index in `segment` where the row starts
+    size_in_bytes: usize, // length of the encoded row
+    decoded: bool, // true once `decoded_row` reflects the current segment/offset/size
+    decoded_row: GenericRow<'static>, // cached result of deserializing the row
+    reader: CompactedRowReader, // re-pointed at the segment each time the row is decoded
+    deserializer: CompactedRowDeserializer, // holds the field types used for decoding
+}
+
+#[allow(dead_code)]
+impl CompactedRow {
+    pub fn calculate_bit_set_width_in_bytes(arity: usize) -> usize {
+        arity.div_ceil(8) // one null bit per field, rounded up to whole bytes
+    }
+
+    pub fn new(types: Vec<DataType>) -> Self {
+        let arity = types.len();
+        Self {
+            arity,
+            segment: Bytes::new(), // empty until `point_to` attaches a buffer
+            offset: 0,
+            size_in_bytes: 0,
+            decoded: false,
+            decoded_row: GenericRow::new(),
+            reader: CompactedRowReader::new(arity),
+            deserializer: CompactedRowDeserializer::new(types),
+        }
+    }
+
+    pub fn from_bytes(types: Vec<DataType>, data: Bytes) -> Self {
+        let arity = types.len();
+        let size = data.len();
+        Self {
+            arity,
+            segment: data,
+            offset: 0, // the row is taken to span all of `data`
+            size_in_bytes: size,
+            decoded: false,
+            decoded_row: GenericRow::new(),
+            reader: CompactedRowReader::new(arity),
+            deserializer: CompactedRowDeserializer::new(types),
+        }
+    }
+
+    pub fn point_to(&mut self, segment: Bytes, offset: usize, size_in_bytes: usize) {
+        self.segment = segment;
+        self.offset = offset;
+        self.size_in_bytes = size_in_bytes;
+        self.decoded = false; // force a fresh decode on the next field access
+    }
+
+    pub fn get_segment(&self) -> &Bytes {
+        &self.segment
+    }
+
+    pub fn get_offset(&self) -> usize {
+        self.offset
+    }
+
+    pub fn get_size_in_bytes(&self) -> usize {
+        self.size_in_bytes
+    }
+
+    pub fn get_field_count(&self) -> usize {
+        self.arity
+    }
+
+    pub fn is_null_at(&self, pos: usize) -> bool {
+        let byte_index = pos >> 3; // which byte of the null bitset holds this field
+        let bit = pos & 7; // which bit inside that byte
+        let idx = self.offset + byte_index;
+        (self.segment[idx] & (1u8 << bit)) != 0 // a set bit marks the field as null
+    }
+
+    fn decoded_row(&mut self) -> &GenericRow<'static> {
+        if !self.decoded {
+            self.reader
+                .point_to(self.segment.clone(), self.offset, self.size_in_bytes);
+            self.decoded_row = self.deserializer.deserialize(&mut self.reader);
+            self.decoded = true; // later calls reuse the cached row until `point_to` resets this
+        }
+        &self.decoded_row
+    }
+
+    pub fn get_boolean(&mut self, pos: usize) -> bool { // `&mut self`: the first getter call fills the cache
+        self.decoded_row().get_boolean(pos)
+    }
+
+    pub fn get_byte(&mut self, pos: usize) -> i8 {
+        self.decoded_row().get_byte(pos)
+    }
+
+    pub fn get_short(&mut self, pos: usize) -> i16 {
+        self.decoded_row().get_short(pos)
+    }
+
+    pub fn get_int(&mut self, pos: usize) -> i32 {
+        self.decoded_row().get_int(pos)
+    }
+
+    pub fn get_long(&mut self, pos: usize) -> i64 {
+        self.decoded_row().get_long(pos)
+    }
+
+    pub fn get_float(&mut self, pos: usize) -> f32 {
+        self.decoded_row().get_float(pos)
+    }
+
+    pub fn get_double(&mut self, pos: usize) -> f64 {
+        self.decoded_row().get_double(pos)
+    }
+
+    pub fn get_string(&mut self, pos: usize) -> &str {
+        self.decoded_row().get_string(pos)
+    }
+
+    pub fn get_bytes(&mut self, pos: usize) -> &[u8] {
+        self.decoded_row().get_bytes(pos)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{
+        BigIntType, BooleanType, BytesType, DoubleType, FloatType, IntType, SmallIntType,
+        StringType, TinyIntType,
+    };
+    use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
+
+    #[test]
+    fn test_compacted_row() {
+        // Round-trip one value of each supported primitive type through the writer and the row
+        let types = vec![
+            DataType::Boolean(BooleanType::new()),
+            DataType::TinyInt(TinyIntType::new()),
+            DataType::SmallInt(SmallIntType::new()),
+            DataType::Int(IntType::new()),
+            DataType::BigInt(BigIntType::new()),
+            DataType::Float(FloatType::new()),
+            DataType::Double(DoubleType::new()),
+            DataType::String(StringType::new()),
+            DataType::Bytes(BytesType::new()),
+        ];
+
+        let mut row = CompactedRow::new(types.clone());
+        let mut writer = CompactedRowWriter::new(types.len());
+
+        writer.write_boolean(true);
+        writer.write_byte(1);
+        writer.write_short(100);
+        writer.write_int(1000);
+        writer.write_long(10000);
+        writer.write_float(1.5);
+        writer.write_double(2.5);
+        writer.write_string("Hello World");
+        writer.write_bytes(&[1, 2, 3, 4, 5]);
+
+        row.point_to(writer.to_bytes(), 0, writer.position());
+
+        assert_eq!(row.get_field_count(), 9);
+        assert!(row.get_boolean(0));
+        assert_eq!(row.get_byte(1), 1);
+        assert_eq!(row.get_short(2), 100);
+        assert_eq!(row.get_int(3), 1000);
+        assert_eq!(row.get_long(4), 10000);
+        assert_eq!(row.get_float(5), 1.5);
+        assert_eq!(row.get_double(6), 2.5);
+        assert_eq!(row.get_string(7), "Hello World");
+        assert_eq!(row.get_bytes(8), &[1, 2, 3, 4, 5]);
+
+        // A field marked null is reported by is_null_at; the non-null fields around it still decode
+        let types = vec![
+            DataType::Int(IntType::new()),
+            DataType::String(StringType::new()),
+            DataType::Double(DoubleType::new()),
+        ];
+
+        let mut row = CompactedRow::new(types.clone());
+        let mut writer = CompactedRowWriter::new(types.len());
+
+        writer.write_int(100);
+        writer.set_null_at(1);
+        writer.write_double(2.71);
+
+        row.point_to(writer.to_bytes(), 0, writer.position());
+
+        assert!(!row.is_null_at(0));
+        assert!(row.is_null_at(1));
+        assert!(!row.is_null_at(2));
+        assert_eq!(row.get_int(0), 100);
+        assert_eq!(row.get_double(2), 2.71);
+
+        // Repeated reads of the same field return the same value (the decoded row is cached)
+        assert_eq!(row.get_int(0), 100);
+        assert_eq!(row.get_int(0), 100);
+
+        // from_bytes attaches the buffer at construction, so no point_to call is needed
+        let types = vec![
+            DataType::Int(IntType::new()),
+            DataType::String(StringType::new()),
+        ];
+
+        let mut writer = CompactedRowWriter::new(types.len());
+        writer.write_int(42);
+        writer.write_string("test");
+
+        let mut row = CompactedRow::from_bytes(types, writer.to_bytes());
+
+        assert_eq!(row.get_int(0), 42);
+        assert_eq!(row.get_string(1), "test");
+
+        // Large row: with 100 fields the null bitset is 13 bytes wide (100.div_ceil(8))
+        let num_fields = 100;
+        let types: Vec<DataType> = (0..num_fields)
+            .map(|_| DataType::Int(IntType::new()))
+            .collect();
+
+        let mut row = CompactedRow::new(types.clone());
+        let mut writer = CompactedRowWriter::new(num_fields);
+
+        for i in 0..num_fields {
+            writer.write_int((i * 10) as i32);
+        }
+
+        row.point_to(writer.to_bytes(), 0, writer.position());
+
+        for i in 0..num_fields {
+            assert_eq!(row.get_int(i), (i * 10) as i32);
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
new file mode 100644
index 0000000000..19afe887d4
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -0,0 +1,218 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use bytes::Bytes;
+
+use crate::{
+    metadata::DataType,
+    row::{
+        Datum, GenericRow,
+        compacted::{compacted_row::CompactedRow, compacted_row_writer::CompactedRowWriter},
+    },
+};
+
+#[allow(dead_code)]
+pub struct CompactedRowDeserializer {
+    schema: Vec<DataType>, // field types in field order; index == field position
+}
+
+#[allow(dead_code)]
+impl CompactedRowDeserializer {
+    pub fn new(schema: Vec<DataType>) -> Self {
+        Self { schema }
+    }
+
+    pub fn deserialize(&self, reader: &mut CompactedRowReader) -> GenericRow<'static> { // reads every field in schema order
+        let mut row = GenericRow::new();
+        for (pos, dtype) in self.schema.iter().enumerate() {
+            if reader.is_null_at(pos) {
+                row.set_field(pos, Datum::Null);
+                continue; // nothing is read from the value area for a null field
+            }
+            let datum = match dtype {
+                DataType::Boolean(_) => Datum::Bool(reader.read_boolean()),
+                DataType::TinyInt(_) => Datum::Int8(reader.read_byte() as i8), // reinterpret the raw byte as signed
+                DataType::SmallInt(_) => Datum::Int16(reader.read_short()),
+                DataType::Int(_) => Datum::Int32(reader.read_int()),
+                DataType::BigInt(_) => Datum::Int64(reader.read_long()),
+                DataType::Float(_) => Datum::Float32(reader.read_float().into()),
+                DataType::Double(_) => Datum::Float64(reader.read_double().into()),
+                // TODO: use read_char(length) in the future, but need to keep compatibility
+                DataType::Char(_) | DataType::String(_) => Datum::OwnedString(reader.read_string()),
+                // TODO: use read_binary(length) in the future, but need to keep compatibility
+                DataType::Bytes(_) | DataType::Binary(_) => {
+                    Datum::Blob(reader.read_bytes().into_vec().into())
+                }
+                _ => panic!("unsupported DataType in CompactedRowDeserializer"), // every other DataType variant panics
+            };
+            row.set_field(pos, datum);
+        }
+        row
+    }
+}
+
+// Sequential reader over one encoded row: a null bitset header followed by the field values. Reference implementation:
+// https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/row/compacted/CompactedRowReader.java
+#[allow(dead_code)]
+pub struct CompactedRowReader {
+    segment: Bytes, // buffer being read
+    offset: usize, // index in `segment` where the row (and its null bitset) starts
+    position: usize, // index of the next byte to read
+    limit: usize, // `offset + length` as passed to `point_to`
+    header_size_in_bytes: usize, // width of the null bitset, derived from the field count
+}
+
+#[allow(dead_code)]
+impl CompactedRowReader {
+    pub fn new(field_count: usize) -> Self {
+        let header = CompactedRow::calculate_bit_set_width_in_bytes(field_count);
+        Self {
+            header_size_in_bytes: header,
+            segment: Bytes::new(), // empty until `point_to` is called
+            offset: 0,
+            position: 0,
+            limit: 0,
+        }
+    }
+
+    pub fn point_to(&mut self, data: Bytes, offset: usize, length: usize) {
+        let limit = offset + length;
+        let position = offset + self.header_size_in_bytes; // reading starts right after the null bitset
+
+        debug_assert!(limit <= data.len()); // debug_assert!: only checked when debug assertions are enabled
+        debug_assert!(position <= limit);
+
+        self.segment = data;
+        self.offset = offset;
+        self.position = position;
+        self.limit = limit;
+    }
+
+    pub fn is_null_at(&self, pos: usize) -> bool {
+        let byte_index = pos >> 3; // which byte of the null bitset holds this field
+        let bit = pos & 7; // which bit inside that byte
+        debug_assert!(byte_index < self.header_size_in_bytes);
+        let idx = self.offset + byte_index;
+        (self.segment[idx] & (1u8 << bit)) != 0 // a set bit marks the field as null
+    }
+
+    pub fn read_boolean(&mut self) -> bool {
+        self.read_byte() != 0 // any non-zero byte reads as true
+    }
+
+    pub fn read_byte(&mut self) -> u8 {
+        debug_assert!(self.position < self.limit);
+        let b = self.segment[self.position]; // indexing panics if `position` is past the end of `segment`
+        self.position += 1;
+        b
+    }
+
+    pub fn read_short(&mut self) -> i16 {
+        debug_assert!(self.position + 2 <= self.limit);
+        let bytes_slice = &self.segment[self.position..self.position + 2];
+        let byte_array: [u8; 2] = bytes_slice
+            .try_into()
+            .expect("Slice must be exactly 2 bytes long");
+
+        self.position += 2;
+        i16::from_ne_bytes(byte_array) // fixed 2 bytes, native byte order
+    }
+
+    pub fn read_int(&mut self) -> i32 {
+        let mut result: u32 = 0;
+        let mut shift = 0;
+
+        for _ in 0..CompactedRowWriter::MAX_INT_SIZE { // variable-length: 7 value bits per byte, lowest group first
+            let b = self.read_byte();
+            result |= ((b & 0x7F) as u32) << shift;
+            if (b & 0x80) == 0 { // high bit clear marks the last byte
+                return result as i32;
+            }
+            shift += 7;
+        }
+
+        panic!("Invalid input stream."); // no terminating byte within MAX_INT_SIZE bytes
+    }
+
+    pub fn read_long(&mut self) -> i64 {
+        let mut result: u64 = 0;
+        let mut shift = 0;
+
+        for _ in 0..CompactedRowWriter::MAX_LONG_SIZE { // same 7-bits-per-byte scheme as read_int
+            let b = self.read_byte();
+            result |= ((b & 0x7F) as u64) << shift;
+            if (b & 0x80) == 0 { // high bit clear marks the last byte
+                return result as i64;
+            }
+            shift += 7;
+        }
+
+        panic!("Invalid input stream."); // no terminating byte within MAX_LONG_SIZE bytes
+    }
+
+    pub fn read_float(&mut self) -> f32 {
+        debug_assert!(self.position + 4 <= self.limit);
+        let bytes_slice = &self.segment[self.position..self.position + 4];
+        let byte_array: [u8; 4] = bytes_slice
+            .try_into()
+            .expect("Slice must be exactly 4 bytes long");
+
+        self.position += 4;
+        f32::from_ne_bytes(byte_array) // fixed 4 bytes, native byte order
+    }
+
+    pub fn read_double(&mut self) -> f64 {
+        debug_assert!(self.position + 8 <= self.limit);
+        let bytes_slice = &self.segment[self.position..self.position + 8];
+        let byte_array: [u8; 8] = bytes_slice
+            .try_into()
+            .expect("Slice must be exactly 8 bytes long");
+
+        self.position += 8;
+        f64::from_ne_bytes(byte_array) // fixed 8 bytes, native byte order
+    }
+
+    pub fn read_binary(&mut self, length: usize) -> Bytes { // caller supplies the length; no prefix is read
+        debug_assert!(self.position + length <= self.limit);
+
+        let start = self.position;
+        let end = start + length;
+        self.position = end;
+
+        self.segment.slice(start..end) // Bytes::slice returns a handle onto the same buffer, not a copy
+    }
+
+    pub fn read_bytes(&mut self) -> Box<[u8]> {
+        let len = self.read_int(); // payload is preceded by its length as a variable-length int
+        debug_assert!(len >= 0);
+
+        let len = len as usize;
+        debug_assert!(self.position + len <= self.limit);
+
+        let start = self.position;
+        let end = start + len;
+        self.position = end;
+
+        self.segment[start..end].to_vec().into_boxed_slice() // copies the payload out of the segment
+    }
+
+    pub fn read_string(&mut self) -> String {
+        let bytes = self.read_bytes(); // strings use the same length-prefixed layout as read_bytes
+        String::from_utf8(bytes.into_vec())
+            .unwrap_or_else(|e| panic!("Invalid UTF-8 in string data: {e}"))
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
index 2debab19ae..834512350c 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -18,6 +18,8 @@
 use bytes::{Bytes, BytesMut};
 use std::cmp;
 
+use crate::row::compacted::compacted_row::CompactedRow;
+
 // Writer for CompactedRow
 // Reference implementation:
 // https://github.com/apache/fluss/blob/d4a72fad240d4b81563aaf83fa3b09b5058674ed/fluss-common/src/main/java/org/apache/fluss/row/compacted/CompactedRowWriter.java#L71
@@ -34,8 +36,7 @@ impl CompactedRowWriter {
     pub const MAX_LONG_SIZE: usize = 10;
 
     pub fn new(field_count: usize) -> Self {
-        // bitset width in bytes, it should be in CompactedRow
-        let header_size = field_count.div_ceil(8);
+        let header_size = CompactedRow::calculate_bit_set_width_in_bytes(field_count);
         let cap = cmp::max(64, header_size);
 
         let mut buffer = BytesMut::with_capacity(cap);
diff --git a/fluss-rust/crates/fluss/src/row/compacted/mod.rs b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
index c81eb5a50b..3361078321 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
@@ -16,6 +16,15 @@
 // under the License.
 
 mod compacted_key_writer;
+
+mod compacted_row;
+mod compacted_row_reader;
 mod compacted_row_writer;
 
 pub use compacted_key_writer::CompactedKeyWriter;
+#[allow(unused_imports)]
+pub use compacted_row::CompactedRow;
+#[allow(unused_imports)]
+pub use compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
+#[allow(unused_imports)]
+pub use compacted_row_writer::CompactedRowWriter;
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 28a378fd56..78872a9dd4 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -53,6 +53,9 @@ pub enum Datum<'a> {
     Float64(F64),
     #[display("'{0}'")]
     String(&'a str),
+    /// Owned string
+    #[display("'{0}'")]
+    OwnedString(String),
     #[display("{0}")]
     Blob(Blob),
     #[display("{:?}")]
@@ -75,6 +78,7 @@ impl Datum<'_> {
     pub fn as_str(&self) -> &str {
         match self {
             Self::String(s) => s,
+            Self::OwnedString(s) => s.as_str(),
             _ => panic!("not a string: {self:?}"),
         }
     }
@@ -216,13 +220,14 @@ impl TryFrom<&Datum<'_>> for bool {
     }
 }
 
-impl<'a> TryFrom<&Datum<'a>> for &'a str {
+impl<'b, 'a: 'b> TryFrom<&'b Datum<'a>> for &'b str {
     type Error = ();
 
     #[inline]
-    fn try_from(from: &Datum<'a>) -> std::result::Result<Self, Self::Error> {
+    fn try_from(from: &'b Datum<'a>) -> std::result::Result<Self, Self::Error> {
         match from {
             Datum::String(i) => Ok(*i),
+            Datum::OwnedString(s) => Ok(s.as_str()),
             _ => Err(()),
         }
     }
@@ -291,6 +296,7 @@ impl Datum<'_> {
             Datum::Float32(v) => append_value_to_arrow!(Float32Builder, v.into_inner()),
             Datum::Float64(v) => append_value_to_arrow!(Float64Builder, v.into_inner()),
             Datum::String(v) => append_value_to_arrow!(StringBuilder, *v),
+            Datum::OwnedString(v) => append_value_to_arrow!(StringBuilder, v.as_str()),
             Datum::Blob(v) => append_value_to_arrow!(BinaryBuilder, v.as_ref()),
             Datum::BorrowedBlob(v) => append_value_to_arrow!(BinaryBuilder, *v),
             Datum::Decimal(_) | Datum::Date(_) | Datum::Timestamp(_) | Datum::TimestampTz(_) => {
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
index b9335a3c13..ebe3da2a0a 100644
--- a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
@@ -49,10 +49,7 @@ impl CompactedKeyEncoder {
                 Some(idx) => encode_col_indexes.push(idx),
                 None => {
                     return Err(IllegalArgument {
-                        message: format!(
-                            "Field {:?} not found in input row type {:?}",
-                            key, row_type
-                        ),
+                        message: format!("Field {key:?} not found in input row type {row_type:?}"),
                     });
                 }
             }
@@ -89,10 +86,7 @@ impl KeyEncoder for CompactedKeyEncoder {
             match &field_getter.get_field(row) {
                 Datum::Null => {
                     return Err(IllegalArgument {
-                        message: format!(
-                            "Cannot encode key with null value at position: {:?}",
-                            pos
-                        ),
+                        message: format!("Cannot encode key with null value at position: {pos:?}"),
                     });
                 }
                 value => self.field_encoders.get(pos).unwrap().write_value(

From 98497bef8adbb2cbd7a2a6a34b6af4469678653e Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 10 Jan 2026 16:04:31 +0000
Subject: [PATCH 057/287] chore: fix Box leaking and batch API refactor (#136)

---
 fluss-rust/bindings/python/src/table.rs | 100 +++---------------------
 1 file changed, 11 insertions(+), 89 deletions(-)

diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 71759d7505..8a1164856b 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -17,6 +17,8 @@
 
 use crate::TOKIO_RUNTIME;
 use crate::*;
+use arrow::array::RecordBatch;
+use arrow_pyarrow::FromPyArrow;
 use fluss::client::EARLIEST_OFFSET;
 use fluss::rpc::message::OffsetSpec;
 use pyo3_async_runtimes::tokio::future_into_py;
@@ -148,34 +150,17 @@ impl AppendWriter {
 
     /// Write Arrow batch data
     pub fn write_arrow_batch(&mut self, py: Python, batch: Py<PyAny>) -> PyResult<()> {
-        // Extract number of rows and columns from the Arrow batch
-        let num_rows: usize = batch.getattr(py, "num_rows")?.extract(py)?;
-        let num_columns: usize = batch.getattr(py, "num_columns")?.extract(py)?;
-
-        // Process each row in the batch
-        for row_idx in 0..num_rows {
-            let mut generic_row = fcore::row::GenericRow::new();
-
-            // Extract values for each column in this row
-            for col_idx in 0..num_columns {
-                let column = batch.call_method1(py, "column", (col_idx,))?;
-                let value = column.call_method1(py, "__getitem__", (row_idx,))?;
-
-                // Convert the Python value to a Datum and add to the row
-                let datum = self.convert_python_value_to_datum(py, value)?;
-                generic_row.set_field(col_idx, datum);
-            }
+        // This shares the underlying Arrow buffers without copying data
+        let batch_bound = batch.bind(py);
+        let rust_batch: RecordBatch = FromPyArrow::from_pyarrow_bound(batch_bound)
+            .map_err(|e| FlussError::new_err(format!("Failed to convert RecordBatch: {e}")))?;
 
-            // Append this row using the async append method
-            TOKIO_RUNTIME.block_on(async {
-                self.inner
-                    .append(generic_row)
-                    .await
-                    .map_err(|e| FlussError::new_err(e.to_string()))
-            })?;
-        }
+        // Release the GIL before blocking on async operation
+        let result = py.detach(|| {
+            TOKIO_RUNTIME.block_on(async { self.inner.append_arrow_batch(rust_batch).await })
+        });
 
-        Ok(())
+        result.map_err(|e| FlussError::new_err(e.to_string()))
     }
 
     /// Write Pandas DataFrame data
@@ -213,69 +198,6 @@ impl AppendWriter {
     pub fn from_core(append: fcore::client::AppendWriter) -> Self {
         Self { inner: append }
     }
-
-    fn convert_python_value_to_datum(
-        &self,
-        py: Python,
-        value: Py<PyAny>,
-    ) -> PyResult<fcore::row::Datum<'static>> {
-        use fcore::row::{Blob, Datum, F32, F64};
-
-        // Check for None (null)
-        if value.is_none(py) {
-            return Ok(Datum::Null);
-        }
-
-        // Try to extract different types
-        if let Ok(type_name) = value.bind(py).get_type().name() {
-            if type_name == "StringScalar" {
-                if let Ok(py_value) = value.call_method0(py, "as_py") {
-                    if let Ok(str_val) = py_value.extract::<String>(py) {
-                        let leaked_str: &'static str = Box::leak(str_val.into_boxed_str());
-                        return Ok(Datum::String(leaked_str));
-                    }
-                }
-            }
-        }
-
-        if let Ok(bool_val) = value.extract::<bool>(py) {
-            return Ok(Datum::Bool(bool_val));
-        }
-
-        if let Ok(int_val) = value.extract::<i32>(py) {
-            return Ok(Datum::Int32(int_val));
-        }
-
-        if let Ok(int_val) = value.extract::<i64>(py) {
-            return Ok(Datum::Int64(int_val));
-        }
-
-        if let Ok(float_val) = value.extract::<f32>(py) {
-            return Ok(Datum::Float32(F32::from(float_val)));
-        }
-
-        if let Ok(float_val) = value.extract::<f64>(py) {
-            return Ok(Datum::Float64(F64::from(float_val)));
-        }
-
-        if let Ok(str_val) = value.extract::<String>(py) {
-            // Convert String to &'static str by leaking memory
-            // This is a simplified approach - in production, you might want better lifetime management
-            let leaked_str: &'static str = Box::leak(str_val.into_boxed_str());
-            return Ok(Datum::String(leaked_str));
-        }
-
-        if let Ok(bytes_val) = value.extract::<Vec<u8>>(py) {
-            let blob = Blob::from(bytes_val);
-            return Ok(Datum::Blob(blob));
-        }
-
-        // If we can't convert, return an error
-        let type_name = value.bind(py).get_type().name()?;
-        Err(FlussError::new_err(format!(
-            "Cannot convert Python value to Datum: {type_name:?}"
-        )))
-    }
 }
 
 /// Scanner for reading log data from a Fluss table

From 0f4f4ec62e4fe209fd8f3ecaca7de044d236eccd Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Sun, 11 Jan 2026 10:51:55 +0800
Subject: [PATCH 058/287] chore: Improve write path error handling logic (#132)

---
 fluss-rust/crates/fluss/build.rs              |   4 +-
 .../crates/fluss/src/client/credentials.rs    |  51 ++
 .../crates/fluss/src/client/metadata.rs       |  44 +-
 .../fluss/src/client/write/accumulator.rs     |  73 ++-
 .../crates/fluss/src/client/write/batch.rs    |  87 +++-
 .../fluss/src/client/write/broadcast.rs       |   4 +
 .../fluss/src/client/write/bucket_assigner.rs |  40 ++
 .../crates/fluss/src/client/write/mod.rs      |  18 +-
 .../crates/fluss/src/client/write/sender.rs   | 441 ++++++++++++++++--
 fluss-rust/crates/fluss/src/lib.rs            |   3 +
 fluss-rust/crates/fluss/src/row/datum.rs      |  66 +++
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |  38 ++
 .../crates/fluss/src/rpc/api_version.rs       |  25 +
 fluss-rust/crates/fluss/src/rpc/convert.rs    |  48 ++
 .../crates/fluss/src/rpc/fluss_api_error.rs   |  35 ++
 .../fluss/src/rpc/message/produce_log.rs      |   6 +-
 fluss-rust/crates/fluss/src/test_utils.rs     |  88 ++++
 17 files changed, 1006 insertions(+), 65 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/test_utils.rs

diff --git a/fluss-rust/crates/fluss/build.rs b/fluss-rust/crates/fluss/build.rs
index a83cd056b5..1564313732 100644
--- a/fluss-rust/crates/fluss/build.rs
+++ b/fluss-rust/crates/fluss/build.rs
@@ -18,6 +18,8 @@
 use std::io::Result;
 
 fn main() -> Result<()> {
-    prost_build::compile_protos(&["src/proto/fluss_api.proto"], &["src/proto"])?;
+    let mut config = prost_build::Config::new();
+    config.bytes([".proto.PbProduceLogReqForBucket.records"]);
+    config.compile_protos(&["src/proto/fluss_api.proto"], &["src/proto"])?;
     Ok(())
 }
diff --git a/fluss-rust/crates/fluss/src/client/credentials.rs b/fluss-rust/crates/fluss/src/client/credentials.rs
index ffb682ed7d..c520b4416d 100644
--- a/fluss-rust/crates/fluss/src/client/credentials.rs
+++ b/fluss-rust/crates/fluss/src/client/credentials.rs
@@ -156,3 +156,54 @@ impl CredentialsCache {
         Ok(props)
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::client::metadata::Metadata;
+    use crate::cluster::Cluster;
+
+    #[test]
+    fn convert_hadoop_key_to_opendal_maps_known_keys() {
+        let (key, invert) = convert_hadoop_key_to_opendal("fs.s3a.endpoint").expect("key");
+        assert_eq!(key, "endpoint");
+        assert!(!invert);
+
+        let (key, invert) = convert_hadoop_key_to_opendal("fs.s3a.path.style.access").expect("key");
+        assert_eq!(key, "enable_virtual_host_style");
+        assert!(invert);
+
+        assert!(convert_hadoop_key_to_opendal("fs.s3a.connection.ssl.enabled").is_none());
+        assert!(convert_hadoop_key_to_opendal("unknown.key").is_none());
+    }
+
+    #[tokio::test]
+    async fn credentials_cache_returns_cached_props() -> Result<()> {
+        let cached = CachedToken {
+            access_key_id: "ak".to_string(),
+            secret_access_key: "sk".to_string(),
+            security_token: Some("token".to_string()),
+            addition_infos: HashMap::from([(
+                "fs.s3a.path.style.access".to_string(),
+                "true".to_string(),
+            )]),
+            cached_at: Instant::now(),
+        };
+
+        let cache = CredentialsCache {
+            inner: RwLock::new(Some(cached)),
+            rpc_client: Arc::new(RpcClient::new()),
+            metadata: Arc::new(Metadata::new_for_test(Arc::new(Cluster::default()))),
+        };
+
+        let props = cache.get_or_refresh().await?;
+        assert_eq!(props.get("access_key_id"), Some(&"ak".to_string()));
+        assert_eq!(props.get("secret_access_key"), Some(&"sk".to_string()));
+        assert_eq!(props.get("security_token"), Some(&"token".to_string()));
+        assert_eq!(
+            props.get("enable_virtual_host_style"),
+            Some(&"false".to_string())
+        );
+        Ok(())
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index a51442254c..0e6f965131 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -135,7 +135,47 @@ impl Metadata {
         guard.clone()
     }
 
-    pub fn leader_for(&self, _table_bucket: &TableBucket) -> Option<&ServerNode> {
-        todo!()
+    pub fn leader_for(&self, table_bucket: &TableBucket) -> Option<ServerNode> {
+        let cluster = self.cluster.read();
+        cluster.leader_for(table_bucket).cloned()
+    }
+}
+
+#[cfg(test)]
+impl Metadata {
+    pub(crate) fn new_for_test(cluster: Arc<Cluster>) -> Self {
+        Metadata {
+            cluster: RwLock::new(cluster),
+            connections: Arc::new(RpcClient::new()),
+            bootstrap: Arc::from(""),
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{TableBucket, TablePath};
+    use crate::test_utils::build_cluster_arc;
+
+    #[test]
+    fn leader_for_returns_server() {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let cluster = build_cluster_arc(&table_path, 1, 1);
+        let metadata = Metadata::new_for_test(cluster);
+        let leader = metadata
+            .leader_for(&TableBucket::new(1, 0))
+            .expect("leader");
+        assert_eq!(leader.id(), 1);
+    }
+
+    #[test]
+    fn invalidate_server_removes_leader() {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let cluster = build_cluster_arc(&table_path, 1, 1);
+        let metadata = Metadata::new_for_test(cluster);
+        metadata.invalidate_server(&1, vec![1]);
+        let cluster = metadata.get_cluster();
+        assert!(cluster.get_tablet_server(1).is_none());
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index beae0caacc..001d0aa7d0 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -250,7 +250,7 @@ impl RecordAccumulator {
         cluster: Arc<Cluster>,
         nodes: &HashSet<ServerNode>,
         max_size: i32,
-    ) -> Result<HashMap<i32, Vec<Arc<ReadyWriteBatch>>>> {
+    ) -> Result<HashMap<i32, Vec<ReadyWriteBatch>>> {
         if nodes.is_empty() {
             return Ok(HashMap::new());
         }
@@ -272,7 +272,7 @@ impl RecordAccumulator {
         cluster: &Cluster,
         node: &ServerNode,
         max_size: i32,
-    ) -> Result<Vec<Arc<ReadyWriteBatch>>> {
+    ) -> Result<Vec<ReadyWriteBatch>> {
         let mut size = 0;
         let buckets = self.get_all_buckets_in_current_node(node, cluster);
         let mut ready = Vec::new();
@@ -324,10 +324,10 @@ impl RecordAccumulator {
 
                         // mark the batch as drained.
                         batch.drained(current_time_ms());
-                        ready.push(Arc::new(ReadyWriteBatch {
+                        ready.push(ReadyWriteBatch {
                             table_bucket,
                             write_batch: batch,
-                        }));
+                        });
                     }
                 }
             }
@@ -342,6 +342,29 @@ impl RecordAccumulator {
         self.incomplete_batches.write().remove(&batch_id);
     }
 
+    pub async fn re_enqueue(&self, ready_write_batch: ReadyWriteBatch) {
+        ready_write_batch.write_batch.re_enqueued();
+        let table_path = ready_write_batch.write_batch.table_path().clone();
+        let bucket_id = ready_write_batch.table_bucket.bucket_id();
+        let table_id = u64::try_from(ready_write_batch.table_bucket.table_id()).unwrap_or(0);
+        let mut binding =
+            self.write_batches
+                .entry(table_path)
+                .or_insert_with(|| BucketAndWriteBatches {
+                    table_id,
+                    is_partitioned_table: false,
+                    partition_id: None,
+                    batches: Default::default(),
+                });
+        let bucket_and_batches = binding.value_mut();
+        let dq = bucket_and_batches
+            .batches
+            .entry(bucket_id)
+            .or_insert_with(|| Mutex::new(VecDeque::new()));
+        let mut dq_guard = dq.lock().await;
+        dq_guard.push_front(ready_write_batch.write_batch);
+    }
+
     fn get_all_buckets_in_current_node(
         &self,
         current: &ServerNode,
@@ -446,3 +469,45 @@ impl ReadyCheckResult {
         }
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::TablePath;
+    use crate::row::{Datum, GenericRow};
+    use crate::test_utils::build_cluster;
+    use std::sync::Arc;
+
+    #[tokio::test]
+    async fn re_enqueue_increments_attempts() -> Result<()> {
+        let config = Config::default();
+        let accumulator = RecordAccumulator::new(config);
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let cluster = Arc::new(build_cluster(table_path.as_ref(), 1, 1));
+        let record = WriteRecord::new(
+            table_path.clone(),
+            GenericRow {
+                values: vec![Datum::Int32(1)],
+            },
+        );
+
+        accumulator.append(&record, 0, &cluster, false).await?;
+
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        let mut batches = accumulator
+            .drain(cluster.clone(), &nodes, 1024 * 1024)
+            .await?;
+        let mut drained = batches.remove(&1).expect("drained batches");
+        let batch = drained.pop().expect("batch");
+        assert_eq!(batch.write_batch.attempts(), 0);
+
+        accumulator.re_enqueue(batch).await;
+
+        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024).await?;
+        let mut drained = batches.remove(&1).expect("drained batches");
+        let batch = drained.pop().expect("batch");
+        assert_eq!(batch.write_batch.attempts(), 1);
+        Ok(())
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index ba04db4ac6..1f54226f39 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -22,7 +22,10 @@ use crate::compression::ArrowCompressionInfo;
 use crate::error::Result;
 use crate::metadata::{DataType, TablePath};
 use crate::record::MemoryLogRecordsArrowBuilder;
+use bytes::Bytes;
+use parking_lot::Mutex;
 use std::cmp::max;
+use std::sync::atomic::{AtomicBool, AtomicI32, Ordering};
 
 #[allow(dead_code)]
 pub struct InnerWriteBatch {
@@ -31,7 +34,8 @@ pub struct InnerWriteBatch {
     create_ms: i64,
     bucket_id: BucketId,
     results: BroadcastOnce<BatchWriteResult>,
-    completed: bool,
+    completed: AtomicBool,
+    attempts: AtomicI32,
     drained_ms: i64,
 }
 
@@ -43,7 +47,8 @@ impl InnerWriteBatch {
             create_ms,
             bucket_id,
             results: Default::default(),
-            completed: Default::default(),
+            completed: AtomicBool::new(false),
+            attempts: AtomicI32::new(0),
             drained_ms: -1,
         }
     }
@@ -53,15 +58,36 @@ impl InnerWriteBatch {
     }
 
     fn complete(&self, write_result: BatchWriteResult) -> bool {
-        if !self.completed {
-            self.results.broadcast(write_result);
+        if self
+            .completed
+            .compare_exchange(false, true, Ordering::AcqRel, Ordering::Acquire)
+            .is_err()
+        {
+            return false;
         }
+        self.results.broadcast(write_result);
         true
     }
 
     fn drained(&mut self, now_ms: i64) {
         self.drained_ms = max(self.drained_ms, now_ms);
     }
+
+    fn table_path(&self) -> &TablePath {
+        &self.table_path
+    }
+
+    fn attempts(&self) -> i32 {
+        self.attempts.load(Ordering::Acquire)
+    }
+
+    fn re_enqueued(&self) {
+        self.attempts.fetch_add(1, Ordering::AcqRel);
+    }
+
+    fn is_done(&self) -> bool {
+        self.completed.load(Ordering::Acquire)
+    }
 }
 
 pub enum WriteBatch {
@@ -112,7 +138,7 @@ impl WriteBatch {
         }
     }
 
-    pub fn build(&self) -> Result<Vec<u8>> {
+    pub fn build(&self) -> Result<Bytes> {
         match self {
             WriteBatch::ArrowLog(batch) => batch.build(),
         }
@@ -125,11 +151,28 @@ impl WriteBatch {
     pub fn batch_id(&self) -> i64 {
         self.inner_batch().batch_id
     }
+
+    pub fn table_path(&self) -> &TablePath {
+        self.inner_batch().table_path()
+    }
+
+    pub fn attempts(&self) -> i32 {
+        self.inner_batch().attempts()
+    }
+
+    pub fn re_enqueued(&self) {
+        self.inner_batch().re_enqueued();
+    }
+
+    pub fn is_done(&self) -> bool {
+        self.inner_batch().is_done()
+    }
 }
 
 pub struct ArrowLogWriteBatch {
     pub write_batch: InnerWriteBatch,
     pub arrow_builder: MemoryLogRecordsArrowBuilder,
+    built_records: Mutex<Option<Bytes>>,
 }
 
 impl ArrowLogWriteBatch {
@@ -153,6 +196,7 @@ impl ArrowLogWriteBatch {
                 to_append_record_batch,
                 arrow_compression_info,
             ),
+            built_records: Mutex::new(None),
         }
     }
 
@@ -174,8 +218,14 @@ impl ArrowLogWriteBatch {
         }
     }
 
-    pub fn build(&self) -> Result<Vec<u8>> {
-        self.arrow_builder.build()
+    pub fn build(&self) -> Result<Bytes> {
+        let mut cached = self.built_records.lock();
+        if let Some(bytes) = cached.as_ref() {
+            return Ok(bytes.clone());
+        }
+        let bytes = Bytes::from(self.arrow_builder.build()?);
+        *cached = Some(bytes.clone());
+        Ok(bytes)
     }
 
     pub fn is_closed(&self) -> bool {
@@ -186,3 +236,26 @@ impl ArrowLogWriteBatch {
         self.arrow_builder.close()
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::TablePath;
+
+    #[test]
+    fn complete_only_once() {
+        let batch =
+            InnerWriteBatch::new(1, TablePath::new("db".to_string(), "tbl".to_string()), 0, 0);
+        assert!(batch.complete(Ok(())));
+        assert!(!batch.complete(Err(crate::client::broadcast::Error::Dropped)));
+    }
+
+    #[test]
+    fn attempts_increment_on_reenqueue() {
+        let batch =
+            InnerWriteBatch::new(1, TablePath::new("db".to_string(), "tbl".to_string()), 0, 0);
+        assert_eq!(batch.attempts(), 0);
+        batch.re_enqueued();
+        assert_eq!(batch.attempts(), 1);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/broadcast.rs b/fluss-rust/crates/fluss/src/client/write/broadcast.rs
index d2e7f0c91c..ec45776599 100644
--- a/fluss-rust/crates/fluss/src/client/write/broadcast.rs
+++ b/fluss-rust/crates/fluss/src/client/write/broadcast.rs
@@ -28,6 +28,10 @@ pub type BatchWriteResult = Result<(), Error>;
 pub enum Error {
     #[error("BroadcastOnce dropped")]
     Dropped,
+    #[error("Write failed: {message} (code {code})")]
+    WriteFailed { code: i32, message: String },
+    #[error("Write failed before request was sent: {message}")]
+    Client { message: String },
 }
 
 #[derive(Debug, Clone)]
diff --git a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
index 44b2673697..2370719efe 100644
--- a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
+++ b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
@@ -146,3 +146,43 @@ impl BucketAssigner for HashBucketAssigner {
         self.bucketing_function.bucketing(key, self.num_buckets)
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::bucketing::BucketingFunction;
+    use crate::cluster::Cluster;
+    use crate::metadata::TablePath;
+    use crate::test_utils::build_cluster;
+
+    #[test]
+    fn sticky_bucket_assigner_picks_available_bucket() {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let cluster = build_cluster(&table_path, 1, 2);
+        let assigner = StickyBucketAssigner::new(table_path);
+        let bucket = assigner.assign_bucket(None, &cluster).expect("bucket");
+        assert!((0..2).contains(&bucket));
+
+        assigner.on_new_batch(&cluster, bucket);
+        let next_bucket = assigner.assign_bucket(None, &cluster).expect("bucket");
+        assert!((0..2).contains(&next_bucket));
+    }
+
+    #[test]
+    fn hash_bucket_assigner_requires_key() {
+        let assigner = HashBucketAssigner::new(3, <dyn BucketingFunction>::of(None));
+        let cluster = Cluster::default();
+        let err = assigner.assign_bucket(None, &cluster).unwrap_err();
+        assert!(matches!(err, crate::error::Error::IllegalArgument { .. }));
+    }
+
+    #[test]
+    fn hash_bucket_assigner_hashes_key() {
+        let assigner = HashBucketAssigner::new(4, <dyn BucketingFunction>::of(None));
+        let cluster = Cluster::default();
+        let bucket = assigner
+            .assign_bucket(Some(b"key"), &cluster)
+            .expect("bucket");
+        assert!((0..4).contains(&bucket));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index cd33586c89..d79418bfc2 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -18,7 +18,7 @@
 mod accumulator;
 mod batch;
 
-use crate::client::broadcast::{BatchWriteResult, BroadcastOnceReceiver};
+use crate::client::broadcast::{self as client_broadcast, BatchWriteResult, BroadcastOnceReceiver};
 use crate::error::Error;
 use crate::metadata::TablePath;
 use crate::row::GenericRow;
@@ -81,10 +81,18 @@ impl ResultHandle {
     }
 
     pub fn result(&self, batch_result: BatchWriteResult) -> Result<(), Error> {
-        // do nothing, just return empty result
-        batch_result.map_err(|e| Error::UnexpectedError {
-            message: format!("Fail to get write result {e:?}"),
-            source: None,
+        batch_result.map_err(|e| match e {
+            client_broadcast::Error::WriteFailed { code, message } => Error::FlussAPIError {
+                api_error: crate::rpc::ApiError { code, message },
+            },
+            client_broadcast::Error::Client { message } => Error::UnexpectedError {
+                message,
+                source: None,
+            },
+            client_broadcast::Error::Dropped => Error::UnexpectedError {
+                message: "Fail to get write result because broadcast was dropped.".to_string(),
+                source: None,
+            },
         })
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index 462a846d6c..cb03a2c462 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -15,15 +15,16 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::client::broadcast;
 use crate::client::metadata::Metadata;
 use crate::client::{ReadyWriteBatch, RecordAccumulator};
-use crate::error::Error;
-use crate::error::Result;
-use crate::metadata::TableBucket;
+use crate::error::{FlussError, Result};
+use crate::metadata::{TableBucket, TablePath};
 use crate::proto::ProduceLogResponse;
 use crate::rpc::message::ProduceLogRequest;
+use log::warn;
 use parking_lot::Mutex;
-use std::collections::HashMap;
+use std::collections::{HashMap, HashSet};
 use std::sync::Arc;
 use std::time::Duration;
 
@@ -32,7 +33,7 @@ pub struct Sender {
     running: bool,
     metadata: Arc<Metadata>,
     accumulator: Arc<RecordAccumulator>,
-    in_flight_batches: Mutex<HashMap<TableBucket, Vec<Arc<ReadyWriteBatch>>>>,
+    in_flight_batches: Mutex<HashMap<TableBucket, Vec<i64>>>,
     max_request_size: i32,
     ack: i16,
     max_request_timeout_ms: i32,
@@ -99,30 +100,30 @@ impl Sender {
 
         if !batches.is_empty() {
             self.add_to_inflight_batches(&batches);
-            self.send_write_requests(&batches).await?;
+            self.send_write_requests(batches).await?;
         }
 
         Ok(())
     }
 
-    fn add_to_inflight_batches(&self, batches: &HashMap<i32, Vec<Arc<ReadyWriteBatch>>>) {
+    fn add_to_inflight_batches(&self, batches: &HashMap<i32, Vec<ReadyWriteBatch>>) {
         let mut in_flight = self.in_flight_batches.lock();
         for batch_list in batches.values() {
             for batch in batch_list {
                 in_flight
                     .entry(batch.table_bucket.clone())
                     .or_default()
-                    .push(batch.clone());
+                    .push(batch.write_batch.batch_id());
             }
         }
     }
 
     async fn send_write_requests(
         &self,
-        collated: &HashMap<i32, Vec<Arc<ReadyWriteBatch>>>,
+        collated: HashMap<i32, Vec<ReadyWriteBatch>>,
     ) -> Result<()> {
         for (leader_id, batches) in collated {
-            self.send_write_request(*leader_id, self.ack, batches)
+            self.send_write_request(leader_id, self.ack, batches)
                 .await?;
         }
         Ok(())
@@ -132,78 +133,434 @@ impl Sender {
         &self,
         destination: i32,
         acks: i16,
-        batches: &Vec<Arc<ReadyWriteBatch>>,
+        batches: Vec<ReadyWriteBatch>,
     ) -> Result<()> {
         if batches.is_empty() {
             return Ok(());
         }
         let mut records_by_bucket = HashMap::new();
-        let mut write_batch_by_table = HashMap::new();
+        let mut write_batch_by_table: HashMap<i64, Vec<TableBucket>> = HashMap::new();
 
         for batch in batches {
-            records_by_bucket.insert(batch.table_bucket.clone(), batch.clone());
+            let table_bucket = batch.table_bucket.clone();
             write_batch_by_table
-                .entry(batch.table_bucket.table_id())
-                .or_insert_with(Vec::new)
-                .push(batch);
+                .entry(table_bucket.table_id())
+                .or_default()
+                .push(table_bucket.clone());
+            records_by_bucket.insert(table_bucket, batch);
         }
 
         let cluster = self.metadata.get_cluster();
 
-        let destination_node =
-            cluster
-                .get_tablet_server(destination)
-                .ok_or(Error::LeaderNotAvailable {
-                    message: format!("destination node not found in metadata cache {destination}."),
-                })?;
-        let connection = self.metadata.get_connection(destination_node).await?;
+        let destination_node = match cluster.get_tablet_server(destination) {
+            Some(node) => node,
+            None => {
+                self.handle_batches_with_error(
+                    records_by_bucket.into_values().collect(),
+                    FlussError::LeaderNotAvailableException,
+                    format!("Destination node not found in metadata cache {destination}."),
+                )
+                .await?;
+                return Ok(());
+            }
+        };
+        let connection = match self.metadata.get_connection(destination_node).await {
+            Ok(connection) => connection,
+            Err(e) => {
+                self.handle_batches_with_error(
+                    records_by_bucket.into_values().collect(),
+                    FlussError::NetworkException,
+                    format!("Failed to connect destination node {destination}: {e}"),
+                )
+                .await?;
+                return Ok(());
+            }
+        };
 
-        for (table_id, write_batches) in write_batch_by_table {
-            let request =
-                ProduceLogRequest::new(table_id, acks, self.max_request_timeout_ms, write_batches)?;
-            let response = connection.request(request).await?;
-            self.handle_produce_response(table_id, &records_by_bucket, response)?
+        for (table_id, table_buckets) in write_batch_by_table {
+            let request_batches: Vec<&ReadyWriteBatch> = table_buckets
+                .iter()
+                .filter_map(|bucket| records_by_bucket.get(bucket))
+                .collect();
+            if request_batches.is_empty() {
+                continue;
+            }
+            let request = match ProduceLogRequest::new(
+                table_id,
+                acks,
+                self.max_request_timeout_ms,
+                request_batches.as_slice(),
+            ) {
+                Ok(request) => request,
+                Err(e) => {
+                    self.handle_batches_with_local_error(
+                        table_buckets
+                            .iter()
+                            .filter_map(|bucket| records_by_bucket.remove(bucket))
+                            .collect(),
+                        format!("Failed to build produce request: {e}"),
+                    )
+                    .await?;
+                    continue;
+                }
+            };
+
+            let response = match connection.request(request).await {
+                Ok(response) => response,
+                Err(e) => {
+                    self.handle_batches_with_error(
+                        table_buckets
+                            .iter()
+                            .filter_map(|bucket| records_by_bucket.remove(bucket))
+                            .collect(),
+                        FlussError::NetworkException,
+                        format!("Failed to send produce request: {e}"),
+                    )
+                    .await?;
+                    continue;
+                }
+            };
+
+            self.handle_produce_response(
+                table_id,
+                &table_buckets,
+                &mut records_by_bucket,
+                response,
+            )
+            .await?;
         }
 
         Ok(())
     }
 
-    fn handle_produce_response(
+    async fn handle_produce_response(
         &self,
         table_id: i64,
-        records_by_bucket: &HashMap<TableBucket, Arc<ReadyWriteBatch>>,
+        request_buckets: &[TableBucket],
+        records_by_bucket: &mut HashMap<TableBucket, ReadyWriteBatch>,
         response: ProduceLogResponse,
     ) -> Result<()> {
+        let mut invalid_metadata_tables: HashSet<TablePath> = HashSet::new();
+        let mut pending_buckets: HashSet<TableBucket> = request_buckets.iter().cloned().collect();
         for produce_log_response_for_bucket in response.buckets_resp.iter() {
             let tb = TableBucket::new(table_id, produce_log_response_for_bucket.bucket_id);
 
-            let ready_batch = records_by_bucket.get(&tb).unwrap();
+            let Some(ready_batch) = records_by_bucket.remove(&tb) else {
+                panic!("Missing ready batch for table bucket {tb}");
+            };
+            pending_buckets.remove(&tb);
+
             if let Some(error_code) = produce_log_response_for_bucket.error_code {
-                todo!("handle_produce_response error: {}", error_code)
+                if error_code == FlussError::None.code() {
+                    self.complete_batch(ready_batch);
+                    continue;
+                }
+
+                let error = FlussError::for_code(error_code);
+                let message = produce_log_response_for_bucket
+                    .error_message
+                    .clone()
+                    .unwrap_or_else(|| error.message().to_string());
+                if let Some(table_path) = self
+                    .handle_write_batch_error(ready_batch, error, message)
+                    .await?
+                {
+                    invalid_metadata_tables.insert(table_path);
+                }
             } else {
                 self.complete_batch(ready_batch)
             }
         }
+        if !pending_buckets.is_empty() {
+            for bucket in pending_buckets {
+                if let Some(ready_batch) = records_by_bucket.remove(&bucket) {
+                    let message =
+                        format!("Missing response for table bucket {bucket} in produce response.");
+                    let error = FlussError::UnknownServerError;
+                    if let Some(table_path) = self
+                        .handle_write_batch_error(ready_batch, error, message)
+                        .await?
+                    {
+                        invalid_metadata_tables.insert(table_path);
+                    }
+                }
+            }
+        }
+        self.update_metadata_if_needed(invalid_metadata_tables)
+            .await;
         Ok(())
     }
 
-    fn complete_batch(&self, ready_write_batch: &Arc<ReadyWriteBatch>) {
-        if ready_write_batch.write_batch.complete(Ok(())) {
-            // remove from in flight batches
-            let mut in_flight_guard = self.in_flight_batches.lock();
-            if let Some(in_flight) = in_flight_guard.get_mut(&ready_write_batch.table_bucket) {
-                in_flight.retain(|b| !Arc::ptr_eq(b, ready_write_batch));
-                if in_flight.is_empty() {
-                    in_flight_guard.remove(&ready_write_batch.table_bucket);
-                }
-            }
+    fn complete_batch(&self, ready_write_batch: ReadyWriteBatch) {
+        self.finish_batch(ready_write_batch, Ok(())); // success path: finish with `Ok(())`
+    }
+
+    fn fail_batch(&self, ready_write_batch: ReadyWriteBatch, error: broadcast::Error) {
+        self.finish_batch(ready_write_batch, Err(error)); // failure path: finish with the error
+    }
+
+    fn finish_batch(&self, ready_write_batch: ReadyWriteBatch, result: broadcast::Result<()>) {
+        if ready_write_batch.write_batch.complete(result) { // bookkeeping only if this is true
+            self.remove_from_inflight_batches(&ready_write_batch);
             // remove from incomplete batches
             self.accumulator
                 .remove_incomplete_batches(ready_write_batch.write_batch.batch_id())
         }
     }
 
+    async fn handle_batches_with_error(
+        &self,
+        batches: Vec<ReadyWriteBatch>,
+        error: FlussError,
+        message: String,
+    ) -> Result<()> {
+        let mut invalid_metadata_tables: HashSet<TablePath> = HashSet::new();
+        for batch in batches {
+            if let Some(table_path) = self
+                .handle_write_batch_error(batch, error, message.clone())
+                .await?
+            {
+                invalid_metadata_tables.insert(table_path);
+            }
+        }
+        self.update_metadata_if_needed(invalid_metadata_tables)
+            .await;
+        Ok(())
+    }
+
+    async fn handle_batches_with_local_error(
+        &self,
+        batches: Vec<ReadyWriteBatch>,
+        message: String,
+    ) -> Result<()> {
+        for batch in batches {
+            self.fail_batch(
+                batch,
+                broadcast::Error::Client {
+                    message: message.clone(),
+                },
+            );
+        }
+        Ok(())
+    }
+
+    /// Settles one failed batch: re-enqueue it when `can_retry` allows, complete it
+    /// on `DuplicateSequenceException`, otherwise fail it with `WriteFailed`.
+    /// Returns the table path when `is_invalid_metadata_error(error)` holds,
+    /// except after a duplicate sequence, which always returns `None`.
+    async fn handle_write_batch_error(
+        &self,
+        ready_write_batch: ReadyWriteBatch,
+        error: FlussError,
+        message: String,
+    ) -> Result<Option<TablePath>> {
+        let table_path = ready_write_batch.write_batch.table_path().clone();
+        if self.can_retry(&ready_write_batch, error) {
+            warn!(
+                "Retrying write batch for {table_path} on bucket {} after error {error:?}: {message}",
+                ready_write_batch.table_bucket.bucket_id()
+            );
+            self.re_enqueue_batch(ready_write_batch).await;
+        } else if error == FlussError::DuplicateSequenceException {
+            warn!(
+                "Duplicate sequence for {table_path} on bucket {}: {message}",
+                ready_write_batch.table_bucket.bucket_id()
+            );
+            self.complete_batch(ready_write_batch);
+            return Ok(None);
+        } else {
+            let failure = broadcast::Error::WriteFailed {
+                code: error.code(),
+                message,
+            };
+            self.fail_batch(ready_write_batch, failure);
+        }
+        // Reached after a re-enqueue or a failure, never after a duplicate.
+        Ok(Self::is_invalid_metadata_error(error).then_some(table_path))
+    }
+
+    async fn re_enqueue_batch(&self, ready_write_batch: ReadyWriteBatch) {
+        self.remove_from_inflight_batches(&ready_write_batch); // borrow first; the move is below
+        self.accumulator.re_enqueue(ready_write_batch).await; // ownership goes to the accumulator
+    }
+
+    /// Forgets the batch's id for its bucket; drops the bucket entry once empty.
+    fn remove_from_inflight_batches(&self, ready_write_batch: &ReadyWriteBatch) {
+        let finished_id = ready_write_batch.write_batch.batch_id();
+        let mut guard = self.in_flight_batches.lock();
+        let Some(ids) = guard.get_mut(&ready_write_batch.table_bucket) else { return };
+        ids.retain(|id| *id != finished_id);
+        if ids.is_empty() {
+            guard.remove(&ready_write_batch.table_bucket);
+        }
+    }
+
+    fn can_retry(&self, ready_write_batch: &ReadyWriteBatch, error: FlussError) -> bool {
+        ready_write_batch.write_batch.attempts() < self.retries
+            && !ready_write_batch.write_batch.is_done()
+            && Self::is_retriable_error(error)
+    }
+
+    /// Refreshes metadata for `table_paths`; a failed refresh is only logged.
+    async fn update_metadata_if_needed(&self, table_paths: HashSet<TablePath>) {
+        if !table_paths.is_empty() {
+            let wanted: HashSet<&TablePath> = table_paths.iter().collect();
+            if let Err(e) = self.metadata.update_tables_metadata(&wanted).await {
+                warn!("Failed to update metadata after write error: {e:?}");
+            }
+        }
+    }
+
+    fn is_invalid_metadata_error(error: FlussError) -> bool {
+        matches!(
+            error,
+            FlussError::NotLeaderOrFollower
+                | FlussError::UnknownTableOrBucketException
+                | FlussError::LeaderNotAvailableException
+                | FlussError::NetworkException
+        )
+    }
+
+    fn is_retriable_error(error: FlussError) -> bool {
+        matches!(
+            error,
+            FlussError::NetworkException
+                | FlussError::NotLeaderOrFollower
+                | FlussError::UnknownTableOrBucketException
+                | FlussError::LeaderNotAvailableException
+                | FlussError::LogStorageException
+                | FlussError::KvStorageException
+                | FlussError::StorageException
+                | FlussError::RequestTimeOut
+                | FlussError::NotEnoughReplicasAfterAppendException
+                | FlussError::NotEnoughReplicasException
+                | FlussError::CorruptMessage
+                | FlussError::CorruptRecordException
+        )
+    }
+
     pub async fn close(&mut self) {
         self.running = false;
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::client::WriteRecord;
+    use crate::cluster::Cluster;
+    use crate::config::Config;
+    use crate::metadata::TablePath;
+    use crate::proto::{PbProduceLogRespForBucket, ProduceLogResponse};
+    use crate::row::{Datum, GenericRow};
+    use crate::rpc::FlussError;
+    use crate::test_utils::build_cluster_arc;
+    use std::collections::HashSet;
+
+    async fn build_ready_batch(
+        accumulator: &RecordAccumulator,
+        cluster: Arc<Cluster>,
+        table_path: Arc<TablePath>,
+    ) -> Result<(ReadyWriteBatch, crate::client::ResultHandle)> {
+        let record = WriteRecord::new(
+            table_path,
+            GenericRow {
+                values: vec![Datum::Int32(1)],
+            },
+        );
+        let result = accumulator.append(&record, 0, &cluster, false).await?;
+        let result_handle = result.result_handle.expect("result handle");
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024).await?;
+        let mut drained = batches.remove(&1).expect("drained batches");
+        let batch = drained.pop().expect("batch");
+        Ok((batch, result_handle)) // the drained batch plus the handle returned by `append`
+    }
+
+    #[tokio::test]
+    async fn handle_write_batch_error_retries() -> Result<()> {
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
+        let accumulator = Arc::new(RecordAccumulator::new(Config::default()));
+        let sender = Sender::new(metadata, accumulator.clone(), 1024 * 1024, 1000, 1, 1);
+        // Drain one batch and register it as in flight under key 1.
+        let (batch, _handle) =
+            build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path.clone()).await?;
+        let mut inflight = HashMap::new();
+        inflight.insert(1, vec![batch]);
+        sender.add_to_inflight_batches(&inflight);
+        let batch = inflight.remove(&1).unwrap().pop().unwrap();
+        // `RequestTimeOut` is retriable; presumably the last `Sender::new` arg (1) is `retries`.
+        sender
+            .handle_write_batch_error(batch, FlussError::RequestTimeOut, "timeout".to_string())
+            .await?;
+        // The batch can be drained again and now reports one attempt.
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024).await?;
+        let mut drained = batches.remove(&1).expect("drained batches");
+        let batch = drained.pop().expect("batch");
+        assert_eq!(batch.write_batch.attempts(), 1);
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn handle_write_batch_error_fails() -> Result<()> {
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
+        let accumulator = Arc::new(RecordAccumulator::new(Config::default()));
+        let sender = Sender::new(metadata, accumulator.clone(), 1024 * 1024, 1000, 1, 0);
+        // `InvalidTableException` is not listed in `is_retriable_error`, so the batch must fail.
+        let (batch, handle) =
+            build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path).await?;
+        sender
+            .handle_write_batch_error(
+                batch,
+                FlussError::InvalidTableException,
+                "invalid".to_string(),
+            )
+            .await?;
+        // The handle resolves to `WriteFailed` carrying the same error code.
+        let batch_result = handle.wait().await?;
+        assert!(matches!(
+            batch_result,
+            Err(broadcast::Error::WriteFailed { code, .. })
+                if code == FlussError::InvalidTableException.code()
+        ));
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn handle_produce_response_duplicate_sequence_completes() -> Result<()> {
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
+        let accumulator = Arc::new(RecordAccumulator::new(Config::default()));
+        let sender = Sender::new(metadata, accumulator.clone(), 1024 * 1024, 1000, 1, 0);
+        // Key the drained batch by its bucket for `handle_produce_response`.
+        let (batch, handle) = build_ready_batch(accumulator.as_ref(), cluster, table_path).await?;
+        let request_buckets = vec![batch.table_bucket.clone()];
+        let mut records_by_bucket = HashMap::new();
+        records_by_bucket.insert(batch.table_bucket.clone(), batch);
+        // The response reports a duplicate sequence for bucket 0.
+        let response = ProduceLogResponse {
+            buckets_resp: vec![PbProduceLogRespForBucket {
+                bucket_id: 0,
+                error_code: Some(FlussError::DuplicateSequenceException.code()),
+                error_message: Some("dup".to_string()),
+                ..Default::default()
+            }],
+        };
+        // NOTE(review): the first argument (1) is presumably the table id — confirm.
+        sender
+            .handle_produce_response(1, &request_buckets, &mut records_by_bucket, response)
+            .await?;
+        // A duplicate sequence completes the batch with `Ok(())` instead of failing it.
+        let batch_result = handle.wait().await?;
+        assert!(matches!(batch_result, Ok(())));
+        Ok(())
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index 1bd72a4aac..e8d822fb77 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -31,6 +31,9 @@ mod compression;
 pub mod io;
 mod util;
 
+#[cfg(test)]
+mod test_utils;
+
 pub type TableId = u64;
 pub type PartitionId = u64;
 pub type BucketId = i32;
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 78872a9dd4..c054e08aeb 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -448,3 +448,69 @@ impl Date {
         date.day()
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use arrow::array::{Array, Int32Builder, StringBuilder};
+
+    #[test]
+    fn datum_accessors_and_conversions() {
+        let datum = Datum::String("value");
+        assert_eq!(datum.as_str(), "value");
+        assert!(!datum.is_null());
+        // A blob datum exposes its bytes through `as_blob`.
+        let blob = Blob::from(vec![1, 2, 3]);
+        let datum = Datum::Blob(blob);
+        assert_eq!(datum.as_blob(), &[1, 2, 3]);
+        // `Datum::Null` reports `is_null()`.
+        assert!(Datum::Null.is_null());
+        // An `Int32` datum converts to `i32` through `TryInto`, but not to `i16`.
+        let datum = Datum::Int32(42);
+        let value: i32 = (&datum).try_into().unwrap();
+        assert_eq!(value, 42);
+        let value: std::result::Result<i16, _> = (&datum).try_into();
+        assert!(value.is_err());
+    }
+
+    #[test]
+    fn datum_append_to_builder() {
+        let mut builder = Int32Builder::new();
+        Datum::Null.append_to(&mut builder).unwrap();
+        Datum::Int32(5).append_to(&mut builder).unwrap();
+        let array = builder.finish();
+        assert!(array.is_null(0));
+        assert_eq!(array.value(1), 5);
+        // Appending an `Int32` datum to a `StringBuilder` is rejected.
+        let mut builder = StringBuilder::new();
+        let err = Datum::Int32(1).append_to(&mut builder).unwrap_err();
+        assert!(matches!(err, crate::error::Error::RowConvertError { .. }));
+        // Appending a `Date` datum to an `Int32Builder` is rejected as well.
+        let mut builder = Int32Builder::new();
+        let err = Datum::Date(Date::new(0))
+            .append_to(&mut builder)
+            .unwrap_err();
+        assert!(matches!(err, crate::error::Error::RowConvertError { .. }));
+    }
+
+    #[test]
+    #[should_panic]
+    fn datum_as_str_panics_on_non_string() {
+        let _ = Datum::Int32(1).as_str();
+    }
+
+    #[test]
+    #[should_panic]
+    fn datum_as_blob_panics_on_non_blob() {
+        let _ = Datum::Int16(1).as_blob();
+    }
+
+    #[test]
+    fn date_components() {
+        let date = Date::new(0);
+        assert_eq!(date.get_inner(), 0);
+        assert_eq!(date.year(), 1970);
+        assert_eq!(date.month(), 1);
+        assert_eq!(date.day(), 1);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index b11647f960..c51539642b 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -85,3 +85,41 @@ impl From<ApiKey> for i16 {
         }
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn api_key_round_trip() {
+        let cases = [
+            (1001, ApiKey::CreateDatabase),
+            (1002, ApiKey::DropDatabase),
+            (1003, ApiKey::ListDatabases),
+            (1004, ApiKey::DatabaseExists),
+            (1005, ApiKey::CreateTable),
+            (1006, ApiKey::DropTable),
+            (1007, ApiKey::GetTable),
+            (1008, ApiKey::ListTables),
+            (1010, ApiKey::TableExists),
+            (1012, ApiKey::MetaData),
+            (1014, ApiKey::ProduceLog),
+            (1015, ApiKey::FetchLog),
+            (1021, ApiKey::ListOffsets),
+            (1025, ApiKey::GetFileSystemSecurityToken),
+            (1032, ApiKey::GetLatestLakeSnapshot),
+            (1035, ApiKey::GetDatabaseInfo),
+        ];
+        // Each raw code maps to its key, and the key maps back to the same code.
+        for (raw, key) in cases {
+            assert_eq!(ApiKey::from(raw), key);
+            let mapped: i16 = key.into();
+            assert_eq!(mapped, raw);
+        }
+        // A code outside the table above is carried in `ApiKey::Unknown`.
+        let unknown = ApiKey::from(9999);
+        assert_eq!(unknown, ApiKey::Unknown(9999));
+        let mapped: i16 = unknown.into();
+        assert_eq!(mapped, 9999);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/api_version.rs b/fluss-rust/crates/fluss/src/rpc/api_version.rs
index 395c45cd0f..f009d6914f 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_version.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_version.rs
@@ -52,3 +52,28 @@ impl std::fmt::Display for ApiVersionRange {
         write!(f, "{}:{}", self.min, self.max)
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn api_version_display() {
+        // `Display` prints the wrapped number on its own.
+        assert_eq!(ApiVersion(3).to_string(), "3");
+    }
+
+    #[test]
+    fn api_version_range_accessors() {
+        let bounds = ApiVersionRange::new(ApiVersion(1), ApiVersion(4));
+        // Both accessors give back what `new` received; `Display` is "min:max".
+        assert_eq!((bounds.min(), bounds.max()), (ApiVersion(1), ApiVersion(4)));
+        assert_eq!(bounds.to_string(), "1:4");
+    }
+
+    #[test]
+    #[should_panic]
+    fn api_version_range_panics_on_invalid_bounds() {
+        let _inverted = ApiVersionRange::new(ApiVersion(4), ApiVersion(1));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/convert.rs b/fluss-rust/crates/fluss/src/rpc/convert.rs
index 6feb7eb8af..1862589bc5 100644
--- a/fluss-rust/crates/fluss/src/rpc/convert.rs
+++ b/fluss-rust/crates/fluss/src/rpc/convert.rs
@@ -41,3 +41,51 @@ pub fn from_pb_table_path(pb_table_path: &PbTablePath) -> TablePath {
         pb_table_path.table_name.to_string(),
     )
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::proto::{PbServerNode, PbTablePath};
+
+    #[test]
+    fn table_path_round_trip() {
+        let table_path = TablePath::new("db".to_string(), "table".to_string());
+        let pb = to_table_path(&table_path);
+        assert_eq!(pb.database_name, "db");
+        assert_eq!(pb.table_name, "table");
+        // Converting back yields a path equal to the original.
+        let restored = from_pb_table_path(&pb);
+        assert_eq!(restored, table_path);
+        // A hand-built `PbTablePath` converts field by field.
+        let manual = PbTablePath {
+            database_name: "db2".to_string(),
+            table_name: "table2".to_string(),
+        };
+        let restored = from_pb_table_path(&manual);
+        assert_eq!(restored.database(), "db2");
+        assert_eq!(restored.table(), "table2");
+    }
+
+    #[test]
+    fn server_node_from_pb() {
+        let pb = PbServerNode {
+            node_id: 7,
+            host: "127.0.0.1".to_string(),
+            port: 9092,
+            listeners: None,
+        };
+        let node = from_pb_server_node(pb, ServerType::TabletServer);
+        assert_eq!(node.id(), 7);
+        assert_eq!(node.url(), "127.0.0.1:9092");
+        assert_eq!(node.uid(), "ts-7");
+        // With `ServerType::CoordinatorServer` the uid prefix is "cs-" rather than "ts-".
+        let pb = PbServerNode {
+            node_id: 3,
+            host: "localhost".to_string(),
+            port: 8123,
+            listeners: None,
+        };
+        let node = from_pb_server_node(pb, ServerType::CoordinatorServer);
+        assert_eq!(node.uid(), "cs-3");
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs b/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
index b26eb72f61..a501b9974e 100644
--- a/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
+++ b/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
@@ -369,3 +369,38 @@ impl From<ApiError> for FlussError {
         FlussError::for_code(api_error.code)
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn for_code_maps_known_and_unknown() {
+        // Code 0 is `None`; a code with no mapping becomes `UnknownServerError`.
+        assert_eq!(FlussError::for_code(0), FlussError::None);
+        assert_eq!(FlussError::for_code(9999), FlussError::UnknownServerError);
+        // A known variant survives the trip through its own code.
+        let known = FlussError::AuthorizationException;
+        assert_eq!(FlussError::for_code(known.code()), known);
+    }
+
+    #[test]
+    fn to_api_error_uses_message() {
+        let api_error = FlussError::InvalidTableException.to_api_error(None);
+        assert!(api_error.message.contains("invalid table"));
+        assert_eq!(api_error.code, FlussError::InvalidTableException.code());
+    }
+
+    #[test]
+    fn error_response_conversion_round_trip() {
+        let not_exist = FlussError::TableNotExist;
+        let api_error = ApiError::from(ErrorResponse {
+            error_code: not_exist.code(),
+            error_message: Some("missing".to_string()),
+        });
+        // `ErrorResponse` -> `ApiError` keeps code and message; `ApiError` -> `FlussError` keeps the code.
+        assert_eq!(api_error.code, not_exist.code());
+        assert_eq!(api_error.message, "missing");
+        assert_eq!(FlussError::from(api_error), not_exist);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
index 39bfb3f205..eb725751c7 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
@@ -19,14 +19,12 @@ use crate::error::Result as FlussResult;
 use crate::proto::{PbProduceLogReqForBucket, ProduceLogResponse};
 use crate::rpc::frame::ReadError;
 
+use crate::client::ReadyWriteBatch;
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 use crate::{impl_read_version_type, impl_write_version_type, proto};
-use std::sync::Arc;
-
-use crate::client::ReadyWriteBatch;
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -39,7 +37,7 @@ impl ProduceLogRequest {
         table_id: i64,
         ack: i16,
         max_request_timeout_ms: i32,
-        ready_batches: Vec<&Arc<ReadyWriteBatch>>,
+        ready_batches: &[&ReadyWriteBatch],
     ) -> FlussResult<Self> {
         let mut request = proto::ProduceLogRequest {
             table_id,
diff --git a/fluss-rust/crates/fluss/src/test_utils.rs b/fluss-rust/crates/fluss/src/test_utils.rs
new file mode 100644
index 0000000000..d1cd3ec712
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/test_utils.rs
@@ -0,0 +1,88 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::cluster::{BucketLocation, Cluster, ServerNode, ServerType};
+use crate::metadata::{
+    DataField, DataTypes, Schema, TableBucket, TableDescriptor, TableInfo, TablePath,
+};
+use std::collections::HashMap;
+use std::sync::Arc;
+
+/// Test fixture: `TableInfo` with a one-field row type (`id`, `DataTypes::int()`).
+pub(crate) fn build_table_info(table_path: TablePath, table_id: i64, buckets: i32) -> TableInfo {
+    let id_field = DataField::new("id".to_string(), DataTypes::int(), None);
+    let row_type = DataTypes::row(vec![id_field]);
+    let schema = Schema::builder()
+        .with_row_type(&row_type)
+        .build()
+        .expect("schema build");
+    let descriptor = TableDescriptor::builder()
+        .schema(schema)
+        .distributed_by(Some(buckets), vec![])
+        .build()
+        .expect("descriptor build");
+    TableInfo::of(table_path, table_id, 1, descriptor, 0, 0)
+}
+
+/// Test fixture: a `Cluster` holding one tablet server (id 1, 127.0.0.1:9092)
+/// and one table with buckets `0..buckets`.
+///
+/// Every `BucketLocation` is built with `Some(server)`; `table_id` is used for
+/// the buckets, the id map and the table info. The first `Cluster::new`
+/// argument is passed as `None`.
+pub(crate) fn build_cluster(table_path: &TablePath, table_id: i64, buckets: i32) -> Cluster {
+    // The only server, registered under its own id.
+    let node = ServerNode::new(1, "127.0.0.1".to_string(), 9092, ServerType::TabletServer);
+    let servers = HashMap::from([(node.id(), node.clone())]);
+
+    // One `BucketLocation` per bucket, stored both in the per-table list and
+    // in the per-bucket map.
+    let mut bucket_locations = Vec::new();
+    let mut locations_by_bucket = HashMap::new();
+    for bucket_id in 0..buckets {
+        let table_bucket = TableBucket::new(table_id, bucket_id);
+        let location = BucketLocation::new(
+            table_bucket.clone(),
+            Some(node.clone()),
+            table_path.clone(),
+        );
+        bucket_locations.push(location.clone());
+        locations_by_bucket.insert(table_bucket, location);
+    }
+
+    // The remaining maps each hold a single entry keyed by `table_path`.
+    let locations_by_path = HashMap::from([(table_path.clone(), bucket_locations)]);
+    let table_id_by_path = HashMap::from([(table_path.clone(), table_id)]);
+    let table_info = build_table_info(table_path.clone(), table_id, buckets);
+    let table_info_by_path = HashMap::from([(table_path.clone(), table_info)]);
+
+    Cluster::new(
+        None,
+        servers,
+        locations_by_path,
+        locations_by_bucket,
+        table_id_by_path,
+        table_info_by_path,
+    )
+}
+
+pub(crate) fn build_cluster_arc(
+    table_path: &TablePath,
+    table_id: i64,
+    buckets: i32,
+) -> Arc<Cluster> {
+    build_cluster(table_path, table_id, buckets).into() // `build_cluster` result wrapped in `Arc`
+}

From 69b3ccc3d0d8d1bf5cd8c3fc6aac2f2e6bbf8349 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sun, 11 Jan 2026 03:16:49 +0000
Subject: [PATCH 059/287] chore: improve datum, use Cow to reduce verbosity and
 avoid Box::leak gymnastics (#139)

---
 fluss-rust/bindings/cpp/src/types.rs          |  6 +-
 .../fluss/src/row/binary/binary_writer.rs     |  9 +-
 .../src/row/compacted/compacted_row_reader.rs |  7 +-
 fluss-rust/crates/fluss/src/row/datum.rs      | 95 ++++---------------
 .../crates/fluss/src/row/field_getter.rs      |  2 +-
 5 files changed, 32 insertions(+), 87 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index d95da14212..fef73ceaf0 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -25,6 +25,7 @@ use arrow::array::{
 use arrow::datatypes::{DataType as ArrowDataType, TimeUnit};
 use fcore::row::InternalRow;
 use fluss as fcore;
+use std::borrow::Cow;
 
 pub const DATA_TYPE_BOOLEAN: i32 = 1;
 pub const DATA_TYPE_TINYINT: i32 = 2;
@@ -218,9 +219,8 @@ pub fn ffi_row_to_core(row: &ffi::FfiGenericRow) -> fcore::row::GenericRow<'_> {
             DATUM_TYPE_INT64 => Datum::Int64(field.i64_val),
             DATUM_TYPE_FLOAT32 => Datum::Float32(field.f32_val.into()),
             DATUM_TYPE_FLOAT64 => Datum::Float64(field.f64_val.into()),
-            DATUM_TYPE_STRING => Datum::String(field.string_val.as_str()),
-            // todo: avoid copy bytes for blob
-            DATUM_TYPE_BYTES => Datum::Blob(field.bytes_val.clone().into()),
+            DATUM_TYPE_STRING => Datum::String(Cow::Borrowed(field.string_val.as_str())),
+            DATUM_TYPE_BYTES => Datum::Blob(Cow::Borrowed(field.bytes_val.as_slice())),
             _ => Datum::Null,
         };
         generic_row.set_field(idx, datum);
diff --git a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
index 44f10b6309..9917c7b76a 100644
--- a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
@@ -170,17 +170,12 @@ impl InnerValueWriter {
                 writer.write_boolean(*v);
             }
             (InnerValueWriter::Binary, Datum::Blob(v)) => {
-                writer.write_binary(v.as_ref(), v.len());
-            }
-            (InnerValueWriter::Binary, Datum::BorrowedBlob(v)) => {
-                writer.write_binary(v.as_ref(), v.len());
+                let b = v.as_ref();
+                writer.write_binary(b, b.len());
             }
             (InnerValueWriter::Bytes, Datum::Blob(v)) => {
                 writer.write_bytes(v.as_ref());
             }
-            (InnerValueWriter::Bytes, Datum::BorrowedBlob(v)) => {
-                writer.write_bytes(v.as_ref());
-            }
             (InnerValueWriter::TinyInt, Datum::Int8(v)) => {
                 writer.write_byte(*v as u8);
             }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index 19afe887d4..00d94ad675 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 use bytes::Bytes;
+use std::borrow::Cow;
 
 use crate::{
     metadata::DataType,
@@ -52,10 +53,12 @@ impl CompactedRowDeserializer {
                 DataType::Float(_) => Datum::Float32(reader.read_float().into()),
                 DataType::Double(_) => Datum::Float64(reader.read_double().into()),
                 // TODO: use read_char(length) in the future, but need to keep compatibility
-                DataType::Char(_) | DataType::String(_) => Datum::OwnedString(reader.read_string()),
+                DataType::Char(_) | DataType::String(_) => {
+                    Datum::String(Cow::Owned(reader.read_string()))
+                }
                 // TODO: use read_binary(length) in the future, but need to keep compatibility
                 DataType::Bytes(_) | DataType::Binary(_) => {
-                    Datum::Blob(reader.read_bytes().into_vec().into())
+                    Datum::Blob(Cow::Owned(reader.read_bytes().into_vec()))
                 }
                 _ => panic!("unsupported DataType in CompactedRowDeserializer"),
             };
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index c054e08aeb..fa85ded4b8 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -24,11 +24,9 @@ use arrow::array::{
 use jiff::ToSpan;
 use ordered_float::OrderedFloat;
 use parse_display::Display;
-use ref_cast::RefCast;
 use rust_decimal::Decimal;
-use serde::{Deserialize, Serialize};
-use std::fmt;
-use std::ops::Deref;
+use serde::Serialize;
+use std::borrow::Cow;
 
 #[allow(dead_code)]
 const THIRTY_YEARS_MICROSECONDS: i64 = 946_684_800_000_000;
@@ -52,14 +50,9 @@ pub enum Datum<'a> {
     #[display("{0}")]
     Float64(F64),
     #[display("'{0}'")]
-    String(&'a str),
-    /// Owned string
-    #[display("'{0}'")]
-    OwnedString(String),
-    #[display("{0}")]
-    Blob(Blob),
+    String(Str<'a>),
     #[display("{:?}")]
-    BorrowedBlob(&'a [u8]),
+    Blob(Blob<'a>),
     #[display("{0}")]
     Decimal(Decimal),
     #[display("{0}")]
@@ -78,7 +71,6 @@ impl Datum<'_> {
     pub fn as_str(&self) -> &str {
         match self {
             Self::String(s) => s,
-            Self::OwnedString(s) => s.as_str(),
             _ => panic!("not a string: {self:?}"),
         }
     }
@@ -86,7 +78,6 @@ impl Datum<'_> {
     pub fn as_blob(&self) -> &[u8] {
         match self {
             Self::Blob(blob) => blob.as_ref(),
-            Self::BorrowedBlob(blob) => blob,
             _ => panic!("not a blob: {self:?}"),
         }
     }
@@ -121,10 +112,19 @@ impl<'a> From<i16> for Datum<'a> {
     }
 }
 
+pub type Str<'a> = Cow<'a, str>;
+
+impl<'a> From<String> for Datum<'a> {
+    #[inline]
+    fn from(s: String) -> Self {
+        Self::String(Str::Owned(s)) // takes ownership of `s`; nothing is borrowed
+    }
+}
+
 impl<'a> From<&'a str> for Datum<'a> {
     #[inline]
     fn from(s: &'a str) -> Datum<'a> {
-        Datum::String(s)
+        Datum::String(Cow::Borrowed(s))
     }
 }
 
@@ -226,8 +226,7 @@ impl<'b, 'a: 'b> TryFrom<&'b Datum<'a>> for &'b str {
     #[inline]
     fn try_from(from: &'b Datum<'a>) -> std::result::Result<Self, Self::Error> {
         match from {
-            Datum::String(i) => Ok(*i),
-            Datum::OwnedString(s) => Ok(s.as_str()),
+            Datum::String(s) => Ok(s.as_ref()),
             _ => Err(()),
         }
     }
@@ -295,10 +294,8 @@ impl Datum<'_> {
             Datum::Int64(v) => append_value_to_arrow!(Int64Builder, *v),
             Datum::Float32(v) => append_value_to_arrow!(Float32Builder, v.into_inner()),
             Datum::Float64(v) => append_value_to_arrow!(Float64Builder, v.into_inner()),
-            Datum::String(v) => append_value_to_arrow!(StringBuilder, *v),
-            Datum::OwnedString(v) => append_value_to_arrow!(StringBuilder, v.as_str()),
+            Datum::String(v) => append_value_to_arrow!(StringBuilder, v.as_ref()),
             Datum::Blob(v) => append_value_to_arrow!(BinaryBuilder, v.as_ref()),
-            Datum::BorrowedBlob(v) => append_value_to_arrow!(BinaryBuilder, *v),
             Datum::Decimal(_) | Datum::Date(_) | Datum::Timestamp(_) | Datum::TimestampTz(_) => {
                 return Err(RowConvertError {
                     message: format!(
@@ -349,58 +346,6 @@ impl_to_arrow!(&str, StringBuilder);
 
 pub type F32 = OrderedFloat<f32>;
 pub type F64 = OrderedFloat<f64>;
-#[allow(dead_code)]
-pub type Str = Box<str>;
-
-#[derive(PartialEq, Eq, PartialOrd, Ord, Hash, Clone, Serialize, Deserialize, Default)]
-pub struct Blob(Box<[u8]>);
-
-impl Deref for Blob {
-    type Target = BlobRef;
-
-    fn deref(&self) -> &Self::Target {
-        BlobRef::new(&self.0)
-    }
-}
-
-impl BlobRef {
-    pub fn new(bytes: &[u8]) -> &Self {
-        // SAFETY: `&BlobRef` and `&[u8]` have the same layout.
-        BlobRef::ref_cast(bytes)
-    }
-}
-
-/// A slice of a blob.
-#[repr(transparent)]
-#[derive(PartialEq, Eq, PartialOrd, Ord, RefCast, Hash)]
-pub struct BlobRef([u8]);
-
-impl fmt::Debug for Blob {
-    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
-        write!(f, "{:?}", self.as_ref())
-    }
-}
-
-impl fmt::Display for Blob {
-    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
-        write!(f, "{:?}", self.as_ref())
-    }
-}
-
-impl AsRef<[u8]> for BlobRef {
-    fn as_ref(&self) -> &[u8] {
-        &self.0
-    }
-}
-
-impl Deref for BlobRef {
-    type Target = [u8];
-
-    fn deref(&self) -> &Self::Target {
-        &self.0
-    }
-}
-
 #[derive(PartialOrd, Ord, Display, PartialEq, Eq, Debug, Copy, Clone, Default, Hash, Serialize)]
 pub struct Date(i32);
 
@@ -410,15 +355,17 @@ pub struct Timestamp(i64);
 #[derive(PartialOrd, Ord, Display, PartialEq, Eq, Debug, Copy, Clone, Default, Hash, Serialize)]
 pub struct TimestampLtz(i64);
 
-impl From<Vec<u8>> for Blob {
+pub type Blob<'a> = Cow<'a, [u8]>;
+
+impl<'a> From<Vec<u8>> for Datum<'a> {
     fn from(vec: Vec<u8>) -> Self {
-        Blob(vec.into())
+        Datum::Blob(Blob::from(vec))
     }
 }
 
 impl<'a> From<&'a [u8]> for Datum<'a> {
     fn from(bytes: &'a [u8]) -> Datum<'a> {
-        Datum::BorrowedBlob(bytes)
+        Datum::Blob(Blob::from(bytes))
     }
 }
 
diff --git a/fluss-rust/crates/fluss/src/row/field_getter.rs b/fluss-rust/crates/fluss/src/row/field_getter.rs
index 3a9cf0fa81..8e529e5446 100644
--- a/fluss-rust/crates/fluss/src/row/field_getter.rs
+++ b/fluss-rust/crates/fluss/src/row/field_getter.rs
@@ -83,7 +83,7 @@ pub enum InnerFieldGetter {
 impl InnerFieldGetter {
     pub fn get_field<'a>(&self, row: &'a dyn InternalRow) -> Datum<'a> {
         match self {
-            InnerFieldGetter::Char { pos, len } => Datum::String(row.get_char(*pos, *len)),
+            InnerFieldGetter::Char { pos, len } => Datum::from(row.get_char(*pos, *len)),
             InnerFieldGetter::String { pos } => Datum::from(row.get_string(*pos)),
             InnerFieldGetter::Bool { pos } => Datum::from(row.get_boolean(*pos)),
             InnerFieldGetter::Binary { pos, len } => Datum::from(row.get_binary(*pos, *len)),

From e9d16ae99d472dc38a292839125e51693fd822cb Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 11 Jan 2026 21:36:46 +0800
Subject: [PATCH 060/287] chore: implement zero copy in CompactedRowReader
 (#138)

---
 .../fluss/src/row/compacted/compacted_row.rs  | 137 ++++------
 .../src/row/compacted/compacted_row_reader.rs | 239 +++++++++---------
 .../src/row/compacted/compacted_row_writer.rs |   4 +-
 fluss-rust/crates/fluss/src/row/datum.rs      |   2 +-
 4 files changed, 178 insertions(+), 204 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index fca41c655f..481f9be502 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -15,7 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use bytes::Bytes;
+use std::sync::OnceLock;
 
 use crate::metadata::DataType;
 use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
@@ -24,125 +24,95 @@ use crate::row::{GenericRow, InternalRow};
 // Reference implementation:
 // https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/row/compacted/CompactedRow.java
 #[allow(dead_code)]
-pub struct CompactedRow {
+pub struct CompactedRow<'a> {
     arity: usize,
-    segment: Bytes,
-    offset: usize,
     size_in_bytes: usize,
-    decoded: bool,
-    decoded_row: GenericRow<'static>,
-    reader: CompactedRowReader,
-    deserializer: CompactedRowDeserializer,
+    decoded_row: OnceLock<GenericRow<'a>>,
+    deserializer: CompactedRowDeserializer<'a>,
+    reader: CompactedRowReader<'a>,
+    data_types: &'a [DataType],
 }
 
-#[allow(dead_code)]
-impl CompactedRow {
-    pub fn calculate_bit_set_width_in_bytes(arity: usize) -> usize {
-        arity.div_ceil(8)
-    }
-
-    pub fn new(types: Vec<DataType>) -> Self {
-        let arity = types.len();
-        Self {
-            arity,
-            segment: Bytes::new(),
-            offset: 0,
-            size_in_bytes: 0,
-            decoded: false,
-            decoded_row: GenericRow::new(),
-            reader: CompactedRowReader::new(arity),
-            deserializer: CompactedRowDeserializer::new(types),
-        }
-    }
+pub fn calculate_bit_set_width_in_bytes(arity: usize) -> usize {
+    arity.div_ceil(8)
+}
 
-    pub fn from_bytes(types: Vec<DataType>, data: Bytes) -> Self {
-        let arity = types.len();
+#[allow(dead_code)]
+impl<'a> CompactedRow<'a> {
+    pub fn from_bytes(data_types: &'a [DataType], data: &'a [u8]) -> Self {
+        let arity = data_types.len();
         let size = data.len();
         Self {
             arity,
-            segment: data,
-            offset: 0,
             size_in_bytes: size,
-            decoded: false,
-            decoded_row: GenericRow::new(),
-            reader: CompactedRowReader::new(arity),
-            deserializer: CompactedRowDeserializer::new(types),
+            decoded_row: OnceLock::new(),
+            deserializer: CompactedRowDeserializer::new(data_types),
+            reader: CompactedRowReader::new(arity, data, 0, size),
+            data_types,
         }
     }
 
-    pub fn point_to(&mut self, segment: Bytes, offset: usize, size_in_bytes: usize) {
-        self.segment = segment;
-        self.offset = offset;
-        self.size_in_bytes = size_in_bytes;
-        self.decoded = false;
-    }
-
-    pub fn get_segment(&self) -> &Bytes {
-        &self.segment
-    }
-
-    pub fn get_offset(&self) -> usize {
-        self.offset
-    }
-
     pub fn get_size_in_bytes(&self) -> usize {
         self.size_in_bytes
     }
 
-    pub fn get_field_count(&self) -> usize {
-        self.arity
+    fn decoded_row(&self) -> &GenericRow<'_> {
+        self.decoded_row
+            .get_or_init(|| self.deserializer.deserialize(&self.reader))
     }
+}
 
-    pub fn is_null_at(&self, pos: usize) -> bool {
-        let byte_index = pos >> 3;
-        let bit = pos & 7;
-        let idx = self.offset + byte_index;
-        (self.segment[idx] & (1u8 << bit)) != 0
+#[allow(dead_code)]
+impl<'a> InternalRow for CompactedRow<'a> {
+    fn get_field_count(&self) -> usize {
+        self.arity
     }
 
-    fn decoded_row(&mut self) -> &GenericRow<'static> {
-        if !self.decoded {
-            self.reader
-                .point_to(self.segment.clone(), self.offset, self.size_in_bytes);
-            self.decoded_row = self.deserializer.deserialize(&mut self.reader);
-            self.decoded = true;
-        }
-        &self.decoded_row
+    fn is_null_at(&self, pos: usize) -> bool {
+        self.data_types[pos].is_nullable() && self.reader.is_null_at(pos)
     }
 
-    pub fn get_boolean(&mut self, pos: usize) -> bool {
+    fn get_boolean(&self, pos: usize) -> bool {
         self.decoded_row().get_boolean(pos)
     }
 
-    pub fn get_byte(&mut self, pos: usize) -> i8 {
+    fn get_byte(&self, pos: usize) -> i8 {
         self.decoded_row().get_byte(pos)
     }
 
-    pub fn get_short(&mut self, pos: usize) -> i16 {
+    fn get_short(&self, pos: usize) -> i16 {
         self.decoded_row().get_short(pos)
     }
 
-    pub fn get_int(&mut self, pos: usize) -> i32 {
+    fn get_int(&self, pos: usize) -> i32 {
         self.decoded_row().get_int(pos)
     }
 
-    pub fn get_long(&mut self, pos: usize) -> i64 {
+    fn get_long(&self, pos: usize) -> i64 {
         self.decoded_row().get_long(pos)
     }
 
-    pub fn get_float(&mut self, pos: usize) -> f32 {
+    fn get_float(&self, pos: usize) -> f32 {
         self.decoded_row().get_float(pos)
     }
 
-    pub fn get_double(&mut self, pos: usize) -> f64 {
+    fn get_double(&self, pos: usize) -> f64 {
         self.decoded_row().get_double(pos)
     }
 
-    pub fn get_string(&mut self, pos: usize) -> &str {
+    fn get_char(&self, pos: usize, length: usize) -> &str {
+        self.decoded_row().get_char(pos, length)
+    }
+
+    fn get_string(&self, pos: usize) -> &str {
         self.decoded_row().get_string(pos)
     }
 
-    pub fn get_bytes(&mut self, pos: usize) -> &[u8] {
+    fn get_binary(&self, pos: usize, length: usize) -> &[u8] {
+        self.decoded_row().get_binary(pos, length)
+    }
+
+    fn get_bytes(&self, pos: usize) -> &[u8] {
         self.decoded_row().get_bytes(pos)
     }
 }
@@ -171,7 +141,6 @@ mod tests {
             DataType::Bytes(BytesType::new()),
         ];
 
-        let mut row = CompactedRow::new(types.clone());
         let mut writer = CompactedRowWriter::new(types.len());
 
         writer.write_boolean(true);
@@ -184,7 +153,8 @@ mod tests {
         writer.write_string("Hello World");
         writer.write_bytes(&[1, 2, 3, 4, 5]);
 
-        row.point_to(writer.to_bytes(), 0, writer.position());
+        let bytes = writer.to_bytes();
+        let mut row = CompactedRow::from_bytes(types.as_slice(), bytes.as_ref());
 
         assert_eq!(row.get_field_count(), 9);
         assert!(row.get_boolean(0));
@@ -204,14 +174,14 @@ mod tests {
             DataType::Double(DoubleType::new()),
         ];
 
-        let mut row = CompactedRow::new(types.clone());
         let mut writer = CompactedRowWriter::new(types.len());
 
         writer.write_int(100);
         writer.set_null_at(1);
         writer.write_double(2.71);
 
-        row.point_to(writer.to_bytes(), 0, writer.position());
+        let bytes = writer.to_bytes();
+        row = CompactedRow::from_bytes(types.as_slice(), bytes.as_ref());
 
         assert!(!row.is_null_at(0));
         assert!(row.is_null_at(1));
@@ -230,12 +200,13 @@ mod tests {
         ];
 
         let mut writer = CompactedRowWriter::new(types.len());
-        writer.write_int(42);
+        writer.write_int(-1);
         writer.write_string("test");
 
-        let mut row = CompactedRow::from_bytes(types, writer.to_bytes());
+        let bytes = writer.to_bytes();
+        let mut row = CompactedRow::from_bytes(types.as_slice(), bytes.as_ref());
 
-        assert_eq!(row.get_int(0), 42);
+        assert_eq!(row.get_int(0), -1);
         assert_eq!(row.get_string(1), "test");
 
         // Test large row
@@ -244,14 +215,14 @@ mod tests {
             .map(|_| DataType::Int(IntType::new()))
             .collect();
 
-        let mut row = CompactedRow::new(types.clone());
         let mut writer = CompactedRowWriter::new(num_fields);
 
         for i in 0..num_fields {
             writer.write_int((i * 10) as i32);
         }
 
-        row.point_to(writer.to_bytes(), 0, writer.position());
+        let bytes = writer.to_bytes();
+        row = CompactedRow::from_bytes(types.as_slice(), bytes.as_ref());
 
         for i in 0..num_fields {
             assert_eq!(row.get_int(i), (i * 10) as i32);
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index 00d94ad675..c053d4ec31 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -15,54 +15,75 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use bytes::Bytes;
-use std::borrow::Cow;
-
+use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
 use crate::{
     metadata::DataType,
-    row::{
-        Datum, GenericRow,
-        compacted::{compacted_row::CompactedRow, compacted_row_writer::CompactedRowWriter},
-    },
+    row::{Datum, GenericRow, compacted::compacted_row_writer::CompactedRowWriter},
 };
+use std::str::from_utf8;
 
 #[allow(dead_code)]
-pub struct CompactedRowDeserializer {
-    schema: Vec<DataType>,
+pub struct CompactedRowDeserializer<'a> {
+    schema: &'a [DataType],
 }
 
 #[allow(dead_code)]
-impl CompactedRowDeserializer {
-    pub fn new(schema: Vec<DataType>) -> Self {
+impl<'a> CompactedRowDeserializer<'a> {
+    pub fn new(schema: &'a [DataType]) -> Self {
         Self { schema }
     }
 
-    pub fn deserialize(&self, reader: &mut CompactedRowReader) -> GenericRow<'static> {
+    pub fn deserialize(&self, reader: &CompactedRowReader<'a>) -> GenericRow<'a> {
         let mut row = GenericRow::new();
-        for (pos, dtype) in self.schema.iter().enumerate() {
-            if reader.is_null_at(pos) {
-                row.set_field(pos, Datum::Null);
+        let mut cursor = reader.initial_position();
+        for (col_pos, dtype) in self.schema.iter().enumerate() {
+            if dtype.is_nullable() && reader.is_null_at(col_pos) {
+                row.set_field(col_pos, Datum::Null);
                 continue;
             }
-            let datum = match dtype {
-                DataType::Boolean(_) => Datum::Bool(reader.read_boolean()),
-                DataType::TinyInt(_) => Datum::Int8(reader.read_byte() as i8),
-                DataType::SmallInt(_) => Datum::Int16(reader.read_short()),
-                DataType::Int(_) => Datum::Int32(reader.read_int()),
-                DataType::BigInt(_) => Datum::Int64(reader.read_long()),
-                DataType::Float(_) => Datum::Float32(reader.read_float().into()),
-                DataType::Double(_) => Datum::Float64(reader.read_double().into()),
+            let (datum, next_cursor) = match dtype {
+                DataType::Boolean(_) => {
+                    let (val, next) = reader.read_boolean(cursor);
+                    (Datum::Bool(val), next)
+                }
+                DataType::TinyInt(_) => {
+                    let (val, next) = reader.read_byte(cursor);
+                    (Datum::Int8(val as i8), next)
+                }
+                DataType::SmallInt(_) => {
+                    let (val, next) = reader.read_short(cursor);
+                    (Datum::Int16(val), next)
+                }
+                DataType::Int(_) => {
+                    let (val, next) = reader.read_int(cursor);
+                    (Datum::Int32(val), next)
+                }
+                DataType::BigInt(_) => {
+                    let (val, next) = reader.read_long(cursor);
+                    (Datum::Int64(val), next)
+                }
+                DataType::Float(_) => {
+                    let (val, next) = reader.read_float(cursor);
+                    (Datum::Float32(val.into()), next)
+                }
+                DataType::Double(_) => {
+                    let (val, next) = reader.read_double(cursor);
+                    (Datum::Float64(val.into()), next)
+                }
                 // TODO: use read_char(length) in the future, but need to keep compatibility
                 DataType::Char(_) | DataType::String(_) => {
-                    Datum::String(Cow::Owned(reader.read_string()))
+                    let (val, next) = reader.read_string(cursor);
+                    (Datum::String(val.into()), next)
                 }
                 // TODO: use read_binary(length) in the future, but need to keep compatibility
                 DataType::Bytes(_) | DataType::Binary(_) => {
-                    Datum::Blob(Cow::Owned(reader.read_bytes().into_vec()))
+                    let (val, next) = reader.read_bytes(cursor);
+                    (Datum::Blob(val.into()), next)
                 }
                 _ => panic!("unsupported DataType in CompactedRowDeserializer"),
             };
-            row.set_field(pos, datum);
+            cursor = next_cursor;
+            row.set_field(col_pos, datum);
         }
         row
     }
@@ -71,151 +92,133 @@ impl CompactedRowDeserializer {
 // Reference implementation:
 // https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/row/compacted/CompactedRowReader.java
 #[allow(dead_code)]
-pub struct CompactedRowReader {
-    segment: Bytes,
+pub struct CompactedRowReader<'a> {
+    segment: &'a [u8],
     offset: usize,
-    position: usize,
     limit: usize,
     header_size_in_bytes: usize,
 }
 
 #[allow(dead_code)]
-impl CompactedRowReader {
-    pub fn new(field_count: usize) -> Self {
-        let header = CompactedRow::calculate_bit_set_width_in_bytes(field_count);
-        Self {
-            header_size_in_bytes: header,
-            segment: Bytes::new(),
-            offset: 0,
-            position: 0,
-            limit: 0,
-        }
-    }
-
-    pub fn point_to(&mut self, data: Bytes, offset: usize, length: usize) {
+impl<'a> CompactedRowReader<'a> {
+    pub fn new(field_count: usize, data: &'a [u8], offset: usize, length: usize) -> Self {
+        let header_size_in_bytes = calculate_bit_set_width_in_bytes(field_count);
         let limit = offset + length;
-        let position = offset + self.header_size_in_bytes;
-
+        let position = offset + header_size_in_bytes;
         debug_assert!(limit <= data.len());
         debug_assert!(position <= limit);
 
-        self.segment = data;
-        self.offset = offset;
-        self.position = position;
-        self.limit = limit;
+        CompactedRowReader {
+            segment: data,
+            offset,
+            limit,
+            header_size_in_bytes,
+        }
     }
 
-    pub fn is_null_at(&self, pos: usize) -> bool {
-        let byte_index = pos >> 3;
-        let bit = pos & 7;
+    fn initial_position(&self) -> usize {
+        self.offset + self.header_size_in_bytes
+    }
+
+    pub fn is_null_at(&self, col_pos: usize) -> bool {
+        let byte_index = col_pos >> 3;
+        let bit = col_pos & 7;
         debug_assert!(byte_index < self.header_size_in_bytes);
         let idx = self.offset + byte_index;
         (self.segment[idx] & (1u8 << bit)) != 0
     }
 
-    pub fn read_boolean(&mut self) -> bool {
-        self.read_byte() != 0
+    pub fn read_boolean(&self, pos: usize) -> (bool, usize) {
+        let (val, next) = self.read_byte(pos);
+        (val != 0, next)
     }
 
-    pub fn read_byte(&mut self) -> u8 {
-        debug_assert!(self.position < self.limit);
-        let b = self.segment[self.position];
-        self.position += 1;
-        b
+    pub fn read_byte(&self, pos: usize) -> (u8, usize) {
+        debug_assert!(pos < self.limit);
+        (self.segment[pos], pos + 1)
     }
 
-    pub fn read_short(&mut self) -> i16 {
-        debug_assert!(self.position + 2 <= self.limit);
-        let bytes_slice = &self.segment[self.position..self.position + 2];
-        let byte_array: [u8; 2] = bytes_slice
-            .try_into()
-            .expect("Slice must be exactly 2 bytes long");
-
-        self.position += 2;
-        i16::from_ne_bytes(byte_array)
+    pub fn read_short(&self, pos: usize) -> (i16, usize) {
+        let next_pos = pos + 2;
+        debug_assert!(next_pos <= self.limit);
+        let bytes_slice = &self.segment[pos..pos + 2];
+        let val = i16::from_ne_bytes(
+            bytes_slice
+                .try_into()
+                .expect("Slice must be exactly 2 bytes long"),
+        );
+        (val, next_pos)
     }
 
-    pub fn read_int(&mut self) -> i32 {
+    pub fn read_int(&self, mut pos: usize) -> (i32, usize) {
         let mut result: u32 = 0;
         let mut shift = 0;
 
         for _ in 0..CompactedRowWriter::MAX_INT_SIZE {
-            let b = self.read_byte();
+            let (b, next_pos) = self.read_byte(pos);
+            pos = next_pos;
             result |= ((b & 0x7F) as u32) << shift;
             if (b & 0x80) == 0 {
-                return result as i32;
+                return (result as i32, pos);
             }
             shift += 7;
         }
-
-        panic!("Invalid input stream.");
+        panic!("Invalid VarInt32 input stream.");
     }
 
-    pub fn read_long(&mut self) -> i64 {
+    pub fn read_long(&self, mut pos: usize) -> (i64, usize) {
         let mut result: u64 = 0;
         let mut shift = 0;
 
         for _ in 0..CompactedRowWriter::MAX_LONG_SIZE {
-            let b = self.read_byte();
+            let (b, next_pos) = self.read_byte(pos);
+            pos = next_pos;
             result |= ((b & 0x7F) as u64) << shift;
             if (b & 0x80) == 0 {
-                return result as i64;
+                return (result as i64, pos);
             }
             shift += 7;
         }
-
-        panic!("Invalid input stream.");
+        panic!("Invalid VarInt64 input stream.");
     }
 
-    pub fn read_float(&mut self) -> f32 {
-        debug_assert!(self.position + 4 <= self.limit);
-        let bytes_slice = &self.segment[self.position..self.position + 4];
-        let byte_array: [u8; 4] = bytes_slice
-            .try_into()
-            .expect("Slice must be exactly 4 bytes long");
-
-        self.position += 4;
-        f32::from_ne_bytes(byte_array)
+    pub fn read_float(&self, pos: usize) -> (f32, usize) {
+        let next_pos = pos + 4;
+        debug_assert!(next_pos <= self.limit);
+        let val = f32::from_ne_bytes(
+            self.segment[pos..pos + 4]
+                .try_into()
+                .expect("Slice must be exactly 4 bytes long"),
+        );
+        (val, next_pos)
     }
 
-    pub fn read_double(&mut self) -> f64 {
-        debug_assert!(self.position + 8 <= self.limit);
-        let bytes_slice = &self.segment[self.position..self.position + 8];
-        let byte_array: [u8; 8] = bytes_slice
-            .try_into()
-            .expect("Slice must be exactly 8 bytes long");
-
-        self.position += 8;
-        f64::from_ne_bytes(byte_array)
+    pub fn read_double(&self, pos: usize) -> (f64, usize) {
+        let next_pos = pos + 8;
+        debug_assert!(next_pos <= self.limit);
+        let val = f64::from_ne_bytes(
+            self.segment[pos..pos + 8]
+                .try_into()
+                .expect("Slice must be exactly 8 bytes long"),
+        );
+        (val, next_pos)
     }
 
-    pub fn read_binary(&mut self, length: usize) -> Bytes {
-        debug_assert!(self.position + length <= self.limit);
-
-        let start = self.position;
-        let end = start + length;
-        self.position = end;
-
-        self.segment.slice(start..end)
+    pub fn read_binary(&self, pos: usize) -> (&'a [u8], usize) {
+        self.read_bytes(pos)
     }
 
-    pub fn read_bytes(&mut self) -> Box<[u8]> {
-        let len = self.read_int();
-        debug_assert!(len >= 0);
-
+    pub fn read_bytes(&self, pos: usize) -> (&'a [u8], usize) {
+        let (len, data_pos) = self.read_int(pos);
         let len = len as usize;
-        debug_assert!(self.position + len <= self.limit);
-
-        let start = self.position;
-        let end = start + len;
-        self.position = end;
-
-        self.segment[start..end].to_vec().into_boxed_slice()
+        let next_pos = data_pos + len;
+        debug_assert!(next_pos <= self.limit);
+        (&self.segment[data_pos..next_pos], next_pos)
     }
 
-    pub fn read_string(&mut self) -> String {
-        let bytes = self.read_bytes();
-        String::from_utf8(bytes.into_vec())
-            .unwrap_or_else(|e| panic!("Invalid UTF-8 in string data: {e}"))
+    pub fn read_string(&self, pos: usize) -> (&'a str, usize) {
+        let (bytes, next_pos) = self.read_bytes(pos);
+        let s = from_utf8(bytes).expect("Invalid UTF-8 when reading string");
+        (s, next_pos)
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
index 834512350c..4f535c6bf0 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -18,7 +18,7 @@
 use bytes::{Bytes, BytesMut};
 use std::cmp;
 
-use crate::row::compacted::compacted_row::CompactedRow;
+use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
 
 // Writer for CompactedRow
 // Reference implementation:
@@ -36,7 +36,7 @@ impl CompactedRowWriter {
     pub const MAX_LONG_SIZE: usize = 10;
 
     pub fn new(field_count: usize) -> Self {
-        let header_size = CompactedRow::calculate_bit_set_width_in_bytes(field_count);
+        let header_size = calculate_bit_set_width_in_bytes(field_count);
         let cap = cmp::max(64, header_size);
 
         let mut buffer = BytesMut::with_capacity(cap);
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index fa85ded4b8..ad7948dcef 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -403,7 +403,7 @@ mod tests {
 
     #[test]
     fn datum_accessors_and_conversions() {
-        let datum = Datum::String("value");
+        let datum = Datum::String("value".into());
         assert_eq!(datum.as_str(), "value");
         assert!(!datum.is_null());
 

From 979c0d4285a59470adf5873592c98547b626f01e Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 12 Jan 2026 02:18:27 +0000
Subject: [PATCH 061/287] chore: fix potential deadlock with holding lock
 during await (#145)

---
 .../fluss/src/client/write/accumulator.rs     | 195 +++++++++++-------
 1 file changed, 121 insertions(+), 74 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 001d0aa7d0..74aab9f4fa 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -31,6 +31,9 @@ use std::sync::Arc;
 use std::sync::atomic::{AtomicI32, AtomicI64, Ordering};
 use tokio::sync::Mutex;
 
+// Type alias to simplify complex nested types
+type BucketBatches = Vec<(BucketId, Arc<Mutex<VecDeque<WriteBatch>>>)>;
+
 #[allow(dead_code)]
 pub struct RecordAccumulator {
     config: Config,
@@ -138,20 +141,25 @@ impl RecordAccumulator {
         abort_if_batch_full: bool,
     ) -> Result<RecordAppendResult> {
         let table_path = &record.table_path;
-        let mut binding = self
-            .write_batches
-            .entry(table_path.as_ref().clone())
-            .or_insert_with(|| BucketAndWriteBatches {
-                table_id: 0,
-                is_partitioned_table: false,
-                partition_id: None,
-                batches: Default::default(),
-            });
-        let bucket_and_batches = binding.value_mut();
-        let dq = bucket_and_batches
-            .batches
-            .entry(bucket_id)
-            .or_insert_with(|| Mutex::new(VecDeque::new()));
+
+        let dq = {
+            let mut binding = self
+                .write_batches
+                .entry(table_path.as_ref().clone())
+                .or_insert_with(|| BucketAndWriteBatches {
+                    table_id: 0,
+                    is_partitioned_table: false,
+                    partition_id: None,
+                    batches: Default::default(),
+                });
+            let bucket_and_batches = binding.value_mut();
+            bucket_and_batches
+                .batches
+                .entry(bucket_id)
+                .or_insert_with(|| Arc::new(Mutex::new(VecDeque::new())))
+                .clone()
+        };
+
         let mut dq_guard = dq.lock().await;
         if let Some(append_result) = self.try_append(record, &mut dq_guard)? {
             return Ok(append_result);
@@ -166,16 +174,31 @@ impl RecordAccumulator {
     }
 
     pub async fn ready(&self, cluster: &Arc<Cluster>) -> ReadyCheckResult {
+        // Snapshot only the per-bucket Arcs so the `write_batches` iterator is finished before any `.await` below; this also avoids cloning the entire BucketAndWriteBatches struct
+        let entries: Vec<(TablePath, BucketBatches)> = self
+            .write_batches
+            .iter()
+            .map(|entry| {
+                let table_path = entry.key().clone();
+                let bucket_batches: Vec<_> = entry
+                    .value()
+                    .batches
+                    .iter()
+                    .map(|(bucket_id, batch_arc)| (*bucket_id, batch_arc.clone()))
+                    .collect();
+                (table_path, bucket_batches)
+            })
+            .collect();
+
         let mut ready_nodes = HashSet::new();
         let mut next_ready_check_delay_ms = self.batch_timeout_ms;
         let mut unknown_leader_tables = HashSet::new();
-        for entry in self.write_batches.iter() {
-            let table_path = entry.key();
-            let batches = entry.value();
+
+        for (table_path, bucket_batches) in entries {
             next_ready_check_delay_ms = self
                 .bucket_ready(
-                    table_path,
-                    batches,
+                    &table_path,
+                    bucket_batches,
                     &mut ready_nodes,
                     &mut unknown_leader_tables,
                     cluster,
@@ -194,7 +217,7 @@ impl RecordAccumulator {
     async fn bucket_ready(
         &self,
         table_path: &TablePath,
-        batches: &BucketAndWriteBatches,
+        bucket_batches: BucketBatches,
         ready_nodes: &mut HashSet<ServerNode>,
         unknown_leader_tables: &mut HashSet<TablePath>,
         cluster: &Cluster,
@@ -202,7 +225,7 @@ impl RecordAccumulator {
     ) -> i64 {
         let mut next_delay = next_ready_check_delay_ms;
 
-        for (bucket_id, batch) in batches.batches.iter() {
+        for (bucket_id, batch) in bucket_batches {
             let batch_guard = batch.lock().await;
             if batch_guard.is_empty() {
                 continue;
@@ -212,7 +235,7 @@ impl RecordAccumulator {
             let waited_time_ms = batch.waited_time_ms(current_time_ms());
             let deque_size = batch_guard.len();
             let full = deque_size > 1 || batch.is_closed();
-            let table_bucket = cluster.get_table_bucket(table_path, *bucket_id);
+            let table_bucket = cluster.get_table_bucket(table_path, bucket_id);
             if let Some(leader) = cluster.leader_for(&table_bucket) {
                 next_delay =
                     self.batch_ready(leader, waited_time_ms, full, ready_nodes, next_delay);
@@ -281,60 +304,77 @@ impl RecordAccumulator {
             return Ok(ready);
         }
 
-        let mut nodes_drain_index_guard = self.nodes_drain_index.lock().await;
-        let drain_index = nodes_drain_index_guard.entry(node.id()).or_insert(0);
-        let start = *drain_index % buckets.len();
+        // Get the start index without holding the lock across awaits
+        let start = {
+            let mut nodes_drain_index_guard = self.nodes_drain_index.lock().await;
+            let drain_index = nodes_drain_index_guard.entry(node.id()).or_insert(0);
+            *drain_index % buckets.len()
+        };
+
         let mut current_index = start;
+        // Assigned at the top of every loop iteration; read after the loop to persist the drain position
+        let mut last_processed_index;
 
         loop {
             let bucket = &buckets[current_index];
             let table_path = bucket.table_path.clone();
             let table_bucket = bucket.table_bucket.clone();
-            nodes_drain_index_guard.insert(node.id(), current_index);
+            last_processed_index = current_index;
             current_index = (current_index + 1) % buckets.len();
 
-            let bucket_and_write_batches = self.write_batches.get(&table_path);
-            if let Some(bucket_and_write_batches) = bucket_and_write_batches {
-                if let Some(deque) = bucket_and_write_batches
-                    .batches
-                    .get(&table_bucket.bucket_id())
+            let deque = self
+                .write_batches
+                .get(&table_path)
+                .and_then(|bucket_and_write_batches| {
+                    bucket_and_write_batches
+                        .batches
+                        .get(&table_bucket.bucket_id())
+                        .cloned()
+                });
+
+            if let Some(deque) = deque {
+                let mut maybe_batch = None;
                 {
-                    let mut maybe_batch = None;
-                    {
-                        let mut batch_lock = deque.lock().await;
-                        if !batch_lock.is_empty() {
-                            let first_batch = batch_lock.front().unwrap();
-
-                            if size + first_batch.estimated_size_in_bytes() > max_size as i64
-                                && !ready.is_empty()
-                            {
-                                // there is a rare case that a single batch size is larger than the request size
-                                // due to compression; in this case we will still eventually send this batch in
-                                // a single request.
-                                break;
-                            }
-
-                            maybe_batch = Some(batch_lock.pop_front().unwrap());
+                    let mut batch_lock = deque.lock().await;
+                    if !batch_lock.is_empty() {
+                        let first_batch = batch_lock.front().unwrap();
+
+                        if size + first_batch.estimated_size_in_bytes() > max_size as i64
+                            && !ready.is_empty()
+                        {
+                            // there is a rare case that a single batch size is larger than the request size
+                            // due to compression; in this case we will still eventually send this batch in
+                            // a single request.
+                            break;
                         }
+
+                        maybe_batch = Some(batch_lock.pop_front().unwrap());
                     }
+                }
 
-                    if let Some(mut batch) = maybe_batch {
-                        let current_batch_size = batch.estimated_size_in_bytes();
-                        size += current_batch_size;
+                if let Some(mut batch) = maybe_batch {
+                    let current_batch_size = batch.estimated_size_in_bytes();
+                    size += current_batch_size;
 
-                        // mark the batch as drained.
-                        batch.drained(current_time_ms());
-                        ready.push(ReadyWriteBatch {
-                            table_bucket,
-                            write_batch: batch,
-                        });
-                    }
+                    // mark the batch as drained.
+                    batch.drained(current_time_ms());
+                    ready.push(ReadyWriteBatch {
+                        table_bucket,
+                        write_batch: batch,
+                    });
                 }
             }
             if current_index == start {
                 break;
             }
         }
+
+        // Store the last processed index to maintain round-robin fairness
+        {
+            let mut nodes_drain_index_guard = self.nodes_drain_index.lock().await;
+            nodes_drain_index_guard.insert(node.id(), last_processed_index);
+        }
+
         Ok(ready)
     }
 
@@ -347,20 +387,25 @@ impl RecordAccumulator {
         let table_path = ready_write_batch.write_batch.table_path().clone();
         let bucket_id = ready_write_batch.table_bucket.bucket_id();
         let table_id = u64::try_from(ready_write_batch.table_bucket.table_id()).unwrap_or(0);
-        let mut binding =
-            self.write_batches
-                .entry(table_path)
-                .or_insert_with(|| BucketAndWriteBatches {
-                    table_id,
-                    is_partitioned_table: false,
-                    partition_id: None,
-                    batches: Default::default(),
-                });
-        let bucket_and_batches = binding.value_mut();
-        let dq = bucket_and_batches
-            .batches
-            .entry(bucket_id)
-            .or_insert_with(|| Mutex::new(VecDeque::new()));
+
+        let dq = {
+            let mut binding =
+                self.write_batches
+                    .entry(table_path)
+                    .or_insert_with(|| BucketAndWriteBatches {
+                        table_id,
+                        is_partitioned_table: false,
+                        partition_id: None,
+                        batches: Default::default(),
+                    });
+            let bucket_and_batches = binding.value_mut();
+            bucket_and_batches
+                .batches
+                .entry(bucket_id)
+                .or_insert_with(|| Arc::new(Mutex::new(VecDeque::new())))
+                .clone()
+        };
+
         let mut dq_guard = dq.lock().await;
         dq_guard.push_front(ready_write_batch.write_batch);
     }
@@ -392,9 +437,11 @@ impl RecordAccumulator {
     }
 
     #[allow(unused_must_use)]
-    #[allow(clippy::await_holding_lock)]
     pub async fn await_flush_completion(&self) -> Result<()> {
-        for result_handle in self.incomplete_batches.read().values() {
+        // Clone handles before awaiting to avoid holding RwLock read guard across await points
+        let handles: Vec<_> = self.incomplete_batches.read().values().cloned().collect();
+
+        for result_handle in handles {
             result_handle.wait().await?;
         }
         Ok(())
@@ -411,7 +458,7 @@ struct BucketAndWriteBatches {
     table_id: TableId,
     is_partitioned_table: bool,
     partition_id: Option<PartitionId>,
-    batches: HashMap<BucketId, Mutex<VecDeque<WriteBatch>>>,
+    batches: HashMap<BucketId, Arc<Mutex<VecDeque<WriteBatch>>>>,
 }
 
 pub struct RecordAppendResult {

From 63509b155d44ceae8f5195c33e31edbae45622b3 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 12 Jan 2026 07:12:27 +0000
Subject: [PATCH 062/287] chore: decrement flushes_in_progress counter in
 await_flush_comp (#147)

---
 .../fluss/src/client/write/accumulator.rs     | 47 +++++++++++++++++--
 1 file changed, 44 insertions(+), 3 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 74aab9f4fa..83f11ab782 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -441,10 +441,20 @@ impl RecordAccumulator {
         // Clone handles before awaiting to avoid holding RwLock read guard across await points
         let handles: Vec<_> = self.incomplete_batches.read().values().cloned().collect();
 
-        for result_handle in handles {
-            result_handle.wait().await?;
+        // Await on all handles
+        let result = async {
+            for result_handle in handles {
+                result_handle.wait().await?;
+            }
+            Ok(())
         }
-        Ok(())
+        .await;
+
+        // Always decrement flushes_in_progress, even if an error occurred
+        // This mimics the Java finally block behavior
+        self.flushes_in_progress.fetch_sub(1, Ordering::SeqCst);
+
+        result
     }
 }
 
@@ -557,4 +567,35 @@ mod tests {
         assert_eq!(batch.write_batch.attempts(), 1);
         Ok(())
     }
+
+    #[tokio::test]
+    async fn flush_counter_decremented_on_error() -> Result<()> {
+        use crate::client::write::broadcast::BroadcastOnce;
+        use std::sync::atomic::Ordering;
+
+        let config = Config::default();
+        let accumulator = RecordAccumulator::new(config);
+
+        accumulator.begin_flush();
+        assert_eq!(accumulator.flushes_in_progress.load(Ordering::SeqCst), 1);
+
+        // Create a failing batch by dropping the BroadcastOnce without broadcasting
+        {
+            let broadcast = BroadcastOnce::default();
+            let receiver = broadcast.receiver();
+            let handle = ResultHandle::new(receiver);
+            accumulator.incomplete_batches.write().insert(1, handle);
+            // broadcast is dropped here, causing an error
+        }
+
+        // Await flush completion should fail but still decrement counter
+        let result = accumulator.await_flush_completion().await;
+        assert!(result.is_err());
+
+        // Counter should still be decremented (this is the critical fix!)
+        assert_eq!(accumulator.flushes_in_progress.load(Ordering::SeqCst), 0);
+        assert!(!accumulator.flush_in_progress());
+
+        Ok(())
+    }
 }

From 3cdc49526ee2a8159df976f49944ca55251972b9 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Wed, 14 Jan 2026 01:42:19 +0000
Subject: [PATCH 063/287] chore: add DEVELOPMENT.md (#155)

---
 fluss-rust/DEVELOPMENT.md | 115 ++++++++++++++++++++++++++++++++++++++
 1 file changed, 115 insertions(+)
 create mode 100644 fluss-rust/DEVELOPMENT.md

diff --git a/fluss-rust/DEVELOPMENT.md b/fluss-rust/DEVELOPMENT.md
new file mode 100644
index 0000000000..a8a6d5380c
--- /dev/null
+++ b/fluss-rust/DEVELOPMENT.md
@@ -0,0 +1,115 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# Development Guide
+
+Welcome to the development guide for `fluss-rust`! This project builds the `fluss-rust` client and its language-specific bindings.
+
+## Pre-requisites
+
+- protobuf
+- rust
+
+You can install these using your favourite package / version manager. Example installation using mise:
+
+```bash
+mise install protobuf
+mise install rust
+```
+
+## IDE Setup
+
+We recommend the [RustRover](https://www.jetbrains.com/rust/) IDE for working with the fluss-rust code base.
+
+### Importing fluss-rust
+
+1. In your terminal, clone the fluss-rust project from GitHub
+   ```bash
+   git clone https://github.com/apache/fluss-rust.git
+   ```
+1. Open RustRover and, on the `Projects` tab, click `Open` and navigate to the root directory of fluss-rust
+1. Click `Open`
+
+### Copyright Profile
+
+Fluss and Fluss-rust are Apache projects, so every file needs to have an Apache licence header. This can be automated in RustRover by adding a Copyright profile:
+
+1. Go to `Settings` -> `Editor` -> `Copyright` -> `Copyright Profiles`.
+1. Add a new profile and name it `Apache`.
+1. Add the following text as the license text:
+   ```
+   Licensed to the Apache Software Foundation (ASF) under one
+   or more contributor license agreements.  See the NOTICE file
+   distributed with this work for additional information
+   regarding copyright ownership.  The ASF licenses this file
+   to you under the Apache License, Version 2.0 (the
+   "License"); you may not use this file except in compliance
+   with the License.  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing,
+   software distributed under the License is distributed on an
+   "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+   KIND, either express or implied.  See the License for the
+   specific language governing permissions and limitations
+   under the License.
+   ```
+1. Go to `Editor` -> `Copyright` and choose the `Apache` profile as the default profile for this project.
+1. Click `Apply`
+
+We also use line comment formatting for licence headers. 
+1. Go to `Editor` -> `Copyright` -> `Formatting` -> `Rust`
+1. Choose `Use custom formatting`  
+1. Choose `Use line comment`
+
+## Project directories
+
+Source files are organized in the following manner
+
+1. `crates/fluss` - fluss rust client crate source
+1. `crates/examples` - fluss rust client examples
+1. `bindings` - bindings to other languages e.g. C++ under `bindings/cpp` and Python under `bindings/python`
+
+
+## Building & Testing
+
+See [quickstart](README.md#quick-start) for steps to run example code.
+
+Running all unit tests for fluss rust client: 
+
+```bash
+cargo test --workspace
+```
+
+Running all integration test cases:
+
+```bash
+cargo test --features integration_tests --workspace
+```
+
+
+### Formatting and Clippy
+
+Our CI runs cargo formatting and clippy to help keep the code base styling tidy and readable. Run the following commands and address any errors or warnings to ensure that your PR can complete CI successfully.
+
+```bash
+cargo fmt --all
+cargo clippy --all-targets --fix --allow-dirty --allow-staged
+```
+

From d8fdcc7a3589991b1cae9fc5e70addcfc3ff9e12 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Thu, 15 Jan 2026 02:51:57 +0000
Subject: [PATCH 064/287] feat: introduce KvRecordBatchBuilder (#156)

---
 .../crates/fluss/src/record/kv/kv_record.rs   | 343 +++++++++++
 .../fluss/src/record/kv/kv_record_batch.rs    | 394 ++++++++++++
 .../src/record/kv/kv_record_batch_builder.rs  | 581 ++++++++++++++++++
 fluss-rust/crates/fluss/src/record/kv/mod.rs  |  35 ++
 fluss-rust/crates/fluss/src/record/mod.rs     |   1 +
 .../src/row/compacted/compacted_key_writer.rs |   6 +
 .../src/row/compacted/compacted_row_reader.rs |  35 +-
 .../src/row/compacted/compacted_row_writer.rs |  31 +-
 fluss-rust/crates/fluss/src/row/mod.rs        |   7 +-
 fluss-rust/crates/fluss/src/util/mod.rs       |   1 +
 fluss-rust/crates/fluss/src/util/varint.rs    | 502 +++++++++++++++
 11 files changed, 1893 insertions(+), 43 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/record/kv/kv_record.rs
 create mode 100644 fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
 create mode 100644 fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
 create mode 100644 fluss-rust/crates/fluss/src/record/kv/mod.rs
 create mode 100644 fluss-rust/crates/fluss/src/util/varint.rs

diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
new file mode 100644
index 0000000000..8c30713d42
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
@@ -0,0 +1,343 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Key-Value record implementation.
+//!
+//! This module provides the KvRecord struct which represents an immutable key-value record.
+//! The record format is:
+//! - Length => Int32
+//! - KeyLength => Unsigned VarInt
+//! - Key => bytes
+//! - Row => BinaryRow (optional, if null then this is a deletion record)
+
+use bytes::{BufMut, Bytes, BytesMut};
+use std::io;
+
+use crate::util::varint::{
+    read_unsigned_varint_bytes, size_of_unsigned_varint, write_unsigned_varint_buf,
+};
+
+/// Length field size in bytes
+pub const LENGTH_LENGTH: usize = 4;
+
+/// A key-value record.
+///
+/// The schema is:
+/// - Length => Int32
+/// - KeyLength => Unsigned VarInt
+/// - Key => bytes
+/// - Value => bytes (BinaryRow, written directly without length prefix)
+///
+/// When the value is None (deletion), no Value bytes are present.
+// Reference implementation:
+// https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/record/KvRecord.java
+#[derive(Debug, Clone)]
+pub struct KvRecord {
+    key: Bytes,
+    value: Option<Bytes>,
+    size_in_bytes: usize,
+}
+
+impl KvRecord {
+    /// Create a new KvRecord with the given key and optional value.
+    pub fn new(key: Bytes, value: Option<Bytes>) -> Self {
+        let size_in_bytes = Self::size_of(&key, value.as_deref());
+        Self {
+            key,
+            value,
+            size_in_bytes,
+        }
+    }
+
+    /// Get the key bytes.
+    pub fn key(&self) -> &Bytes {
+        &self.key
+    }
+
+    /// Get the value bytes (None indicates a deletion).
+    pub fn value(&self) -> Option<&Bytes> {
+        self.value.as_ref()
+    }
+
+    /// Calculate the total size of the record when serialized (including length prefix).
+    pub fn size_of(key: &[u8], value: Option<&[u8]>) -> usize {
+        Self::size_without_length(key, value) + LENGTH_LENGTH
+    }
+
+    /// Calculate the size without the length prefix.
+    fn size_without_length(key: &[u8], value: Option<&[u8]>) -> usize {
+        let key_len = key.len();
+        let key_len_size = size_of_unsigned_varint(key_len as u32);
+
+        match value {
+            Some(v) => key_len_size.saturating_add(key_len).saturating_add(v.len()),
+            None => {
+                // Deletion: no value bytes
+                key_len_size.saturating_add(key_len)
+            }
+        }
+    }
+
+    /// Write a KV record to a buffer.
+    ///
+    /// Returns the number of bytes written.
+    pub fn write_to_buf(buf: &mut BytesMut, key: &[u8], value: Option<&[u8]>) -> io::Result<usize> {
+        let size_in_bytes = Self::size_without_length(key, value);
+
+        let size_i32 = i32::try_from(size_in_bytes).map_err(|_| {
+            io::Error::new(
+                io::ErrorKind::InvalidInput,
+                format!("Record size {} exceeds i32::MAX", size_in_bytes),
+            )
+        })?;
+        buf.put_i32_le(size_i32);
+        let key_len = key.len() as u32;
+        write_unsigned_varint_buf(key_len, buf);
+
+        buf.put_slice(key);
+
+        if let Some(v) = value {
+            buf.put_slice(v);
+        }
+        // For None (deletion), don't write any value bytes
+
+        Ok(size_in_bytes + LENGTH_LENGTH)
+    }
+
+    /// Read a KV record from bytes at the given position.
+    ///
+    /// Returns the KvRecord and the number of bytes consumed.
+    ///
+    /// TODO: Connect KvReadContext and return CompactedRow records.
+    pub fn read_from(bytes: &Bytes, position: usize) -> io::Result<(Self, usize)> {
+        if bytes.len() < position.saturating_add(LENGTH_LENGTH) {
+            return Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Not enough bytes to read record length",
+            ));
+        }
+
+        let size_in_bytes_i32 = i32::from_le_bytes([
+            bytes[position],
+            bytes[position + 1],
+            bytes[position + 2],
+            bytes[position + 3],
+        ]);
+
+        if size_in_bytes_i32 < 0 {
+            return Err(io::Error::new(
+                io::ErrorKind::InvalidData,
+                format!("Invalid record length: {}", size_in_bytes_i32),
+            ));
+        }
+
+        let size_in_bytes = size_in_bytes_i32 as usize;
+
+        let total_size = size_in_bytes.checked_add(LENGTH_LENGTH).ok_or_else(|| {
+            io::Error::new(
+                io::ErrorKind::InvalidData,
+                format!(
+                    "Record size overflow: {} + {}",
+                    size_in_bytes, LENGTH_LENGTH
+                ),
+            )
+        })?;
+
+        let available = bytes.len().saturating_sub(position);
+        if available < total_size {
+            return Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                format!(
+                    "Not enough bytes to read record: expected {}, available {}",
+                    total_size, available
+                ),
+            ));
+        }
+
+        let mut current_offset = position + LENGTH_LENGTH;
+        let record_end = position + total_size;
+
+        // Read key length as unsigned varint (bounded by record end)
+        let (key_len, varint_size) =
+            read_unsigned_varint_bytes(&bytes[current_offset..record_end])?;
+        current_offset += varint_size;
+
+        // Read key bytes
+        let key_end = current_offset + key_len as usize;
+        if key_end > position + total_size {
+            return Err(io::Error::new(
+                io::ErrorKind::InvalidData,
+                "Key length exceeds record size",
+            ));
+        }
+        let key = bytes.slice(current_offset..key_end);
+        current_offset = key_end;
+
+        // Read value bytes directly
+        let value = if current_offset < record_end {
+            // Value is present: all remaining bytes are the value
+            let value_bytes = bytes.slice(current_offset..record_end);
+            Some(value_bytes)
+        } else {
+            // No remaining bytes: this is a deletion record
+            None
+        };
+
+        Ok((
+            Self {
+                key,
+                value,
+                size_in_bytes: total_size,
+            },
+            total_size,
+        ))
+    }
+
+    /// Get the total size in bytes of this record.
+    pub fn get_size_in_bytes(&self) -> usize {
+        self.size_in_bytes
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_kv_record_size_calculation() {
+        let key = b"test_key";
+        let value = b"test_value";
+
+        // With value (no value length varint)
+        let size_with_value = KvRecord::size_of(key, Some(value));
+        assert_eq!(
+            size_with_value,
+            LENGTH_LENGTH + size_of_unsigned_varint(key.len() as u32) + key.len() + value.len()
+        );
+
+        // Without value
+        let size_without_value = KvRecord::size_of(key, None);
+        assert_eq!(
+            size_without_value,
+            LENGTH_LENGTH + size_of_unsigned_varint(key.len() as u32) + key.len()
+        );
+    }
+
+    #[test]
+    fn test_kv_record_write_read_round_trip() {
+        let key = b"my_key";
+        let value = b"my_value_data";
+
+        let mut buf = BytesMut::new();
+        let written = KvRecord::write_to_buf(&mut buf, key, Some(value)).unwrap();
+
+        let bytes = buf.freeze();
+        let (record, read_size) = KvRecord::read_from(&bytes, 0).unwrap();
+
+        assert_eq!(written, read_size);
+        assert_eq!(record.key().as_ref(), key);
+        assert_eq!(record.value().unwrap().as_ref(), value);
+        assert_eq!(record.get_size_in_bytes(), written);
+    }
+
+    #[test]
+    fn test_kv_record_deletion() {
+        let key = b"delete_me";
+
+        // Write deletion record (no value)
+        let mut buf = BytesMut::new();
+        let written = KvRecord::write_to_buf(&mut buf, key, None).unwrap();
+
+        let bytes = buf.freeze();
+        let (record, read_size) = KvRecord::read_from(&bytes, 0).unwrap();
+
+        assert_eq!(written, read_size);
+        assert_eq!(record.key().as_ref(), key);
+        assert!(record.value().is_none());
+    }
+
+    #[test]
+    fn test_kv_record_with_large_key() {
+        let key = vec![0u8; 1024];
+        let value = vec![1u8; 4096];
+
+        let mut buf = BytesMut::new();
+        let written = KvRecord::write_to_buf(&mut buf, &key, Some(&value)).unwrap();
+
+        let bytes = buf.freeze();
+        let (record, read_size) = KvRecord::read_from(&bytes, 0).unwrap();
+
+        assert_eq!(written, read_size);
+        assert_eq!(record.key().len(), key.len());
+        assert_eq!(record.value().unwrap().len(), value.len());
+    }
+
+    #[test]
+    fn test_invalid_record_lengths() {
+        let mut buf = BytesMut::new();
+        buf.put_i32_le(-1); // Negative length
+        buf.put_u8(1); // Some dummy data
+        buf.put_slice(b"key");
+        let bytes = buf.freeze();
+        let result = KvRecord::read_from(&bytes, 0);
+        assert!(result.is_err());
+        assert_eq!(result.unwrap_err().kind(), io::ErrorKind::InvalidData);
+
+        // Test maximum positive length (far exceeds the available bytes)
+        let mut buf = BytesMut::new();
+        buf.put_i32_le(i32::MAX); // Very large length
+        buf.put_u8(1); // Some dummy data
+        let bytes = buf.freeze();
+        let result = KvRecord::read_from(&bytes, 0);
+        assert!(result.is_err());
+
+        // Test impossibly large but non-negative length
+        let mut buf = BytesMut::new();
+        buf.put_i32_le(1_000_000);
+        let bytes = buf.freeze();
+        let result = KvRecord::read_from(&bytes, 0);
+        assert!(result.is_err());
+        assert_eq!(result.unwrap_err().kind(), io::ErrorKind::UnexpectedEof);
+    }
+
+    #[test]
+    fn test_multiple_records_in_buffer() {
+        let records = vec![
+            (b"key1".as_slice(), Some(b"value1".as_slice())),
+            (b"key2".as_slice(), None),
+            (b"key3".as_slice(), Some(b"value3".as_slice())),
+        ];
+
+        let mut buf = BytesMut::new();
+        for (key, value) in &records {
+            KvRecord::write_to_buf(&mut buf, key, *value).unwrap();
+        }
+
+        let bytes = buf.freeze();
+        let mut offset = 0;
+        for (expected_key, expected_value) in &records {
+            let (record, size) = KvRecord::read_from(&bytes, offset).unwrap();
+            assert_eq!(record.key().as_ref(), *expected_key);
+            match expected_value {
+                Some(v) => assert_eq!(record.value().unwrap().as_ref(), *v),
+                None => assert!(record.value().is_none()),
+            }
+            offset += size;
+        }
+        assert_eq!(offset, bytes.len());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
new file mode 100644
index 0000000000..fdd4ad7322
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
@@ -0,0 +1,394 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! KV record batch implementation.
+//!
+//! The schema of a KvRecordBatch is:
+//! - Length => Int32
+//! - Magic => Int8
+//! - CRC => Uint32
+//! - SchemaId => Int16
+//! - Attributes => Int8
+//! - WriterId => Int64
+//! - BatchSequence => Int32
+//! - RecordCount => Int32
+//! - Records => [Record]
+//!
+//! The CRC covers data from the SchemaId to the end of the batch.
+
+use bytes::Bytes;
+use std::io;
+
+use crate::record::kv::KvRecord;
+
+// Width in bytes of each header field, in serialized order
+pub const LENGTH_LENGTH: usize = 4;
+pub const MAGIC_LENGTH: usize = 1;
+pub const CRC_LENGTH: usize = 4;
+pub const SCHEMA_ID_LENGTH: usize = 2;
+pub const ATTRIBUTE_LENGTH: usize = 1;
+pub const WRITE_CLIENT_ID_LENGTH: usize = 8;
+pub const BATCH_SEQUENCE_LENGTH: usize = 4;
+pub const RECORDS_COUNT_LENGTH: usize = 4;
+
+// Byte offset of each field from the start of the batch (previous offset + previous width)
+pub const LENGTH_OFFSET: usize = 0;
+pub const MAGIC_OFFSET: usize = LENGTH_OFFSET + LENGTH_LENGTH;
+pub const CRC_OFFSET: usize = MAGIC_OFFSET + MAGIC_LENGTH;
+pub const SCHEMA_ID_OFFSET: usize = CRC_OFFSET + CRC_LENGTH;
+pub const ATTRIBUTES_OFFSET: usize = SCHEMA_ID_OFFSET + SCHEMA_ID_LENGTH;
+pub const WRITE_CLIENT_ID_OFFSET: usize = ATTRIBUTES_OFFSET + ATTRIBUTE_LENGTH;
+pub const BATCH_SEQUENCE_OFFSET: usize = WRITE_CLIENT_ID_OFFSET + WRITE_CLIENT_ID_LENGTH;
+pub const RECORDS_COUNT_OFFSET: usize = BATCH_SEQUENCE_OFFSET + BATCH_SEQUENCE_LENGTH;
+pub const RECORDS_OFFSET: usize = RECORDS_COUNT_OFFSET + RECORDS_COUNT_LENGTH;
+
+/// Total header size in bytes, which is also the offset of the first record
+pub const RECORD_BATCH_HEADER_SIZE: usize = RECORDS_OFFSET;
+
+/// Bytes of a batch that its Length field does not count: the length field itself
+pub const KV_OVERHEAD: usize = LENGTH_OFFSET + LENGTH_LENGTH;
+
+/// Read-only view over one serialized KV record batch.
+///
+/// The accessors decode header fields in place from `data`, starting at `position`.
+// Reference implementation:
+// https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/record/KvRecordBatch.java
+pub struct KvRecordBatch {
+    data: Bytes, // buffer that holds the serialized batch
+    position: usize, // byte offset in `data` where the batch's length field starts
+}
+
+impl KvRecordBatch {
+    /// Create a view of the batch that starts at byte offset `position` in `data`; nothing is validated here.
+    pub fn new(data: Bytes, position: usize) -> Self {
+        Self { data, position }
+    }
+
+    /// Total serialized size of this batch in bytes: the value of the Length
+    /// field plus the size of the length field itself (`KV_OVERHEAD`).
+    ///
+    /// Fails with `UnexpectedEof` when the length field is not fully present
+    /// and with `InvalidData` when the stored length is negative.
+    pub fn size_in_bytes(&self) -> io::Result<usize> {
+        let field_end = self.position.saturating_add(LENGTH_LENGTH);
+        if field_end > self.data.len() {
+            return Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Not enough bytes to read batch length",
+            ));
+        }
+
+        let mut raw = [0u8; LENGTH_LENGTH];
+        raw.copy_from_slice(&self.data[self.position..field_end]);
+        let stored = i32::from_le_bytes(raw);
+
+        match usize::try_from(stored) {
+            Ok(len) => Ok(len.saturating_add(KV_OVERHEAD)),
+            Err(_) => Err(io::Error::new(
+                io::ErrorKind::InvalidData,
+                format!("Invalid batch length: {}", stored),
+            )),
+        }
+    }
+
+    /// Whether the batch passes its integrity check: it must be at least one header long
+    /// and the stored CRC must equal the recomputed one. Any read failure counts as invalid.
+    pub fn is_valid(&self) -> bool {
+        let long_enough = self
+            .size_in_bytes()
+            .is_ok_and(|total| total >= RECORD_BATCH_HEADER_SIZE);
+        let crc_matches = || {
+            matches!((self.checksum(), self.compute_checksum()), (Ok(a), Ok(b)) if a == b)
+        };
+        long_enough && crc_matches()
+    }
+
+    /// Read the one-byte Magic field; `UnexpectedEof` if the buffer ends before it.
+    pub fn magic(&self) -> io::Result<u8> {
+        let at = self.position.saturating_add(MAGIC_OFFSET);
+        self.data.get(at).copied().ok_or_else(|| {
+            io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Not enough bytes to read magic byte",
+            )
+        })
+    }
+
+    /// Read the CRC stored in the header (little-endian `u32` at `CRC_OFFSET`).
+    /// Fails with `UnexpectedEof` when the field is not fully inside the buffer.
+    pub fn checksum(&self) -> io::Result<u32> {
+        let from = self.position.saturating_add(CRC_OFFSET);
+        let field = self
+            .data
+            .get(from..from.saturating_add(CRC_LENGTH))
+            .and_then(|raw| <[u8; CRC_LENGTH]>::try_from(raw).ok());
+        field.map(u32::from_le_bytes).ok_or_else(|| {
+            io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Not enough bytes to read checksum",
+            )
+        })
+    }
+
+    /// Recompute the CRC32C over the bytes from the SchemaId field to the end
+    /// of the batch, i.e. the region the stored checksum is compared against.
+    pub fn compute_checksum(&self) -> io::Result<u32> {
+        let total = self.size_in_bytes()?;
+        if total < RECORD_BATCH_HEADER_SIZE {
+            let msg = format!(
+                "Batch size {} is less than header size {}",
+                total, RECORD_BATCH_HEADER_SIZE
+            );
+            return Err(io::Error::new(io::ErrorKind::InvalidData, msg));
+        }
+
+        // Saturating arithmetic: an overflowing bound ends up at usize::MAX
+        // and is rejected by the range check below.
+        let covered_from = self.position.saturating_add(SCHEMA_ID_OFFSET);
+        let covered_to = self.position.saturating_add(total);
+        let in_bounds = covered_from < covered_to && covered_to <= self.data.len();
+        if !in_bounds {
+            return Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Not enough bytes to compute checksum",
+            ));
+        }
+        Ok(crc32c::crc32c(&self.data[covered_from..covered_to]))
+    }
+
+    /// Read the SchemaId header field (little-endian `i16` at `SCHEMA_ID_OFFSET`).
+    ///
+    /// Fails with `UnexpectedEof` when the field is not fully inside the buffer.
+    pub fn schema_id(&self) -> io::Result<i16> {
+        let from = self.position.saturating_add(SCHEMA_ID_OFFSET);
+        let until = from.saturating_add(SCHEMA_ID_LENGTH);
+        let field = self
+            .data
+            .get(from..until)
+            .and_then(|raw| <[u8; SCHEMA_ID_LENGTH]>::try_from(raw).ok());
+        match field {
+            Some(raw) => Ok(i16::from_le_bytes(raw)),
+            None => Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Not enough bytes to read schema ID",
+            )),
+        }
+    }
+
+    /// Read the WriterId header field (little-endian `i64` at
+    /// `WRITE_CLIENT_ID_OFFSET`).
+    ///
+    /// Fails with `UnexpectedEof` when the field is not fully inside the buffer.
+    pub fn writer_id(&self) -> io::Result<i64> {
+        let from = self.position.saturating_add(WRITE_CLIENT_ID_OFFSET);
+        let until = from.saturating_add(WRITE_CLIENT_ID_LENGTH);
+
+        // `get` returns `None` for any range that reaches past the buffer,
+        // which includes bounds that saturated, so one lookup covers every
+        // failure case.
+        let field = self
+            .data
+            .get(from..until)
+            .and_then(|raw| <[u8; WRITE_CLIENT_ID_LENGTH]>::try_from(raw).ok());
+
+        match field {
+            Some(raw) => Ok(i64::from_le_bytes(raw)),
+            None => Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Not enough bytes to read writer ID",
+            )),
+        }
+    }
+
+    /// Read the BatchSequence header field (little-endian `i32` at
+    /// `BATCH_SEQUENCE_OFFSET`).
+    ///
+    /// Fails with `UnexpectedEof` when the field is not fully inside the buffer.
+    pub fn batch_sequence(&self) -> io::Result<i32> {
+        let from = self.position.saturating_add(BATCH_SEQUENCE_OFFSET);
+        let until = from.saturating_add(BATCH_SEQUENCE_LENGTH);
+
+        let field = self
+            .data
+            .get(from..until)
+            .and_then(|raw| <[u8; BATCH_SEQUENCE_LENGTH]>::try_from(raw).ok());
+        match field {
+            Some(raw) => Ok(i32::from_le_bytes(raw)),
+            None => Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Not enough bytes to read batch sequence",
+            )),
+        }
+    }
+
+    /// Read the RecordCount header field (little-endian `i32` at
+    /// `RECORDS_COUNT_OFFSET`). The value is returned as stored, without
+    /// checking its sign.
+    ///
+    /// Fails with `UnexpectedEof` when the field is not fully inside the buffer.
+    pub fn record_count(&self) -> io::Result<i32> {
+        let from = self.position.saturating_add(RECORDS_COUNT_OFFSET);
+        let until = from.saturating_add(RECORDS_COUNT_LENGTH);
+        let field = self
+            .data
+            .get(from..until)
+            .and_then(|raw| <[u8; RECORDS_COUNT_LENGTH]>::try_from(raw).ok());
+
+        field.map(i32::from_le_bytes).ok_or_else(|| {
+            io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Not enough bytes to read record count",
+            )
+        })
+    }
+
+    /// Create an iterator over the records in this batch after verifying it.
+    ///
+    /// Returns `InvalidData` when `is_valid()` rejects the batch. Data that is
+    /// already trusted can go through `records_unchecked()` instead, which
+    /// skips that check.
+    pub fn records(&self) -> io::Result<KvRecordIterator> {
+        if self.is_valid() {
+            return self.records_unchecked();
+        }
+        let reason = "Invalid batch checksum";
+        Err(io::Error::new(io::ErrorKind::InvalidData, reason))
+    }
+
+    /// Create an iterator over the records in this batch without validating the checksum.
+    /// Fails if the length or record count cannot be read, or if the count is negative.
+    pub fn records_unchecked(&self) -> io::Result<KvRecordIterator> {
+        let size = self.size_in_bytes()?;
+        let count = self.record_count()?;
+        if count < 0 {
+            let msg = format!("Invalid record count: {}", count);
+            return Err(io::Error::new(io::ErrorKind::InvalidData, msg));
+        }
+        Ok(KvRecordIterator {
+            data: self.data.clone(),
+            // Saturating, like the header accessors: plain `+` could overflow on 32-bit targets.
+            position: self.position.saturating_add(RECORDS_OFFSET),
+            end: self.position.saturating_add(size),
+            remaining_count: count,
+        })
+    }
+}
+
+/// Iterator over records in a KV record batch, as created by `KvRecordBatch::records*`.
+pub struct KvRecordIterator {
+    data: Bytes, // buffer that holds the batch
+    position: usize, // byte offset in `data` of the next record to decode
+    end: usize, // byte offset at which the batch ends; iteration stops once reached
+    remaining_count: i32, // records still to yield; set to 0 after an error
+}
+
+impl Iterator for KvRecordIterator {
+    type Item = io::Result<KvRecord>;
+
+    fn next(&mut self) -> Option<Self::Item> {
+        if self.remaining_count <= 0 || self.position >= self.end {
+            return None; // all announced records yielded, or end of batch reached
+        }
+        let failure = match KvRecord::read_from(&self.data, self.position) {
+            // Accept a record only if it lies entirely inside this batch.
+            Ok((record, size)) if size <= self.end - self.position => {
+                self.position += size;
+                self.remaining_count -= 1;
+                return Some(Ok(record));
+            }
+            Ok(_) => io::Error::new(io::ErrorKind::InvalidData, "Record extends past batch end"),
+            Err(e) => e, // the record could not be decoded
+        };
+        self.remaining_count = 0; // Stop iteration on error
+        Some(Err(failure))
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::KvFormat;
+    use crate::record::kv::{CURRENT_KV_MAGIC_VALUE, KvRecordBatchBuilder};
+    use bytes::{BufMut, BytesMut};
+
+    /// Build a batch view over a buffer that holds nothing but a length field
+    /// with the given value.
+    fn length_only_batch(length: i32) -> KvRecordBatch {
+        let mut raw = BytesMut::new();
+        raw.put_i32_le(length);
+        KvRecordBatch::new(raw.freeze(), 0)
+    }
+
+    #[test]
+    fn test_invalid_batch_lengths() {
+        // A negative length is rejected as soon as the size is read.
+        let negative = length_only_batch(-1);
+        assert!(negative.size_in_bytes().is_err());
+        assert!(!negative.is_valid());
+
+        // The largest representable length cannot be backed by a 4-byte buffer.
+        assert!(!length_only_batch(i32::MAX).is_valid());
+
+        // A plausible length that still exceeds the bytes actually present.
+        assert!(!length_only_batch(100).is_valid());
+    }
+
+    #[test]
+    fn test_kv_record_batch_build_and_read() {
+        use crate::row::compacted::CompactedRowWriter;
+
+        let schema_id = 42;
+        let (writer_id, sequence) = (100, 5);
+
+        // Build a batch holding one record with a value and one without.
+        let mut builder = KvRecordBatchBuilder::new(schema_id, 4096, KvFormat::COMPACTED);
+        builder.set_writer_state(writer_id, sequence);
+
+        let put_key = b"key1";
+        let mut put_row = CompactedRowWriter::new(1);
+        put_row.write_bytes(&[1, 2, 3, 4, 5]);
+        builder.append_row(put_key, Some(&put_row)).unwrap();
+
+        let bare_key = b"key2";
+        builder
+            .append_row::<CompactedRowWriter>(bare_key, None)
+            .unwrap();
+
+        // Read the serialized bytes back through the batch view.
+        let batch = KvRecordBatch::new(builder.build().unwrap(), 0);
+        assert!(batch.is_valid());
+        assert_eq!(batch.magic().unwrap(), CURRENT_KV_MAGIC_VALUE);
+        assert_eq!(batch.schema_id().unwrap(), schema_id as i16);
+        assert_eq!(batch.writer_id().unwrap(), writer_id);
+        assert_eq!(batch.batch_sequence().unwrap(), sequence);
+        assert_eq!(batch.record_count().unwrap(), 2);
+
+        // Every record must decode, in append order.
+        let decoded: Vec<_> = batch.records().unwrap().collect();
+        assert_eq!(decoded.len(), 2);
+
+        // First record: key and value come back unchanged.
+        let first = decoded[0].as_ref().unwrap();
+        assert_eq!(first.key().as_ref(), put_key);
+        assert_eq!(first.value().unwrap().as_ref(), put_row.buffer());
+
+        // Second record: key only.
+        let second = decoded[1].as_ref().unwrap();
+        assert_eq!(second.key().as_ref(), bare_key);
+        assert!(second.value().is_none());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
new file mode 100644
index 0000000000..773c7789b5
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
@@ -0,0 +1,581 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! KV record batch builder implementation.
+//!
+//! This module provides the KvRecordBatchBuilder for building batches of KV records.
+
+use bytes::{Bytes, BytesMut};
+use std::io;
+
+use crate::metadata::KvFormat;
+use crate::record::kv::kv_record::KvRecord;
+use crate::record::kv::kv_record_batch::{
+    ATTRIBUTES_OFFSET, BATCH_SEQUENCE_OFFSET, CRC_OFFSET, LENGTH_LENGTH, LENGTH_OFFSET,
+    MAGIC_OFFSET, RECORD_BATCH_HEADER_SIZE, RECORDS_COUNT_OFFSET, SCHEMA_ID_OFFSET,
+    WRITE_CLIENT_ID_OFFSET,
+};
+use crate::record::kv::{CURRENT_KV_MAGIC_VALUE, NO_BATCH_SEQUENCE, NO_WRITER_ID};
+use crate::row::BinaryRow;
+
+/// Builder for KvRecordBatch.
+///
+/// This builder accumulates KV records in an internal buffer and, on `build`, fills in
+/// the batch header (including the CRC32C checksum) and returns the serialized bytes.
+// Reference implementation:
+// https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/record/KvRecordBatchBuilder.java
+pub struct KvRecordBatchBuilder {
+    schema_id: i32, // written to the header as an i16
+    magic: u8, // magic byte written to the header
+    write_limit: usize, // upper bound on `size_in_bytes`, enforced by `append_row`
+    buffer: BytesMut, // reserved header space followed by the appended records
+    writer_id: i64, // header field; `NO_WRITER_ID` until `set_writer_state` is called
+    batch_sequence: i32, // header field; `NO_BATCH_SEQUENCE` until `set_writer_state` is called
+    current_record_number: i32, // number of records appended so far
+    size_in_bytes: usize, // header size plus the size of every appended record
+    is_closed: bool, // set by `close`; makes `append_row` fail
+    kv_format: KvFormat, // `append_row` only accepts `KvFormat::COMPACTED`
+    aborted: bool, // set by `abort`; makes `append_row`, `build` and `close` fail
+    built_buffer: Option<Bytes>, // bytes of the last `build`; cleared by `append_row` and `set_writer_state`
+}
+
+impl KvRecordBatchBuilder {
+    /// Create a new KvRecordBatchBuilder.
+    ///
+    /// # Arguments
+    /// * `schema_id` - The schema ID for records in this batch (must fit in i16)
+    /// * `write_limit` - Maximum serialized size of the batch in bytes, header included
+    /// * `kv_format` - The KV format (Compacted, Indexed, or Aligned)
+    /// Panics if `schema_id` is outside the `i16` range, because the header stores it as `i16`.
+    pub fn new(schema_id: i32, write_limit: usize, kv_format: KvFormat) -> Self {
+        assert!(
+            schema_id <= i16::MAX as i32,
+            "schema_id shouldn't be greater than the max value of i16: {}",
+            i16::MAX
+        );
+        // A value below i16::MIN would be truncated just the same when the header is written.
+        assert!(schema_id >= i16::MIN as i32, "schema_id shouldn't be less than {}", i16::MIN);
+        // Start with a zeroed header; `build` fills it in once the contents are known.
+        let mut buffer = BytesMut::with_capacity(write_limit.max(RECORD_BATCH_HEADER_SIZE));
+        buffer.resize(RECORD_BATCH_HEADER_SIZE, 0);
+        Self {
+            schema_id,
+            magic: CURRENT_KV_MAGIC_VALUE,
+            write_limit,
+            buffer,
+            writer_id: NO_WRITER_ID,
+            batch_sequence: NO_BATCH_SEQUENCE,
+            current_record_number: 0,
+            size_in_bytes: RECORD_BATCH_HEADER_SIZE,
+            is_closed: false,
+            kv_format,
+            aborted: false,
+            built_buffer: None,
+        }
+    }
+
+    /// Check whether the current batch size plus the size of a record with the given key and
+    /// row stays within `write_limit`. An empty batch is not special-cased: it can return false.
+    pub fn has_room_for_row<R: BinaryRow>(&self, key: &[u8], row: Option<&R>) -> bool {
+        let value = row.map(|r| r.as_bytes());
+        self.size_in_bytes + KvRecord::size_of(key, value) <= self.write_limit
+    }
+
+    /// Append one KV record to the batch. Passing `None` for `row` writes a
+    /// record that carries a key but no value.
+    ///
+    /// The following checks run in order and the first failure is returned:
+    /// - `InvalidInput` if the KV format is not COMPACTED
+    /// - an `Other` error if the builder has been aborted
+    /// - an `Other` error if the builder is closed
+    /// - `InvalidInput` if the batch already holds `i32::MAX` records
+    /// - `WriteZero` if the record would push the batch past the write limit
+    pub fn append_row<R: BinaryRow>(&mut self, key: &[u8], row: Option<&R>) -> io::Result<()> {
+        // Builder-state checks come first, in the documented order.
+        let state_error = if self.kv_format != KvFormat::COMPACTED {
+            Some(io::Error::new(
+                io::ErrorKind::InvalidInput,
+                "append_row can only be used with KvFormat::COMPACTED",
+            ))
+        } else if self.aborted {
+            Some(io::Error::other(
+                "Tried to append a record, but KvRecordBatchBuilder has already been aborted",
+            ))
+        } else if self.is_closed {
+            Some(io::Error::other(
+                "Tried to append a record, but KvRecordBatchBuilder is closed for record appends",
+            ))
+        } else if self.current_record_number == i32::MAX {
+            Some(io::Error::new(
+                io::ErrorKind::InvalidInput,
+                format!(
+                    "Maximum number of records per batch exceeded, max records: {}",
+                    i32::MAX
+                ),
+            ))
+        } else {
+            None
+        };
+        if let Some(err) = state_error {
+            return Err(err);
+        }
+
+        // Then the size check, using the exact serialized size of the record.
+        let payload = row.map(|r| r.as_bytes());
+        let needed = KvRecord::size_of(key, payload);
+        if self.size_in_bytes + needed > self.write_limit {
+            let msg = format!(
+                "Adding record would exceed write limit: {} + {} > {}",
+                self.size_in_bytes, needed, self.write_limit
+            );
+            return Err(io::Error::new(io::ErrorKind::WriteZero, msg));
+        }
+
+        let written = KvRecord::write_to_buf(&mut self.buffer, key, payload)?;
+        debug_assert_eq!(written, needed, "Record size mismatch");
+
+        self.current_record_number += 1;
+        self.size_in_bytes += written;
+
+        // The previously built bytes no longer reflect the batch contents.
+        self.built_buffer = None;
+
+        Ok(())
+    }
+
+    /// Record the writer ID and batch sequence to be written into the batch header.
+    ///
+    /// Any previously built bytes are discarded, so the next call to
+    /// [`build`](Self::build) serializes the header again with these values.
+    pub fn set_writer_state(&mut self, writer_id: i64, batch_base_sequence: i32) {
+        // Drop the cached bytes first: they carry the old header fields.
+        self.built_buffer = None;
+        self.batch_sequence = batch_base_sequence;
+        self.writer_id = writer_id;
+    }
+
+    /// Serialize the batch (header followed by the appended records) and return its bytes.
+    ///
+    /// Returns an error if the builder has been aborted or the header cannot be written.
+    ///
+    /// # Caching and Mutations
+    ///
+    /// The bytes of a successful build are kept and returned again by later calls, so
+    /// this can be called repeatedly. They are discarded, and the next call serializes
+    /// the batch afresh, after either of:
+    /// - [`append_row`](Self::append_row) adding a record
+    /// - [`set_writer_state`](Self::set_writer_state) changing the writer metadata
+    ///
+    /// Note: [`close`](Self::close) prevents further appends but does not prevent writer
+    /// state modifications, so a closed builder can still produce different bytes.
+    pub fn build(&mut self) -> io::Result<Bytes> {
+        if self.aborted {
+            return Err(io::Error::other(
+                "Attempting to build an aborted record batch",
+            ));
+        }
+
+        // Reuse the bytes of the previous build when nothing changed since.
+        let bytes = match self.built_buffer.take() {
+            Some(cached) => cached,
+            None => {
+                self.write_batch_header()?;
+                self.buffer.clone().freeze()
+            }
+        };
+        self.built_buffer = Some(bytes.clone());
+        Ok(bytes)
+    }
+
+    /// Writer ID that `build` puts in the header; `NO_WRITER_ID` until `set_writer_state` is called.
+    pub fn writer_id(&self) -> i64 {
+        self.writer_id
+    }
+
+    /// Batch sequence that `build` puts in the header; `NO_BATCH_SEQUENCE` until `set_writer_state` is called.
+    pub fn batch_sequence(&self) -> i32 {
+        self.batch_sequence
+    }
+
+    /// Whether `close` has been called successfully on this builder.
+    pub fn is_closed(&self) -> bool {
+        self.is_closed
+    }
+
+    /// Abort the builder.
+    /// After aborting, `append_row`, `build` and `close` all return errors.
+    pub fn abort(&mut self) {
+        self.aborted = true;
+    }
+
+    /// Close the builder for appends.
+    /// Later `append_row` calls fail while `build` keeps working; closing an aborted builder is an error.
+    pub fn close(&mut self) -> io::Result<()> {
+        if !self.aborted {
+            self.is_closed = true;
+            return Ok(());
+        }
+        Err(io::Error::other(
+            "Cannot close KvRecordBatchBuilder as it has already been aborted",
+        ))
+    }
+
+    /// Current serialized size of the batch in bytes: the header plus every record appended so far.
+    pub fn get_size_in_bytes(&self) -> usize {
+        self.size_in_bytes
+    }
+
+    // ----------------------- Internal methods -------------------------------
+
+    /// Fill in the header space reserved at the front of the buffer.
+    ///
+    /// Writes, in little-endian: the batch length (excluding the length field
+    /// itself), magic, schema ID, attributes, writer ID, batch sequence and
+    /// record count, then the CRC32C of everything from the schema ID onward.
+    /// Fails with `InvalidInput` when the length does not fit in an `i32`.
+    fn write_batch_header(&mut self) -> io::Result<()> {
+        let body_len = self.size_in_bytes - LENGTH_LENGTH;
+        let Ok(length_field) = i32::try_from(body_len) else {
+            return Err(io::Error::new(
+                io::ErrorKind::InvalidInput,
+                format!("Batch size {} exceeds i32::MAX", body_len),
+            ));
+        };
+
+        // Gather every field value up front; the header slice below holds a
+        // mutable borrow of the buffer.
+        let magic = self.magic;
+        let schema_id = (self.schema_id as i16).to_le_bytes();
+        let attributes = self.compute_attributes();
+        let writer_id = self.writer_id.to_le_bytes();
+        let batch_sequence = self.batch_sequence.to_le_bytes();
+        let record_count = self.current_record_number.to_le_bytes();
+
+        let header = &mut self.buffer[..RECORD_BATCH_HEADER_SIZE];
+
+        // Length and magic
+        header[LENGTH_OFFSET..][..LENGTH_LENGTH].copy_from_slice(&length_field.to_le_bytes());
+        header[MAGIC_OFFSET] = magic;
+
+        // The CRC slot stays zero until the checksum is known
+        header[CRC_OFFSET..][..4].copy_from_slice(&0u32.to_le_bytes());
+
+        // Schema ID and attributes
+        header[SCHEMA_ID_OFFSET..][..2].copy_from_slice(&schema_id);
+        header[ATTRIBUTES_OFFSET] = attributes;
+
+        // Writer ID and batch sequence
+        header[WRITE_CLIENT_ID_OFFSET..][..8].copy_from_slice(&writer_id);
+        header[BATCH_SEQUENCE_OFFSET..][..4].copy_from_slice(&batch_sequence);
+
+        // Record count
+        header[RECORDS_COUNT_OFFSET..][..4].copy_from_slice(&record_count);
+
+        // The checksum covers the schema ID through the last record and is
+        // patched into the slot that was zeroed above.
+        let checksum = crc32c::crc32c(&self.buffer[SCHEMA_ID_OFFSET..self.size_in_bytes]);
+        self.buffer[CRC_OFFSET..][..4].copy_from_slice(&checksum.to_le_bytes());
+
+        Ok(())
+    }
+
+    /// Value for the header's Attributes byte; always 0 at present.
+    fn compute_attributes(&self) -> u8 {
+        // No attribute bits are set by this builder yet
+        0
+    }
+}
+
+impl Drop for KvRecordBatchBuilder {
+    fn drop(&mut self) {
+        // Warn only if records were appended, the builder was not aborted, and no built bytes are cached
+        if self.current_record_number > 0 && !self.aborted && self.built_buffer.is_none() {
+            eprintln!(
+                "Warning: KvRecordBatchBuilder dropped with {} record(s) that were never built. \
+                 Call build() to serialize the batch before dropping.",
+                self.current_record_number
+            );
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::row::compacted::CompactedRowWriter;
+
+    // Test helper: a one-field CompactedRowWriter whose only field holds `data` as bytes.
+    fn create_test_row(data: &[u8]) -> CompactedRowWriter {
+        let mut single_field_row = CompactedRowWriter::new(1);
+        single_field_row.write_bytes(data);
+        single_field_row
+    }
+
+    #[test]
+    fn test_builder_basic_workflow() {
+        let write_limit = 4096;
+        let mut builder = KvRecordBatchBuilder::new(42, write_limit, KvFormat::COMPACTED);
+
+        // A fresh builder is open and carries the "unset" writer state.
+        assert!(!builder.is_closed());
+        assert_eq!(builder.writer_id(), NO_WRITER_ID);
+        assert_eq!(builder.batch_sequence(), NO_BATCH_SEQUENCE);
+
+        // The writer state is readable right after it is set.
+        builder.set_writer_state(100, 5);
+        assert_eq!(builder.writer_id(), 100);
+        assert_eq!(builder.batch_sequence(), 5);
+
+        // One record with a value ...
+        let valued_key = b"key1";
+        let row = create_test_row(b"value1");
+        assert!(builder.has_room_for_row(valued_key, Some(&row)));
+        builder.append_row(valued_key, Some(&row)).unwrap();
+
+        // ... and one without.
+        let bare_key = b"key2";
+        assert!(builder.has_room_for_row::<CompactedRowWriter>(bare_key, None));
+        builder
+            .append_row::<CompactedRowWriter>(bare_key, None)
+            .unwrap();
+
+        // A closed builder reports itself as closed and can still be built.
+        builder.close().unwrap();
+        assert!(builder.is_closed());
+
+        let first_build = builder.build().unwrap();
+        assert!(first_build.len() > RECORD_BATCH_HEADER_SIZE);
+
+        // A second build yields bytes of the same length.
+        let second_build = builder.build().unwrap();
+        assert_eq!(first_build.len(), second_build.len());
+    }
+
+    #[test]
+    fn test_builder_lifecycle() {
+        // Abort and close are one-way switches, so each phase below gets a
+        // builder of its own.
+        // Phase 1: abort. Afterwards appending, building and closing all fail.
+        let mut aborted = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
+        let row = create_test_row(b"value");
+        aborted.append_row(b"key", Some(&row)).unwrap();
+        aborted.abort();
+
+        let append_after_abort = aborted.append_row::<CompactedRowWriter>(b"key2", None);
+        assert!(append_after_abort.is_err());
+        assert!(aborted.build().is_err());
+        assert!(aborted.close().is_err());
+
+        // Phase 2: close. Afterwards appending fails ...
+        let mut closed = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
+        let row = create_test_row(b"value");
+        closed.append_row(b"key", Some(&row)).unwrap();
+        closed.close().unwrap();
+
+        let append_after_close = closed.append_row::<CompactedRowWriter>(b"key2", None);
+        assert!(append_after_close.is_err());
+
+        // ... while building still succeeds.
+        assert!(closed.build().is_ok());
+    }
+
+    #[test]
+    fn test_write_limit_enforcement() {
+        // A 100-byte limit leaves room for a tiny record but not for a ~1 KB one.
+        let write_limit = 100;
+        let mut builder = KvRecordBatchBuilder::new(1, write_limit, KvFormat::COMPACTED);
+        let oversized_key = vec![0u8; 1000];
+        let oversized_row = create_test_row(&[1u8; 1000]);
+        let tiny_row = create_test_row(b"value");
+
+        // has_room_for_row only inspects the builder; nothing is appended here.
+        assert!(!builder.has_room_for_row(&oversized_key, Some(&oversized_row)));
+        assert!(builder.has_room_for_row(b"key", Some(&tiny_row)));
+
+        // The tiny record is accepted ...
+        builder.append_row(b"key", Some(&tiny_row)).unwrap();
+
+        // ... and the oversized row is then rejected with WriteZero.
+        let rejected = builder.append_row(b"key2", Some(&oversized_row));
+        assert!(rejected.is_err());
+        assert_eq!(rejected.unwrap_err().kind(), io::ErrorKind::WriteZero);
+    }
+
+    #[test]
+    fn test_append_checks_record_count_limit() {
+        // Pretend the batch is one record short of the i32::MAX record cap.
+        let mut builder = KvRecordBatchBuilder::new(1, 100000, KvFormat::COMPACTED);
+        builder.current_record_number = i32::MAX - 1;
+
+        // The append that reaches the cap succeeds; the one after it must not.
+        let last_accepted = create_test_row(b"value1");
+        builder.append_row(b"key1", Some(&last_accepted)).unwrap();
+        let one_too_many = create_test_row(b"value2");
+        let overflow = builder.append_row(b"key2", Some(&one_too_many));
+        assert_eq!(overflow.unwrap_err().kind(), io::ErrorKind::InvalidInput);
+    }
+
+    #[test]
+    #[should_panic(expected = "schema_id shouldn't be greater than")]
+    fn test_builder_invalid_schema_id() {
+        KvRecordBatchBuilder::new(i32::from(i16::MAX) + 1, 4096, KvFormat::COMPACTED);
+    }
+
+    #[test]
+    fn test_cache_invalidation_on_append() {
+        use crate::record::kv::KvRecordBatch;
+
+        let mut builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
+        builder.set_writer_state(100, 5);
+
+        // First build: a single record.
+        let first_row = create_test_row(b"value1");
+        builder.append_row(b"key1", Some(&first_row)).unwrap();
+        let single = builder.build().unwrap();
+
+        // Appending after a build must drop the cached bytes, so the next
+        // build serializes both records.
+        let second_row = create_test_row(b"value2");
+        builder.append_row(b"key2", Some(&second_row)).unwrap();
+        let double = builder.build().unwrap();
+        assert!(double.len() > single.len(), "Second build should be larger");
+
+        // The rebuilt bytes form a valid batch that reports two records.
+        let batch = KvRecordBatch::new(double, 0);
+        assert!(batch.is_valid());
+        assert_eq!(batch.record_count().unwrap(), 2, "Should have 2 records");
+    }
+
+    #[test]
+    fn test_cache_invalidation_on_set_writer_state() {
+        use crate::record::kv::KvRecordBatch;
+
+        let mut builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
+        let row = create_test_row(b"value");
+
+        // Build once under writer 100, sequence 5.
+        builder.set_writer_state(100, 5);
+        builder.append_row(b"key", Some(&row)).unwrap();
+        let before = builder.build().unwrap();
+
+        // Changing the writer state must force the next build to re-serialize.
+        builder.set_writer_state(200, 10);
+        let after = builder.build().unwrap();
+        assert_ne!(
+            before, after,
+            "Bytes should differ after writer state change"
+        );
+
+        // Each build carries the writer state that was current when it was made.
+        let old_batch = KvRecordBatch::new(before, 0);
+        assert_eq!(old_batch.writer_id().unwrap(), 100);
+        assert_eq!(old_batch.batch_sequence().unwrap(), 5);
+        let new_batch = KvRecordBatch::new(after, 0);
+        assert_eq!(new_batch.writer_id().unwrap(), 200);
+        assert_eq!(new_batch.batch_sequence().unwrap(), 10);
+    }
+
+    #[test]
+    fn test_builder_with_compacted_row_writer() {
+        use crate::metadata::{DataType, IntType, StringType};
+        use crate::record::kv::KvRecordBatch;
+        use crate::row::InternalRow;
+        use crate::row::compacted::CompactedRow;
+
+        let mut builder = KvRecordBatchBuilder::new(1, 100000, KvFormat::COMPACTED);
+        builder.set_writer_state(100, 5);
+        // Field types handed to CompactedRow::from_bytes when decoding the values below.
+        let types = vec![
+            DataType::Int(IntType::new()),
+            DataType::String(StringType::new()),
+        ];
+
+        // Create and append first record with CompactedRowWriter
+        let mut row_writer1 = CompactedRowWriter::new(2);
+        row_writer1.write_int(42);
+        row_writer1.write_string("hello");
+
+        let key1 = b"key1";
+        assert!(builder.has_room_for_row(key1, Some(&row_writer1)));
+        builder.append_row(key1, Some(&row_writer1)).unwrap();
+
+        // Create and append second record
+        let mut row_writer2 = CompactedRowWriter::new(2);
+        row_writer2.write_int(100);
+        row_writer2.write_string("world");
+
+        let key2 = b"key2";
+        builder.append_row(key2, Some(&row_writer2)).unwrap();
+
+        // Append a deletion record (a key with no value)
+        let key3 = b"key3";
+        builder
+            .append_row::<CompactedRowWriter>(key3, None)
+            .unwrap();
+
+        // Close the builder, build the batch bytes and verify the batch-level fields
+        builder.close().unwrap();
+        let bytes = builder.build().unwrap();
+
+        let batch = KvRecordBatch::new(bytes, 0);
+        assert!(batch.is_valid());
+        assert_eq!(batch.record_count().unwrap(), 3);
+        assert_eq!(batch.writer_id().unwrap(), 100);
+        assert_eq!(batch.batch_sequence().unwrap(), 5);
+
+        // Read back and verify records
+        let records: Vec<_> = batch.records().unwrap().collect();
+        assert_eq!(records.len(), 3);
+
+        // Verify first record
+        let record1 = records[0].as_ref().unwrap();
+        assert_eq!(record1.key().as_ref(), key1);
+        let row1 = CompactedRow::from_bytes(&types, record1.value().unwrap());
+        assert_eq!(row1.get_int(0), 42);
+        assert_eq!(row1.get_string(1), "hello");
+
+        // Verify second record
+        let record2 = records[1].as_ref().unwrap();
+        assert_eq!(record2.key().as_ref(), key2);
+        let row2 = CompactedRow::from_bytes(&types, record2.value().unwrap());
+        assert_eq!(row2.get_int(0), 100);
+        assert_eq!(row2.get_string(1), "world");
+
+        // Verify deletion record: the key is present but there is no value
+        let record3 = records[2].as_ref().unwrap();
+        assert_eq!(record3.key().as_ref(), key3);
+        assert!(record3.value().is_none());
+    }
+
+    #[test]
+    fn test_kv_format_validation() {
+        let mut row_writer = CompactedRowWriter::new(1);
+        row_writer.write_int(42);
+
+        // A builder in INDEXED format must reject append_row with an InvalidInput error
+        let mut indexed_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::INDEXED);
+        let result = indexed_builder.append_row(b"key", Some(&row_writer));
+        assert!(result.is_err());
+        assert_eq!(result.unwrap_err().kind(), io::ErrorKind::InvalidInput);
+
+        // A builder in COMPACTED format must accept the same row
+        let mut compacted_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
+        let result = compacted_builder.append_row(b"key", Some(&row_writer));
+        assert!(result.is_ok());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/record/kv/mod.rs b/fluss-rust/crates/fluss/src/record/kv/mod.rs
new file mode 100644
index 0000000000..ecb762df16
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/kv/mod.rs
@@ -0,0 +1,35 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Key-Value record and batch implementations.
+
+mod kv_record;
+mod kv_record_batch;
+mod kv_record_batch_builder;
+
+pub use kv_record::{KvRecord, LENGTH_LENGTH as KV_RECORD_LENGTH_LENGTH};
+pub use kv_record_batch::*;
+pub use kv_record_batch_builder::*;
+
+/// Magic value of the current KV format (presumably stored in the batch header; confirm).
+pub const CURRENT_KV_MAGIC_VALUE: u8 = 0;
+
+/// Sentinel writer ID (-1) standing for "no writer ID".
+pub const NO_WRITER_ID: i64 = -1;
+
+/// Sentinel batch sequence (-1) standing for "no batch sequence".
+pub const NO_BATCH_SEQUENCE: i32 = -1;
diff --git a/fluss-rust/crates/fluss/src/record/mod.rs b/fluss-rust/crates/fluss/src/record/mod.rs
index 35928ea082..c5a3f8e4b6 100644
--- a/fluss-rust/crates/fluss/src/record/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/mod.rs
@@ -22,6 +22,7 @@ use std::collections::HashMap;
 
 mod arrow;
 mod error;
+pub mod kv;
 
 pub use arrow::*;
 
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
index 84a6b22724..1152b0c5d2 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
@@ -30,6 +30,12 @@ pub struct CompactedKeyWriter {
     delegate: CompactedRowWriter,
 }
 
+impl Default for CompactedKeyWriter {
+    fn default() -> CompactedKeyWriter {
+        CompactedKeyWriter::new()
+    }
+}
+
 impl CompactedKeyWriter {
     pub fn new() -> CompactedKeyWriter {
         CompactedKeyWriter {
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index c053d4ec31..5ec260897e 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -19,6 +19,7 @@ use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
 use crate::{
     metadata::DataType,
     row::{Datum, GenericRow, compacted::compacted_row_writer::CompactedRowWriter},
+    util::varint::{read_unsigned_varint_at, read_unsigned_varint_u64_at},
 };
 use std::str::from_utf8;
 
@@ -150,36 +151,18 @@ impl<'a> CompactedRowReader<'a> {
         (val, next_pos)
     }
 
-    pub fn read_int(&self, mut pos: usize) -> (i32, usize) {
-        let mut result: u32 = 0;
-        let mut shift = 0;
-
-        for _ in 0..CompactedRowWriter::MAX_INT_SIZE {
-            let (b, next_pos) = self.read_byte(pos);
-            pos = next_pos;
-            result |= ((b & 0x7F) as u32) << shift;
-            if (b & 0x80) == 0 {
-                return (result as i32, pos);
-            }
-            shift += 7;
+    pub fn read_int(&self, pos: usize) -> (i32, usize) {
+        match read_unsigned_varint_at(self.segment, pos, CompactedRowWriter::MAX_INT_SIZE) {
+            Ok((value, next_pos)) => (value as i32, next_pos),
+            Err(_) => panic!("Invalid VarInt32 input stream."),
         }
-        panic!("Invalid VarInt32 input stream.");
     }
 
-    pub fn read_long(&self, mut pos: usize) -> (i64, usize) {
-        let mut result: u64 = 0;
-        let mut shift = 0;
-
-        for _ in 0..CompactedRowWriter::MAX_LONG_SIZE {
-            let (b, next_pos) = self.read_byte(pos);
-            pos = next_pos;
-            result |= ((b & 0x7F) as u64) << shift;
-            if (b & 0x80) == 0 {
-                return (result as i64, pos);
-            }
-            shift += 7;
+    pub fn read_long(&self, pos: usize) -> (i64, usize) {
+        match read_unsigned_varint_u64_at(self.segment, pos, CompactedRowWriter::MAX_LONG_SIZE) {
+            Ok((value, next_pos)) => (value as i64, next_pos),
+            Err(_) => panic!("Invalid VarInt64 input stream."),
         }
-        panic!("Invalid VarInt64 input stream.");
     }
 
     pub fn read_float(&self, pos: usize) -> (f32, usize) {
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
index 4f535c6bf0..63b32a3dca 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -18,7 +18,9 @@
 use bytes::{Bytes, BytesMut};
 use std::cmp;
 
+use crate::row::BinaryRow;
 use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
+use crate::util::varint::{write_unsigned_varint_to_slice, write_unsigned_varint_u64_to_slice};
 
 // Writer for CompactedRow
 // Reference implementation:
@@ -125,25 +127,16 @@ impl CompactedRowWriter {
 
     pub fn write_int(&mut self, value: i32) {
         self.ensure_capacity(Self::MAX_INT_SIZE);
-        let mut v = value as u32;
-        while (v & !0x7F) != 0 {
-            self.buffer[self.position] = ((v as u8) & 0x7F) | 0x80;
-            self.position += 1;
-            v >>= 7;
-        }
-        self.buffer[self.position] = v as u8;
-        self.position += 1;
+        let bytes_written =
+            write_unsigned_varint_to_slice(value as u32, &mut self.buffer[self.position..]);
+        self.position += bytes_written;
     }
+
     pub fn write_long(&mut self, value: i64) {
         self.ensure_capacity(Self::MAX_LONG_SIZE);
-        let mut v = value as u64;
-        while (v & !0x7F) != 0 {
-            self.buffer[self.position] = ((v as u8) & 0x7F) | 0x80;
-            self.position += 1;
-            v >>= 7;
-        }
-        self.buffer[self.position] = v as u8;
-        self.position += 1;
+        let bytes_written =
+            write_unsigned_varint_u64_to_slice(value as u64, &mut self.buffer[self.position..]);
+        self.position += bytes_written;
     }
 
     pub fn write_float(&mut self, value: f32) {
@@ -154,3 +147,9 @@ impl CompactedRowWriter {
         self.write_raw(&value.to_ne_bytes());
     }
 }
+
+impl BinaryRow for CompactedRowWriter {
+    fn as_bytes(&self) -> &[u8] {
+        self.buffer() // the row bytes are whatever the writer's `buffer()` accessor exposes
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index c321ab9d6b..144d64fd88 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -20,13 +20,18 @@ mod column;
 mod datum;
 
 mod binary;
-mod compacted;
+pub mod compacted;
 mod encode;
 mod field_getter;
 
 pub use column::*;
 pub use datum::*;
 
+pub trait BinaryRow {
+    /// Returns the binary representation of this row as a byte slice borrowed from `self`.
+    fn as_bytes(&self) -> &[u8];
+}
+
 // TODO make functions return Result<?> for better error handling
 pub trait InternalRow {
     /// Returns the number of fields in this row
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
index 5f67290e43..d191615e86 100644
--- a/fluss-rust/crates/fluss/src/util/mod.rs
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 pub mod murmur_hash;
+pub mod varint;
 
 use crate::metadata::TableBucket;
 use linked_hash_map::LinkedHashMap;
diff --git a/fluss-rust/crates/fluss/src/util/varint.rs b/fluss-rust/crates/fluss/src/util/varint.rs
new file mode 100644
index 0000000000..96fd1f50bf
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/util/varint.rs
@@ -0,0 +1,502 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Variable-length integer encoding utilities.
+//!
+//! This module provides utilities for encoding integers in variable-length format,
+//! which can save space when encoding small integers. The encoding uses 7 bits per byte
+//! with the most significant bit as a continuation flag.
+
+use bytes::BufMut;
+use std::io::{self, Read, Write};
+
+/// Encode `value` as an unsigned varint and write it to `writer`.
+///
+/// Every byte carries 7 payload bits, low group first, with the MSB set while more bytes
+/// follow (the scheme Google Protocol Buffers uses). Returns the number of bytes written.
+#[allow(dead_code)]
+pub fn write_unsigned_varint<W: Write>(value: u32, writer: &mut W) -> io::Result<usize> {
+    let mut remaining = value;
+    let mut count = 1; // the terminating byte is always written
+
+    while remaining >= 0x80 {
+        let continued = (remaining as u8) | 0x80;
+        writer.write_all(&[continued])?;
+        count += 1;
+        remaining >>= 7;
+    }
+    writer.write_all(&[remaining as u8])?;
+
+    Ok(count)
+}
+
+/// Append `value` to `buf` as an unsigned varint (7 payload bits per byte, low group first).
+pub fn write_unsigned_varint_buf(value: u32, buf: &mut impl BufMut) {
+    let mut remaining = value;
+
+    while remaining >= 0x80 {
+        buf.put_u8((remaining as u8) | 0x80);
+        remaining >>= 7;
+    }
+    buf.put_u8(remaining as u8);
+}
+
+/// Read an unsigned integer stored in variable-length format.
+///
+/// Consumes one to five bytes from `reader`. Every byte contributes its low 7 bits,
+/// least-significant group first, and a clear top bit marks the final byte.
+///
+/// # Errors
+/// - Propagates any error returned by `reader.read_exact`, e.g. when the input ends
+///   in the middle of an encoding.
+/// - Returns `InvalidData` if the fifth byte still has its continuation bit set.
+#[allow(dead_code)]
+pub fn read_unsigned_varint<R: Read>(reader: &mut R) -> io::Result<u32> {
+    // Bit offsets of the 7-bit groups carried by the first four bytes.
+    const LEADING_SHIFTS: [u32; 4] = [0, 7, 14, 21];
+
+    let mut one_byte = [0u8; 1];
+    let mut decoded: u32 = 0;
+
+    for &shift in LEADING_SHIFTS.iter() {
+        reader.read_exact(&mut one_byte)?;
+        let current = one_byte[0];
+
+        // Merge the 7 payload bits of this byte into the result.
+        let payload = (current & 0x7F) as u32;
+        decoded |= payload << shift;
+
+        // A clear top bit means this byte ends the encoding.
+        let is_last = (current & 0x80) == 0;
+        if is_last {
+            return Ok(decoded);
+        }
+    }
+
+    // Four continuation bytes were seen, so a fifth byte must follow and must
+    // terminate the encoding.
+    reader.read_exact(&mut one_byte)?;
+    let last = one_byte[0];
+
+    let continuation_set = (last & 0x80) != 0;
+    if continuation_set {
+        return Err(io::Error::new(
+            io::ErrorKind::InvalidData,
+            "Invalid u32 varint encoding: too many bytes (most significant bit in the 5th byte is set)",
+        ));
+    }
+
+    // Only the low 4 bits of the final byte land inside the u32; any higher payload
+    // bits are shifted out, exactly as a plain `<< 28` on the byte value does.
+    decoded |= (last as u32) << 28;
+    Ok(decoded)
+}
+
+/// Decode a u32 varint from the start of `bytes`; returns `(value, bytes_consumed)` or an error.
+pub fn read_unsigned_varint_bytes(bytes: &[u8]) -> io::Result<(u32, usize)> {
+    if bytes.is_empty() {
+        return Err(io::Error::new(
+            io::ErrorKind::UnexpectedEof,
+            "Cannot read varint from empty buffer",
+        ));
+    }
+    // Bytes are reinterpreted as i8 so a set continuation bit (0x80) reads as a negative value.
+    let mut byte = bytes[0] as i8;
+    let mut index = 1;
+    // Single-byte encoding: the value is the byte itself.
+    if byte >= 0 {
+        return Ok((byte as u32, index));
+    }
+
+    let mut result = (byte & 127) as u32;
+    // Every further byte is bounds-checked before it is read (UnexpectedEof otherwise).
+    if index >= bytes.len() {
+        return Err(io::Error::new(
+            io::ErrorKind::UnexpectedEof,
+            "Incomplete varint",
+        ));
+    }
+    byte = bytes[index] as i8;
+    index += 1;
+    if byte >= 0 {
+        result |= (byte as u32) << 7;
+    } else {
+        result |= ((byte & 127) as u32) << 7;
+
+        if index >= bytes.len() {
+            return Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Incomplete varint",
+            ));
+        }
+        byte = bytes[index] as i8;
+        index += 1;
+        if byte >= 0 {
+            result |= (byte as u32) << 14;
+        } else {
+            result |= ((byte & 127) as u32) << 14;
+
+            if index >= bytes.len() {
+                return Err(io::Error::new(
+                    io::ErrorKind::UnexpectedEof,
+                    "Incomplete varint",
+                ));
+            }
+            byte = bytes[index] as i8;
+            index += 1;
+            if byte >= 0 {
+                result |= (byte as u32) << 21;
+            } else {
+                result |= ((byte & 127) as u32) << 21;
+
+                if index >= bytes.len() {
+                    return Err(io::Error::new(
+                        io::ErrorKind::UnexpectedEof,
+                        "Incomplete varint",
+                    ));
+                }
+                byte = bytes[index] as i8;
+                index += 1;
+                result |= (byte as u32) << 28;
+                // The fifth byte must be the last one: a set top bit here is rejected.
+                if byte < 0 {
+                    return Err(io::Error::new(
+                        io::ErrorKind::InvalidData,
+                        "Invalid u32 varint encoding: too many bytes (most significant bit in the 5th byte is set)",
+                    ));
+                }
+            }
+        }
+    }
+
+    Ok((result, index))
+}
+
+/// Number of bytes needed to encode a `u32` as an unsigned varint (always 1 to 5).
+///
+/// A varint stores 7 payload bits per byte, so the answer is `ceil(bits_used / 7)`,
+/// with a minimum of one byte. It is computed without branches as:
+///
+/// size = ((38 - leading_zeros) * 74899) >> 19  +  (leading_zeros >> 5)
+///
+/// Where:
+/// - `38 = 32 + 6`: adding 6 turns the floor division by 7 into a ceiling
+/// - `74899 = ceil(2^19 / 7)`: multiply-then-shift stands in for the division by 7
+/// - `leading_zeros >> 5` is 1 only for `value == 0`, which still takes one byte
+pub fn size_of_unsigned_varint(value: u32) -> usize {
+    let lz = value.leading_zeros();
+    let ceil_bits_over_7 = ((38 - lz) * 74_899) >> 19;
+    (ceil_bits_over_7 + (lz >> 5)) as usize
+}
+
+/// Number of bytes needed to encode a `u64` as an unsigned varint (always 1 to 10).
+///
+/// A varint stores 7 payload bits per byte, so the answer is `ceil(bits_used / 7)`,
+/// with a minimum of one byte. It is computed without branches as:
+///
+/// size = ((70 - leading_zeros) * 74899) >> 19  +  (leading_zeros >> 6)
+///
+/// - `70 = 64 + 6`: adding 6 turns the floor division by 7 into a ceiling
+/// - `74899 = ceil(2^19 / 7)`: multiply-then-shift stands in for the division by 7
+/// - `leading_zeros >> 6` is 1 only for `value == 0`, which still takes one byte
+#[allow(dead_code)]
+pub fn size_of_unsigned_varint_u64(value: u64) -> usize {
+    let lz = value.leading_zeros();
+    let ceil_bits_over_7 = ((70 - lz) * 74_899) >> 19;
+    (ceil_bits_over_7 + (lz >> 6)) as usize
+}
+
+/// Append a 64-bit `value` to `buf` as an unsigned varint (7 payload bits per byte).
+#[allow(dead_code)]
+pub fn write_unsigned_varint_u64_buf(value: u64, buf: &mut impl BufMut) {
+    let mut remaining = value;
+    while remaining >= 0x80 {
+        buf.put_u8((remaining as u8) | 0x80);
+        remaining >>= 7;
+    }
+    buf.put_u8(remaining as u8);
+}
+
+/// Encode `value` as an unsigned varint at the start of `slice`, returning the byte count.
+/// Used by CompactedRowWriter which manages its own position.
+///
+/// # Panics
+/// Panics if `slice` is shorter than the encoding of `value`.
+/// A slice of at least 5 bytes (the maximum size for a u32 varint) is always sufficient.
+/// Use [`size_of_unsigned_varint`] to calculate the exact size beforehand.
+pub fn write_unsigned_varint_to_slice(value: u32, slice: &mut [u8]) -> usize {
+    let mut remaining = value;
+    let mut idx = 0;
+
+    while remaining >= 0x80 {
+        slice[idx] = (remaining as u8) | 0x80;
+        idx += 1;
+        remaining >>= 7;
+    }
+    slice[idx] = remaining as u8;
+    idx + 1
+}
+
+/// Encode a 64-bit `value` as an unsigned varint at the start of `slice`; returns the byte count.
+///
+/// # Panics
+/// Panics if `slice` is shorter than the encoding of `value`.
+/// A slice of at least 10 bytes (the maximum size for a u64 varint) is always sufficient.
+pub fn write_unsigned_varint_u64_to_slice(value: u64, slice: &mut [u8]) -> usize {
+    let mut remaining = value;
+    let mut idx = 0;
+
+    while remaining >= 0x80 {
+        slice[idx] = (remaining as u8) | 0x80;
+        idx += 1;
+        remaining >>= 7;
+    }
+    slice[idx] = remaining as u8;
+    idx + 1
+}
+
+/// Read an unsigned 32-bit varint from `slice` starting at `pos`; returns (value, next_position).
+/// Used by CompactedRowReader which manages positions. At most `min(max_bytes, 5)` bytes are
+/// read: `UnexpectedEof` if the slice ends first, `InvalidData` if no final byte is found.
+pub fn read_unsigned_varint_at(
+    slice: &[u8],
+    mut pos: usize,
+    max_bytes: usize,
+) -> io::Result<(u32, usize)> {
+    let mut result: u32 = 0;
+    let mut shift = 0;
+    // A u32 varint spans at most 5 bytes; the cap keeps `shift` <= 28 so `<<` cannot overflow.
+    for _ in 0..max_bytes.min(5) {
+        if pos >= slice.len() {
+            return Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Unexpected end of varint",
+            ));
+        }
+        let b = slice[pos];
+        pos += 1;
+        result |= ((b & 0x7F) as u32) << shift;
+        if (b & 0x80) == 0 {
+            return Ok((result, pos));
+        }
+        shift += 7;
+    }
+
+    Err(io::Error::new(
+        io::ErrorKind::InvalidData,
+        "Invalid VarInt32 input stream",
+    ))
+}
+
+/// Read an unsigned 64-bit varint from `slice` at `pos` (at most `min(max_bytes, 10)` bytes).
+pub fn read_unsigned_varint_u64_at(
+    slice: &[u8],
+    mut pos: usize,
+    max_bytes: usize,
+) -> io::Result<(u64, usize)> {
+    let mut result: u64 = 0;
+    let mut shift = 0;
+    // A u64 varint spans at most 10 bytes; the cap keeps `shift` <= 63 so `<<` cannot overflow.
+    for _ in 0..max_bytes.min(10) {
+        if pos >= slice.len() {
+            return Err(io::Error::new(
+                io::ErrorKind::UnexpectedEof,
+                "Unexpected end of varint",
+            ));
+        }
+        let b = slice[pos];
+        pos += 1;
+        result |= ((b & 0x7F) as u64) << shift;
+        if (b & 0x80) == 0 {
+            return Ok((result, pos));
+        }
+        shift += 7;
+    }
+
+    Err(io::Error::new(
+        io::ErrorKind::InvalidData,
+        "Invalid VarInt64 input stream",
+    ))
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use std::io::Cursor;
+
+    #[test]
+    fn test_unsigned_varint_round_trip() {
+        let test_values = vec![
+            0u32,
+            1,
+            127,
+            128,
+            255,
+            256,
+            16383,
+            16384,
+            2097151,
+            2097152,
+            268435455,
+            268435456,
+            u32::MAX,
+        ];
+        // The list holds values on both sides of every encoded-length boundary, plus the extremes.
+        for value in test_values {
+            // Round trip through the io::Write / io::Read based functions
+            let mut buffer = Vec::new();
+            let written = write_unsigned_varint(value, &mut buffer).unwrap();
+
+            let mut reader = Cursor::new(&buffer);
+            let read_value = read_unsigned_varint(&mut reader).unwrap();
+
+            assert_eq!(value, read_value, "Round trip failed for value {}", value);
+            assert_eq!(
+                written,
+                buffer.len(),
+                "Bytes written mismatch for value {}",
+                value
+            );
+
+            // The BufMut writer must produce the same number of bytes
+            let mut buf = bytes::BytesMut::new();
+            write_unsigned_varint_buf(value, &mut buf);
+            assert_eq!(buf.len(), written, "BufMut write length mismatch");
+
+            // The size calculation must agree with the actual encoded length
+            let calculated_size = size_of_unsigned_varint(value);
+            assert_eq!(
+                calculated_size,
+                buffer.len(),
+                "Size calculation failed for value {}",
+                value
+            );
+
+            // The slice-based reader must return the value and consume the whole buffer
+            let (read_value_bytes, bytes_read) = read_unsigned_varint_bytes(&buffer).unwrap();
+            assert_eq!(
+                value, read_value_bytes,
+                "Bytes read failed for value {}",
+                value
+            );
+            assert_eq!(
+                bytes_read,
+                buffer.len(),
+                "Bytes read count mismatch for value {}",
+                value
+            );
+        }
+    }
+
+    #[test]
+    fn test_size_of_unsigned_varint() {
+        assert_eq!(size_of_unsigned_varint(0), 1); // zero still takes one byte
+        assert_eq!(size_of_unsigned_varint(127), 1); // 2^7 - 1
+        assert_eq!(size_of_unsigned_varint(128), 2); // 2^7
+        assert_eq!(size_of_unsigned_varint(16383), 2); // 2^14 - 1
+        assert_eq!(size_of_unsigned_varint(16384), 3); // 2^14
+        assert_eq!(size_of_unsigned_varint(2097151), 3); // 2^21 - 1
+        assert_eq!(size_of_unsigned_varint(2097152), 4); // 2^21
+        assert_eq!(size_of_unsigned_varint(268435455), 4); // 2^28 - 1
+        assert_eq!(size_of_unsigned_varint(268435456), 5); // 2^28
+        assert_eq!(size_of_unsigned_varint(u32::MAX), 5);
+    }
+
+    #[test]
+    fn test_size_of_unsigned_varint_u64() {
+        assert_eq!(size_of_unsigned_varint_u64(0), 1); // zero still takes one byte
+        assert_eq!(size_of_unsigned_varint_u64(127), 1);
+        assert_eq!(size_of_unsigned_varint_u64(128), 2);
+        assert_eq!(size_of_unsigned_varint_u64(16383), 2);
+        assert_eq!(size_of_unsigned_varint_u64(16384), 3);
+        assert_eq!(size_of_unsigned_varint_u64(2097151), 3);
+        assert_eq!(size_of_unsigned_varint_u64(2097152), 4);
+        assert_eq!(size_of_unsigned_varint_u64(268435455), 4);
+        assert_eq!(size_of_unsigned_varint_u64(268435456), 5);
+        assert_eq!(size_of_unsigned_varint_u64(u32::MAX as u64), 5);
+        assert_eq!(size_of_unsigned_varint_u64(34359738367), 5); // 2^35 - 1
+        assert_eq!(size_of_unsigned_varint_u64(34359738368), 6); // 2^35
+        assert_eq!(size_of_unsigned_varint_u64(4398046511103), 6); // 2^42 - 1
+        assert_eq!(size_of_unsigned_varint_u64(4398046511104), 7); // 2^42
+        assert_eq!(size_of_unsigned_varint_u64(562949953421311), 7); // 2^49 - 1
+        assert_eq!(size_of_unsigned_varint_u64(562949953421312), 8); // 2^49
+        assert_eq!(size_of_unsigned_varint_u64(72057594037927935), 8); // 2^56 - 1
+        assert_eq!(size_of_unsigned_varint_u64(72057594037927936), 9); // 2^56
+        assert_eq!(size_of_unsigned_varint_u64(9223372036854775807), 9); // 2^63 - 1
+        assert_eq!(size_of_unsigned_varint_u64(9223372036854775808), 10); // 2^63
+        assert_eq!(size_of_unsigned_varint_u64(u64::MAX), 10);
+    }
+
+    #[test]
+    fn test_read_unsigned_varint_bytes_error_handling() {
+        // An empty buffer cannot hold a varint
+        assert!(read_unsigned_varint_bytes(&[]).is_err());
+
+        // Incomplete varint: the last byte has its continuation bit set but nothing follows
+        assert!(read_unsigned_varint_bytes(&[0x80]).is_err());
+        assert!(read_unsigned_varint_bytes(&[0xFF, 0x80]).is_err());
+    }
+
+    #[test]
+    fn test_write_read_to_slice() {
+        // u32: write into a slice, read back from position 0, compare value and length
+        let test_values_u32 = vec![0u32, 127, 128, 16384, u32::MAX];
+
+        for value in test_values_u32 {
+            let mut buffer = vec![0u8; 10];
+            let written = write_unsigned_varint_to_slice(value, &mut buffer);
+
+            let (read_value, next_pos) = read_unsigned_varint_at(&buffer, 0, 5).unwrap();
+            assert_eq!(value, read_value);
+            assert_eq!(written, next_pos);
+        }
+
+        // u64: same round trip, allowing up to 10 bytes per value
+        let test_values_u64 = vec![0u64, 127, 128, 16384, u32::MAX as u64, u64::MAX];
+
+        for value in test_values_u64 {
+            let mut buffer = vec![0u8; 10];
+            let written = write_unsigned_varint_u64_to_slice(value, &mut buffer);
+
+            let (read_value, next_pos) = read_unsigned_varint_u64_at(&buffer, 0, 10).unwrap();
+            assert_eq!(value, read_value);
+            assert_eq!(written, next_pos);
+        }
+    }
+
+    #[test]
+    fn test_read_at_with_offset() {
+        // Write three varints back to back, then read each one from where the previous ended
+        let mut buffer = vec![0u8; 20];
+        let mut pos = 0;
+
+        pos += write_unsigned_varint_to_slice(127, &mut buffer[pos..]);
+        pos += write_unsigned_varint_to_slice(16384, &mut buffer[pos..]);
+        let end_pos = pos + write_unsigned_varint_to_slice(u32::MAX, &mut buffer[pos..]);
+
+        // Read back, feeding each returned position into the next call
+        let (val1, pos1) = read_unsigned_varint_at(&buffer, 0, 5).unwrap();
+        assert_eq!(val1, 127);
+
+        let (val2, pos2) = read_unsigned_varint_at(&buffer, pos1, 5).unwrap();
+        assert_eq!(val2, 16384);
+
+        let (val3, pos3) = read_unsigned_varint_at(&buffer, pos2, 5).unwrap();
+        assert_eq!(val3, u32::MAX);
+        assert_eq!(pos3, end_pos);
+    }
+}

From 207a7d183c34d8230bdf049e02dc54754723e97b Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Thu, 15 Jan 2026 09:25:31 +0000
Subject: [PATCH 065/287] chore: Introduce WriteFormat and various small
 changes to unblock Upsert implementation (#158)

---
 fluss-rust/crates/fluss/Cargo.toml            |  2 +
 .../crates/fluss/src/client/write/mod.rs      |  2 +
 .../fluss/src/client/write/write_format.rs    | 65 +++++++++++++++++++
 fluss-rust/crates/fluss/src/error.rs          |  9 +++
 .../fluss/src/metadata/data_lake_format.rs    |  3 +
 .../crates/fluss/src/metadata/datatype.rs     | 23 +++++++
 fluss-rust/crates/fluss/src/metadata/table.rs | 22 ++++++-
 .../crates/fluss/src/row/field_getter.rs      | 14 +++-
 8 files changed, 138 insertions(+), 2 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/write/write_format.rs

diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index e8c851f7b7..8942ffc7db 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -60,6 +60,8 @@ tempfile = "3.23.0"
 snafu = "0.8.3"
 scopeguard = "1.2.0"
 delegate = "0.13.5"
+strum = "0.26"
+strum_macros = "0.26"
 
 [target.'cfg(target_arch = "wasm32")'.dependencies]
 jiff = { workspace = true, features = ["js"] }
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index d79418bfc2..00a71c51fa 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -30,8 +30,10 @@ pub(crate) mod broadcast;
 mod bucket_assigner;
 
 mod sender;
+mod write_format;
 mod writer_client;
 
+pub use write_format::WriteFormat;
 pub use writer_client::WriterClient;
 
 pub struct WriteRecord<'a> {
diff --git a/fluss-rust/crates/fluss/src/client/write/write_format.rs b/fluss-rust/crates/fluss/src/client/write/write_format.rs
new file mode 100644
index 0000000000..d65e42de68
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/write_format.rs
@@ -0,0 +1,65 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::KvFormat;
+use std::fmt::Display;
+
+pub enum WriteFormat {
+    ArrowLog,
+    CompactedLog,
+    CompactedKv,
+}
+
+impl WriteFormat {
+    pub const fn is_log(&self) -> bool {
+        matches!(self, Self::ArrowLog | Self::CompactedLog)
+    }
+
+    pub fn is_kv(&self) -> bool {
+        !self.is_log()
+    }
+
+    pub fn to_kv_format(&self) -> Result<KvFormat> {
+        match self {
+            WriteFormat::CompactedKv => Ok(KvFormat::COMPACTED),
+            other => Err(IllegalArgument {
+                message: format!("WriteFormat `{}` is not a KvFormat", other),
+            }),
+        }
+    }
+
+    pub fn from_kv_format(kv_format: &KvFormat) -> Result<Self> {
+        match kv_format {
+            KvFormat::COMPACTED => Ok(WriteFormat::CompactedKv),
+            other => Err(IllegalArgument {
+                message: format!("Unknown KvFormat: `{}`", other),
+            }),
+        }
+    }
+}
+
+impl Display for WriteFormat {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        match self {
+            WriteFormat::ArrowLog => f.write_str("ArrowLog"),
+            WriteFormat::CompactedLog => f.write_str("CompactedLog"),
+            WriteFormat::CompactedKv => f.write_str("CompactedKv"),
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index e04fde14d7..0a368b7be9 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -21,6 +21,7 @@ pub use crate::rpc::{ApiError, FlussError};
 use arrow_schema::ArrowError;
 use snafu::Snafu;
 use std::{io, result};
+use strum::ParseError;
 
 pub type Result<T> = result::Result<T, Error>;
 
@@ -155,3 +156,11 @@ impl From<ApiError> for Error {
         Error::FlussAPIError { api_error: value }
     }
 }
+
+impl From<ParseError> for Error {
+    fn from(value: ParseError) -> Self {
+        Error::IllegalArgument {
+            message: value.to_string(),
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs b/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
index 76a23f8d96..c1861098c3 100644
--- a/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
+++ b/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
@@ -15,11 +15,14 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use strum_macros::{Display, EnumString};
+
 /// Identifies the logical format of a data lake table supported by Fluss.
 ///
 /// This enum is typically used in metadata and configuration to distinguish
 /// between different table formats so that the appropriate integration and
 /// semantics can be applied.
+#[derive(Debug, EnumString, Display, PartialEq)]
 pub enum DataLakeFormat {
     /// Apache Paimon data lake table format.
     Paimon,
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index c53cd273cb..dc1f40730f 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -15,6 +15,8 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
 use serde::{Deserialize, Serialize};
 use std::fmt::{Display, Formatter};
 
@@ -857,6 +859,27 @@ impl RowType {
         self.fields.iter().position(|f| f.name == field_name)
     }
 
+    pub fn get_field_names(&self) -> Vec<&str> {
+        self.fields.iter().map(|f| f.name.as_str()).collect()
+    }
+
+    pub fn project(&self, project_field_positions: &[usize]) -> Result<RowType> {
+        Ok(RowType::with_nullable(
+            self.nullable,
+            project_field_positions
+                .iter()
+                .map(|pos| {
+                    self.fields
+                        .get(*pos)
+                        .cloned()
+                        .ok_or_else(|| IllegalArgument {
+                            message: format!("invalid field position: {}", *pos),
+                        })
+                })
+                .collect::<Result<Vec<_>>>()?,
+        ))
+    }
+
     #[cfg(test)]
     pub fn with_data_types(data_types: Vec<DataType>) -> Self {
         let mut fields: Vec<DataField> = Vec::new();
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 4f6c04bc61..b1e8a90ba2 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -18,11 +18,13 @@
 use crate::compression::ArrowCompressionInfo;
 use crate::error::Error::InvalidTableError;
 use crate::error::{Error, Result};
+use crate::metadata::DataLakeFormat;
 use crate::metadata::datatype::{DataField, DataType, RowType};
 use core::fmt;
 use serde::{Deserialize, Serialize};
 use std::collections::{HashMap, HashSet};
 use std::fmt::{Display, Formatter};
+use strum_macros::EnumString;
 
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
 pub struct Column {
@@ -603,7 +605,7 @@ impl LogFormat {
     }
 }
 
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, EnumString)]
 pub enum KvFormat {
     INDEXED,
     COMPACTED,
@@ -726,6 +728,24 @@ impl TableConfig {
     pub fn get_arrow_compression_info(&self) -> Result<ArrowCompressionInfo> {
         ArrowCompressionInfo::from_conf(&self.properties)
     }
+
+    pub fn get_datalake_format(&self) -> Result<Option<DataLakeFormat>> {
+        self.properties
+            .get("table.datalake.format")
+            .map(|f| f.parse().map_err(Error::from))
+            .transpose()
+    }
+
+    pub fn get_kv_format(&self) -> Result<KvFormat> {
+        // TODO: Consolidate configurations logic, constants, defaults in a single place
+        const DEFAULT_KV_FORMAT: &str = "COMPACTED";
+        let kv_format = self
+            .properties
+            .get("table.kv.format")
+            .map(String::as_str)
+            .unwrap_or(DEFAULT_KV_FORMAT);
+        kv_format.parse().map_err(Into::into)
+    }
 }
 
 impl TableInfo {
diff --git a/fluss-rust/crates/fluss/src/row/field_getter.rs b/fluss-rust/crates/fluss/src/row/field_getter.rs
index 8e529e5446..97f9e395fc 100644
--- a/fluss-rust/crates/fluss/src/row/field_getter.rs
+++ b/fluss-rust/crates/fluss/src/row/field_getter.rs
@@ -15,9 +15,10 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::metadata::DataType;
+use crate::metadata::{DataType, RowType};
 use crate::row::{Datum, InternalRow};
 
+#[derive(Clone)]
 pub enum FieldGetter {
     Nullable(InnerFieldGetter),
     NonNullable(InnerFieldGetter),
@@ -36,6 +37,16 @@ impl FieldGetter {
         }
     }
 
+    #[allow(dead_code)]
+    pub fn create_field_getters(row_type: &RowType) -> Box<[FieldGetter]> {
+        row_type
+            .fields()
+            .iter()
+            .enumerate()
+            .map(|(pos, field)| Self::create(field.data_type(), pos))
+            .collect()
+    }
+
     pub fn create(data_type: &DataType, pos: usize) -> FieldGetter {
         let inner_field_getter = match data_type {
             DataType::Char(t) => InnerFieldGetter::Char {
@@ -66,6 +77,7 @@ impl FieldGetter {
     }
 }
 
+#[derive(Clone)]
 pub enum InnerFieldGetter {
     Char { pos: usize, len: usize },
     String { pos: usize },

From b9cc78bf37f04c6d2ff3bd0151dd9750ad90a9db Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Thu, 15 Jan 2026 15:45:41 +0000
Subject: [PATCH 066/287] feat: Introduce CompactedRowEncoder (#161)

---
 .../crates/fluss/src/metadata/datatype.rs     | 10 ++-
 .../fluss/src/record/kv/kv_record_batch.rs    | 13 +--
 .../src/record/kv/kv_record_batch_builder.rs  | 51 ++++++------
 .../fluss/src/row/compacted/compacted_row.rs  | 41 ++++++---
 .../src/row/compacted/compacted_row_reader.rs | 18 +++-
 .../src/row/compacted/compacted_row_writer.rs | 59 +++++++------
 .../src/row/encode/compacted_row_encoder.rs   | 83 +++++++++++++++++++
 fluss-rust/crates/fluss/src/row/encode/mod.rs | 68 ++++++++++++++-
 fluss-rust/crates/fluss/src/row/mod.rs        |  4 +-
 9 files changed, 263 insertions(+), 84 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs

diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index dc1f40730f..f1574665eb 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -682,11 +682,11 @@ impl Default for BytesType {
 }
 
 impl BytesType {
-    pub fn new() -> Self {
+    pub const fn new() -> Self {
         Self::with_nullable(true)
     }
 
-    pub fn with_nullable(nullable: bool) -> Self {
+    pub const fn with_nullable(nullable: bool) -> Self {
         Self { nullable }
     }
 
@@ -859,6 +859,10 @@ impl RowType {
         self.fields.iter().position(|f| f.name == field_name)
     }
 
+    pub fn field_types(&self) -> impl Iterator<Item = &DataType> + '_ {
+        self.fields.iter().map(|f| &f.data_type)
+    }
+
     pub fn get_field_names(&self) -> Vec<&str> {
         self.fields.iter().map(|f| f.name.as_str()).collect()
     }
@@ -931,7 +935,7 @@ impl DataTypes {
         DataType::Binary(BinaryType::new(length))
     }
 
-    pub fn bytes() -> DataType {
+    pub const fn bytes() -> DataType {
         DataType::Bytes(BytesType::new())
     }
 
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
index fdd4ad7322..6ead64276a 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
@@ -321,8 +321,10 @@ impl Iterator for KvRecordIterator {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::KvFormat;
+    use crate::metadata::{DataTypes, KvFormat};
     use crate::record::kv::{CURRENT_KV_MAGIC_VALUE, KvRecordBatchBuilder};
+    use crate::row::binary::BinaryWriter;
+    use crate::row::compacted::CompactedRow;
     use bytes::{BufMut, BytesMut};
 
     #[test]
@@ -363,12 +365,13 @@ mod tests {
         let key1 = b"key1";
         let mut value1_writer = CompactedRowWriter::new(1);
         value1_writer.write_bytes(&[1, 2, 3, 4, 5]);
-        builder.append_row(key1, Some(&value1_writer)).unwrap();
+
+        let data_types = &[DataTypes::bytes()];
+        let row = &CompactedRow::from_bytes(data_types, value1_writer.buffer());
+        builder.append_row(key1, Some(row)).unwrap();
 
         let key2 = b"key2";
-        builder
-            .append_row::<CompactedRowWriter>(key2, None)
-            .unwrap();
+        builder.append_row::<CompactedRow>(key2, None).unwrap();
 
         let bytes = builder.build().unwrap();
 
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
index 773c7789b5..7d1a7972e4 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
@@ -317,13 +317,14 @@ impl Drop for KvRecordBatchBuilder {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::row::compacted::CompactedRowWriter;
+    use crate::metadata::{DataType, DataTypes};
+    use crate::row::binary::BinaryWriter;
+    use crate::row::compacted::{CompactedRow, CompactedRowWriter};
 
     // Helper function to create a CompactedRowWriter with a single bytes field for testing
-    fn create_test_row(data: &[u8]) -> CompactedRowWriter {
-        let mut writer = CompactedRowWriter::new(1);
-        writer.write_bytes(data);
-        writer
+    fn create_test_row(data: &[u8]) -> CompactedRow<'_> {
+        const DATA_TYPE: &[DataType] = &[DataTypes::bytes()];
+        CompactedRow::from_bytes(DATA_TYPE, data)
     }
 
     #[test]
@@ -349,10 +350,8 @@ mod tests {
         builder.append_row(key1, Some(&value1)).unwrap();
 
         let key2 = b"key2";
-        assert!(builder.has_room_for_row::<CompactedRowWriter>(key2, None));
-        builder
-            .append_row::<CompactedRowWriter>(key2, None)
-            .unwrap();
+        assert!(builder.has_room_for_row::<CompactedRow>(key2, None));
+        builder.append_row::<CompactedRow>(key2, None).unwrap();
 
         // Test close and build
         builder.close().unwrap();
@@ -373,11 +372,7 @@ mod tests {
         let value = create_test_row(b"value");
         builder.append_row(b"key", Some(&value)).unwrap();
         builder.abort();
-        assert!(
-            builder
-                .append_row::<CompactedRowWriter>(b"key2", None)
-                .is_err()
-        );
+        assert!(builder.append_row::<CompactedRow>(b"key2", None).is_err());
         assert!(builder.build().is_err());
         assert!(builder.close().is_err());
 
@@ -386,11 +381,7 @@ mod tests {
         let value = create_test_row(b"value");
         builder.append_row(b"key", Some(&value)).unwrap();
         builder.close().unwrap();
-        assert!(
-            builder
-                .append_row::<CompactedRowWriter>(b"key2", None)
-                .is_err()
-        ); // Can't append after close
+        assert!(builder.append_row::<CompactedRow>(b"key2", None).is_err()); // Can't append after close
         assert!(builder.build().is_ok()); // But can still build
     }
 
@@ -510,23 +501,26 @@ mod tests {
         row_writer1.write_int(42);
         row_writer1.write_string("hello");
 
+        let data_types = &[DataTypes::int(), DataTypes::string()];
+        let row1 = &CompactedRow::from_bytes(data_types, row_writer1.buffer());
+
         let key1 = b"key1";
-        assert!(builder.has_room_for_row(key1, Some(&row_writer1)));
-        builder.append_row(key1, Some(&row_writer1)).unwrap();
+        assert!(builder.has_room_for_row(key1, Some(row1)));
+        builder.append_row(key1, Some(row1)).unwrap();
 
         // Create and append second record
         let mut row_writer2 = CompactedRowWriter::new(2);
         row_writer2.write_int(100);
         row_writer2.write_string("world");
 
+        let row2 = &CompactedRow::from_bytes(data_types, row_writer2.buffer());
+
         let key2 = b"key2";
-        builder.append_row(key2, Some(&row_writer2)).unwrap();
+        builder.append_row(key2, Some(row2)).unwrap();
 
         // Append a deletion record
         let key3 = b"key3";
-        builder
-            .append_row::<CompactedRowWriter>(key3, None)
-            .unwrap();
+        builder.append_row::<CompactedRow>(key3, None).unwrap();
 
         // Build and verify
         builder.close().unwrap();
@@ -567,15 +561,18 @@ mod tests {
         let mut row_writer = CompactedRowWriter::new(1);
         row_writer.write_int(42);
 
+        let data_types = &[DataTypes::int()];
+        let row = &CompactedRow::from_bytes(data_types, row_writer.buffer());
+
         // INDEXED format should reject append_row
         let mut indexed_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::INDEXED);
-        let result = indexed_builder.append_row(b"key", Some(&row_writer));
+        let result = indexed_builder.append_row(b"key", Some(row));
         assert!(result.is_err());
         assert_eq!(result.unwrap_err().kind(), io::ErrorKind::InvalidInput);
 
         // COMPACTED format should accept append_row
         let mut compacted_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
-        let result = compacted_builder.append_row(b"key", Some(&row_writer));
+        let result = compacted_builder.append_row(b"key", Some(row));
         assert!(result.is_ok());
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index 481f9be502..9ff3b5ffd5 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -15,11 +15,10 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use std::sync::OnceLock;
-
 use crate::metadata::DataType;
 use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
-use crate::row::{GenericRow, InternalRow};
+use crate::row::{BinaryRow, GenericRow, InternalRow};
+use std::sync::{Arc, OnceLock};
 
 // Reference implementation:
 // https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/row/compacted/CompactedRow.java
@@ -28,9 +27,9 @@ pub struct CompactedRow<'a> {
     arity: usize,
     size_in_bytes: usize,
     decoded_row: OnceLock<GenericRow<'a>>,
-    deserializer: CompactedRowDeserializer<'a>,
+    deserializer: Arc<CompactedRowDeserializer<'a>>,
     reader: CompactedRowReader<'a>,
-    data_types: &'a [DataType],
+    data: &'a [u8],
 }
 
 pub fn calculate_bit_set_width_in_bytes(arity: usize) -> usize {
@@ -40,15 +39,25 @@ pub fn calculate_bit_set_width_in_bytes(arity: usize) -> usize {
 #[allow(dead_code)]
 impl<'a> CompactedRow<'a> {
     pub fn from_bytes(data_types: &'a [DataType], data: &'a [u8]) -> Self {
-        let arity = data_types.len();
-        let size = data.len();
+        Self::deserialize(
+            Arc::new(CompactedRowDeserializer::new(data_types)),
+            data_types.len(),
+            data,
+        )
+    }
+
+    pub fn deserialize(
+        deserializer: Arc<CompactedRowDeserializer<'a>>,
+        arity: usize,
+        data: &'a [u8],
+    ) -> Self {
         Self {
             arity,
-            size_in_bytes: size,
+            size_in_bytes: data.len(),
             decoded_row: OnceLock::new(),
-            deserializer: CompactedRowDeserializer::new(data_types),
-            reader: CompactedRowReader::new(arity, data, 0, size),
-            data_types,
+            deserializer: Arc::clone(&deserializer),
+            reader: CompactedRowReader::new(arity, data, 0, data.len()),
+            data,
         }
     }
 
@@ -62,6 +71,12 @@ impl<'a> CompactedRow<'a> {
     }
 }
 
+impl BinaryRow for CompactedRow<'_> {
+    fn as_bytes(&self) -> &[u8] {
+        self.data
+    }
+}
+
 #[allow(dead_code)]
 impl<'a> InternalRow for CompactedRow<'a> {
     fn get_field_count(&self) -> usize {
@@ -69,7 +84,7 @@ impl<'a> InternalRow for CompactedRow<'a> {
     }
 
     fn is_null_at(&self, pos: usize) -> bool {
-        self.data_types[pos].is_nullable() && self.reader.is_null_at(pos)
+        self.deserializer.get_data_types()[pos].is_nullable() && self.reader.is_null_at(pos)
     }
 
     fn get_boolean(&self, pos: usize) -> bool {
@@ -120,6 +135,8 @@ impl<'a> InternalRow for CompactedRow<'a> {
 #[cfg(test)]
 mod tests {
     use super::*;
+    use crate::row::binary::BinaryWriter;
+
     use crate::metadata::{
         BigIntType, BooleanType, BytesType, DoubleType, FloatType, IntType, SmallIntType,
         StringType, TinyIntType,
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index 5ec260897e..9ce50952f4 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -21,17 +21,31 @@ use crate::{
     row::{Datum, GenericRow, compacted::compacted_row_writer::CompactedRowWriter},
     util::varint::{read_unsigned_varint_at, read_unsigned_varint_u64_at},
 };
+use std::borrow::Cow;
 use std::str::from_utf8;
 
 #[allow(dead_code)]
+#[derive(Clone)]
 pub struct CompactedRowDeserializer<'a> {
-    schema: &'a [DataType],
+    schema: Cow<'a, [DataType]>,
 }
 
 #[allow(dead_code)]
 impl<'a> CompactedRowDeserializer<'a> {
     pub fn new(schema: &'a [DataType]) -> Self {
-        Self { schema }
+        Self {
+            schema: Cow::Borrowed(schema),
+        }
+    }
+
+    pub fn new_from_owned(schema: Vec<DataType>) -> Self {
+        Self {
+            schema: Cow::Owned(schema),
+        }
+    }
+
+    pub fn get_data_types(&self) -> &[DataType] {
+        self.schema.as_ref()
     }
 
     pub fn deserialize(&self, reader: &CompactedRowReader<'a>) -> GenericRow<'a> {
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
index 63b32a3dca..c130e94cce 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -15,12 +15,11 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use bytes::{Bytes, BytesMut};
-use std::cmp;
-
-use crate::row::BinaryRow;
+use crate::row::binary::BinaryWriter;
 use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
 use crate::util::varint::{write_unsigned_varint_to_slice, write_unsigned_varint_u64_to_slice};
+use bytes::{Bytes, BytesMut};
+use std::cmp;
 
 // Writer for CompactedRow
 // Reference implementation:
@@ -51,11 +50,6 @@ impl CompactedRowWriter {
         }
     }
 
-    pub fn reset(&mut self) {
-        self.position = self.header_size_in_bytes;
-        self.buffer[..self.header_size_in_bytes].fill(0);
-    }
-
     pub fn position(&self) -> usize {
         self.position
     }
@@ -81,75 +75,78 @@ impl CompactedRowWriter {
         self.buffer[self.position..end].copy_from_slice(src);
         self.position = end;
     }
+}
+impl BinaryWriter for CompactedRowWriter {
+    fn reset(&mut self) {
+        self.position = self.header_size_in_bytes;
+        self.buffer[..self.header_size_in_bytes].fill(0);
+    }
 
-    pub fn set_null_at(&mut self, pos: usize) {
+    fn set_null_at(&mut self, pos: usize) {
         let byte_index = pos >> 3;
         let bit = pos & 7;
         debug_assert!(byte_index < self.header_size_in_bytes);
         self.buffer[byte_index] |= 1u8 << bit;
     }
 
-    pub fn write_boolean(&mut self, value: bool) {
+    fn write_boolean(&mut self, value: bool) {
         let b = if value { 1u8 } else { 0u8 };
         self.write_raw(&[b]);
     }
 
-    pub fn write_byte(&mut self, value: u8) {
+    fn write_byte(&mut self, value: u8) {
         self.write_raw(&[value]);
     }
 
-    pub fn write_binary(&mut self, bytes: &[u8], length: usize) {
-        // TODO: currently, we encoding BINARY(length) as the same with BYTES, the length info can
-        //  be omitted and the bytes length should be enforced in the future.
-        self.write_bytes(&bytes[..length.min(bytes.len())]);
-    }
-
-    pub fn write_bytes(&mut self, value: &[u8]) {
+    fn write_bytes(&mut self, value: &[u8]) {
         let len_i32 =
             i32::try_from(value.len()).expect("byte slice too large to encode length as i32");
         self.write_int(len_i32);
         self.write_raw(value);
     }
 
-    pub fn write_char(&mut self, value: &str, _length: usize) {
+    fn write_char(&mut self, value: &str, _length: usize) {
         // TODO: currently, we encoding CHAR(length) as the same with STRING, the length info can be
         //  omitted and the bytes length should be enforced in the future.
         self.write_string(value);
     }
 
-    pub fn write_string(&mut self, value: &str) {
+    fn write_string(&mut self, value: &str) {
         self.write_bytes(value.as_ref());
     }
 
-    pub fn write_short(&mut self, value: i16) {
+    fn write_short(&mut self, value: i16) {
         self.write_raw(&value.to_ne_bytes());
     }
 
-    pub fn write_int(&mut self, value: i32) {
+    fn write_int(&mut self, value: i32) {
         self.ensure_capacity(Self::MAX_INT_SIZE);
         let bytes_written =
             write_unsigned_varint_to_slice(value as u32, &mut self.buffer[self.position..]);
         self.position += bytes_written;
     }
 
-    pub fn write_long(&mut self, value: i64) {
+    fn write_long(&mut self, value: i64) {
         self.ensure_capacity(Self::MAX_LONG_SIZE);
         let bytes_written =
             write_unsigned_varint_u64_to_slice(value as u64, &mut self.buffer[self.position..]);
         self.position += bytes_written;
     }
-
-    pub fn write_float(&mut self, value: f32) {
+    fn write_float(&mut self, value: f32) {
         self.write_raw(&value.to_ne_bytes());
     }
 
-    pub fn write_double(&mut self, value: f64) {
+    fn write_double(&mut self, value: f64) {
         self.write_raw(&value.to_ne_bytes());
     }
-}
 
-impl BinaryRow for CompactedRowWriter {
-    fn as_bytes(&self) -> &[u8] {
-        self.buffer()
+    fn write_binary(&mut self, bytes: &[u8], length: usize) {
+        // TODO: currently, we encoding BINARY(length) as the same with BYTES, the length info can
+        //  be omitted and the bytes length should be enforced in the future.
+        self.write_bytes(&bytes[..length.min(bytes.len())]);
+    }
+
+    fn complete(&mut self) {
+        // do nothing
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs
new file mode 100644
index 0000000000..fc39bb7a26
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs
@@ -0,0 +1,83 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::DataType;
+use crate::row::Datum;
+use crate::row::binary::{BinaryRowFormat, BinaryWriter, ValueWriter};
+use crate::row::compacted::{CompactedRow, CompactedRowDeserializer, CompactedRowWriter};
+use crate::row::encode::{BinaryRow, RowEncoder};
+use std::sync::Arc;
+
+#[allow(dead_code)]
+pub struct CompactedRowEncoder<'a> {
+    arity: usize,
+    writer: CompactedRowWriter,
+    field_writers: Vec<ValueWriter>,
+    compacted_row_deserializer: Arc<CompactedRowDeserializer<'a>>,
+}
+
+impl<'a> CompactedRowEncoder<'a> {
+    pub fn new(field_data_types: Vec<DataType>) -> Result<Self> {
+        let field_writers = field_data_types
+            .iter()
+            .map(|d| ValueWriter::create_value_writer(d, Some(&BinaryRowFormat::Compacted)))
+            .collect::<Result<Vec<_>>>()?;
+
+        Ok(Self {
+            arity: field_data_types.len(),
+            writer: CompactedRowWriter::new(field_data_types.len()),
+            field_writers,
+            compacted_row_deserializer: Arc::new(CompactedRowDeserializer::new_from_owned(
+                field_data_types,
+            )),
+        })
+    }
+}
+
+impl RowEncoder for CompactedRowEncoder<'_> {
+    fn start_new_row(&mut self) -> Result<()> {
+        self.writer.reset();
+        Ok(())
+    }
+
+    fn encode_field(&mut self, pos: usize, value: Datum) -> Result<()> {
+        self.field_writers
+            .get(pos)
+            .ok_or_else(|| IllegalArgument {
+                message: format!(
+                    "invalid position {} when attempting to encode value {}",
+                    pos, value
+                ),
+            })?
+            .write_value(&mut self.writer, pos, &value)
+    }
+
+    fn finish_row(&mut self) -> Result<impl BinaryRow> {
+        Ok(CompactedRow::deserialize(
+            Arc::clone(&self.compacted_row_deserializer),
+            self.arity,
+            self.writer.buffer(),
+        ))
+    }
+
+    fn close(&mut self) -> Result<()> {
+        // do nothing
+        Ok(())
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/encode/mod.rs b/fluss-rust/crates/fluss/src/row/encode/mod.rs
index 6c6eed9936..34863aba19 100644
--- a/fluss-rust/crates/fluss/src/row/encode/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/mod.rs
@@ -16,11 +16,13 @@
 // under the License.
 
 mod compacted_key_encoder;
+mod compacted_row_encoder;
 
 use crate::error::Result;
-use crate::metadata::{DataLakeFormat, RowType};
-use crate::row::InternalRow;
+use crate::metadata::{DataLakeFormat, DataType, KvFormat, RowType};
 use crate::row::encode::compacted_key_encoder::CompactedKeyEncoder;
+use crate::row::encode::compacted_row_encoder::CompactedRowEncoder;
+use crate::row::{BinaryRow, Datum, InternalRow};
 use bytes::Bytes;
 
 /// An interface for encoding key of row into bytes.
@@ -62,3 +64,65 @@ impl dyn KeyEncoder {
         }
     }
 }
+
+/// An encoder that writes [`BinaryRow`]s. The same encoder is used to write
+/// multiple rows, one after another. When writing a new row:
+///
+/// 1. call method [`RowEncoder::start_new_row()`] to start the writing.
+/// 2. call method [`RowEncoder::encode_field()`] to write the row's field.
+/// 3. call method [`RowEncoder::finish_row()`] to finish the writing and get the written row.
+#[allow(dead_code)]
+pub trait RowEncoder {
+    /// Start to write a new row.
+    ///
+    /// # Returns
+    /// * Ok(()) if successful
+    fn start_new_row(&mut self) -> Result<()>;
+
+    /// Write the row's field in given pos with given value.
+    ///
+    /// # Arguments
+    /// * pos - the position of the field to write.
+    /// * value - the value of the field to write.
+    ///
+    /// # Returns
+    /// * Ok(()) if successful
+    fn encode_field(&mut self, pos: usize, value: Datum) -> Result<()>;
+
+    /// Finishes writing the row and returns the written row.
+    ///
+    /// Note that the returned row borrows from [`RowEncoder`]'s internal buffer, which is reused for subsequent rows.
+    /// [`RowEncoder::start_new_row()`] should only be called after the returned row goes out of scope.
+    ///
+    /// # Returns
+    /// * the written row
+    fn finish_row(&mut self) -> Result<impl BinaryRow>;
+
+    /// Closes the row encoder
+    ///
+    /// # Returns
+    /// * Ok(()) if successful
+    fn close(&mut self) -> Result<()>;
+}
+
+#[allow(dead_code)]
+pub struct RowEncoderFactory {}
+
+#[allow(dead_code)]
+impl RowEncoderFactory {
+    pub fn create(kv_format: KvFormat, row_type: &RowType) -> Result<impl RowEncoder> {
+        Self::create_for_field_types(kv_format, row_type.field_types().cloned().collect())
+    }
+
+    pub fn create_for_field_types(
+        kv_format: KvFormat,
+        field_data_types: Vec<DataType>,
+    ) -> Result<impl RowEncoder> {
+        match kv_format {
+            KvFormat::INDEXED => {
+                todo!()
+            }
+            KvFormat::COMPACTED => CompactedRowEncoder::new(field_data_types),
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 144d64fd88..499606354c 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -19,7 +19,7 @@ mod column;
 
 mod datum;
 
-mod binary;
+pub mod binary;
 pub mod compacted;
 mod encode;
 mod field_getter;
@@ -27,7 +27,7 @@ mod field_getter;
 pub use column::*;
 pub use datum::*;
 
-pub trait BinaryRow {
+pub trait BinaryRow: InternalRow {
     /// Returns the binary representation of this row as a byte slice.
     fn as_bytes(&self) -> &[u8];
 }

From c4d5b0214faf7797968b9e478482b0869b6bdb5a Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Fri, 16 Jan 2026 02:27:04 +0000
Subject: [PATCH 067/287] feat: add column projection support to Python
 LogScanner (#151)

---
 fluss-rust/bindings/python/example/example.py |  22 ++++
 fluss-rust/bindings/python/src/table.rs       | 112 ++++++++++++++----
 2 files changed, 109 insertions(+), 25 deletions(-)

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 0523f943e4..0b1e67d3e6 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -178,6 +178,28 @@ async def main():
     except Exception as e:
         print(f"Error during scanning: {e}")
 
+    # Demo: Column projection
+    print("\n--- Testing Column Projection ---")
+    try:
+        # Project specific columns by index
+        print("\n1. Projection by index [0, 1] (id, name):")
+        scanner_index = await table.new_log_scanner(project=[0, 1])
+        scanner_index.subscribe(None, None)
+        df_projected = scanner_index.to_pandas()
+        print(df_projected.head())
+        print(f"   Projected {df_projected.shape[1]} columns: {list(df_projected.columns)}")
+
+        # Project specific columns by name (Pythonic!)
+        print("\n2. Projection by name ['name', 'score'] (Pythonic):")
+        scanner_names = await table.new_log_scanner(columns=["name", "score"])
+        scanner_names.subscribe(None, None)
+        df_named = scanner_names.to_pandas()
+        print(df_named.head())
+        print(f"   Projected {df_named.shape[1]} columns: {list(df_named.columns)}")
+
+    except Exception as e:
+        print(f"Error during projection: {e}")
+
     # Close connection
     conn.close()
     print("\nConnection closed")
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 8a1164856b..6cd13c4fa1 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -34,6 +34,12 @@ pub struct FlussTable {
     has_primary_key: bool,
 }
 
+/// Internal enum to represent different projection types
+enum ProjectionType {
+    Indices(Vec<usize>),
+    Names(Vec<String>),
+}
+
 #[pymethods]
 impl FlussTable {
     /// Create a new append writer for the table
@@ -57,32 +63,39 @@ impl FlussTable {
         })
     }
 
-    /// Create a new log scanner for the table
-    fn new_log_scanner<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        let conn = self.connection.clone();
-        let metadata = self.metadata.clone();
-        let table_info = self.table_info.clone();
-
-        future_into_py(py, async move {
-            let fluss_table =
-                fcore::client::FlussTable::new(&conn, metadata.clone(), table_info.clone());
-
-            let table_scan = fluss_table.new_scan();
-
-            let rust_scanner = table_scan.create_log_scanner().map_err(|e| {
-                PyErr::new::<pyo3::exceptions::PyRuntimeError, _>(format!(
-                    "Failed to create log scanner: {e:?}"
-                ))
-            })?;
-
-            let admin = conn
-                .get_admin()
-                .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
+    /// Create a new log scanner for the table.
+    ///
+    /// Args:
+    ///     project: Optional list of column indices (0-based) to include in the scan.
+    ///     columns: Optional list of column names to include in the scan.
+    ///
+    /// Returns:
+    ///     LogScanner, optionally with projection applied
+    ///
+    /// Note:
+    ///     Specify only one of 'project' or 'columns'.
+    ///     If neither is specified, all columns are included.
+    ///     Rust side will validate the projection parameters.
+    ///
+    #[pyo3(signature = (project=None, columns=None))]
+    pub fn new_log_scanner<'py>(
+        &self,
+        py: Python<'py>,
+        project: Option<Vec<usize>>,
+        columns: Option<Vec<String>>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let projection = match (project, columns) {
+            (Some(_), Some(_)) => {
+                return Err(FlussError::new_err(
+                    "Specify only one of 'project' or 'columns'".to_string(),
+                ));
+            }
+            (Some(indices), None) => Some(ProjectionType::Indices(indices)),
+            (None, Some(names)) => Some(ProjectionType::Names(names)),
+            (None, None) => None,
+        };
 
-            let py_scanner = LogScanner::from_core(rust_scanner, admin, table_info.clone());
-            Python::attach(|py| Py::new(py, py_scanner))
-        })
+        self.create_log_scanner_internal(py, projection)
     }
 
     /// Get table information
@@ -126,6 +139,55 @@ impl FlussTable {
             has_primary_key,
         }
     }
+
+    /// Internal helper to create log scanner with optional projection
+    fn create_log_scanner_internal<'py>(
+        &self,
+        py: Python<'py>,
+        projection: Option<ProjectionType>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let conn = self.connection.clone();
+        let metadata = self.metadata.clone();
+        let table_info = self.table_info.clone();
+
+        future_into_py(py, async move {
+            let fluss_table =
+                fcore::client::FlussTable::new(&conn, metadata.clone(), table_info.clone());
+
+            let mut table_scan = fluss_table.new_scan();
+
+            // Apply projection if specified
+            if let Some(proj) = projection {
+                table_scan = match proj {
+                    ProjectionType::Indices(indices) => {
+                        table_scan.project(&indices).map_err(|e| {
+                            FlussError::new_err(format!("Failed to project columns: {e}"))
+                        })?
+                    }
+                    ProjectionType::Names(names) => {
+                        // Convert Vec<String> to Vec<&str> for the API
+                        let column_name_refs: Vec<&str> =
+                            names.iter().map(|s| s.as_str()).collect();
+                        table_scan.project_by_name(&column_name_refs).map_err(|e| {
+                            FlussError::new_err(format!("Failed to project columns: {e}"))
+                        })?
+                    }
+                };
+            }
+
+            let rust_scanner = table_scan
+                .create_log_scanner()
+                .map_err(|e| FlussError::new_err(format!("Failed to create log scanner: {e}")))?;
+
+            let admin = conn
+                .get_admin()
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+            let py_scanner = LogScanner::from_core(rust_scanner, admin, table_info.clone());
+            Python::attach(|py| Py::new(py, py_scanner))
+        })
+    }
 }
 
 /// Writer for appending data to a Fluss table

From dce62d6d4a0fa9d4a38ee1aec23a57b8dfe35b18 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Fri, 16 Jan 2026 14:22:48 +0800
Subject: [PATCH 068/287] chore: fix read deadlock (#165)

---
 .../src/client/table/log_fetch_buffer.rs      | 26 ++++++++++++-------
 1 file changed, 17 insertions(+), 9 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index e9bac53f1a..c55c994b03 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -211,19 +211,27 @@ impl LogFetchBuffer {
     pub fn buffered_buckets(&self) -> Vec<TableBucket> {
         let mut buckets = Vec::new();
 
-        let next_in_line_fetch = self.next_in_line_fetch.lock();
-        if let Some(complete_fetch) = next_in_line_fetch.as_ref() {
-            if !complete_fetch.is_consumed() {
-                buckets.push(complete_fetch.table_bucket().clone());
+        // Avoid holding multiple locks at once to prevent lock-order inversion.
+        {
+            let next_in_line_fetch = self.next_in_line_fetch.lock();
+            if let Some(complete_fetch) = next_in_line_fetch.as_ref() {
+                if !complete_fetch.is_consumed() {
+                    buckets.push(complete_fetch.table_bucket().clone());
+                }
             }
         }
 
-        let completed = self.completed_fetches.lock();
-        for fetch in completed.iter() {
-            buckets.push(fetch.table_bucket().clone());
+        {
+            let completed = self.completed_fetches.lock();
+            for fetch in completed.iter() {
+                buckets.push(fetch.table_bucket().clone());
+            }
+        }
+
+        {
+            let pending = self.pending_fetches.lock();
+            buckets.extend(pending.keys().cloned());
         }
-        let pending = self.pending_fetches.lock();
-        buckets.extend(pending.keys().cloned());
         buckets
     }
 }

From 93048ed0d783987da266904ee216d5506e0b2204 Mon Sep 17 00:00:00 2001
From: Andrea Bozzo <andreabozzo92@gmail.com>
Date: Sat, 17 Jan 2026 02:45:00 +0100
Subject: [PATCH 069/287] feat: introduce lookup support for primary key tables
 (#159)

---
 .../crates/fluss/src/client/table/lookup.rs   | 252 ++++++++++++++++++
 .../crates/fluss/src/client/table/mod.rs      |  38 ++-
 .../fluss/src/client/write/write_format.rs    |   4 +-
 fluss-rust/crates/fluss/src/metadata/table.rs |   1 +
 .../crates/fluss/src/proto/fluss_api.proto    |  28 ++
 .../crates/fluss/src/record/kv/kv_record.rs   |  12 +-
 .../fluss/src/record/kv/kv_record_batch.rs    |  15 +-
 .../src/record/kv/kv_record_batch_builder.rs  |  30 +--
 .../fluss/src/row/compacted/compacted_row.rs  |  58 ++--
 .../src/row/compacted/compacted_row_reader.rs |  18 +-
 .../src/row/encode/compacted_row_encoder.rs   |  19 +-
 fluss-rust/crates/fluss/src/row/encode/mod.rs |   8 +-
 fluss-rust/crates/fluss/src/row/mod.rs        |   4 +-
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |   4 +
 .../crates/fluss/src/rpc/message/lookup.rs    |  67 +++++
 .../crates/fluss/src/rpc/message/mod.rs       |   2 +
 fluss-rust/crates/fluss/src/util/varint.rs    |  14 +-
 17 files changed, 478 insertions(+), 96 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/table/lookup.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/lookup.rs

diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
new file mode 100644
index 0000000000..1d32ebd75e
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -0,0 +1,252 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::bucketing::BucketingFunction;
+use crate::client::connection::FlussConnection;
+use crate::client::metadata::Metadata;
+use crate::error::{Error, Result};
+use crate::metadata::{RowType, TableBucket, TableInfo};
+use crate::row::InternalRow;
+use crate::row::compacted::CompactedRow;
+use crate::row::encode::KeyEncoder;
+use crate::rpc::ApiError;
+use crate::rpc::message::LookupRequest;
+use std::sync::Arc;
+
+/// The result of a lookup operation.
+///
+/// Contains the rows returned from a lookup. For primary key lookups,
+/// this will contain at most one row. For prefix key lookups (future),
+/// this may contain multiple rows.
+pub struct LookupResult<'a> {
+    rows: Vec<Vec<u8>>,
+    row_type: &'a RowType,
+}
+
+impl<'a> LookupResult<'a> {
+    /// Creates a new LookupResult from a list of row bytes.
+    fn new(rows: Vec<Vec<u8>>, row_type: &'a RowType) -> Self {
+        Self { rows, row_type }
+    }
+
+    /// Creates an empty LookupResult.
+    fn empty(row_type: &'a RowType) -> Self {
+        Self {
+            rows: Vec::new(),
+            row_type,
+        }
+    }
+
+    /// Returns the only row in the result set as a [`CompactedRow`].
+    ///
+    /// This method provides a zero-copy view of the row data, which means the returned
+    /// `CompactedRow` borrows from this result set and cannot outlive it.
+    ///
+    /// # Returns
+    /// - `Ok(Some(row))`: If exactly one row exists.
+    /// - `Ok(None)`: If the result set is empty.
+    /// - `Err(Error::UnexpectedError)`: If the result set contains more than one row.
+    ///
+    pub fn get_single_row(&self) -> Result<Option<CompactedRow<'_>>> {
+        match self.rows.len() {
+            0 => Ok(None),
+            1 => Ok(Some(CompactedRow::from_bytes(self.row_type, &self.rows[0]))),
+            _ => Err(Error::UnexpectedError {
+                message: "LookupResult contains multiple rows, use get_rows() instead".to_string(),
+                source: None,
+            }),
+        }
+    }
+
+    /// Returns all rows as CompactedRows.
+    pub fn get_rows(&self) -> Vec<CompactedRow<'_>> {
+        self.rows
+            .iter()
+            .map(|bytes| CompactedRow::from_bytes(self.row_type, bytes))
+            .collect()
+    }
+}
+
+/// Configuration and factory struct for creating lookup operations.
+///
+/// `TableLookup` follows the same pattern as `TableScan` and `TableAppend`,
+/// providing a builder-style API for configuring lookup operations before
+/// creating the actual `Lookuper`.
+///
+/// # Example
+/// ```ignore
+/// let table = conn.get_table(&table_path).await?;
+/// let mut lookuper = table.new_lookup()?.create_lookuper()?;
+/// let result = lookuper.lookup(&row).await?;
+/// if let Some(value) = result.get_single_row()? {
+///     println!("Found: {:?}", value);
+/// }
+/// ```
+// TODO: Add lookup_by(column_names) for prefix key lookups (PrefixKeyLookuper)
+// TODO: Add create_typed_lookuper<T>() for typed lookups with POJO mapping
+pub struct TableLookup<'a> {
+    conn: &'a FlussConnection,
+    table_info: TableInfo,
+    metadata: Arc<Metadata>,
+}
+
+impl<'a> TableLookup<'a> {
+    pub(super) fn new(
+        conn: &'a FlussConnection,
+        table_info: TableInfo,
+        metadata: Arc<Metadata>,
+    ) -> Self {
+        Self {
+            conn,
+            table_info,
+            metadata,
+        }
+    }
+
+    /// Creates a `Lookuper` for performing key-based lookups.
+    ///
+    /// The lookuper will automatically encode the key and compute the bucket
+    /// for each lookup using the appropriate bucketing function.
+    pub fn create_lookuper(self) -> Result<Lookuper<'a>> {
+        let num_buckets = self.table_info.get_num_buckets();
+
+        // Get data lake format from table config for bucketing function
+        let data_lake_format = self.table_info.get_table_config().get_datalake_format()?;
+        let bucketing_function = <dyn BucketingFunction>::of(data_lake_format.as_ref());
+
+        // Create key encoder for the primary key fields
+        let pk_fields = self.table_info.get_physical_primary_keys().to_vec();
+        let key_encoder =
+            <dyn KeyEncoder>::of(self.table_info.row_type(), pk_fields, data_lake_format)?;
+
+        Ok(Lookuper {
+            conn: self.conn,
+            table_info: self.table_info,
+            metadata: self.metadata,
+            bucketing_function,
+            key_encoder,
+            num_buckets,
+        })
+    }
+}
+
+/// Performs key-based lookups against a primary key table.
+///
+/// The `Lookuper` automatically encodes the lookup key, computes the target
+/// bucket, finds the appropriate tablet server, and retrieves the value.
+///
+/// # Example
+/// ```ignore
+/// let mut lookuper = table.new_lookup()?.create_lookuper()?;
+/// let row = GenericRow::new(vec![Datum::Int32(42)]); // lookup key
+/// let result = lookuper.lookup(&row).await?;
+/// ```
+// TODO: Support partitioned tables (extract partition from key)
+pub struct Lookuper<'a> {
+    conn: &'a FlussConnection,
+    table_info: TableInfo,
+    metadata: Arc<Metadata>,
+    bucketing_function: Box<dyn BucketingFunction>,
+    key_encoder: Box<dyn KeyEncoder>,
+    num_buckets: i32,
+}
+
+impl<'a> Lookuper<'a> {
+    /// Looks up a value by its primary key.
+    ///
+    /// The key is encoded and the bucket is automatically computed using
+    /// the table's bucketing function.
+    ///
+    /// # Arguments
+    /// * `row` - The row containing the primary key field values
+    ///
+    /// # Returns
+    /// * `Ok(LookupResult)` - The lookup result (may be empty if key not found)
+    /// * `Err(Error)` - If the lookup fails
+    pub async fn lookup(&mut self, row: &dyn InternalRow) -> Result<LookupResult<'_>> {
+        // todo: support batch lookup
+        // Encode the key from the row
+        let encoded_key = self.key_encoder.encode_key(row)?;
+        let key_bytes = encoded_key.to_vec();
+
+        // Compute bucket from encoded key
+        let bucket_id = self
+            .bucketing_function
+            .bucketing(&key_bytes, self.num_buckets)?;
+
+        let table_id = self.table_info.get_table_id();
+        let table_bucket = TableBucket::new(table_id, bucket_id);
+
+        // Find the leader for this bucket
+        let cluster = self.metadata.get_cluster();
+        let leader =
+            cluster
+                .leader_for(&table_bucket)
+                .ok_or_else(|| Error::LeaderNotAvailable {
+                    message: format!("No leader found for table bucket: {table_bucket}"),
+                })?;
+
+        // Get connection to the tablet server
+        let tablet_server =
+            cluster
+                .get_tablet_server(leader.id())
+                .ok_or_else(|| Error::LeaderNotAvailable {
+                    message: format!(
+                        "Tablet server {} is not found in metadata cache",
+                        leader.id()
+                    ),
+                })?;
+
+        let connections = self.conn.get_connections();
+        let connection = connections.get_connection(tablet_server).await?;
+
+        // Send lookup request
+        let request = LookupRequest::new(table_id, None, bucket_id, vec![key_bytes]);
+        let response = connection.request(request).await?;
+
+        // Extract the values from response
+        if let Some(bucket_resp) = response.buckets_resp.into_iter().next() {
+            // Check for errors
+            if let Some(error_code) = bucket_resp.error_code {
+                if error_code != 0 {
+                    return Err(Error::FlussAPIError {
+                        api_error: ApiError {
+                            code: error_code,
+                            message: bucket_resp.error_message.unwrap_or_default(),
+                        },
+                    });
+                }
+            }
+
+            // Collect all values
+            let rows: Vec<Vec<u8>> = bucket_resp
+                .values
+                .into_iter()
+                .filter_map(|pb_value| pb_value.values)
+                .collect();
+
+            return Ok(LookupResult::new(rows, self.table_info.row_type()));
+        }
+
+        Ok(LookupResult::empty(self.table_info.row_type()))
+    }
+
+    /// Returns a reference to the table info.
+    pub fn table_info(&self) -> &TableInfo {
+        &self.table_info
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 26341d70a6..7356be2393 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -17,14 +17,14 @@
 
 use crate::client::connection::FlussConnection;
 use crate::client::metadata::Metadata;
+use crate::error::{Error, Result};
 use crate::metadata::{TableInfo, TablePath};
 use std::sync::Arc;
 
-use crate::error::Result;
-
 pub const EARLIEST_OFFSET: i64 = -2;
 
 mod append;
+mod lookup;
 
 mod log_fetch_buffer;
 mod remote_log;
@@ -32,6 +32,7 @@ mod scanner;
 mod writer;
 
 pub use append::{AppendWriter, TableAppend};
+pub use lookup::{LookupResult, Lookuper, TableLookup};
 pub use scanner::{LogScanner, RecordBatchLogScanner, TableScan};
 
 #[allow(dead_code)]
@@ -85,6 +86,39 @@ impl<'a> FlussTable<'a> {
     pub fn has_primary_key(&self) -> bool {
         self.has_primary_key
     }
+
+    /// Creates a new `TableLookup` for configuring lookup operations.
+    ///
+    /// This follows the same pattern as `new_scan()` and `new_append()`,
+    /// returning a configuration object that can be used to create a `Lookuper`.
+    ///
+    /// The table must have a primary key (be a primary key table).
+    ///
+    /// # Returns
+    /// * `Ok(TableLookup)` - A lookup configuration object
+    /// * `Err(Error)` - If the table doesn't have a primary key
+    ///
+    /// # Example
+    /// ```ignore
+    /// let table = conn.get_table(&table_path).await?;
+    /// let mut lookuper = table.new_lookup()?.create_lookuper()?;
+    /// let row = GenericRow::new(vec![Datum::Int32(42)]); // row holding the primary key field values
+    /// if let Some(value) = lookuper.lookup(&row).await?.get_single_row()? {
+    ///     println!("Found value: {:?}", value);
+    /// }
+    /// ```
+    pub fn new_lookup(&self) -> Result<TableLookup<'_>> {
+        if !self.has_primary_key {
+            return Err(Error::UnsupportedOperation {
+                message: "Lookup is only supported for primary key tables".to_string(),
+            });
+        }
+        Ok(TableLookup::new(
+            self.conn,
+            self.table_info.clone(),
+            self.metadata.clone(),
+        ))
+    }
 }
 
 impl<'a> Drop for FlussTable<'a> {
diff --git a/fluss-rust/crates/fluss/src/client/write/write_format.rs b/fluss-rust/crates/fluss/src/client/write/write_format.rs
index d65e42de68..4a0c0d8afa 100644
--- a/fluss-rust/crates/fluss/src/client/write/write_format.rs
+++ b/fluss-rust/crates/fluss/src/client/write/write_format.rs
@@ -39,7 +39,7 @@ impl WriteFormat {
         match self {
             WriteFormat::CompactedKv => Ok(KvFormat::COMPACTED),
             other => Err(IllegalArgument {
-                message: format!("WriteFormat `{}` is not a KvFormat", other),
+                message: format!("WriteFormat `{other}` is not a KvFormat"),
             }),
         }
     }
@@ -48,7 +48,7 @@ impl WriteFormat {
         match kv_format {
             KvFormat::COMPACTED => Ok(WriteFormat::CompactedKv),
             other => Err(IllegalArgument {
-                message: format!("Unknown KvFormat: `{}`", other),
+                message: format!("Unknown KvFormat: `{other}`"),
             }),
         }
     }
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index b1e8a90ba2..da85b0c2da 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -729,6 +729,7 @@ impl TableConfig {
         ArrowCompressionInfo::from_conf(&self.properties)
     }
 
+    /// Returns the data lake format if configured, or None if not set.
     pub fn get_datalake_format(&self) -> Result<Option<DataLakeFormat>> {
         self.properties
             .get("table.datalake.format")
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index dbbb45daea..b4ae8405aa 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -317,4 +317,32 @@ message GetFileSystemSecurityTokenResponse {
   required bytes token = 2;
   optional int64 expiration_time = 3;
   repeated PbKeyValue addition_info = 4;
+}
+
+// lookup request and response
+message LookupRequest {
+  required int64 table_id = 1;
+  repeated PbLookupReqForBucket buckets_req = 2;
+}
+
+message LookupResponse {
+  repeated PbLookupRespForBucket buckets_resp = 1;
+}
+
+message PbLookupReqForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  repeated bytes key = 3;
+}
+
+message PbLookupRespForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  optional int32 error_code = 3;
+  optional string error_message = 4;
+  repeated PbValue values = 5;
+}
+
+message PbValue {
+  optional bytes values = 1;
 }
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
index 8c30713d42..ab8c2ac1dd 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
@@ -101,7 +101,7 @@ impl KvRecord {
         let size_i32 = i32::try_from(size_in_bytes).map_err(|_| {
             io::Error::new(
                 io::ErrorKind::InvalidInput,
-                format!("Record size {} exceeds i32::MAX", size_in_bytes),
+                format!("Record size {size_in_bytes} exceeds i32::MAX"),
             )
         })?;
         buf.put_i32_le(size_i32);
@@ -141,7 +141,7 @@ impl KvRecord {
         if size_in_bytes_i32 < 0 {
             return Err(io::Error::new(
                 io::ErrorKind::InvalidData,
-                format!("Invalid record length: {}", size_in_bytes_i32),
+                format!("Invalid record length: {size_in_bytes_i32}"),
             ));
         }
 
@@ -150,10 +150,7 @@ impl KvRecord {
         let total_size = size_in_bytes.checked_add(LENGTH_LENGTH).ok_or_else(|| {
             io::Error::new(
                 io::ErrorKind::InvalidData,
-                format!(
-                    "Record size overflow: {} + {}",
-                    size_in_bytes, LENGTH_LENGTH
-                ),
+                format!("Record size overflow: {size_in_bytes} + {LENGTH_LENGTH}"),
             )
         })?;
 
@@ -162,8 +159,7 @@ impl KvRecord {
             return Err(io::Error::new(
                 io::ErrorKind::UnexpectedEof,
                 format!(
-                    "Not enough bytes to read record: expected {}, available {}",
-                    total_size, available
+                    "Not enough bytes to read record: expected {total_size}, available {available}"
                 ),
             ));
         }
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
index 6ead64276a..eb3c09ad34 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
@@ -96,7 +96,7 @@ impl KvRecordBatch {
         if length_i32 < 0 {
             return Err(io::Error::new(
                 io::ErrorKind::InvalidData,
-                format!("Invalid batch length: {}", length_i32),
+                format!("Invalid batch length: {length_i32}"),
             ));
         }
 
@@ -150,10 +150,7 @@ impl KvRecordBatch {
         if size < RECORD_BATCH_HEADER_SIZE {
             return Err(io::Error::new(
                 io::ErrorKind::InvalidData,
-                format!(
-                    "Batch size {} is less than header size {}",
-                    size, RECORD_BATCH_HEADER_SIZE
-                ),
+                format!("Batch size {size} is less than header size {RECORD_BATCH_HEADER_SIZE}"),
             ));
         }
 
@@ -276,7 +273,7 @@ impl KvRecordBatch {
         if count < 0 {
             return Err(io::Error::new(
                 io::ErrorKind::InvalidData,
-                format!("Invalid record count: {}", count),
+                format!("Invalid record count: {count}"),
             ));
         }
         Ok(KvRecordIterator {
@@ -321,7 +318,7 @@ impl Iterator for KvRecordIterator {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::{DataTypes, KvFormat};
+    use crate::metadata::{DataTypes, KvFormat, RowType};
     use crate::record::kv::{CURRENT_KV_MAGIC_VALUE, KvRecordBatchBuilder};
     use crate::row::binary::BinaryWriter;
     use crate::row::compacted::CompactedRow;
@@ -366,8 +363,8 @@ mod tests {
         let mut value1_writer = CompactedRowWriter::new(1);
         value1_writer.write_bytes(&[1, 2, 3, 4, 5]);
 
-        let data_types = &[DataTypes::bytes()];
-        let row = &CompactedRow::from_bytes(data_types, value1_writer.buffer());
+        let row_type = RowType::with_data_types([DataTypes::bytes()].to_vec());
+        let row = &CompactedRow::from_bytes(&row_type, value1_writer.buffer());
         builder.append_row(key1, Some(row)).unwrap();
 
         let key2 = b"key2";
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
index 7d1a7972e4..c36a86121b 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
@@ -248,7 +248,7 @@ impl KvRecordBatchBuilder {
         let total_size = i32::try_from(size_without_length).map_err(|_| {
             io::Error::new(
                 io::ErrorKind::InvalidInput,
-                format!("Batch size {} exceeds i32::MAX", size_without_length),
+                format!("Batch size {size_without_length} exceeds i32::MAX"),
             )
         })?;
 
@@ -317,14 +317,16 @@ impl Drop for KvRecordBatchBuilder {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::{DataType, DataTypes};
+    use crate::metadata::{DataTypes, RowType};
     use crate::row::binary::BinaryWriter;
     use crate::row::compacted::{CompactedRow, CompactedRowWriter};
+    use std::sync::LazyLock;
+    static TEST_ROW_TYPE: LazyLock<RowType> =
+        LazyLock::new(|| RowType::with_data_types(vec![DataTypes::bytes()]));
 
     // Helper function to create a CompactedRowWriter with a single bytes field for testing
     fn create_test_row(data: &[u8]) -> CompactedRow<'_> {
-        const DATA_TYPE: &[DataType] = &[DataTypes::bytes()];
-        CompactedRow::from_bytes(DATA_TYPE, data)
+        CompactedRow::from_bytes(&TEST_ROW_TYPE, data)
     }
 
     #[test]
@@ -483,7 +485,6 @@ mod tests {
 
     #[test]
     fn test_builder_with_compacted_row_writer() {
-        use crate::metadata::{DataType, IntType, StringType};
         use crate::record::kv::KvRecordBatch;
         use crate::row::InternalRow;
         use crate::row::compacted::CompactedRow;
@@ -491,18 +492,13 @@ mod tests {
         let mut builder = KvRecordBatchBuilder::new(1, 100000, KvFormat::COMPACTED);
         builder.set_writer_state(100, 5);
 
-        let types = vec![
-            DataType::Int(IntType::new()),
-            DataType::String(StringType::new()),
-        ];
-
         // Create and append first record with CompactedRowWriter
         let mut row_writer1 = CompactedRowWriter::new(2);
         row_writer1.write_int(42);
         row_writer1.write_string("hello");
 
-        let data_types = &[DataTypes::int(), DataTypes::string()];
-        let row1 = &CompactedRow::from_bytes(data_types, row_writer1.buffer());
+        let row_type = RowType::with_data_types([DataTypes::int(), DataTypes::string()].to_vec());
+        let row1 = &CompactedRow::from_bytes(&row_type, row_writer1.buffer());
 
         let key1 = b"key1";
         assert!(builder.has_room_for_row(key1, Some(row1)));
@@ -513,7 +509,7 @@ mod tests {
         row_writer2.write_int(100);
         row_writer2.write_string("world");
 
-        let row2 = &CompactedRow::from_bytes(data_types, row_writer2.buffer());
+        let row2 = &CompactedRow::from_bytes(&row_type, row_writer2.buffer());
 
         let key2 = b"key2";
         builder.append_row(key2, Some(row2)).unwrap();
@@ -539,14 +535,14 @@ mod tests {
         // Verify first record
         let record1 = records[0].as_ref().unwrap();
         assert_eq!(record1.key().as_ref(), key1);
-        let row1 = CompactedRow::from_bytes(&types, record1.value().unwrap());
+        let row1 = CompactedRow::from_bytes(&row_type, record1.value().unwrap());
         assert_eq!(row1.get_int(0), 42);
         assert_eq!(row1.get_string(1), "hello");
 
         // Verify second record
         let record2 = records[1].as_ref().unwrap();
         assert_eq!(record2.key().as_ref(), key2);
-        let row2 = CompactedRow::from_bytes(&types, record2.value().unwrap());
+        let row2 = CompactedRow::from_bytes(&row_type, record2.value().unwrap());
         assert_eq!(row2.get_int(0), 100);
         assert_eq!(row2.get_string(1), "world");
 
@@ -561,8 +557,8 @@ mod tests {
         let mut row_writer = CompactedRowWriter::new(1);
         row_writer.write_int(42);
 
-        let data_types = &[DataTypes::int()];
-        let row = &CompactedRow::from_bytes(data_types, row_writer.buffer());
+        let row_type = RowType::with_data_types([DataTypes::int()].to_vec());
+        let row = &CompactedRow::from_bytes(&row_type, row_writer.buffer());
 
         // INDEXED format should reject append_row
         let mut indexed_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::INDEXED);
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index 9ff3b5ffd5..144f8985cf 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -15,7 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::metadata::DataType;
+use crate::metadata::RowType;
 use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
 use crate::row::{BinaryRow, GenericRow, InternalRow};
 use std::sync::{Arc, OnceLock};
@@ -38,10 +38,10 @@ pub fn calculate_bit_set_width_in_bytes(arity: usize) -> usize {
 
 #[allow(dead_code)]
 impl<'a> CompactedRow<'a> {
-    pub fn from_bytes(data_types: &'a [DataType], data: &'a [u8]) -> Self {
+    pub fn from_bytes(row_type: &'a RowType, data: &'a [u8]) -> Self {
         Self::deserialize(
-            Arc::new(CompactedRowDeserializer::new(data_types)),
-            data_types.len(),
+            Arc::new(CompactedRowDeserializer::new(row_type)),
+            row_type.fields().len(),
             data,
         )
     }
@@ -84,7 +84,10 @@ impl<'a> InternalRow for CompactedRow<'a> {
     }
 
     fn is_null_at(&self, pos: usize) -> bool {
-        self.deserializer.get_data_types()[pos].is_nullable() && self.reader.is_null_at(pos)
+        self.deserializer.get_row_type().fields().as_slice()[pos]
+            .data_type
+            .is_nullable()
+            && self.reader.is_null_at(pos)
     }
 
     fn get_boolean(&self, pos: usize) -> bool {
@@ -138,7 +141,7 @@ mod tests {
     use crate::row::binary::BinaryWriter;
 
     use crate::metadata::{
-        BigIntType, BooleanType, BytesType, DoubleType, FloatType, IntType, SmallIntType,
+        BigIntType, BooleanType, BytesType, DataType, DoubleType, FloatType, IntType, SmallIntType,
         StringType, TinyIntType,
     };
     use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
@@ -146,7 +149,7 @@ mod tests {
     #[test]
     fn test_compacted_row() {
         // Test all primitive types
-        let types = vec![
+        let row_type = RowType::with_data_types(vec![
             DataType::Boolean(BooleanType::new()),
             DataType::TinyInt(TinyIntType::new()),
             DataType::SmallInt(SmallIntType::new()),
@@ -156,9 +159,9 @@ mod tests {
             DataType::Double(DoubleType::new()),
             DataType::String(StringType::new()),
             DataType::Bytes(BytesType::new()),
-        ];
+        ]);
 
-        let mut writer = CompactedRowWriter::new(types.len());
+        let mut writer = CompactedRowWriter::new(row_type.fields().len());
 
         writer.write_boolean(true);
         writer.write_byte(1);
@@ -171,7 +174,7 @@ mod tests {
         writer.write_bytes(&[1, 2, 3, 4, 5]);
 
         let bytes = writer.to_bytes();
-        let mut row = CompactedRow::from_bytes(types.as_slice(), bytes.as_ref());
+        let mut row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
         assert_eq!(row.get_field_count(), 9);
         assert!(row.get_boolean(0));
@@ -185,20 +188,23 @@ mod tests {
         assert_eq!(row.get_bytes(8), &[1, 2, 3, 4, 5]);
 
         // Test with nulls
-        let types = vec![
-            DataType::Int(IntType::new()),
-            DataType::String(StringType::new()),
-            DataType::Double(DoubleType::new()),
-        ];
+        let row_type = RowType::with_data_types(
+            [
+                DataType::Int(IntType::new()),
+                DataType::String(StringType::new()),
+                DataType::Double(DoubleType::new()),
+            ]
+            .to_vec(),
+        );
 
-        let mut writer = CompactedRowWriter::new(types.len());
+        let mut writer = CompactedRowWriter::new(row_type.fields().len());
 
         writer.write_int(100);
         writer.set_null_at(1);
         writer.write_double(2.71);
 
         let bytes = writer.to_bytes();
-        row = CompactedRow::from_bytes(types.as_slice(), bytes.as_ref());
+        row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
         assert!(!row.is_null_at(0));
         assert!(row.is_null_at(1));
@@ -211,26 +217,28 @@ mod tests {
         assert_eq!(row.get_int(0), 100);
 
         // Test from_bytes
-        let types = vec![
+        let row_type = RowType::with_data_types(vec![
             DataType::Int(IntType::new()),
             DataType::String(StringType::new()),
-        ];
+        ]);
 
-        let mut writer = CompactedRowWriter::new(types.len());
+        let mut writer = CompactedRowWriter::new(row_type.fields().len());
         writer.write_int(-1);
         writer.write_string("test");
 
         let bytes = writer.to_bytes();
-        let mut row = CompactedRow::from_bytes(types.as_slice(), bytes.as_ref());
+        let mut row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
         assert_eq!(row.get_int(0), -1);
         assert_eq!(row.get_string(1), "test");
 
         // Test large row
         let num_fields = 100;
-        let types: Vec<DataType> = (0..num_fields)
-            .map(|_| DataType::Int(IntType::new()))
-            .collect();
+        let row_type = RowType::with_data_types(
+            (0..num_fields)
+                .map(|_| DataType::Int(IntType::new()))
+                .collect(),
+        );
 
         let mut writer = CompactedRowWriter::new(num_fields);
 
@@ -239,7 +247,7 @@ mod tests {
         }
 
         let bytes = writer.to_bytes();
-        row = CompactedRow::from_bytes(types.as_slice(), bytes.as_ref());
+        row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
         for i in 0..num_fields {
             assert_eq!(row.get_int(i), (i * 10) as i32);
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index 9ce50952f4..408706cc83 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -15,6 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::metadata::RowType;
 use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
 use crate::{
     metadata::DataType,
@@ -27,31 +28,32 @@ use std::str::from_utf8;
 #[allow(dead_code)]
 #[derive(Clone)]
 pub struct CompactedRowDeserializer<'a> {
-    schema: Cow<'a, [DataType]>,
+    row_type: Cow<'a, RowType>,
 }
 
 #[allow(dead_code)]
 impl<'a> CompactedRowDeserializer<'a> {
-    pub fn new(schema: &'a [DataType]) -> Self {
+    pub fn new(row_type: &'a RowType) -> Self {
         Self {
-            schema: Cow::Borrowed(schema),
+            row_type: Cow::Borrowed(row_type),
         }
     }
 
-    pub fn new_from_owned(schema: Vec<DataType>) -> Self {
+    pub fn new_from_owned(row_type: RowType) -> Self {
         Self {
-            schema: Cow::Owned(schema),
+            row_type: Cow::Owned(row_type),
         }
     }
 
-    pub fn get_data_types(&self) -> &[DataType] {
-        self.schema.as_ref()
+    pub fn get_row_type(&self) -> &RowType {
+        self.row_type.as_ref()
     }
 
     pub fn deserialize(&self, reader: &CompactedRowReader<'a>) -> GenericRow<'a> {
         let mut row = GenericRow::new();
         let mut cursor = reader.initial_position();
-        for (col_pos, dtype) in self.schema.iter().enumerate() {
+        for (col_pos, data_field) in self.row_type.fields().iter().enumerate() {
+            let dtype = &data_field.data_type;
             if dtype.is_nullable() && reader.is_null_at(col_pos) {
                 row.set_field(col_pos, Datum::Null);
                 continue;
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs
index fc39bb7a26..48b9f3ff58 100644
--- a/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs
@@ -17,7 +17,7 @@
 
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::DataType;
+use crate::metadata::RowType;
 use crate::row::Datum;
 use crate::row::binary::{BinaryRowFormat, BinaryWriter, ValueWriter};
 use crate::row::compacted::{CompactedRow, CompactedRowDeserializer, CompactedRowWriter};
@@ -33,18 +33,18 @@ pub struct CompactedRowEncoder<'a> {
 }
 
 impl<'a> CompactedRowEncoder<'a> {
-    pub fn new(field_data_types: Vec<DataType>) -> Result<Self> {
-        let field_writers = field_data_types
-            .iter()
+    pub fn new(row_type: RowType) -> Result<Self> {
+        let field_writers = row_type
+            .field_types()
             .map(|d| ValueWriter::create_value_writer(d, Some(&BinaryRowFormat::Compacted)))
             .collect::<Result<Vec<_>>>()?;
 
         Ok(Self {
-            arity: field_data_types.len(),
-            writer: CompactedRowWriter::new(field_data_types.len()),
+            arity: field_writers.len(),
+            writer: CompactedRowWriter::new(field_writers.len()),
             field_writers,
             compacted_row_deserializer: Arc::new(CompactedRowDeserializer::new_from_owned(
-                field_data_types,
+                row_type,
             )),
         })
     }
@@ -60,10 +60,7 @@ impl RowEncoder for CompactedRowEncoder<'_> {
         self.field_writers
             .get(pos)
             .ok_or_else(|| IllegalArgument {
-                message: format!(
-                    "invalid position {} when attempting to encode value {}",
-                    pos, value
-                ),
+                message: format!("invalid position {pos} when attempting to encode value {value}"),
             })?
             .write_value(&mut self.writer, pos, &value)
     }
diff --git a/fluss-rust/crates/fluss/src/row/encode/mod.rs b/fluss-rust/crates/fluss/src/row/encode/mod.rs
index 34863aba19..c294ecf1d1 100644
--- a/fluss-rust/crates/fluss/src/row/encode/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/mod.rs
@@ -19,7 +19,7 @@ mod compacted_key_encoder;
 mod compacted_row_encoder;
 
 use crate::error::Result;
-use crate::metadata::{DataLakeFormat, DataType, KvFormat, RowType};
+use crate::metadata::{DataLakeFormat, KvFormat, RowType};
 use crate::row::encode::compacted_key_encoder::CompactedKeyEncoder;
 use crate::row::encode::compacted_row_encoder::CompactedRowEncoder;
 use crate::row::{BinaryRow, Datum, InternalRow};
@@ -111,18 +111,18 @@ pub struct RowEncoderFactory {}
 #[allow(dead_code)]
 impl RowEncoderFactory {
     pub fn create(kv_format: KvFormat, row_type: &RowType) -> Result<impl RowEncoder> {
-        Self::create_for_field_types(kv_format, row_type.field_types().cloned().collect())
+        Self::create_for_field_types(kv_format, row_type.clone())
     }
 
     pub fn create_for_field_types(
         kv_format: KvFormat,
-        field_data_types: Vec<DataType>,
+        row_type: RowType,
     ) -> Result<impl RowEncoder> {
         match kv_format {
             KvFormat::INDEXED => {
                 todo!()
             }
-            KvFormat::COMPACTED => CompactedRowEncoder::new(field_data_types),
+            KvFormat::COMPACTED => CompactedRowEncoder::new(row_type),
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 499606354c..3477f1de20 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -21,11 +21,13 @@ mod datum;
 
 pub mod binary;
 pub mod compacted;
-mod encode;
+pub mod encode;
 mod field_getter;
 
 pub use column::*;
+pub use compacted::CompactedRow;
 pub use datum::*;
+pub use encode::KeyEncoder;
 
 pub trait BinaryRow: InternalRow {
     /// Returns the binary representation of this row as a byte slice.
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index c51539642b..9f9268e857 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -31,6 +31,7 @@ pub enum ApiKey {
     MetaData,
     ProduceLog,
     FetchLog,
+    Lookup,
     ListOffsets,
     GetFileSystemSecurityToken,
     GetDatabaseInfo,
@@ -53,6 +54,7 @@ impl From<i16> for ApiKey {
             1012 => ApiKey::MetaData,
             1014 => ApiKey::ProduceLog,
             1015 => ApiKey::FetchLog,
+            1017 => ApiKey::Lookup,
             1021 => ApiKey::ListOffsets,
             1025 => ApiKey::GetFileSystemSecurityToken,
             1032 => ApiKey::GetLatestLakeSnapshot,
@@ -77,6 +79,7 @@ impl From<ApiKey> for i16 {
             ApiKey::MetaData => 1012,
             ApiKey::ProduceLog => 1014,
             ApiKey::FetchLog => 1015,
+            ApiKey::Lookup => 1017,
             ApiKey::ListOffsets => 1021,
             ApiKey::GetFileSystemSecurityToken => 1025,
             ApiKey::GetLatestLakeSnapshot => 1032,
@@ -105,6 +108,7 @@ mod tests {
             (1012, ApiKey::MetaData),
             (1014, ApiKey::ProduceLog),
             (1015, ApiKey::FetchLog),
+            (1017, ApiKey::Lookup),
             (1021, ApiKey::ListOffsets),
             (1025, ApiKey::GetFileSystemSecurityToken),
             (1032, ApiKey::GetLatestLakeSnapshot),
diff --git a/fluss-rust/crates/fluss/src/rpc/message/lookup.rs b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
new file mode 100644
index 0000000000..3de47d64dd
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
@@ -0,0 +1,67 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::LookupResponse;
+use crate::rpc::frame::ReadError;
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::WriteError;
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use prost::Message;
+
+use bytes::{Buf, BufMut};
+
+pub struct LookupRequest {
+    pub inner_request: proto::LookupRequest,
+}
+
+impl LookupRequest {
+    pub fn new(
+        table_id: i64,
+        partition_id: Option<i64>,
+        bucket_id: i32,
+        keys: Vec<Vec<u8>>,
+    ) -> Self {
+        let bucket_req = proto::PbLookupReqForBucket {
+            partition_id,
+            bucket_id,
+            key: keys,
+        };
+
+        let request = proto::LookupRequest {
+            table_id,
+            buckets_req: vec![bucket_req],
+        };
+
+        Self {
+            inner_request: request,
+        }
+    }
+}
+
+impl RequestBody for LookupRequest {
+    type ResponseBody = LookupResponse;
+
+    const API_KEY: ApiKey = ApiKey::Lookup;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(LookupRequest);
+impl_read_version_type!(LookupResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index b619ee4023..2fe506bc37 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -34,6 +34,7 @@ mod header;
 mod list_databases;
 mod list_offsets;
 mod list_tables;
+mod lookup;
 mod produce_log;
 mod table_exists;
 mod update_metadata;
@@ -53,6 +54,7 @@ pub use header::*;
 pub use list_databases::*;
 pub use list_offsets::*;
 pub use list_tables::*;
+pub use lookup::*;
 pub use produce_log::*;
 pub use table_exists::*;
 pub use update_metadata::*;
diff --git a/fluss-rust/crates/fluss/src/util/varint.rs b/fluss-rust/crates/fluss/src/util/varint.rs
index 96fd1f50bf..83a75f6c37 100644
--- a/fluss-rust/crates/fluss/src/util/varint.rs
+++ b/fluss-rust/crates/fluss/src/util/varint.rs
@@ -364,12 +364,11 @@ mod tests {
             let mut reader = Cursor::new(&buffer);
             let read_value = read_unsigned_varint(&mut reader).unwrap();
 
-            assert_eq!(value, read_value, "Round trip failed for value {}", value);
+            assert_eq!(value, read_value, "Round trip failed for value {value}");
             assert_eq!(
                 written,
                 buffer.len(),
-                "Bytes written mismatch for value {}",
-                value
+                "Bytes written mismatch for value {value}"
             );
 
             // Test with BufMut
@@ -382,22 +381,19 @@ mod tests {
             assert_eq!(
                 calculated_size,
                 buffer.len(),
-                "Size calculation failed for value {}",
-                value
+                "Size calculation failed for value {value}"
             );
 
             // Test reading from bytes
             let (read_value_bytes, bytes_read) = read_unsigned_varint_bytes(&buffer).unwrap();
             assert_eq!(
                 value, read_value_bytes,
-                "Bytes read failed for value {}",
-                value
+                "Bytes read failed for value {value}"
             );
             assert_eq!(
                 bytes_read,
                 buffer.len(),
-                "Bytes read count mismatch for value {}",
-                value
+                "Bytes read count mismatch for value {value}"
             );
         }
     }

From 9ce10ce55d2978ab068b6e4f18b1b3b5f3195184 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 17 Jan 2026 01:53:30 +0000
Subject: [PATCH 070/287] feat: Introduce python bindings row-based append API
 (#142)

---
 fluss-rust/.gitignore                         |  11 +-
 fluss-rust/bindings/python/example/example.py |  14 +-
 fluss-rust/bindings/python/fluss/__init__.pyi |  26 ++
 fluss-rust/bindings/python/src/table.rs       | 250 ++++++++++++++++--
 4 files changed, 283 insertions(+), 18 deletions(-)

diff --git a/fluss-rust/.gitignore b/fluss-rust/.gitignore
index c6edfb706d..8202bbca02 100644
--- a/fluss-rust/.gitignore
+++ b/fluss-rust/.gitignore
@@ -17,4 +17,13 @@ Cargo.lock
 #  and can be added to the global gitignore or merged into this file.  For a more nuclear
 #  option (not recommended) you can uncomment the following to ignore the entire idea folder.
 .idea/
-.vscode/
\ No newline at end of file
+.vscode/
+
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+*.egg-info/
+dist/
+build/
\ No newline at end of file
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 0b1e67d3e6..f1f20d1503 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -118,11 +118,21 @@ async def main():
         append_writer.write_arrow_batch(pa_record_batch)
         print("Successfully wrote PyArrow RecordBatch")
 
-        # Test 3: Write Pandas DataFrame
+        # Test 3: Append single rows
+        print("\n--- Testing single row append ---")
+        # Dict input
+        await append_writer.append({"id": 8, "name": "Helen", "score": 93.5, "age": 26})
+        print("Successfully appended row (dict)")
+
+        # List input
+        await append_writer.append([9, "Ivan", 90.0, 31])
+        print("Successfully appended row (list)")
+
+        # Test 4: Write Pandas DataFrame
         print("\n--- Testing Pandas DataFrame write ---")
         df = pd.DataFrame(
             {
-                "id": [6, 7],
+                "id": [10, 11],
                 "name": ["Frank", "Grace"],
                 "score": [89.3, 94.7],
                 "age": [29, 27],
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 45652425ba..6073070c0d 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -68,6 +68,32 @@ class FlussTable:
     def __repr__(self) -> str: ...
 
 class AppendWriter:
+    async def append(self, row: dict | list | tuple) -> None:
+        """Append a single row to the table.
+
+        Args:
+            row: Dictionary mapping field names to values, or
+                 list/tuple of values in schema order
+
+        Supported Types:
+            Currently supports primitive types only:
+            - Boolean, TinyInt, SmallInt, Int, BigInt (integers)
+            - Float, Double (floating point)
+            - String, Char (text)
+            - Bytes, Binary (binary data)
+            - Null values
+
+            Temporal types (Date, Timestamp, Decimal) are not yet supported.
+
+        Example:
+            await writer.append({'id': 1, 'name': 'Alice', 'score': 95.5})
+            await writer.append([1, 'Alice', 95.5])
+
+        Note:
+            For high-throughput bulk loading, prefer write_arrow_batch().
+            Use flush() to ensure all queued records are sent and acknowledged.
+        """
+        ...
     def write_arrow(self, table: pa.Table) -> None: ...
     def write_arrow_batch(self, batch: pa.RecordBatch) -> None: ...
     def write_pandas(self, df: pd.DataFrame) -> None: ...
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 6cd13c4fa1..db85c51f5a 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -49,7 +49,7 @@ impl FlussTable {
         let table_info = self.table_info.clone();
 
         future_into_py(py, async move {
-            let fluss_table = fcore::client::FlussTable::new(&conn, metadata, table_info);
+            let fluss_table = fcore::client::FlussTable::new(&conn, metadata, table_info.clone());
 
             let table_append = fluss_table
                 .new_append()
@@ -57,7 +57,7 @@ impl FlussTable {
 
             let rust_writer = table_append.create_writer();
 
-            let py_writer = AppendWriter::from_core(rust_writer);
+            let py_writer = AppendWriter::from_core(rust_writer, table_info);
 
             Python::attach(|py| Py::new(py, py_writer))
         })
@@ -193,13 +193,14 @@ impl FlussTable {
 /// Writer for appending data to a Fluss table
 #[pyclass]
 pub struct AppendWriter {
-    inner: fcore::client::AppendWriter,
+    inner: Arc<fcore::client::AppendWriter>,
+    table_info: fcore::metadata::TableInfo,
 }
 
 #[pymethods]
 impl AppendWriter {
     /// Write Arrow table data
-    pub fn write_arrow(&mut self, py: Python, table: Py<PyAny>) -> PyResult<()> {
+    pub fn write_arrow(&self, py: Python, table: Py<PyAny>) -> PyResult<()> {
         // Convert Arrow Table to batches and write each batch
         let batches = table.call_method0(py, "to_batches")?;
         let batch_list: Vec<Py<PyAny>> = batches.extract(py)?;
@@ -211,22 +212,40 @@ impl AppendWriter {
     }
 
     /// Write Arrow batch data
-    pub fn write_arrow_batch(&mut self, py: Python, batch: Py<PyAny>) -> PyResult<()> {
+    pub fn write_arrow_batch(&self, py: Python, batch: Py<PyAny>) -> PyResult<()> {
         // This shares the underlying Arrow buffers without copying data
         let batch_bound = batch.bind(py);
         let rust_batch: RecordBatch = FromPyArrow::from_pyarrow_bound(batch_bound)
             .map_err(|e| FlussError::new_err(format!("Failed to convert RecordBatch: {e}")))?;
 
+        let inner = self.inner.clone();
         // Release the GIL before blocking on async operation
         let result = py.detach(|| {
-            TOKIO_RUNTIME.block_on(async { self.inner.append_arrow_batch(rust_batch).await })
+            TOKIO_RUNTIME.block_on(async { inner.append_arrow_batch(rust_batch).await })
         });
 
         result.map_err(|e| FlussError::new_err(e.to_string()))
     }
 
+    /// Append a single row to the table
+    pub fn append<'py>(
+        &self,
+        py: Python<'py>,
+        row: &Bound<'py, PyAny>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let generic_row = python_to_generic_row(row, &self.table_info)?;
+        let inner = self.inner.clone();
+
+        future_into_py(py, async move {
+            inner
+                .append(generic_row)
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))
+        })
+    }
+
     /// Write Pandas DataFrame data
-    pub fn write_pandas(&mut self, py: Python, df: Py<PyAny>) -> PyResult<()> {
+    pub fn write_pandas(&self, py: Python, df: Py<PyAny>) -> PyResult<()> {
         // Import pyarrow module
         let pyarrow = py.import("pyarrow")?;
 
@@ -241,12 +260,16 @@ impl AppendWriter {
     }
 
     /// Flush any pending data
-    pub fn flush(&mut self) -> PyResult<()> {
-        TOKIO_RUNTIME.block_on(async {
-            self.inner
-                .flush()
-                .await
-                .map_err(|e| FlussError::new_err(e.to_string()))
+    pub fn flush(&self, py: Python) -> PyResult<()> {
+        let inner = self.inner.clone();
+        // Release the GIL before blocking on I/O
+        py.detach(|| {
+            TOKIO_RUNTIME.block_on(async {
+                inner
+                    .flush()
+                    .await
+                    .map_err(|e| FlussError::new_err(e.to_string()))
+            })
         })
     }
 
@@ -257,8 +280,205 @@ impl AppendWriter {
 
 impl AppendWriter {
     /// Create a AppendWriter from a core append writer
-    pub fn from_core(append: fcore::client::AppendWriter) -> Self {
-        Self { inner: append }
+    pub fn from_core(
+        append: fcore::client::AppendWriter,
+        table_info: fcore::metadata::TableInfo,
+    ) -> Self {
+        Self {
+            inner: Arc::new(append),
+            table_info,
+        }
+    }
+}
+
+/// Represents different input shapes for a row
+#[derive(FromPyObject)]
+enum RowInput<'py> {
+    Dict(Bound<'py, pyo3::types::PyDict>),
+    Tuple(Bound<'py, pyo3::types::PyTuple>),
+    List(Bound<'py, pyo3::types::PyList>),
+}
+
+/// Helper function to process sequence types (list/tuple) into datums
+fn process_sequence_to_datums<'a, I>(
+    values: I,
+    len: usize,
+    fields: &[fcore::metadata::DataField],
+) -> PyResult<Vec<fcore::row::Datum<'static>>>
+where
+    I: Iterator<Item = Bound<'a, PyAny>>,
+{
+    if len != fields.len() {
+        return Err(FlussError::new_err(format!(
+            "Expected {} values, got {}",
+            fields.len(),
+            len
+        )));
+    }
+
+    let mut datums = Vec::with_capacity(fields.len());
+    for (i, (field, value)) in fields.iter().zip(values).enumerate() {
+        datums.push(
+            python_value_to_datum(&value, field.data_type()).map_err(|e| {
+                FlussError::new_err(format!("Field '{}' (index {}): {}", field.name(), i, e))
+            })?,
+        );
+    }
+    Ok(datums)
+}
+
+/// Convert Python row (dict/list/tuple) to GenericRow based on schema
+fn python_to_generic_row(
+    row: &Bound<PyAny>,
+    table_info: &fcore::metadata::TableInfo,
+) -> PyResult<fcore::row::GenericRow<'static>> {
+    // Extract with user-friendly error message
+    let row_input: RowInput = row.extract().map_err(|_| {
+        let type_name = row
+            .get_type()
+            .name()
+            .map(|n| n.to_string())
+            .unwrap_or_else(|_| "unknown".to_string());
+        FlussError::new_err(format!(
+            "Row must be a dict, list, or tuple; got {}",
+            type_name
+        ))
+    })?;
+    let schema = table_info.row_type();
+    let fields = schema.fields();
+
+    let datums = match row_input {
+        RowInput::Dict(dict) => {
+            // Strict: reject unknown keys (and also reject non-str keys nicely)
+            for (k, _) in dict.iter() {
+                let key_str = k.extract::<&str>().map_err(|_| {
+                    let key_type = k
+                        .get_type()
+                        .name()
+                        .map(|n| n.to_string())
+                        .unwrap_or_else(|_| "unknown".to_string());
+                    FlussError::new_err(format!("Row dict keys must be strings; got {}", key_type))
+                })?;
+
+                if fields.iter().all(|f| f.name() != key_str) {
+                    let expected = fields
+                        .iter()
+                        .map(|f| f.name())
+                        .collect::<Vec<_>>()
+                        .join(", ");
+                    return Err(FlussError::new_err(format!(
+                        "Unknown field '{}'. Expected fields: {}",
+                        key_str, expected
+                    )));
+                }
+            }
+
+            let mut datums = Vec::with_capacity(fields.len());
+            for field in fields {
+                let value = dict.get_item(field.name())?.ok_or_else(|| {
+                    FlussError::new_err(format!("Missing field: {}", field.name()))
+                })?;
+                datums.push(
+                    python_value_to_datum(&value, field.data_type()).map_err(|e| {
+                        FlussError::new_err(format!("Field '{}': {}", field.name(), e))
+                    })?,
+                );
+            }
+            datums
+        }
+
+        RowInput::List(list) => process_sequence_to_datums(list.iter(), list.len(), fields)?,
+
+        RowInput::Tuple(tuple) => process_sequence_to_datums(tuple.iter(), tuple.len(), fields)?,
+    };
+
+    Ok(fcore::row::GenericRow { values: datums })
+}
+
+/// Convert Python value to Datum based on data type
+fn python_value_to_datum(
+    value: &Bound<PyAny>,
+    data_type: &fcore::metadata::DataType,
+) -> PyResult<fcore::row::Datum<'static>> {
+    use fcore::row::{Datum, F32, F64};
+
+    if value.is_none() {
+        return Ok(Datum::Null);
+    }
+
+    match data_type {
+        fcore::metadata::DataType::Boolean(_) => {
+            let v: bool = value.extract()?;
+            Ok(Datum::Bool(v))
+        }
+        fcore::metadata::DataType::TinyInt(_) => {
+            // Strict type checking: reject bool for int columns
+            if value.is_instance_of::<pyo3::types::PyBool>() {
+                return Err(FlussError::new_err(
+                    "Expected int for TinyInt column, got bool. Use 0 or 1 explicitly.".to_string(),
+                ));
+            }
+            let v: i8 = value.extract()?;
+            Ok(Datum::Int8(v))
+        }
+        fcore::metadata::DataType::SmallInt(_) => {
+            if value.is_instance_of::<pyo3::types::PyBool>() {
+                return Err(FlussError::new_err(
+                    "Expected int for SmallInt column, got bool. Use 0 or 1 explicitly."
+                        .to_string(),
+                ));
+            }
+            let v: i16 = value.extract()?;
+            Ok(Datum::Int16(v))
+        }
+        fcore::metadata::DataType::Int(_) => {
+            if value.is_instance_of::<pyo3::types::PyBool>() {
+                return Err(FlussError::new_err(
+                    "Expected int for Int column, got bool. Use 0 or 1 explicitly.".to_string(),
+                ));
+            }
+            let v: i32 = value.extract()?;
+            Ok(Datum::Int32(v))
+        }
+        fcore::metadata::DataType::BigInt(_) => {
+            if value.is_instance_of::<pyo3::types::PyBool>() {
+                return Err(FlussError::new_err(
+                    "Expected int for BigInt column, got bool. Use 0 or 1 explicitly.".to_string(),
+                ));
+            }
+            let v: i64 = value.extract()?;
+            Ok(Datum::Int64(v))
+        }
+        fcore::metadata::DataType::Float(_) => {
+            let v: f32 = value.extract()?;
+            Ok(Datum::Float32(F32::from(v)))
+        }
+        fcore::metadata::DataType::Double(_) => {
+            let v: f64 = value.extract()?;
+            Ok(Datum::Float64(F64::from(v)))
+        }
+        fcore::metadata::DataType::String(_) | fcore::metadata::DataType::Char(_) => {
+            let v: String = value.extract()?;
+            Ok(v.into())
+        }
+        fcore::metadata::DataType::Bytes(_) | fcore::metadata::DataType::Binary(_) => {
+            // Efficient extraction: downcast to specific type and use bulk copy.
+            // PyBytes::as_bytes() only borrows the buffer; the single O(n) bulk copy in each branch is to_vec().
+            if let Ok(bytes) = value.downcast::<pyo3::types::PyBytes>() {
+                Ok(bytes.as_bytes().to_vec().into())
+            } else if let Ok(bytearray) = value.downcast::<pyo3::types::PyByteArray>() {
+                Ok(bytearray.to_vec().into())
+            } else {
+                Err(FlussError::new_err(format!(
+                    "Expected bytes or bytearray, got {}",
+                    value.get_type().name()?
+                )))
+            }
+        }
+        _ => Err(FlussError::new_err(format!(
+            "Unsupported data type for row-level operations: {:?}",
+            data_type
+        ))),
     }
 }
 

From a4409833d235dfec67b3004136bf0ffa155b543c Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Sat, 17 Jan 2026 14:33:57 +0800
Subject: [PATCH 071/287] chore: Improve read path error handling logic (#143)

---
 .../src/client/table/log_fetch_buffer.rs      | 378 ++++++++++-
 .../fluss/src/client/table/remote_log.rs      |   2 +-
 .../crates/fluss/src/client/table/scanner.rs  | 628 ++++++++++++++----
 .../crates/fluss/src/client/write/sender.rs   |   2 +-
 fluss-rust/crates/fluss/src/error.rs          |   5 +
 fluss-rust/crates/fluss/src/record/arrow.rs   |  67 +-
 fluss-rust/crates/fluss/src/record/mod.rs     |  62 ++
 fluss-rust/crates/fluss/src/row/column.rs     |  64 ++
 .../fluss/src/rpc/message/list_offsets.rs     |  52 +-
 fluss-rust/crates/fluss/src/util/mod.rs       |  54 ++
 10 files changed, 1122 insertions(+), 192 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index c55c994b03..fb6981f4b5 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -18,7 +18,7 @@
 use arrow::array::RecordBatch;
 use parking_lot::Mutex;
 
-use crate::error::Result;
+use crate::error::{ApiError, Error, Result};
 use crate::metadata::TableBucket;
 use crate::record::{
     LogRecordBatch, LogRecordIterator, LogRecordsBatches, ReadContext, ScanRecord,
@@ -29,12 +29,38 @@ use std::sync::atomic::{AtomicBool, Ordering};
 use std::time::Duration;
 use tokio::sync::Notify;
 
+#[derive(Clone, Copy, Debug, PartialEq, Eq)]
+pub(crate) enum FetchErrorAction {
+    Ignore,
+    LogOffsetOutOfRange,
+    Authorization,
+    CorruptMessage,
+    Unexpected,
+}
+
+#[derive(Clone, Copy, Debug, PartialEq, Eq)]
+pub(crate) enum FetchErrorLogLevel {
+    Debug,
+    Warn,
+}
+
+#[derive(Clone, Debug)]
+pub(crate) struct FetchErrorContext {
+    pub(crate) action: FetchErrorAction,
+    pub(crate) log_level: FetchErrorLogLevel,
+    pub(crate) log_message: String,
+}
+
 /// Represents a completed fetch that can be consumed
 pub trait CompletedFetch: Send + Sync {
     fn table_bucket(&self) -> &TableBucket;
+    fn api_error(&self) -> Option<&ApiError>;
+    fn fetch_error_context(&self) -> Option<&FetchErrorContext>;
+    fn take_error(&mut self) -> Option<Error>;
     fn fetch_records(&mut self, max_records: usize) -> Result<Vec<ScanRecord>>;
     fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<RecordBatch>>;
     fn is_consumed(&self) -> bool;
+    fn records_read(&self) -> usize;
     fn drain(&mut self);
     fn size_in_bytes(&self) -> usize;
     fn high_watermark(&self) -> i64;
@@ -52,6 +78,7 @@ pub trait PendingFetch: Send + Sync {
 
 /// Thread-safe buffer for completed fetches
 pub struct LogFetchBuffer {
+    read_context: ReadContext,
     completed_fetches: Mutex<VecDeque<Box<dyn CompletedFetch>>>,
     pending_fetches: Mutex<HashMap<TableBucket, VecDeque<Box<dyn PendingFetch>>>>,
     next_in_line_fetch: Mutex<Option<Box<dyn CompletedFetch>>>,
@@ -60,8 +87,9 @@ pub struct LogFetchBuffer {
 }
 
 impl LogFetchBuffer {
-    pub fn new() -> Self {
+    pub fn new(read_context: ReadContext) -> Self {
         Self {
+            read_context,
             completed_fetches: Mutex::new(VecDeque::new()),
             pending_fetches: Mutex::new(HashMap::new()),
             next_in_line_fetch: Mutex::new(None),
@@ -75,26 +103,28 @@ impl LogFetchBuffer {
         self.completed_fetches.lock().is_empty()
     }
 
-    /// Wait for the buffer to become non-empty, with timeout
-    /// Returns true if data became available, false if timeout
-    pub async fn await_not_empty(&self, timeout: Duration) -> bool {
+    /// Wait for the buffer to become non-empty, with timeout.
+    /// Returns `Ok(true)` if data became available, `Ok(false)` on timeout, or `Err(Error::WakeupError)` if woken up.
+    pub async fn await_not_empty(&self, timeout: Duration) -> Result<bool> {
         let deadline = std::time::Instant::now() + timeout;
 
         loop {
             // Check if buffer is not empty
             if !self.is_empty() {
-                return true;
+                return Ok(true);
             }
 
             // Check if woken up
             if self.woken_up.swap(false, Ordering::Acquire) {
-                return true;
+                return Err(Error::WakeupError {
+                    message: "The await operation was interrupted by wakeup.".to_string(),
+                });
             }
 
             // Check if timeout
             let now = std::time::Instant::now();
             if now >= deadline {
-                return false;
+                return Ok(false);
             }
 
             // Wait for notification with remaining time
@@ -102,7 +132,7 @@ impl LogFetchBuffer {
             let notified = self.not_empty_notify.notified();
             tokio::select! {
                 _ = tokio::time::sleep(remaining) => {
-                    return false; // Timeout
+                    return Ok(false); // Timeout
                 }
                 _ = notified => {
                     // Got notification, check again
@@ -119,6 +149,26 @@ impl LogFetchBuffer {
         self.not_empty_notify.notify_waiters();
     }
 
+    pub(crate) fn add_api_error(
+        &self,
+        table_bucket: TableBucket,
+        api_error: ApiError,
+        fetch_error_context: FetchErrorContext,
+        fetch_offset: i64,
+    ) {
+        let error_fetch = DefaultCompletedFetch::from_api_error(
+            table_bucket,
+            api_error,
+            fetch_error_context,
+            fetch_offset,
+            self.read_context.clone(),
+        );
+        self.completed_fetches
+            .lock()
+            .push_back(Box::new(error_fetch));
+        self.not_empty_notify.notify_waiters();
+    }
+
     /// Add a pending fetch to the buffer
     pub fn pend(&self, pending_fetch: Box<dyn PendingFetch>) {
         let table_bucket = pending_fetch.table_bucket().clone();
@@ -136,6 +186,7 @@ impl LogFetchBuffer {
         // holding both locks simultaneously.
         let mut completed_to_push: Vec<Box<dyn CompletedFetch>> = Vec::new();
         let mut has_completed = false;
+        let mut pending_error: Option<Error> = None;
         {
             let mut pending_map = self.pending_fetches.lock();
             if let Some(pendings) = pending_map.get_mut(table_bucket) {
@@ -148,8 +199,9 @@ impl LogFetchBuffer {
                                 has_completed = true;
                             }
                             Err(e) => {
-                                // todo: handle exception?
-                                log::error!("Error when completing: {e}");
+                                pending_error = Some(e);
+                                has_completed = true;
+                                break;
                             }
                         }
                     } else {
@@ -162,11 +214,22 @@ impl LogFetchBuffer {
             }
         }
 
+        if let Some(error) = pending_error {
+            let error_fetch = DefaultCompletedFetch::from_error(
+                table_bucket.clone(),
+                error,
+                -1,
+                self.read_context.clone(),
+            );
+            completed_to_push.push(Box::new(error_fetch));
+        }
+
         if !completed_to_push.is_empty() {
             let mut completed_queue = self.completed_fetches.lock();
             for completed in completed_to_push {
                 completed_queue.push_back(completed);
             }
+            has_completed = true;
         }
 
         if has_completed {
@@ -236,12 +299,6 @@ impl LogFetchBuffer {
     }
 }
 
-impl Default for LogFetchBuffer {
-    fn default() -> Self {
-        Self::new()
-    }
-}
-
 /// A wrapper that makes a completed fetch look like a pending fetch
 struct CompletedPendingFetch {
     completed_fetch: Box<dyn CompletedFetch>,
@@ -270,6 +327,9 @@ impl PendingFetch for CompletedPendingFetch {
 /// Default implementation of CompletedFetch for in-memory log records
 pub struct DefaultCompletedFetch {
     table_bucket: TableBucket,
+    api_error: Option<ApiError>,
+    fetch_error_context: Option<FetchErrorContext>,
+    error: Option<Error>,
     log_record_batch: LogRecordsBatches,
     read_context: ReadContext,
     next_fetch_offset: i64,
@@ -280,6 +340,9 @@ pub struct DefaultCompletedFetch {
     records_read: usize,
     current_record_iterator: Option<LogRecordIterator>,
     current_record_batch: Option<LogRecordBatch>,
+    last_record: Option<ScanRecord>,
+    cached_record_error: Option<String>,
+    corrupt_last_record: bool,
 }
 
 impl DefaultCompletedFetch {
@@ -290,9 +353,12 @@ impl DefaultCompletedFetch {
         read_context: ReadContext,
         fetch_offset: i64,
         high_watermark: i64,
-    ) -> Result<Self> {
-        Ok(Self {
+    ) -> Self {
+        Self {
             table_bucket,
+            api_error: None,
+            fetch_error_context: None,
+            error: None,
             log_record_batch,
             read_context,
             next_fetch_offset: fetch_offset,
@@ -303,7 +369,65 @@ impl DefaultCompletedFetch {
             records_read: 0,
             current_record_iterator: None,
             current_record_batch: None,
-        })
+            last_record: None,
+            cached_record_error: None,
+            corrupt_last_record: false,
+        }
+    }
+
+    pub(crate) fn from_error(
+        table_bucket: TableBucket,
+        error: Error,
+        fetch_offset: i64,
+        read_context: ReadContext,
+    ) -> Self {
+        Self {
+            table_bucket,
+            api_error: None,
+            fetch_error_context: None,
+            error: Some(error),
+            log_record_batch: LogRecordsBatches::new(Vec::new()),
+            read_context,
+            next_fetch_offset: fetch_offset,
+            high_watermark: -1,
+            size_in_bytes: 0,
+            consumed: false,
+            initialized: false,
+            records_read: 0,
+            current_record_iterator: None,
+            current_record_batch: None,
+            last_record: None,
+            cached_record_error: None,
+            corrupt_last_record: false,
+        }
+    }
+
+    pub(crate) fn from_api_error(
+        table_bucket: TableBucket,
+        api_error: ApiError,
+        fetch_error_context: FetchErrorContext,
+        fetch_offset: i64,
+        read_context: ReadContext,
+    ) -> Self {
+        Self {
+            table_bucket,
+            api_error: Some(api_error),
+            fetch_error_context: Some(fetch_error_context),
+            error: None,
+            log_record_batch: LogRecordsBatches::new(Vec::new()),
+            read_context,
+            next_fetch_offset: fetch_offset,
+            high_watermark: -1,
+            size_in_bytes: 0,
+            consumed: false,
+            initialized: false,
+            records_read: 0,
+            current_record_iterator: None,
+            current_record_batch: None,
+            last_record: None,
+            cached_record_error: None,
+            corrupt_last_record: false,
+        }
     }
 
     /// Get the next fetched record, handling batch iteration and record skipping
@@ -330,6 +454,19 @@ impl DefaultCompletedFetch {
         }
     }
 
+    /// Builds the `UnexpectedError` for an unreadable record, appending the cached cause when one exists.
+    fn fetch_error(&self) -> Error {
+        let cause = self.cached_record_error.as_deref();
+        let message = format!(
+            "Received exception when fetching the next record from {table_bucket}. If needed, please seek past the record to continue scanning.{cause_suffix}",
+            table_bucket = self.table_bucket,
+            cause_suffix = cause.map(|c| format!(" Cause: {c}")).unwrap_or_default()
+        );
+        Error::UnexpectedError {
+            message,
+            source: None,
+        }
+    }
     /// Get the next batch directly without row iteration
     fn next_fetched_batch(&mut self) -> Result<Option<RecordBatch>> {
         loop {
@@ -368,8 +505,36 @@ impl CompletedFetch for DefaultCompletedFetch {
         &self.table_bucket
     }
 
+    fn api_error(&self) -> Option<&ApiError> {
+        self.api_error.as_ref()
+    }
+
+    fn fetch_error_context(&self) -> Option<&FetchErrorContext> {
+        self.fetch_error_context.as_ref()
+    }
+
+    fn take_error(&mut self) -> Option<Error> {
+        self.error.take()
+    }
+
     fn fetch_records(&mut self, max_records: usize) -> Result<Vec<ScanRecord>> {
-        // todo: handle corrupt_last_record
+        if let Some(error) = self.error.take() {
+            return Err(error);
+        }
+
+        if let Some(api_error) = self.api_error.as_ref() {
+            return Err(Error::FlussAPIError {
+                api_error: ApiError {
+                    code: api_error.code,
+                    message: api_error.message.clone(),
+                },
+            });
+        }
+
+        if self.corrupt_last_record {
+            return Err(self.fetch_error());
+        }
+
         if self.consumed {
             return Ok(Vec::new());
         }
@@ -377,19 +542,53 @@ impl CompletedFetch for DefaultCompletedFetch {
         let mut scan_records = Vec::new();
 
         for _ in 0..max_records {
-            if let Some(record) = self.next_fetched_record()? {
-                self.next_fetch_offset = record.offset() + 1;
-                self.records_read += 1;
-                scan_records.push(record);
-            } else {
-                break;
+            if self.cached_record_error.is_none() {
+                self.corrupt_last_record = true;
+                match self.next_fetched_record() {
+                    Ok(Some(record)) => {
+                        self.corrupt_last_record = false;
+                        self.last_record = Some(record);
+                    }
+                    Ok(None) => {
+                        self.corrupt_last_record = false;
+                        self.last_record = None;
+                    }
+                    Err(e) => {
+                        self.cached_record_error = Some(e.to_string());
+                    }
+                }
             }
+
+            let Some(record) = self.last_record.take() else {
+                break;
+            };
+
+            self.next_fetch_offset = record.offset() + 1;
+            self.records_read += 1;
+            scan_records.push(record);
+        }
+
+        if self.cached_record_error.is_some() && scan_records.is_empty() {
+            return Err(self.fetch_error());
         }
 
         Ok(scan_records)
     }
 
     fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<RecordBatch>> {
+        if let Some(error) = self.error.take() {
+            return Err(error);
+        }
+
+        if let Some(api_error) = self.api_error.as_ref() {
+            return Err(Error::FlussAPIError {
+                api_error: ApiError {
+                    code: api_error.code,
+                    message: api_error.message.clone(),
+                },
+            });
+        }
+
         if self.consumed {
             return Ok(Vec::new());
         }
@@ -410,8 +609,18 @@ impl CompletedFetch for DefaultCompletedFetch {
         self.consumed
     }
 
+    fn records_read(&self) -> usize {
+        self.records_read
+    }
+
     fn drain(&mut self) {
         self.consumed = true;
+        self.api_error = None;
+        self.fetch_error_context = None;
+        self.error = None;
+        self.cached_record_error = None;
+        self.corrupt_last_record = false;
+        self.last_record = None;
     }
 
     fn size_in_bytes(&self) -> usize {
@@ -434,3 +643,118 @@ impl CompletedFetch for DefaultCompletedFetch {
         self.next_fetch_offset
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::client::WriteRecord;
+    use crate::compression::{
+        ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+    };
+    use crate::metadata::{DataField, DataTypes, TablePath};
+    use crate::record::{MemoryLogRecordsArrowBuilder, ReadContext, to_arrow_schema};
+    use crate::row::GenericRow;
+    use std::sync::Arc;
+    use std::time::Duration;
+
+    fn test_read_context() -> ReadContext {
+        let row_type = DataTypes::row(vec![DataField::new(
+            "id".to_string(),
+            DataTypes::int(),
+            None,
+        )]);
+        ReadContext::new(to_arrow_schema(&row_type), false)
+    }
+
+    struct ErrorPendingFetch {
+        table_bucket: TableBucket,
+    }
+
+    impl PendingFetch for ErrorPendingFetch {
+        fn table_bucket(&self) -> &TableBucket {
+            &self.table_bucket
+        }
+
+        fn is_completed(&self) -> bool {
+            true
+        }
+
+        fn to_completed_fetch(self: Box<Self>) -> Result<Box<dyn CompletedFetch>> {
+            Err(Error::UnexpectedError {
+                message: "pending fetch failure".to_string(),
+                source: None,
+            })
+        }
+    }
+
+    #[tokio::test]
+    async fn await_not_empty_returns_wakeup_error() {
+        let buffer = LogFetchBuffer::new(test_read_context());
+        buffer.wakeup();
+
+        let result = buffer.await_not_empty(Duration::from_millis(10)).await;
+        assert!(matches!(result, Err(Error::WakeupError { .. })));
+    }
+
+    #[tokio::test]
+    async fn await_not_empty_returns_pending_error() {
+        let buffer = LogFetchBuffer::new(test_read_context());
+        let table_bucket = TableBucket::new(1, 0);
+        buffer.pend(Box::new(ErrorPendingFetch {
+            table_bucket: table_bucket.clone(),
+        }));
+        buffer.try_complete(&table_bucket);
+
+        let result = buffer.await_not_empty(Duration::from_millis(10)).await;
+        assert!(matches!(result, Ok(true)));
+
+        let mut completed = buffer.poll().expect("completed fetch");
+        assert!(completed.take_error().is_some());
+    }
+
+    #[test]
+    fn default_completed_fetch_reads_records() -> Result<()> {
+        let row_type = DataTypes::row(vec![
+            DataField::new("id".to_string(), DataTypes::int(), None),
+            DataField::new("name".to_string(), DataTypes::string(), None),
+        ]);
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+
+        let mut builder = MemoryLogRecordsArrowBuilder::new(
+            1,
+            &row_type,
+            false,
+            ArrowCompressionInfo {
+                compression_type: ArrowCompressionType::None,
+                compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+            },
+        );
+
+        let mut row = GenericRow::new();
+        row.set_field(0, 1_i32);
+        row.set_field(1, "alice");
+        let record = WriteRecord::new(table_path, row);
+        builder.append(&record)?;
+
+        let data = builder.build()?;
+        let log_records = LogRecordsBatches::new(data.clone());
+        let read_context = ReadContext::new(to_arrow_schema(&row_type), false);
+        let mut fetch = DefaultCompletedFetch::new(
+            TableBucket::new(1, 0),
+            log_records,
+            data.len(),
+            read_context,
+            0,
+            0,
+        );
+
+        let records = fetch.fetch_records(10)?;
+        assert_eq!(records.len(), 1);
+        assert_eq!(records[0].offset(), 0);
+
+        let empty = fetch.fetch_records(10)?;
+        assert!(empty.is_empty());
+
+        Ok(())
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index d9abd19c29..0142515783 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -409,7 +409,7 @@ impl PendingFetch for RemotePendingFetch {
             self.read_context,
             self.fetch_offset,
             self.high_watermark,
-        )?;
+        );
 
         Ok(Box::new(completed_fetch))
     }
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 7d22324d6b..3e7d61ff99 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -17,7 +17,7 @@
 
 use arrow::array::RecordBatch;
 use arrow_schema::SchemaRef;
-use log::{debug, error, warn};
+use log::{debug, warn};
 use parking_lot::{Mutex, RwLock};
 use std::collections::{HashMap, HashSet};
 use std::slice::from_ref;
@@ -29,16 +29,17 @@ use crate::client::connection::FlussConnection;
 use crate::client::credentials::CredentialsCache;
 use crate::client::metadata::Metadata;
 use crate::client::table::log_fetch_buffer::{
-    CompletedFetch, DefaultCompletedFetch, LogFetchBuffer,
+    CompletedFetch, DefaultCompletedFetch, FetchErrorAction, FetchErrorContext, FetchErrorLogLevel,
+    LogFetchBuffer,
 };
 use crate::client::table::remote_log::{
     RemoteLogDownloader, RemoteLogFetchInfo, RemotePendingFetch,
 };
-use crate::error::{Error, Result, RpcError};
+use crate::error::{ApiError, Error, FlussError, Result};
 use crate::metadata::{TableBucket, TableInfo, TablePath};
-use crate::proto::{FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
+use crate::proto::{ErrorResponse, FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
 use crate::record::{LogRecordsBatches, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
-use crate::rpc::{RpcClient, message};
+use crate::rpc::{RpcClient, RpcError, message};
 use crate::util::FairBucketStatusMap;
 
 const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
@@ -318,7 +319,7 @@ impl LogScannerInner {
                 .log_fetcher
                 .log_fetch_buffer
                 .await_not_empty(remaining)
-                .await;
+                .await?;
 
             if !has_data {
                 // Timeout while waiting
@@ -396,7 +397,7 @@ impl LogScannerInner {
                 .log_fetcher
                 .log_fetch_buffer
                 .await_not_empty(remaining)
-                .await;
+                .await?;
 
             if !has_data {
                 return Ok(Vec::new());
@@ -448,6 +449,8 @@ impl RecordBatchLogScanner {
 struct LogFetcher {
     conns: Arc<RpcClient>,
     metadata: Arc<Metadata>,
+    table_path: TablePath,
+    is_partitioned: bool,
     log_scanner_status: Arc<LogScannerStatus>,
     read_context: ReadContext,
     remote_read_context: ReadContext,
@@ -457,8 +460,6 @@ struct LogFetcher {
     credentials_cache: Arc<CredentialsCache>,
     log_fetch_buffer: Arc<LogFetchBuffer>,
     nodes_with_pending_fetch_requests: Arc<Mutex<HashSet<i32>>>,
-    table_path: TablePath,
-    is_partitioned: bool,
 }
 
 impl LogFetcher {
@@ -471,24 +472,25 @@ impl LogFetcher {
     ) -> Result<Self> {
         let full_arrow_schema = to_arrow_schema(table_info.get_row_type());
         let read_context =
-            Self::create_read_context(full_arrow_schema.clone(), projected_fields.clone(), false);
+            Self::create_read_context(full_arrow_schema.clone(), projected_fields.clone(), false)?;
         let remote_read_context =
-            Self::create_read_context(full_arrow_schema, projected_fields.clone(), true);
+            Self::create_read_context(full_arrow_schema, projected_fields.clone(), true)?;
 
         let tmp_dir = TempDir::with_prefix("fluss-remote-logs")?;
+        let log_fetch_buffer = Arc::new(LogFetchBuffer::new(read_context.clone()));
 
         Ok(LogFetcher {
             conns: conns.clone(),
             metadata: metadata.clone(),
+            table_path: table_info.table_path.clone(),
+            is_partitioned: table_info.is_partitioned(),
             log_scanner_status,
             read_context,
             remote_read_context,
             remote_log_downloader: Arc::new(RemoteLogDownloader::new(tmp_dir)?),
             credentials_cache: Arc::new(CredentialsCache::new(conns.clone(), metadata.clone())),
-            log_fetch_buffer: Arc::new(LogFetchBuffer::new()),
+            log_fetch_buffer,
             nodes_with_pending_fetch_requests: Arc::new(Mutex::new(HashSet::new())),
-            table_path: table_info.table_path.clone(),
-            is_partitioned: table_info.is_partitioned(),
         })
     }
 
@@ -496,23 +498,79 @@ impl LogFetcher {
         full_arrow_schema: SchemaRef,
         projected_fields: Option<Vec<usize>>,
         is_from_remote: bool,
-    ) -> ReadContext {
+    ) -> Result<ReadContext> {
         match projected_fields {
-            None => ReadContext::new(full_arrow_schema, is_from_remote),
+            None => Ok(ReadContext::new(full_arrow_schema, is_from_remote)),
             Some(fields) => {
                 ReadContext::with_projection_pushdown(full_arrow_schema, fields, is_from_remote)
             }
         }
     }
 
-    async fn check_and_update_metadata(&self) -> Result<()> {
-        if self.is_partitioned {
-            // TODO: Implement partition-aware metadata refresh for buckets whose leaders are unknown.
-            // The implementation will likely need to collect partition IDs for such buckets and
-            // perform targeted metadata updates. Until then, we avoid computing unused partition_ids.
-            return Ok(());
+    fn describe_fetch_error(
+        error: FlussError,
+        table_bucket: &TableBucket,
+        fetch_offset: i64,
+        error_message: &str,
+    ) -> FetchErrorContext {
+        match error {
+            FlussError::NotLeaderOrFollower
+            | FlussError::LogStorageException
+            | FlussError::KvStorageException
+            | FlussError::StorageException
+            | FlussError::FencedLeaderEpochException => FetchErrorContext {
+                action: FetchErrorAction::Ignore,
+                log_level: FetchErrorLogLevel::Debug,
+                log_message: format!(
+                    "Error in fetch for bucket {table_bucket}: {error:?}: {error_message}"
+                ),
+            },
+            FlussError::UnknownTableOrBucketException => FetchErrorContext {
+                action: FetchErrorAction::Ignore,
+                log_level: FetchErrorLogLevel::Warn,
+                log_message: format!(
+                    "Received unknown table or bucket error in fetch for bucket {table_bucket}"
+                ),
+            },
+            FlussError::LogOffsetOutOfRangeException => FetchErrorContext {
+                action: FetchErrorAction::LogOffsetOutOfRange,
+                log_level: FetchErrorLogLevel::Debug,
+                log_message: format!(
+                    "The fetching offset {fetch_offset} is out of range for bucket {table_bucket}: {error_message}"
+                ),
+            },
+            FlussError::AuthorizationException => FetchErrorContext {
+                action: FetchErrorAction::Authorization,
+                log_level: FetchErrorLogLevel::Debug,
+                log_message: format!(
+                    "Authorization error while fetching offset {fetch_offset} for bucket {table_bucket}: {error_message}"
+                ),
+            },
+            FlussError::UnknownServerError => FetchErrorContext {
+                action: FetchErrorAction::Ignore,
+                log_level: FetchErrorLogLevel::Warn,
+                log_message: format!(
+                    "Unknown server error while fetching offset {fetch_offset} for bucket {table_bucket}: {error_message}"
+                ),
+            },
+            FlussError::CorruptMessage => FetchErrorContext {
+                action: FetchErrorAction::CorruptMessage,
+                log_level: FetchErrorLogLevel::Debug,
+                log_message: format!(
+                    "Encountered corrupt message when fetching offset {fetch_offset} for bucket {table_bucket}: {error_message}"
+                ),
+            },
+            _ => FetchErrorContext {
+                action: FetchErrorAction::Unexpected,
+                log_level: FetchErrorLogLevel::Debug,
+                log_message: format!(
+                    "Unexpected error code {error:?} while fetching at offset {fetch_offset} from bucket {table_bucket}: {error_message}"
+                ),
+            },
         }
+    }
 
+    async fn check_and_update_metadata(&self) -> Result<()> {
         let need_update = self
             .fetchable_buckets()
             .iter()
@@ -522,6 +580,26 @@ impl LogFetcher {
             return Ok(());
         }
 
+        if self.is_partitioned {
+            // Fallback to full table metadata refresh until partition-aware updates are available.
+            self.metadata
+                .update_tables_metadata(&HashSet::from([&self.table_path]))
+                .await
+                .or_else(|e| {
+                    if let Error::RpcError { source, .. } = &e
+                        && matches!(source, RpcError::ConnectionError(_) | RpcError::Poisoned(_))
+                    {
+                        warn!(
+                            "Retrying after encountering error while updating table metadata: {e}"
+                        );
+                        Ok(())
+                    } else {
+                        Err(e)
+                    }
+                })?;
+            return Ok(());
+        }
+
         // TODO: Handle PartitionNotExist error
         self.metadata
             .update_tables_metadata(&HashSet::from([&self.table_path]))
@@ -561,7 +639,6 @@ impl LogFetcher {
             let creds_cache = self.credentials_cache.clone();
             let nodes_with_pending = self.nodes_with_pending_fetch_requests.clone();
             let metadata = self.metadata.clone();
-
             // Spawn async task to handle the fetch request
             // Note: These tasks are not explicitly tracked or cancelled when LogFetcher is dropped.
             // This is acceptable because:
@@ -607,7 +684,7 @@ impl LogFetcher {
                     }
                 };
 
-                if let Err(e) = Self::handle_fetch_response(
+                Self::handle_fetch_response(
                     fetch_response,
                     &log_fetch_buffer,
                     &log_scanner_status,
@@ -616,10 +693,7 @@ impl LogFetcher {
                     &remote_log_downloader,
                     &creds_cache,
                 )
-                .await
-                {
-                    error!("Fail to handle fetch response: {e:?}");
-                }
+                .await;
             });
         }
 
@@ -644,7 +718,7 @@ impl LogFetcher {
         remote_read_context: &ReadContext,
         remote_log_downloader: &Arc<RemoteLogDownloader>,
         credentials_cache: &Arc<CredentialsCache>,
-    ) -> Result<()> {
+    ) {
         for pb_fetch_log_resp in fetch_response.tables_resp {
             let table_id = pb_fetch_log_resp.table_id;
             let fetch_log_for_buckets = pb_fetch_log_resp.buckets_resp;
@@ -661,11 +735,55 @@ impl LogFetcher {
                     continue;
                 };
 
+                if let Some(error_code) = fetch_log_for_bucket.error_code
+                    && error_code != FlussError::None.code()
+                {
+                    let api_error: ApiError = ErrorResponse {
+                        error_code,
+                        error_message: fetch_log_for_bucket.error_message.clone(),
+                    }
+                    .into();
+
+                    let error = FlussError::for_code(error_code);
+                    let error_context = Self::describe_fetch_error(
+                        error,
+                        &table_bucket,
+                        fetch_offset,
+                        api_error.message.as_str(),
+                    );
+                    log_scanner_status.move_bucket_to_end(table_bucket.clone());
+                    match error_context.log_level {
+                        FetchErrorLogLevel::Debug => {
+                            debug!("{}", error_context.log_message);
+                        }
+                        FetchErrorLogLevel::Warn => {
+                            warn!("{}", error_context.log_message);
+                        }
+                    }
+                    log_fetch_buffer.add_api_error(
+                        table_bucket.clone(),
+                        api_error,
+                        error_context,
+                        fetch_offset,
+                    );
+                    continue;
+                }
+
                 // Check if this is a remote log fetch
                 if let Some(ref remote_log_fetch_info) = fetch_log_for_bucket.remote_log_fetch_info
                 {
                     // set remote fs props
-                    let remote_fs_props = credentials_cache.get_or_refresh().await?;
+                    let remote_fs_props = match credentials_cache.get_or_refresh().await {
+                        Ok(props) => props,
+                        Err(e) => {
+                            // This function no longer returns a Result, so report the
+                            // failure and skip this bucket instead of panicking.
+                            warn!(
+                                "Failed to refresh remote filesystem credentials for bucket {table_bucket}: {e:?}"
+                            );
+                            continue;
+                        }
+                    };
                     remote_log_downloader.set_remote_fs_props(remote_fs_props);
 
                     let remote_fetch_info =
@@ -688,26 +796,18 @@ impl LogFetcher {
                     let size_in_bytes = records.len();
                     let log_record_batch = LogRecordsBatches::new(records);
 
-                    match DefaultCompletedFetch::new(
+                    let completed_fetch = DefaultCompletedFetch::new(
                         table_bucket.clone(),
                         log_record_batch,
                         size_in_bytes,
                         read_context.clone(),
                         fetch_offset,
                         high_watermark,
-                    ) {
-                        Ok(completed_fetch) => {
-                            log_fetch_buffer.add(Box::new(completed_fetch));
-                        }
-                        Err(e) => {
-                            // todo: handle error
-                            log::warn!("Failed to create completed fetch: {e:?}");
-                        }
-                    }
+                    );
+                    log_fetch_buffer.add(Box::new(completed_fetch));
                 }
             }
         }
-        Ok(())
     }
 
     fn pending_remote_fetches(
@@ -763,69 +863,94 @@ impl LogFetcher {
         let mut result: HashMap<TableBucket, Vec<ScanRecord>> = HashMap::new();
         let mut records_remaining = MAX_POLL_RECORDS;
 
-        while records_remaining > 0 {
-            // Get the next in line fetch, or get a new one from buffer
-            let next_in_line = self.log_fetch_buffer.next_in_line_fetch();
-
-            if next_in_line.is_none() || next_in_line.as_ref().unwrap().is_consumed() {
-                // Get a new fetch from buffer
-                if let Some(completed_fetch) = self.log_fetch_buffer.poll() {
-                    // Initialize the fetch if not already initialized
-                    if !completed_fetch.is_initialized() {
-                        let size_in_bytes = completed_fetch.size_in_bytes();
-                        match self.initialize_fetch(completed_fetch) {
-                            Ok(initialized) => {
-                                self.log_fetch_buffer.set_next_in_line_fetch(initialized);
-                                continue;
+        // Run the loop inside an immediately-invoked closure: in a plain block,
+        // `return Err(..)` would leave the whole function and skip the match
+        // below, dropping records that were collected before the failure.
+        let collect_result: Result<()> = (|| -> Result<()> {
+            while records_remaining > 0 {
+                // Get the next in line fetch, or get a new one from buffer
+                let next_in_line = self.log_fetch_buffer.next_in_line_fetch();
+
+                if next_in_line.is_none() || next_in_line.as_ref().unwrap().is_consumed() {
+                    // Get a new fetch from buffer
+                    if let Some(completed_fetch) = self.log_fetch_buffer.poll() {
+                        // Initialize the fetch if not already initialized
+                        if !completed_fetch.is_initialized() {
+                            let size_in_bytes = completed_fetch.size_in_bytes();
+                            match self.initialize_fetch(completed_fetch) {
+                                Ok(initialized) => {
+                                    self.log_fetch_buffer.set_next_in_line_fetch(initialized);
+                                    continue;
+                                }
+                                Err(e) => {
+                                    // Remove a completedFetch upon a parse with exception if
+                                    // (1) it contains no records, and
+                                    // (2) there are no fetched records with actual content preceding this
+                                    // exception.
+                                    if result.is_empty() && size_in_bytes == 0 {
+                                        // todo: do we need to consider it like java ?
+                                        // self.log_fetch_buffer.poll();
+                                    }
+                                    return Err(e);
+                                }
                             }
+                        } else {
+                            self.log_fetch_buffer
+                                .set_next_in_line_fetch(Some(completed_fetch));
+                        }
+                        // Note: poll() already removed the fetch from buffer, so no need to call poll()
+                    } else {
+                        // No more fetches available
+                        break;
+                    }
+                } else {
+                    // Fetch records from next_in_line
+                    if let Some(mut next_fetch) = next_in_line {
+                        let records = match self
+                            .fetch_records_from_fetch(&mut next_fetch, records_remaining)
+                        {
+                            Ok(records) => records,
                             Err(e) => {
-                                // Remove a completedFetch upon a parse with exception if
-                                // (1) it contains no records, and
-                                // (2) there are no fetched records with actual content preceding this
-                                // exception.
-                                if result.is_empty() && size_in_bytes == 0 {
-                                    // todo: do we need to consider it like java ?
-                                    // self.log_fetch_buffer.poll();
+                                if !next_fetch.is_consumed() {
+                                    self.log_fetch_buffer
+                                        .set_next_in_line_fetch(Some(next_fetch));
                                 }
                                 return Err(e);
                             }
+                        };
+
+                        if !records.is_empty() {
+                            let table_bucket = next_fetch.table_bucket().clone();
+                            // Merge with existing records for this bucket
+                            let existing = result.entry(table_bucket).or_default();
+                            let records_count = records.len();
+                            existing.extend(records);
+
+                            records_remaining = records_remaining.saturating_sub(records_count);
                         }
-                    } else {
-                        self.log_fetch_buffer
-                            .set_next_in_line_fetch(Some(completed_fetch));
+
+                        // If the fetch is not fully consumed, put it back for the next round
+                        if !next_fetch.is_consumed() {
+                            self.log_fetch_buffer
+                                .set_next_in_line_fetch(Some(next_fetch));
+                        }
+                        // If consumed, next_fetch will be dropped here (which is correct)
                     }
-                    // Note: poll() already removed the fetch from buffer, so no need to call poll()
-                } else {
-                    // No more fetches available
-                    break;
                 }
-            } else {
-                // Fetch records from next_in_line
-                if let Some(mut next_fetch) = next_in_line {
-                    let records =
-                        self.fetch_records_from_fetch(&mut next_fetch, records_remaining)?;
-
-                    if !records.is_empty() {
-                        let table_bucket = next_fetch.table_bucket().clone();
-                        // Merge with existing records for this bucket
-                        let existing = result.entry(table_bucket).or_default();
-                        let records_count = records.len();
-                        existing.extend(records);
-
-                        records_remaining = records_remaining.saturating_sub(records_count);
-                    }
+            }
+            Ok(())
+        })();
 
-                    // If the fetch is not fully consumed, put it back for the next round
-                    if !next_fetch.is_consumed() {
-                        self.log_fetch_buffer
-                            .set_next_in_line_fetch(Some(next_fetch));
-                    }
-                    // If consumed, next_fetch will be dropped here (which is correct)
+        match collect_result {
+            Ok(()) => Ok(result),
+            Err(e) => {
+                if result.is_empty() {
+                    Err(e)
+                } else {
+                    Ok(result)
                 }
             }
         }
-
-        Ok(result)
     }
 
     /// Initialize a completed fetch, checking offset match and updating high watermark
@@ -833,12 +955,63 @@ impl LogFetcher {
         &self,
         mut completed_fetch: Box<dyn CompletedFetch>,
     ) -> Result<Option<Box<dyn CompletedFetch>>> {
-        // todo: handle error in initialize fetch
-        let table_bucket = completed_fetch.table_bucket();
+        if let Some(error) = completed_fetch.take_error() {
+            return Err(error);
+        }
+
+        let table_bucket = completed_fetch.table_bucket().clone();
         let fetch_offset = completed_fetch.next_fetch_offset();
 
+        if let Some(api_error) = completed_fetch.api_error() {
+            let error = FlussError::for_code(api_error.code);
+            let error_message = api_error.message.as_str();
+            self.log_scanner_status
+                .move_bucket_to_end(table_bucket.clone());
+            let action = completed_fetch
+                .fetch_error_context()
+                .map(|context| context.action)
+                .unwrap_or(FetchErrorAction::Unexpected);
+            match action {
+                FetchErrorAction::Ignore => {
+                    return Ok(None);
+                }
+                FetchErrorAction::LogOffsetOutOfRange => {
+                    return Err(Error::UnexpectedError {
+                        message: format!(
+                            "The fetching offset {fetch_offset} is out of range: {error_message}"
+                        ),
+                        source: None,
+                    });
+                }
+                FetchErrorAction::Authorization => {
+                    return Err(Error::FlussAPIError {
+                        api_error: ApiError {
+                            code: api_error.code,
+                            message: api_error.message.to_string(),
+                        },
+                    });
+                }
+                FetchErrorAction::CorruptMessage => {
+                    return Err(Error::UnexpectedError {
+                        message: format!(
+                            "Encountered corrupt message when fetching offset {fetch_offset} for bucket {table_bucket}: {error_message}"
+                        ),
+                        source: None,
+                    });
+                }
+                FetchErrorAction::Unexpected => {
+                    return Err(Error::UnexpectedError {
+                        message: format!(
+                            "Unexpected error code {error:?} while fetching at offset {fetch_offset} from bucket {table_bucket}: {error_message}"
+                        ),
+                        source: None,
+                    });
+                }
+            }
+        }
+
         // Check if bucket is still subscribed
-        let Some(current_offset) = self.log_scanner_status.get_bucket_offset(table_bucket) else {
+        let Some(current_offset) = self.log_scanner_status.get_bucket_offset(&table_bucket) else {
             warn!(
                 "Discarding stale fetch response for bucket {table_bucket:?} since the bucket has been unsubscribed"
             );
@@ -857,7 +1030,7 @@ impl LogFetcher {
         let high_watermark = completed_fetch.high_watermark();
         if high_watermark >= 0 {
             self.log_scanner_status
-                .update_high_watermark(table_bucket, high_watermark);
+                .update_high_watermark(&table_bucket, high_watermark);
         }
 
         completed_fetch.set_initialized();
@@ -894,6 +1067,11 @@ impl LogFetcher {
                     .update_offset(&table_bucket, next_fetch_offset);
             }
 
+            if next_in_line_fetch.is_consumed() && next_in_line_fetch.records_read() > 0 {
+                self.log_scanner_status
+                    .move_bucket_to_end(table_bucket.clone());
+            }
+
             Ok(records)
         } else {
             // These records aren't next in line, ignore them
@@ -915,58 +1093,73 @@ impl LogFetcher {
         let mut batches_remaining = MAX_BATCHES;
         let mut bytes_consumed: usize = 0;
 
-        while batches_remaining > 0 && bytes_consumed < MAX_BYTES {
-            let next_in_line = self.log_fetch_buffer.next_in_line_fetch();
+        // Run the loop inside an immediately-invoked closure: in a plain block,
+        // `?` and `return Err(..)` would leave the whole function and skip the
+        // match below, dropping batches that were collected before the failure.
+        let collect_result: Result<()> = (|| -> Result<()> {
+            while batches_remaining > 0 && bytes_consumed < MAX_BYTES {
+                let next_in_line = self.log_fetch_buffer.next_in_line_fetch();
 
-            match next_in_line {
-                Some(mut next_fetch) if !next_fetch.is_consumed() => {
-                    let batches =
-                        self.fetch_batches_from_fetch(&mut next_fetch, batches_remaining)?;
-                    let batch_count = batches.len();
+                match next_in_line {
+                    Some(mut next_fetch) if !next_fetch.is_consumed() => {
+                        let batches =
+                            self.fetch_batches_from_fetch(&mut next_fetch, batches_remaining)?;
+                        let batch_count = batches.len();
 
-                    if !batches.is_empty() {
-                        // Track bytes consumed (soft cap - may exceed by one fetch)
-                        let batch_bytes: usize =
-                            batches.iter().map(|b| b.get_array_memory_size()).sum();
-                        bytes_consumed += batch_bytes;
+                        if !batches.is_empty() {
+                            // Track bytes consumed (soft cap - may exceed by one fetch)
+                            let batch_bytes: usize =
+                                batches.iter().map(|b| b.get_array_memory_size()).sum();
+                            bytes_consumed += batch_bytes;
 
-                        result.extend(batches);
-                        batches_remaining = batches_remaining.saturating_sub(batch_count);
-                    }
+                            result.extend(batches);
+                            batches_remaining = batches_remaining.saturating_sub(batch_count);
+                        }
 
-                    if !next_fetch.is_consumed() {
-                        self.log_fetch_buffer
-                            .set_next_in_line_fetch(Some(next_fetch));
+                        if !next_fetch.is_consumed() {
+                            self.log_fetch_buffer
+                                .set_next_in_line_fetch(Some(next_fetch));
+                        }
                     }
-                }
-                _ => {
-                    if let Some(completed_fetch) = self.log_fetch_buffer.poll() {
-                        if !completed_fetch.is_initialized() {
-                            let size_in_bytes = completed_fetch.size_in_bytes();
-                            match self.initialize_fetch(completed_fetch) {
-                                Ok(initialized) => {
-                                    self.log_fetch_buffer.set_next_in_line_fetch(initialized);
-                                    continue;
-                                }
-                                Err(e) => {
-                                    if result.is_empty() && size_in_bytes == 0 {
+                    _ => {
+                        if let Some(completed_fetch) = self.log_fetch_buffer.poll() {
+                            if !completed_fetch.is_initialized() {
+                                let size_in_bytes = completed_fetch.size_in_bytes();
+                                match self.initialize_fetch(completed_fetch) {
+                                    Ok(initialized) => {
+                                        self.log_fetch_buffer.set_next_in_line_fetch(initialized);
                                         continue;
                                     }
-                                    return Err(e);
+                                    Err(e) => {
+                                        if result.is_empty() && size_in_bytes == 0 {
+                                            continue;
+                                        }
+                                        return Err(e);
+                                    }
                                 }
+                            } else {
+                                self.log_fetch_buffer
+                                    .set_next_in_line_fetch(Some(completed_fetch));
                             }
                         } else {
-                            self.log_fetch_buffer
-                                .set_next_in_line_fetch(Some(completed_fetch));
+                            break;
                         }
-                    } else {
-                        break;
                     }
                 }
             }
-        }
+            Ok(())
+        })();
 
-        Ok(result)
+        match collect_result {
+            Ok(()) => Ok(result),
+            Err(e) => {
+                if result.is_empty() {
+                    Err(e)
+                } else {
+                    Ok(result)
+                }
+            }
+        }
     }
 
     fn fetch_batches_from_fetch(
@@ -1231,3 +1421,175 @@ impl BucketScanStatus {
         *self.high_watermark.write() = high_watermark
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::client::WriteRecord;
+    use crate::client::metadata::Metadata;
+    use crate::compression::{
+        ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+    };
+    use crate::metadata::{TableInfo, TablePath};
+    use crate::record::MemoryLogRecordsArrowBuilder;
+    use crate::row::{Datum, GenericRow};
+    use crate::rpc::FlussError;
+    use crate::test_utils::{build_cluster_arc, build_table_info};
+
+    fn build_records(table_info: &TableInfo, table_path: Arc<TablePath>) -> Result<Vec<u8>> {
+        let mut builder = MemoryLogRecordsArrowBuilder::new(
+            1,
+            table_info.get_row_type(),
+            false,
+            ArrowCompressionInfo {
+                compression_type: ArrowCompressionType::None,
+                compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+            },
+        );
+        let record = WriteRecord::new(
+            table_path,
+            GenericRow {
+                values: vec![Datum::Int32(1)],
+            },
+        );
+        builder.append(&record)?;
+        builder.build()
+    }
+
+    #[tokio::test]
+    async fn collect_fetches_updates_offset() -> Result<()> {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = build_table_info(table_path.clone(), 1, 1);
+        let cluster = build_cluster_arc(&table_path, 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster));
+        let status = Arc::new(LogScannerStatus::new());
+        let fetcher = LogFetcher::new(
+            table_info.clone(),
+            Arc::new(RpcClient::new()),
+            metadata,
+            status.clone(),
+            None,
+        )?;
+
+        let bucket = TableBucket::new(1, 0);
+        status.assign_scan_bucket(bucket.clone(), 0);
+
+        let data = build_records(&table_info, Arc::new(table_path))?;
+        let log_records = LogRecordsBatches::new(data.clone());
+        let read_context = ReadContext::new(to_arrow_schema(table_info.get_row_type()), false);
+        let completed =
+            DefaultCompletedFetch::new(bucket.clone(), log_records, data.len(), read_context, 0, 0);
+        fetcher.log_fetch_buffer.add(Box::new(completed));
+
+        let fetched = fetcher.collect_fetches()?;
+        assert_eq!(fetched.get(&bucket).unwrap().len(), 1);
+        assert_eq!(status.get_bucket_offset(&bucket), Some(1));
+        Ok(())
+    }
+
+    #[test]
+    fn fetch_records_from_fetch_drains_unassigned_bucket() -> Result<()> {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = build_table_info(table_path.clone(), 1, 1);
+        let cluster = build_cluster_arc(&table_path, 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster));
+        let status = Arc::new(LogScannerStatus::new());
+        let fetcher = LogFetcher::new(
+            table_info.clone(),
+            Arc::new(RpcClient::new()),
+            metadata,
+            status,
+            None,
+        )?;
+
+        let bucket = TableBucket::new(1, 0);
+        let data = build_records(&table_info, Arc::new(table_path))?;
+        let log_records = LogRecordsBatches::new(data.clone());
+        let read_context = ReadContext::new(to_arrow_schema(table_info.get_row_type()), false);
+        let mut completed: Box<dyn CompletedFetch> = Box::new(DefaultCompletedFetch::new(
+            bucket,
+            log_records,
+            data.len(),
+            read_context,
+            0,
+            0,
+        ));
+
+        let records = fetcher.fetch_records_from_fetch(&mut completed, 10)?;
+        assert!(records.is_empty());
+        assert!(completed.is_consumed());
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn prepare_fetch_log_requests_skips_pending() -> Result<()> {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = build_table_info(table_path.clone(), 1, 1);
+        let cluster = build_cluster_arc(&table_path, 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster));
+        let status = Arc::new(LogScannerStatus::new());
+        status.assign_scan_bucket(TableBucket::new(1, 0), 0);
+        let fetcher = LogFetcher::new(
+            table_info,
+            Arc::new(RpcClient::new()),
+            metadata,
+            status,
+            None,
+        )?;
+
+        fetcher.nodes_with_pending_fetch_requests.lock().insert(1);
+
+        let requests = fetcher.prepare_fetch_log_requests().await;
+        assert!(requests.is_empty());
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn handle_fetch_response_sets_error() -> Result<()> {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = build_table_info(table_path.clone(), 1, 1);
+        let cluster = build_cluster_arc(&table_path, 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster));
+        let status = Arc::new(LogScannerStatus::new());
+        status.assign_scan_bucket(TableBucket::new(1, 0), 5);
+        let fetcher = LogFetcher::new(
+            table_info.clone(),
+            Arc::new(RpcClient::new()),
+            metadata.clone(),
+            status.clone(),
+            None,
+        )?;
+
+        let response = crate::proto::FetchLogResponse {
+            tables_resp: vec![crate::proto::PbFetchLogRespForTable {
+                table_id: 1,
+                buckets_resp: vec![crate::proto::PbFetchLogRespForBucket {
+                    partition_id: None,
+                    bucket_id: 0,
+                    error_code: Some(FlussError::AuthorizationException.code()),
+                    error_message: Some("denied".to_string()),
+                    high_watermark: None,
+                    log_start_offset: None,
+                    remote_log_fetch_info: None,
+                    records: None,
+                }],
+            }],
+        };
+
+        LogFetcher::handle_fetch_response(
+            response,
+            &fetcher.log_fetch_buffer,
+            &fetcher.log_scanner_status,
+            &fetcher.read_context,
+            &fetcher.remote_read_context,
+            &fetcher.remote_log_downloader,
+            &fetcher.credentials_cache,
+        )
+        .await;
+
+        let completed = fetcher.log_fetch_buffer.poll().expect("completed fetch");
+        let api_error = completed.api_error().expect("api error");
+        assert_eq!(api_error.code, FlussError::AuthorizationException.code());
+        Ok(())
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index cb03a2c462..ffac0af8ae 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -455,7 +455,7 @@ mod tests {
     use crate::row::{Datum, GenericRow};
     use crate::rpc::FlussError;
     use crate::test_utils::build_cluster_arc;
-    use std::collections::HashSet;
+    use std::collections::{HashMap, HashSet};
 
     async fn build_ready_batch(
         accumulator: &RecordAccumulator,
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index 0a368b7be9..368d8abc80 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -99,6 +99,11 @@ pub enum Error {
     )]
     IoUnsupported { message: String },
 
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting wakeup error {}.", message)
+    )]
+    WakeupError { message: String },
     #[snafu(
         visibility(pub(crate)),
         display("Fluss hitting unsupported operation error {}.", message)
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 89fb7b9c94..c166ebe8f6 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -17,7 +17,7 @@
 
 use crate::client::{Record, WriteRecord};
 use crate::compression::ArrowCompressionInfo;
-use crate::error::Result;
+use crate::error::{Error, Result};
 use crate::metadata::DataType;
 use crate::record::{ChangeType, ScanRecord};
 use crate::row::{ColumnarRow, GenericRow};
@@ -446,7 +446,7 @@ impl LogRecordBatch {
     }
 
     pub fn ensure_valid(&self) -> Result<()> {
-        // todo
+        // TODO enable validation once checksum handling is corrected.
         Ok(())
     }
 
@@ -780,8 +780,10 @@ impl ReadContext {
         arrow_schema: SchemaRef,
         projected_fields: Vec<usize>,
         is_from_remote: bool,
-    ) -> ReadContext {
-        let target_schema = Self::project_schema(arrow_schema.clone(), projected_fields.as_slice());
+    ) -> Result<ReadContext> {
+        Self::validate_projection(&arrow_schema, projected_fields.as_slice())?;
+        let target_schema =
+            Self::project_schema(arrow_schema.clone(), projected_fields.as_slice())?;
         // the logic is little bit of hard to understand, to refactor it to follow
         // java side
         let (need_do_reorder, sorted_fields) = {
@@ -804,16 +806,20 @@ impl ReadContext {
                 // Calculate reordering indexes to transform from sorted order to user-requested order
                 let mut reordering_indexes = Vec::with_capacity(projected_fields.len());
                 for &original_idx in &projected_fields {
-                    let pos = sorted_fields
-                        .binary_search(&original_idx)
-                        .expect("projection index should exist in sorted list");
+                    let pos = sorted_fields.binary_search(&original_idx).map_err(|_| {
+                        Error::IllegalArgument {
+                            message: format!(
+                                "Projection index {original_idx} is invalid for the current schema."
+                            ),
+                        }
+                    })?;
                     reordering_indexes.push(pos);
                 }
                 Projection {
                     ordered_schema: Self::project_schema(
                         arrow_schema.clone(),
                         sorted_fields.as_slice(),
-                    ),
+                    )?,
                     projected_fields,
                     ordered_fields: sorted_fields,
                     reordering_indexes,
@@ -824,7 +830,7 @@ impl ReadContext {
                     ordered_schema: Self::project_schema(
                         arrow_schema.clone(),
                         projected_fields.as_slice(),
-                    ),
+                    )?,
                     ordered_fields: projected_fields.clone(),
                     projected_fields,
                     reordering_indexes: vec![],
@@ -833,21 +839,34 @@ impl ReadContext {
             }
         };
 
-        ReadContext {
+        Ok(ReadContext {
             target_schema,
             full_schema: arrow_schema,
             projection: Some(project),
             is_from_remote,
+        })
+    }
+
+    fn validate_projection(schema: &SchemaRef, projected_fields: &[usize]) -> Result<()> {
+        let field_count = schema.fields().len();
+        for &index in projected_fields {
+            if index >= field_count {
+                return Err(Error::IllegalArgument {
+                    message: format!(
+                        "Projection index {index} is out of bounds for schema with {field_count} fields."
+                    ),
+                });
+            }
         }
+        Ok(())
     }
 
-    pub fn project_schema(schema: SchemaRef, projected_fields: &[usize]) -> SchemaRef {
-        // todo: handle the exception
-        SchemaRef::new(
-            schema
-                .project(projected_fields)
-                .expect("can't project schema"),
-        )
+    pub fn project_schema(schema: SchemaRef, projected_fields: &[usize]) -> Result<SchemaRef> {
+        Ok(SchemaRef::new(schema.project(projected_fields).map_err(
+            |e| Error::IllegalArgument {
+                message: format!("Invalid projection: {e}"),
+            },
+        )?))
     }
 
     pub fn project_fields(&self) -> Option<&[usize]> {
@@ -1035,6 +1054,8 @@ pub struct MyVec<T>(pub StreamReader<T>);
 #[cfg(test)]
 mod tests {
     use super::*;
+    use crate::error::Error;
+    use crate::metadata::DataField;
     use crate::metadata::DataTypes;
 
     #[test]
@@ -1207,6 +1228,18 @@ mod tests {
         );
     }
 
+    #[test]
+    fn projection_rejects_out_of_bounds_index() {
+        let row_type = DataTypes::row(vec![
+            DataField::new("id".to_string(), DataTypes::int(), None),
+            DataField::new("name".to_string(), DataTypes::string(), None),
+        ]);
+        let schema = to_arrow_schema(&row_type);
+        let result = ReadContext::with_projection_pushdown(schema, vec![0, 2], false);
+
+        assert!(matches!(result, Err(Error::IllegalArgument { .. })));
+    }
+
     fn le_bytes(vals: &[u32]) -> Vec<u8> {
         let mut out = Vec::with_capacity(vals.len() * 4);
         for &v in vals {
diff --git a/fluss-rust/crates/fluss/src/record/mod.rs b/fluss-rust/crates/fluss/src/record/mod.rs
index c5a3f8e4b6..94997e8d80 100644
--- a/fluss-rust/crates/fluss/src/record/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/mod.rs
@@ -182,3 +182,65 @@ impl IntoIterator for ScanRecords {
             .into_iter()
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use ::arrow::array::{Int32Array, RecordBatch};
+    use ::arrow::datatypes::{DataType, Field, Schema};
+    use std::sync::Arc;
+
+    fn make_row(values: Vec<i32>, row_id: usize) -> ColumnarRow {
+        let schema = Arc::new(Schema::new(vec![Field::new("v", DataType::Int32, false)]));
+        let batch = RecordBatch::try_new(schema, vec![Arc::new(Int32Array::from(values))])
+            .expect("record batch");
+        ColumnarRow::new_with_row_id(Arc::new(batch), row_id)
+    }
+
+    #[test]
+    fn change_type_round_trip() {
+        let cases = [
+            (ChangeType::AppendOnly, "+A", 0),
+            (ChangeType::Insert, "+I", 1),
+            (ChangeType::UpdateBefore, "-U", 2),
+            (ChangeType::UpdateAfter, "+U", 3),
+            (ChangeType::Delete, "-D", 4),
+        ];
+
+        for (change_type, short, byte) in cases {
+            assert_eq!(change_type.short_string(), short);
+            assert_eq!(change_type.to_byte_value(), byte);
+            assert_eq!(ChangeType::from_byte_value(byte).unwrap(), change_type);
+        }
+
+        let err = ChangeType::from_byte_value(9).unwrap_err();
+        assert!(err.contains("Unsupported byte value"));
+    }
+
+    #[test]
+    fn scan_records_counts_and_iterates() {
+        let bucket0 = TableBucket::new(1, 0);
+        let bucket1 = TableBucket::new(1, 1);
+        let record0 = ScanRecord::new(make_row(vec![10, 11], 0), 5, 7, ChangeType::Insert);
+        let record1 = ScanRecord::new(make_row(vec![10, 11], 1), 6, 8, ChangeType::Delete);
+
+        let mut records = HashMap::new();
+        records.insert(bucket0.clone(), vec![record0.clone(), record1.clone()]);
+
+        let scan_records = ScanRecords::new(records);
+        assert_eq!(scan_records.records(&bucket0).len(), 2);
+        assert!(scan_records.records(&bucket1).is_empty());
+        assert_eq!(scan_records.count(), 2);
+
+        let collected: Vec<_> = scan_records.into_iter().collect();
+        assert_eq!(collected.len(), 2);
+    }
+
+    #[test]
+    fn scan_record_default_values() {
+        let record = ScanRecord::new_default(make_row(vec![1], 0));
+        assert_eq!(record.offset(), -1);
+        assert_eq!(record.timestamp(), -1);
+        assert_eq!(record.change_type(), &ChangeType::Insert);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 31f0fdf298..90437c11aa 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -166,3 +166,67 @@ impl InternalRow for ColumnarRow {
             .value(self.row_id)
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use arrow::array::{
+        BinaryArray, BooleanArray, FixedSizeBinaryArray, Float32Array, Float64Array, Int8Array,
+        Int16Array, Int32Array, Int64Array, StringArray,
+    };
+    use arrow::datatypes::{DataType, Field, Schema};
+
+    #[test]
+    fn columnar_row_reads_values() {
+        let schema = Arc::new(Schema::new(vec![
+            Field::new("b", DataType::Boolean, false),
+            Field::new("i8", DataType::Int8, false),
+            Field::new("i16", DataType::Int16, false),
+            Field::new("i32", DataType::Int32, false),
+            Field::new("i64", DataType::Int64, false),
+            Field::new("f32", DataType::Float32, false),
+            Field::new("f64", DataType::Float64, false),
+            Field::new("s", DataType::Utf8, false),
+            Field::new("bin", DataType::Binary, false),
+            Field::new("char", DataType::FixedSizeBinary(2), false),
+        ]));
+
+        let batch = RecordBatch::try_new(
+            schema,
+            vec![
+                Arc::new(BooleanArray::from(vec![true])),
+                Arc::new(Int8Array::from(vec![1])),
+                Arc::new(Int16Array::from(vec![2])),
+                Arc::new(Int32Array::from(vec![3])),
+                Arc::new(Int64Array::from(vec![4])),
+                Arc::new(Float32Array::from(vec![1.25])),
+                Arc::new(Float64Array::from(vec![2.5])),
+                Arc::new(StringArray::from(vec!["hello"])),
+                Arc::new(BinaryArray::from(vec![b"data".as_slice()])),
+                Arc::new(
+                    FixedSizeBinaryArray::try_from_sparse_iter_with_size(
+                        vec![Some(b"ab".as_slice())].into_iter(),
+                        2,
+                    )
+                    .expect("fixed array"),
+                ),
+            ],
+        )
+        .expect("record batch");
+
+        let mut row = ColumnarRow::new(Arc::new(batch));
+        assert_eq!(row.get_field_count(), 10);
+        assert!(row.get_boolean(0));
+        assert_eq!(row.get_byte(1), 1);
+        assert_eq!(row.get_short(2), 2);
+        assert_eq!(row.get_int(3), 3);
+        assert_eq!(row.get_long(4), 4);
+        assert_eq!(row.get_float(5), 1.25);
+        assert_eq!(row.get_double(6), 2.5);
+        assert_eq!(row.get_string(7), "hello");
+        assert_eq!(row.get_bytes(8), b"data");
+        assert_eq!(row.get_char(9, 2), "ab");
+        row.set_row_id(0);
+        assert_eq!(row.get_row_id(), 0);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
index 9ab1f143f3..fcecb4188c 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
@@ -17,9 +17,9 @@
 
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 
-use crate::error::Error;
 use crate::error::Result as FlussResult;
-use crate::proto::ListOffsetsResponse;
+use crate::error::{Error, FlussError};
+use crate::proto::{ErrorResponse, ListOffsetsResponse};
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
@@ -108,22 +108,48 @@ impl ListOffsetsResponse {
         self.buckets_resp
             .iter()
             .map(|resp| {
-                if resp.error_code.is_some() {
-                    // todo: consider use another suitable error
-                    Err(Error::UnexpectedError {
+                if let Some(error_code) = resp.error_code
+                    && error_code != FlussError::None.code()
+                {
+                    let api_error = ErrorResponse {
+                        error_code,
+                        error_message: resp.error_message.clone(),
+                    }
+                    .into();
+                    return Err(Error::FlussAPIError { api_error });
+                }
+                // If no error code was reported, the offset must exist.
+                resp.offset
+                    .map(|offset| (resp.bucket_id, offset))
+                    .ok_or_else(|| Error::UnexpectedError {
                         message: format!(
-                            "Missing offset, error message: {}",
-                            resp.error_message
-                                .as_deref()
-                                .unwrap_or("unknown server exception")
+                            "Missing offset for bucket {} without error code.",
+                            resp.bucket_id
                         ),
                         source: None,
                     })
-                } else {
-                    // if no error msg, offset must exists
-                    Ok((resp.bucket_id, resp.offset.unwrap()))
-                }
             })
             .collect()
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::proto::{ListOffsetsResponse, PbListOffsetsRespForBucket};
+
+    #[test]
+    fn offsets_returns_api_error_on_error_code() {
+        let response = ListOffsetsResponse {
+            buckets_resp: vec![PbListOffsetsRespForBucket {
+                bucket_id: 1,
+                error_code: Some(FlussError::TableNotExist.code()),
+                error_message: Some("missing".to_string()),
+                offset: None,
+            }],
+        };
+
+        let result = response.offsets();
+        assert!(matches!(result, Err(Error::FlussAPIError { .. })));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
index d191615e86..30424e5d16 100644
--- a/fluss-rust/crates/fluss/src/util/mod.rs
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -184,3 +184,57 @@ impl<S> Default for FairBucketStatusMap<S> {
         Self::new()
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use std::sync::Arc;
+
+    #[test]
+    fn fair_bucket_status_map_tracks_order_and_size() {
+        let bucket0 = TableBucket::new(1, 0);
+        let bucket1 = TableBucket::new(1, 1);
+
+        let mut map = FairBucketStatusMap::new();
+        map.update_and_move_to_end(bucket0.clone(), 10);
+        map.update_and_move_to_end(bucket1.clone(), 20);
+        assert_eq!(map.size(), 2);
+
+        let values: Vec<i32> = map
+            .bucket_status_values()
+            .into_iter()
+            .map(|value| **value)
+            .collect();
+        assert_eq!(values, vec![10, 20]);
+
+        map.move_to_end(bucket0.clone());
+        let values: Vec<i32> = map
+            .bucket_status_values()
+            .into_iter()
+            .map(|value| **value)
+            .collect();
+        assert_eq!(values, vec![20, 10]);
+    }
+
+    #[test]
+    fn fair_bucket_status_map_mutations() {
+        let bucket0 = TableBucket::new(1, 0);
+        let bucket1 = TableBucket::new(2, 1);
+
+        let mut map = FairBucketStatusMap::new();
+        let mut input = HashMap::new();
+        input.insert(bucket0.clone(), Arc::new(1));
+        input.insert(bucket1.clone(), Arc::new(2));
+        map.set(input);
+
+        assert!(map.contains(&bucket0));
+        assert!(map.contains(&bucket1));
+        assert_eq!(map.bucket_set().len(), 2);
+
+        map.remove(&bucket1);
+        assert_eq!(map.size(), 1);
+
+        map.clear();
+        assert_eq!(map.size(), 0);
+    }
+}

From ffc026ddcab8c22c281909afaa75265774b374e3 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Sat, 17 Jan 2026 15:37:07 +0800
Subject: [PATCH 072/287] chore: correct log record batch checksum bounds
 (#172)

---
 fluss-rust/crates/fluss/src/record/arrow.rs | 30 ++++++++++++++++++---
 1 file changed, 26 insertions(+), 4 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index c166ebe8f6..b331ae9d7f 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -86,6 +86,8 @@ pub enum LogMagicValue {
     V0 = 0,
 }
 
+// NOTE: Rust layout/offsets currently match Java only for V0.
+// TODO: Add V1 layout/offsets to keep parity with Java's V1 format.
 pub const CURRENT_LOG_MAGIC_VALUE: u8 = LogMagicValue::V0 as u8;
 
 /// Value used if writer ID is not available or non-idempotent.
@@ -457,8 +459,7 @@ impl LogRecordBatch {
 
     fn compute_checksum(&self) -> u32 {
         let start = SCHEMA_ID_OFFSET;
-        let end = start + self.data.len();
-        crc32c(&self.data[start..end])
+        crc32c(&self.data[start..])
     }
 
     fn attributes(&self) -> u8 {
@@ -471,12 +472,12 @@ impl LogRecordBatch {
 
     pub fn checksum(&self) -> u32 {
         let offset = CRC_OFFSET;
-        LittleEndian::read_u32(&self.data[offset..offset + CRC_OFFSET])
+        LittleEndian::read_u32(&self.data[offset..offset + CRC_LENGTH])
     }
 
     pub fn schema_id(&self) -> i16 {
         let offset = SCHEMA_ID_OFFSET;
-        LittleEndian::read_i16(&self.data[offset..offset + SCHEMA_ID_OFFSET])
+        LittleEndian::read_i16(&self.data[offset..offset + SCHEMA_ID_LENGTH])
     }
 
     pub fn base_log_offset(&self) -> i64 {
@@ -1240,6 +1241,27 @@ mod tests {
         assert!(matches!(result, Err(Error::IllegalArgument { .. })));
     }
 
+    #[test]
+    fn checksum_and_schema_id_read_minimum_header() {
+        // Header-only batches with record_count == 0 are valid; this covers the minimal bytes
+        // needed for checksum/schema_id access.
+        let mut data = vec![0u8; SCHEMA_ID_OFFSET + SCHEMA_ID_LENGTH];
+        let crc = 0xA1B2C3D4u32;
+        let schema_id = 42i16;
+        LittleEndian::write_u32(&mut data[CRC_OFFSET..CRC_OFFSET + CRC_LENGTH], crc);
+        LittleEndian::write_i16(
+            &mut data[SCHEMA_ID_OFFSET..SCHEMA_ID_OFFSET + SCHEMA_ID_LENGTH],
+            schema_id,
+        );
+
+        let batch = LogRecordBatch::new(Bytes::from(data));
+        assert_eq!(batch.checksum(), crc);
+        assert_eq!(batch.schema_id(), schema_id);
+
+        let expected = crc32c(&batch.data[SCHEMA_ID_OFFSET..]);
+        assert_eq!(batch.compute_checksum(), expected);
+    }
+
     fn le_bytes(vals: &[u32]) -> Vec<u8> {
         let mut out = Vec::with_capacity(vals.len() * 4);
         for &v in vals {

From 41f824fe778ab648df844a295747c2da32cbb220 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 17 Jan 2026 15:41:12 +0000
Subject: [PATCH 073/287] feat: Introduce KVReadContext and read path wiring
 (#174)

---
 .../crates/fluss/src/record/kv/kv_record.rs   | 166 ++++++++--------
 .../fluss/src/record/kv/kv_record_batch.rs    | 115 ++++++++---
 .../src/record/kv/kv_record_batch_builder.rs  | 154 ++++++++-------
 .../src/record/kv/kv_record_read_context.rs   | 179 ++++++++++++++++++
 fluss-rust/crates/fluss/src/record/kv/mod.rs  |   7 +
 .../fluss/src/record/kv/read_context.rs       |  45 +++++
 .../crates/fluss/src/record/kv/test_util.rs   |  50 +++++
 fluss-rust/crates/fluss/src/row/mod.rs        |   2 +
 .../crates/fluss/src/row/row_decoder.rs       | 137 ++++++++++++++
 9 files changed, 674 insertions(+), 181 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
 create mode 100644 fluss-rust/crates/fluss/src/record/kv/read_context.rs
 create mode 100644 fluss-rust/crates/fluss/src/record/kv/test_util.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/row_decoder.rs

diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
index ab8c2ac1dd..a9c45d6971 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
@@ -27,6 +27,8 @@
 use bytes::{BufMut, Bytes, BytesMut};
 use std::io;
 
+use crate::row::RowDecoder;
+use crate::row::compacted::CompactedRow;
 use crate::util::varint::{
     read_unsigned_varint_bytes, size_of_unsigned_varint, write_unsigned_varint_buf,
 };
@@ -34,7 +36,7 @@ use crate::util::varint::{
 /// Length field size in bytes
 pub const LENGTH_LENGTH: usize = 4;
 
-/// A key-value record.
+/// A key-value record containing raw key and value bytes.
 ///
 /// The schema is:
 /// - Length => Int32
@@ -43,34 +45,39 @@ pub const LENGTH_LENGTH: usize = 4;
 /// - Value => bytes (BinaryRow, written directly without length prefix)
 ///
 /// When the value is None (deletion), no Value bytes are present.
-// Reference implementation:
-// https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/record/KvRecord.java
+///
+/// This struct stores only raw bytes. To decode the value into a typed row,
+/// use the `row()` method with a RowDecoder (typically obtained from the iterator).
+///
+/// Reference implementation:
+/// <https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/record/KvRecord.java>
 #[derive(Debug, Clone)]
 pub struct KvRecord {
     key: Bytes,
-    value: Option<Bytes>,
+    value_bytes: Option<Bytes>,
     size_in_bytes: usize,
 }
 
 impl KvRecord {
-    /// Create a new KvRecord with the given key and optional value.
-    pub fn new(key: Bytes, value: Option<Bytes>) -> Self {
-        let size_in_bytes = Self::size_of(&key, value.as_deref());
-        Self {
-            key,
-            value,
-            size_in_bytes,
-        }
-    }
-
     /// Get the key bytes.
     pub fn key(&self) -> &Bytes {
         &self.key
     }
 
-    /// Get the value bytes (None indicates a deletion).
-    pub fn value(&self) -> Option<&Bytes> {
-        self.value.as_ref()
+    /// Get the raw value bytes (for testing).
+    #[cfg(test)]
+    pub(crate) fn value_bytes(&self) -> Option<&Bytes> {
+        self.value_bytes.as_ref()
+    }
+
+    /// Decode the value bytes into a typed row using the provided decoder.
+    /// This creates a lightweight CompactedRow view over the raw bytes.
+    /// Actual field parsing is lazy (on first access).
+    pub fn row<'a>(&'a self, decoder: &dyn RowDecoder) -> Option<CompactedRow<'a>> {
+        self.value_bytes.as_ref().map(|bytes| {
+            // Decode on-demand - CompactedRow<'a> lifetime tied to &'a self
+            decoder.decode(bytes.as_ref())
+        })
     }
 
     /// Calculate the total size of the record when serialized (including length prefix).
@@ -121,8 +128,7 @@ impl KvRecord {
     /// Read a KV record from bytes at the given position.
     ///
     /// Returns the KvRecord and the number of bytes consumed.
-    ///
-    /// TODO: Connect KvReadContext and return CompactedRow records.
+    /// The record contains only raw bytes; use `row()` with a RowDecoder to decode the value.
     pub fn read_from(bytes: &Bytes, position: usize) -> io::Result<(Self, usize)> {
         if bytes.len() < position.saturating_add(LENGTH_LENGTH) {
             return Err(io::Error::new(
@@ -183,11 +189,10 @@ impl KvRecord {
         let key = bytes.slice(current_offset..key_end);
         current_offset = key_end;
 
-        // Read value bytes directly
-        let value = if current_offset < record_end {
+        // Read value bytes directly (don't decode yet - will decode on-demand)
+        let value_bytes = if current_offset < record_end {
             // Value is present: all remaining bytes are the value
-            let value_bytes = bytes.slice(current_offset..record_end);
-            Some(value_bytes)
+            Some(bytes.slice(current_offset..record_end))
         } else {
             // No remaining bytes: this is a deletion record
             None
@@ -196,7 +201,7 @@ impl KvRecord {
         Ok((
             Self {
                 key,
-                value,
+                value_bytes,
                 size_in_bytes: total_size,
             },
             total_size,
@@ -207,6 +212,11 @@ impl KvRecord {
     pub fn get_size_in_bytes(&self) -> usize {
         self.size_in_bytes
     }
+
+    /// Check if this is a deletion record (no value).
+    pub fn is_deletion(&self) -> bool {
+        self.value_bytes.is_none()
+    }
 }
 
 #[cfg(test)]
@@ -214,30 +224,25 @@ mod tests {
     use super::*;
 
     #[test]
-    fn test_kv_record_size_calculation() {
+    fn test_kv_record_basic_operations() {
         let key = b"test_key";
         let value = b"test_value";
 
-        // With value (no value length varint)
+        // Test size calculation with value
         let size_with_value = KvRecord::size_of(key, Some(value));
         assert_eq!(
             size_with_value,
             LENGTH_LENGTH + size_of_unsigned_varint(key.len() as u32) + key.len() + value.len()
         );
 
-        // Without value
+        // Test size calculation without value (deletion)
         let size_without_value = KvRecord::size_of(key, None);
         assert_eq!(
             size_without_value,
             LENGTH_LENGTH + size_of_unsigned_varint(key.len() as u32) + key.len()
         );
-    }
-
-    #[test]
-    fn test_kv_record_write_read_round_trip() {
-        let key = b"my_key";
-        let value = b"my_value_data";
 
+        // Test write/read round trip with value
         let mut buf = BytesMut::new();
         let written = KvRecord::write_to_buf(&mut buf, key, Some(value)).unwrap();
 
@@ -246,40 +251,70 @@ mod tests {
 
         assert_eq!(written, read_size);
         assert_eq!(record.key().as_ref(), key);
-        assert_eq!(record.value().unwrap().as_ref(), value);
+        assert_eq!(record.value_bytes().unwrap().as_ref(), value);
         assert_eq!(record.get_size_in_bytes(), written);
-    }
-
-    #[test]
-    fn test_kv_record_deletion() {
-        let key = b"delete_me";
+        assert!(!record.is_deletion());
 
-        // Write deletion record (no value)
+        // Test deletion record (no value)
+        let delete_key = b"delete_me";
         let mut buf = BytesMut::new();
-        let written = KvRecord::write_to_buf(&mut buf, key, None).unwrap();
+        let written = KvRecord::write_to_buf(&mut buf, delete_key, None).unwrap();
 
         let bytes = buf.freeze();
         let (record, read_size) = KvRecord::read_from(&bytes, 0).unwrap();
 
         assert_eq!(written, read_size);
-        assert_eq!(record.key().as_ref(), key);
-        assert!(record.value().is_none());
+        assert_eq!(record.key().as_ref(), delete_key);
+        assert!(record.is_deletion());
+        assert!(record.value_bytes().is_none());
     }
 
     #[test]
-    fn test_kv_record_with_large_key() {
-        let key = vec![0u8; 1024];
-        let value = vec![1u8; 4096];
+    fn test_kv_record_multiple_records() {
+        // Test multiple regular-sized records in buffer
+        let records = vec![
+            (b"key1".as_slice(), Some(b"value1".as_slice())),
+            (b"key2".as_slice(), None), // Deletion
+            (b"key3".as_slice(), Some(b"value3".as_slice())),
+        ];
 
         let mut buf = BytesMut::new();
-        let written = KvRecord::write_to_buf(&mut buf, &key, Some(&value)).unwrap();
+        for (key, value) in &records {
+            KvRecord::write_to_buf(&mut buf, key, *value).unwrap();
+        }
+
+        let bytes = buf.freeze();
+        let mut offset = 0;
+        for (expected_key, expected_value) in &records {
+            let (record, size) = KvRecord::read_from(&bytes, offset).unwrap();
+            assert_eq!(record.key().as_ref(), *expected_key);
+            match expected_value {
+                Some(v) => {
+                    assert_eq!(record.value_bytes().unwrap().as_ref(), *v);
+                    assert!(!record.is_deletion());
+                }
+                None => {
+                    assert!(record.is_deletion());
+                    assert!(record.value_bytes().is_none());
+                }
+            }
+            offset += size;
+        }
+        assert_eq!(offset, bytes.len());
+
+        // Test large keys and values
+        let large_key = vec![0u8; 1024];
+        let large_value = vec![1u8; 4096];
+
+        let mut buf = BytesMut::new();
+        let written = KvRecord::write_to_buf(&mut buf, &large_key, Some(&large_value)).unwrap();
 
         let bytes = buf.freeze();
         let (record, read_size) = KvRecord::read_from(&bytes, 0).unwrap();
 
         assert_eq!(written, read_size);
-        assert_eq!(record.key().len(), key.len());
-        assert_eq!(record.value().unwrap().len(), value.len());
+        assert_eq!(record.key().len(), large_key.len());
+        assert_eq!(record.value_bytes().unwrap().len(), large_value.len());
     }
 
     #[test]
@@ -291,7 +326,9 @@ mod tests {
         let bytes = buf.freeze();
         let result = KvRecord::read_from(&bytes, 0);
         assert!(result.is_err());
-        assert_eq!(result.unwrap_err().kind(), io::ErrorKind::InvalidData);
+        if let Err(e) = result {
+            assert_eq!(e.kind(), io::ErrorKind::InvalidData);
+        }
 
         // Test overflow length
         let mut buf = BytesMut::new();
@@ -307,33 +344,8 @@ mod tests {
         let bytes = buf.freeze();
         let result = KvRecord::read_from(&bytes, 0);
         assert!(result.is_err());
-        assert_eq!(result.unwrap_err().kind(), io::ErrorKind::UnexpectedEof);
-    }
-
-    #[test]
-    fn test_multiple_records_in_buffer() {
-        let records = vec![
-            (b"key1".as_slice(), Some(b"value1".as_slice())),
-            (b"key2".as_slice(), None),
-            (b"key3".as_slice(), Some(b"value3".as_slice())),
-        ];
-
-        let mut buf = BytesMut::new();
-        for (key, value) in &records {
-            KvRecord::write_to_buf(&mut buf, key, *value).unwrap();
+        if let Err(e) = result {
+            assert_eq!(e.kind(), io::ErrorKind::UnexpectedEof);
         }
-
-        let bytes = buf.freeze();
-        let mut offset = 0;
-        for (expected_key, expected_value) in &records {
-            let (record, size) = KvRecord::read_from(&bytes, offset).unwrap();
-            assert_eq!(record.key().as_ref(), *expected_key);
-            match expected_value {
-                Some(v) => assert_eq!(record.value().unwrap().as_ref(), *v),
-                None => assert!(record.value().is_none()),
-            }
-            offset += size;
-        }
-        assert_eq!(offset, bytes.len());
     }
 }
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
index eb3c09ad34..32f712f82e 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
@@ -32,8 +32,11 @@
 
 use bytes::Bytes;
 use std::io;
+use std::sync::Arc;
 
-use crate::record::kv::KvRecord;
+use crate::error::Result;
+use crate::record::kv::{KvRecord, ReadContext};
+use crate::row::RowDecoder;
 
 // Field lengths in bytes
 pub const LENGTH_LENGTH: usize = 4;
@@ -253,38 +256,87 @@ impl KvRecordBatch {
         ]))
     }
 
-    /// Create an iterator over the records in this batch.
-    /// This validates the batch checksum before returning the iterator.
+    /// Create an iterable collection of records in this batch.
+    ///
+    /// This validates the batch checksum before returning the records.
     /// For trusted data paths, use `records_unchecked()` to skip validation.
-    pub fn records(&self) -> io::Result<KvRecordIterator> {
+    ///
+    /// Mirrors: KvRecordBatch.records(ReadContext)
+    pub fn records(&self, read_context: &dyn ReadContext) -> Result<KvRecords> {
         if !self.is_valid() {
-            return Err(io::Error::new(
-                io::ErrorKind::InvalidData,
-                "Invalid batch checksum",
-            ));
+            return Err(crate::error::Error::IoUnexpectedError {
+                message: "Invalid batch checksum".to_string(),
+                source: io::Error::new(io::ErrorKind::InvalidData, "Invalid batch checksum"),
+            });
         }
-        self.records_unchecked()
+        self.records_unchecked(read_context)
     }
 
-    /// Create an iterator over the records in this batch without validating the checksum
-    pub fn records_unchecked(&self) -> io::Result<KvRecordIterator> {
+    /// Create an iterable collection of records in this batch without validating the checksum.
+    pub fn records_unchecked(&self, read_context: &dyn ReadContext) -> Result<KvRecords> {
         let size = self.size_in_bytes()?;
         let count = self.record_count()?;
+        let schema_id = self.schema_id()?;
+
         if count < 0 {
-            return Err(io::Error::new(
-                io::ErrorKind::InvalidData,
-                format!("Invalid record count: {count}"),
-            ));
+            return Err(crate::error::Error::IoUnexpectedError {
+                message: format!("Invalid record count: {count}"),
+                source: io::Error::new(io::ErrorKind::InvalidData, "Invalid record count"),
+            });
         }
-        Ok(KvRecordIterator {
-            data: self.data.clone(),
-            position: self.position + RECORDS_OFFSET,
-            end: self.position + size,
-            remaining_count: count,
+
+        // Get row decoder for this schema from context (cached)
+        let row_decoder = read_context.get_row_decoder(schema_id)?;
+
+        Ok(KvRecords {
+            iter: KvRecordIterator {
+                data: self.data.clone(),
+                position: self.position + RECORDS_OFFSET,
+                end: self.position + size,
+                remaining_count: count,
+            },
+            row_decoder,
         })
     }
 }
 
+/// Iterable collection of KV records with associated decoder.
+///
+/// This wrapper provides both iteration capability and access to the row decoder
+/// needed to decode record values into typed rows.
+pub struct KvRecords {
+    iter: KvRecordIterator,
+    row_decoder: Arc<dyn RowDecoder>,
+}
+
+impl KvRecords {
+    /// Get a reference to the row decoder for decoding record values.
+    ///
+    /// Returns a reference tied to the lifetime of `&self`.
+    /// Use this when the decoder is only needed before the `KvRecords` is consumed by `into_iter`.
+    pub fn decoder(&self) -> &dyn RowDecoder {
+        &*self.row_decoder
+    }
+
+    /// Get an owned Arc to the row decoder.
+    ///
+    /// Returns a cloned Arc that can outlive the KvRecords,
+    /// allowing you to grab it before consuming the iterator.
+    /// Useful if you must keep the decoder beyond the iterable's lifetime (collect-then-decode style).
+    pub fn decoder_arc(&self) -> Arc<dyn RowDecoder> {
+        Arc::clone(&self.row_decoder)
+    }
+}
+
+impl IntoIterator for KvRecords {
+    type Item = io::Result<KvRecord>;
+    type IntoIter = KvRecordIterator;
+
+    fn into_iter(self) -> Self::IntoIter {
+        self.iter
+    }
+}
+
 /// Iterator over records in a KV record batch.
 pub struct KvRecordIterator {
     data: Bytes,
@@ -319,7 +371,9 @@ impl Iterator for KvRecordIterator {
 mod tests {
     use super::*;
     use crate::metadata::{DataTypes, KvFormat, RowType};
+    use crate::record::kv::test_util::TestReadContext;
     use crate::record::kv::{CURRENT_KV_MAGIC_VALUE, KvRecordBatchBuilder};
+    use crate::row::InternalRow;
     use crate::row::binary::BinaryWriter;
     use crate::row::compacted::CompactedRow;
     use bytes::{BufMut, BytesMut};
@@ -380,15 +434,24 @@ mod tests {
         assert_eq!(batch.batch_sequence().unwrap(), 5);
         assert_eq!(batch.record_count().unwrap(), 2);
 
-        let records: Vec<_> = batch.records().unwrap().collect();
-        assert_eq!(records.len(), 2);
+        // Create ReadContext for reading
+        let read_context = TestReadContext::compacted(vec![DataTypes::bytes()]);
 
-        let record1 = records[0].as_ref().unwrap();
+        // Iterate and verify records using typed API
+        let records = batch.records(&read_context).unwrap();
+        let decoder = records.decoder_arc(); // Get Arc before consuming
+
+        let mut iter = records.into_iter();
+        let record1 = iter.next().unwrap().unwrap();
         assert_eq!(record1.key().as_ref(), key1);
-        assert_eq!(record1.value().unwrap().as_ref(), value1_writer.buffer());
+        assert!(!record1.is_deletion());
+        let row1 = record1.row(&*decoder).unwrap();
+        assert_eq!(row1.get_bytes(0), &[1, 2, 3, 4, 5]);
 
-        let record2 = records[1].as_ref().unwrap();
+        let record2 = iter.next().unwrap().unwrap();
         assert_eq!(record2.key().as_ref(), key2);
-        assert!(record2.value().is_none());
+        assert!(record2.is_deletion());
+
+        assert!(iter.next().is_none());
     }
 }
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
index c36a86121b..636104d176 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
@@ -330,22 +330,20 @@ mod tests {
     }
 
     #[test]
-    fn test_builder_basic_workflow() {
+    fn test_builder_basic_operations() {
+        // Test basic workflow: initial state, writer state, append, close, build
         let schema_id = 42;
         let write_limit = 4096;
         let mut builder = KvRecordBatchBuilder::new(schema_id, write_limit, KvFormat::COMPACTED);
 
-        // Test initial state
         assert!(!builder.is_closed());
         assert_eq!(builder.writer_id(), NO_WRITER_ID);
         assert_eq!(builder.batch_sequence(), NO_BATCH_SEQUENCE);
 
-        // Test writer state
         builder.set_writer_state(100, 5);
         assert_eq!(builder.writer_id(), 100);
         assert_eq!(builder.batch_sequence(), 5);
 
-        // Test appending records
         let key1 = b"key1";
         let value1 = create_test_row(b"value1");
         assert!(builder.has_room_for_row(key1, Some(&value1)));
@@ -355,7 +353,6 @@ mod tests {
         assert!(builder.has_room_for_row::<CompactedRow>(key2, None));
         builder.append_row::<CompactedRow>(key2, None).unwrap();
 
-        // Test close and build
         builder.close().unwrap();
         assert!(builder.is_closed());
 
@@ -365,11 +362,8 @@ mod tests {
         // Building again should return cached result
         let bytes2 = builder.build().unwrap();
         assert_eq!(bytes.len(), bytes2.len());
-    }
 
-    #[test]
-    fn test_builder_lifecycle() {
-        // Test abort behavior
+        // Test lifecycle: abort behavior
         let mut builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
         let value = create_test_row(b"value");
         builder.append_row(b"key", Some(&value)).unwrap();
@@ -378,13 +372,30 @@ mod tests {
         assert!(builder.build().is_err());
         assert!(builder.close().is_err());
 
-        // Test close behavior
+        // Test lifecycle: close behavior
         let mut builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
         let value = create_test_row(b"value");
         builder.append_row(b"key", Some(&value)).unwrap();
         builder.close().unwrap();
-        assert!(builder.append_row::<CompactedRow>(b"key2", None).is_err()); // Can't append after close
-        assert!(builder.build().is_ok()); // But can still build
+        assert!(builder.append_row::<CompactedRow>(b"key2", None).is_err());
+        assert!(builder.build().is_ok());
+
+        // Test KvFormat validation
+        let mut row_writer = CompactedRowWriter::new(1);
+        row_writer.write_int(42);
+        let row_type = RowType::with_data_types(vec![DataTypes::int()]);
+        let row = &CompactedRow::from_bytes(&row_type, row_writer.buffer());
+
+        // INDEXED format should reject append_row
+        let mut indexed_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::INDEXED);
+        let result = indexed_builder.append_row(b"key", Some(row));
+        assert!(result.is_err());
+        assert_eq!(result.unwrap_err().kind(), io::ErrorKind::InvalidInput);
+
+        // COMPACTED format should accept append_row
+        let mut compacted_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
+        let result = compacted_builder.append_row(b"key", Some(row));
+        assert!(result.is_ok());
     }
 
     #[test]
@@ -430,7 +441,10 @@ mod tests {
     }
 
     #[test]
-    fn test_cache_invalidation_on_append() {
+    fn test_builder_cache_invalidation() {
+        use crate::record::kv::KvRecordBatch;
+
+        // Test cache invalidation on append
         let mut builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
         builder.set_writer_state(100, 5);
 
@@ -446,18 +460,13 @@ mod tests {
         let len2 = bytes2.len();
 
         // Verify the second build includes both records
-        assert!(len2 > len1, "Second build should be larger");
-
-        use crate::record::kv::KvRecordBatch;
+        assert!(len2 > len1);
         let batch = KvRecordBatch::new(bytes2, 0);
         assert!(batch.is_valid());
-        assert_eq!(batch.record_count().unwrap(), 2, "Should have 2 records");
-    }
+        assert_eq!(batch.record_count().unwrap(), 2);
 
-    #[test]
-    fn test_cache_invalidation_on_set_writer_state() {
+        // Test cache invalidation on writer state change
         let mut builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
-
         builder.set_writer_state(100, 5);
         let value = create_test_row(b"value");
         builder.append_row(b"key", Some(&value)).unwrap();
@@ -467,24 +476,19 @@ mod tests {
         builder.set_writer_state(200, 10);
         let bytes2 = builder.build().unwrap();
 
-        assert_ne!(
-            bytes1, bytes2,
-            "Bytes should differ after writer state change"
-        );
+        assert_ne!(bytes1, bytes2);
 
-        use crate::record::kv::KvRecordBatch;
         let batch1 = KvRecordBatch::new(bytes1, 0);
         let batch2 = KvRecordBatch::new(bytes2, 0);
 
         assert_eq!(batch1.writer_id().unwrap(), 100);
         assert_eq!(batch1.batch_sequence().unwrap(), 5);
-
         assert_eq!(batch2.writer_id().unwrap(), 200);
         assert_eq!(batch2.batch_sequence().unwrap(), 10);
     }
 
     #[test]
-    fn test_builder_with_compacted_row_writer() {
+    fn test_builder_with_compacted_row_writer() -> crate::error::Result<()> {
         use crate::record::kv::KvRecordBatch;
         use crate::row::InternalRow;
         use crate::row::compacted::CompactedRow;
@@ -502,7 +506,7 @@ mod tests {
 
         let key1 = b"key1";
         assert!(builder.has_room_for_row(key1, Some(row1)));
-        builder.append_row(key1, Some(row1)).unwrap();
+        builder.append_row(key1, Some(row1))?;
 
         // Create and append second record
         let mut row_writer2 = CompactedRowWriter::new(2);
@@ -512,63 +516,57 @@ mod tests {
         let row2 = &CompactedRow::from_bytes(&row_type, row_writer2.buffer());
 
         let key2 = b"key2";
-        builder.append_row(key2, Some(row2)).unwrap();
+        builder.append_row(key2, Some(row2))?;
 
         // Append a deletion record
         let key3 = b"key3";
-        builder.append_row::<CompactedRow>(key3, None).unwrap();
+        builder.append_row::<CompactedRow>(key3, None)?;
 
         // Build and verify
-        builder.close().unwrap();
-        let bytes = builder.build().unwrap();
+        builder.close()?;
+        let bytes = builder.build()?;
 
         let batch = KvRecordBatch::new(bytes, 0);
         assert!(batch.is_valid());
-        assert_eq!(batch.record_count().unwrap(), 3);
-        assert_eq!(batch.writer_id().unwrap(), 100);
-        assert_eq!(batch.batch_sequence().unwrap(), 5);
-
-        // Read back and verify records
-        let records: Vec<_> = batch.records().unwrap().collect();
-        assert_eq!(records.len(), 3);
-
-        // Verify first record
-        let record1 = records[0].as_ref().unwrap();
-        assert_eq!(record1.key().as_ref(), key1);
-        let row1 = CompactedRow::from_bytes(&row_type, record1.value().unwrap());
-        assert_eq!(row1.get_int(0), 42);
-        assert_eq!(row1.get_string(1), "hello");
-
-        // Verify second record
-        let record2 = records[1].as_ref().unwrap();
-        assert_eq!(record2.key().as_ref(), key2);
-        let row2 = CompactedRow::from_bytes(&row_type, record2.value().unwrap());
-        assert_eq!(row2.get_int(0), 100);
-        assert_eq!(row2.get_string(1), "world");
-
-        // Verify deletion record
-        let record3 = records[2].as_ref().unwrap();
-        assert_eq!(record3.key().as_ref(), key3);
-        assert!(record3.value().is_none());
-    }
-
-    #[test]
-    fn test_kv_format_validation() {
-        let mut row_writer = CompactedRowWriter::new(1);
-        row_writer.write_int(42);
-
-        let row_type = RowType::with_data_types([DataTypes::int()].to_vec());
-        let row = &CompactedRow::from_bytes(&row_type, row_writer.buffer());
-
-        // INDEXED format should reject append_row
-        let mut indexed_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::INDEXED);
-        let result = indexed_builder.append_row(b"key", Some(row));
-        assert!(result.is_err());
-        assert_eq!(result.unwrap_err().kind(), io::ErrorKind::InvalidInput);
+        assert_eq!(batch.record_count()?, 3);
+        assert_eq!(batch.writer_id()?, 100);
+        assert_eq!(batch.batch_sequence()?, 5);
+
+        // Create ReadContext for reading typed rows
+        let types = vec![DataTypes::int(), DataTypes::string()];
+        let read_context = crate::record::kv::test_util::TestReadContext::compacted(types);
+
+        // Read back and verify records using idiomatic for-loop
+        let records = batch.records(&read_context)?;
+        let decoder = records.decoder_arc();
+        let mut record_count = 0;
+
+        for rec in records {
+            let rec = rec?;
+            record_count += 1;
+
+            match record_count {
+                1 => {
+                    assert_eq!(rec.key().as_ref(), key1);
+                    let row = rec.row(&*decoder).unwrap();
+                    assert_eq!(row.get_int(0), 42);
+                    assert_eq!(row.get_string(1), "hello");
+                }
+                2 => {
+                    assert_eq!(rec.key().as_ref(), key2);
+                    let row = rec.row(&*decoder).unwrap();
+                    assert_eq!(row.get_int(0), 100);
+                    assert_eq!(row.get_string(1), "world");
+                }
+                3 => {
+                    assert_eq!(rec.key().as_ref(), key3);
+                    assert!(rec.is_deletion());
+                }
+                _ => panic!("Unexpected record count"),
+            }
+        }
 
-        // COMPACTED format should accept append_row
-        let mut compacted_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
-        let result = compacted_builder.append_row(b"key", Some(row));
-        assert!(result.is_ok());
+        assert_eq!(record_count, 3);
+        Ok(())
     }
 }
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
new file mode 100644
index 0000000000..2049c32680
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
@@ -0,0 +1,179 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Default implementation of ReadContext with decoder caching.
+
+use super::ReadContext;
+use crate::error::{Error, Result};
+use crate::metadata::{KvFormat, Schema};
+use crate::row::{RowDecoder, RowDecoderFactory};
+use std::collections::HashMap;
+use std::sync::{Arc, Mutex};
+
+/// Trait for fetching schemas by ID.
+///
+/// This trait abstracts schema retrieval, allowing different implementations
+/// (e.g., from metadata store, cache, or test mocks).
+pub trait SchemaGetter: Send + Sync {
+    /// Get the schema for the given schema ID.
+    ///
+    /// # Arguments
+    /// * `schema_id` - The schema ID to fetch
+    ///
+    /// # Returns
+    /// An Arc-wrapped Schema for the specified ID, or an error if the schema
+    /// cannot be fetched (missing ID, network error, etc.)
+    fn get_schema(&self, schema_id: i16) -> Result<Arc<Schema>>;
+}
+
+/// Default implementation of ReadContext with decoder caching.
+///
+/// This implementation caches RowDecoders by schema ID for performance,
+/// avoiding repeated schema lookups and decoder creation.
+///
+/// Reference: org.apache.fluss.record.KvRecordReadContext
+pub struct KvRecordReadContext {
+    kv_format: KvFormat,
+    schema_getter: Arc<dyn SchemaGetter>,
+    row_decoder_cache: Mutex<HashMap<i16, Arc<dyn RowDecoder>>>,
+}
+
+impl KvRecordReadContext {
+    /// Create a new KvRecordReadContext.
+    ///
+    /// # Arguments
+    /// * `kv_format` - The KV format (COMPACTED or INDEXED)
+    /// * `schema_getter` - The schema getter for fetching schemas by ID
+    ///
+    /// # Returns
+    /// A new KvRecordReadContext instance
+    pub fn new(kv_format: KvFormat, schema_getter: Arc<dyn SchemaGetter>) -> Self {
+        Self {
+            kv_format,
+            schema_getter,
+            row_decoder_cache: Mutex::new(HashMap::new()),
+        }
+    }
+}
+
+impl ReadContext for KvRecordReadContext {
+    fn get_row_decoder(&self, schema_id: i16) -> Result<Arc<dyn RowDecoder>> {
+        // First check: fast path
+        {
+            let cache = self
+                .row_decoder_cache
+                .lock()
+                .unwrap_or_else(|poisoned| poisoned.into_inner());
+            if let Some(decoder) = cache.get(&schema_id) {
+                return Ok(Arc::clone(decoder));
+            }
+        } // Release lock before expensive operations
+
+        // Build decoder outside the lock to avoid blocking other threads
+        let schema = self.schema_getter.get_schema(schema_id)?;
+        let row_type = match schema.row_type() {
+            crate::metadata::DataType::Row(row_type) => row_type.clone(),
+            other => {
+                return Err(Error::IoUnexpectedError {
+                    message: format!(
+                        "Schema {} has invalid row type: expected Row, got {:?}",
+                        schema_id, other
+                    ),
+                    source: std::io::Error::new(
+                        std::io::ErrorKind::InvalidData,
+                        "Invalid row type",
+                    ),
+                });
+            }
+        };
+
+        // Create decoder outside lock
+        let decoder = RowDecoderFactory::create(self.kv_format.clone(), row_type)?;
+
+        // Second check: insert only if another thread didn't beat us to it
+        {
+            let mut cache = self
+                .row_decoder_cache
+                .lock()
+                .unwrap_or_else(|poisoned| poisoned.into_inner());
+            // Check again - another thread might have inserted while we were building
+            if let Some(existing) = cache.get(&schema_id) {
+                return Ok(Arc::clone(existing));
+            }
+            cache.insert(schema_id, Arc::clone(&decoder));
+        }
+
+        Ok(decoder)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{DataTypes, Schema};
+
+    struct MockSchemaGetter {
+        schema: Arc<Schema>,
+    }
+
+    impl MockSchemaGetter {
+        fn new(data_types: Vec<crate::metadata::DataType>) -> Self {
+            let mut builder = Schema::builder();
+            for (i, dt) in data_types.iter().enumerate() {
+                builder = builder.column(&format!("field{}", i), dt.clone());
+            }
+            let schema = builder.build().expect("Failed to build schema");
+
+            Self {
+                schema: Arc::new(schema),
+            }
+        }
+    }
+
+    impl SchemaGetter for MockSchemaGetter {
+        fn get_schema(&self, _schema_id: i16) -> Result<Arc<Schema>> {
+            Ok(Arc::clone(&self.schema))
+        }
+    }
+
+    #[test]
+    fn test_kv_record_read_context() {
+        // Test decoder caching for same schema ID
+        let schema_getter = Arc::new(MockSchemaGetter::new(vec![
+            DataTypes::int(),
+            DataTypes::string(),
+        ]));
+        let read_context = KvRecordReadContext::new(KvFormat::COMPACTED, schema_getter);
+
+        // Get decoder twice - should return the same instance (cached)
+        let decoder1 = read_context.get_row_decoder(42).unwrap();
+        let decoder2 = read_context.get_row_decoder(42).unwrap();
+
+        // Verify same instance (Arc pointer equality)
+        assert!(Arc::ptr_eq(&decoder1, &decoder2));
+
+        // Test different schema IDs get different decoders
+        let schema_getter = Arc::new(MockSchemaGetter::new(vec![DataTypes::int()]));
+        let read_context = KvRecordReadContext::new(KvFormat::COMPACTED, schema_getter);
+
+        let decoder1 = read_context.get_row_decoder(10).unwrap();
+        let decoder2 = read_context.get_row_decoder(20).unwrap();
+
+        // Should be different instances
+        assert!(!Arc::ptr_eq(&decoder1, &decoder2));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/record/kv/mod.rs b/fluss-rust/crates/fluss/src/record/kv/mod.rs
index ecb762df16..857c5e5fc9 100644
--- a/fluss-rust/crates/fluss/src/record/kv/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/mod.rs
@@ -20,10 +20,17 @@
 mod kv_record;
 mod kv_record_batch;
 mod kv_record_batch_builder;
+mod kv_record_read_context;
+mod read_context;
+
+#[cfg(test)]
+mod test_util;
 
 pub use kv_record::{KvRecord, LENGTH_LENGTH as KV_RECORD_LENGTH_LENGTH};
 pub use kv_record_batch::*;
 pub use kv_record_batch_builder::*;
+pub use kv_record_read_context::{KvRecordReadContext, SchemaGetter};
+pub use read_context::ReadContext;
 
 /// Current KV magic value
 pub const CURRENT_KV_MAGIC_VALUE: u8 = 0;
diff --git a/fluss-rust/crates/fluss/src/record/kv/read_context.rs b/fluss-rust/crates/fluss/src/record/kv/read_context.rs
new file mode 100644
index 0000000000..63502613d1
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/kv/read_context.rs
@@ -0,0 +1,45 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Read context for KV record batches.
+//!
+//! Provides schema and decoder information needed for typed record reading.
+
+use crate::error::Result;
+use crate::row::RowDecoder;
+use std::sync::Arc;
+
+/// Context for reading KV records with type information.
+///
+/// The ReadContext provides access to RowDecoders based on schema IDs,
+/// enabling typed deserialization of KV record values.
+///
+/// Reference: org.apache.fluss.record.KvRecordBatch.ReadContext
+pub trait ReadContext: Send + Sync {
+    /// Get the row decoder for the given schema ID.
+    ///
+    /// The decoder is typically cached, so repeated calls with the same
+    /// schema ID should return the same decoder instance.
+    ///
+    /// # Arguments
+    /// * `schema_id` - The schema ID for which to get the decoder
+    ///
+    /// # Returns
+    /// An Arc-wrapped RowDecoder for the specified schema, or an error if
+    /// the schema is invalid or cannot be retrieved
+    fn get_row_decoder(&self, schema_id: i16) -> Result<Arc<dyn RowDecoder>>;
+}
diff --git a/fluss-rust/crates/fluss/src/record/kv/test_util.rs b/fluss-rust/crates/fluss/src/record/kv/test_util.rs
new file mode 100644
index 0000000000..50ab911db2
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/kv/test_util.rs
@@ -0,0 +1,50 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Test utilities for KV record reading.
+
+use super::ReadContext;
+use crate::error::Result;
+use crate::metadata::{DataType, KvFormat, RowType};
+use crate::row::{RowDecoder, RowDecoderFactory};
+use std::sync::Arc;
+
+/// Simple test-only ReadContext that creates decoders directly from data types.
+///
+/// This bypasses the production Schema/SchemaGetter machinery for simpler tests.
+pub(crate) struct TestReadContext {
+    kv_format: KvFormat,
+    data_types: Vec<DataType>,
+}
+
+impl TestReadContext {
+    /// Create a test context for COMPACTED format (most common case).
+    pub(crate) fn compacted(data_types: Vec<DataType>) -> Self {
+        Self {
+            kv_format: KvFormat::COMPACTED,
+            data_types,
+        }
+    }
+}
+
+impl ReadContext for TestReadContext {
+    fn get_row_decoder(&self, _schema_id: i16) -> Result<Arc<dyn RowDecoder>> {
+        // Directly create decoder from data types - no Schema needed!
+        let row_type = RowType::with_data_types(self.data_types.clone());
+        RowDecoderFactory::create(self.kv_format.clone(), row_type)
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 3477f1de20..536409efde 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -23,11 +23,13 @@ pub mod binary;
 pub mod compacted;
 pub mod encode;
 mod field_getter;
+mod row_decoder;
 
 pub use column::*;
 pub use compacted::CompactedRow;
 pub use datum::*;
 pub use encode::KeyEncoder;
+pub use row_decoder::{CompactedRowDecoder, RowDecoder, RowDecoderFactory};
 
 pub trait BinaryRow: InternalRow {
     /// Returns the binary representation of this row as a byte slice.
diff --git a/fluss-rust/crates/fluss/src/row/row_decoder.rs b/fluss-rust/crates/fluss/src/row/row_decoder.rs
new file mode 100644
index 0000000000..9f9b4217a2
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/row_decoder.rs
@@ -0,0 +1,137 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Row decoder for deserializing binary row formats.
+//!
+//! Mirrors the Java org.apache.fluss.row.decode package.
+
+use crate::error::{Error, Result};
+use crate::metadata::{KvFormat, RowType};
+use crate::row::compacted::{CompactedRow, CompactedRowDeserializer};
+use std::sync::Arc;
+
+/// Decoder that turns the binary form of a row into a row object.
+///
+/// The trait abstracts over row formats (COMPACTED, INDEXED, etc.), although
+/// `decode` currently always returns a `CompactedRow`.
+///
+/// Reference: org.apache.fluss.row.decode.RowDecoder
+pub trait RowDecoder: Send + Sync {
+    /// Decode `data` into a `CompactedRow`.
+    ///
+    /// The lifetime `'a` ties the returned row to `data`, so the input
+    /// bytes must stay borrowed for as long as the row is used.
+    fn decode<'a>(&self, data: &'a [u8]) -> CompactedRow<'a>;
+}
+
+/// `RowDecoder` implementation for the COMPACTED row format.
+///
+/// A thin wrapper: it holds a shared `CompactedRowDeserializer` plus the row's
+/// field count and hands both to `CompactedRow::deserialize` on every decode.
+///
+/// Reference: org.apache.fluss.row.decode.CompactedRowDecoder
+pub struct CompactedRowDecoder {
+    field_count: usize,
+    deserializer: Arc<CompactedRowDeserializer<'static>>,
+}
+
+impl CompactedRowDecoder {
+    /// Build a decoder for rows laid out according to `row_type`.
+    ///
+    /// The field count is read first because `row_type` is then moved into
+    /// the shared deserializer.
+    pub fn new(row_type: RowType) -> Self {
+        Self {
+            field_count: row_type.fields().len(),
+            deserializer: Arc::new(CompactedRowDeserializer::new_from_owned(row_type)),
+        }
+    }
+}
+
+impl RowDecoder for CompactedRowDecoder {
+    fn decode<'a>(&self, data: &'a [u8]) -> CompactedRow<'a> {
+        let deserializer = Arc::clone(&self.deserializer);
+        CompactedRow::deserialize(deserializer, self.field_count, data)
+    }
+}
+
+/// Factory that selects a `RowDecoder` implementation from a `KvFormat`.
+///
+/// Reference: org.apache.fluss.row.decode.RowDecoder.create()
+pub struct RowDecoderFactory;
+
+impl RowDecoderFactory {
+    /// Build the decoder for `kv_format`; INDEXED yields `Error::UnsupportedOperation`.
+    pub fn create(kv_format: KvFormat, row_type: RowType) -> Result<Arc<dyn RowDecoder>> {
+        match kv_format {
+            KvFormat::INDEXED => Err(Error::UnsupportedOperation {
+                message: "INDEXED format is not yet supported".to_string(),
+            }),
+            KvFormat::COMPACTED => Ok(Arc::new(CompactedRowDecoder::new(row_type))),
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::DataTypes;
+    use crate::row::InternalRow;
+    use crate::row::binary::BinaryWriter;
+    use crate::row::compacted::CompactedRowWriter;
+
+    #[test]
+    fn test_compacted_row_decoder() {
+        // Serialize a two-field row (int, string) with the compacted writer
+        let mut writer = CompactedRowWriter::new(2);
+        writer.write_int(42);
+        writer.write_string("hello");
+
+        let data = writer.to_bytes();
+
+        // Build the decoder directly from the matching RowType
+        let row_type = RowType::with_data_types(vec![DataTypes::int(), DataTypes::string()]);
+        let decoder = CompactedRowDecoder::new(row_type);
+
+        // Decode the serialized bytes
+        let row = decoder.decode(&data);
+
+        // The decoded row must expose the field count and both written values
+        assert_eq!(row.get_field_count(), 2);
+        assert_eq!(row.get_int(0), 42);
+        assert_eq!(row.get_string(1), "hello");
+    }
+
+    #[test]
+    fn test_row_decoder_factory() {
+        let row_type = RowType::with_data_types(vec![DataTypes::int(), DataTypes::string()]);
+        let decoder = RowDecoderFactory::create(KvFormat::COMPACTED, row_type).unwrap();
+
+        // Serialize a two-field row (int, string) with the compacted writer
+        let mut writer = CompactedRowWriter::new(2);
+        writer.write_int(100);
+        writer.write_string("world");
+        let data = writer.to_bytes();
+
+        // Decode through the trait object returned by the factory
+        let row = decoder.decode(&data);
+
+        // Both written values must round-trip
+        assert_eq!(row.get_int(0), 100);
+        assert_eq!(row.get_string(1), "world");
+    }
+}

From f519ad9f840fbb3cf7c86458b20803c72f2dc7c5 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 18 Jan 2026 22:09:25 +0800
Subject: [PATCH 074/287] feat: introduce KvWriteBatch and PutKvRequest (#176)

---
 fluss-rust/bindings/python/src/table.rs       |  11 +-
 fluss-rust/crates/fluss/build.rs              |   5 +-
 .../crates/fluss/src/client/table/append.rs   |  11 +-
 .../src/client/table/log_fetch_buffer.rs      |   2 +-
 .../crates/fluss/src/client/table/scanner.rs  |   3 +-
 .../crates/fluss/src/client/table/writer.rs   |   5 +-
 .../fluss/src/client/write/accumulator.rs     |   7 +-
 .../crates/fluss/src/client/write/batch.rs    | 133 +++++++++++++++---
 .../crates/fluss/src/client/write/mod.rs      |  79 +++++++++--
 .../crates/fluss/src/client/write/sender.rs   |  15 +-
 .../crates/fluss/src/proto/fluss_api.proto    |  28 ++++
 fluss-rust/crates/fluss/src/record/arrow.rs   |  17 ++-
 .../src/record/kv/kv_record_batch_builder.rs  |  25 ++--
 .../src/record/kv/kv_record_read_context.rs   |   5 +-
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |   4 +
 .../crates/fluss/src/rpc/message/mod.rs       |   1 +
 .../fluss/src/rpc/message/produce_log.rs      |   2 +-
 .../crates/fluss/src/rpc/message/put_kv.rs    |  73 ++++++++++
 18 files changed, 360 insertions(+), 66 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/put_kv.rs

diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index db85c51f5a..773354e8d8 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -340,8 +340,7 @@ fn python_to_generic_row(
             .map(|n| n.to_string())
             .unwrap_or_else(|_| "unknown".to_string());
         FlussError::new_err(format!(
-            "Row must be a dict, list, or tuple; got {}",
-            type_name
+            "Row must be a dict, list, or tuple; got {type_name}"
         ))
     })?;
     let schema = table_info.row_type();
@@ -357,7 +356,7 @@ fn python_to_generic_row(
                         .name()
                         .map(|n| n.to_string())
                         .unwrap_or_else(|_| "unknown".to_string());
-                    FlussError::new_err(format!("Row dict keys must be strings; got {}", key_type))
+                    FlussError::new_err(format!("Row dict keys must be strings; got {key_type}"))
                 })?;
 
                 if fields.iter().all(|f| f.name() != key_str) {
@@ -367,8 +366,7 @@ fn python_to_generic_row(
                         .collect::<Vec<_>>()
                         .join(", ");
                     return Err(FlussError::new_err(format!(
-                        "Unknown field '{}'. Expected fields: {}",
-                        key_str, expected
+                        "Unknown field '{key_str}'. Expected fields: {expected}"
                     )));
                 }
             }
@@ -476,8 +474,7 @@ fn python_value_to_datum(
             }
         }
         _ => Err(FlussError::new_err(format!(
-            "Unsupported data type for row-level operations: {:?}",
-            data_type
+            "Unsupported data type for row-level operations: {data_type}"
         ))),
     }
 }
diff --git a/fluss-rust/crates/fluss/build.rs b/fluss-rust/crates/fluss/build.rs
index 1564313732..265208a7c3 100644
--- a/fluss-rust/crates/fluss/build.rs
+++ b/fluss-rust/crates/fluss/build.rs
@@ -19,7 +19,10 @@ use std::io::Result;
 
 fn main() -> Result<()> {
     let mut config = prost_build::Config::new();
-    config.bytes([".proto.PbProduceLogReqForBucket.records"]);
+    config.bytes([
+        ".proto.PbProduceLogReqForBucket.records",
+        ".proto.PbPutKvReqForBucket.records",
+    ]);
     config.compile_protos(&["src/proto/fluss_api.proto"], &["src/proto"])?;
     Ok(())
 }
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
index ad3e55e288..6d76f28b32 100644
--- a/fluss-rust/crates/fluss/src/client/table/append.rs
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -46,6 +46,7 @@ impl TableAppend {
         AppendWriter {
             table_path: Arc::new(self.table_path.clone()),
             writer_client: self.writer_client.clone(),
+            table_info: Arc::new(self.table_info.clone()),
         }
     }
 }
@@ -53,18 +54,24 @@ impl TableAppend {
 pub struct AppendWriter {
     table_path: Arc<TablePath>,
     writer_client: Arc<WriterClient>,
+    table_info: Arc<TableInfo>,
 }
 
 impl AppendWriter {
     pub async fn append(&self, row: GenericRow<'_>) -> Result<()> {
-        let record = WriteRecord::new(self.table_path.clone(), row);
+        let record =
+            WriteRecord::for_append(self.table_path.clone(), self.table_info.schema_id, row);
         let result_handle = self.writer_client.send(&record).await?;
         let result = result_handle.wait().await?;
         result_handle.result(result)
     }
 
     pub async fn append_arrow_batch(&self, batch: RecordBatch) -> Result<()> {
-        let record = WriteRecord::new_record_batch(self.table_path.clone(), batch);
+        let record = WriteRecord::for_append_record_batch(
+            self.table_path.clone(),
+            self.table_info.schema_id,
+            batch,
+        );
         let result_handle = self.writer_client.send(&record).await?;
         let result = result_handle.wait().await?;
         result_handle.result(result)
diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index fb6981f4b5..ac44cc1728 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -733,7 +733,7 @@ mod tests {
         let mut row = GenericRow::new();
         row.set_field(0, 1_i32);
         row.set_field(1, "alice");
-        let record = WriteRecord::new(table_path, row);
+        let record = WriteRecord::for_append(table_path, 1, row);
         builder.append(&record)?;
 
         let data = builder.build()?;
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 3e7d61ff99..e9b2ce106d 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -1446,8 +1446,9 @@ mod tests {
                 compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
             },
         );
-        let record = WriteRecord::new(
+        let record = WriteRecord::for_append(
             table_path,
+            1,
             GenericRow {
                 values: vec![Datum::Int32(1)],
             },
diff --git a/fluss-rust/crates/fluss/src/client/table/writer.rs b/fluss-rust/crates/fluss/src/client/table/writer.rs
index b2ba881b36..8a83b5e356 100644
--- a/fluss-rust/crates/fluss/src/client/table/writer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/writer.rs
@@ -43,6 +43,7 @@ pub struct AbstractTableWriter {
     table_path: Arc<TablePath>,
     writer_client: Arc<WriterClient>,
     field_count: i32,
+    schema_id: i32,
 }
 
 #[allow(dead_code)]
@@ -57,6 +58,7 @@ impl AbstractTableWriter {
             table_path: Arc::new(table_path),
             writer_client,
             field_count: table_info.row_type().fields().len() as i32,
+            schema_id: table_info.schema_id,
         }
     }
 
@@ -82,7 +84,8 @@ pub struct AppendWriterImpl {
 #[allow(dead_code)]
 impl AppendWriterImpl {
     pub async fn append(&self, row: GenericRow<'_>) -> Result<()> {
-        let record = WriteRecord::new(self.base.table_path.clone(), row);
+        let record =
+            WriteRecord::for_append(self.base.table_path.clone(), self.base.schema_id, row);
         self.base.send(&record).await
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 83f11ab782..0afc9d4bc1 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -17,7 +17,7 @@
 
 use crate::client::write::batch::WriteBatch::ArrowLog;
 use crate::client::write::batch::{ArrowLogWriteBatch, WriteBatch};
-use crate::client::{Record, ResultHandle, WriteRecord};
+use crate::client::{LogWriteRecord, Record, ResultHandle, WriteRecord};
 use crate::cluster::{BucketLocation, Cluster, ServerNode};
 use crate::config::Config;
 use crate::error::Result;
@@ -110,7 +110,7 @@ impl RecordAccumulator {
             row_type,
             bucket_id,
             current_time_ms(),
-            matches!(record.row, Record::RecordBatch(_)),
+            matches!(&record.record, Record::Log(LogWriteRecord::RecordBatch(_))),
         ));
 
         let batch_id = batch.batch_id();
@@ -541,8 +541,9 @@ mod tests {
         let accumulator = RecordAccumulator::new(config);
         let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
         let cluster = Arc::new(build_cluster(table_path.as_ref(), 1, 1));
-        let record = WriteRecord::new(
+        let record = WriteRecord::for_append(
             table_path.clone(),
+            1,
             GenericRow {
                 values: vec![Datum::Int32(1)],
             },
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index 1f54226f39..01597538c8 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -17,13 +17,13 @@
 
 use crate::BucketId;
 use crate::client::broadcast::{BatchWriteResult, BroadcastOnce};
-use crate::client::{ResultHandle, WriteRecord};
+use crate::client::{Record, ResultHandle, WriteRecord};
 use crate::compression::ArrowCompressionInfo;
-use crate::error::Result;
-use crate::metadata::{DataType, TablePath};
+use crate::error::{Error, Result};
+use crate::metadata::{DataType, KvFormat, TablePath};
 use crate::record::MemoryLogRecordsArrowBuilder;
+use crate::record::kv::KvRecordBatchBuilder;
 use bytes::Bytes;
-use parking_lot::Mutex;
 use std::cmp::max;
 use std::sync::atomic::{AtomicBool, AtomicI32, Ordering};
 
@@ -92,18 +92,28 @@ impl InnerWriteBatch {
 
 pub enum WriteBatch {
     ArrowLog(ArrowLogWriteBatch),
+    Kv(KvWriteBatch),
 }
 
 impl WriteBatch {
     pub fn inner_batch(&self) -> &InnerWriteBatch {
         match self {
             WriteBatch::ArrowLog(batch) => &batch.write_batch,
+            WriteBatch::Kv(batch) => &batch.write_batch,
+        }
+    }
+
+    pub fn inner_batch_mut(&mut self) -> &mut InnerWriteBatch {
+        match self {
+            WriteBatch::ArrowLog(batch) => &mut batch.write_batch,
+            WriteBatch::Kv(batch) => &mut batch.write_batch,
         }
     }
 
     pub fn try_append(&mut self, write_record: &WriteRecord) -> Result<Option<ResultHandle>> {
         match self {
             WriteBatch::ArrowLog(batch) => batch.try_append(write_record),
+            WriteBatch::Kv(batch) => batch.try_append(write_record),
         }
     }
 
@@ -111,11 +121,13 @@ impl WriteBatch {
         self.inner_batch().waited_time_ms(now)
     }
 
-    pub fn close(&mut self) {
+    pub fn close(&mut self) -> Result<()> {
         match self {
             WriteBatch::ArrowLog(batch) => {
                 batch.close();
+                Ok(())
             }
+            WriteBatch::Kv(batch) => batch.close(),
         }
     }
 
@@ -127,20 +139,18 @@ impl WriteBatch {
     pub fn is_closed(&self) -> bool {
         match self {
             WriteBatch::ArrowLog(batch) => batch.is_closed(),
+            WriteBatch::Kv(batch) => batch.is_closed(),
         }
     }
 
     pub fn drained(&mut self, now_ms: i64) {
-        match self {
-            WriteBatch::ArrowLog(batch) => {
-                batch.write_batch.drained(now_ms);
-            }
-        }
+        self.inner_batch_mut().drained(now_ms);
     }
 
-    pub fn build(&self) -> Result<Bytes> {
+    pub fn build(&mut self) -> Result<Bytes> {
         match self {
             WriteBatch::ArrowLog(batch) => batch.build(),
+            WriteBatch::Kv(batch) => batch.build(),
         }
     }
 
@@ -172,7 +182,7 @@ impl WriteBatch {
 pub struct ArrowLogWriteBatch {
     pub write_batch: InnerWriteBatch,
     pub arrow_builder: MemoryLogRecordsArrowBuilder,
-    built_records: Mutex<Option<Bytes>>,
+    built_records: Option<Bytes>,
 }
 
 impl ArrowLogWriteBatch {
@@ -196,7 +206,7 @@ impl ArrowLogWriteBatch {
                 to_append_record_batch,
                 arrow_compression_info,
             ),
-            built_records: Mutex::new(None),
+            built_records: None,
         }
     }
 
@@ -218,13 +228,12 @@ impl ArrowLogWriteBatch {
         }
     }
 
-    pub fn build(&self) -> Result<Bytes> {
-        let mut cached = self.built_records.lock();
-        if let Some(bytes) = cached.as_ref() {
+    pub fn build(&mut self) -> Result<Bytes> {
+        if let Some(bytes) = &self.built_records {
             return Ok(bytes.clone());
         }
         let bytes = Bytes::from(self.arrow_builder.build()?);
-        *cached = Some(bytes.clone());
+        self.built_records = Some(bytes.clone());
         Ok(bytes)
     }
 
@@ -237,6 +246,96 @@ impl ArrowLogWriteBatch {
     }
 }
 
+/// Write batch that accumulates KV records for one bucket of a table.
+pub struct KvWriteBatch {
+    write_batch: InnerWriteBatch,
+    kv_batch_builder: KvRecordBatchBuilder,
+    target_columns: Option<Vec<usize>>,
+    schema_id: i32,
+}
+
+impl KvWriteBatch {
+    /// Create a batch; appended records must match its `schema_id` and `target_columns`.
+    #[allow(clippy::too_many_arguments)]
+    pub fn new(
+        batch_id: i64,
+        table_path: TablePath,
+        schema_id: i32,
+        write_limit: usize,
+        kv_format: KvFormat,
+        bucket_id: BucketId,
+        target_columns: Option<Vec<usize>>,
+        create_ms: i64,
+    ) -> Self {
+        Self {
+            write_batch: InnerWriteBatch::new(batch_id, table_path, create_ms, bucket_id),
+            kv_batch_builder: KvRecordBatchBuilder::new(schema_id, write_limit, kv_format),
+            target_columns,
+            schema_id,
+        }
+    }
+
+    /// Try to add a KV record; `Ok(None)` means the batch is closed or has no room for it.
+    ///
+    /// Fails for non-KV records and for a schema id or target columns unlike the batch's.
+    pub fn try_append(&mut self, write_record: &WriteRecord) -> Result<Option<ResultHandle>> {
+        let Record::Kv(kv_write_record) = &write_record.record else {
+            return Err(Error::UnsupportedOperation {
+                message: "Only KvRecord is supported to append to KvWriteBatch".to_string(),
+            });
+        };
+
+        if self.schema_id != write_record.schema_id {
+            return Err(Error::UnexpectedError {
+                message: format!(
+                    "schema id {} of the write record to append is not the same as the current schema id {} in the batch.",
+                    write_record.schema_id, self.schema_id
+                ),
+                source: None,
+            });
+        }
+
+        if self.target_columns.as_deref() != kv_write_record.target_columns {
+            return Err(Error::UnexpectedError {
+                message: format!(
+                    "target columns {:?} of the write record to append are not the same as the current target columns {:?} in the batch.",
+                    kv_write_record.target_columns,
+                    self.target_columns.as_deref()
+                ),
+                source: None,
+            });
+        }
+
+        let key = kv_write_record.key;
+        let row = kv_write_record.compacted_row.as_ref();
+        if self.is_closed() || !self.kv_batch_builder.has_room_for_row(key, row) {
+            return Ok(None);
+        }
+        self.kv_batch_builder
+            .append_row(key, row)
+            .map_err(|e| Error::UnexpectedError {
+                message: "Failed to append row to KvWriteBatch".to_string(),
+                source: Some(Box::new(e)),
+            })?;
+        Ok(Some(ResultHandle::new(self.write_batch.results.receiver())))
+    }
+
+    /// Build the serialized batch by delegating to the underlying `KvRecordBatchBuilder`.
+    pub fn build(&mut self) -> Result<Bytes> {
+        self.kv_batch_builder.build()
+    }
+
+    /// Report whether the underlying builder has been closed.
+    pub fn is_closed(&self) -> bool {
+        self.kv_batch_builder.is_closed()
+    }
+
+    /// Close the underlying builder, propagating its error if it was already aborted.
+    pub fn close(&mut self) -> Result<()> {
+        self.kv_batch_builder.close()
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index 00a71c51fa..248218e076 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -21,7 +21,7 @@ mod batch;
 use crate::client::broadcast::{self as client_broadcast, BatchWriteResult, BroadcastOnceReceiver};
 use crate::error::Error;
 use crate::metadata::TablePath;
-use crate::row::GenericRow;
+use crate::row::{CompactedRow, GenericRow};
 pub use accumulator::*;
 use arrow::array::RecordBatch;
 use std::sync::Arc;
@@ -36,28 +36,91 @@ mod writer_client;
 pub use write_format::WriteFormat;
 pub use writer_client::WriterClient;
 
+#[allow(dead_code)]
 pub struct WriteRecord<'a> {
-    pub row: Record<'a>,
-    pub table_path: Arc<TablePath>,
+    record: Record<'a>,
+    table_path: Arc<TablePath>,
+    bucket_key: Option<&'a [u8]>,
+    schema_id: i32,
+    write_format: WriteFormat,
+}
+
+impl<'a> WriteRecord<'a> {
+    pub fn record(&self) -> &Record<'a> {
+        &self.record
+    }
 }
 
 pub enum Record<'a> {
-    Row(GenericRow<'a>),
+    Log(LogWriteRecord<'a>),
+    Kv(KvWriteRecord<'a>),
+}
+
+pub enum LogWriteRecord<'a> {
+    Generic(GenericRow<'a>),
     RecordBatch(Arc<RecordBatch>),
 }
 
+pub struct KvWriteRecord<'a> {
+    // Key bytes of the record; only valid for primary key tables.
+    key: &'a [u8],
+    target_columns: Option<&'a [usize]>,
+    compacted_row: Option<CompactedRow<'a>>,
+}
+
+impl<'a> KvWriteRecord<'a> {
+    fn new(
+        key: &'a [u8],
+        target_columns: Option<&'a [usize]>,
+        compacted_row: Option<CompactedRow<'a>>,
+    ) -> Self {
+        KvWriteRecord {
+            key,
+            target_columns,
+            compacted_row,
+        }
+    }
+}
+
 impl<'a> WriteRecord<'a> {
-    pub fn new(table_path: Arc<TablePath>, row: GenericRow<'a>) -> Self {
+    pub fn for_append(table_path: Arc<TablePath>, schema_id: i32, row: GenericRow<'a>) -> Self {
+        Self {
+            record: Record::Log(LogWriteRecord::Generic(row)),
+            table_path,
+            bucket_key: None,
+            schema_id,
+            write_format: WriteFormat::ArrowLog,
+        }
+    }
+
+    pub fn for_append_record_batch(
+        table_path: Arc<TablePath>,
+        schema_id: i32,
+        row: RecordBatch,
+    ) -> Self {
         Self {
-            row: Record::Row(row),
+            record: Record::Log(LogWriteRecord::RecordBatch(Arc::new(row))),
             table_path,
+            bucket_key: None,
+            schema_id,
+            write_format: WriteFormat::ArrowLog,
         }
     }
 
-    pub fn new_record_batch(table_path: Arc<TablePath>, row: RecordBatch) -> Self {
+    pub fn for_upsert(
+        table_path: Arc<TablePath>,
+        schema_id: i32,
+        bucket_key: &'a [u8],
+        key: &'a [u8],
+        target_columns: Option<&'a [usize]>,
+        row: CompactedRow<'a>,
+    ) -> Self {
         Self {
-            row: Record::RecordBatch(Arc::new(row)),
+            record: Record::Kv(KvWriteRecord::new(key, target_columns, Some(row))),
             table_path,
+            bucket_key: Some(bucket_key),
+            schema_id,
+            write_format: WriteFormat::CompactedKv,
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index ffac0af8ae..7ea24e30f6 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -178,9 +178,9 @@ impl Sender {
         };
 
         for (table_id, table_buckets) in write_batch_by_table {
-            let request_batches: Vec<&ReadyWriteBatch> = table_buckets
+            let mut request_batches: Vec<ReadyWriteBatch> = table_buckets
                 .iter()
-                .filter_map(|bucket| records_by_bucket.get(bucket))
+                .filter_map(|bucket| records_by_bucket.remove(bucket))
                 .collect();
             if request_batches.is_empty() {
                 continue;
@@ -189,7 +189,7 @@ impl Sender {
                 table_id,
                 acks,
                 self.max_request_timeout_ms,
-                request_batches.as_slice(),
+                &mut request_batches,
             ) {
                 Ok(request) => request,
                 Err(e) => {
@@ -205,6 +205,12 @@ impl Sender {
                 }
             };
 
+            // Put the batches back into records_by_bucket,
+            // since the response handler will use them.
+            for request_batch in request_batches {
+                records_by_bucket.insert(request_batch.table_bucket.clone(), request_batch);
+            }
+
             let response = match connection.request(request).await {
                 Ok(response) => response,
                 Err(e) => {
@@ -462,8 +468,9 @@ mod tests {
         cluster: Arc<Cluster>,
         table_path: Arc<TablePath>,
     ) -> Result<(ReadyWriteBatch, crate::client::ResultHandle)> {
-        let record = WriteRecord::new(
+        let record = WriteRecord::for_append(
             table_path,
+            1,
             GenericRow {
                 values: vec![Datum::Int32(1)],
             },
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index b4ae8405aa..eaee94c36c 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -119,6 +119,34 @@ message PbProduceLogRespForBucket {
   optional int64 base_offset = 5;
 }
 
+// put kv request and response
+message PutKvRequest {
+  required int32 acks = 1;
+  required int64 table_id = 2;
+  required int32 timeout_ms = 3;
+  // the indexes for the columns to write,
+  // if empty, means write all columns
+  repeated int32 target_columns = 4 [packed = true];
+  repeated PbPutKvReqForBucket buckets_req = 5;
+}
+
+message PutKvResponse {
+  repeated PbPutKvRespForBucket buckets_resp = 1;
+}
+
+message PbPutKvReqForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  required bytes records = 3;
+}
+
+message PbPutKvRespForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  optional int32 error_code = 3;
+  optional string error_message = 4;
+}
+
 message CreateTableRequest {
   required PbTablePath table_path = 1;
   required bytes table_json = 2;
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index b331ae9d7f..aa48376bb6 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -15,7 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::client::{Record, WriteRecord};
+use crate::client::{LogWriteRecord, Record, WriteRecord};
 use crate::compression::ArrowCompressionInfo;
 use crate::error::{Error, Result};
 use crate::metadata::DataType;
@@ -275,11 +275,16 @@ impl MemoryLogRecordsArrowBuilder {
     }
 
     pub fn append(&mut self, record: &WriteRecord) -> Result<bool> {
-        match &record.row {
-            Record::Row(row) => Ok(self.arrow_record_batch_builder.append(row)?),
-            Record::RecordBatch(record_batch) => Ok(self
-                .arrow_record_batch_builder
-                .append_batch(record_batch.clone())?),
+        match &record.record() {
+            Record::Log(log_write_record) => match log_write_record {
+                LogWriteRecord::Generic(row) => Ok(self.arrow_record_batch_builder.append(row)?),
+                LogWriteRecord::RecordBatch(record_batch) => Ok(self
+                    .arrow_record_batch_builder
+                    .append_batch(record_batch.clone())?),
+            },
+            Record::Kv(_) => Err(Error::UnsupportedOperation {
+                message: "Only LogRecord is supported to append".to_string(),
+            }),
         }
         // todo: consider write other change type
     }
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
index 636104d176..e3da8640f7 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
@@ -19,9 +19,7 @@
 //!
 //! This module provides the KvRecordBatchBuilder for building batches of KV records.
 
-use bytes::{Bytes, BytesMut};
-use std::io;
-
+use crate::error::{Error, Result};
 use crate::metadata::KvFormat;
 use crate::record::kv::kv_record::KvRecord;
 use crate::record::kv::kv_record_batch::{
@@ -31,6 +29,8 @@ use crate::record::kv::kv_record_batch::{
 };
 use crate::record::kv::{CURRENT_KV_MAGIC_VALUE, NO_BATCH_SEQUENCE, NO_WRITER_ID};
 use crate::row::BinaryRow;
+use bytes::{Bytes, BytesMut};
+use std::io;
 
 /// Builder for KvRecordBatch.
 ///
@@ -185,11 +185,12 @@ impl KvRecordBatchBuilder {
     /// built bytes may change if mutations occur between builds.
     ///
     /// Note: [`close`](Self::close) prevents further appends but does not prevent writer state modifications.
-    pub fn build(&mut self) -> io::Result<Bytes> {
+    pub fn build(&mut self) -> Result<Bytes> {
         if self.aborted {
-            return Err(io::Error::other(
-                "Attempting to build an aborted record batch",
-            ));
+            return Err(Error::UnexpectedError {
+                message: "Attempting to build an aborted record batch".to_string(),
+                source: None,
+            });
         }
 
         if let Some(ref cached) = self.built_buffer {
@@ -225,11 +226,13 @@ impl KvRecordBatchBuilder {
 
     /// Close the builder.
     /// After closing, no more records can be appended, but the batch can still be built.
-    pub fn close(&mut self) -> io::Result<()> {
+    pub fn close(&mut self) -> Result<()> {
         if self.aborted {
-            return Err(io::Error::other(
-                "Cannot close KvRecordBatchBuilder as it has already been aborted",
-            ));
+            return Err(Error::UnexpectedError {
+                message: "Cannot close KvRecordBatchBuilder as it has already been aborted"
+                    .to_string(),
+                source: None,
+            });
         }
         self.is_closed = true;
         Ok(())
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
index 2049c32680..fe6c6f0598 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
@@ -90,8 +90,7 @@ impl ReadContext for KvRecordReadContext {
             other => {
                 return Err(Error::IoUnexpectedError {
                     message: format!(
-                        "Schema {} has invalid row type: expected Row, got {:?}",
-                        schema_id, other
+                        "Schema {schema_id} has invalid row type: expected Row, got {other:?}"
                     ),
                     source: std::io::Error::new(
                         std::io::ErrorKind::InvalidData,
@@ -134,7 +133,7 @@ mod tests {
         fn new(data_types: Vec<crate::metadata::DataType>) -> Self {
             let mut builder = Schema::builder();
             for (i, dt) in data_types.iter().enumerate() {
-                builder = builder.column(&format!("field{}", i), dt.clone());
+                builder = builder.column(&format!("field{i}"), dt.clone());
             }
             let schema = builder.build().expect("Failed to build schema");
 
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index 9f9268e857..66e4beb8e4 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -30,6 +30,7 @@ pub enum ApiKey {
     TableExists,
     MetaData,
     ProduceLog,
+    PutKv,
     FetchLog,
     Lookup,
     ListOffsets,
@@ -54,6 +55,7 @@ impl From<i16> for ApiKey {
             1012 => ApiKey::MetaData,
             1014 => ApiKey::ProduceLog,
             1015 => ApiKey::FetchLog,
+            1016 => ApiKey::PutKv,
             1017 => ApiKey::Lookup,
             1021 => ApiKey::ListOffsets,
             1025 => ApiKey::GetFileSystemSecurityToken,
@@ -79,6 +81,7 @@ impl From<ApiKey> for i16 {
             ApiKey::MetaData => 1012,
             ApiKey::ProduceLog => 1014,
             ApiKey::FetchLog => 1015,
+            ApiKey::PutKv => 1016,
             ApiKey::Lookup => 1017,
             ApiKey::ListOffsets => 1021,
             ApiKey::GetFileSystemSecurityToken => 1025,
@@ -108,6 +111,7 @@ mod tests {
             (1012, ApiKey::MetaData),
             (1014, ApiKey::ProduceLog),
             (1015, ApiKey::FetchLog),
+            (1016, ApiKey::PutKv),
             (1017, ApiKey::Lookup),
             (1021, ApiKey::ListOffsets),
             (1025, ApiKey::GetFileSystemSecurityToken),
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 2fe506bc37..4e6c8e1eaf 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -36,6 +36,7 @@ mod list_offsets;
 mod list_tables;
 mod lookup;
 mod produce_log;
+mod put_kv;
 mod table_exists;
 mod update_metadata;
 
diff --git a/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
index eb725751c7..dab7ea9a57 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
@@ -37,7 +37,7 @@ impl ProduceLogRequest {
         table_id: i64,
         ack: i16,
         max_request_timeout_ms: i32,
-        ready_batches: &[&ReadyWriteBatch],
+        ready_batches: &mut [ReadyWriteBatch],
     ) -> FlussResult<Self> {
         let mut request = proto::ProduceLogRequest {
             table_id,
diff --git a/fluss-rust/crates/fluss/src/rpc/message/put_kv.rs b/fluss-rust/crates/fluss/src/rpc/message/put_kv.rs
new file mode 100644
index 0000000000..983faa6646
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/put_kv.rs
@@ -0,0 +1,73 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+use crate::client::ReadyWriteBatch;
+use crate::proto::{PbPutKvReqForBucket, PutKvResponse};
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::ReadError;
+use crate::rpc::frame::WriteError;
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[allow(dead_code)]
+pub struct PutKvRequest {
+    pub inner_request: proto::PutKvRequest,
+}
+
+#[allow(dead_code)]
+impl PutKvRequest {
+    pub fn new(
+        table_id: i64,
+        ack: i16,
+        max_request_timeout_ms: i32,
+        target_columns: Vec<i32>,
+        ready_batches: &mut [ReadyWriteBatch],
+    ) -> crate::error::Result<Self> {
+        let mut request = proto::PutKvRequest {
+            table_id,
+            acks: ack as i32,
+            timeout_ms: max_request_timeout_ms,
+            target_columns,
+            ..Default::default()
+        };
+        for ready_batch in ready_batches {
+            request.buckets_req.push(PbPutKvReqForBucket {
+                partition_id: ready_batch.table_bucket.partition_id(),
+                bucket_id: ready_batch.table_bucket.bucket_id(),
+                records: ready_batch.write_batch.build()?,
+            })
+        }
+
+        Ok(PutKvRequest {
+            inner_request: request,
+        })
+    }
+}
+
+impl RequestBody for PutKvRequest {
+    type ResponseBody = PutKvResponse;
+
+    const API_KEY: ApiKey = ApiKey::PutKv;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(PutKvRequest);
+impl_read_version_type!(PutKvResponse);

From db565f97e671cb81e7bd40e1eda64f6d527be440 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 19 Jan 2026 13:27:22 +0000
Subject: [PATCH 075/287] feat: support all basic datatypes in compacted key
 encoder(continuation) (#175)

---
 fluss-rust/crates/fluss/Cargo.toml            |   2 +-
 .../crates/fluss/src/metadata/datatype.rs     | 272 +++++++---
 .../crates/fluss/src/metadata/json_serde.rs   | 112 +++-
 fluss-rust/crates/fluss/src/record/arrow.rs   |  21 +-
 .../fluss/src/row/binary/binary_writer.rs     |  57 ++-
 fluss-rust/crates/fluss/src/row/column.rs     | 198 +++++++-
 .../src/row/compacted/compacted_key_writer.rs |   7 +
 .../fluss/src/row/compacted/compacted_row.rs  | 147 ++++--
 .../src/row/compacted/compacted_row_reader.rs |  72 ++-
 .../src/row/compacted/compacted_row_writer.rs | 125 ++++-
 fluss-rust/crates/fluss/src/row/datum.rs      | 181 ++++++-
 fluss-rust/crates/fluss/src/row/decimal.rs    | 477 ++++++++++++++++++
 .../src/row/encode/compacted_key_encoder.rs   | 175 ++++---
 .../crates/fluss/src/row/field_getter.rs      | 101 +++-
 fluss-rust/crates/fluss/src/row/mod.rs        |  63 ++-
 15 files changed, 1739 insertions(+), 271 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/row/decimal.rs

diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 8942ffc7db..c3bdd4475a 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -48,7 +48,7 @@ tokio = { workspace = true }
 parking_lot = "0.12"
 bytes = "1.10.1"
 dashmap = "6.1.0"
-rust_decimal = "1"
+bigdecimal = { version = "0.4", features = ["serde"] }
 ordered-float = { version = "5", features = ["serde"] }
 parse-display = "0.10"
 ref-cast = "1.0"
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index f1574665eb..e365237030 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -453,16 +453,40 @@ impl DecimalType {
 
     pub const DEFAULT_SCALE: u32 = 0;
 
-    pub fn new(precision: u32, scale: u32) -> Self {
+    pub fn new(precision: u32, scale: u32) -> Result<Self> {
         Self::with_nullable(true, precision, scale)
     }
 
-    pub fn with_nullable(nullable: bool, precision: u32, scale: u32) -> Self {
-        DecimalType {
+    /// Create a DecimalType with validation, returning an error if parameters are invalid.
+    pub fn with_nullable(nullable: bool, precision: u32, scale: u32) -> Result<Self> {
+        // Validate precision
+        if !(Self::MIN_PRECISION..=Self::MAX_PRECISION).contains(&precision) {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Decimal precision must be between {} and {} (both inclusive), got: {}",
+                    Self::MIN_PRECISION,
+                    Self::MAX_PRECISION,
+                    precision
+                ),
+            });
+        }
+        // Validate scale
+        // Note: MIN_SCALE is 0, and scale is u32, so scale >= MIN_SCALE is always true
+        if scale > precision {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Decimal scale must be between {} and the precision {} (both inclusive), got: {}",
+                    Self::MIN_SCALE,
+                    precision,
+                    scale
+                ),
+            });
+        }
+        Ok(DecimalType {
             nullable,
             precision,
             scale,
-        }
+        })
     }
 
     pub fn precision(&self) -> u32 {
@@ -475,6 +499,7 @@ impl DecimalType {
 
     pub fn as_non_nullable(&self) -> Self {
         Self::with_nullable(false, self.precision, self.scale)
+            .expect("Invalid decimal precision or scale")
     }
 }
 
@@ -531,7 +556,7 @@ pub struct TimeType {
 
 impl TimeType {
     fn default() -> Self {
-        Self::new(Self::DEFAULT_PRECISION)
+        Self::new(Self::DEFAULT_PRECISION).expect("Invalid default time precision")
     }
 }
 
@@ -542,15 +567,27 @@ impl TimeType {
 
     pub const DEFAULT_PRECISION: u32 = 0;
 
-    pub fn new(precision: u32) -> Self {
+    pub fn new(precision: u32) -> Result<Self> {
         Self::with_nullable(true, precision)
     }
 
-    pub fn with_nullable(nullable: bool, precision: u32) -> Self {
-        TimeType {
+    /// Create a TimeType with validation, returning an error if precision is invalid.
+    pub fn with_nullable(nullable: bool, precision: u32) -> Result<Self> {
+        // Validate precision
+        if !(Self::MIN_PRECISION..=Self::MAX_PRECISION).contains(&precision) {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Time precision must be between {} and {} (both inclusive), got: {}",
+                    Self::MIN_PRECISION,
+                    Self::MAX_PRECISION,
+                    precision
+                ),
+            });
+        }
+        Ok(TimeType {
             nullable,
             precision,
-        }
+        })
     }
 
     pub fn precision(&self) -> u32 {
@@ -558,7 +595,7 @@ impl TimeType {
     }
 
     pub fn as_non_nullable(&self) -> Self {
-        Self::with_nullable(false, self.precision)
+        Self::with_nullable(false, self.precision).expect("Invalid time precision")
     }
 }
 
@@ -580,7 +617,7 @@ pub struct TimestampType {
 
 impl Default for TimestampType {
     fn default() -> Self {
-        Self::new(Self::DEFAULT_PRECISION)
+        Self::new(Self::DEFAULT_PRECISION).expect("Invalid default timestamp precision")
     }
 }
 
@@ -591,15 +628,27 @@ impl TimestampType {
 
     pub const DEFAULT_PRECISION: u32 = 6;
 
-    pub fn new(precision: u32) -> Self {
+    pub fn new(precision: u32) -> Result<Self> {
         Self::with_nullable(true, precision)
     }
 
-    pub fn with_nullable(nullable: bool, precision: u32) -> Self {
-        TimestampType {
+    /// Create a TimestampType with validation, returning an error if precision is invalid.
+    pub fn with_nullable(nullable: bool, precision: u32) -> Result<Self> {
+        // Validate precision
+        if !(Self::MIN_PRECISION..=Self::MAX_PRECISION).contains(&precision) {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Timestamp precision must be between {} and {} (both inclusive), got: {}",
+                    Self::MIN_PRECISION,
+                    Self::MAX_PRECISION,
+                    precision
+                ),
+            });
+        }
+        Ok(TimestampType {
             nullable,
             precision,
-        }
+        })
     }
 
     pub fn precision(&self) -> u32 {
@@ -607,7 +656,7 @@ impl TimestampType {
     }
 
     pub fn as_non_nullable(&self) -> Self {
-        Self::with_nullable(false, self.precision)
+        Self::with_nullable(false, self.precision).expect("Invalid timestamp precision")
     }
 }
 
@@ -630,6 +679,7 @@ pub struct TimestampLTzType {
 impl Default for TimestampLTzType {
     fn default() -> Self {
         Self::new(Self::DEFAULT_PRECISION)
+            .expect("Invalid default timestamp with local time zone precision")
     }
 }
 
@@ -640,15 +690,27 @@ impl TimestampLTzType {
 
     pub const DEFAULT_PRECISION: u32 = 6;
 
-    pub fn new(precision: u32) -> Self {
+    pub fn new(precision: u32) -> Result<Self> {
         Self::with_nullable(true, precision)
     }
 
-    pub fn with_nullable(nullable: bool, precision: u32) -> Self {
-        TimestampLTzType {
+    /// Create a TimestampLTzType with validation, returning an error if precision is invalid.
+    pub fn with_nullable(nullable: bool, precision: u32) -> Result<Self> {
+        // Validate precision
+        if !(Self::MIN_PRECISION..=Self::MAX_PRECISION).contains(&precision) {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Timestamp with local time zone precision must be between {} and {} (both inclusive), got: {}",
+                    Self::MIN_PRECISION,
+                    Self::MAX_PRECISION,
+                    precision
+                ),
+            });
+        }
+        Ok(TimestampLTzType {
             nullable,
             precision,
-        }
+        })
     }
 
     pub fn precision(&self) -> u32 {
@@ -657,6 +719,7 @@ impl TimestampLTzType {
 
     pub fn as_non_nullable(&self) -> Self {
         Self::with_nullable(false, self.precision)
+            .expect("Invalid timestamp with local time zone precision")
     }
 }
 
@@ -985,7 +1048,7 @@ impl DataTypes {
     /// digits to the right of the decimal point in a number (=scale). `p` must have a value
     /// between 1 and 38 (both inclusive). `s` must have a value between 0 and `p` (both inclusive).
     pub fn decimal(precision: u32, scale: u32) -> DataType {
-        DataType::Decimal(DecimalType::new(precision, scale))
+        DataType::Decimal(DecimalType::new(precision, scale).expect("Invalid decimal parameters"))
     }
 
     pub fn date() -> DataType {
@@ -1000,7 +1063,7 @@ impl DataTypes {
     /// Data type of a time WITHOUT time zone `TIME(p)` where `p` is the number of digits
     /// of fractional seconds (=precision). `p` must have a value between 0 and 9 (both inclusive).
     pub fn time_with_precision(precision: u32) -> DataType {
-        DataType::Time(TimeType::new(precision))
+        DataType::Time(TimeType::new(precision).expect("Invalid time precision"))
     }
 
     /// Data type of a timestamp WITHOUT time zone `TIMESTAMP` with 6 digits of fractional
@@ -1013,7 +1076,7 @@ impl DataTypes {
     /// of digits of fractional seconds (=precision). `p` must have a value between 0 and 9
     /// (both inclusive).
     pub fn timestamp_with_precision(precision: u32) -> DataType {
-        DataType::Timestamp(TimestampType::new(precision))
+        DataType::Timestamp(TimestampType::new(precision).expect("Invalid timestamp precision"))
     }
 
     /// Data type of a timestamp WITH time zone `TIMESTAMP WITH TIME ZONE` with 6 digits of
@@ -1025,7 +1088,10 @@ impl DataTypes {
     /// Data type of a timestamp WITH time zone `TIMESTAMP WITH TIME ZONE(p)` where `p` is the number
     /// of digits of fractional seconds (=precision). `p` must have a value between 0 and 9 (both inclusive).
     pub fn timestamp_ltz_with_precision(precision: u32) -> DataType {
-        DataType::TimestampLTz(TimestampLTzType::new(precision))
+        DataType::TimestampLTz(
+            TimestampLTzType::new(precision)
+                .expect("Invalid timestamp with local time zone precision"),
+        )
     }
 
     /// Data type of an array of elements with same subtype.
@@ -1100,82 +1166,56 @@ impl Display for DataField {
 }
 
 #[test]
-fn test_boolean_display() {
+fn test_primitive_types_display() {
+    // Test simple primitive types with nullable and non-nullable variants
     assert_eq!(BooleanType::new().to_string(), "BOOLEAN");
     assert_eq!(
         BooleanType::with_nullable(false).to_string(),
         "BOOLEAN NOT NULL"
     );
-}
 
-#[test]
-fn test_tinyint_display() {
     assert_eq!(TinyIntType::new().to_string(), "TINYINT");
     assert_eq!(
         TinyIntType::with_nullable(false).to_string(),
         "TINYINT NOT NULL"
     );
-}
 
-#[test]
-fn test_smallint_display() {
     assert_eq!(SmallIntType::new().to_string(), "SMALLINT");
     assert_eq!(
         SmallIntType::with_nullable(false).to_string(),
         "SMALLINT NOT NULL"
     );
-}
 
-#[test]
-fn test_int_display() {
     assert_eq!(IntType::new().to_string(), "INT");
     assert_eq!(IntType::with_nullable(false).to_string(), "INT NOT NULL");
-}
 
-#[test]
-fn test_bigint_display() {
     assert_eq!(BigIntType::new().to_string(), "BIGINT");
     assert_eq!(
         BigIntType::with_nullable(false).to_string(),
         "BIGINT NOT NULL"
     );
-}
 
-#[test]
-fn test_float_display() {
     assert_eq!(FloatType::new().to_string(), "FLOAT");
     assert_eq!(
         FloatType::with_nullable(false).to_string(),
         "FLOAT NOT NULL"
     );
-}
 
-#[test]
-fn test_double_display() {
     assert_eq!(DoubleType::new().to_string(), "DOUBLE");
     assert_eq!(
         DoubleType::with_nullable(false).to_string(),
         "DOUBLE NOT NULL"
     );
-}
 
-#[test]
-fn test_string_display() {
     assert_eq!(StringType::new().to_string(), "STRING");
     assert_eq!(
         StringType::with_nullable(false).to_string(),
         "STRING NOT NULL"
     );
-}
 
-#[test]
-fn test_date_display() {
     assert_eq!(DateType::new().to_string(), "DATE");
     assert_eq!(DateType::with_nullable(false).to_string(), "DATE NOT NULL");
-}
 
-#[test]
-fn test_bytes_display() {
     assert_eq!(BytesType::new().to_string(), "BYTES");
     assert_eq!(
         BytesType::with_nullable(false).to_string(),
@@ -1184,59 +1224,58 @@ fn test_bytes_display() {
 }
 
 #[test]
-fn test_char_display() {
+fn test_parameterized_types_display() {
+    // Test types with parameters (length, precision, scale, etc.)
     assert_eq!(CharType::new(10).to_string(), "CHAR(10)");
     assert_eq!(
         CharType::with_nullable(20, false).to_string(),
         "CHAR(20) NOT NULL"
     );
-}
 
-#[test]
-fn test_decimal_display() {
-    assert_eq!(DecimalType::new(10, 2).to_string(), "DECIMAL(10, 2)");
+    assert_eq!(BinaryType::new(100).to_string(), "BINARY(100)");
+    assert_eq!(
+        BinaryType::with_nullable(false, 256).to_string(),
+        "BINARY(256) NOT NULL"
+    );
+
     assert_eq!(
-        DecimalType::with_nullable(false, 38, 10).to_string(),
+        DecimalType::new(10, 2).unwrap().to_string(),
+        "DECIMAL(10, 2)"
+    );
+    assert_eq!(
+        DecimalType::with_nullable(false, 38, 10)
+            .unwrap()
+            .to_string(),
         "DECIMAL(38, 10) NOT NULL"
     );
-}
 
-#[test]
-fn test_time_display() {
-    assert_eq!(TimeType::new(0).to_string(), "TIME(0)");
-    assert_eq!(TimeType::new(3).to_string(), "TIME(3)");
+    assert_eq!(TimeType::new(0).unwrap().to_string(), "TIME(0)");
+    assert_eq!(TimeType::new(3).unwrap().to_string(), "TIME(3)");
     assert_eq!(
-        TimeType::with_nullable(false, 9).to_string(),
+        TimeType::with_nullable(false, 9).unwrap().to_string(),
         "TIME(9) NOT NULL"
     );
-}
 
-#[test]
-fn test_timestamp_display() {
-    assert_eq!(TimestampType::new(6).to_string(), "TIMESTAMP(6)");
-    assert_eq!(TimestampType::new(0).to_string(), "TIMESTAMP(0)");
+    assert_eq!(TimestampType::new(6).unwrap().to_string(), "TIMESTAMP(6)");
+    assert_eq!(TimestampType::new(0).unwrap().to_string(), "TIMESTAMP(0)");
     assert_eq!(
-        TimestampType::with_nullable(false, 9).to_string(),
+        TimestampType::with_nullable(false, 9).unwrap().to_string(),
         "TIMESTAMP(9) NOT NULL"
     );
-}
 
-#[test]
-fn test_timestamp_ltz_display() {
-    assert_eq!(TimestampLTzType::new(6).to_string(), "TIMESTAMP_LTZ(6)");
-    assert_eq!(TimestampLTzType::new(3).to_string(), "TIMESTAMP_LTZ(3)");
     assert_eq!(
-        TimestampLTzType::with_nullable(false, 9).to_string(),
-        "TIMESTAMP_LTZ(9) NOT NULL"
+        TimestampLTzType::new(6).unwrap().to_string(),
+        "TIMESTAMP_LTZ(6)"
     );
-}
-
-#[test]
-fn test_binary_display() {
-    assert_eq!(BinaryType::new(100).to_string(), "BINARY(100)");
     assert_eq!(
-        BinaryType::with_nullable(false, 256).to_string(),
-        "BINARY(256) NOT NULL"
+        TimestampLTzType::new(3).unwrap().to_string(),
+        "TIMESTAMP_LTZ(3)"
+    );
+    assert_eq!(
+        TimestampLTzType::with_nullable(false, 9)
+            .unwrap()
+            .to_string(),
+        "TIMESTAMP_LTZ(9) NOT NULL"
     );
 }
 
@@ -1352,3 +1391,68 @@ fn test_deeply_nested_types() {
     ));
     assert_eq!(nested.to_string(), "ARRAY<MAP<STRING, ROW<x INT, y INT>>>");
 }
+
+#[test]
+fn test_decimal_invalid_precision() {
+    // DecimalType::with_nullable should return an error for invalid precision
+    let result = DecimalType::with_nullable(true, 50, 2);
+    assert!(result.is_err());
+    assert!(
+        result
+            .unwrap_err()
+            .to_string()
+            .contains("Decimal precision must be between 1 and 38")
+    );
+}
+
+#[test]
+fn test_decimal_invalid_scale() {
+    // DecimalType::with_nullable should return an error when scale > precision
+    let result = DecimalType::with_nullable(true, 10, 15);
+    assert!(result.is_err());
+    assert!(
+        result
+            .unwrap_err()
+            .to_string()
+            .contains("Decimal scale must be between 0 and the precision 10")
+    );
+}
+
+#[test]
+fn test_time_invalid_precision() {
+    // TimeType::with_nullable should return an error for invalid precision
+    let result = TimeType::with_nullable(true, 10);
+    assert!(result.is_err());
+    assert!(
+        result
+            .unwrap_err()
+            .to_string()
+            .contains("Time precision must be between 0 and 9")
+    );
+}
+
+#[test]
+fn test_timestamp_invalid_precision() {
+    // TimestampType::with_nullable should return an error for invalid precision
+    let result = TimestampType::with_nullable(true, 10);
+    assert!(result.is_err());
+    assert!(
+        result
+            .unwrap_err()
+            .to_string()
+            .contains("Timestamp precision must be between 0 and 9")
+    );
+}
+
+#[test]
+fn test_timestamp_ltz_invalid_precision() {
+    // TimestampLTzType::with_nullable should return an error for invalid precision
+    let result = TimestampLTzType::with_nullable(true, 10);
+    assert!(result.is_err());
+    assert!(
+        result
+            .unwrap_err()
+            .to_string()
+            .contains("Timestamp with local time zone precision must be between 0 and 9")
+    );
+}
diff --git a/fluss-rust/crates/fluss/src/metadata/json_serde.rs b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
index 7d94e194e2..faa5583bed 100644
--- a/fluss-rust/crates/fluss/src/metadata/json_serde.rs
+++ b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
@@ -202,7 +202,12 @@ impl JsonSerde for DataType {
                     .get(Self::FIELD_NAME_SCALE)
                     .and_then(|v| v.as_u64())
                     .unwrap_or(0) as u32;
-                DataTypes::decimal(precision, scale)
+                DataType::Decimal(
+                    crate::metadata::datatype::DecimalType::with_nullable(true, precision, scale)
+                        .map_err(|e| Error::JsonSerdeError {
+                        message: format!("Invalid DECIMAL parameters: {}", e),
+                    })?,
+                )
             }
             "DATE" => DataTypes::date(),
             "TIME_WITHOUT_TIME_ZONE" => {
@@ -210,21 +215,43 @@ impl JsonSerde for DataType {
                     .get(Self::FIELD_NAME_PRECISION)
                     .and_then(|v| v.as_u64())
                     .unwrap_or(0) as u32;
-                DataTypes::time_with_precision(precision)
+                DataType::Time(
+                    crate::metadata::datatype::TimeType::with_nullable(true, precision).map_err(
+                        |e| Error::JsonSerdeError {
+                            message: format!("Invalid TIME_WITHOUT_TIME_ZONE precision: {}", e),
+                        },
+                    )?,
+                )
             }
             "TIMESTAMP_WITHOUT_TIME_ZONE" => {
                 let precision = node
                     .get(Self::FIELD_NAME_PRECISION)
                     .and_then(|v| v.as_u64())
                     .unwrap_or(6) as u32;
-                DataTypes::timestamp_with_precision(precision)
+                DataType::Timestamp(
+                    crate::metadata::datatype::TimestampType::with_nullable(true, precision)
+                        .map_err(|e| Error::JsonSerdeError {
+                            message: format!(
+                                "Invalid TIMESTAMP_WITHOUT_TIME_ZONE precision: {}",
+                                e
+                            ),
+                        })?,
+                )
             }
             "TIMESTAMP_WITH_LOCAL_TIME_ZONE" => {
                 let precision = node
                     .get(Self::FIELD_NAME_PRECISION)
                     .and_then(|v| v.as_u64())
                     .unwrap_or(6) as u32;
-                DataTypes::timestamp_ltz_with_precision(precision)
+                DataType::TimestampLTz(
+                    crate::metadata::datatype::TimestampLTzType::with_nullable(true, precision)
+                        .map_err(|e| Error::JsonSerdeError {
+                            message: format!(
+                                "Invalid TIMESTAMP_WITH_LOCAL_TIME_ZONE precision: {}",
+                                e
+                            ),
+                        })?,
+                )
             }
             "BYTES" => DataTypes::bytes(),
             "BINARY" => {
@@ -689,4 +716,81 @@ mod tests {
             assert_eq!(dt, deserialized);
         }
     }
+
+    #[test]
+    fn test_invalid_datatype_validation() {
+        use serde_json::json;
+
+        // Invalid DECIMAL precision (> 38)
+        let invalid_decimal = json!({
+            "type": "DECIMAL",
+            "precision": 50,
+            "scale": 2
+        });
+        let result = DataType::deserialize_json(&invalid_decimal);
+        assert!(result.is_err());
+        assert!(
+            result
+                .unwrap_err()
+                .to_string()
+                .contains("Invalid DECIMAL parameters")
+        );
+
+        // Invalid TIME precision (> 9)
+        let invalid_time = json!({
+            "type": "TIME_WITHOUT_TIME_ZONE",
+            "precision": 15
+        });
+        let result = DataType::deserialize_json(&invalid_time);
+        assert!(result.is_err());
+        assert!(
+            result
+                .unwrap_err()
+                .to_string()
+                .contains("Invalid TIME_WITHOUT_TIME_ZONE precision")
+        );
+
+        // Invalid TIMESTAMP precision (> 9)
+        let invalid_timestamp = json!({
+            "type": "TIMESTAMP_WITHOUT_TIME_ZONE",
+            "precision": 20
+        });
+        let result = DataType::deserialize_json(&invalid_timestamp);
+        assert!(result.is_err());
+        assert!(
+            result
+                .unwrap_err()
+                .to_string()
+                .contains("Invalid TIMESTAMP_WITHOUT_TIME_ZONE precision")
+        );
+
+        // Invalid TIMESTAMP_LTZ precision (> 9)
+        let invalid_timestamp_ltz = json!({
+            "type": "TIMESTAMP_WITH_LOCAL_TIME_ZONE",
+            "precision": 10
+        });
+        let result = DataType::deserialize_json(&invalid_timestamp_ltz);
+        assert!(result.is_err());
+        assert!(
+            result
+                .unwrap_err()
+                .to_string()
+                .contains("Invalid TIMESTAMP_WITH_LOCAL_TIME_ZONE precision")
+        );
+
+        // Invalid DECIMAL scale (> precision)
+        let invalid_decimal_scale = json!({
+            "type": "DECIMAL",
+            "precision": 10,
+            "scale": 15
+        });
+        let result = DataType::deserialize_json(&invalid_decimal_scale);
+        assert!(result.is_err());
+        assert!(
+            result
+                .unwrap_err()
+                .to_string()
+                .contains("Invalid DECIMAL parameters")
+        );
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index aa48376bb6..3c46f9b5cd 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -1061,8 +1061,7 @@ pub struct MyVec<T>(pub StreamReader<T>);
 mod tests {
     use super::*;
     use crate::error::Error;
-    use crate::metadata::DataField;
-    use crate::metadata::DataTypes;
+    use crate::metadata::{DataField, DataTypes};
 
     #[test]
     fn test_to_array_type() {
@@ -1166,24 +1165,6 @@ mod tests {
         );
     }
 
-    #[test]
-    #[should_panic(expected = "Invalid precision value for TimeType: 10")]
-    fn test_time_invalid_precision() {
-        to_arrow_type(&DataTypes::time_with_precision(10));
-    }
-
-    #[test]
-    #[should_panic(expected = "Invalid precision value for TimestampType: 10")]
-    fn test_timestamp_invalid_precision() {
-        to_arrow_type(&DataTypes::timestamp_with_precision(10));
-    }
-
-    #[test]
-    #[should_panic(expected = "Invalid precision value for TimestampLTzType: 10")]
-    fn test_timestamp_ltz_invalid_precision() {
-        to_arrow_type(&DataTypes::timestamp_ltz_with_precision(10));
-    }
-
     #[test]
     fn test_parse_ipc_message() {
         let empty_body: &[u8] = &le_bytes(&[0xFFFFFFFF, 0x00000000]);
diff --git a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
index 9917c7b76a..af2765c445 100644
--- a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
@@ -52,14 +52,20 @@ pub trait BinaryWriter {
 
     fn write_binary(&mut self, bytes: &[u8], length: usize);
 
-    // TODO Decimal type
-    // fn write_decimal(&mut self, pos: i32, value: f64);
+    fn write_decimal(&mut self, value: &crate::row::Decimal, precision: u32);
 
-    // TODO Timestamp type
-    // fn write_timestamp_ntz(&mut self, pos: i32, value: i64);
+    /// Writes a TIME value.
+    ///
+    /// Note: TIME is physically stored as an i32 (milliseconds since midnight).
+    /// This method exists for type safety and semantic clarity, even though it's
+    /// currently equivalent to `write_int()`. The precision parameter is accepted
+    /// for API consistency with TIMESTAMP types, though TIME encoding doesn't
+    /// currently vary by precision.
+    fn write_time(&mut self, value: i32, precision: u32);
 
-    // TODO Timestamp type
-    // fn write_timestamp_ltz(&mut self, pos: i32, value: i64);
+    fn write_timestamp_ntz(&mut self, value: &crate::row::datum::TimestampNtz, precision: u32);
+
+    fn write_timestamp_ltz(&mut self, value: &crate::row::datum::TimestampLtz, precision: u32);
 
     // TODO InternalArray, ArraySerializer
     // fn write_array(&mut self, pos: i32, value: i64);
@@ -125,7 +131,12 @@ pub enum InnerValueWriter {
     BigInt,
     Float,
     Double,
-    // TODO Decimal, Date, TimeWithoutTimeZone, TimestampWithoutTimeZone, TimestampWithLocalTimeZone, Array, Row
+    Decimal(u32, u32), // precision, scale
+    Date,
+    Time(u32),         // precision (not used in wire format, but kept for consistency)
+    TimestampNtz(u32), // precision
+    TimestampLtz(u32), // precision
+                       // TODO Array, Row
 }
 
 /// Accessor for writing the fields/elements of a binary writer during runtime, the
@@ -147,6 +158,23 @@ impl InnerValueWriter {
             DataType::BigInt(_) => Ok(InnerValueWriter::BigInt),
             DataType::Float(_) => Ok(InnerValueWriter::Float),
             DataType::Double(_) => Ok(InnerValueWriter::Double),
+            DataType::Decimal(d) => {
+                // Validation is done at DecimalType construction time
+                Ok(InnerValueWriter::Decimal(d.precision(), d.scale()))
+            }
+            DataType::Date(_) => Ok(InnerValueWriter::Date),
+            DataType::Time(t) => {
+                // Validation is done at TimeType construction time
+                Ok(InnerValueWriter::Time(t.precision()))
+            }
+            DataType::Timestamp(t) => {
+                // Validation is done at TimestampType construction time
+                Ok(InnerValueWriter::TimestampNtz(t.precision()))
+            }
+            DataType::TimestampLTz(t) => {
+                // Validation is done at TimestampLTzType construction time
+                Ok(InnerValueWriter::TimestampLtz(t.precision()))
+            }
             _ => unimplemented!(
                 "ValueWriter for DataType {:?} is currently not implemented",
                 data_type
@@ -194,6 +222,21 @@ impl InnerValueWriter {
             (InnerValueWriter::Double, Datum::Float64(v)) => {
                 writer.write_double(v.into_inner());
             }
+            (InnerValueWriter::Decimal(p, _s), Datum::Decimal(v)) => {
+                writer.write_decimal(v, *p);
+            }
+            (InnerValueWriter::Date, Datum::Date(d)) => {
+                writer.write_int(d.get_inner());
+            }
+            (InnerValueWriter::Time(p), Datum::Time(t)) => {
+                writer.write_time(t.get_inner(), *p);
+            }
+            (InnerValueWriter::TimestampNtz(p), Datum::TimestampNtz(ts)) => {
+                writer.write_timestamp_ntz(ts, *p);
+            }
+            (InnerValueWriter::TimestampLtz(p), Datum::TimestampLtz(ts)) => {
+                writer.write_timestamp_ltz(ts, *p);
+            }
             _ => {
                 return Err(IllegalArgument {
                     message: format!("{self:?} used to write value {value:?}"),
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 90437c11aa..615e038454 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -17,9 +17,10 @@
 
 use crate::row::InternalRow;
 use arrow::array::{
-    AsArray, BinaryArray, FixedSizeBinaryArray, Float32Array, Float64Array, Int8Array, Int16Array,
-    Int32Array, Int64Array, RecordBatch, StringArray,
+    Array, AsArray, BinaryArray, Decimal128Array, FixedSizeBinaryArray, Float32Array, Float64Array,
+    Int8Array, Int16Array, Int32Array, Int64Array, RecordBatch, StringArray,
 };
+use arrow::datatypes::{DataType as ArrowDataType, TimeUnit};
 use std::sync::Arc;
 
 #[derive(Clone)]
@@ -54,6 +55,49 @@ impl ColumnarRow {
     pub fn get_record_batch(&self) -> &RecordBatch {
         &self.record_batch
     }
+
+    /// Reads the timestamp at `pos`, splitting it into (millis, nano-of-millisecond) by the
+    /// Arrow column's TimeUnit. Like Java, `_precision` is ignored. Panics on non-Timestamp columns.
+    fn read_timestamp_from_arrow<T>(
+        &self,
+        pos: usize,
+        _precision: u32,
+        construct_compact: impl FnOnce(i64) -> T,
+        construct_with_nanos: impl FnOnce(i64, i32) -> crate::error::Result<T>,
+    ) -> T {
+        let schema = self.record_batch.schema();
+        let arrow_field = schema.field(pos);
+        let value = self.get_long(pos);
+
+        match arrow_field.data_type() {
+            ArrowDataType::Timestamp(time_unit, _) => {
+                // Euclidean division keeps the sub-millisecond remainder in [0, 999_999] for
+                // pre-epoch (negative) values; truncating `/` and `%` would make it negative.
+                let (millis, nanos) = match time_unit {
+                    TimeUnit::Second => (value * 1000, 0),
+                    TimeUnit::Millisecond => (value, 0),
+                    TimeUnit::Microsecond => {
+                        let millis = value.div_euclid(1000);
+                        let nanos = (value.rem_euclid(1000) * 1000) as i32;
+                        (millis, nanos)
+                    }
+                    TimeUnit::Nanosecond => {
+                        let millis = value.div_euclid(1_000_000);
+                        let nanos = value.rem_euclid(1_000_000) as i32;
+                        (millis, nanos)
+                    }
+                };
+
+                if nanos == 0 {
+                    construct_compact(millis)
+                } else {
+                    construct_with_nanos(millis, nanos)
+                        .expect("nanos in valid range by construction")
+                }
+            }
+            other => panic!("Expected Timestamp column at position {pos}, got {other:?}"),
+        }
+    }
 }
 
 impl InternalRow for ColumnarRow {
@@ -126,6 +170,88 @@ impl InternalRow for ColumnarRow {
             .value(self.row_id)
     }
 
+    /// Reads the Decimal128 value at `pos` for the current row and converts it into a Fluss
+    /// `Decimal` with the requested `precision` and `scale`. Panics if the column is not
+    /// Decimal128 or if the conversion fails.
+    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> crate::row::Decimal {
+        use arrow::datatypes::DataType;
+
+        let row = self.row_id;
+        let column = self.record_batch.column(pos);
+        let Some(array) = column.as_any().downcast_ref::<Decimal128Array>() else {
+            panic!(
+                "Expected Decimal128Array at column {}, found: {:?}",
+                pos,
+                column.data_type()
+            )
+        };
+
+        // Callers are expected to consult is_null_at() first; reading a null slot breaks
+        // that contract and is only detected in debug builds.
+        debug_assert!(
+            !array.is_null(row),
+            "get_decimal called on null value at pos {} row {}",
+            pos,
+            row
+        );
+
+        // The scale of the stored value comes from the Arrow schema, not from the caller.
+        let schema = self.record_batch.schema();
+        let arrow_scale = match schema.field(pos).data_type() {
+            DataType::Decimal128(_, s) => i64::from(*s),
+            dt => panic!(
+                "Expected Decimal128 data type at column {}, found: {:?}",
+                pos, dt
+            ),
+        };
+
+        // Rescale/validate into a Fluss Decimal with the requested precision and scale.
+        let converted = crate::row::Decimal::from_arrow_decimal128(
+            array.value(row),
+            arrow_scale,
+            precision as u32,
+            scale as u32,
+        );
+
+        match converted {
+            Ok(decimal) => decimal,
+            Err(e) => panic!(
+                "Failed to create Decimal at column {} row {}: {}",
+                pos, row, e
+            ),
+        }
+    }
+
+    fn get_date(&self, pos: usize) -> crate::row::datum::Date {
+        crate::row::datum::Date::new(self.get_int(pos))
+    }
+
+    fn get_time(&self, pos: usize) -> crate::row::datum::Time {
+        crate::row::datum::Time::new(self.get_int(pos))
+    }
+
+    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampNtz {
+        // `precision` is passed through but not used for the conversion: as in Java's
+        // ArrowTimestampNtzColumnVector, the Arrow column's TimeUnit decides the scaling.
+        self.read_timestamp_from_arrow(
+            pos,
+            precision,
+            crate::row::datum::TimestampNtz::new,
+            crate::row::datum::TimestampNtz::from_millis_nanos,
+        )
+    }
+
+    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampLtz {
+        // `precision` is passed through but not used for the conversion: as in Java's
+        // ArrowTimestampLtzColumnVector, the Arrow column's TimeUnit decides the scaling.
+        self.read_timestamp_from_arrow(
+            pos,
+            precision,
+            crate::row::datum::TimestampLtz::new,
+            crate::row::datum::TimestampLtz::from_millis_nanos,
+        )
+    }
+
     fn get_char(&self, pos: usize, _length: usize) -> &str {
         let array = self
             .record_batch
@@ -229,4 +355,72 @@ mod tests {
         row.set_row_id(0);
         assert_eq!(row.get_row_id(), 0);
     }
+
+    #[test]
+    fn columnar_row_reads_decimal() {
+        use arrow::datatypes::DataType;
+        use bigdecimal::{BigDecimal, num_bigint::BigInt};
+
+        // Test with Decimal128
+        let schema = Arc::new(Schema::new(vec![
+            Field::new("dec1", DataType::Decimal128(10, 2), false),
+            Field::new("dec2", DataType::Decimal128(20, 5), false),
+            Field::new("dec3", DataType::Decimal128(38, 10), false),
+        ]));
+
+        // Create decimal values: 123.45, 12345.67890, large decimal
+        let dec1_val = 12345i128; // 123.45 with scale 2
+        let dec2_val = 1234567890i128; // 12345.67890 with scale 5
+        let dec3_val = 999999999999999999i128; // Large value (18 nines) with scale 10
+
+        let batch = RecordBatch::try_new(
+            schema,
+            vec![
+                Arc::new(
+                    Decimal128Array::from(vec![dec1_val])
+                        .with_precision_and_scale(10, 2)
+                        .unwrap(),
+                ),
+                Arc::new(
+                    Decimal128Array::from(vec![dec2_val])
+                        .with_precision_and_scale(20, 5)
+                        .unwrap(),
+                ),
+                Arc::new(
+                    Decimal128Array::from(vec![dec3_val])
+                        .with_precision_and_scale(38, 10)
+                        .unwrap(),
+                ),
+            ],
+        )
+        .expect("record batch");
+
+        let row = ColumnarRow::new(Arc::new(batch));
+        assert_eq!(row.get_field_count(), 3);
+
+        // Verify decimal values
+        assert_eq!(
+            row.get_decimal(0, 10, 2),
+            crate::row::Decimal::from_big_decimal(BigDecimal::new(BigInt::from(12345), 2), 10, 2)
+                .unwrap()
+        );
+        assert_eq!(
+            row.get_decimal(1, 20, 5),
+            crate::row::Decimal::from_big_decimal(
+                BigDecimal::new(BigInt::from(1234567890), 5),
+                20,
+                5
+            )
+            .unwrap()
+        );
+        assert_eq!(
+            row.get_decimal(2, 38, 10),
+            crate::row::Decimal::from_big_decimal(
+                BigDecimal::new(BigInt::from(999999999999999999i128), 10),
+                38,
+                10
+            )
+            .unwrap()
+        );
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
index 1152b0c5d2..339e366155 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
@@ -20,6 +20,7 @@ use bytes::Bytes;
 
 use crate::error::Result;
 use crate::metadata::DataType;
+use crate::row::Decimal;
 use crate::row::binary::{BinaryRowFormat, BinaryWriter, ValueWriter};
 use delegate::delegate;
 
@@ -93,7 +94,13 @@ impl BinaryWriter for CompactedKeyWriter {
 
             fn write_double(&mut self, value: f64);
 
+            fn write_decimal(&mut self, value: &Decimal, precision: u32);
 
+            fn write_time(&mut self, value: i32, precision: u32);
+
+            fn write_timestamp_ntz(&mut self, value: &crate::row::datum::TimestampNtz, precision: u32);
+
+            fn write_timestamp_ltz(&mut self, value: &crate::row::datum::TimestampLtz, precision: u32);
         }
     }
 
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index 144f8985cf..bc68ea10e5 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -133,6 +133,26 @@ impl<'a> InternalRow for CompactedRow<'a> {
     fn get_bytes(&self, pos: usize) -> &[u8] {
         self.decoded_row().get_bytes(pos)
     }
+
+    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> crate::row::Decimal {
+        self.decoded_row().get_decimal(pos, precision, scale)
+    }
+
+    fn get_date(&self, pos: usize) -> crate::row::datum::Date {
+        self.decoded_row().get_date(pos)
+    }
+
+    fn get_time(&self, pos: usize) -> crate::row::datum::Time {
+        self.decoded_row().get_time(pos)
+    }
+
+    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampNtz {
+        self.decoded_row().get_timestamp_ntz(pos, precision)
+    }
+
+    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampLtz {
+        self.decoded_row().get_timestamp_ltz(pos, precision)
+    }
 }
 
 #[cfg(test)]
@@ -174,7 +194,7 @@ mod tests {
         writer.write_bytes(&[1, 2, 3, 4, 5]);
 
         let bytes = writer.to_bytes();
-        let mut row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
+        let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
         assert_eq!(row.get_field_count(), 9);
         assert!(row.get_boolean(0));
@@ -187,70 +207,107 @@ mod tests {
         assert_eq!(row.get_string(7), "Hello World");
         assert_eq!(row.get_bytes(8), &[1, 2, 3, 4, 5]);
 
-        // Test with nulls
-        let row_type = RowType::with_data_types(
-            [
-                DataType::Int(IntType::new()),
-                DataType::String(StringType::new()),
-                DataType::Double(DoubleType::new()),
-            ]
-            .to_vec(),
-        );
+        // Test with nulls and negative values
+        let row_type = RowType::with_data_types(vec![
+            DataType::Int(IntType::new()),
+            DataType::String(StringType::new()),
+            DataType::Double(DoubleType::new()),
+        ]);
 
         let mut writer = CompactedRowWriter::new(row_type.fields().len());
-
-        writer.write_int(100);
+        writer.write_int(-42);
         writer.set_null_at(1);
         writer.write_double(2.71);
 
         let bytes = writer.to_bytes();
-        row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
+        let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
         assert!(!row.is_null_at(0));
         assert!(row.is_null_at(1));
         assert!(!row.is_null_at(2));
-        assert_eq!(row.get_int(0), 100);
+        assert_eq!(row.get_int(0), -42);
         assert_eq!(row.get_double(2), 2.71);
+        // Verify caching works on repeated reads
+        assert_eq!(row.get_int(0), -42);
+    }
 
-        // Test multiple reads (caching)
-        assert_eq!(row.get_int(0), 100);
-        assert_eq!(row.get_int(0), 100);
+    #[test]
+    fn test_compacted_row_temporal_and_decimal_types() {
+        // Comprehensive test covering DATE, TIME, TIMESTAMP (compact/non-compact), and DECIMAL (compact/non-compact)
+        use crate::metadata::{DataTypes, DecimalType, TimestampLTzType, TimestampType};
+        use crate::row::Decimal;
+        use crate::row::datum::{TimestampLtz, TimestampNtz};
+        use bigdecimal::{BigDecimal, num_bigint::BigInt};
 
-        // Test from_bytes
         let row_type = RowType::with_data_types(vec![
-            DataType::Int(IntType::new()),
-            DataType::String(StringType::new()),
+            DataTypes::date(),
+            DataTypes::time(),
+            DataType::Timestamp(TimestampType::with_nullable(true, 3).unwrap()), // Compact (precision <= 3)
+            DataType::TimestampLTz(TimestampLTzType::with_nullable(true, 3).unwrap()), // Compact
+            DataType::Timestamp(TimestampType::with_nullable(true, 6).unwrap()), // Non-compact (precision > 3)
+            DataType::TimestampLTz(TimestampLTzType::with_nullable(true, 9).unwrap()), // Non-compact
+            DataType::Decimal(DecimalType::new(10, 2).unwrap()), // Compact (precision <= 18)
+            DataType::Decimal(DecimalType::new(28, 10).unwrap()), // Non-compact (precision > 18)
         ]);
 
         let mut writer = CompactedRowWriter::new(row_type.fields().len());
-        writer.write_int(-1);
-        writer.write_string("test");
-
-        let bytes = writer.to_bytes();
-        let mut row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
-
-        assert_eq!(row.get_int(0), -1);
-        assert_eq!(row.get_string(1), "test");
 
-        // Test large row
-        let num_fields = 100;
-        let row_type = RowType::with_data_types(
-            (0..num_fields)
-                .map(|_| DataType::Int(IntType::new()))
-                .collect(),
-        );
-
-        let mut writer = CompactedRowWriter::new(num_fields);
+        // Write values
+        writer.write_int(19651); // Date: 2023-10-25
+        writer.write_time(34200000, 0); // Time: 09:30:00.0
+        writer.write_timestamp_ntz(&TimestampNtz::new(1698235273182), 3); // Compact timestamp
+        writer.write_timestamp_ltz(&TimestampLtz::new(1698235273182), 3); // Compact timestamp ltz
+        let ts_ntz_high = TimestampNtz::from_millis_nanos(1698235273182, 123456).unwrap();
+        let ts_ltz_high = TimestampLtz::from_millis_nanos(1698235273182, 987654).unwrap();
+        writer.write_timestamp_ntz(&ts_ntz_high, 6); // Non-compact timestamp with nanos
+        writer.write_timestamp_ltz(&ts_ltz_high, 9); // Non-compact timestamp ltz with nanos
+
+        // Create Decimal values for testing
+        let small_decimal =
+            Decimal::from_big_decimal(BigDecimal::new(BigInt::from(12345), 2), 10, 2).unwrap(); // Compact decimal: 123.45
+        let large_decimal = Decimal::from_big_decimal(
+            BigDecimal::new(BigInt::from(999999999999999999i128), 10),
+            28,
+            10,
+        )
+        .unwrap(); // Non-compact decimal
 
-        for i in 0..num_fields {
-            writer.write_int((i * 10) as i32);
-        }
+        writer.write_decimal(&small_decimal, 10);
+        writer.write_decimal(&large_decimal, 28);
 
         let bytes = writer.to_bytes();
-        row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
-
-        for i in 0..num_fields {
-            assert_eq!(row.get_int(i), (i * 10) as i32);
-        }
+        let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
+
+        // Verify all values
+        assert_eq!(row.get_date(0).get_inner(), 19651);
+        assert_eq!(row.get_time(1).get_inner(), 34200000);
+        assert_eq!(row.get_timestamp_ntz(2, 3).get_millisecond(), 1698235273182);
+        assert_eq!(
+            row.get_timestamp_ltz(3, 3).get_epoch_millisecond(),
+            1698235273182
+        );
+        let read_ts_ntz = row.get_timestamp_ntz(4, 6);
+        assert_eq!(read_ts_ntz.get_millisecond(), 1698235273182);
+        assert_eq!(read_ts_ntz.get_nano_of_millisecond(), 123456);
+        let read_ts_ltz = row.get_timestamp_ltz(5, 9);
+        assert_eq!(read_ts_ltz.get_epoch_millisecond(), 1698235273182);
+        assert_eq!(read_ts_ltz.get_nano_of_millisecond(), 987654);
+        // Assert on Decimal equality
+        assert_eq!(row.get_decimal(6, 10, 2), small_decimal);
+        assert_eq!(row.get_decimal(7, 28, 10), large_decimal);
+
+        // Assert on Decimal components to catch any regressions
+        let read_small_decimal = row.get_decimal(6, 10, 2);
+        assert_eq!(read_small_decimal.precision(), 10);
+        assert_eq!(read_small_decimal.scale(), 2);
+        assert_eq!(read_small_decimal.to_unscaled_long().unwrap(), 12345);
+
+        let read_large_decimal = row.get_decimal(7, 28, 10);
+        assert_eq!(read_large_decimal.precision(), 28);
+        assert_eq!(read_large_decimal.scale(), 10);
+        assert_eq!(
+            read_large_decimal.to_unscaled_long().unwrap(),
+            999999999999999999i64
+        );
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index 408706cc83..40470db170 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -19,7 +19,7 @@ use crate::metadata::RowType;
 use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
 use crate::{
     metadata::DataType,
-    row::{Datum, GenericRow, compacted::compacted_row_writer::CompactedRowWriter},
+    row::{Datum, Decimal, GenericRow, compacted::compacted_row_writer::CompactedRowWriter},
     util::varint::{read_unsigned_varint_at, read_unsigned_varint_u64_at},
 };
 use std::borrow::Cow;
@@ -97,7 +97,75 @@ impl<'a> CompactedRowDeserializer<'a> {
                     let (val, next) = reader.read_bytes(cursor);
                     (Datum::Blob(val.into()), next)
                 }
-                _ => panic!("unsupported DataType in CompactedRowDeserializer"),
+                DataType::Decimal(decimal_type) => {
+                    let precision = decimal_type.precision();
+                    let scale = decimal_type.scale();
+                    if Decimal::is_compact_precision(precision) {
+                        // Compact: stored as i64
+                        let (val, next) = reader.read_long(cursor);
+                        let decimal = Decimal::from_unscaled_long(val, precision, scale)
+                            .expect("Failed to create decimal from unscaled long");
+                        (Datum::Decimal(decimal), next)
+                    } else {
+                        // Non-compact: stored as minimal big-endian bytes
+                        let (bytes, next) = reader.read_bytes(cursor);
+                        let decimal = Decimal::from_unscaled_bytes(bytes, precision, scale)
+                            .expect("Failed to create decimal from unscaled bytes");
+                        (Datum::Decimal(decimal), next)
+                    }
+                }
+                DataType::Date(_) => {
+                    let (val, next) = reader.read_int(cursor);
+                    (Datum::Date(crate::row::datum::Date::new(val)), next)
+                }
+                DataType::Time(_) => {
+                    let (val, next) = reader.read_int(cursor);
+                    (Datum::Time(crate::row::datum::Time::new(val)), next)
+                }
+                DataType::Timestamp(timestamp_type) => {
+                    let precision = timestamp_type.precision();
+                    if crate::row::datum::TimestampNtz::is_compact(precision) {
+                        // Compact: only milliseconds
+                        let (millis, next) = reader.read_long(cursor);
+                        (
+                            Datum::TimestampNtz(crate::row::datum::TimestampNtz::new(millis)),
+                            next,
+                        )
+                    } else {
+                        // Non-compact: milliseconds + nanos
+                        let (millis, mid) = reader.read_long(cursor);
+                        let (nanos, next) = reader.read_int(mid);
+                        let timestamp =
+                            crate::row::datum::TimestampNtz::from_millis_nanos(millis, nanos)
+                                .expect("Invalid nano_of_millisecond value in compacted row");
+                        (Datum::TimestampNtz(timestamp), next)
+                    }
+                }
+                DataType::TimestampLTz(timestamp_ltz_type) => {
+                    let precision = timestamp_ltz_type.precision();
+                    if crate::row::datum::TimestampLtz::is_compact(precision) {
+                        // Compact: only epoch milliseconds
+                        let (epoch_millis, next) = reader.read_long(cursor);
+                        (
+                            Datum::TimestampLtz(crate::row::datum::TimestampLtz::new(epoch_millis)),
+                            next,
+                        )
+                    } else {
+                        // Non-compact: epoch milliseconds + nanos
+                        let (epoch_millis, mid) = reader.read_long(cursor);
+                        let (nanos, next) = reader.read_int(mid);
+                        let timestamp_ltz =
+                            crate::row::datum::TimestampLtz::from_millis_nanos(epoch_millis, nanos)
+                                .expect("Invalid nano_of_millisecond value in compacted row");
+                        (Datum::TimestampLtz(timestamp_ltz), next)
+                    }
+                }
+                _ => {
+                    panic!(
+                        "Unsupported DataType in CompactedRowDeserializer: {:?}",
+                        dtype
+                    );
+                }
             };
             cursor = next_cursor;
             row.set_field(col_pos, datum);
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
index c130e94cce..d1ad047a72 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -15,6 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::row::Decimal;
 use crate::row::binary::BinaryWriter;
 use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
 use crate::util::varint::{write_unsigned_varint_to_slice, write_unsigned_varint_u64_to_slice};
@@ -76,6 +77,7 @@ impl CompactedRowWriter {
         self.position = end;
     }
 }
+
 impl BinaryWriter for CompactedRowWriter {
     fn reset(&mut self) {
         self.position = self.header_size_in_bytes;
@@ -91,32 +93,34 @@ impl BinaryWriter for CompactedRowWriter {
 
     fn write_boolean(&mut self, value: bool) {
         let b = if value { 1u8 } else { 0u8 };
-        self.write_raw(&[b]);
+        self.write_raw(&[b])
     }
 
     fn write_byte(&mut self, value: u8) {
-        self.write_raw(&[value]);
+        self.write_raw(&[value])
     }
 
     fn write_bytes(&mut self, value: &[u8]) {
-        let len_i32 =
-            i32::try_from(value.len()).expect("byte slice too large to encode length as i32");
+        let len_i32 = i32::try_from(value.len())
+            .expect("Byte slice too large to encode length as i32: exceeds i32::MAX");
         self.write_int(len_i32);
-        self.write_raw(value);
+        self.write_raw(value)
     }
 
     fn write_char(&mut self, value: &str, _length: usize) {
         // TODO: currently, we encoding CHAR(length) as the same with STRING, the length info can be
         //  omitted and the bytes length should be enforced in the future.
-        self.write_string(value);
+        self.write_string(value)
     }
 
     fn write_string(&mut self, value: &str) {
-        self.write_bytes(value.as_ref());
+        self.write_bytes(value.as_ref())
     }
 
     fn write_short(&mut self, value: i16) {
-        self.write_raw(&value.to_ne_bytes());
+        // Use native endianness to match Java's UnsafeUtils.putShort behavior
+        // Java uses sun.misc.Unsafe which writes in native byte order (typically LE on x86/ARM)
+        self.write_raw(&value.to_ne_bytes())
     }
 
     fn write_int(&mut self, value: i32) {
@@ -132,21 +136,120 @@ impl BinaryWriter for CompactedRowWriter {
             write_unsigned_varint_u64_to_slice(value as u64, &mut self.buffer[self.position..]);
         self.position += bytes_written;
     }
+
     fn write_float(&mut self, value: f32) {
-        self.write_raw(&value.to_ne_bytes());
+        // Use native endianness to match Java's UnsafeUtils.putFloat behavior
+        self.write_raw(&value.to_ne_bytes())
     }
 
     fn write_double(&mut self, value: f64) {
-        self.write_raw(&value.to_ne_bytes());
+        // Use native endianness to match Java's UnsafeUtils.putDouble behavior
+        self.write_raw(&value.to_ne_bytes())
     }
 
     fn write_binary(&mut self, bytes: &[u8], length: usize) {
         // TODO: currently, we encoding BINARY(length) as the same with BYTES, the length info can
         //  be omitted and the bytes length should be enforced in the future.
-        self.write_bytes(&bytes[..length.min(bytes.len())]);
+        self.write_bytes(&bytes[..length.min(bytes.len())])
     }
 
     fn complete(&mut self) {
         // do nothing
     }
+
+    fn write_decimal(&mut self, value: &Decimal, precision: u32) {
+        // No validation or rescaling happens here: the Decimal was normalized when it
+        // was built, so only its unscaled representation needs to be emitted.
+        if !Decimal::is_compact_precision(precision) {
+            // Non-compact: length-prefixed unscaled bytes.
+            return self.write_bytes(&value.to_unscaled_bytes());
+        }
+        // Compact: the unscaled value is written as a long.
+        let unscaled = value
+            .to_unscaled_long()
+            .expect("Decimal should fit in i64 for compact precision");
+        self.write_long(unscaled)
+    }
+
+    fn write_time(&mut self, value: i32, _precision: u32) {
+        // `_precision` is unused: TIME is always written as an i32 (milliseconds since midnight)
+        self.write_int(value)
+    }
+
+    fn write_timestamp_ntz(&mut self, value: &crate::row::datum::TimestampNtz, precision: u32) {
+        // Compact precisions carry milliseconds only; higher precisions append the
+        // nano-of-millisecond component right after the millisecond value.
+        let needs_nanos = !crate::row::datum::TimestampNtz::is_compact(precision);
+
+        self.write_long(value.get_millisecond());
+        if needs_nanos {
+            self.write_int(value.get_nano_of_millisecond());
+        }
+    }
+
+    fn write_timestamp_ltz(&mut self, value: &crate::row::datum::TimestampLtz, precision: u32) {
+        // Compact precisions carry epoch milliseconds only; higher precisions append the
+        // nano-of-millisecond component right after the epoch-millisecond value.
+        let needs_nanos = !crate::row::datum::TimestampLtz::is_compact(precision);
+
+        self.write_long(value.get_epoch_millisecond());
+        if needs_nanos {
+            self.write_int(value.get_nano_of_millisecond());
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use bigdecimal::{BigDecimal, num_bigint::BigInt};
+
+    #[test]
+    fn test_write_decimal_compact() {
+        // Compact decimal (precision <= 18)
+        let bd = BigDecimal::new(BigInt::from(12345), 2); // 123.45
+        let decimal = Decimal::from_big_decimal(bd, 10, 2).unwrap();
+
+        let mut w = CompactedRowWriter::new(1);
+        w.write_decimal(&decimal, 10);
+
+        let (val, _) = crate::util::varint::read_unsigned_varint_u64_at(
+            w.buffer(),
+            w.header_size_in_bytes,
+            CompactedRowWriter::MAX_LONG_SIZE,
+        )
+        .unwrap();
+        assert_eq!(val as i64, 12345);
+    }
+
+    #[test]
+    fn test_write_decimal_rounding() {
+        // Test HALF_UP rounding: 12.345 → 12.35
+        let bd = BigDecimal::new(BigInt::from(12345), 3);
+        let decimal = Decimal::from_big_decimal(bd, 10, 2).unwrap();
+
+        let mut w = CompactedRowWriter::new(1);
+        w.write_decimal(&decimal, 10);
+
+        let (val, _) = crate::util::varint::read_unsigned_varint_u64_at(
+            w.buffer(),
+            w.header_size_in_bytes,
+            CompactedRowWriter::MAX_LONG_SIZE,
+        )
+        .unwrap();
+        assert_eq!(val as i64, 1235); // 12.35 with scale 2
+    }
+
+    #[test]
+    fn test_write_decimal_non_compact() {
+        // Non-compact (precision > 18): uses byte array
+        let bd = BigDecimal::new(BigInt::from(12345), 0);
+        let decimal = Decimal::from_big_decimal(bd, 28, 0).unwrap();
+
+        let mut w = CompactedRowWriter::new(1);
+        w.write_decimal(&decimal, 28);
+
+        // Verify something was written (at least length varint + some bytes)
+        assert!(w.position() > w.header_size_in_bytes);
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index ad7948dcef..5b21b3899b 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -17,6 +17,7 @@
 
 use crate::error::Error::RowConvertError;
 use crate::error::Result;
+use crate::row::Decimal;
 use arrow::array::{
     ArrayBuilder, BinaryBuilder, BooleanBuilder, Float32Builder, Float64Builder, Int8Builder,
     Int16Builder, Int32Builder, Int64Builder, StringBuilder,
@@ -24,7 +25,6 @@ use arrow::array::{
 use jiff::ToSpan;
 use ordered_float::OrderedFloat;
 use parse_display::Display;
-use rust_decimal::Decimal;
 use serde::Serialize;
 use std::borrow::Cow;
 
@@ -58,9 +58,11 @@ pub enum Datum<'a> {
     #[display("{0}")]
     Date(Date),
     #[display("{0}")]
-    Timestamp(Timestamp),
+    Time(Time),
     #[display("{0}")]
-    TimestampTz(TimestampLtz),
+    TimestampNtz(TimestampNtz),
+    #[display("{0}")]
+    TimestampLtz(TimestampLtz),
 }
 
 impl Datum<'_> {
@@ -296,7 +298,11 @@ impl Datum<'_> {
             Datum::Float64(v) => append_value_to_arrow!(Float64Builder, v.into_inner()),
             Datum::String(v) => append_value_to_arrow!(StringBuilder, v.as_ref()),
             Datum::Blob(v) => append_value_to_arrow!(BinaryBuilder, v.as_ref()),
-            Datum::Decimal(_) | Datum::Date(_) | Datum::Timestamp(_) | Datum::TimestampTz(_) => {
+            Datum::Decimal(_)
+            | Datum::Date(_)
+            | Datum::Time(_)
+            | Datum::TimestampNtz(_)
+            | Datum::TimestampLtz(_) => {
                 return Err(RowConvertError {
                     message: format!(
                         "Type {:?} is not yet supported for Arrow conversion",
@@ -350,10 +356,122 @@ pub type F64 = OrderedFloat<f64>;
 pub struct Date(i32);
 
 #[derive(PartialOrd, Ord, Display, PartialEq, Eq, Debug, Copy, Clone, Default, Hash, Serialize)]
-pub struct Timestamp(i64);
+pub struct Time(i32);
+
+impl Time {
+    pub const fn new(inner: i32) -> Self {
+        Time(inner)
+    }
+
+    /// Get the inner value of time type (milliseconds since midnight)
+    pub fn get_inner(&self) -> i32 {
+        self.0
+    }
+}
+
+/// Maximum timestamp precision that can be stored compactly (milliseconds only).
+/// Values with precision > MAX_COMPACT_TIMESTAMP_PRECISION require additional nanosecond storage.
+pub const MAX_COMPACT_TIMESTAMP_PRECISION: u32 = 3;
+
+/// Maximum valid value for nanoseconds within a millisecond (0 to 999,999 inclusive).
+/// A millisecond contains 1,000,000 nanoseconds, so the fractional part ranges from 0 to 999,999.
+pub const MAX_NANO_OF_MILLISECOND: i32 = 999_999;
 
 #[derive(PartialOrd, Ord, Display, PartialEq, Eq, Debug, Copy, Clone, Default, Hash, Serialize)]
-pub struct TimestampLtz(i64);
+#[display("{millisecond}")]
+pub struct TimestampNtz {
+    millisecond: i64,
+    nano_of_millisecond: i32,
+}
+
+impl TimestampNtz {
+    pub const fn new(millisecond: i64) -> Self {
+        TimestampNtz {
+            millisecond,
+            nano_of_millisecond: 0,
+        }
+    }
+
+    pub fn from_millis_nanos(
+        millisecond: i64,
+        nano_of_millisecond: i32,
+    ) -> crate::error::Result<Self> {
+        if !(0..=MAX_NANO_OF_MILLISECOND).contains(&nano_of_millisecond) {
+            return Err(crate::error::Error::IllegalArgument {
+                message: format!(
+                    "nanoOfMillisecond must be in range [0, {}], got: {}",
+                    MAX_NANO_OF_MILLISECOND, nano_of_millisecond
+                ),
+            });
+        }
+        Ok(TimestampNtz {
+            millisecond,
+            nano_of_millisecond,
+        })
+    }
+
+    pub fn get_millisecond(&self) -> i64 {
+        self.millisecond
+    }
+
+    pub fn get_nano_of_millisecond(&self) -> i32 {
+        self.nano_of_millisecond
+    }
+
+    /// Returns whether a timestamp type with the given precision is compact (takes no `self`).
+    /// Precision <= MAX_COMPACT_TIMESTAMP_PRECISION means millisecond precision, no need for nanos.
+    pub fn is_compact(precision: u32) -> bool {
+        precision <= MAX_COMPACT_TIMESTAMP_PRECISION
+    }
+}
+
+#[derive(PartialOrd, Ord, Display, PartialEq, Eq, Debug, Copy, Clone, Default, Hash, Serialize)]
+#[display("{epoch_millisecond}")]
+pub struct TimestampLtz {
+    epoch_millisecond: i64,
+    nano_of_millisecond: i32,
+}
+
+impl TimestampLtz {
+    pub const fn new(epoch_millisecond: i64) -> Self {
+        TimestampLtz {
+            epoch_millisecond,
+            nano_of_millisecond: 0,
+        }
+    }
+
+    pub fn from_millis_nanos(
+        epoch_millisecond: i64,
+        nano_of_millisecond: i32,
+    ) -> crate::error::Result<Self> {
+        if !(0..=MAX_NANO_OF_MILLISECOND).contains(&nano_of_millisecond) {
+            return Err(crate::error::Error::IllegalArgument {
+                message: format!(
+                    "nanoOfMillisecond must be in range [0, {}], got: {}",
+                    MAX_NANO_OF_MILLISECOND, nano_of_millisecond
+                ),
+            });
+        }
+        Ok(TimestampLtz {
+            epoch_millisecond,
+            nano_of_millisecond,
+        })
+    }
+
+    pub fn get_epoch_millisecond(&self) -> i64 {
+        self.epoch_millisecond
+    }
+
+    pub fn get_nano_of_millisecond(&self) -> i32 {
+        self.nano_of_millisecond
+    }
+
+    /// Returns whether a timestamp type with the given precision is compact (takes no `self`).
+    /// Precision <= MAX_COMPACT_TIMESTAMP_PRECISION means millisecond precision, no need for nanos.
+    pub fn is_compact(precision: u32) -> bool {
+        precision <= MAX_COMPACT_TIMESTAMP_PRECISION
+    }
+}
 
 pub type Blob<'a> = Cow<'a, [u8]>;
 
@@ -461,3 +579,54 @@ mod tests {
         assert_eq!(date.day(), 1);
     }
 }
+
+#[cfg(test)]
+mod timestamp_tests {
+    use super::*;
+
+    #[test]
+    fn test_timestamp_valid_nanos() {
+        // Valid range: 0 to MAX_NANO_OF_MILLISECOND for both TimestampNtz and TimestampLtz
+        let ntz1 = TimestampNtz::from_millis_nanos(1000, 0).unwrap();
+        assert_eq!(ntz1.get_nano_of_millisecond(), 0);
+
+        let ntz2 = TimestampNtz::from_millis_nanos(1000, MAX_NANO_OF_MILLISECOND).unwrap();
+        assert_eq!(ntz2.get_nano_of_millisecond(), MAX_NANO_OF_MILLISECOND);
+
+        let ntz3 = TimestampNtz::from_millis_nanos(1000, 500_000).unwrap();
+        assert_eq!(ntz3.get_nano_of_millisecond(), 500_000);
+
+        let ltz1 = TimestampLtz::from_millis_nanos(1000, 0).unwrap();
+        assert_eq!(ltz1.get_nano_of_millisecond(), 0);
+
+        let ltz2 = TimestampLtz::from_millis_nanos(1000, MAX_NANO_OF_MILLISECOND).unwrap();
+        assert_eq!(ltz2.get_nano_of_millisecond(), MAX_NANO_OF_MILLISECOND);
+    }
+
+    #[test]
+    fn test_timestamp_nanos_out_of_range() {
+        // Test that both TimestampNtz and TimestampLtz reject invalid nanos
+        let expected_msg = format!(
+            "nanoOfMillisecond must be in range [0, {}]",
+            MAX_NANO_OF_MILLISECOND
+        );
+
+        // Too large (1,000,000 is just beyond the valid range)
+        let result_ntz = TimestampNtz::from_millis_nanos(1000, MAX_NANO_OF_MILLISECOND + 1);
+        assert!(result_ntz.is_err());
+        assert!(result_ntz.unwrap_err().to_string().contains(&expected_msg));
+
+        let result_ltz = TimestampLtz::from_millis_nanos(1000, MAX_NANO_OF_MILLISECOND + 1);
+        assert!(result_ltz.is_err());
+        assert!(result_ltz.unwrap_err().to_string().contains(&expected_msg));
+
+        // Negative
+        let result_ntz = TimestampNtz::from_millis_nanos(1000, -1);
+        assert!(result_ntz.is_err());
+        assert!(result_ntz.unwrap_err().to_string().contains(&expected_msg));
+
+        let result_ltz = TimestampLtz::from_millis_nanos(1000, -1);
+        assert!(result_ltz.is_err());
+        assert!(result_ltz.unwrap_err().to_string().contains(&expected_msg));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/decimal.rs b/fluss-rust/crates/fluss/src/row/decimal.rs
new file mode 100644
index 0000000000..b14bde50a4
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/decimal.rs
@@ -0,0 +1,477 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::{Error, Result};
+use bigdecimal::num_bigint::BigInt;
+use bigdecimal::num_traits::Zero;
+use bigdecimal::{BigDecimal, RoundingMode};
+use std::fmt;
+
+#[cfg(test)]
+use std::str::FromStr;
+
+/// Maximum decimal precision that can be stored compactly as a single i64.
+/// Values with precision > MAX_COMPACT_PRECISION require byte array storage.
+pub const MAX_COMPACT_PRECISION: u32 = 18;
+
+/// An internal data structure representing a decimal value with fixed precision and scale.
+///
+/// This data structure is immutable and stores decimal values in a compact representation
+/// (the unscaled value as an i64) when the declared precision is small enough (≤ 18).
+///
+/// Matches Java's org.apache.fluss.row.Decimal class.
+#[derive(Debug, Clone, serde::Serialize)]
+pub struct Decimal {
+    precision: u32,
+    scale: u32,
+    // If precision <= MAX_COMPACT_PRECISION, this holds the unscaled value
+    long_val: Option<i64>,
+    // BigDecimal form: Some when built via from_big_decimal, None via from_unscaled_long
+    decimal_val: Option<BigDecimal>,
+}
+
+impl Decimal {
+    /// Returns the declared precision of this Decimal.
+    ///
+    /// This is the maximum number of digits the unscaled value may have, not its actual length.
+    pub fn precision(&self) -> u32 {
+        self.precision
+    }
+
+    /// Returns the scale of this Decimal.
+    pub fn scale(&self) -> u32 {
+        self.scale
+    }
+
+    /// Returns whether the declared precision lets the unscaled value fit in an i64.
+    pub fn is_compact(&self) -> bool {
+        self.precision <= MAX_COMPACT_PRECISION
+    }
+
+    /// Returns whether a given precision can be stored compactly.
+    pub fn is_compact_precision(precision: u32) -> bool {
+        precision <= MAX_COMPACT_PRECISION
+    }
+
+    /// Converts this Decimal into a BigDecimal.
+    pub fn to_big_decimal(&self) -> BigDecimal {
+        if let Some(bd) = &self.decimal_val {
+            bd.clone()
+        } else if let Some(long_val) = self.long_val {
+            BigDecimal::new(BigInt::from(long_val), self.scale as i64)
+        } else {
+            // Should never happen - every constructor sets long_val or decimal_val
+            BigDecimal::new(BigInt::from(0), self.scale as i64)
+        }
+    }
+
+    /// Returns the unscaled value of this Decimal as an i64, or an error if it does not fit.
+    pub fn to_unscaled_long(&self) -> Result<i64> {
+        if let Some(long_val) = self.long_val {
+            Ok(long_val)
+        } else {
+            // Extract unscaled value from BigDecimal
+            let bd = self.to_big_decimal();
+            let (unscaled, _) = bd.as_bigint_and_exponent();
+            unscaled.try_into().map_err(|_| Error::IllegalArgument {
+                message: format!(
+                    "Decimal unscaled value does not fit in i64: precision={}",
+                    self.precision
+                ),
+            })
+        }
+    }
+
+    /// Returns the unscaled value of this Decimal as big-endian two's-complement bytes.
+    pub fn to_unscaled_bytes(&self) -> Vec<u8> {
+        let bd = self.to_big_decimal();
+        let (unscaled, _) = bd.as_bigint_and_exponent();
+        unscaled.to_signed_bytes_be()
+    }
+
+    /// Creates a Decimal from Arrow's Decimal128 representation.
+    // TODO: For compact decimals with matching scale we may call from_unscaled_long
+    pub fn from_arrow_decimal128(
+        i128_val: i128,
+        arrow_scale: i64,
+        precision: u32,
+        scale: u32,
+    ) -> Result<Self> {
+        let bd = BigDecimal::new(BigInt::from(i128_val), arrow_scale);
+        Self::from_big_decimal(bd, precision, scale)
+    }
+
+    /// Creates an instance of Decimal from a BigDecimal with the given precision and scale.
+    ///
+    /// The returned decimal value may be rounded to have the desired scale. The precision
+    /// will be checked. If the precision overflows, an error is returned.
+    pub fn from_big_decimal(bd: BigDecimal, precision: u32, scale: u32) -> Result<Self> {
+        // Rescale to the target scale with HALF_UP rounding (matches Java)
+        let scaled = bd.with_scale_round(scale as i64, RoundingMode::HalfUp);
+
+        // Extract unscaled value
+        let (unscaled, exp) = scaled.as_bigint_and_exponent();
+
+        // Sanity check that scale matches
+        debug_assert_eq!(
+            exp, scale as i64,
+            "Scaled decimal exponent ({}) != expected scale ({})",
+            exp, scale
+        );
+
+        let actual_precision = Self::compute_precision(&unscaled);
+        if actual_precision > precision as usize {
+            return Err(Error::IllegalArgument {
+                message: format!(
+                    "Decimal precision overflow: value has {} digits but precision is {} (value: {})",
+                    actual_precision, precision, scaled
+                ),
+            });
+        }
+
+        // Compute compact representation if possible
+        let long_val = if precision <= MAX_COMPACT_PRECISION {
+            Some(i64::try_from(&unscaled).map_err(|_| Error::IllegalArgument {
+                message: format!(
+                    "Decimal mantissa exceeds i64 range for compact precision {}: unscaled={} (value={})",
+                    precision, unscaled, scaled
+                ),
+            })?)
+        } else {
+            None
+        };
+
+        Ok(Decimal {
+            precision,
+            scale,
+            long_val,
+            decimal_val: Some(scaled),
+        })
+    }
+
+    /// Creates an instance of Decimal from an unscaled long value with the given precision and scale.
+    pub fn from_unscaled_long(unscaled_long: i64, precision: u32, scale: u32) -> Result<Self> {
+        if precision > MAX_COMPACT_PRECISION {
+            return Err(Error::IllegalArgument {
+                message: format!(
+                    "Precision {} exceeds MAX_COMPACT_PRECISION ({})",
+                    precision, MAX_COMPACT_PRECISION
+                ),
+            });
+        }
+
+        let actual_precision = Self::compute_precision(&BigInt::from(unscaled_long));
+        if actual_precision > precision as usize {
+            return Err(Error::IllegalArgument {
+                message: format!(
+                    "Decimal precision overflow: unscaled value has {} digits but precision is {}",
+                    actual_precision, precision
+                ),
+            });
+        }
+
+        Ok(Decimal {
+            precision,
+            scale,
+            long_val: Some(unscaled_long),
+            decimal_val: None,
+        })
+    }
+
+    /// Creates an instance of Decimal from an unscaled byte array with the given precision and scale.
+    pub fn from_unscaled_bytes(unscaled_bytes: &[u8], precision: u32, scale: u32) -> Result<Self> {
+        let unscaled = BigInt::from_signed_bytes_be(unscaled_bytes);
+        let bd = BigDecimal::new(unscaled, scale as i64);
+        Self::from_big_decimal(bd, precision, scale)
+    }
+
+    /// Computes the precision of a decimal's unscaled value, matching Java's BigDecimal.precision().
+    pub fn compute_precision(unscaled: &BigInt) -> usize {
+        if unscaled.is_zero() {
+            return 1;
+        }
+
+        // Count ALL digits in the unscaled value (matches Java's BigDecimal.precision())
+        // For bounded precision (≤ 38 digits), string conversion is cheap and simple.
+        unscaled.magnitude().to_str_radix(10).len()
+    }
+}
+
+impl fmt::Display for Decimal {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        write!(f, "{}", self.to_big_decimal())
+    }
+}
+
+// Manual comparison impls: compare by numeric value, ignoring precision, scale and cached fields
+impl PartialEq for Decimal {
+    fn eq(&self, other: &Self) -> bool {
+        // Use numeric equality like Java's Decimal.equals() which delegates to compareTo.
+        // This means 1.0 (scale=1) equals 1.00 (scale=2).
+        self.cmp(other) == std::cmp::Ordering::Equal
+    }
+}
+
+impl Eq for Decimal {}
+
+impl PartialOrd for Decimal {
+    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
+        Some(self.cmp(other))
+    }
+}
+
+impl Ord for Decimal {
+    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
+        // If both are compact and have the same scale, compare directly
+        if self.is_compact() && other.is_compact() && self.scale == other.scale {
+            self.long_val.cmp(&other.long_val)
+        } else {
+            // Otherwise, compare as BigDecimal
+            self.to_big_decimal().cmp(&other.to_big_decimal())
+        }
+    }
+}
+
+impl std::hash::Hash for Decimal {
+    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
+        // Hash the BigDecimal representation.
+        //
+        // IMPORTANT: Unlike Java's BigDecimal, Rust's bigdecimal crate normalizes
+        // before hashing, so hash(1.0) == hash(1.00). Combined with our numeric
+        // equality (1.0 == 1.00), this CORRECTLY satisfies the hash/equals contract.
+        //
+        // This is BETTER than Java's implementation which has a hash/equals violation:
+        // - Java: equals(1.0, 1.00) = true, but hashCode(1.0) != hashCode(1.00)
+        // - Rust: equals(1.0, 1.00) = true, and hash(1.0) == hash(1.00) ✓
+        //
+        // Result: HashMap/HashSet will work correctly even if you create Decimals
+        // with different scales for the same numeric value (though this is rare in
+        // practice since decimals are schema-driven with fixed precision/scale).
+        self.to_big_decimal().hash(state);
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_precision_calculation() {
+        // Zero is special case
+        assert_eq!(Decimal::compute_precision(&BigInt::from(0)), 1);
+
+        // Must count ALL digits including trailing zeros (matches Java BigDecimal.precision())
+        assert_eq!(Decimal::compute_precision(&BigInt::from(10)), 2);
+        assert_eq!(Decimal::compute_precision(&BigInt::from(100)), 3);
+        assert_eq!(Decimal::compute_precision(&BigInt::from(12300)), 5);
+        assert_eq!(
+            Decimal::compute_precision(&BigInt::from(10000000000i64)),
+            11
+        );
+
+        // Test the case: value=1, scale=10 → unscaled=10000000000 (11 digits)
+        let bd = BigDecimal::new(BigInt::from(1), 0);
+        assert!(
+            Decimal::from_big_decimal(bd.clone(), 1, 10).is_err(),
+            "Should reject: unscaled 10000000000 has 11 digits, precision=1 is too small"
+        );
+        assert!(
+            Decimal::from_big_decimal(bd, 11, 10).is_ok(),
+            "Should accept with correct precision=11"
+        );
+    }
+
+    /// Test precision validation boundaries
+    #[test]
+    fn test_precision_validation() {
+        let test_cases = vec![
+            (10i64, 1, 2),            // 1.0 → unscaled: 10 (2 digits)
+            (100i64, 2, 3),           // 1.00 → unscaled: 100 (3 digits)
+            (10000000000i64, 10, 11), // 1.0000000000 → unscaled: 10000000000 (11 digits)
+        ];
+
+        for (unscaled, scale, min_precision) in test_cases {
+            let bd = BigDecimal::new(BigInt::from(unscaled), scale as i64);
+
+            // Reject if precision too small
+            assert!(Decimal::from_big_decimal(bd.clone(), min_precision - 1, scale).is_err());
+            // Accept with correct precision
+            assert!(Decimal::from_big_decimal(bd, min_precision, scale).is_ok());
+        }
+
+        // i64::MAX has 19 digits, should reject with precision=5
+        let bd = BigDecimal::new(BigInt::from(i64::MAX), 0);
+        assert!(Decimal::from_big_decimal(bd, 5, 0).is_err());
+    }
+
+    /// Test creation and basic operations for both compact and non-compact decimals
+    #[test]
+    fn test_creation_and_representation() {
+        // Compact (precision ≤ 18): from unscaled long
+        let compact = Decimal::from_unscaled_long(12345, 10, 2).unwrap();
+        assert_eq!(compact.precision(), 10);
+        assert_eq!(compact.scale(), 2);
+        assert!(compact.is_compact());
+        assert_eq!(compact.to_unscaled_long().unwrap(), 12345);
+        assert_eq!(compact.to_big_decimal().to_string(), "123.45");
+
+        // Non-compact (precision > 18): from BigDecimal
+        let bd = BigDecimal::new(BigInt::from(12345), 0);
+        let non_compact = Decimal::from_big_decimal(bd, 28, 0).unwrap();
+        assert_eq!(non_compact.precision(), 28);
+        assert!(!non_compact.is_compact());
+        assert_eq!(
+            non_compact.to_unscaled_bytes(),
+            BigInt::from(12345).to_signed_bytes_be()
+        );
+
+        // Test compact boundary
+        assert!(Decimal::is_compact_precision(18));
+        assert!(!Decimal::is_compact_precision(19));
+
+        // Test rounding during creation
+        let bd = BigDecimal::new(BigInt::from(12345), 3); // 12.345
+        let rounded = Decimal::from_big_decimal(bd, 10, 2).unwrap();
+        assert_eq!(rounded.to_unscaled_long().unwrap(), 1235); // 12.35
+    }
+
+    /// Test serialization round-trip (unscaled bytes)
+    #[test]
+    fn test_serialization_roundtrip() {
+        // Compact decimal
+        let bd1 = BigDecimal::new(BigInt::from(1314567890123i64), 5); // 13145678.90123
+        let decimal1 = Decimal::from_big_decimal(bd1.clone(), 15, 5).unwrap();
+        let (unscaled1, _) = bd1.as_bigint_and_exponent();
+        let from_bytes1 =
+            Decimal::from_unscaled_bytes(&unscaled1.to_signed_bytes_be(), 15, 5).unwrap();
+        assert_eq!(from_bytes1, decimal1);
+        assert_eq!(
+            from_bytes1.to_unscaled_bytes(),
+            unscaled1.to_signed_bytes_be()
+        );
+
+        // Non-compact decimal
+        let bd2 = BigDecimal::new(BigInt::from(12345678900987654321i128), 10);
+        let decimal2 = Decimal::from_big_decimal(bd2.clone(), 23, 10).unwrap();
+        let (unscaled2, _) = bd2.as_bigint_and_exponent();
+        let from_bytes2 =
+            Decimal::from_unscaled_bytes(&unscaled2.to_signed_bytes_be(), 23, 10).unwrap();
+        assert_eq!(from_bytes2, decimal2);
+        assert_eq!(
+            from_bytes2.to_unscaled_bytes(),
+            unscaled2.to_signed_bytes_be()
+        );
+    }
+
+    /// Test numeric equality and ordering (matches Java semantics)
+    #[test]
+    fn test_equality_and_ordering() {
+        // Same value, different precision/scale → should be equal (numeric equality)
+        let d1 = Decimal::from_big_decimal(BigDecimal::new(BigInt::from(10), 1), 2, 1).unwrap(); // 1.0
+        let d2 = Decimal::from_big_decimal(BigDecimal::new(BigInt::from(100), 2), 3, 2).unwrap(); // 1.00
+        assert_eq!(d1, d2, "Numeric equality: 1.0 == 1.00");
+        assert_eq!(d1.cmp(&d2), std::cmp::Ordering::Equal);
+
+        // Test ordering with positive values
+        let small = Decimal::from_unscaled_long(10, 5, 0).unwrap();
+        let large = Decimal::from_unscaled_long(15, 5, 0).unwrap();
+        assert!(small < large);
+        assert_eq!(small.cmp(&large), std::cmp::Ordering::Less);
+
+        // Test ordering with negative values
+        let negative_large = Decimal::from_unscaled_long(-10, 5, 0).unwrap(); // -10
+        let negative_small = Decimal::from_unscaled_long(-15, 5, 0).unwrap(); // -15
+        assert!(negative_small < negative_large); // -15 < -10
+        assert_eq!(
+            negative_small.cmp(&negative_large),
+            std::cmp::Ordering::Less
+        );
+
+        // Test ordering with mixed positive and negative
+        let positive = Decimal::from_unscaled_long(5, 5, 0).unwrap();
+        let negative = Decimal::from_unscaled_long(-5, 5, 0).unwrap();
+        assert!(negative < positive);
+        assert_eq!(negative.cmp(&positive), std::cmp::Ordering::Less);
+
+        // Test clone and round-trip equality
+        let original = Decimal::from_unscaled_long(10, 5, 0).unwrap();
+        assert_eq!(original.clone(), original);
+        assert_eq!(
+            Decimal::from_unscaled_long(original.to_unscaled_long().unwrap(), 5, 0).unwrap(),
+            original
+        );
+    }
+
+    /// Test hash/equals contract (Rust implementation is correct, unlike Java)
+    #[test]
+    fn test_hash_equals_contract() {
+        use std::collections::hash_map::DefaultHasher;
+        use std::hash::{Hash, Hasher};
+
+        let d1 = Decimal::from_big_decimal(BigDecimal::new(BigInt::from(10), 1), 2, 1).unwrap(); // 1.0
+        let d2 = Decimal::from_big_decimal(BigDecimal::new(BigInt::from(100), 2), 3, 2).unwrap(); // 1.00
+
+        // Numeric equality
+        assert_eq!(d1, d2);
+
+        // Hash contract: if a == b, then hash(a) == hash(b)
+        let mut hasher1 = DefaultHasher::new();
+        d1.hash(&mut hasher1);
+        let hash1 = hasher1.finish();
+
+        let mut hasher2 = DefaultHasher::new();
+        d2.hash(&mut hasher2);
+        let hash2 = hasher2.finish();
+
+        assert_eq!(hash1, hash2, "Equal decimals must have equal hashes");
+
+        // Verify HashMap works correctly (this would fail in Java due to their hash/equals bug)
+        let mut map = std::collections::HashMap::new();
+        map.insert(d1.clone(), "value");
+        assert_eq!(map.get(&d2), Some(&"value"));
+    }
+
+    /// Test edge cases: zeros, large numbers, rescaling
+    #[test]
+    fn test_edge_cases() {
+        // Zero handling (compact and non-compact)
+        let zero_compact = Decimal::from_unscaled_long(0, 5, 2).unwrap();
+        assert_eq!(
+            zero_compact.to_big_decimal(),
+            BigDecimal::new(BigInt::from(0), 2)
+        );
+
+        let zero_non_compact =
+            Decimal::from_big_decimal(BigDecimal::new(BigInt::from(0), 2), 20, 2).unwrap();
+        assert_eq!(
+            zero_non_compact.to_big_decimal(),
+            BigDecimal::new(BigInt::from(0), 2)
+        );
+
+        // Large number (39 digits)
+        let large_bd = BigDecimal::from_str("123456789012345678901234567890123456789").unwrap();
+        let large = Decimal::from_big_decimal(large_bd, 39, 0).unwrap();
+        let double_val = large.to_big_decimal().to_string().parse::<f64>().unwrap();
+        assert!((double_val - 1.2345678901234568E38).abs() < 0.01);
+
+        // Rescaling: 5.0 (scale=1) → 5.00 (scale=2)
+        let d1 = Decimal::from_big_decimal(BigDecimal::new(BigInt::from(50), 1), 10, 1).unwrap();
+        let d2 = Decimal::from_big_decimal(d1.to_big_decimal(), 10, 2).unwrap();
+        assert_eq!(d2.to_big_decimal().to_string(), "5.00");
+        assert_eq!(d2.scale(), 2);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
index ebe3da2a0a..563c1c960e 100644
--- a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
@@ -238,86 +238,121 @@ mod tests {
     }
 
     #[test]
-    fn test_all_data_types() {
+    fn test_all_data_types_java_compatible() {
+        // Test encoding compatibility with Java using reference from:
+        // https://github.com/apache/fluss/blob/main/fluss-common/src/test/resources/encoding/encoded_key.hex
+        use crate::metadata::{DataType, TimestampLTzType, TimestampType};
+
         let row_type = RowType::with_data_types(vec![
-            DataTypes::boolean(),
-            DataTypes::tinyint(),
-            DataTypes::smallint(),
-            DataTypes::int(),
-            DataTypes::bigint(),
-            DataTypes::float(),
-            DataTypes::double(),
-            // TODO Date
-            // TODO Time
-            DataTypes::binary(20),
-            DataTypes::bytes(),
-            DataTypes::char(2),
-            DataTypes::string(),
-            // TODO Decimal
-            // TODO Timestamp
-            // TODO Timestamp LTZ
-            // TODO Array of Int
-            // TODO Array of Float
-            // TODO Array of String
-            // TODO: Add Map and Row fields in Issue #1973
+            DataTypes::boolean(),                                                 // BOOLEAN
+            DataTypes::tinyint(),                                                 // TINYINT
+            DataTypes::smallint(),                                                // SMALLINT
+            DataTypes::int(),                                                     // INT
+            DataTypes::bigint(),                                                  // BIGINT
+            DataTypes::float(),                                                   // FLOAT
+            DataTypes::double(),                                                  // DOUBLE
+            DataTypes::date(),                                                    // DATE
+            DataTypes::time(),                                                    // TIME
+            DataTypes::binary(20),                                                // BINARY(20)
+            DataTypes::bytes(),                                                   // BYTES
+            DataTypes::char(2),                                                   // CHAR(2)
+            DataTypes::string(),                                                  // STRING
+            DataTypes::decimal(5, 2),                                             // DECIMAL(5,2)
+            DataTypes::decimal(20, 0),                                            // DECIMAL(20,0)
+            DataType::Timestamp(TimestampType::with_nullable(false, 1).unwrap()), // TIMESTAMP(1)
+            DataType::Timestamp(TimestampType::with_nullable(false, 5).unwrap()), // TIMESTAMP(5)
+            DataType::TimestampLTz(TimestampLTzType::with_nullable(false, 1).unwrap()), // TIMESTAMP_LTZ(1)
+            DataType::TimestampLTz(TimestampLTzType::with_nullable(false, 5).unwrap()), // TIMESTAMP_LTZ(5)
+                                                                                        // TODO: Add support for ARRAY type
+                                                                                        // TODO: Add support for MAP type
+                                                                                        // TODO: Add support for ROW type
         ]);
 
+        // Exact values from Java's IndexedRowTest.genRecordForAllTypes()
         let row = GenericRow::from_data(vec![
-            Datum::from(true),
-            Datum::from(2i8),
-            Datum::from(10i16),
-            Datum::from(100i32),
-            Datum::from(-6101065172474983726i64), // from Java test case: new BigInteger("12345678901234567890").longValue()
-            Datum::from(13.2f32),
-            Datum::from(15.21f64),
-            // TODO Date
-            // TODO Time
-            Datum::from("1234567890".as_bytes()),
-            Datum::from("20".as_bytes()),
-            Datum::from("1"),
-            Datum::from("hello"),
-            // TODO Decimal
-            // TODO Timestamp
-            // TODO Timestamp LTZ
-            // TODO Array of Int
-            // TODO Array of Float
-            // TODO Array of String
-            // TODO: Add Map and Row fields in Issue #1973
+            Datum::from(true),                                   // BOOLEAN: true
+            Datum::from(2i8),                                    // TINYINT: 2
+            Datum::from(10i16),                                  // SMALLINT: 10
+            Datum::from(100i32),                                 // INT: 100
+            Datum::from(-6101065172474983726i64),                // BIGINT
+            Datum::from(13.2f32),                                // FLOAT: 13.2
+            Datum::from(15.21f64),                               // DOUBLE: 15.21
+            Datum::Date(crate::row::datum::Date::new(19655)), // DATE: 2023-10-25 (19655 days since epoch)
+            Datum::Time(crate::row::datum::Time::new(34200000)), // TIME: 09:30:00.0
+            Datum::from("1234567890".as_bytes()),             // BINARY(20)
+            Datum::from("20".as_bytes()),                     // BYTES
+            Datum::from("1"),                                 // CHAR(2): "1"
+            Datum::from("hello"),                             // STRING: "hello"
+            Datum::Decimal(crate::row::Decimal::from_unscaled_long(9, 5, 2).unwrap()), // DECIMAL(5,2)
+            Datum::Decimal(
+                crate::row::Decimal::from_big_decimal(
+                    bigdecimal::BigDecimal::new(bigdecimal::num_bigint::BigInt::from(10), 0),
+                    20,
+                    0,
+                )
+                .unwrap(),
+            ), // DECIMAL(20,0)
+            Datum::TimestampNtz(crate::row::datum::TimestampNtz::new(1698235273182)), // TIMESTAMP(1)
+            Datum::TimestampNtz(crate::row::datum::TimestampNtz::new(1698235273182)), // TIMESTAMP(5)
+            Datum::TimestampLtz(crate::row::datum::TimestampLtz::new(1698235273182)), // TIMESTAMP_LTZ(1)
+            Datum::TimestampLtz(crate::row::datum::TimestampLtz::new(1698235273182)), // TIMESTAMP_LTZ(5)
         ]);
 
-        let mut encoder = for_test_row_type(&row_type);
-
-        let mut expected: Vec<u8> = Vec::new();
-        // BOOLEAN: true
-        expected.extend(vec![0x01]);
-        // TINYINT: 2
-        expected.extend(vec![0x02]);
-        // SMALLINT: 10
-        expected.extend(vec![0x0A]);
-        // INT: 100
-        expected.extend(vec![0x00, 0x64]);
-        // BIGINT: -6101065172474983726
-        expected.extend(vec![
+        // Expected bytes from Java's encoded_key.hex reference file
+        #[rustfmt::skip]
+        let expected: Vec<u8> = vec![
+            // BOOLEAN: true
+            0x01,
+            // TINYINT: 2
+            0x02,
+            // SMALLINT: 10 (NOTE(review): likely fixed 2-byte little-endian, 0x0A plus the 0x00 listed on the next row — confirm)
+            0x0A,
+            // INT: 100 (varint is the single byte 0x64; NOTE(review): the leading 0x00 looks like SMALLINT's high byte — confirm)
+            0x00, 0x64,
+            // BIGINT: -6101065172474983726
             0xD2, 0x95, 0xFC, 0xD8, 0xCE, 0xB1, 0xAA, 0xAA, 0xAB, 0x01,
-        ]);
-        // FLOAT: 13.2
-        expected.extend(vec![0x33, 0x33, 0x53, 0x41]);
-        // DOUBLE: 15.21
-        expected.extend(vec![0xEC, 0x51, 0xB8, 0x1E, 0x85, 0x6B, 0x2E, 0x40]);
-        // BINARY(20): "1234567890".getBytes()
-        expected.extend(vec![
+            // FLOAT: 13.2
+            0x33, 0x33, 0x53, 0x41,
+            // DOUBLE: 15.21
+            0xEC, 0x51, 0xB8, 0x1E, 0x85, 0x6B, 0x2E, 0x40,
+            // DATE: 2023-10-25
+            0xC7, 0x99, 0x01,
+            // TIME: 09:30:00.0
+            0xC0, 0xB3, 0xA7, 0x10,
+            // BINARY(20): "1234567890"
             0x0A, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37, 0x38, 0x39, 0x30,
-        ]);
+            // BYTES: "20"
+            0x02, 0x32, 0x30,
+            // CHAR(2): "1"
+            0x01, 0x31,
+            // STRING: "hello"
+            0x05, 0x68, 0x65, 0x6C, 0x6C, 0x6F,
+            // DECIMAL(5,2): 9
+            0x09,
+            // DECIMAL(20,0): 10
+            0x01, 0x0A,
+            // TIMESTAMP(1): 1698235273182
+            0xDE, 0x9F, 0xD7, 0xB5, 0xB6, 0x31,
+            // TIMESTAMP(5): 1698235273182
+            0xDE, 0x9F, 0xD7, 0xB5, 0xB6, 0x31, 0x00,
+            // TIMESTAMP_LTZ(1): 1698235273182
+            0xDE, 0x9F, 0xD7, 0xB5, 0xB6, 0x31,
+            // TIMESTAMP_LTZ(5): 1698235273182
+            0xDE, 0x9F, 0xD7, 0xB5, 0xB6, 0x31, 0x00,
+        ];
 
-        // BYTES: "20".getBytes()
-        expected.extend(vec![0x02, 0x32, 0x30]);
-        // CHAR(2): "1"
-        expected.extend(vec![0x01, 0x31]);
-        // STRING: String: "hello"
-        expected.extend(vec![0x05, 0x68, 0x65, 0x6C, 0x6C, 0x6F]);
+        let mut encoder = for_test_row_type(&row_type);
+        let encoded = encoder.encode_key(&row).unwrap();
+
+        // Assert byte-for-byte compatibility with Java's encoded_key.hex
         assert_eq!(
-            encoder.encode_key(&row).unwrap().iter().as_slice(),
-            expected.as_slice()
+            encoded.iter().as_slice(),
+            expected.as_slice(),
+            "\n\nRust encoding does not match Java reference from encoded_key.hex\n\
+             Expected: {:02X?}\n\
+             Actual:   {:02X?}\n",
+            expected,
+            encoded.iter().as_slice()
         );
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/field_getter.rs b/fluss-rust/crates/fluss/src/row/field_getter.rs
index 97f9e395fc..cbffa4d09f 100644
--- a/fluss-rust/crates/fluss/src/row/field_getter.rs
+++ b/fluss-rust/crates/fluss/src/row/field_getter.rs
@@ -66,6 +66,21 @@ impl FieldGetter {
             DataType::BigInt(_) => InnerFieldGetter::BigInt { pos },
             DataType::Float(_) => InnerFieldGetter::Float { pos },
             DataType::Double(_) => InnerFieldGetter::Double { pos },
+            DataType::Decimal(decimal_type) => InnerFieldGetter::Decimal {
+                pos,
+                precision: decimal_type.precision() as usize,
+                scale: decimal_type.scale() as usize,
+            },
+            DataType::Date(_) => InnerFieldGetter::Date { pos },
+            DataType::Time(_) => InnerFieldGetter::Time { pos },
+            DataType::Timestamp(t) => InnerFieldGetter::Timestamp {
+                pos,
+                precision: t.precision(),
+            },
+            DataType::TimestampLTz(t) => InnerFieldGetter::TimestampLtz {
+                pos,
+                precision: t.precision(),
+            },
             _ => unimplemented!("DataType {:?} is currently unimplemented", data_type),
         };
 
@@ -79,17 +94,60 @@ impl FieldGetter {
 
 #[derive(Clone)]
 pub enum InnerFieldGetter {
-    Char { pos: usize, len: usize },
-    String { pos: usize },
-    Bool { pos: usize },
-    Binary { pos: usize, len: usize },
-    Bytes { pos: usize },
-    TinyInt { pos: usize },
-    SmallInt { pos: usize },
-    Int { pos: usize },
-    BigInt { pos: usize },
-    Float { pos: usize },
-    Double { pos: usize },
+    Char {
+        pos: usize,
+        len: usize,
+    },
+    String {
+        pos: usize,
+    },
+    Bool {
+        pos: usize,
+    },
+    Binary {
+        pos: usize,
+        len: usize,
+    },
+    Bytes {
+        pos: usize,
+    },
+    TinyInt {
+        pos: usize,
+    },
+    SmallInt {
+        pos: usize,
+    },
+    Int {
+        pos: usize,
+    },
+    BigInt {
+        pos: usize,
+    },
+    Float {
+        pos: usize,
+    },
+    Double {
+        pos: usize,
+    },
+    Decimal {
+        pos: usize,
+        precision: usize,
+        scale: usize,
+    },
+    Date {
+        pos: usize,
+    },
+    Time {
+        pos: usize,
+    },
+    Timestamp {
+        pos: usize,
+        precision: u32,
+    },
+    TimestampLtz {
+        pos: usize,
+        precision: u32,
+    },
 }
 
 impl InnerFieldGetter {
@@ -106,7 +164,19 @@ impl InnerFieldGetter {
             InnerFieldGetter::BigInt { pos } => Datum::from(row.get_long(*pos)),
             InnerFieldGetter::Float { pos } => Datum::from(row.get_float(*pos)),
             InnerFieldGetter::Double { pos } => Datum::from(row.get_double(*pos)),
-            //TODO Decimal, Date, Time, Timestamp, TimestampLTZ, Array, Map, Row
+            InnerFieldGetter::Decimal {
+                pos,
+                precision,
+                scale,
+            } => Datum::Decimal(row.get_decimal(*pos, *precision, *scale)),
+            InnerFieldGetter::Date { pos } => Datum::Date(row.get_date(*pos)),
+            InnerFieldGetter::Time { pos } => Datum::Time(row.get_time(*pos)),
+            InnerFieldGetter::Timestamp { pos, precision } => {
+                Datum::TimestampNtz(row.get_timestamp_ntz(*pos, *precision))
+            }
+            InnerFieldGetter::TimestampLtz { pos, precision } => {
+                Datum::TimestampLtz(row.get_timestamp_ltz(*pos, *precision))
+            } //TODO Array, Map, Row
         }
     }
 
@@ -122,7 +192,12 @@ impl InnerFieldGetter {
             | Self::Int { pos }
             | Self::BigInt { pos }
             | Self::Float { pos, .. }
-            | Self::Double { pos } => *pos,
+            | Self::Double { pos }
+            | Self::Decimal { pos, .. }
+            | Self::Date { pos }
+            | Self::Time { pos }
+            | Self::Timestamp { pos, .. }
+            | Self::TimestampLtz { pos, .. } => *pos,
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 536409efde..d2f640e4dc 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -18,6 +18,7 @@
 mod column;
 
 mod datum;
+mod decimal;
 
 pub mod binary;
 pub mod compacted;
@@ -28,6 +29,7 @@ mod row_decoder;
 pub use column::*;
 pub use compacted::CompactedRow;
 pub use datum::*;
+pub use decimal::{Decimal, MAX_COMPACT_PRECISION};
 pub use encode::KeyEncoder;
 pub use row_decoder::{CompactedRowDecoder, RowDecoder, RowDecoderFactory};
 
@@ -71,14 +73,26 @@ pub trait InternalRow {
     /// Returns the string value at the given position
     fn get_string(&self, pos: usize) -> &str;
 
-    // /// Returns the decimal value at the given position
-    // fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Decimal;
+    /// Returns the decimal value at the given position
+    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Decimal;
 
-    // /// Returns the timestamp value at the given position
-    // fn get_timestamp_ntz(&self, pos: usize, precision: usize) -> TimestampNtz;
+    /// Returns the date value at the given position (date as days since epoch)
+    fn get_date(&self, pos: usize) -> datum::Date;
 
-    // /// Returns the timestamp value at the given position
-    // fn get_timestamp_ltz(&self, pos: usize, precision: usize) -> TimestampLtz;
+    /// Returns the time value at the given position (time as milliseconds since midnight)
+    fn get_time(&self, pos: usize) -> datum::Time;
+
+    /// Returns the timestamp value at the given position (timestamp without timezone)
+    ///
+    /// The precision is required to determine whether the timestamp value was stored
+    /// in a compact representation (precision <= 3) or with nanosecond precision.
+    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> datum::TimestampNtz;
+
+    /// Returns the timestamp value at the given position (timestamp with local timezone)
+    ///
+    /// The precision is required to determine whether the timestamp value was stored
+    /// in a compact representation (precision <= 3) or with nanosecond precision.
+    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> datum::TimestampLtz;
 
     /// Returns the binary value at the given position with fixed length
     fn get_binary(&self, pos: usize, length: usize) -> &[u8];
@@ -123,6 +137,43 @@ impl<'a> InternalRow for GenericRow<'a> {
         self.values.get(_pos).unwrap().try_into().unwrap()
     }
 
+    fn get_decimal(&self, pos: usize, _precision: usize, _scale: usize) -> Decimal {
+        match self.values.get(pos).unwrap() { // panics when nothing is stored at `pos`
+            Datum::Decimal(d) => d.clone(), // `_precision` / `_scale` are not consulted
+            other => panic!("Expected Decimal at pos {pos:?}, got {other:?}"),
+        }
+    }
+
+    fn get_date(&self, pos: usize) -> datum::Date {
+        match self.values.get(pos).unwrap() { // panics when nothing is stored at `pos`
+            Datum::Date(d) => *d,
+            Datum::Int32(i) => datum::Date::new(*i), // a plain Int32 is wrapped into a Date
+            other => panic!("Expected Date or Int32 at pos {pos:?}, got {other:?}"),
+        }
+    }
+
+    fn get_time(&self, pos: usize) -> datum::Time {
+        match self.values.get(pos).unwrap() { // panics when nothing is stored at `pos`
+            Datum::Time(t) => *t,
+            Datum::Int32(i) => datum::Time::new(*i), // a plain Int32 is wrapped into a Time
+            other => panic!("Expected Time or Int32 at pos {pos:?}, got {other:?}"),
+        }
+    }
+
+    fn get_timestamp_ntz(&self, pos: usize, _precision: u32) -> datum::TimestampNtz {
+        match self.values.get(pos).unwrap() { // panics when nothing is stored at `pos`
+            Datum::TimestampNtz(t) => *t, // `_precision` is not consulted
+            other => panic!("Expected TimestampNtz at pos {pos:?}, got {other:?}"),
+        }
+    }
+
+    fn get_timestamp_ltz(&self, pos: usize, _precision: u32) -> datum::TimestampLtz {
+        match self.values.get(pos).unwrap() { // panics when nothing is stored at `pos`
+            Datum::TimestampLtz(t) => *t, // `_precision` is not consulted
+            other => panic!("Expected TimestampLtz at pos {pos:?}, got {other:?}"),
+        }
+    }
+
     fn get_float(&self, pos: usize) -> f32 {
         self.values.get(pos).unwrap().try_into().unwrap()
     }

From 0e31ef49c0939deb6890bb7c045816001b7eef20 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Tue, 20 Jan 2026 13:09:49 +0000
Subject: [PATCH 076/287] feat: Introduce UpsertWriter (#169)

---
 fluss-rust/crates/fluss/Cargo.toml            |   1 +
 .../src/client/table/log_fetch_buffer.rs      |   6 +-
 .../crates/fluss/src/client/table/lookup.rs   |   9 +-
 .../crates/fluss/src/client/table/mod.rs      |  18 +
 .../src/client/table/partition_getter.rs      |  56 ++
 .../crates/fluss/src/client/table/upsert.rs   | 522 ++++++++++++++++++
 .../crates/fluss/src/client/table/writer.rs   |  20 +-
 .../fluss/src/client/write/accumulator.rs     |  39 +-
 .../crates/fluss/src/client/write/batch.rs    |  20 +-
 .../fluss/src/client/write/bucket_assigner.rs |   9 +-
 .../crates/fluss/src/client/write/mod.rs      |  54 +-
 .../fluss/src/client/write/write_format.rs    |   1 +
 .../fluss/src/client/write/writer_client.rs   |   9 +-
 fluss-rust/crates/fluss/src/metadata/table.rs |  66 ++-
 fluss-rust/crates/fluss/src/record/arrow.rs   |  62 +--
 .../fluss/src/record/kv/kv_record_batch.rs    |  11 +-
 .../src/record/kv/kv_record_batch_builder.rs  |  80 +--
 .../src/record/kv/kv_record_read_context.rs   |  17 +-
 .../fluss/src/row/compacted/compacted_row.rs  |  15 +-
 .../src/row/compacted/compacted_row_writer.rs |  12 +
 .../src/row/encode/compacted_row_encoder.rs   |  13 +-
 fluss-rust/crates/fluss/src/row/encode/mod.rs |  23 +-
 fluss-rust/crates/fluss/src/row/mod.rs        |  27 +-
 23 files changed, 895 insertions(+), 195 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/table/partition_getter.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/table/upsert.rs

diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index c3bdd4475a..9aeee72db4 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -33,6 +33,7 @@ integration_tests = []
 [dependencies]
 arrow = { workspace = true }
 arrow-schema = "57.0.0"
+bitvec = "1"
 byteorder = "1.5"
 futures = "0.3"
 clap = { workspace = true }
diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index ac44cc1728..ca0a2532c8 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -651,14 +651,14 @@ mod tests {
     use crate::compression::{
         ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
     };
-    use crate::metadata::{DataField, DataTypes, TablePath};
+    use crate::metadata::{DataField, DataTypes, RowType, TablePath};
     use crate::record::{MemoryLogRecordsArrowBuilder, ReadContext, to_arrow_schema};
     use crate::row::GenericRow;
     use std::sync::Arc;
     use std::time::Duration;
 
     fn test_read_context() -> ReadContext {
-        let row_type = DataTypes::row(vec![DataField::new(
+        let row_type = RowType::new(vec![DataField::new(
             "id".to_string(),
             DataTypes::int(),
             None,
@@ -714,7 +714,7 @@ mod tests {
 
     #[test]
     fn default_completed_fetch_reads_records() -> Result<()> {
-        let row_type = DataTypes::row(vec![
+        let row_type = RowType::new(vec![
             DataField::new("id".to_string(), DataTypes::int(), None),
             DataField::new("name".to_string(), DataTypes::string(), None),
         ]);
diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index 1d32ebd75e..cd23503a5b 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -22,7 +22,7 @@ use crate::error::{Error, Result};
 use crate::metadata::{RowType, TableBucket, TableInfo};
 use crate::row::InternalRow;
 use crate::row::compacted::CompactedRow;
-use crate::row::encode::KeyEncoder;
+use crate::row::encode::{KeyEncoder, KeyEncoderFactory};
 use crate::rpc::ApiError;
 use crate::rpc::message::LookupRequest;
 use std::sync::Arc;
@@ -130,8 +130,11 @@ impl<'a> TableLookup<'a> {
 
         // Create key encoder for the primary key fields
         let pk_fields = self.table_info.get_physical_primary_keys().to_vec();
-        let key_encoder =
-            <dyn KeyEncoder>::of(self.table_info.row_type(), pk_fields, data_lake_format)?;
+        let key_encoder = KeyEncoderFactory::of(
+            self.table_info.row_type(),
+            pk_fields.as_slice(),
+            &data_lake_format,
+        )?;
 
         Ok(Lookuper {
             conn: self.conn,
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 7356be2393..2bfa054105 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -27,13 +27,17 @@ mod append;
 mod lookup;
 
 mod log_fetch_buffer;
+mod partition_getter;
 mod remote_log;
 mod scanner;
+mod upsert;
 mod writer;
 
+use crate::client::table::upsert::TableUpsert;
 pub use append::{AppendWriter, TableAppend};
 pub use lookup::{LookupResult, Lookuper, TableLookup};
 pub use scanner::{LogScanner, RecordBatchLogScanner, TableScan};
+pub use writer::{TableWriter, UpsertWriter};
 
 #[allow(dead_code)]
 pub struct FlussTable<'a> {
@@ -119,6 +123,20 @@ impl<'a> FlussTable<'a> {
             self.metadata.clone(),
         ))
     }
+
+    /// Builds a [`TableUpsert`] for this table; only primary key tables are accepted.
+    pub fn new_upsert(&self) -> Result<TableUpsert> {
+        if !self.has_primary_key {
+            let message = "Upsert is only supported for primary key tables".to_string();
+            return Err(Error::UnsupportedOperation { message });
+        }
+        // Clone the table identity, then obtain the connection's writer client.
+        let table_path = self.table_path.clone();
+        let table_info = self.table_info.clone();
+        let writer_client = self.conn.get_or_create_writer_client()?;
+
+        Ok(TableUpsert::new(table_path, table_info, writer_client))
+    }
 }
 
 impl<'a> Drop for FlussTable<'a> {
diff --git a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
new file mode 100644
index 0000000000..4529d8684f
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
@@ -0,0 +1,56 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::{DataType, RowType};
+use crate::row::field_getter::FieldGetter;
+
+#[allow(dead_code)]
+pub struct PartitionGetter<'a> {
+    partitions: Vec<(&'a String, &'a DataType, FieldGetter)>, // one (key name, column type, getter) entry per partition key
+}
+
+#[allow(dead_code)]
+impl<'a> PartitionGetter<'a> {
+    /// Pairs every partition key with the type of its column in `row_type` and a
+    /// [`FieldGetter`] created for that column's index.
+    ///
+    /// Fails with `IllegalArgument` on the first key that `row_type` does not contain.
+    pub fn new(row_type: &'a RowType, partition_keys: &'a Vec<String>) -> Result<Self> {
+        let mut partitions = Vec::with_capacity(partition_keys.len());
+
+        for partition_key in partition_keys {
+            // Locate the column, bailing out if the key is unknown to the row type.
+            let column_index = row_type
+                .get_field_index(partition_key.as_str())
+                .ok_or_else(|| IllegalArgument {
+                    message: format!(
+                        "The partition column {partition_key} is not in the row {row_type}."
+                    ),
+                })?;
+
+            let data_type = &row_type.fields().get(column_index).unwrap().data_type;
+            let field_getter = FieldGetter::create(data_type, column_index);
+            partitions.push((partition_key, data_type, field_getter));
+        }
+
+        Ok(Self { partitions })
+    }
+
+    // TODO Implement get partition
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/upsert.rs b/fluss-rust/crates/fluss/src/client/table/upsert.rs
new file mode 100644
index 0000000000..a3909e7258
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/upsert.rs
@@ -0,0 +1,522 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::client::table::writer::{DeleteResult, TableWriter, UpsertResult, UpsertWriter};
+use crate::client::{RowBytes, WriteFormat, WriteRecord, WriterClient};
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::{KvFormat, RowType, TableInfo, TablePath};
+use crate::row::InternalRow;
+use crate::row::encode::{KeyEncoder, KeyEncoderFactory, RowEncoder, RowEncoderFactory};
+use crate::row::field_getter::FieldGetter;
+use std::sync::Arc;
+
+use bitvec::prelude::bitvec;
+use bytes::Bytes;
+
+#[allow(dead_code)]
+pub struct TableUpsert {
+    table_path: TablePath,
+    table_info: TableInfo, // source of the row type used to validate target columns
+    writer_client: Arc<WriterClient>, // shared with every writer created by `create_writer`
+    target_columns: Option<Arc<Vec<usize>>>, // partial-update column indexes; `None` from `new`
+}
+
+#[allow(dead_code)]
+impl TableUpsert {
+    /// Creates an upsert builder with no partial-update target columns selected.
+    pub fn new(
+        table_path: TablePath,
+        table_info: TableInfo,
+        writer_client: Arc<WriterClient>,
+    ) -> Self {
+        Self {
+            table_path,
+            table_info,
+            writer_client,
+            target_columns: None,
+        }
+    }
+
+    /// Returns a copy of this builder restricted to `target_columns` (column indexes).
+    /// Fails with `IllegalArgument` if an index is not below the table's column count.
+    pub fn partial_update(&self, target_columns: Option<Vec<usize>>) -> Result<Self> {
+        let num_columns = self.table_info.row_type().fields().len();
+        let columns = target_columns.as_deref().unwrap_or_default();
+        if let Some(&invalid_column) = columns.iter().find(|&&col| col >= num_columns) {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Invalid target column index: {invalid_column} for table {}. The table only has {num_columns} columns.",
+                    self.table_path
+                ),
+            });
+        }
+
+        Ok(Self {
+            table_path: self.table_path.clone(),
+            table_info: self.table_info.clone(),
+            writer_client: self.writer_client.clone(),
+            target_columns: target_columns.map(Arc::new),
+        })
+    }
+
+    /// Same as `partial_update`, but the target columns are given by name.
+    /// Fails with `IllegalArgument` for the first name that is not a column of the table.
+    pub fn partial_update_with_column_names(&self, target_column_names: &[&str]) -> Result<Self> {
+        let row_type = self.table_info.row_type();
+
+        // Resolve each name to its column index.
+        let mut resolved = Vec::with_capacity(target_column_names.len());
+        for &name in target_column_names {
+            let Some(index) = row_type.get_field_index(name) else {
+                return Err(IllegalArgument {
+                    message: format!(
+                        "Cannot find target column `{}` for table {}.",
+                        name, self.table_path
+                    ),
+                });
+            };
+            resolved.push(index);
+        }
+
+        self.partial_update(Some(resolved))
+    }
+
+    /// Creates an upsert writer for this table, passing along the selected target columns.
+    pub fn create_writer(&self) -> Result<impl UpsertWriter> {
+        UpsertWriterFactory::create(
+            Arc::new(self.table_path.clone()),
+            Arc::new(self.table_info.clone()),
+            self.target_columns.clone(),
+            self.writer_client.clone(),
+        )
+    }
+}
+
+#[allow(dead_code)]
+struct UpsertWriterImpl<RE>
+where
+    RE: RowEncoder,
+{
+    table_path: Arc<TablePath>,
+    writer_client: Arc<WriterClient>, // every write record is sent through this client
+    // TODO: Partitioning
+    // partition_field_getter: Option<Box<dyn KeyEncoder>>,
+    primary_key_encoder: Box<dyn KeyEncoder>,
+    target_columns: Option<Arc<Vec<usize>>>, // attached to every write record that is created
+    // When None, the encoded primary key is reused as the bucket key (see `get_keys`)
+    bucket_key_encoder: Option<Box<dyn KeyEncoder>>,
+    kv_format: KvFormat,
+    write_format: WriteFormat, // derived from `kv_format` when the writer is built
+    row_encoder: RE, // used by `encode_row` when a row provides no pre-encoded bytes
+    field_getters: Box<[FieldGetter]>, // iterated in order by `encode_row`; index = field position
+    table_info: Arc<TableInfo>,
+}
+
+#[allow(dead_code)]
+struct UpsertWriterFactory; // field-less: only groups the writer construction and validation functions
+
+#[allow(dead_code)]
+impl UpsertWriterFactory {
+    /// Validates the requested target columns with `sanity_check`, then builds the writer
+    /// together with its key encoders, row encoder and field getters.
+    pub fn create(
+        table_path: Arc<TablePath>,
+        table_info: Arc<TableInfo>,
+        partial_update_columns: Option<Arc<Vec<usize>>>,
+        writer_client: Arc<WriterClient>,
+    ) -> Result<impl UpsertWriter> {
+        let data_lake_format = &table_info.table_config.get_datalake_format()?;
+        let row_type = table_info.row_type();
+        let physical_pks = table_info.get_physical_primary_keys();
+        let names = table_info.get_schema().auto_increment_col_names();
+        Self::sanity_check(
+            row_type,
+            &table_info.primary_keys,
+            names,
+            &partial_update_columns,
+        )?;
+
+        let primary_key_encoder = KeyEncoderFactory::of(row_type, physical_pks, data_lake_format)?;
+        let bucket_key_encoder = if !table_info.is_default_bucket_key() {
+            Some(KeyEncoderFactory::of(
+                row_type,
+                table_info.get_bucket_keys(),
+                data_lake_format,
+            )?)
+        } else {
+            // Defaults to using primary key encoder when None for bucket key
+            None
+        };
+
+        let kv_format = table_info.get_table_config().get_kv_format()?;
+        let write_format = WriteFormat::from_kv_format(&kv_format)?;
+
+        let field_getters = FieldGetter::create_field_getters(row_type);
+
+        Ok(UpsertWriterImpl {
+            table_path,
+            writer_client,
+            primary_key_encoder,
+            target_columns: partial_update_columns,
+            bucket_key_encoder,
+            kv_format: kv_format.clone(),
+            write_format,
+            row_encoder: RowEncoderFactory::create(kv_format, row_type.clone())?,
+            field_getters,
+            table_info: table_info.clone(),
+        })
+    }
+
+    /// Validates `target_columns` against the schema before a writer is built.
+    /// With no target columns the table must not have auto increment columns. Otherwise every
+    /// index must be in range, all primary keys must be targeted, no auto increment column may
+    /// be targeted, and every other column must be nullable.
+    #[allow(dead_code)]
+    fn sanity_check(
+        row_type: &RowType,
+        primary_keys: &Vec<String>,
+        auto_increment_col_names: &Vec<String>,
+        target_columns: &Option<Arc<Vec<usize>>>,
+    ) -> Result<()> {
+        let Some(columns) = target_columns.as_deref() else {
+            if !auto_increment_col_names.is_empty() {
+                return Err(IllegalArgument {
+                    message: format!(
+                        "This table has auto increment column {}. Explicitly specifying values for an auto increment column is not allowed. Please Specify non-auto-increment columns as target columns using partialUpdate first.",
+                        auto_increment_col_names.join(", ")
+                    ),
+                });
+            }
+            return Ok(());
+        };
+
+        let field_count = row_type.fields().len();
+        let mut target_column_set = bitvec![0; field_count];
+        for &target_index in columns {
+            // Setting a bit past the end of the bit vector panics, so reject it as an error.
+            if target_index >= field_count {
+                return Err(IllegalArgument {
+                    message: format!(
+                        "Invalid target column index: {target_index}. The row type only has {field_count} columns."
+                    ),
+                });
+            }
+            target_column_set.set(target_index, true);
+        }
+
+        let mut pk_column_set = bitvec![0; field_count];
+        // check the target columns contain the primary key
+        for primary_key in primary_keys {
+            match row_type.get_field_index(primary_key.as_str()) {
+                Some(pk_index) => {
+                    if !target_column_set[pk_index] {
+                        return Err(IllegalArgument {
+                            message: format!(
+                                "The target write columns {} must contain the primary key columns {}",
+                                row_type.project(columns)?.get_field_names().join(", "),
+                                primary_keys.join(", ")
+                            ),
+                        });
+                    }
+                    pk_column_set.set(pk_index, true);
+                }
+                None => {
+                    return Err(IllegalArgument {
+                        message: format!(
+                            "The specified primary key {} is not in row type {}",
+                            primary_key, row_type
+                        ),
+                    });
+                }
+            }
+        }
+
+        let mut auto_increment_column_set = bitvec![0; field_count];
+        // explicitly specifying values for an auto increment column is not allowed
+        for auto_increment_col_name in auto_increment_col_names {
+            if let Some(index) = row_type.get_field_index(auto_increment_col_name.as_str()) {
+                if target_column_set[index] {
+                    return Err(IllegalArgument {
+                        message: format!(
+                            "Explicitly specifying values for the auto increment column {} is not allowed.",
+                            auto_increment_col_name
+                        ),
+                    });
+                }
+                auto_increment_column_set.set(index, true);
+            }
+        }
+
+        // every column outside the primary key and the auto increment columns must be nullable
+        for i in 0..field_count {
+            let field = row_type.fields().get(i).unwrap();
+            let exempt = pk_column_set[i] || auto_increment_column_set[i];
+            if !exempt && !field.data_type.is_nullable() {
+                return Err(IllegalArgument {
+                    message: format!(
+                        "Partial Update requires all columns except primary key to be nullable, but column {} is NOT NULL.",
+                        field.name()
+                    ),
+                });
+            }
+        }
+
+        Ok(())
+    }
+}
+
+#[allow(dead_code)]
+impl<RE: RowEncoder> UpsertWriterImpl<RE> {
+    /// Rejects rows whose field count differs from the table's row type.
+    fn check_field_count<R: InternalRow>(&self, row: &R) -> Result<()> {
+        let expected = self.table_info.get_row_type().fields().len();
+        match row.get_field_count() {
+            actual if actual != expected => Err(IllegalArgument {
+                message: format!(
+                    "The field count of the row does not match the table schema. Expected: {}, Actual: {}",
+                    expected, actual
+                ),
+            }),
+            _ => Ok(()),
+        }
+    }
+
+    fn get_keys(&mut self, row: &dyn InternalRow) -> Result<(Bytes, Option<Bytes>)> {
+        let key = self.primary_key_encoder.encode_key(row)?;
+        let bucket_key = match self.bucket_key_encoder.as_mut() {
+            Some(encoder) => encoder.encode_key(row)?,
+            None => key.clone(), // no dedicated bucket key encoder: reuse the primary key bytes
+        };
+        Ok((key, Some(bucket_key)))
+    }
+
+    /// Encodes `row` field by field with the row encoder and returns the finished bytes.
+    fn encode_row<R: InternalRow>(&mut self, row: &R) -> Result<Bytes> {
+        self.row_encoder.start_new_row()?;
+        for (pos, field_getter) in self.field_getters.iter().enumerate() {
+            self.row_encoder.encode_field(pos, field_getter.get_field(row))?;
+        }
+        self.row_encoder.finish_row()
+    }
+}
+
+impl<RE: RowEncoder> TableWriter for UpsertWriterImpl<RE> {
+    /// Flushes records that have been written but not yet sent to the server: forces the client
+    /// to send the pending requests and waits until the requests for those records complete.
+    /// A request is considered completed when it is successfully acknowledged according to
+    /// the CLIENT_WRITER_ACKS configuration option you have specified or else it
+    /// results in an error.
+    async fn flush(&self) -> Result<()> {
+        self.writer_client.flush().await // delegates entirely to the shared writer client
+    }
+}
+
+impl<RE: RowEncoder> UpsertWriter for UpsertWriterImpl<RE> {
+    /// Inserts the row into the Fluss table if it does not exist yet, or updates it if it does.
+    ///
+    /// # Arguments
+    /// * row - the row to upsert; its field count must match the table's row type.
+    ///
+    /// # Returns
+    /// Ok(UpsertResult) once the write has been sent and its result awaited without error
+    async fn upsert<R: InternalRow>(&mut self, row: &R) -> Result<UpsertResult> {
+        self.check_field_count(row)?;
+
+        let (key, bucket_key) = self.get_keys(row)?;
+
+        let row_bytes: RowBytes<'_> = match row.as_encoded_bytes(self.write_format) {
+            Some(bytes) => RowBytes::Borrowed(bytes), // the row already provides encoded bytes
+            None => RowBytes::Owned(self.encode_row(row)?), // otherwise encode it field by field
+        };
+
+        let write_record = WriteRecord::for_upsert(
+            Arc::clone(&self.table_path),
+            self.table_info.schema_id,
+            key,
+            bucket_key,
+            self.write_format,
+            self.target_columns.clone(),
+            Some(row_bytes),
+        );
+
+        let result_handle = self.writer_client.send(&write_record).await?;
+        let result = result_handle.wait().await?;
+
+        result_handle.result(result).map(|_| UpsertResult)
+    }
+
+    /// Deletes the row identified by the input row from the Fluss table. The input row must
+    /// contain the primary key.
+    ///
+    /// # Arguments
+    /// * row - the row to delete; its field count must match the table's row type.
+    ///
+    /// # Returns
+    /// Ok(DeleteResult) once the write has been sent and its result awaited without error
+    async fn delete<R: InternalRow>(&mut self, row: &R) -> Result<DeleteResult> {
+        self.check_field_count(row)?;
+
+        let (key, bucket_key) = self.get_keys(row)?;
+
+        let write_record = WriteRecord::for_upsert(
+            Arc::clone(&self.table_path),
+            self.table_info.schema_id,
+            key,
+            bucket_key,
+            self.write_format,
+            self.target_columns.clone(),
+            None, // a delete attaches no row bytes to the record, only the keys
+        );
+
+        let result_handle = self.writer_client.send(&write_record).await?;
+        let result = result_handle.wait().await?;
+
+        result_handle.result(result).map(|_| DeleteResult)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{DataField, DataTypes};
+
+    #[test]
+    fn sanity_check() {
+        // Case 1: no target columns, but the table has an auto increment column -> rejected
+        let fields = vec![
+            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
+            DataField::new("name".to_string(), DataTypes::string(), None),
+        ];
+        let row_type = RowType::new(fields);
+        let primary_keys = vec!["id".to_string()];
+        let auto_increment_col_names = vec!["id".to_string()];
+        let target_columns = None;
+
+        let result = UpsertWriterFactory::sanity_check(
+            &row_type,
+            &primary_keys,
+            &auto_increment_col_names,
+            &target_columns,
+        );
+
+        assert!(result.unwrap_err().to_string().contains(
+            "This table has auto increment column id. Explicitly specifying values for an auto increment column is not allowed. Please Specify non-auto-increment columns as target columns using partialUpdate first."
+        ));
+
+        // Case 2: target columns ([1] = "name") leave out the primary key "id" -> rejected
+        let fields = vec![
+            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
+            DataField::new("name".to_string(), DataTypes::string(), None),
+            DataField::new("value".to_string(), DataTypes::int(), None),
+        ];
+        let row_type = RowType::new(fields);
+        let primary_keys = vec!["id".to_string()];
+        let auto_increment_col_names = vec![];
+        let target_columns = Some(Arc::new(vec![1usize]));
+
+        let result = UpsertWriterFactory::sanity_check(
+            &row_type,
+            &primary_keys,
+            &auto_increment_col_names,
+            &target_columns,
+        );
+
+        assert!(
+            result
+                .unwrap_err()
+                .to_string()
+                .contains("The target write columns name must contain the primary key columns id")
+        );
+
+        // Case 3: the declared primary key is not a column of the row type -> rejected
+        let fields = vec![
+            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
+            DataField::new("name".to_string(), DataTypes::string(), None),
+        ];
+        let row_type = RowType::new(fields);
+        let primary_keys = vec!["nonexistent_pk".to_string()];
+        let auto_increment_col_names = vec![];
+        let target_columns = Some(Arc::new(vec![0usize, 1]));
+
+        let result = UpsertWriterFactory::sanity_check(
+            &row_type,
+            &primary_keys,
+            &auto_increment_col_names,
+            &target_columns,
+        );
+
+        assert!(
+            result
+                .unwrap_err()
+                .to_string()
+                .contains("The specified primary key nonexistent_pk is not in row type")
+        );
+
+        // Case 4: target columns include the auto increment column "seq" (index 1) -> rejected
+        let fields = vec![
+            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
+            DataField::new(
+                "seq".to_string(),
+                DataTypes::bigint().as_non_nullable(),
+                None,
+            ),
+            DataField::new("name".to_string(), DataTypes::string(), None),
+        ];
+        let row_type = RowType::new(fields);
+        let primary_keys = vec!["id".to_string()];
+        let auto_increment_col_names = vec!["seq".to_string()];
+        let target_columns = Some(Arc::new(vec![0usize, 1, 2]));
+
+        let result = UpsertWriterFactory::sanity_check(
+            &row_type,
+            &primary_keys,
+            &auto_increment_col_names,
+            &target_columns,
+        );
+
+        assert!(result.unwrap_err().to_string().contains(
+            "Explicitly specifying values for the auto increment column seq is not allowed."
+        ));
+
+        // Case 5: a NOT NULL column that is neither primary key nor auto increment -> rejected
+        let fields = vec![
+            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
+            DataField::new(
+                "required_field".to_string(),
+                DataTypes::string().as_non_nullable(),
+                None,
+            ),
+            DataField::new("optional_field".to_string(), DataTypes::int(), None),
+        ];
+        let row_type = RowType::new(fields);
+        let primary_keys = vec!["id".to_string()];
+        let auto_increment_col_names = vec![];
+        let target_columns = Some(Arc::new(vec![0usize]));
+
+        let result = UpsertWriterFactory::sanity_check(
+            &row_type,
+            &primary_keys,
+            &auto_increment_col_names,
+            &target_columns,
+        );
+
+        assert!(result.unwrap_err().to_string().contains(
+            "Partial Update requires all columns except primary key to be nullable, but column required_field is NOT NULL."
+        ));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/writer.rs b/fluss-rust/crates/fluss/src/client/table/writer.rs
index 8a83b5e356..8276545703 100644
--- a/fluss-rust/crates/fluss/src/client/table/writer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/writer.rs
@@ -16,13 +16,13 @@
 // under the License.
 
 use crate::client::{WriteRecord, WriterClient};
-use crate::row::GenericRow;
+use crate::row::{GenericRow, InternalRow};
 use std::sync::Arc;
 
 use crate::error::Result;
 use crate::metadata::{TableInfo, TablePath};
 
-#[allow(dead_code)]
+#[allow(dead_code, async_fn_in_trait)]
 pub trait TableWriter {
     async fn flush(&self) -> Result<()>;
 }
@@ -32,12 +32,22 @@ pub trait AppendWriter: TableWriter {
     async fn append(&self, row: GenericRow) -> Result<()>;
 }
 
-#[allow(dead_code)]
+#[allow(dead_code, async_fn_in_trait)]
 pub trait UpsertWriter: TableWriter {
-    async fn upsert(&self, row: GenericRow) -> Result<()>;
-    async fn delete(&self, row: GenericRow) -> Result<()>;
+    async fn upsert<R: InternalRow>(&mut self, row: &R) -> Result<UpsertResult>;
+    async fn delete<R: InternalRow>(&mut self, row: &R) -> Result<DeleteResult>;
 }
 
+/// The result of upserting a record.
+/// Currently an empty struct, kept so the result can evolve compatibly in the future.
+#[derive(Default)]
+pub struct UpsertResult;
+
+/// The result of deleting a record.
+/// Currently an empty struct, kept so the result can evolve compatibly in the future.
+#[derive(Default)]
+pub struct DeleteResult;
+
 #[allow(dead_code)]
 pub struct AbstractTableWriter {
     table_path: Arc<TablePath>,
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 0afc9d4bc1..fb7b54470d 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -15,8 +15,8 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::client::write::batch::WriteBatch::ArrowLog;
-use crate::client::write::batch::{ArrowLogWriteBatch, WriteBatch};
+use crate::client::write::batch::WriteBatch::{ArrowLog, Kv};
+use crate::client::write::batch::{ArrowLogWriteBatch, KvWriteBatch, WriteBatch};
 use crate::client::{LogWriteRecord, Record, ResultHandle, WriteRecord};
 use crate::cluster::{BucketLocation, Cluster, ServerNode};
 use crate::config::Config;
@@ -102,16 +102,29 @@ impl RecordAccumulator {
 
         let schema_id = table_info.schema_id;
 
-        let mut batch = ArrowLog(ArrowLogWriteBatch::new(
-            self.batch_id.fetch_add(1, Ordering::Relaxed),
-            table_path.as_ref().clone(),
-            schema_id,
-            arrow_compression_info,
-            row_type,
-            bucket_id,
-            current_time_ms(),
-            matches!(&record.record, Record::Log(LogWriteRecord::RecordBatch(_))),
-        ));
+        let mut batch: WriteBatch = match record.record() {
+            Record::Log(_) => ArrowLog(ArrowLogWriteBatch::new(
+                self.batch_id.fetch_add(1, Ordering::Relaxed),
+                table_path.as_ref().clone(),
+                schema_id,
+                arrow_compression_info,
+                row_type,
+                bucket_id,
+                current_time_ms(),
+                matches!(&record.record, Record::Log(LogWriteRecord::RecordBatch(_))),
+            )),
+            Record::Kv(kv_record) => Kv(KvWriteBatch::new(
+                self.batch_id.fetch_add(1, Ordering::Relaxed),
+                table_path.as_ref().clone(),
+                schema_id,
+                // TODO: Decide how to derive write limit in the absence of java's equivalent of PreAllocatedPagedOutputView
+                KvWriteBatch::DEFAULT_WRITE_LIMIT,
+                record.write_format.to_kv_format()?,
+                bucket_id,
+                kv_record.target_columns.clone(),
+                current_time_ms(),
+            )),
+        };
 
         let batch_id = batch.batch_id();
 
@@ -142,6 +155,8 @@ impl RecordAccumulator {
     ) -> Result<RecordAppendResult> {
         let table_path = &record.table_path;
 
+        // TODO: Implement partitioning
+
         let dq = {
             let mut binding = self
                 .write_batches
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index 01597538c8..2ddf5192ed 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -20,11 +20,12 @@ use crate::client::broadcast::{BatchWriteResult, BroadcastOnce};
 use crate::client::{Record, ResultHandle, WriteRecord};
 use crate::compression::ArrowCompressionInfo;
 use crate::error::{Error, Result};
-use crate::metadata::{DataType, KvFormat, TablePath};
+use crate::metadata::{KvFormat, RowType, TablePath};
 use crate::record::MemoryLogRecordsArrowBuilder;
 use crate::record::kv::KvRecordBatchBuilder;
 use bytes::Bytes;
 use std::cmp::max;
+use std::sync::Arc;
 use std::sync::atomic::{AtomicBool, AtomicI32, Ordering};
 
 #[allow(dead_code)]
@@ -192,7 +193,7 @@ impl ArrowLogWriteBatch {
         table_path: TablePath,
         schema_id: i32,
         arrow_compression_info: ArrowCompressionInfo,
-        row_type: &DataType,
+        row_type: &RowType,
         bucket_id: BucketId,
         create_ms: i64,
         to_append_record_batch: bool,
@@ -249,11 +250,12 @@ impl ArrowLogWriteBatch {
 pub struct KvWriteBatch {
     write_batch: InnerWriteBatch,
     kv_batch_builder: KvRecordBatchBuilder,
-    target_columns: Option<Vec<usize>>,
+    target_columns: Option<Arc<Vec<usize>>>,
     schema_id: i32,
 }
 
 impl KvWriteBatch {
+    pub const DEFAULT_WRITE_LIMIT: usize = 256;
     #[allow(clippy::too_many_arguments)]
     pub fn new(
         batch_id: i64,
@@ -262,7 +264,7 @@ impl KvWriteBatch {
         write_limit: usize,
         kv_format: KvFormat,
         bucket_id: BucketId,
-        target_columns: Option<Vec<usize>>,
+        target_columns: Option<Arc<Vec<usize>>>,
         create_ms: i64,
     ) -> Self {
         let base = InnerWriteBatch::new(batch_id, table_path, create_ms, bucket_id);
@@ -284,7 +286,7 @@ impl KvWriteBatch {
             }
         };
 
-        let key = kv_write_record.key;
+        let key = kv_write_record.key.as_ref();
 
         if self.schema_id != write_record.schema_id {
             return Err(Error::UnexpectedError {
@@ -296,7 +298,7 @@ impl KvWriteBatch {
             });
         };
 
-        if self.target_columns.as_deref() != kv_write_record.target_columns {
+        if self.target_columns != kv_write_record.target_columns {
             return Err(Error::UnexpectedError {
                 message: format!(
                     "target columns {:?} of the write record to append are not the same as the current target columns {:?} in the batch.",
@@ -307,14 +309,14 @@ impl KvWriteBatch {
             });
         }
 
-        let row = kv_write_record.compacted_row.as_ref();
+        let row_bytes = kv_write_record.row_bytes();
 
-        if self.is_closed() || !self.kv_batch_builder.has_room_for_row(key, row) {
+        if self.is_closed() || !self.kv_batch_builder.has_room_for_row(key, row_bytes) {
             Ok(None)
         } else {
             // append successfully
             self.kv_batch_builder
-                .append_row(key, row)
+                .append_row(key, row_bytes)
                 .map_err(|e| Error::UnexpectedError {
                     message: "Failed to append row to KvWriteBatch".to_string(),
                     source: Some(Box::new(e)),
diff --git a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
index 2370719efe..817101a41a 100644
--- a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
+++ b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
@@ -20,6 +20,7 @@ use crate::cluster::Cluster;
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::metadata::TablePath;
+use bytes::Bytes;
 use rand::Rng;
 use std::sync::atomic::{AtomicI32, Ordering};
 
@@ -28,7 +29,7 @@ pub trait BucketAssigner: Sync + Send {
 
     fn on_new_batch(&self, cluster: &Cluster, prev_bucket_id: i32);
 
-    fn assign_bucket(&self, bucket_key: Option<&[u8]>, cluster: &Cluster) -> Result<i32>;
+    fn assign_bucket(&self, bucket_key: Option<&Bytes>, cluster: &Cluster) -> Result<i32>;
 }
 
 #[derive(Debug)]
@@ -94,7 +95,7 @@ impl BucketAssigner for StickyBucketAssigner {
         self.next_bucket(cluster, prev_bucket_id);
     }
 
-    fn assign_bucket(&self, _bucket_key: Option<&[u8]>, cluster: &Cluster) -> Result<i32> {
+    fn assign_bucket(&self, _bucket_key: Option<&Bytes>, cluster: &Cluster) -> Result<i32> {
         let bucket_id = self.current_bucket_id.load(Ordering::Relaxed);
         if bucket_id < 0 {
             Ok(self.next_bucket(cluster, bucket_id))
@@ -139,7 +140,7 @@ impl BucketAssigner for HashBucketAssigner {
         // do nothing
     }
 
-    fn assign_bucket(&self, bucket_key: Option<&[u8]>, _: &Cluster) -> Result<i32> {
+    fn assign_bucket(&self, bucket_key: Option<&Bytes>, _: &Cluster) -> Result<i32> {
         let key = bucket_key.ok_or_else(|| IllegalArgument {
             message: "no bucket key provided".to_string(),
         })?;
@@ -181,7 +182,7 @@ mod tests {
         let assigner = HashBucketAssigner::new(4, <dyn BucketingFunction>::of(None));
         let cluster = Cluster::default();
         let bucket = assigner
-            .assign_bucket(Some(b"key"), &cluster)
+            .assign_bucket(Some(&Bytes::from_static(b"key")), &cluster)
             .expect("bucket");
         assert!((0..4).contains(&bucket));
     }
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index 248218e076..dcc6795996 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -21,9 +21,10 @@ mod batch;
 use crate::client::broadcast::{self as client_broadcast, BatchWriteResult, BroadcastOnceReceiver};
 use crate::error::Error;
 use crate::metadata::TablePath;
-use crate::row::{CompactedRow, GenericRow};
+use crate::row::GenericRow;
 pub use accumulator::*;
 use arrow::array::RecordBatch;
+use bytes::Bytes;
 use std::sync::Arc;
 
 pub(crate) mod broadcast;
@@ -40,7 +41,7 @@ pub use writer_client::WriterClient;
 pub struct WriteRecord<'a> {
     record: Record<'a>,
     table_path: Arc<TablePath>,
-    bucket_key: Option<&'a [u8]>,
+    bucket_key: Option<Bytes>,
     schema_id: i32,
     write_format: WriteFormat,
 }
@@ -61,25 +62,43 @@ pub enum LogWriteRecord<'a> {
     RecordBatch(Arc<RecordBatch>),
 }
 
+#[derive(Clone)]
+pub enum RowBytes<'a> {
+    Borrowed(&'a [u8]), // encoded row bytes borrowed for the lifetime `'a`
+    Owned(Bytes), // encoded row bytes held in an owned `Bytes` buffer
+}
+
+impl<'a> RowBytes<'a> {
+    pub fn as_slice(&self) -> &[u8] {
+        match self {
+            RowBytes::Borrowed(slice) => slice, // hand back the borrowed slice as is
+            RowBytes::Owned(bytes) => bytes.as_ref(), // view the owned buffer as a byte slice
+        }
+    }
+}
+
 pub struct KvWriteRecord<'a> {
-    // only valid for primary key table
-    key: &'a [u8],
-    target_columns: Option<&'a [usize]>,
-    compacted_row: Option<CompactedRow<'a>>,
+    key: Bytes,
+    target_columns: Option<Arc<Vec<usize>>>,
+    row_bytes: Option<RowBytes<'a>>,
 }
 
 impl<'a> KvWriteRecord<'a> {
     fn new(
-        key: &'a [u8],
-        target_columns: Option<&'a [usize]>,
-        compacted_row: Option<CompactedRow<'a>>,
+        key: Bytes,
+        target_columns: Option<Arc<Vec<usize>>>,
+        row_bytes: Option<RowBytes<'a>>,
     ) -> Self {
         KvWriteRecord {
             key,
             target_columns,
-            compacted_row,
+            row_bytes,
         }
     }
+
+    pub fn row_bytes(&self) -> Option<&[u8]> {
+        self.row_bytes.as_ref().map(|rb| rb.as_slice())
+    }
 }
 
 impl<'a> WriteRecord<'a> {
@@ -110,17 +129,18 @@ impl<'a> WriteRecord<'a> {
     pub fn for_upsert(
         table_path: Arc<TablePath>,
         schema_id: i32,
-        bucket_key: &'a [u8],
-        key: &'a [u8],
-        target_columns: Option<&'a [usize]>,
-        row: CompactedRow<'a>,
+        key: Bytes,
+        bucket_key: Option<Bytes>,
+        write_format: WriteFormat,
+        target_columns: Option<Arc<Vec<usize>>>,
+        row_bytes: Option<RowBytes<'a>>,
     ) -> Self {
         Self {
-            record: Record::Kv(KvWriteRecord::new(key, target_columns, Some(row))),
+            record: Record::Kv(KvWriteRecord::new(key, target_columns, row_bytes)),
             table_path,
-            bucket_key: Some(bucket_key),
+            bucket_key,
             schema_id,
-            write_format: WriteFormat::CompactedKv,
+            write_format,
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/write_format.rs b/fluss-rust/crates/fluss/src/client/write/write_format.rs
index 4a0c0d8afa..147152cae4 100644
--- a/fluss-rust/crates/fluss/src/client/write/write_format.rs
+++ b/fluss-rust/crates/fluss/src/client/write/write_format.rs
@@ -20,6 +20,7 @@ use crate::error::Result;
 use crate::metadata::KvFormat;
 use std::fmt::Display;
 
+#[derive(Copy, Clone)]
 pub enum WriteFormat {
     ArrowLog,
     CompactedLog,
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index 22e0397212..65b04f5621 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -21,6 +21,7 @@ use crate::client::write::sender::Sender;
 use crate::client::{RecordAccumulator, ResultHandle, WriteRecord};
 use crate::config::Config;
 use crate::metadata::TablePath;
+use bytes::Bytes;
 use dashmap::DashMap;
 use std::sync::Arc;
 use tokio::sync::mpsc;
@@ -90,8 +91,9 @@ impl WriterClient {
     pub async fn send(&self, record: &WriteRecord<'_>) -> Result<ResultHandle> {
         let table_path = &record.table_path;
         let cluster = self.metadata.get_cluster();
+        let bucket_key = record.bucket_key.as_ref();
 
-        let (bucket_assigner, bucket_id) = self.assign_bucket(table_path)?;
+        let (bucket_assigner, bucket_id) = self.assign_bucket(bucket_key, table_path)?;
 
         let mut result = self
             .accumulate
@@ -101,7 +103,7 @@ impl WriterClient {
         if result.abort_record_for_new_batch {
             let prev_bucket_id = bucket_id;
             bucket_assigner.on_new_batch(&cluster, prev_bucket_id);
-            let bucket_id = bucket_assigner.assign_bucket(None, &cluster)?;
+            let bucket_id = bucket_assigner.assign_bucket(bucket_key, &cluster)?;
             result = self
                 .accumulate
                 .append(record, bucket_id, &cluster, false)
@@ -116,6 +118,7 @@ impl WriterClient {
     }
     fn assign_bucket(
         &self,
+        bucket_key: Option<&Bytes>,
         table_path: &Arc<TablePath>,
     ) -> Result<(Arc<Box<dyn BucketAssigner>>, i32)> {
         let cluster = self.metadata.get_cluster();
@@ -129,7 +132,7 @@ impl WriterClient {
                 assigner
             }
         };
-        let bucket_id = bucket_assigner.assign_bucket(None, &cluster)?;
+        let bucket_id = bucket_assigner.assign_bucket(bucket_key, &cluster)?;
         Ok((bucket_assigner, bucket_id))
     }
 
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index da85b0c2da..8204e7c46c 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -16,7 +16,7 @@
 // under the License.
 
 use crate::compression::ArrowCompressionInfo;
-use crate::error::Error::InvalidTableError;
+use crate::error::Error::{IllegalArgument, InvalidTableError};
 use crate::error::{Error, Result};
 use crate::metadata::DataLakeFormat;
 use crate::metadata::datatype::{DataField, DataType, RowType};
@@ -97,8 +97,8 @@ impl PrimaryKey {
 pub struct Schema {
     columns: Vec<Column>,
     primary_key: Option<PrimaryKey>,
-    // must be Row data type kind
-    row_type: DataType,
+    row_type: RowType,
+    auto_increment_col_names: Vec<String>,
 }
 
 impl Schema {
@@ -118,7 +118,7 @@ impl Schema {
         self.primary_key.as_ref()
     }
 
-    pub fn row_type(&self) -> &DataType {
+    pub fn row_type(&self) -> &RowType {
         &self.row_type
     }
 
@@ -144,12 +144,17 @@ impl Schema {
     pub fn column_names(&self) -> Vec<&str> {
         self.columns.iter().map(|c| c.name.as_str()).collect()
     }
+
+    pub fn auto_increment_col_names(&self) -> &Vec<String> {
+        &self.auto_increment_col_names
+    }
 }
 
 #[derive(Debug, Default)]
 pub struct SchemaBuilder {
     columns: Vec<Column>,
     primary_key: Option<PrimaryKey>,
+    auto_increment_col_names: Vec<String>,
 }
 
 impl SchemaBuilder {
@@ -198,9 +203,36 @@ impl SchemaBuilder {
         self
     }
 
+    /// Declares a column to be auto-incremented. With an auto-increment column in the table,
+    /// whenever a new row is inserted into the table, the new row is assigned the next
+    /// available value from the auto-increment sequence. A table can have at most one
+    /// auto-increment column.
+    pub fn enable_auto_increment(mut self, column_name: &str) -> Result<Self> {
+        if !self.auto_increment_col_names.is_empty() {
+            return Err(IllegalArgument {
+                message: "Multiple auto increment columns are not supported yet.".to_string(),
+            });
+        }
+
+        self.auto_increment_col_names.push(column_name.to_string());
+        Ok(self)
+    }
+
     pub fn build(&mut self) -> Result<Schema> {
         let columns = Self::normalize_columns(&mut self.columns, self.primary_key.as_ref())?;
 
+        let column_names: HashSet<_> = columns.iter().map(|c| &c.name).collect();
+        for auto_inc_col in &self.auto_increment_col_names {
+            if !column_names.contains(auto_inc_col) {
+                return Err(IllegalArgument {
+                    message: format!(
+                        "Auto increment column '{}' is not found in the schema columns.",
+                        auto_inc_col
+                    ),
+                });
+            }
+        }
+
         let data_fields = columns
             .iter()
             .map(|c| DataField {
@@ -213,7 +245,8 @@ impl SchemaBuilder {
         Ok(Schema {
             columns,
             primary_key: self.primary_key.clone(),
-            row_type: DataType::Row(RowType::new(data_fields)),
+            row_type: RowType::new(data_fields),
+            auto_increment_col_names: self.auto_increment_col_names.clone(),
         })
     }
 
@@ -500,7 +533,7 @@ impl TableDescriptor {
         bucket_keys.retain(|k| !partition_keys.contains(k));
 
         if bucket_keys.is_empty() {
-            return Err(Error::InvalidTableError {
+            return Err(InvalidTableError {
                 message: format!(
                     "Primary Key constraint {:?} should not be same with partition fields {:?}.",
                     schema.primary_key().unwrap().column_names(),
@@ -580,7 +613,7 @@ pub enum LogFormat {
 }
 
 impl Display for LogFormat {
-    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
         match self {
             LogFormat::ARROW => {
                 write!(f, "ARROW")?;
@@ -612,7 +645,7 @@ pub enum KvFormat {
 }
 
 impl Display for KvFormat {
-    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
         match self {
             KvFormat::COMPACTED => write!(f, "COMPACTED")?,
             KvFormat::INDEXED => write!(f, "INDEXED")?,
@@ -626,7 +659,7 @@ impl KvFormat {
         match s.to_uppercase().as_str() {
             "INDEXED" => Ok(KvFormat::INDEXED),
             "COMPACTED" => Ok(KvFormat::COMPACTED),
-            _ => Err(Error::InvalidTableError {
+            _ => Err(InvalidTableError {
                 message: format!("Unknown kv format: {s}"),
             }),
         }
@@ -692,7 +725,7 @@ pub struct TableInfo {
     pub table_id: i64,
     pub schema_id: i32,
     pub schema: Schema,
-    pub row_type: DataType,
+    pub row_type: RowType,
     pub primary_keys: Vec<String>,
     pub physical_primary_keys: Vec<String>,
     pub bucket_keys: Vec<String>,
@@ -708,10 +741,7 @@ pub struct TableInfo {
 
 impl TableInfo {
     pub fn row_type(&self) -> &RowType {
-        match &self.row_type {
-            DataType::Row(row_type) => row_type,
-            _ => panic!("should be a row type"),
-        }
+        &self.row_type
     }
 }
 
@@ -847,7 +877,7 @@ impl TableInfo {
         &self.schema
     }
 
-    pub fn get_row_type(&self) -> &DataType {
+    pub fn get_row_type(&self) -> &RowType {
         &self.row_type
     }
 
@@ -946,8 +976,8 @@ impl TableInfo {
     }
 }
 
-impl fmt::Display for TableInfo {
-    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+impl Display for TableInfo {
+    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
         write!(
             f,
             "TableInfo{{ table_path={:?}, table_id={}, schema_id={}, schema={:?}, physical_primary_keys={:?}, bucket_keys={:?}, partition_keys={:?}, num_buckets={}, properties={:?}, custom_properties={:?}, comment={:?}, created_time={}, modified_time={} }}",
@@ -998,7 +1028,7 @@ impl TableBucket {
 }
 
 impl Display for TableBucket {
-    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
         if let Some(partition_id) = self.partition_id {
             write!(
                 f,
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 3c46f9b5cd..3c94b7208f 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -18,7 +18,7 @@
 use crate::client::{LogWriteRecord, Record, WriteRecord};
 use crate::compression::ArrowCompressionInfo;
 use crate::error::{Error, Result};
-use crate::metadata::DataType;
+use crate::metadata::{DataType, RowType};
 use crate::record::{ChangeType, ScanRecord};
 use crate::row::{ColumnarRow, GenericRow};
 use arrow::array::{
@@ -48,6 +48,7 @@ use std::{
     sync::Arc,
 };
 
+use crate::error::Error::IllegalArgument;
 use arrow::ipc::writer::IpcWriteOptions;
 /// const for record batch
 pub const BASE_OFFSET_LENGTH: usize = 8;
@@ -171,7 +172,7 @@ pub struct RowAppendRecordBatchBuilder {
 }
 
 impl RowAppendRecordBatchBuilder {
-    pub fn new(row_type: &DataType) -> Self {
+    pub fn new(row_type: &RowType) -> Self {
         let schema_ref = to_arrow_schema(row_type);
         let builders = Mutex::new(
             schema_ref
@@ -251,7 +252,7 @@ impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
 impl MemoryLogRecordsArrowBuilder {
     pub fn new(
         schema_id: i32,
-        row_type: &DataType,
+        row_type: &RowType,
         to_append_record_batch: bool,
         arrow_compression_info: ArrowCompressionInfo,
     ) -> Self {
@@ -329,7 +330,7 @@ impl MemoryLogRecordsArrowBuilder {
         // write arrow batch bytes
         let mut cursor = Cursor::new(&mut batch_bytes[..]);
         cursor.set_position(RECORD_BATCH_HEADER_SIZE as u64);
-        cursor.write_all(real_arrow_batch_bytes).unwrap();
+        cursor.write_all(real_arrow_batch_bytes)?;
 
         let calcute_crc_bytes = &cursor.get_ref()[SCHEMA_ID_OFFSET..];
         // then update crc
@@ -562,16 +563,17 @@ impl LogRecordBatch {
             return Ok(RecordBatch::new_empty(read_context.target_schema.clone()));
         }
 
-        let data = self.data.get(RECORDS_OFFSET..).ok_or_else(|| {
-            crate::error::Error::UnexpectedError {
+        let data = self
+            .data
+            .get(RECORDS_OFFSET..)
+            .ok_or_else(|| Error::UnexpectedError {
                 message: format!(
                     "Corrupt log record batch: data length {} is less than RECORDS_OFFSET {}",
                     self.data.len(),
                     RECORDS_OFFSET
                 ),
                 source: None,
-            }
-        })?;
+            })?;
         read_context.record_batch(data)
     }
 }
@@ -639,27 +641,20 @@ fn parse_ipc_message(
     Ok((batch_metadata, body_buffer, message.version()))
 }
 
-pub fn to_arrow_schema(fluss_schema: &DataType) -> SchemaRef {
-    match &fluss_schema {
-        DataType::Row(row_type) => {
-            let fields: Vec<Field> = row_type
-                .fields()
-                .iter()
-                .map(|f| {
-                    Field::new(
-                        f.name(),
-                        to_arrow_type(f.data_type()),
-                        f.data_type().is_nullable(),
-                    )
-                })
-                .collect();
+pub fn to_arrow_schema(fluss_schema: &RowType) -> SchemaRef {
+    let fields: Vec<Field> = fluss_schema
+        .fields()
+        .iter()
+        .map(|f| {
+            Field::new(
+                f.name(),
+                to_arrow_type(f.data_type()),
+                f.data_type().is_nullable(),
+            )
+        })
+        .collect();
 
-            SchemaRef::new(arrow_schema::Schema::new(fields))
-        }
-        _ => {
-            panic!("must be row data type.")
-        }
-    }
+    SchemaRef::new(arrow_schema::Schema::new(fields))
 }
 
 pub fn to_arrow_type(fluss_type: &DataType) -> ArrowDataType {
@@ -813,7 +808,7 @@ impl ReadContext {
                 let mut reordering_indexes = Vec::with_capacity(projected_fields.len());
                 for &original_idx in &projected_fields {
                     let pos = sorted_fields.binary_search(&original_idx).map_err(|_| {
-                        Error::IllegalArgument {
+                        IllegalArgument {
                             message: format!(
                                 "Projection index {original_idx} is invalid for the current schema."
                             ),
@@ -857,7 +852,7 @@ impl ReadContext {
         let field_count = schema.fields().len();
         for &index in projected_fields {
             if index >= field_count {
-                return Err(Error::IllegalArgument {
+                return Err(IllegalArgument {
                     message: format!(
                         "Projection index {index} is out of bounds for schema with {field_count} fields."
                     ),
@@ -869,7 +864,7 @@ impl ReadContext {
 
     pub fn project_schema(schema: SchemaRef, projected_fields: &[usize]) -> Result<SchemaRef> {
         Ok(SchemaRef::new(schema.project(projected_fields).map_err(
-            |e| Error::IllegalArgument {
+            |e| IllegalArgument {
                 message: format!("Invalid projection: {e}"),
             },
         )?))
@@ -1060,7 +1055,6 @@ pub struct MyVec<T>(pub StreamReader<T>);
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::error::Error;
     use crate::metadata::{DataField, DataTypes};
 
     #[test]
@@ -1217,14 +1211,14 @@ mod tests {
 
     #[test]
     fn projection_rejects_out_of_bounds_index() {
-        let row_type = DataTypes::row(vec![
+        let row_type = RowType::new(vec![
             DataField::new("id".to_string(), DataTypes::int(), None),
             DataField::new("name".to_string(), DataTypes::string(), None),
         ]);
         let schema = to_arrow_schema(&row_type);
         let result = ReadContext::with_projection_pushdown(schema, vec![0, 2], false);
 
-        assert!(matches!(result, Err(Error::IllegalArgument { .. })));
+        assert!(matches!(result, Err(IllegalArgument { .. })));
     }
 
     #[test]
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
index 32f712f82e..eb89d69cda 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
@@ -370,12 +370,12 @@ impl Iterator for KvRecordIterator {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::{DataTypes, KvFormat, RowType};
+    use crate::metadata::{DataTypes, KvFormat};
     use crate::record::kv::test_util::TestReadContext;
     use crate::record::kv::{CURRENT_KV_MAGIC_VALUE, KvRecordBatchBuilder};
     use crate::row::InternalRow;
     use crate::row::binary::BinaryWriter;
-    use crate::row::compacted::CompactedRow;
+
     use bytes::{BufMut, BytesMut};
 
     #[test]
@@ -417,12 +417,11 @@ mod tests {
         let mut value1_writer = CompactedRowWriter::new(1);
         value1_writer.write_bytes(&[1, 2, 3, 4, 5]);
 
-        let row_type = RowType::with_data_types([DataTypes::bytes()].to_vec());
-        let row = &CompactedRow::from_bytes(&row_type, value1_writer.buffer());
-        builder.append_row(key1, Some(row)).unwrap();
+        let row_bytes = value1_writer.buffer();
+        builder.append_row(key1, Some(row_bytes)).unwrap();
 
         let key2 = b"key2";
-        builder.append_row::<CompactedRow>(key2, None).unwrap();
+        builder.append_row(key2, None).unwrap();
 
         let bytes = builder.build().unwrap();
 
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
index e3da8640f7..0b65500fd4 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
@@ -28,7 +28,6 @@ use crate::record::kv::kv_record_batch::{
     WRITE_CLIENT_ID_OFFSET,
 };
 use crate::record::kv::{CURRENT_KV_MAGIC_VALUE, NO_BATCH_SEQUENCE, NO_WRITER_ID};
-use crate::row::BinaryRow;
 use bytes::{Bytes, BytesMut};
 use std::io;
 
@@ -88,14 +87,13 @@ impl KvRecordBatchBuilder {
         }
     }
 
-    /// Check if there is room for a new record containing the given key and row.
+    /// Check if there is room for a new record containing the given key and row bytes.
     /// If no records have been appended, this always returns true.
-    pub fn has_room_for_row<R: BinaryRow>(&self, key: &[u8], row: Option<&R>) -> bool {
-        let value = row.map(|r| r.as_bytes());
-        self.size_in_bytes + KvRecord::size_of(key, value) <= self.write_limit
+    pub fn has_room_for_row(&self, key: &[u8], row_bytes: Option<&[u8]>) -> bool {
+        self.size_in_bytes + KvRecord::size_of(key, row_bytes) <= self.write_limit
     }
 
-    /// Append a KV record with a row value to the batch.
+    /// Append a KV record with row bytes to the batch.
     ///
     /// Returns an error if:
     /// - The builder has been aborted
@@ -103,7 +101,7 @@ impl KvRecordBatchBuilder {
     /// - Adding this record would exceed the write limit
     /// - The maximum number of records is exceeded
     /// - The KV format is not COMPACTED
-    pub fn append_row<R: BinaryRow>(&mut self, key: &[u8], row: Option<&R>) -> io::Result<()> {
+    pub fn append_row(&mut self, key: &[u8], row_bytes: Option<&[u8]>) -> io::Result<()> {
         if self.kv_format != KvFormat::COMPACTED {
             return Err(io::Error::new(
                 io::ErrorKind::InvalidInput,
@@ -134,8 +132,7 @@ impl KvRecordBatchBuilder {
             ));
         }
 
-        let value = row.map(|r| r.as_bytes());
-        let record_size = KvRecord::size_of(key, value);
+        let record_size = KvRecord::size_of(key, row_bytes);
         if self.size_in_bytes + record_size > self.write_limit {
             return Err(io::Error::new(
                 io::ErrorKind::WriteZero,
@@ -146,7 +143,7 @@ impl KvRecordBatchBuilder {
             ));
         }
 
-        let record_byte_size = KvRecord::write_to_buf(&mut self.buffer, key, value)?;
+        let record_byte_size = KvRecord::write_to_buf(&mut self.buffer, key, row_bytes)?;
         debug_assert_eq!(record_byte_size, record_size, "Record size mismatch");
 
         self.current_record_number += 1;
@@ -349,12 +346,12 @@ mod tests {
 
         let key1 = b"key1";
         let value1 = create_test_row(b"value1");
-        assert!(builder.has_room_for_row(key1, Some(&value1)));
-        builder.append_row(key1, Some(&value1)).unwrap();
+        assert!(builder.has_room_for_row(key1, Some(value1.as_bytes())));
+        builder.append_row(key1, Some(value1.as_bytes())).unwrap();
 
         let key2 = b"key2";
-        assert!(builder.has_room_for_row::<CompactedRow>(key2, None));
-        builder.append_row::<CompactedRow>(key2, None).unwrap();
+        assert!(builder.has_room_for_row(key2, None));
+        builder.append_row(key2, None).unwrap();
 
         builder.close().unwrap();
         assert!(builder.is_closed());
@@ -369,35 +366,34 @@ mod tests {
         // Test lifecycle: abort behavior
         let mut builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
         let value = create_test_row(b"value");
-        builder.append_row(b"key", Some(&value)).unwrap();
+        builder.append_row(b"key", Some(value.as_bytes())).unwrap();
         builder.abort();
-        assert!(builder.append_row::<CompactedRow>(b"key2", None).is_err());
+        assert!(builder.append_row(b"key2", None).is_err());
         assert!(builder.build().is_err());
         assert!(builder.close().is_err());
 
         // Test lifecycle: close behavior
         let mut builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
         let value = create_test_row(b"value");
-        builder.append_row(b"key", Some(&value)).unwrap();
+        builder.append_row(b"key", Some(value.as_bytes())).unwrap();
         builder.close().unwrap();
-        assert!(builder.append_row::<CompactedRow>(b"key2", None).is_err());
+        assert!(builder.append_row(b"key2", None).is_err());
         assert!(builder.build().is_ok());
 
         // Test KvFormat validation
         let mut row_writer = CompactedRowWriter::new(1);
         row_writer.write_int(42);
-        let row_type = RowType::with_data_types(vec![DataTypes::int()]);
-        let row = &CompactedRow::from_bytes(&row_type, row_writer.buffer());
+        let row_bytes = row_writer.buffer();
 
         // INDEXED format should reject append_row
         let mut indexed_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::INDEXED);
-        let result = indexed_builder.append_row(b"key", Some(row));
+        let result = indexed_builder.append_row(b"key", Some(row_bytes));
         assert!(result.is_err());
         assert_eq!(result.unwrap_err().kind(), io::ErrorKind::InvalidInput);
 
         // COMPACTED format should accept append_row
         let mut compacted_builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
-        let result = compacted_builder.append_row(b"key", Some(row));
+        let result = compacted_builder.append_row(b"key", Some(row_bytes));
         assert!(result.is_ok());
     }
 
@@ -410,15 +406,17 @@ mod tests {
         let large_key = vec![0u8; 1000];
         let large_value = vec![1u8; 1000];
         let large_row = create_test_row(&large_value);
-        assert!(!builder.has_room_for_row(&large_key, Some(&large_row)));
+        assert!(!builder.has_room_for_row(&large_key, Some(large_row.as_bytes())));
         let small_value = create_test_row(b"value");
-        assert!(builder.has_room_for_row(b"key", Some(&small_value)));
+        assert!(builder.has_room_for_row(b"key", Some(small_value.as_bytes())));
 
         // Test append enforcement - add small record first
-        builder.append_row(b"key", Some(&small_value)).unwrap();
+        builder
+            .append_row(b"key", Some(small_value.as_bytes()))
+            .unwrap();
 
         // Try to add large record that exceeds limit (reuse large_row from above)
-        let result = builder.append_row(b"key2", Some(&large_row));
+        let result = builder.append_row(b"key2", Some(large_row.as_bytes()));
         assert!(result.is_err());
         assert_eq!(result.unwrap_err().kind(), io::ErrorKind::WriteZero);
     }
@@ -429,10 +427,12 @@ mod tests {
         builder.current_record_number = i32::MAX - 1;
 
         let value1 = create_test_row(b"value1");
-        builder.append_row(b"key1", Some(&value1)).unwrap();
+        builder
+            .append_row(b"key1", Some(value1.as_bytes()))
+            .unwrap();
 
         let value2 = create_test_row(b"value2");
-        let result = builder.append_row(b"key2", Some(&value2));
+        let result = builder.append_row(b"key2", Some(value2.as_bytes()));
         assert!(result.is_err());
         assert_eq!(result.unwrap_err().kind(), io::ErrorKind::InvalidInput);
     }
@@ -452,13 +452,17 @@ mod tests {
         builder.set_writer_state(100, 5);
 
         let value1 = create_test_row(b"value1");
-        builder.append_row(b"key1", Some(&value1)).unwrap();
+        builder
+            .append_row(b"key1", Some(value1.as_bytes()))
+            .unwrap();
         let bytes1 = builder.build().unwrap();
         let len1 = bytes1.len();
 
         // Append another record - this should invalidate the cache
         let value2 = create_test_row(b"value2");
-        builder.append_row(b"key2", Some(&value2)).unwrap();
+        builder
+            .append_row(b"key2", Some(value2.as_bytes()))
+            .unwrap();
         let bytes2 = builder.build().unwrap();
         let len2 = bytes2.len();
 
@@ -472,7 +476,7 @@ mod tests {
         let mut builder = KvRecordBatchBuilder::new(1, 4096, KvFormat::COMPACTED);
         builder.set_writer_state(100, 5);
         let value = create_test_row(b"value");
-        builder.append_row(b"key", Some(&value)).unwrap();
+        builder.append_row(b"key", Some(value.as_bytes())).unwrap();
         let bytes1 = builder.build().unwrap();
 
         // Change writer state - this should invalidate the cache
@@ -494,7 +498,6 @@ mod tests {
     fn test_builder_with_compacted_row_writer() -> crate::error::Result<()> {
         use crate::record::kv::KvRecordBatch;
         use crate::row::InternalRow;
-        use crate::row::compacted::CompactedRow;
 
         let mut builder = KvRecordBatchBuilder::new(1, 100000, KvFormat::COMPACTED);
         builder.set_writer_state(100, 5);
@@ -504,26 +507,25 @@ mod tests {
         row_writer1.write_int(42);
         row_writer1.write_string("hello");
 
-        let row_type = RowType::with_data_types([DataTypes::int(), DataTypes::string()].to_vec());
-        let row1 = &CompactedRow::from_bytes(&row_type, row_writer1.buffer());
+        let row_bytes1 = row_writer1.buffer();
 
         let key1 = b"key1";
-        assert!(builder.has_room_for_row(key1, Some(row1)));
-        builder.append_row(key1, Some(row1))?;
+        assert!(builder.has_room_for_row(key1, Some(row_bytes1)));
+        builder.append_row(key1, Some(row_bytes1))?;
 
         // Create and append second record
         let mut row_writer2 = CompactedRowWriter::new(2);
         row_writer2.write_int(100);
         row_writer2.write_string("world");
 
-        let row2 = &CompactedRow::from_bytes(&row_type, row_writer2.buffer());
+        let row_bytes2 = row_writer2.buffer();
 
         let key2 = b"key2";
-        builder.append_row(key2, Some(row2))?;
+        builder.append_row(key2, Some(row_bytes2))?;
 
         // Append a deletion record
         let key3 = b"key3";
-        builder.append_row::<CompactedRow>(key3, None)?;
+        builder.append_row(key3, None)?;
 
         // Build and verify
         builder.close()?;
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
index fe6c6f0598..9236321668 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
@@ -18,7 +18,7 @@
 //! Default implementation of ReadContext with decoder caching.
 
 use super::ReadContext;
-use crate::error::{Error, Result};
+use crate::error::Result;
 use crate::metadata::{KvFormat, Schema};
 use crate::row::{RowDecoder, RowDecoderFactory};
 use std::collections::HashMap;
@@ -85,20 +85,7 @@ impl ReadContext for KvRecordReadContext {
 
         // Build decoder outside the lock to avoid blocking other threads
         let schema = self.schema_getter.get_schema(schema_id)?;
-        let row_type = match schema.row_type() {
-            crate::metadata::DataType::Row(row_type) => row_type.clone(),
-            other => {
-                return Err(Error::IoUnexpectedError {
-                    message: format!(
-                        "Schema {schema_id} has invalid row type: expected Row, got {other:?}"
-                    ),
-                    source: std::io::Error::new(
-                        std::io::ErrorKind::InvalidData,
-                        "Invalid row type",
-                    ),
-                });
-            }
-        };
+        let row_type = schema.row_type().clone();
 
         // Create decoder outside lock
         let decoder = RowDecoderFactory::create(self.kv_format.clone(), row_type)?;
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index bc68ea10e5..35d684db6f 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -15,9 +15,10 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::client::WriteFormat;
 use crate::metadata::RowType;
 use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
-use crate::row::{BinaryRow, GenericRow, InternalRow};
+use crate::row::{GenericRow, InternalRow};
 use std::sync::{Arc, OnceLock};
 
 // Reference implementation:
@@ -69,10 +70,8 @@ impl<'a> CompactedRow<'a> {
         self.decoded_row
             .get_or_init(|| self.deserializer.deserialize(&self.reader))
     }
-}
 
-impl BinaryRow for CompactedRow<'_> {
-    fn as_bytes(&self) -> &[u8] {
+    pub fn as_bytes(&self) -> &[u8] {
         self.data
     }
 }
@@ -153,6 +152,14 @@ impl<'a> InternalRow for CompactedRow<'a> {
     fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampLtz {
         self.decoded_row().get_timestamp_ltz(pos, precision)
     }
+
+    fn as_encoded_bytes(&self, write_format: WriteFormat) -> Option<&[u8]> {
+        match write_format {
+            WriteFormat::CompactedKv => Some(self.as_bytes()),
+            WriteFormat::ArrowLog => None,
+            WriteFormat::CompactedLog => None,
+        }
+    }
 }
 
 #[cfg(test)]
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
index d1ad047a72..ac0100eefb 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -63,6 +63,18 @@ impl CompactedRowWriter {
         Bytes::copy_from_slice(&self.buffer[..self.position])
     }
 
+    /// Flushes the writer's `BytesMut` buffer, resets the writer's internal state, and returns the flushed contents as `Bytes`.
+    pub fn flush_bytes(&mut self) -> Bytes {
+        let used = self.buffer.split_to(self.position);
+        self.position = self.header_size_in_bytes;
+        if self.buffer.len() < self.header_size_in_bytes {
+            self.buffer.resize(self.header_size_in_bytes.max(64), 0);
+        } else {
+            self.buffer[..self.header_size_in_bytes].fill(0);
+        }
+        used.freeze()
+    }
+
     fn ensure_capacity(&mut self, need_len: usize) {
         if (self.buffer.len() - self.position) < need_len {
             let new_len = cmp::max(self.buffer.len() * 2, self.buffer.len() + need_len);
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs
index 48b9f3ff58..20f28820cf 100644
--- a/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_row_encoder.rs
@@ -20,8 +20,9 @@ use crate::error::Result;
 use crate::metadata::RowType;
 use crate::row::Datum;
 use crate::row::binary::{BinaryRowFormat, BinaryWriter, ValueWriter};
-use crate::row::compacted::{CompactedRow, CompactedRowDeserializer, CompactedRowWriter};
-use crate::row::encode::{BinaryRow, RowEncoder};
+use crate::row::compacted::{CompactedRowDeserializer, CompactedRowWriter};
+use crate::row::encode::RowEncoder;
+use bytes::Bytes;
 use std::sync::Arc;
 
 #[allow(dead_code)]
@@ -65,12 +66,8 @@ impl RowEncoder for CompactedRowEncoder<'_> {
             .write_value(&mut self.writer, pos, &value)
     }
 
-    fn finish_row(&mut self) -> Result<impl BinaryRow> {
-        Ok(CompactedRow::deserialize(
-            Arc::clone(&self.compacted_row_deserializer),
-            self.arity,
-            self.writer.buffer(),
-        ))
+    fn finish_row(&mut self) -> Result<Bytes> {
+        Ok(self.writer.flush_bytes())
     }
 
     fn close(&mut self) -> Result<()> {
diff --git a/fluss-rust/crates/fluss/src/row/encode/mod.rs b/fluss-rust/crates/fluss/src/row/encode/mod.rs
index c294ecf1d1..468d4d182b 100644
--- a/fluss-rust/crates/fluss/src/row/encode/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/mod.rs
@@ -22,7 +22,7 @@ use crate::error::Result;
 use crate::metadata::{DataLakeFormat, KvFormat, RowType};
 use crate::row::encode::compacted_key_encoder::CompactedKeyEncoder;
 use crate::row::encode::compacted_row_encoder::CompactedRowEncoder;
-use crate::row::{BinaryRow, Datum, InternalRow};
+use crate::row::{Datum, InternalRow};
 use bytes::Bytes;
 
 /// An interface for encoding key of row into bytes.
@@ -31,8 +31,9 @@ pub trait KeyEncoder {
     fn encode_key(&mut self, row: &dyn InternalRow) -> Result<Bytes>;
 }
 
-#[allow(dead_code)]
-impl dyn KeyEncoder {
+pub struct KeyEncoderFactory;
+
+impl KeyEncoderFactory {
     /// Create a key encoder to encode the key bytes of the input row.
     /// # Arguments
     /// * `row_type` - the row type of the input row
@@ -43,23 +44,21 @@ impl dyn KeyEncoder {
     /// key encoder
     pub fn of(
         row_type: &RowType,
-        key_fields: Vec<String>,
-        data_lake_format: Option<DataLakeFormat>,
+        key_fields: &[String],
+        data_lake_format: &Option<DataLakeFormat>,
     ) -> Result<Box<dyn KeyEncoder>> {
         match data_lake_format {
             Some(DataLakeFormat::Paimon) => {
                 unimplemented!("KeyEncoder for Paimon format is currently unimplemented")
             }
             Some(DataLakeFormat::Lance) => Ok(Box::new(CompactedKeyEncoder::create_key_encoder(
-                row_type,
-                key_fields.as_slice(),
+                row_type, key_fields,
             )?)),
             Some(DataLakeFormat::Iceberg) => {
                 unimplemented!("KeyEncoder for Iceberg format is currently unimplemented")
             }
             None => Ok(Box::new(CompactedKeyEncoder::create_key_encoder(
-                row_type,
-                key_fields.as_slice(),
+                row_type, key_fields,
             )?)),
         }
     }
@@ -96,7 +95,7 @@ pub trait RowEncoder {
     ///
     /// # Returns
     /// * the written row
-    fn finish_row(&mut self) -> Result<impl BinaryRow>;
+    fn finish_row(&mut self) -> Result<Bytes>;
 
     /// Closes the row encoder
     ///
@@ -110,8 +109,8 @@ pub struct RowEncoderFactory {}
 
 #[allow(dead_code)]
 impl RowEncoderFactory {
-    pub fn create(kv_format: KvFormat, row_type: &RowType) -> Result<impl RowEncoder> {
-        Self::create_for_field_types(kv_format, row_type.clone())
+    pub fn create(kv_format: KvFormat, row_type: RowType) -> Result<impl RowEncoder> {
+        Self::create_for_field_types(kv_format, row_type)
     }
 
     pub fn create_for_field_types(
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index d2f640e4dc..bc8134dde6 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -23,9 +23,11 @@ mod decimal;
 pub mod binary;
 pub mod compacted;
 pub mod encode;
-mod field_getter;
+pub mod field_getter;
 mod row_decoder;
 
+use crate::client::WriteFormat;
+use bytes::Bytes;
 pub use column::*;
 pub use compacted::CompactedRow;
 pub use datum::*;
@@ -33,9 +35,23 @@ pub use decimal::{Decimal, MAX_COMPACT_PRECISION};
 pub use encode::KeyEncoder;
 pub use row_decoder::{CompactedRowDecoder, RowDecoder, RowDecoderFactory};
 
-pub trait BinaryRow: InternalRow {
+pub struct BinaryRow<'a> {
+    data: BinaryDataWrapper<'a>,
+}
+
+pub enum BinaryDataWrapper<'a> {
+    Bytes(Bytes),
+    Ref(&'a [u8]),
+}
+
+impl<'a> BinaryRow<'a> {
     /// Returns the binary representation of this row as a byte slice.
-    fn as_bytes(&self) -> &[u8];
+    pub fn as_bytes(&self) -> &[u8] {
+        match &self.data {
+            BinaryDataWrapper::Bytes(bytes) => bytes.as_ref(),
+            BinaryDataWrapper::Ref(r) => r,
+        }
+    }
 }
 
 // TODO make functions return Result<?> for better error handling
@@ -99,6 +115,11 @@ pub trait InternalRow {
 
     /// Returns the binary value at the given position
     fn get_bytes(&self, pos: usize) -> &[u8];
+
+    /// Returns this row's bytes when it is already encoded in `_write_format`; this default implementation always returns `None`.
+    fn as_encoded_bytes(&self, _write_format: WriteFormat) -> Option<&[u8]> {
+        None
+    }
 }
 
 pub struct GenericRow<'a> {

From d263743b060b5771b78b6a58a199396e82ab08c2 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Tue, 20 Jan 2026 15:56:22 +0000
Subject: [PATCH 077/287] feat: Introduce Kv table example (#181)

---
 fluss-rust/crates/examples/Cargo.toml         |   6 +-
 .../crates/examples/src/example_kv_table.rs   | 116 ++++++++++++++++++
 .../crates/examples/src/example_table.rs      |   2 +
 fluss-rust/crates/fluss/src/row/mod.rs        |   1 +
 4 files changed, 124 insertions(+), 1 deletion(-)
 create mode 100644 fluss-rust/crates/examples/src/example_kv_table.rs

diff --git a/fluss-rust/crates/examples/Cargo.toml b/fluss-rust/crates/examples/Cargo.toml
index e1fa531764..117ceb2708 100644
--- a/fluss-rust/crates/examples/Cargo.toml
+++ b/fluss-rust/crates/examples/Cargo.toml
@@ -29,4 +29,8 @@ tokio = { workspace = true }
 clap = { workspace = true }
 [[example]]
 name = "example-table"
-path = "src/example_table.rs"
\ No newline at end of file
+path = "src/example_table.rs"
+
+[[example]]
+name = "example-upsert-lookup"
+path = "src/example_kv_table.rs"
\ No newline at end of file
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
new file mode 100644
index 0000000000..75821a37e6
--- /dev/null
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -0,0 +1,116 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use clap::Parser;
+use fluss::client::{FlussConnection, UpsertWriter};
+use fluss::config::Config;
+use fluss::error::Result;
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+use fluss::row::{GenericRow, InternalRow};
+
+#[tokio::main]
+#[allow(dead_code)]
+pub async fn main() -> Result<()> {
+    let mut config = Config::parse();
+    config.bootstrap_server = Some("127.0.0.1:9123".to_string());
+
+    let conn = FlussConnection::new(config).await?;
+
+    let table_descriptor = TableDescriptor::builder()
+        .schema(
+            Schema::builder()
+                .column("id", DataTypes::int())
+                .column("name", DataTypes::string())
+                .column("age", DataTypes::bigint())
+                .primary_key(vec!["id".to_string()])
+                .build()?,
+        )
+        .build()?;
+
+    let table_path = TablePath::new("fluss".to_owned(), "rust_upsert_lookup_example".to_owned());
+
+    let admin = conn.get_admin().await?;
+    admin
+        .create_table(&table_path, &table_descriptor, true)
+        .await?;
+    println!(
+        "Created KV Table:\n {}\n",
+        admin.get_table(&table_path).await?
+    );
+
+    let table = conn.get_table(&table_path).await?;
+    let table_upsert = table.new_upsert()?;
+    let mut upsert_writer = table_upsert.create_writer()?;
+
+    println!("\n=== Upserting ===");
+    for (id, name, age) in [(1, "Verso", 32i64), (2, "Noco", 25), (3, "Esquie", 35)] {
+        let mut row = GenericRow::new();
+        row.set_field(0, id);
+        row.set_field(1, name);
+        row.set_field(2, age);
+        upsert_writer.upsert(&row).await?;
+        println!("Upserted: {row:?}");
+    }
+
+    println!("\n=== Looking up ===");
+    let mut lookuper = table.new_lookup()?.create_lookuper()?;
+
+    for id in 1..=2 {
+        let result = lookuper.lookup(&make_key(id)).await?;
+        let row = result.get_single_row()?.unwrap();
+        println!(
+            "Found id={id}: name={}, age={}",
+            row.get_string(1),
+            row.get_long(2)
+        );
+    }
+
+    println!("\n=== Updating ===");
+    let mut row = GenericRow::new();
+    row.set_field(0, 1);
+    row.set_field(1, "Verso");
+    row.set_field(2, 33i64);
+    upsert_writer.upsert(&row).await?;
+    println!("Updated: {row:?}");
+
+    let result = lookuper.lookup(&make_key(1)).await?;
+    let row = result.get_single_row()?.unwrap();
+    println!(
+        "Verified update: name={}, age={}",
+        row.get_string(1),
+        row.get_long(2)
+    );
+
+    println!("\n=== Deleting ===");
+    let mut row = GenericRow::new();
+    row.set_field(0, 2);
+    upsert_writer.delete(&row).await?;
+    println!("Deleted: {row:?}");
+
+    let result = lookuper.lookup(&make_key(2)).await?;
+    if result.get_single_row()?.is_none() {
+        println!("Verified deletion");
+    }
+
+    Ok(())
+}
+
+fn make_key(id: i32) -> GenericRow<'static> {
+    let mut row = GenericRow::new();
+    row.set_field(0, id);
+    row
+}
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index 2d6ac53d8f..7333056feb 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -15,6 +15,8 @@
 // specific language governing permissions and limitations
 // under the License.
 
+mod example_kv_table;
+
 use clap::Parser;
 use fluss::client::FlussConnection;
 use fluss::config::Config;
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index bc8134dde6..81a425408f 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -122,6 +122,7 @@ pub trait InternalRow {
     }
 }
 
+#[derive(Debug)]
 pub struct GenericRow<'a> {
     pub values: Vec<Datum<'a>>,
 }

From 76029f7d61b1d34b8b3dba35f0b5dc4ba4a67070 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Wed, 21 Jan 2026 01:50:55 +0000
Subject: [PATCH 078/287] feat: KvWriteBatch wiring in Sender (#184)

---
 .../crates/examples/src/example_kv_table.rs   |   4 +-
 .../crates/fluss/src/client/write/batch.rs    |   4 +
 .../crates/fluss/src/client/write/sender.rs   | 248 +++++++++++++-----
 .../crates/fluss/src/rpc/message/mod.rs       |   1 +
 4 files changed, 197 insertions(+), 60 deletions(-)

diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 75821a37e6..dcf7db8f05 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -69,7 +69,7 @@ pub async fn main() -> Result<()> {
     println!("\n=== Looking up ===");
     let mut lookuper = table.new_lookup()?.create_lookuper()?;
 
-    for id in 1..=2 {
+    for id in 1..=3 {
         let result = lookuper.lookup(&make_key(id)).await?;
         let row = result.get_single_row()?.unwrap();
         println!(
@@ -98,6 +98,8 @@ pub async fn main() -> Result<()> {
     println!("\n=== Deleting ===");
     let mut row = GenericRow::new();
     row.set_field(0, 2);
+    row.set_field(1, "");
+    row.set_field(2, 0i64);
     upsert_writer.delete(&row).await?;
     println!("Deleted: {row:?}");
 
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index 2ddf5192ed..159e3136e8 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -336,6 +336,10 @@ impl KvWriteBatch {
     pub fn close(&mut self) -> Result<()> {
         self.kv_batch_builder.close()
     }
+
+    pub fn target_columns(&self) -> Option<&Arc<Vec<usize>>> {
+        self.target_columns.as_ref()
+    }
 }
 
 #[cfg(test)]
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index 7ea24e30f6..ceed245621 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -17,11 +17,16 @@
 
 use crate::client::broadcast;
 use crate::client::metadata::Metadata;
+use crate::client::write::batch::WriteBatch;
 use crate::client::{ReadyWriteBatch, RecordAccumulator};
+use crate::error::Error::UnexpectedError;
 use crate::error::{FlussError, Result};
 use crate::metadata::{TableBucket, TablePath};
-use crate::proto::ProduceLogResponse;
-use crate::rpc::message::ProduceLogRequest;
+use crate::proto::{
+    PbProduceLogRespForBucket, PbPutKvRespForBucket, ProduceLogResponse, PutKvResponse,
+};
+use crate::rpc::ServerConnection;
+use crate::rpc::message::{ProduceLogRequest, PutKvRequest};
 use log::warn;
 use parking_lot::Mutex;
 use std::collections::{HashMap, HashSet};
@@ -182,23 +187,22 @@ impl Sender {
                 .iter()
                 .filter_map(|bucket| records_by_bucket.remove(bucket))
                 .collect();
+
             if request_batches.is_empty() {
                 continue;
             }
-            let request = match ProduceLogRequest::new(
+
+            let write_request = match Self::build_write_request(
                 table_id,
                 acks,
                 self.max_request_timeout_ms,
                 &mut request_batches,
             ) {
-                Ok(request) => request,
+                Ok(req) => req,
                 Err(e) => {
                     self.handle_batches_with_local_error(
-                        table_buckets
-                            .iter()
-                            .filter_map(|bucket| records_by_bucket.remove(bucket))
-                            .collect(),
-                        format!("Failed to build produce request: {e}"),
+                        request_batches,
+                        format!("Failed to build write request: {e}"),
                     )
                     .await?;
                     continue;
@@ -211,27 +215,12 @@ impl Sender {
                 records_by_bucket.insert(request_batch.table_bucket.clone(), request_batch);
             }
 
-            let response = match connection.request(request).await {
-                Ok(response) => response,
-                Err(e) => {
-                    self.handle_batches_with_error(
-                        table_buckets
-                            .iter()
-                            .filter_map(|bucket| records_by_bucket.remove(bucket))
-                            .collect(),
-                        FlussError::NetworkException,
-                        format!("Failed to send produce request: {e}"),
-                    )
-                    .await?;
-                    continue;
-                }
-            };
-
-            self.handle_produce_response(
+            self.send_and_handle_response(
+                &connection,
+                write_request,
                 table_id,
                 &table_buckets,
                 &mut records_by_bucket,
-                response,
             )
             .await?;
         }
@@ -239,50 +228,120 @@ impl Sender {
         Ok(())
     }
 
-    async fn handle_produce_response(
+    fn build_write_request(
+        table_id: i64,
+        acks: i16,
+        timeout_ms: i32,
+        request_batches: &mut [ReadyWriteBatch],
+    ) -> Result<WriteRequest> {
+        let first_batch = &request_batches.first().unwrap().write_batch;
+
+        let request = match first_batch {
+            WriteBatch::ArrowLog(_) => {
+                let req = ProduceLogRequest::new(table_id, acks, timeout_ms, request_batches)?;
+                WriteRequest::ProduceLog(req)
+            }
+            WriteBatch::Kv(kv_write_batch) => {
+                let target_columns = kv_write_batch.target_columns();
+                for batch in request_batches.iter().skip(1) {
+                    match &batch.write_batch {
+                        WriteBatch::ArrowLog(_) => {
+                            return Err(UnexpectedError {
+                                message: "Expecting KvWriteBatch but found ArrowLogWriteBatch"
+                                    .to_string(),
+                                source: None,
+                            });
+                        }
+                        WriteBatch::Kv(kvb) => {
+                            if target_columns != kvb.target_columns() {
+                                return Err(UnexpectedError {
+                                    message: format!(
+                                        "All the write batches to make put kv request should have the same target columns, but got {:?} and {:?}.",
+                                        target_columns,
+                                        kvb.target_columns()
+                                    ),
+                                    source: None,
+                                });
+                            }
+                        }
+                    }
+                }
+                let cols = target_columns
+                    .map(|arc| arc.iter().map(|&c| c as i32).collect())
+                    .unwrap_or_default();
+                let req = PutKvRequest::new(table_id, acks, timeout_ms, cols, request_batches)?;
+                WriteRequest::PutKv(req)
+            }
+        };
+
+        Ok(request)
+    }
+
+    async fn send_and_handle_response(
+        &self,
+        connection: &ServerConnection,
+        write_request: WriteRequest,
+        table_id: i64,
+        table_buckets: &[TableBucket],
+        records_by_bucket: &mut HashMap<TableBucket, ReadyWriteBatch>,
+    ) -> Result<()> {
+        macro_rules! send {
+            ($request:expr) => {
+                match connection.request($request).await {
+                    Ok(response) => {
+                        self.handle_write_response(
+                            table_id,
+                            table_buckets,
+                            records_by_bucket,
+                            response,
+                        )
+                        .await
+                    }
+                    Err(e) => {
+                        self.handle_batches_with_error(
+                            table_buckets
+                                .iter()
+                                .filter_map(|b| records_by_bucket.remove(b))
+                                .collect(),
+                            FlussError::NetworkException,
+                            format!("Failed to send write request: {e}"),
+                        )
+                        .await
+                    }
+                }
+            };
+        }
+
+        match write_request {
+            WriteRequest::ProduceLog(req) => send!(req),
+            WriteRequest::PutKv(req) => send!(req),
+        }
+    }
+
+    async fn handle_write_response<R: WriteResponse>(
         &self,
         table_id: i64,
         request_buckets: &[TableBucket],
         records_by_bucket: &mut HashMap<TableBucket, ReadyWriteBatch>,
-        response: ProduceLogResponse,
+        response: R,
     ) -> Result<()> {
         let mut invalid_metadata_tables: HashSet<TablePath> = HashSet::new();
         let mut pending_buckets: HashSet<TableBucket> = request_buckets.iter().cloned().collect();
-        for produce_log_response_for_bucket in response.buckets_resp.iter() {
-            let tb = TableBucket::new(table_id, produce_log_response_for_bucket.bucket_id);
 
+        for bucket_resp in response.buckets_resp() {
+            let tb = TableBucket::new(table_id, bucket_resp.bucket_id());
             let Some(ready_batch) = records_by_bucket.remove(&tb) else {
                 panic!("Missing ready batch for table bucket {tb}");
             };
             pending_buckets.remove(&tb);
 
-            if let Some(error_code) = produce_log_response_for_bucket.error_code {
-                if error_code == FlussError::None.code() {
-                    self.complete_batch(ready_batch);
-                    continue;
-                }
-
-                let error = FlussError::for_code(error_code);
-                let message = produce_log_response_for_bucket
-                    .error_message
-                    .clone()
-                    .unwrap_or_else(|| error.message().to_string());
-                if let Some(table_path) = self
-                    .handle_write_batch_error(ready_batch, error, message)
-                    .await?
-                {
-                    invalid_metadata_tables.insert(table_path);
-                }
-            } else {
-                self.complete_batch(ready_batch)
-            }
-        }
-        if !pending_buckets.is_empty() {
-            for bucket in pending_buckets {
-                if let Some(ready_batch) = records_by_bucket.remove(&bucket) {
-                    let message =
-                        format!("Missing response for table bucket {bucket} in produce response.");
-                    let error = FlussError::UnknownServerError;
+            match bucket_resp.error_code() {
+                Some(code) if code != FlussError::None.code() => {
+                    let error = FlussError::for_code(code);
+                    let message = bucket_resp
+                        .error_message()
+                        .cloned()
+                        .unwrap_or_else(|| error.message().to_string());
                     if let Some(table_path) = self
                         .handle_write_batch_error(ready_batch, error, message)
                         .await?
@@ -290,8 +349,25 @@ impl Sender {
                         invalid_metadata_tables.insert(table_path);
                     }
                 }
+                _ => self.complete_batch(ready_batch),
             }
         }
+
+        for bucket in pending_buckets {
+            if let Some(ready_batch) = records_by_bucket.remove(&bucket) {
+                if let Some(table_path) = self
+                    .handle_write_batch_error(
+                        ready_batch,
+                        FlussError::UnknownServerError,
+                        format!("Missing response for table bucket {bucket}"),
+                    )
+                    .await?
+                {
+                    invalid_metadata_tables.insert(table_path);
+                }
+            }
+        }
+
         self.update_metadata_if_needed(invalid_metadata_tables)
             .await;
         Ok(())
@@ -450,6 +526,60 @@ impl Sender {
     }
 }
 
+enum WriteRequest {
+    ProduceLog(ProduceLogRequest),
+    PutKv(PutKvRequest),
+}
+
+trait BucketResponse {
+    fn bucket_id(&self) -> i32;
+    fn error_code(&self) -> Option<i32>;
+    fn error_message(&self) -> Option<&String>;
+}
+
+impl BucketResponse for PbProduceLogRespForBucket {
+    fn bucket_id(&self) -> i32 {
+        self.bucket_id
+    }
+    fn error_code(&self) -> Option<i32> {
+        self.error_code
+    }
+    fn error_message(&self) -> Option<&String> {
+        self.error_message.as_ref()
+    }
+}
+
+impl BucketResponse for PbPutKvRespForBucket {
+    fn bucket_id(&self) -> i32 {
+        self.bucket_id
+    }
+    fn error_code(&self) -> Option<i32> {
+        self.error_code
+    }
+    fn error_message(&self) -> Option<&String> {
+        self.error_message.as_ref()
+    }
+}
+
+trait WriteResponse {
+    type BucketResp: BucketResponse;
+    fn buckets_resp(&self) -> &[Self::BucketResp];
+}
+
+impl WriteResponse for ProduceLogResponse {
+    type BucketResp = PbProduceLogRespForBucket;
+    fn buckets_resp(&self) -> &[Self::BucketResp] {
+        &self.buckets_resp
+    }
+}
+
+impl WriteResponse for PutKvResponse {
+    type BucketResp = PbPutKvRespForBucket;
+    fn buckets_resp(&self) -> &[Self::BucketResp] {
+        &self.buckets_resp
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -563,7 +693,7 @@ mod tests {
         };
 
         sender
-            .handle_produce_response(1, &request_buckets, &mut records_by_bucket, response)
+            .handle_write_response(1, &request_buckets, &mut records_by_bucket, response)
             .await?;
 
         let batch_result = handle.wait().await?;
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 4e6c8e1eaf..881a64f687 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -57,6 +57,7 @@ pub use list_offsets::*;
 pub use list_tables::*;
 pub use lookup::*;
 pub use produce_log::*;
+pub use put_kv::*;
 pub use table_exists::*;
 pub use update_metadata::*;
 

From 203093cdb46a2825fc0e743cb43eb19152f83d0c Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Wed, 21 Jan 2026 12:56:37 +0000
Subject: [PATCH 079/287] feat: Fix TableLookup so that SchemaId field bytes
 are not passed to CompactedRow::from_bytes(), these fields can be skipped as
 current rust client implementation does not check schema and already passes
 row_type (#190)

---
 fluss-rust/crates/fluss/src/client/table/lookup.rs | 9 +++++++--
 1 file changed, 7 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index cd23503a5b..4e89176a61 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -20,6 +20,7 @@ use crate::client::connection::FlussConnection;
 use crate::client::metadata::Metadata;
 use crate::error::{Error, Result};
 use crate::metadata::{RowType, TableBucket, TableInfo};
+use crate::record::kv::SCHEMA_ID_LENGTH;
 use crate::row::InternalRow;
 use crate::row::compacted::CompactedRow;
 use crate::row::encode::{KeyEncoder, KeyEncoderFactory};
@@ -64,7 +65,10 @@ impl<'a> LookupResult<'a> {
     pub fn get_single_row(&self) -> Result<Option<CompactedRow<'_>>> {
         match self.rows.len() {
             0 => Ok(None),
-            1 => Ok(Some(CompactedRow::from_bytes(self.row_type, &self.rows[0]))),
+            1 => Ok(Some(CompactedRow::from_bytes(
+                self.row_type,
+                &self.rows[0][SCHEMA_ID_LENGTH..],
+            ))),
             _ => Err(Error::UnexpectedError {
                 message: "LookupResult contains multiple rows, use get_rows() instead".to_string(),
                 source: None,
@@ -76,7 +80,8 @@ impl<'a> LookupResult<'a> {
     pub fn get_rows(&self) -> Vec<CompactedRow<'_>> {
         self.rows
             .iter()
-            .map(|bytes| CompactedRow::from_bytes(self.row_type, bytes))
+            // TODO Add schema id check and fetch when implementing prefix lookup
+            .map(|bytes| CompactedRow::from_bytes(self.row_type, &bytes[SCHEMA_ID_LENGTH..]))
             .collect()
     }
 }

From 2f3269d2c04429ef5671262225dac6b6c26f169d Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Fri, 23 Jan 2026 03:34:58 +0000
Subject: [PATCH 080/287] feat: Arrow serialization for decimal and temporal
 types (#196)

---
 .../src/client/table/log_fetch_buffer.rs      |  12 +-
 .../crates/fluss/src/client/table/scanner.rs  |   8 +-
 .../fluss/src/client/write/accumulator.rs     |   2 +-
 .../crates/fluss/src/client/write/batch.rs    |   8 +-
 fluss-rust/crates/fluss/src/record/arrow.rs   | 569 ++++++++++++++----
 fluss-rust/crates/fluss/src/row/datum.rs      | 468 +++++++++++++-
 6 files changed, 916 insertions(+), 151 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index ca0a2532c8..214a79cd7d 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -657,13 +657,13 @@ mod tests {
     use std::sync::Arc;
     use std::time::Duration;
 
-    fn test_read_context() -> ReadContext {
+    fn test_read_context() -> Result<ReadContext> {
         let row_type = RowType::new(vec![DataField::new(
             "id".to_string(),
             DataTypes::int(),
             None,
         )]);
-        ReadContext::new(to_arrow_schema(&row_type), false)
+        Ok(ReadContext::new(to_arrow_schema(&row_type)?, false))
     }
 
     struct ErrorPendingFetch {
@@ -689,7 +689,7 @@ mod tests {
 
     #[tokio::test]
     async fn await_not_empty_returns_wakeup_error() {
-        let buffer = LogFetchBuffer::new(test_read_context());
+        let buffer = LogFetchBuffer::new(test_read_context().unwrap());
         buffer.wakeup();
 
         let result = buffer.await_not_empty(Duration::from_millis(10)).await;
@@ -698,7 +698,7 @@ mod tests {
 
     #[tokio::test]
     async fn await_not_empty_returns_pending_error() {
-        let buffer = LogFetchBuffer::new(test_read_context());
+        let buffer = LogFetchBuffer::new(test_read_context().unwrap());
         let table_bucket = TableBucket::new(1, 0);
         buffer.pend(Box::new(ErrorPendingFetch {
             table_bucket: table_bucket.clone(),
@@ -728,7 +728,7 @@ mod tests {
                 compression_type: ArrowCompressionType::None,
                 compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
             },
-        );
+        )?;
 
         let mut row = GenericRow::new();
         row.set_field(0, 1_i32);
@@ -738,7 +738,7 @@ mod tests {
 
         let data = builder.build()?;
         let log_records = LogRecordsBatches::new(data.clone());
-        let read_context = ReadContext::new(to_arrow_schema(&row_type), false);
+        let read_context = ReadContext::new(to_arrow_schema(&row_type)?, false);
         let mut fetch = DefaultCompletedFetch::new(
             TableBucket::new(1, 0),
             log_records,
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index e9b2ce106d..cf0b257f00 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -470,7 +470,7 @@ impl LogFetcher {
         log_scanner_status: Arc<LogScannerStatus>,
         projected_fields: Option<Vec<usize>>,
     ) -> Result<Self> {
-        let full_arrow_schema = to_arrow_schema(table_info.get_row_type());
+        let full_arrow_schema = to_arrow_schema(table_info.get_row_type())?;
         let read_context =
             Self::create_read_context(full_arrow_schema.clone(), projected_fields.clone(), false)?;
         let remote_read_context =
@@ -1445,7 +1445,7 @@ mod tests {
                 compression_type: ArrowCompressionType::None,
                 compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
             },
-        );
+        )?;
         let record = WriteRecord::for_append(
             table_path,
             1,
@@ -1477,7 +1477,7 @@ mod tests {
 
         let data = build_records(&table_info, Arc::new(table_path))?;
         let log_records = LogRecordsBatches::new(data.clone());
-        let read_context = ReadContext::new(to_arrow_schema(table_info.get_row_type()), false);
+        let read_context = ReadContext::new(to_arrow_schema(table_info.get_row_type())?, false);
         let completed =
             DefaultCompletedFetch::new(bucket.clone(), log_records, data.len(), read_context, 0, 0);
         fetcher.log_fetch_buffer.add(Box::new(completed));
@@ -1506,7 +1506,7 @@ mod tests {
         let bucket = TableBucket::new(1, 0);
         let data = build_records(&table_info, Arc::new(table_path))?;
         let log_records = LogRecordsBatches::new(data.clone());
-        let read_context = ReadContext::new(to_arrow_schema(table_info.get_row_type()), false);
+        let read_context = ReadContext::new(to_arrow_schema(table_info.get_row_type())?, false);
         let mut completed: Box<dyn CompletedFetch> = Box::new(DefaultCompletedFetch::new(
             bucket,
             log_records,
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index fb7b54470d..46c822c1a2 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -112,7 +112,7 @@ impl RecordAccumulator {
                 bucket_id,
                 current_time_ms(),
                 matches!(&record.record, Record::Log(LogWriteRecord::RecordBatch(_))),
-            )),
+            )?),
             Record::Kv(kv_record) => Kv(KvWriteBatch::new(
                 self.batch_id.fetch_add(1, Ordering::Relaxed),
                 table_path.as_ref().clone(),
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index 159e3136e8..78381c6e76 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -197,18 +197,18 @@ impl ArrowLogWriteBatch {
         bucket_id: BucketId,
         create_ms: i64,
         to_append_record_batch: bool,
-    ) -> Self {
+    ) -> Result<Self> {
         let base = InnerWriteBatch::new(batch_id, table_path, create_ms, bucket_id);
-        Self {
+        Ok(Self {
             write_batch: base,
             arrow_builder: MemoryLogRecordsArrowBuilder::new(
                 schema_id,
                 row_type,
                 to_append_record_batch,
                 arrow_compression_info,
-            ),
+            )?,
             built_records: None,
-        }
+        })
     }
 
     pub fn batch_id(&self) -> i64 {
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 3c94b7208f..39114d3273 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -22,9 +22,12 @@ use crate::metadata::{DataType, RowType};
 use crate::record::{ChangeType, ScanRecord};
 use crate::row::{ColumnarRow, GenericRow};
 use arrow::array::{
-    ArrayBuilder, ArrayRef, BinaryBuilder, BooleanBuilder, Float32Builder, Float64Builder,
-    Int8Builder, Int16Builder, Int32Builder, Int64Builder, StringBuilder, UInt8Builder,
-    UInt16Builder, UInt32Builder, UInt64Builder,
+    ArrayBuilder, ArrayRef, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
+    Float32Builder, Float64Builder, Int8Builder, Int16Builder, Int32Builder, Int64Builder,
+    StringBuilder, Time32MillisecondBuilder, Time32SecondBuilder, Time64MicrosecondBuilder,
+    Time64NanosecondBuilder, TimestampMicrosecondBuilder, TimestampMillisecondBuilder,
+    TimestampNanosecondBuilder, TimestampSecondBuilder, UInt8Builder, UInt16Builder, UInt32Builder,
+    UInt64Builder,
 };
 use arrow::{
     array::RecordBatch,
@@ -42,7 +45,6 @@ use byteorder::WriteBytesExt;
 use byteorder::{ByteOrder, LittleEndian};
 use bytes::Bytes;
 use crc32c::crc32c;
-use parking_lot::Mutex;
 use std::{
     io::{Cursor, Write},
     sync::Arc,
@@ -113,7 +115,7 @@ pub struct MemoryLogRecordsArrowBuilder {
 }
 
 pub trait ArrowRecordBatchInnerBuilder: Send + Sync {
-    fn build_arrow_record_batch(&self) -> Result<Arc<RecordBatch>>;
+    fn build_arrow_record_batch(&mut self) -> Result<Arc<RecordBatch>>;
 
     fn append(&mut self, row: &GenericRow) -> Result<bool>;
 
@@ -133,7 +135,7 @@ pub struct PrebuiltRecordBatchBuilder {
 }
 
 impl ArrowRecordBatchInnerBuilder for PrebuiltRecordBatchBuilder {
-    fn build_arrow_record_batch(&self) -> Result<Arc<RecordBatch>> {
+    fn build_arrow_record_batch(&mut self) -> Result<Arc<RecordBatch>> {
         Ok(self.arrow_record_batch.as_ref().unwrap().clone())
     }
 
@@ -167,66 +169,132 @@ impl ArrowRecordBatchInnerBuilder for PrebuiltRecordBatchBuilder {
 
 pub struct RowAppendRecordBatchBuilder {
     table_schema: SchemaRef,
-    arrow_column_builders: Mutex<Vec<Box<dyn ArrayBuilder>>>,
+    arrow_column_builders: Vec<Box<dyn ArrayBuilder>>,
     records_count: i32,
 }
 
 impl RowAppendRecordBatchBuilder {
-    pub fn new(row_type: &RowType) -> Self {
-        let schema_ref = to_arrow_schema(row_type);
-        let builders = Mutex::new(
-            schema_ref
-                .fields()
-                .iter()
-                .map(|field| Self::create_builder(field.data_type()))
-                .collect(),
-        );
-        Self {
+    pub fn new(row_type: &RowType) -> Result<Self> {
+        let schema_ref = to_arrow_schema(row_type)?;
+        let builders: Result<Vec<_>> = schema_ref
+            .fields()
+            .iter()
+            .map(|field| Self::create_builder(field.data_type()))
+            .collect();
+        Ok(Self {
             table_schema: schema_ref.clone(),
-            arrow_column_builders: builders,
+            arrow_column_builders: builders?,
             records_count: 0,
-        }
+        })
     }
 
-    fn create_builder(data_type: &arrow_schema::DataType) -> Box<dyn ArrayBuilder> {
+    fn create_builder(data_type: &arrow_schema::DataType) -> Result<Box<dyn ArrayBuilder>> {
         match data_type {
-            arrow_schema::DataType::Int8 => Box::new(Int8Builder::new()),
-            arrow_schema::DataType::Int16 => Box::new(Int16Builder::new()),
-            arrow_schema::DataType::Int32 => Box::new(Int32Builder::new()),
-            arrow_schema::DataType::Int64 => Box::new(Int64Builder::new()),
-            arrow_schema::DataType::UInt8 => Box::new(UInt8Builder::new()),
-            arrow_schema::DataType::UInt16 => Box::new(UInt16Builder::new()),
-            arrow_schema::DataType::UInt32 => Box::new(UInt32Builder::new()),
-            arrow_schema::DataType::UInt64 => Box::new(UInt64Builder::new()),
-            arrow_schema::DataType::Float32 => Box::new(Float32Builder::new()),
-            arrow_schema::DataType::Float64 => Box::new(Float64Builder::new()),
-            arrow_schema::DataType::Boolean => Box::new(BooleanBuilder::new()),
-            arrow_schema::DataType::Utf8 => Box::new(StringBuilder::new()),
-            arrow_schema::DataType::Binary => Box::new(BinaryBuilder::new()),
-            dt => panic!("Unsupported data type: {dt:?}"),
+            arrow_schema::DataType::Int8 => Ok(Box::new(Int8Builder::new())),
+            arrow_schema::DataType::Int16 => Ok(Box::new(Int16Builder::new())),
+            arrow_schema::DataType::Int32 => Ok(Box::new(Int32Builder::new())),
+            arrow_schema::DataType::Int64 => Ok(Box::new(Int64Builder::new())),
+            arrow_schema::DataType::UInt8 => Ok(Box::new(UInt8Builder::new())),
+            arrow_schema::DataType::UInt16 => Ok(Box::new(UInt16Builder::new())),
+            arrow_schema::DataType::UInt32 => Ok(Box::new(UInt32Builder::new())),
+            arrow_schema::DataType::UInt64 => Ok(Box::new(UInt64Builder::new())),
+            arrow_schema::DataType::Float32 => Ok(Box::new(Float32Builder::new())),
+            arrow_schema::DataType::Float64 => Ok(Box::new(Float64Builder::new())),
+            arrow_schema::DataType::Boolean => Ok(Box::new(BooleanBuilder::new())),
+            arrow_schema::DataType::Utf8 => Ok(Box::new(StringBuilder::new())),
+            arrow_schema::DataType::Binary => Ok(Box::new(BinaryBuilder::new())),
+            arrow_schema::DataType::Decimal128(precision, scale) => {
+                let builder = Decimal128Builder::new()
+                    .with_precision_and_scale(*precision, *scale)
+                    .map_err(|e| Error::IllegalArgument {
+                        message: format!(
+                            "Invalid decimal precision {} or scale {}: {}",
+                            precision, scale, e
+                        ),
+                    })?;
+                Ok(Box::new(builder))
+            }
+            arrow_schema::DataType::Date32 => Ok(Box::new(Date32Builder::new())),
+            arrow_schema::DataType::Time32(unit) => match unit {
+                arrow_schema::TimeUnit::Second => Ok(Box::new(Time32SecondBuilder::new())),
+                arrow_schema::TimeUnit::Millisecond => {
+                    Ok(Box::new(Time32MillisecondBuilder::new()))
+                }
+                _ => Err(Error::IllegalArgument {
+                    message: format!(
+                        "Time32 only supports Second and Millisecond units, got: {:?}",
+                        unit
+                    ),
+                }),
+            },
+            arrow_schema::DataType::Time64(unit) => match unit {
+                arrow_schema::TimeUnit::Microsecond => {
+                    Ok(Box::new(Time64MicrosecondBuilder::new()))
+                }
+                arrow_schema::TimeUnit::Nanosecond => Ok(Box::new(Time64NanosecondBuilder::new())),
+                _ => Err(Error::IllegalArgument {
+                    message: format!(
+                        "Time64 only supports Microsecond and Nanosecond units, got: {:?}",
+                        unit
+                    ),
+                }),
+            },
+            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Second, _) => {
+                Ok(Box::new(TimestampSecondBuilder::new()))
+            }
+            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Millisecond, _) => {
+                Ok(Box::new(TimestampMillisecondBuilder::new()))
+            }
+            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Microsecond, _) => {
+                Ok(Box::new(TimestampMicrosecondBuilder::new()))
+            }
+            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, _) => {
+                Ok(Box::new(TimestampNanosecondBuilder::new()))
+            }
+            dt => Err(Error::IllegalArgument {
+                message: format!("Unsupported data type: {dt:?}"),
+            }),
         }
     }
 }
 
 impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
-    fn build_arrow_record_batch(&self) -> Result<Arc<RecordBatch>> {
-        let arrays = self
+    fn build_arrow_record_batch(&mut self) -> Result<Arc<RecordBatch>> {
+        let arrays: Result<Vec<ArrayRef>> = self
             .arrow_column_builders
-            .lock()
             .iter_mut()
-            .map(|b| b.finish())
-            .collect::<Vec<ArrayRef>>();
+            .enumerate()
+            .map(|(idx, b)| {
+                let array = b.finish();
+                let expected_type = self.table_schema.field(idx).data_type();
+
+                // Validate array type matches schema
+                if array.data_type() != expected_type {
+                    return Err(Error::IllegalArgument {
+                        message: format!(
+                            "Builder type mismatch at column {}: expected {:?}, got {:?}",
+                            idx,
+                            expected_type,
+                            array.data_type()
+                        ),
+                    });
+                }
+
+                Ok(array)
+            })
+            .collect();
+
         Ok(Arc::new(RecordBatch::try_new(
             self.table_schema.clone(),
-            arrays,
+            arrays?,
         )?))
     }
 
     fn append(&mut self, row: &GenericRow) -> Result<bool> {
         for (idx, value) in row.values.iter().enumerate() {
-            let mut builder_binding = self.arrow_column_builders.lock();
-            let builder = builder_binding.get_mut(idx).unwrap();
-            value.append_to(builder.as_mut())?;
+            let field_type = self.table_schema.field(idx).data_type();
+            let builder = self.arrow_column_builders.get_mut(idx).unwrap();
+            value.append_to(builder.as_mut(), field_type)?;
         }
         self.records_count += 1;
         Ok(true)
@@ -255,15 +323,15 @@ impl MemoryLogRecordsArrowBuilder {
         row_type: &RowType,
         to_append_record_batch: bool,
         arrow_compression_info: ArrowCompressionInfo,
-    ) -> Self {
+    ) -> Result<Self> {
         let arrow_batch_builder: Box<dyn ArrowRecordBatchInnerBuilder> = {
             if to_append_record_batch {
                 Box::new(PrebuiltRecordBatchBuilder::default())
             } else {
-                Box::new(RowAppendRecordBatchBuilder::new(row_type))
+                Box::new(RowAppendRecordBatchBuilder::new(row_type)?)
             }
         };
-        MemoryLogRecordsArrowBuilder {
+        Ok(MemoryLogRecordsArrowBuilder {
             base_log_offset: BUILDER_DEFAULT_OFFSET,
             schema_id,
             magic: CURRENT_LOG_MAGIC_VALUE,
@@ -272,7 +340,7 @@ impl MemoryLogRecordsArrowBuilder {
             is_closed: false,
             arrow_record_batch_builder: arrow_batch_builder,
             arrow_compression_info,
-        }
+        })
     }
 
     pub fn append(&mut self, record: &WriteRecord) -> Result<bool> {
@@ -302,7 +370,7 @@ impl MemoryLogRecordsArrowBuilder {
         self.is_closed = true;
     }
 
-    pub fn build(&self) -> Result<Vec<u8>> {
+    pub fn build(&mut self) -> Result<Vec<u8>> {
         // serialize arrow batch
         let mut arrow_batch_bytes = vec![];
         let table_schema = self.arrow_record_batch_builder.schema();
@@ -641,24 +709,24 @@ fn parse_ipc_message(
     Ok((batch_metadata, body_buffer, message.version()))
 }
 
-pub fn to_arrow_schema(fluss_schema: &RowType) -> SchemaRef {
-    let fields: Vec<Field> = fluss_schema
+pub fn to_arrow_schema(fluss_schema: &RowType) -> Result<SchemaRef> {
+    let fields: Result<Vec<Field>> = fluss_schema
         .fields()
         .iter()
         .map(|f| {
-            Field::new(
+            Ok(Field::new(
                 f.name(),
-                to_arrow_type(f.data_type()),
+                to_arrow_type(f.data_type())?,
                 f.data_type().is_nullable(),
-            )
+            ))
         })
         .collect();
 
-    SchemaRef::new(arrow_schema::Schema::new(fields))
+    Ok(SchemaRef::new(arrow_schema::Schema::new(fields?)))
 }
 
-pub fn to_arrow_type(fluss_type: &DataType) -> ArrowDataType {
-    match fluss_type {
+pub fn to_arrow_type(fluss_type: &DataType) -> Result<ArrowDataType> {
+    Ok(match fluss_type {
         DataType::Boolean(_) => ArrowDataType::Boolean,
         DataType::TinyInt(_) => ArrowDataType::Int8,
         DataType::SmallInt(_) => ArrowDataType::Int16,
@@ -668,58 +736,91 @@ pub fn to_arrow_type(fluss_type: &DataType) -> ArrowDataType {
         DataType::Double(_) => ArrowDataType::Float64,
         DataType::Char(_) => ArrowDataType::Utf8,
         DataType::String(_) => ArrowDataType::Utf8,
-        DataType::Decimal(decimal_type) => ArrowDataType::Decimal128(
-            decimal_type
-                .precision()
-                .try_into()
-                .expect("precision exceeds u8::MAX"),
-            decimal_type
+        DataType::Decimal(decimal_type) => {
+            let precision =
+                decimal_type
+                    .precision()
+                    .try_into()
+                    .map_err(|_| Error::IllegalArgument {
+                        message: format!(
+                            "Decimal precision {} exceeds Arrow's maximum (u8::MAX)",
+                            decimal_type.precision()
+                        ),
+                    })?;
+            let scale = decimal_type
                 .scale()
                 .try_into()
-                .expect("scale exceeds i8::MAX"),
-        ),
+                .map_err(|_| Error::IllegalArgument {
+                    message: format!(
+                        "Decimal scale {} exceeds Arrow's maximum (i8::MAX)",
+                        decimal_type.scale()
+                    ),
+                })?;
+            ArrowDataType::Decimal128(precision, scale)
+        }
         DataType::Date(_) => ArrowDataType::Date32,
         DataType::Time(time_type) => match time_type.precision() {
             0 => ArrowDataType::Time32(arrow_schema::TimeUnit::Second),
             1..=3 => ArrowDataType::Time32(arrow_schema::TimeUnit::Millisecond),
             4..=6 => ArrowDataType::Time64(arrow_schema::TimeUnit::Microsecond),
             7..=9 => ArrowDataType::Time64(arrow_schema::TimeUnit::Nanosecond),
-            // This arm should never be reached due to validation in TimeType.
-            invalid => panic!("Invalid precision value for TimeType: {invalid}"),
+            invalid => {
+                return Err(Error::IllegalArgument {
+                    message: format!("Invalid precision {} for TimeType (must be 0-9)", invalid),
+                });
+            }
         },
         DataType::Timestamp(timestamp_type) => match timestamp_type.precision() {
             0 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, None),
             1..=3 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, None),
             4..=6 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, None),
             7..=9 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, None),
-            // This arm should never be reached due to validation in Timestamp.
-            invalid => panic!("Invalid precision value for TimestampType: {invalid}"),
+            invalid => {
+                return Err(Error::IllegalArgument {
+                    message: format!(
+                        "Invalid precision {} for TimestampType (must be 0-9)",
+                        invalid
+                    ),
+                });
+            }
         },
         DataType::TimestampLTz(timestamp_ltz_type) => match timestamp_ltz_type.precision() {
             0 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, None),
             1..=3 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, None),
             4..=6 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, None),
             7..=9 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, None),
-            // This arm should never be reached due to validation in TimestampLTz.
-            invalid => panic!("Invalid precision value for TimestampLTzType: {invalid}"),
+            invalid => {
+                return Err(Error::IllegalArgument {
+                    message: format!(
+                        "Invalid precision {} for TimestampLTzType (must be 0-9)",
+                        invalid
+                    ),
+                });
+            }
         },
         DataType::Bytes(_) => ArrowDataType::Binary,
-        DataType::Binary(binary_type) => ArrowDataType::FixedSizeBinary(
-            binary_type
+        DataType::Binary(binary_type) => {
+            let length = binary_type
                 .length()
                 .try_into()
-                .expect("length exceeds i32::MAX"),
-        ),
+                .map_err(|_| Error::IllegalArgument {
+                    message: format!(
+                        "Binary length {} exceeds Arrow's maximum (i32::MAX)",
+                        binary_type.length()
+                    ),
+                })?;
+            ArrowDataType::FixedSizeBinary(length)
+        }
         DataType::Array(array_type) => ArrowDataType::List(
             Field::new_list_field(
-                to_arrow_type(array_type.get_element_type()),
+                to_arrow_type(array_type.get_element_type())?,
                 fluss_type.is_nullable(),
             )
             .into(),
         ),
         DataType::Map(map_type) => {
-            let key_type = to_arrow_type(map_type.key_type());
-            let value_type = to_arrow_type(map_type.value_type());
+            let key_type = to_arrow_type(map_type.key_type())?;
+            let value_type = to_arrow_type(map_type.value_type())?;
             let entry_fields = vec![
                 Field::new("key", key_type, map_type.key_type().is_nullable()),
                 Field::new("value", value_type, map_type.value_type().is_nullable()),
@@ -733,20 +834,21 @@ pub fn to_arrow_type(fluss_type: &DataType) -> ArrowDataType {
                 false,
             )
         }
-        DataType::Row(row_type) => ArrowDataType::Struct(arrow_schema::Fields::from(
-            row_type
+        DataType::Row(row_type) => {
+            let fields: Result<Vec<Field>> = row_type
                 .fields()
                 .iter()
                 .map(|f| {
-                    Field::new(
+                    Ok(Field::new(
                         f.name(),
-                        to_arrow_type(f.data_type()),
+                        to_arrow_type(f.data_type())?,
                         f.data_type().is_nullable(),
-                    )
+                    ))
                 })
-                .collect::<Vec<Field>>(),
-        )),
-    }
+                .collect();
+            ArrowDataType::Struct(arrow_schema::Fields::from(fields?))
+        }
+    })
 }
 
 #[derive(Clone)]
@@ -1059,81 +1161,114 @@ mod tests {
 
     #[test]
     fn test_to_array_type() {
-        assert_eq!(to_arrow_type(&DataTypes::boolean()), ArrowDataType::Boolean);
-        assert_eq!(to_arrow_type(&DataTypes::tinyint()), ArrowDataType::Int8);
-        assert_eq!(to_arrow_type(&DataTypes::smallint()), ArrowDataType::Int16);
-        assert_eq!(to_arrow_type(&DataTypes::bigint()), ArrowDataType::Int64);
-        assert_eq!(to_arrow_type(&DataTypes::int()), ArrowDataType::Int32);
-        assert_eq!(to_arrow_type(&DataTypes::float()), ArrowDataType::Float32);
-        assert_eq!(to_arrow_type(&DataTypes::double()), ArrowDataType::Float64);
-        assert_eq!(to_arrow_type(&DataTypes::char(16)), ArrowDataType::Utf8);
-        assert_eq!(to_arrow_type(&DataTypes::string()), ArrowDataType::Utf8);
         assert_eq!(
-            to_arrow_type(&DataTypes::decimal(10, 2)),
+            to_arrow_type(&DataTypes::boolean()).unwrap(),
+            ArrowDataType::Boolean
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::tinyint()).unwrap(),
+            ArrowDataType::Int8
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::smallint()).unwrap(),
+            ArrowDataType::Int16
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::bigint()).unwrap(),
+            ArrowDataType::Int64
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::int()).unwrap(),
+            ArrowDataType::Int32
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::float()).unwrap(),
+            ArrowDataType::Float32
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::double()).unwrap(),
+            ArrowDataType::Float64
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::char(16)).unwrap(),
+            ArrowDataType::Utf8
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::string()).unwrap(),
+            ArrowDataType::Utf8
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::decimal(10, 2)).unwrap(),
             ArrowDataType::Decimal128(10, 2)
         );
-        assert_eq!(to_arrow_type(&DataTypes::date()), ArrowDataType::Date32);
         assert_eq!(
-            to_arrow_type(&DataTypes::time()),
+            to_arrow_type(&DataTypes::date()).unwrap(),
+            ArrowDataType::Date32
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::time()).unwrap(),
             ArrowDataType::Time32(arrow_schema::TimeUnit::Second)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::time_with_precision(3)),
+            to_arrow_type(&DataTypes::time_with_precision(3)).unwrap(),
             ArrowDataType::Time32(arrow_schema::TimeUnit::Millisecond)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::time_with_precision(6)),
+            to_arrow_type(&DataTypes::time_with_precision(6)).unwrap(),
             ArrowDataType::Time64(arrow_schema::TimeUnit::Microsecond)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::time_with_precision(9)),
+            to_arrow_type(&DataTypes::time_with_precision(9)).unwrap(),
             ArrowDataType::Time64(arrow_schema::TimeUnit::Nanosecond)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::timestamp_with_precision(0)),
+            to_arrow_type(&DataTypes::timestamp_with_precision(0)).unwrap(),
             ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, None)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::timestamp_with_precision(3)),
+            to_arrow_type(&DataTypes::timestamp_with_precision(3)).unwrap(),
             ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, None)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::timestamp_with_precision(6)),
+            to_arrow_type(&DataTypes::timestamp_with_precision(6)).unwrap(),
             ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, None)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::timestamp_with_precision(9)),
+            to_arrow_type(&DataTypes::timestamp_with_precision(9)).unwrap(),
             ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, None)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(0)),
+            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(0)).unwrap(),
             ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, None)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(3)),
+            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(3)).unwrap(),
             ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, None)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(6)),
+            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(6)).unwrap(),
             ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, None)
         );
         assert_eq!(
-            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(9)),
+            to_arrow_type(&DataTypes::timestamp_ltz_with_precision(9)).unwrap(),
             ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, None)
         );
-        assert_eq!(to_arrow_type(&DataTypes::bytes()), ArrowDataType::Binary);
         assert_eq!(
-            to_arrow_type(&DataTypes::binary(16)),
+            to_arrow_type(&DataTypes::bytes()).unwrap(),
+            ArrowDataType::Binary
+        );
+        assert_eq!(
+            to_arrow_type(&DataTypes::binary(16)).unwrap(),
             ArrowDataType::FixedSizeBinary(16)
         );
 
         assert_eq!(
-            to_arrow_type(&DataTypes::array(DataTypes::int())),
+            to_arrow_type(&DataTypes::array(DataTypes::int())).unwrap(),
             ArrowDataType::List(Field::new_list_field(ArrowDataType::Int32, true).into())
         );
 
         assert_eq!(
-            to_arrow_type(&DataTypes::map(DataTypes::string(), DataTypes::int())),
+            to_arrow_type(&DataTypes::map(DataTypes::string(), DataTypes::int())).unwrap(),
             ArrowDataType::Map(
                 Arc::new(Field::new(
                     "entries",
@@ -1151,7 +1286,8 @@ mod tests {
             to_arrow_type(&DataTypes::row(vec![
                 DataTypes::field("f1".to_string(), DataTypes::int()),
                 DataTypes::field("f2".to_string(), DataTypes::string()),
-            ])),
+            ]))
+            .unwrap(),
             ArrowDataType::Struct(arrow_schema::Fields::from(vec![
                 Field::new("f1", ArrowDataType::Int32, true),
                 Field::new("f2", ArrowDataType::Utf8, true),
@@ -1215,7 +1351,7 @@ mod tests {
             DataField::new("id".to_string(), DataTypes::int(), None),
             DataField::new("name".to_string(), DataTypes::string(), None),
         ]);
-        let schema = to_arrow_schema(&row_type);
+        let schema = to_arrow_schema(&row_type).unwrap();
         let result = ReadContext::with_projection_pushdown(schema, vec![0, 2], false);
 
         assert!(matches!(result, Err(IllegalArgument { .. })));
@@ -1249,4 +1385,209 @@ mod tests {
         }
         out
     }
+
+    #[test]
+    fn test_temporal_and_decimal_builder_validation() {
+        use arrow::array::Array;
+
+        // Valid case: a Decimal128(10, 2) Arrow type must yield a Decimal128Builder
+        let mut builder =
+            RowAppendRecordBatchBuilder::create_builder(&ArrowDataType::Decimal128(10, 2)).unwrap();
+        let decimal_builder = builder
+            .as_any_mut()
+            .downcast_mut::<Decimal128Builder>()
+            .expect("Expected Decimal128Builder");
+        // The finished (empty) array must carry the requested precision and scale
+        let array = decimal_builder.finish();
+        assert_eq!(array.data_type(), &ArrowDataType::Decimal128(10, 2));
+
+        // Error case: Decimal128(100, 50) must be rejected (Arrow caps Decimal128 precision at 38)
+        let result =
+            RowAppendRecordBatchBuilder::create_builder(&ArrowDataType::Decimal128(100, 50));
+        assert!(result.is_err());
+    }
+
+    #[test]
+    fn test_decimal_rescaling_and_validation() -> Result<()> {
+        use crate::row::{Datum, Decimal, GenericRow};
+        use arrow::array::Decimal128Array;
+        use bigdecimal::BigDecimal;
+        use std::str::FromStr;
+
+        // Test 1: a scale-3 value appended to a decimal(10, 2) column is rescaled to scale 2
+        let row_type = RowType::new(vec![DataField::new(
+            "amount".to_string(),
+            DataTypes::decimal(10, 2),
+            None,
+        )]);
+        let mut builder = RowAppendRecordBatchBuilder::new(&row_type)?;
+        let decimal = Decimal::from_big_decimal(BigDecimal::from_str("123.456").unwrap(), 10, 3)?;
+        builder.append(&GenericRow {
+            values: vec![Datum::Decimal(decimal)],
+        })?;
+        let batch = builder.build_arrow_record_batch()?;
+        let array = batch
+            .column(0)
+            .as_any()
+            .downcast_ref::<Decimal128Array>()
+            .unwrap();
+        assert_eq!(array.value(0), 12346); // 123.456 rounds to 123.46, i.e. unscaled 12346
+        assert_eq!(array.scale(), 2);
+
+        // Test 2: 123456.78 has 8 digits, more than decimal(5, 2) allows (should error)
+        let row_type = RowType::new(vec![DataField::new(
+            "amount".to_string(),
+            DataTypes::decimal(5, 2),
+            None,
+        )]);
+        let mut builder = RowAppendRecordBatchBuilder::new(&row_type)?;
+        let decimal = Decimal::from_big_decimal(BigDecimal::from_str("123456.78").unwrap(), 10, 2)?;
+        let result = builder.append(&GenericRow {
+            values: vec![Datum::Decimal(decimal)],
+        });
+        assert!(result.is_err());
+        assert!(
+            result
+                .unwrap_err()
+                .to_string()
+                .contains("precision overflow")
+        );
+
+        Ok(())
+    }
+
+    #[test]
+    fn test_all_types_end_to_end() -> Result<()> {
+        use crate::row::{Date, Datum, Decimal, GenericRow, Time, TimestampLtz, TimestampNtz};
+        use arrow::array::{
+            Date32Array, Decimal128Array, Int32Array, Time32MillisecondArray,
+            Time64NanosecondArray, TimestampMicrosecondArray, TimestampNanosecondArray,
+        };
+        use bigdecimal::BigDecimal;
+        use std::str::FromStr;
+
+        // Schema with int, decimal, date, time (ms + ns), timestamps (μs + ns)
+        let row_type = RowType::new(vec![
+            DataField::new("id".to_string(), DataTypes::int(), None),
+            DataField::new("amount".to_string(), DataTypes::decimal(10, 2), None),
+            DataField::new("date".to_string(), DataTypes::date(), None),
+            DataField::new(
+                "time_ms".to_string(),
+                DataTypes::time_with_precision(3),
+                None,
+            ),
+            DataField::new(
+                "time_ns".to_string(),
+                DataTypes::time_with_precision(9),
+                None,
+            ),
+            DataField::new(
+                "ts_us".to_string(),
+                DataTypes::timestamp_with_precision(6),
+                None,
+            ),
+            DataField::new(
+                "ts_ltz_ns".to_string(),
+                DataTypes::timestamp_ltz_with_precision(9),
+                None,
+            ),
+        ]);
+
+        let mut builder = RowAppendRecordBatchBuilder::new(&row_type)?;
+
+        // Append a single row with one value per column, in schema order
+        builder.append(&GenericRow {
+            values: vec![
+                Datum::Int32(1),
+                Datum::Decimal(Decimal::from_big_decimal(
+                    BigDecimal::from_str("123.456").unwrap(),
+                    10,
+                    3,
+                )?),
+                // 18000 days since epoch = 2019-04-14
+                Datum::Date(Date::new(18000)),
+                // 43200000 ms = 12:00:00.000 (noon)
+                Datum::Time(Time::new(43200000)),
+                // 12345 ms = 00:00:12.345
+                Datum::Time(Time::new(12345)),
+                // 1609459200000 ms = 2021-01-01 00:00:00 UTC, with 123456 additional nanoseconds
+                Datum::TimestampNtz(TimestampNtz::from_millis_nanos(1609459200000, 123456)?),
+                // 1609459200000 ms = 2021-01-01 00:00:00 UTC, with 987654 additional nanoseconds
+                Datum::TimestampLtz(TimestampLtz::from_millis_nanos(1609459200000, 987654)?),
+            ],
+        })?;
+
+        let batch = builder.build_arrow_record_batch()?;
+
+        // Verify the Arrow value of each column for row 0
+        assert_eq!(
+            batch
+                .column(0)
+                .as_any()
+                .downcast_ref::<Int32Array>()
+                .unwrap()
+                .value(0),
+            1
+        );
+
+        let dec = batch
+            .column(1)
+            .as_any()
+            .downcast_ref::<Decimal128Array>()
+            .unwrap();
+        assert_eq!(dec.value(0), 12346); // 123.456 rounds to 123.46, i.e. unscaled 12346
+
+        assert_eq!(
+            batch
+                .column(2)
+                .as_any()
+                .downcast_ref::<Date32Array>()
+                .unwrap()
+                .value(0),
+            18000
+        );
+
+        assert_eq!(
+            batch
+                .column(3)
+                .as_any()
+                .downcast_ref::<Time32MillisecondArray>()
+                .unwrap()
+                .value(0),
+            43200000
+        );
+
+        assert_eq!(
+            batch
+                .column(4)
+                .as_any()
+                .downcast_ref::<Time64NanosecondArray>()
+                .unwrap()
+                .value(0),
+            12345000000
+        );
+
+        // Timestamps: the us column truncates 123456 ns to 123 us; the ns column keeps 987654 ns
+        assert_eq!(
+            batch
+                .column(5)
+                .as_any()
+                .downcast_ref::<TimestampMicrosecondArray>()
+                .unwrap()
+                .value(0),
+            1609459200000123
+        );
+
+        assert_eq!(
+            batch
+                .column(6)
+                .as_any()
+                .downcast_ref::<TimestampNanosecondArray>()
+                .unwrap()
+                .value(0),
+            1609459200000987654
+        );
+
+        Ok(())
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 5b21b3899b..7b3850f880 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -19,9 +19,13 @@ use crate::error::Error::RowConvertError;
 use crate::error::Result;
 use crate::row::Decimal;
 use arrow::array::{
-    ArrayBuilder, BinaryBuilder, BooleanBuilder, Float32Builder, Float64Builder, Int8Builder,
-    Int16Builder, Int32Builder, Int64Builder, StringBuilder,
+    ArrayBuilder, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder, Float32Builder,
+    Float64Builder, Int8Builder, Int16Builder, Int32Builder, Int64Builder, StringBuilder,
+    Time32MillisecondBuilder, Time32SecondBuilder, Time64MicrosecondBuilder,
+    Time64NanosecondBuilder, TimestampMicrosecondBuilder, TimestampMillisecondBuilder,
+    TimestampNanosecondBuilder, TimestampSecondBuilder,
 };
+use arrow::datatypes as arrow_schema;
 use jiff::ToSpan;
 use ordered_float::OrderedFloat;
 use parse_display::Display;
@@ -83,6 +87,41 @@ impl Datum<'_> {
             _ => panic!("not a blob: {self:?}"),
         }
     }
+
+    pub fn as_decimal(&self) -> &Decimal {
+        match self {
+            Self::Decimal(d) => d, // borrowed, not cloned
+            _ => panic!("not a decimal: {self:?}"), // panics for every other variant
+        }
+    }
+
+    pub fn as_date(&self) -> Date {
+        match self {
+            Self::Date(d) => *d, // returned by value
+            _ => panic!("not a date: {self:?}"), // panics for every other variant
+        }
+    }
+
+    pub fn as_time(&self) -> Time {
+        match self {
+            Self::Time(t) => *t, // returned by value
+            _ => panic!("not a time: {self:?}"), // panics for every other variant
+        }
+    }
+
+    pub fn as_timestamp_ntz(&self) -> TimestampNtz {
+        match self {
+            Self::TimestampNtz(ts) => *ts, // returned by value
+            _ => panic!("not a timestamp ntz: {self:?}"), // panics for every other variant
+        }
+    }
+
+    pub fn as_timestamp_ltz(&self) -> TimestampLtz {
+        match self {
+            Self::TimestampLtz(ts) => *ts, // returned by value
+            _ => panic!("not a timestamp ltz: {self:?}"), // panics for every other variant
+        }
+    }
 }
 
 // ----------- implement from
@@ -246,6 +285,66 @@ impl TryFrom<&Datum<'_>> for i8 {
     }
 }
 
+impl TryFrom<&Datum<'_>> for Decimal {
+    type Error = (); // unit error: a variant mismatch carries no detail
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::Decimal(d) => Ok(d.clone()), // cloned out of the borrowed datum
+            _ => Err(()), // every other variant is rejected
+        }
+    }
+}
+
+impl TryFrom<&Datum<'_>> for Date {
+    type Error = (); // unit error: a variant mismatch carries no detail
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::Date(d) => Ok(*d), // returned by value
+            _ => Err(()), // every other variant is rejected
+        }
+    }
+}
+
+impl TryFrom<&Datum<'_>> for Time {
+    type Error = (); // unit error: a variant mismatch carries no detail
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::Time(t) => Ok(*t), // returned by value
+            _ => Err(()), // every other variant is rejected
+        }
+    }
+}
+
+impl TryFrom<&Datum<'_>> for TimestampNtz {
+    type Error = (); // unit error: a variant mismatch carries no detail
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::TimestampNtz(ts) => Ok(*ts), // returned by value
+            _ => Err(()), // every other variant (TimestampLtz included) is rejected
+        }
+    }
+}
+
+impl TryFrom<&Datum<'_>> for TimestampLtz {
+    type Error = (); // unit error: a variant mismatch carries no detail
+
+    #[inline]
+    fn try_from(from: &Datum) -> std::result::Result<Self, Self::Error> {
+        match from {
+            Datum::TimestampLtz(ts) => Ok(*ts), // returned by value
+            _ => Err(()), // every other variant (TimestampNtz included) is rejected
+        }
+    }
+}
+
 impl<'a> From<bool> for Datum<'a> {
     #[inline]
     fn from(b: bool) -> Datum<'a> {
@@ -253,12 +352,103 @@ impl<'a> From<bool> for Datum<'a> {
     }
 }
 
+impl<'a> From<Decimal> for Datum<'a> {
+    #[inline]
+    fn from(d: Decimal) -> Datum<'a> {
+        Datum::Decimal(d) // moves the decimal into the variant as-is
+    }
+}
+
+impl<'a> From<Date> for Datum<'a> {
+    #[inline]
+    fn from(d: Date) -> Datum<'a> {
+        Datum::Date(d) // wraps the date as-is
+    }
+}
+
+impl<'a> From<Time> for Datum<'a> {
+    #[inline]
+    fn from(t: Time) -> Datum<'a> {
+        Datum::Time(t) // wraps the time as-is
+    }
+}
+
+impl<'a> From<TimestampNtz> for Datum<'a> {
+    #[inline]
+    fn from(ts: TimestampNtz) -> Datum<'a> {
+        Datum::TimestampNtz(ts) // wraps the timestamp as-is
+    }
+}
+
+impl<'a> From<TimestampLtz> for Datum<'a> {
+    #[inline]
+    fn from(ts: TimestampLtz) -> Datum<'a> {
+        Datum::TimestampLtz(ts) // wraps the timestamp as-is
+    }
+}
+
 pub trait ToArrow {
-    fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()>;
+    fn append_to(
+        &self,
+        builder: &mut dyn ArrayBuilder, // target builder; implementors downcast it
+        data_type: &arrow_schema::DataType, // Arrow type passed alongside `builder`
+    ) -> Result<()>;
+}
+
+// Time unit conversion factors (declared as i64; Time code casts MILLIS_PER_SECOND to i32)
+const MILLIS_PER_SECOND: i64 = 1_000;
+const MICROS_PER_MILLI: i64 = 1_000; // also reused as the nanos-to-micros divisor
+const NANOS_PER_MILLI: i64 = 1_000_000;
+
+/// Converts milliseconds and nanoseconds-within-millisecond to total microseconds.
+/// Nanoseconds below one microsecond are truncated. Returns an error on i64 overflow.
+fn millis_nanos_to_micros(millis: i64, nanos: i32) -> Result<i64> {
+    let millis_micros = millis
+        .checked_mul(MICROS_PER_MILLI)
+        .ok_or_else(|| RowConvertError {
+            message: format!(
+                "Timestamp milliseconds {} overflows when converting to microseconds",
+                millis
+            ),
+        })?;
+    let nanos_micros = (nanos as i64) / MICROS_PER_MILLI; // ns -> us: the divisor's value is 1_000
+    millis_micros
+        .checked_add(nanos_micros)
+        .ok_or_else(|| RowConvertError {
+            message: format!(
+                "Timestamp overflow when adding microseconds: {} + {}",
+                millis_micros, nanos_micros
+            ),
+        })
+}
+
+/// Converts milliseconds and nanoseconds-within-millisecond to total nanoseconds.
+/// Returns an error if either the multiplication or the addition overflows i64.
+fn millis_nanos_to_nanos(millis: i64, nanos: i32) -> Result<i64> {
+    let millis_nanos = millis
+        .checked_mul(NANOS_PER_MILLI)
+        .ok_or_else(|| RowConvertError {
+            message: format!(
+                "Timestamp milliseconds {} overflows when converting to nanoseconds",
+                millis
+            ),
+        })?;
+    millis_nanos
+        .checked_add(nanos as i64)
+        .ok_or_else(|| RowConvertError {
+            message: format!(
+                "Timestamp overflow when adding nanoseconds: {} + {}",
+                millis_nanos, nanos
+            ),
+        })
 }
 
 impl Datum<'_> {
-    pub fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()> {
+    pub fn append_to(
+        &self,
+        builder: &mut dyn ArrayBuilder,
+        data_type: &arrow_schema::DataType,
+    ) -> Result<()> {
         macro_rules! append_null_to_arrow {
             ($builder_type:ty) => {
                 if let Some(b) = builder.as_any_mut().downcast_mut::<$builder_type>() {
@@ -288,6 +478,16 @@ impl Datum<'_> {
                 append_null_to_arrow!(Float64Builder);
                 append_null_to_arrow!(StringBuilder);
                 append_null_to_arrow!(BinaryBuilder);
+                append_null_to_arrow!(Decimal128Builder);
+                append_null_to_arrow!(Date32Builder);
+                append_null_to_arrow!(Time32SecondBuilder);
+                append_null_to_arrow!(Time32MillisecondBuilder);
+                append_null_to_arrow!(Time64MicrosecondBuilder);
+                append_null_to_arrow!(Time64NanosecondBuilder);
+                append_null_to_arrow!(TimestampSecondBuilder);
+                append_null_to_arrow!(TimestampMillisecondBuilder);
+                append_null_to_arrow!(TimestampMicrosecondBuilder);
+                append_null_to_arrow!(TimestampNanosecondBuilder);
             }
             Datum::Bool(v) => append_value_to_arrow!(BooleanBuilder, *v),
             Datum::Int8(v) => append_value_to_arrow!(Int8Builder, *v),
@@ -298,16 +498,221 @@ impl Datum<'_> {
             Datum::Float64(v) => append_value_to_arrow!(Float64Builder, v.into_inner()),
             Datum::String(v) => append_value_to_arrow!(StringBuilder, v.as_ref()),
             Datum::Blob(v) => append_value_to_arrow!(BinaryBuilder, v.as_ref()),
-            Datum::Decimal(_)
-            | Datum::Date(_)
-            | Datum::Time(_)
-            | Datum::TimestampNtz(_)
-            | Datum::TimestampLtz(_) => {
+            Datum::Decimal(decimal) => {
+                // Extract target precision and scale from Arrow schema
+                let (p, s) = match data_type {
+                    arrow_schema::DataType::Decimal128(p, s) => (*p, *s),
+                    _ => {
+                        return Err(RowConvertError {
+                            message: format!(
+                                "Expected Decimal128 Arrow type, got: {:?}",
+                                data_type
+                            ),
+                        });
+                    }
+                };
+
+                // Validate scale is non-negative (Fluss doesn't support negative scales)
+                if s < 0 {
+                    return Err(RowConvertError {
+                        message: format!("Negative decimal scale {} is not supported", s),
+                    });
+                }
+
+                let target_precision = p as u32;
+                let target_scale = s as i64; // Safe now: 0..127 → 0i64..127i64
+
+                if let Some(b) = builder.as_any_mut().downcast_mut::<Decimal128Builder>() {
+                    use bigdecimal::RoundingMode;
+
+                    // Rescale the decimal to match Arrow's target scale
+                    let bd = decimal.to_big_decimal();
+                    let rescaled = bd.with_scale_round(target_scale, RoundingMode::HalfUp);
+                    let (unscaled, _) = rescaled.as_bigint_and_exponent();
+
+                    // Validate precision
+                    let actual_precision = Decimal::compute_precision(&unscaled);
+                    if actual_precision > target_precision as usize {
+                        return Err(RowConvertError {
+                            message: format!(
+                                "Decimal precision overflow: value has {} digits but Arrow expects {} (value: {})",
+                                actual_precision, target_precision, rescaled
+                            ),
+                        });
+                    }
+
+                    // Convert to i128 for Arrow
+                    let i128_val: i128 = match unscaled.try_into() {
+                        Ok(v) => v,
+                        Err(_) => {
+                            return Err(RowConvertError {
+                                message: format!("Decimal value exceeds i128 range: {}", rescaled),
+                            });
+                        }
+                    };
+
+                    b.append_value(i128_val);
+                    return Ok(());
+                }
+
                 return Err(RowConvertError {
-                    message: format!(
-                        "Type {:?} is not yet supported for Arrow conversion",
-                        std::mem::discriminant(self)
-                    ),
+                    message: "Builder type mismatch for Decimal128".to_string(),
+                });
+            }
+            Datum::Date(date) => {
+                append_value_to_arrow!(Date32Builder, date.get_inner());
+            }
+            Datum::Time(time) => {
+                // Time is stored as milliseconds since midnight in Fluss
+                // Convert to Arrow's time unit based on schema
+                let millis = time.get_inner();
+
+                match data_type {
+                    arrow_schema::DataType::Time32(arrow_schema::TimeUnit::Second) => {
+                        if let Some(b) = builder.as_any_mut().downcast_mut::<Time32SecondBuilder>()
+                        {
+                            // Validate no sub-second precision is lost
+                            if millis % MILLIS_PER_SECOND as i32 != 0 {
+                                return Err(RowConvertError {
+                                    message: format!(
+                                        "Time value {} ms has sub-second precision but schema expects seconds only",
+                                        millis
+                                    ),
+                                });
+                            }
+                            b.append_value(millis / MILLIS_PER_SECOND as i32);
+                            return Ok(());
+                        }
+                    }
+                    arrow_schema::DataType::Time32(arrow_schema::TimeUnit::Millisecond) => {
+                        if let Some(b) = builder
+                            .as_any_mut()
+                            .downcast_mut::<Time32MillisecondBuilder>()
+                        {
+                            b.append_value(millis);
+                            return Ok(());
+                        }
+                    }
+                    arrow_schema::DataType::Time64(arrow_schema::TimeUnit::Microsecond) => {
+                        if let Some(b) = builder
+                            .as_any_mut()
+                            .downcast_mut::<Time64MicrosecondBuilder>()
+                        {
+                            let micros = (millis as i64)
+                                .checked_mul(MICROS_PER_MILLI)
+                                .ok_or_else(|| RowConvertError {
+                                    message: format!(
+                                        "Time value {} ms overflows when converting to microseconds",
+                                        millis
+                                    ),
+                                })?;
+                            b.append_value(micros);
+                            return Ok(());
+                        }
+                    }
+                    arrow_schema::DataType::Time64(arrow_schema::TimeUnit::Nanosecond) => {
+                        if let Some(b) = builder
+                            .as_any_mut()
+                            .downcast_mut::<Time64NanosecondBuilder>()
+                        {
+                            let nanos = (millis as i64).checked_mul(NANOS_PER_MILLI).ok_or_else(
+                                || RowConvertError {
+                                    message: format!(
+                                        "Time value {} ms overflows when converting to nanoseconds",
+                                        millis
+                                    ),
+                                },
+                            )?;
+                            b.append_value(nanos);
+                            return Ok(());
+                        }
+                    }
+                    _ => {
+                        return Err(RowConvertError {
+                            message: format!(
+                                "Expected Time32/Time64 Arrow type, got: {:?}",
+                                data_type
+                            ),
+                        });
+                    }
+                }
+
+                return Err(RowConvertError {
+                    message: "Builder type mismatch for Time".to_string(),
+                });
+            }
+            Datum::TimestampNtz(ts) => {
+                let millis = ts.get_millisecond();
+                let nanos = ts.get_nano_of_millisecond();
+
+                if let Some(b) = builder
+                    .as_any_mut()
+                    .downcast_mut::<TimestampSecondBuilder>()
+                {
+                    b.append_value(millis / MILLIS_PER_SECOND);
+                    return Ok(());
+                }
+                if let Some(b) = builder
+                    .as_any_mut()
+                    .downcast_mut::<TimestampMillisecondBuilder>()
+                {
+                    b.append_value(millis);
+                    return Ok(());
+                }
+                if let Some(b) = builder
+                    .as_any_mut()
+                    .downcast_mut::<TimestampMicrosecondBuilder>()
+                {
+                    b.append_value(millis_nanos_to_micros(millis, nanos)?);
+                    return Ok(());
+                }
+                if let Some(b) = builder
+                    .as_any_mut()
+                    .downcast_mut::<TimestampNanosecondBuilder>()
+                {
+                    b.append_value(millis_nanos_to_nanos(millis, nanos)?);
+                    return Ok(());
+                }
+
+                return Err(RowConvertError {
+                    message: "Builder type mismatch for TimestampNtz".to_string(),
+                });
+            }
+            Datum::TimestampLtz(ts) => {
+                let millis = ts.get_epoch_millisecond();
+                let nanos = ts.get_nano_of_millisecond();
+
+                if let Some(b) = builder
+                    .as_any_mut()
+                    .downcast_mut::<TimestampSecondBuilder>()
+                {
+                    b.append_value(millis / MILLIS_PER_SECOND);
+                    return Ok(());
+                }
+                if let Some(b) = builder
+                    .as_any_mut()
+                    .downcast_mut::<TimestampMillisecondBuilder>()
+                {
+                    b.append_value(millis);
+                    return Ok(());
+                }
+                if let Some(b) = builder
+                    .as_any_mut()
+                    .downcast_mut::<TimestampMicrosecondBuilder>()
+                {
+                    b.append_value(millis_nanos_to_micros(millis, nanos)?);
+                    return Ok(());
+                }
+                if let Some(b) = builder
+                    .as_any_mut()
+                    .downcast_mut::<TimestampNanosecondBuilder>()
+                {
+                    b.append_value(millis_nanos_to_nanos(millis, nanos)?);
+                    return Ok(());
+                }
+
+                return Err(RowConvertError {
+                    message: "Builder type mismatch for TimestampLtz".to_string(),
                 });
             }
         }
@@ -325,7 +730,11 @@ impl Datum<'_> {
 macro_rules! impl_to_arrow {
     ($ty:ty, $variant:ident) => {
         impl ToArrow for $ty {
-            fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()> {
+            fn append_to(
+                &self,
+                builder: &mut dyn ArrayBuilder,
+                _data_type: &arrow_schema::DataType,
+            ) -> Result<()> {
                 if let Some(b) = builder.as_any_mut().downcast_mut::<$variant>() {
                     b.append_value(*self);
                     Ok(())
@@ -536,24 +945,39 @@ mod tests {
         assert_eq!(value, 42);
         let value: std::result::Result<i16, _> = (&datum).try_into();
         assert!(value.is_err());
+
+        // Test decimal and temporal types
+        let decimal = Decimal::from_unscaled_long(12345, 10, 2).unwrap();
+        let datum: Datum = decimal.clone().into();
+        assert_eq!(datum.as_decimal(), &decimal);
+        let extracted: Decimal = (&datum).try_into().unwrap();
+        assert_eq!(extracted, decimal);
+
+        let date = Date::new(19000);
+        let datum: Datum = date.into();
+        assert_eq!(datum.as_date(), date);
+
+        let ts_ltz = TimestampLtz::new(1672531200000);
+        let datum: Datum = ts_ltz.into();
+        assert_eq!(datum.as_timestamp_ltz(), ts_ltz);
     }
 
     #[test]
     fn datum_append_to_builder() {
         let mut builder = Int32Builder::new();
-        Datum::Null.append_to(&mut builder).unwrap();
-        Datum::Int32(5).append_to(&mut builder).unwrap();
+        Datum::Null
+            .append_to(&mut builder, &arrow_schema::DataType::Int32)
+            .unwrap();
+        Datum::Int32(5)
+            .append_to(&mut builder, &arrow_schema::DataType::Int32)
+            .unwrap();
         let array = builder.finish();
         assert!(array.is_null(0));
         assert_eq!(array.value(1), 5);
 
         let mut builder = StringBuilder::new();
-        let err = Datum::Int32(1).append_to(&mut builder).unwrap_err();
-        assert!(matches!(err, crate::error::Error::RowConvertError { .. }));
-
-        let mut builder = Int32Builder::new();
-        let err = Datum::Date(Date::new(0))
-            .append_to(&mut builder)
+        let err = Datum::Int32(1)
+            .append_to(&mut builder, &arrow_schema::DataType::Utf8)
             .unwrap_err();
         assert!(matches!(err, crate::error::Error::RowConvertError { .. }));
     }

From ed9bca6787f4e860e2f78c4831d4e184daa57b77 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Fri, 23 Jan 2026 14:44:55 +0800
Subject: [PATCH 081/287] chore: invalidate leader info on stale metadata error
 when handling fetch response (#189)

---
 .../crates/fluss/src/client/metadata.rs       |  12 +-
 .../crates/fluss/src/client/table/scanner.rs  | 149 ++++++++++++++----
 .../crates/fluss/src/cluster/cluster.rs       |  64 ++++++--
 fluss-rust/crates/fluss/src/metadata/table.rs |   2 +-
 4 files changed, 185 insertions(+), 42 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index 0e6f965131..3c6730b545 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -17,7 +17,7 @@
 
 use crate::cluster::{Cluster, ServerNode, ServerType};
 use crate::error::Result;
-use crate::metadata::{TableBucket, TablePath};
+use crate::metadata::{PhysicalTablePath, TableBucket, TablePath};
 use crate::proto::MetadataResponse;
 use crate::rpc::message::UpdateMetadataRequest;
 use crate::rpc::{RpcClient, ServerConnection};
@@ -71,6 +71,16 @@ impl Metadata {
         *cluster_guard = Arc::new(updated_cluster);
     }
 
+    pub fn invalidate_physical_table_meta(
+        &self,
+        physical_tables_to_invalid: &HashSet<PhysicalTablePath>,
+    ) {
+        let mut cluster_guard = self.cluster.write(); // presumably a write lock; confirm field type
+        let updated_cluster =
+            cluster_guard.invalidate_physical_table_meta(physical_tables_to_invalid);
+        *cluster_guard = Arc::new(updated_cluster); // replace the stored Arc with the new cluster
+    }
+
     pub async fn update(&self, metadata_response: MetadataResponse) -> Result<()> {
         let origin_cluster = self.cluster.read().clone();
         let new_cluster =
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index cf0b257f00..afa44f350b 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -36,7 +36,7 @@ use crate::client::table::remote_log::{
     RemoteLogDownloader, RemoteLogFetchInfo, RemotePendingFetch,
 };
 use crate::error::{ApiError, Error, FlussError, Result};
-use crate::metadata::{TableBucket, TableInfo, TablePath};
+use crate::metadata::{PhysicalTablePath, TableBucket, TableInfo, TablePath};
 use crate::proto::{ErrorResponse, FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
 use crate::record::{LogRecordsBatches, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
 use crate::rpc::{RpcClient, RpcError, message};
@@ -462,6 +462,16 @@ struct LogFetcher {
     nodes_with_pending_fetch_requests: Arc<Mutex<HashSet<i32>>>,
 }
 
+struct FetchResponseContext { // state passed by value to LogFetcher::handle_fetch_response
+    metadata: Arc<Metadata>,
+    log_fetch_buffer: Arc<LogFetchBuffer>,
+    log_scanner_status: Arc<LogScannerStatus>,
+    read_context: ReadContext,
+    remote_read_context: ReadContext,
+    remote_log_downloader: Arc<RemoteLogDownloader>,
+    credentials_cache: Arc<CredentialsCache>,
+}
+
 impl LogFetcher {
     pub fn new(
         table_info: TableInfo,
@@ -518,7 +528,8 @@ impl LogFetcher {
             | FlussError::LogStorageException
             | FlussError::KvStorageException
             | FlussError::StorageException
-            | FlussError::FencedLeaderEpochException => FetchErrorContext {
+            | FlussError::FencedLeaderEpochException
+            | FlussError::LeaderNotAvailableException => FetchErrorContext {
                 action: FetchErrorAction::Ignore,
                 log_level: FetchErrorLogLevel::Debug,
                 log_message: format!(
@@ -570,6 +581,17 @@ impl LogFetcher {
         }
     }
 
+    fn should_invalidate_table_meta(error: FlussError) -> bool {
+        matches!(
+            error, // true only for the five error codes listed below
+            FlussError::NotLeaderOrFollower
+                | FlussError::LeaderNotAvailableException
+                | FlussError::FencedLeaderEpochException
+                | FlussError::UnknownTableOrBucketException
+                | FlussError::InvalidCoordinatorException
+        )
+    }
+
     async fn check_and_update_metadata(&self) -> Result<()> {
         let need_update = self
             .fetchable_buckets()
@@ -639,6 +661,15 @@ impl LogFetcher {
             let creds_cache = self.credentials_cache.clone();
             let nodes_with_pending = self.nodes_with_pending_fetch_requests.clone();
             let metadata = self.metadata.clone();
+            let response_context = FetchResponseContext {
+                metadata: metadata.clone(),
+                log_fetch_buffer,
+                log_scanner_status,
+                read_context,
+                remote_read_context,
+                remote_log_downloader,
+                credentials_cache: creds_cache,
+            };
             // Spawn async task to handle the fetch request
             // Note: These tasks are not explicitly tracked or cancelled when LogFetcher is dropped.
             // This is acceptable because:
@@ -684,16 +715,7 @@ impl LogFetcher {
                     }
                 };
 
-                Self::handle_fetch_response(
-                    fetch_response,
-                    &log_fetch_buffer,
-                    &log_scanner_status,
-                    &read_context,
-                    &remote_read_context,
-                    &remote_log_downloader,
-                    &creds_cache,
-                )
-                .await;
+                Self::handle_fetch_response(fetch_response, response_context).await;
             });
         }
 
@@ -712,13 +734,18 @@ impl LogFetcher {
     /// Handle fetch response and add completed fetches to buffer
     async fn handle_fetch_response(
         fetch_response: crate::proto::FetchLogResponse,
-        log_fetch_buffer: &Arc<LogFetchBuffer>,
-        log_scanner_status: &Arc<LogScannerStatus>,
-        read_context: &ReadContext,
-        remote_read_context: &ReadContext,
-        remote_log_downloader: &Arc<RemoteLogDownloader>,
-        credentials_cache: &Arc<CredentialsCache>,
+        context: FetchResponseContext,
     ) {
+        let FetchResponseContext {
+            metadata,
+            log_fetch_buffer,
+            log_scanner_status,
+            read_context,
+            remote_read_context,
+            remote_log_downloader,
+            credentials_cache,
+        } = context;
+
         for pb_fetch_log_resp in fetch_response.tables_resp {
             let table_id = pb_fetch_log_resp.table_id;
             let fetch_log_for_buckets = pb_fetch_log_resp.buckets_resp;
@@ -745,6 +772,20 @@ impl LogFetcher {
                     .into();
 
                     let error = FlussError::for_code(error_code);
+                    if Self::should_invalidate_table_meta(error) {
+                        // TODO: Consider triggering table meta invalidation from sender/lookup paths.
+                        let table_id = table_bucket.table_id();
+                        let cluster = metadata.get_cluster();
+                        if let Some(table_path) = cluster.get_table_path_by_id(table_id) {
+                            let physical_tables =
+                                HashSet::from([PhysicalTablePath::of(table_path.clone())]);
+                            metadata.invalidate_physical_table_meta(&physical_tables);
+                        } else {
+                            warn!(
+                                "Table id {table_id} is missing from table_path_by_id while invalidating table metadata"
+                            );
+                        }
+                    }
                     let error_context = Self::describe_fetch_error(
                         error,
                         &table_bucket,
@@ -1577,20 +1618,72 @@ mod tests {
             }],
         };
 
-        LogFetcher::handle_fetch_response(
-            response,
-            &fetcher.log_fetch_buffer,
-            &fetcher.log_scanner_status,
-            &fetcher.read_context,
-            &fetcher.remote_read_context,
-            &fetcher.remote_log_downloader,
-            &fetcher.credentials_cache,
-        )
-        .await;
+        let response_context = FetchResponseContext {
+            metadata: metadata.clone(),
+            log_fetch_buffer: fetcher.log_fetch_buffer.clone(),
+            log_scanner_status: fetcher.log_scanner_status.clone(),
+            read_context: fetcher.read_context.clone(),
+            remote_read_context: fetcher.remote_read_context.clone(),
+            remote_log_downloader: fetcher.remote_log_downloader.clone(),
+            credentials_cache: fetcher.credentials_cache.clone(),
+        };
+
+        LogFetcher::handle_fetch_response(response, response_context).await;
 
         let completed = fetcher.log_fetch_buffer.poll().expect("completed fetch");
         let api_error = completed.api_error().expect("api error");
         assert_eq!(api_error.code, FlussError::AuthorizationException.code());
         Ok(())
     }
+
+    #[tokio::test]
+    async fn handle_fetch_response_invalidates_table_meta() -> Result<()> {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = build_table_info(table_path.clone(), 1, 1);
+        let cluster = build_cluster_arc(&table_path, 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
+        let status = Arc::new(LogScannerStatus::new());
+        status.assign_scan_bucket(TableBucket::new(1, 0), 5);
+        let fetcher = LogFetcher::new(
+            table_info.clone(),
+            Arc::new(RpcClient::new()),
+            metadata.clone(),
+            status.clone(),
+            None,
+        )?;
+
+        let bucket = TableBucket::new(1, 0);
+        assert!(metadata.leader_for(&bucket).is_some());
+
+        let response = crate::proto::FetchLogResponse {
+            tables_resp: vec![crate::proto::PbFetchLogRespForTable {
+                table_id: 1,
+                buckets_resp: vec![crate::proto::PbFetchLogRespForBucket {
+                    partition_id: None,
+                    bucket_id: 0,
+                    error_code: Some(FlussError::NotLeaderOrFollower.code()),
+                    error_message: Some("not leader".to_string()),
+                    high_watermark: None,
+                    log_start_offset: None,
+                    remote_log_fetch_info: None,
+                    records: None,
+                }],
+            }],
+        };
+
+        let response_context = FetchResponseContext {
+            metadata: metadata.clone(),
+            log_fetch_buffer: fetcher.log_fetch_buffer.clone(),
+            log_scanner_status: fetcher.log_scanner_status.clone(),
+            read_context: fetcher.read_context.clone(),
+            remote_read_context: fetcher.remote_read_context.clone(),
+            remote_log_downloader: fetcher.remote_log_downloader.clone(),
+            credentials_cache: fetcher.credentials_cache.clone(),
+        };
+
+        LogFetcher::handle_fetch_response(response, response_context).await;
+
+        assert!(metadata.leader_for(&bucket).is_none());
+        Ok(())
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/cluster/cluster.rs b/fluss-rust/crates/fluss/src/cluster/cluster.rs
index f14d055f9b..2484026a98 100644
--- a/fluss-rust/crates/fluss/src/cluster/cluster.rs
+++ b/fluss-rust/crates/fluss/src/cluster/cluster.rs
@@ -18,7 +18,9 @@
 use crate::BucketId;
 use crate::cluster::{BucketLocation, ServerNode, ServerType};
 use crate::error::Result;
-use crate::metadata::{JsonSerde, TableBucket, TableDescriptor, TableInfo, TablePath};
+use crate::metadata::{
+    JsonSerde, PhysicalTablePath, TableBucket, TableDescriptor, TableInfo, TablePath,
+};
 use crate::proto::MetadataResponse;
 use crate::rpc::{from_pb_server_node, from_pb_table_path};
 use rand::random_range;
@@ -77,23 +79,33 @@ impl Cluster {
             .filter_map(|id| self.table_path_by_id.get(id))
             .collect();
 
-        let available_locations_by_path = self
-            .available_locations_by_path
-            .iter()
-            .filter(|&(path, _)| !table_paths.contains(path))
-            .map(|(path, locations)| (path.clone(), locations.clone()))
-            .collect();
+        let (available_locations_by_path, available_locations_by_bucket) =
+            self.filter_bucket_locations_by_path(&table_paths);
 
-        let available_locations_by_bucket = self
-            .available_locations_by_bucket
+        Cluster::new(
+            self.coordinator_server.clone(),
+            alive_tablet_servers_by_id,
+            available_locations_by_path,
+            available_locations_by_bucket,
+            self.table_id_by_path.clone(),
+            self.table_info_by_path.clone(),
+        )
+    }
+
+    pub fn invalidate_physical_table_meta(
+        &self,
+        physical_tables_to_invalid: &HashSet<PhysicalTablePath>,
+    ) -> Self {
+        let table_paths: HashSet<&TablePath> = physical_tables_to_invalid
             .iter()
-            .filter(|&(_bucket, location)| !table_paths.contains(&location.table_path))
-            .map(|(bucket, location)| (bucket.clone(), location.clone()))
+            .map(|path| path.get_table_path())
             .collect();
+        let (available_locations_by_path, available_locations_by_bucket) =
+            self.filter_bucket_locations_by_path(&table_paths);
 
         Cluster::new(
             self.coordinator_server.clone(),
-            alive_tablet_servers_by_id,
+            self.alive_tablet_servers_by_id.clone(),
             available_locations_by_path,
             available_locations_by_bucket,
             self.table_id_by_path.clone(),
@@ -122,6 +134,30 @@ impl Cluster {
         self.table_info_by_path = table_info_by_path;
     }
 
+    fn filter_bucket_locations_by_path(
+        &self,
+        table_paths: &HashSet<&TablePath>,
+    ) -> (
+        HashMap<TablePath, Vec<BucketLocation>>,
+        HashMap<TableBucket, BucketLocation>,
+    ) {
+        let available_locations_by_path = self
+            .available_locations_by_path
+            .iter()
+            .filter(|&(path, _)| !table_paths.contains(path))
+            .map(|(path, locations)| (path.clone(), locations.clone()))
+            .collect();
+
+        let available_locations_by_bucket = self
+            .available_locations_by_bucket
+            .iter()
+            .filter(|&(_bucket, location)| !table_paths.contains(&location.table_path))
+            .map(|(bucket, location)| (bucket.clone(), location.clone()))
+            .collect();
+
+        (available_locations_by_path, available_locations_by_bucket)
+    }
+
     pub fn from_metadata_response(
         metadata_response: MetadataResponse,
         origin_cluster: Option<&Cluster>,
@@ -242,6 +278,10 @@ impl Cluster {
         &self.table_id_by_path
     }
 
+    pub fn get_table_path_by_id(&self, table_id: i64) -> Option<&TablePath> {
+        self.table_path_by_id.get(&table_id)
+    }
+
     pub fn get_available_buckets_for_table_path(
         &self,
         table_path: &TablePath,
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 8204e7c46c..f4cf972d26 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -697,7 +697,7 @@ impl TablePath {
     }
 }
 
-#[derive(Debug, Clone)]
+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
 pub struct PhysicalTablePath {
     table_path: TablePath,
     #[allow(dead_code)]

From e2e0c22ab83477d41d90a72ffedc1ca295f9d18a Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Fri, 23 Jan 2026 07:39:34 +0000
Subject: [PATCH 082/287] test: Kv Table Integration tests (#192)

---
 .../crates/fluss/tests/integration/admin.rs   |  40 +-
 .../fluss/tests/integration/kv_table.rs       | 444 ++++++++++++++++++
 .../crates/fluss/tests/integration/table.rs   |  44 +-
 .../tests/integration/table_remote_scan.rs    |  34 +-
 .../crates/fluss/tests/integration/utils.rs   |  74 +++
 fluss-rust/crates/fluss/tests/test_fluss.rs   |   1 +
 6 files changed, 538 insertions(+), 99 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/tests/integration/kv_table.rs

diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index ccb717228e..fbdb295d40 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -33,55 +33,25 @@ static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>>
 #[after_all]
 mod admin_test {
     use super::SHARED_FLUSS_CLUSTER;
-    use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
+    use crate::integration::fluss_cluster::FlussTestingCluster;
+    use crate::integration::utils::{get_cluster, start_cluster, stop_cluster};
     use fluss::error::FlussError;
     use fluss::metadata::{
         DataTypes, DatabaseDescriptorBuilder, KvFormat, LogFormat, Schema, TableDescriptor,
         TablePath,
     };
     use std::sync::Arc;
-    use std::thread;
 
     fn before_all() {
-        // Create a new tokio runtime in a separate thread
-        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
-        thread::spawn(move || {
-            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
-            rt.block_on(async {
-                let cluster = FlussTestingClusterBuilder::new("test-admin").build().await;
-                let mut guard = cluster_guard.write();
-                *guard = Some(cluster);
-            });
-        })
-        .join()
-        .expect("Failed to create cluster");
-        // wait for 20 seconds to avoid the error like
-        // CoordinatorEventProcessor is not initialized yet
-        thread::sleep(std::time::Duration::from_secs(20));
+        start_cluster("test-admin", SHARED_FLUSS_CLUSTER.clone());
     }
 
     fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
-        let cluster_guard = SHARED_FLUSS_CLUSTER.read();
-        if cluster_guard.is_none() {
-            panic!("Fluss cluster not initialized. Make sure before_all() was called.");
-        }
-        Arc::new(cluster_guard.as_ref().unwrap().clone())
+        get_cluster(&SHARED_FLUSS_CLUSTER)
     }
 
     fn after_all() {
-        // Create a new tokio runtime in a separate thread
-        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
-        std::thread::spawn(move || {
-            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
-            rt.block_on(async {
-                let mut guard = cluster_guard.write();
-                if let Some(cluster) = guard.take() {
-                    cluster.stop().await;
-                }
-            });
-        })
-        .join()
-        .expect("Failed to cleanup cluster");
+        stop_cluster(SHARED_FLUSS_CLUSTER.clone());
     }
 
     #[tokio::test]
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
new file mode 100644
index 0000000000..efd7957549
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -0,0 +1,444 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+use parking_lot::RwLock;
+use std::sync::Arc;
+use std::sync::LazyLock;
+
+use crate::integration::fluss_cluster::FlussTestingCluster;
+#[cfg(test)]
+use test_env_helpers::*;
+
+// Module-level shared cluster instance (only for this test file)
+static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>> =
+    LazyLock::new(|| Arc::new(RwLock::new(None)));
+
+#[cfg(test)]
+#[before_all]
+#[after_all]
+mod kv_table_test {
+    use super::SHARED_FLUSS_CLUSTER;
+    use crate::integration::fluss_cluster::FlussTestingCluster;
+    use crate::integration::utils::{create_table, get_cluster, start_cluster, stop_cluster};
+    use fluss::client::UpsertWriter;
+    use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+    use fluss::row::{GenericRow, InternalRow};
+    use std::sync::Arc;
+
+    fn before_all() {
+        start_cluster("test_kv_table", SHARED_FLUSS_CLUSTER.clone());
+    }
+
+    fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
+        get_cluster(&SHARED_FLUSS_CLUSTER)
+    }
+
+    fn after_all() {
+        stop_cluster(SHARED_FLUSS_CLUSTER.clone());
+    }
+
+    fn make_key(id: i32) -> GenericRow<'static> {
+        let mut row = GenericRow::new();
+        row.set_field(0, id);
+        row.set_field(1, "");
+        row.set_field(2, 0i64);
+        row
+    }
+
+    #[tokio::test]
+    async fn upsert_delete_and_lookup() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss".to_string(), "test_upsert_and_lookup".to_string());
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .column("age", DataTypes::bigint())
+                    .primary_key(vec!["id".to_string()])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+        let mut upsert_writer = table_upsert
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let test_data = [(1, "Verso", 32i64), (2, "Noco", 25), (3, "Esquie", 35)];
+
+        // Upsert rows
+        for (id, name, age) in &test_data {
+            let mut row = GenericRow::new();
+            row.set_field(0, *id);
+            row.set_field(1, *name);
+            row.set_field(2, *age);
+            upsert_writer
+                .upsert(&row)
+                .await
+                .expect("Failed to upsert row");
+        }
+
+        // Lookup records
+        let mut lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .create_lookuper()
+            .expect("Failed to create lookuper");
+
+        // Verify lookup results
+        for (id, expected_name, expected_age) in &test_data {
+            let result = lookuper
+                .lookup(&make_key(*id))
+                .await
+                .expect("Failed to lookup");
+            let row = result
+                .get_single_row()
+                .expect("Failed to get row")
+                .expect("Row should exist");
+
+            assert_eq!(row.get_int(0), *id, "id mismatch");
+            assert_eq!(row.get_string(1), *expected_name, "name mismatch");
+            assert_eq!(row.get_long(2), *expected_age, "age mismatch");
+        }
+
+        // Update the record with new age
+        let mut updated_row = GenericRow::new();
+        updated_row.set_field(0, 1);
+        updated_row.set_field(1, "Verso");
+        updated_row.set_field(2, 33i64);
+        upsert_writer
+            .upsert(&updated_row)
+            .await
+            .expect("Failed to upsert updated row");
+
+        // Verify the update
+        let result = lookuper
+            .lookup(&make_key(1))
+            .await
+            .expect("Failed to lookup after update");
+        let found_row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+        assert_eq!(
+            found_row.get_long(2),
+            updated_row.get_long(2),
+            "Age should be updated"
+        );
+        assert_eq!(
+            found_row.get_string(1),
+            updated_row.get_string(1),
+            "Name should remain unchanged"
+        );
+
+        // Delete record with id=1
+        let mut delete_row = GenericRow::new();
+        delete_row.set_field(0, 1);
+        delete_row.set_field(1, "");
+        delete_row.set_field(2, 0i64);
+        upsert_writer
+            .delete(&delete_row)
+            .await
+            .expect("Failed to delete");
+
+        // Verify deletion
+        let result = lookuper
+            .lookup(&make_key(1))
+            .await
+            .expect("Failed to lookup deleted record");
+        assert!(
+            result
+                .get_single_row()
+                .expect("Failed to get row")
+                .is_none(),
+            "Record 1 should not exist after delete"
+        );
+
+        // Verify other records still exist
+        for i in [2, 3] {
+            let result = lookuper
+                .lookup(&make_key(i))
+                .await
+                .expect("Failed to lookup");
+            assert!(
+                result
+                    .get_single_row()
+                    .expect("Failed to get row")
+                    .is_some(),
+                "Record {} should still exist after deleting record 1",
+                i
+            );
+        }
+
+        // Lookup non-existent key
+        let result = lookuper
+            .lookup(&make_key(999))
+            .await
+            .expect("Failed to lookup non-existent key");
+        assert!(
+            result
+                .get_single_row()
+                .expect("Failed to get row")
+                .is_none(),
+            "Non-existent key should return None"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn composite_primary_keys() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss".to_string(), "test_composite_pk".to_string());
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("region", DataTypes::string())
+                    .column("user_id", DataTypes::int())
+                    .column("score", DataTypes::bigint())
+                    .primary_key(vec!["region".to_string(), "user_id".to_string()])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+        let mut upsert_writer = table_upsert
+            .create_writer()
+            .expect("Failed to create writer");
+
+        // Insert records with composite keys
+        let test_data = [
+            ("US", 1, 100i64),
+            ("US", 2, 200i64),
+            ("EU", 1, 150i64),
+            ("EU", 2, 250i64),
+        ];
+
+        for (region, user_id, score) in &test_data {
+            let mut row = GenericRow::new();
+            row.set_field(0, *region);
+            row.set_field(1, *user_id);
+            row.set_field(2, *score);
+            upsert_writer.upsert(&row).await.expect("Failed to upsert");
+        }
+
+        // Lookup with composite key
+        let mut lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .create_lookuper()
+            .expect("Failed to create lookuper");
+
+        // Lookup (US, 1) - should return score 100
+        let mut key = GenericRow::new();
+        key.set_field(0, "US");
+        key.set_field(1, 1);
+        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+        let row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+        assert_eq!(row.get_long(2), 100, "Score for (US, 1) should be 100");
+
+        // Lookup (EU, 2) - should return score 250
+        let mut key = GenericRow::new();
+        key.set_field(0, "EU");
+        key.set_field(1, 2);
+        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+        let row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+        assert_eq!(row.get_long(2), 250, "Score for (EU, 2) should be 250");
+
+        // Update (US, 1) score
+        let mut update_row = GenericRow::new();
+        update_row.set_field(0, "US");
+        update_row.set_field(1, 1);
+        update_row.set_field(2, 500i64);
+        upsert_writer
+            .upsert(&update_row)
+            .await
+            .expect("Failed to update");
+
+        // Verify update
+        let mut key = GenericRow::new();
+        key.set_field(0, "US");
+        key.set_field(1, 1);
+        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+        let row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+        assert_eq!(
+            row.get_long(2),
+            update_row.get_long(2),
+            "Row score should be updated"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn partial_update() {
+        use fluss::row::Datum;
+
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss".to_string(), "test_partial_update".to_string());
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .column("age", DataTypes::bigint())
+                    .column("score", DataTypes::bigint())
+                    .primary_key(vec!["id".to_string()])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        // Insert initial record with all columns
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+        let mut upsert_writer = table_upsert
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let mut row = GenericRow::new();
+        row.set_field(0, 1);
+        row.set_field(1, "Verso");
+        row.set_field(2, 32i64);
+        row.set_field(3, 6942i64);
+        upsert_writer
+            .upsert(&row)
+            .await
+            .expect("Failed to upsert initial row");
+
+        // Verify initial record
+        let mut lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .create_lookuper()
+            .expect("Failed to create lookuper");
+
+        let result = lookuper
+            .lookup(&make_key(1))
+            .await
+            .expect("Failed to lookup");
+        let found_row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+
+        assert_eq!(found_row.get_int(0), 1);
+        assert_eq!(found_row.get_string(1), "Verso");
+        assert_eq!(found_row.get_long(2), 32i64);
+        assert_eq!(found_row.get_long(3), 6942i64);
+
+        // Create partial update writer to update only score column
+        let partial_upsert = table_upsert
+            .partial_update_with_column_names(&["id", "score"])
+            .expect("Failed to create TableUpsert with partial update");
+        let mut partial_writer = partial_upsert
+            .create_writer()
+            .expect("Failed to create UpsertWriter with partial write");
+
+        // Update only the score column
+        let mut partial_row = GenericRow::new();
+        partial_row.set_field(0, 1);
+        partial_row.set_field(1, Datum::Null); // not in partial update column
+        partial_row.set_field(2, Datum::Null); // not in partial update column
+        partial_row.set_field(3, 420i64);
+        partial_writer
+            .upsert(&partial_row)
+            .await
+            .expect("Failed to upsert");
+
+        // Verify partial update - name and age should remain unchanged
+        let result = lookuper
+            .lookup(&make_key(1))
+            .await
+            .expect("Failed to lookup after partial update");
+        let found_row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+
+        assert_eq!(found_row.get_int(0), 1, "id should remain 1");
+        assert_eq!(
+            found_row.get_string(1),
+            "Verso",
+            "name should remain unchanged"
+        );
+        assert_eq!(found_row.get_long(2), 32, "age should remain unchanged");
+        assert_eq!(found_row.get_long(3), 420, "score should be updated to 420");
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index 4cba46993f..ef73b5685f 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -33,8 +33,8 @@ static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>>
 #[after_all]
 mod table_test {
     use super::SHARED_FLUSS_CLUSTER;
-    use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
-    use crate::integration::utils::create_table;
+    use crate::integration::fluss_cluster::FlussTestingCluster;
+    use crate::integration::utils::{create_table, get_cluster, start_cluster, stop_cluster};
     use arrow::array::record_batch;
     use fluss::client::{FlussTable, TableScan};
     use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
@@ -44,50 +44,18 @@ mod table_test {
     use jiff::Timestamp;
     use std::collections::HashMap;
     use std::sync::Arc;
-    use std::thread;
     use std::time::Duration;
 
     fn before_all() {
-        // Create a new tokio runtime in a separate thread
-        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
-        thread::spawn(move || {
-            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
-            rt.block_on(async {
-                let cluster = FlussTestingClusterBuilder::new("test_table").build().await;
-                let mut guard = cluster_guard.write();
-                *guard = Some(cluster);
-            });
-        })
-        .join()
-        .expect("Failed to create cluster");
-
-        // wait for 20 seconds to avoid the error like
-        // CoordinatorEventProcessor is not initialized yet
-        thread::sleep(std::time::Duration::from_secs(20));
+        start_cluster("test_table", SHARED_FLUSS_CLUSTER.clone());
     }
 
     fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
-        let cluster_guard = SHARED_FLUSS_CLUSTER.read();
-        if cluster_guard.is_none() {
-            panic!("Fluss cluster not initialized. Make sure before_all() was called.");
-        }
-        Arc::new(cluster_guard.as_ref().unwrap().clone())
+        get_cluster(&SHARED_FLUSS_CLUSTER)
     }
 
     fn after_all() {
-        // Create a new tokio runtime in a separate thread
-        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
-        thread::spawn(move || {
-            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
-            rt.block_on(async {
-                let mut guard = cluster_guard.write();
-                if let Some(cluster) = guard.take() {
-                    cluster.stop().await;
-                }
-            });
-        })
-        .join()
-        .expect("Failed to cleanup cluster");
+        stop_cluster(SHARED_FLUSS_CLUSTER.clone());
     }
 
     #[tokio::test]
@@ -527,7 +495,7 @@ mod table_test {
 
         use arrow::array::Int32Array;
         let batches = scanner.poll(Duration::from_secs(10)).await.unwrap();
-        let mut all_ids: Vec<i32> = batches
+        let all_ids: Vec<i32> = batches
             .iter()
             .flat_map(|b| {
                 (0..b.num_rows()).map(|i| {
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index 43c89b5468..e28a8362e0 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -33,19 +33,20 @@ static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>>
 mod table_remote_scan_test {
     use super::SHARED_FLUSS_CLUSTER;
     use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
-    use crate::integration::utils::create_table;
+    use crate::integration::utils::{
+        create_table, get_cluster, stop_cluster, wait_for_cluster_ready,
+    };
     use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
     use fluss::row::{GenericRow, InternalRow};
     use std::collections::HashMap;
     use std::sync::Arc;
     use std::thread;
-    use std::thread::sleep;
     use std::time::Duration;
     use uuid::Uuid;
 
     fn before_all() {
         // Create a new tokio runtime in a separate thread
-        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
+        let cluster_lock = SHARED_FLUSS_CLUSTER.clone();
         thread::spawn(move || {
             let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
             rt.block_on(async {
@@ -94,32 +95,17 @@ mod table_remote_scan_test {
                 .with_remote_data_dir(temp_dir)
                 .build()
                 .await;
-                let mut guard = cluster_guard.write();
+                wait_for_cluster_ready(&cluster).await;
+                let mut guard = cluster_lock.write();
                 *guard = Some(cluster);
             });
         })
         .join()
         .expect("Failed to create cluster");
-
-        // wait for 20 seconds to avoid the error like
-        // CoordinatorEventProcessor is not initialized yet
-        sleep(Duration::from_secs(20));
     }
 
     fn after_all() {
-        // Create a new tokio runtime in a separate thread
-        let cluster_guard = SHARED_FLUSS_CLUSTER.clone();
-        thread::spawn(move || {
-            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
-            rt.block_on(async {
-                let mut guard = cluster_guard.write();
-                if let Some(cluster) = guard.take() {
-                    cluster.stop().await;
-                }
-            });
-        })
-        .join()
-        .expect("Failed to cleanup cluster");
+        stop_cluster(SHARED_FLUSS_CLUSTER.clone());
     }
 
     #[tokio::test]
@@ -215,10 +201,6 @@ mod table_remote_scan_test {
     }
 
     fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
-        let cluster_guard = SHARED_FLUSS_CLUSTER.read();
-        if cluster_guard.is_none() {
-            panic!("Fluss cluster not initialized. Make sure before_all() was called.");
-        }
-        Arc::new(cluster_guard.as_ref().unwrap().clone())
+        get_cluster(&SHARED_FLUSS_CLUSTER)
     }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index cd1f6ccb2d..4d0c349f0c 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -15,8 +15,43 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
+use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
 use fluss::client::FlussAdmin;
 use fluss::metadata::{TableDescriptor, TablePath};
+use parking_lot::RwLock;
+use std::sync::Arc;
+use std::time::Duration;
+
+/// Polls the cluster every 500 ms until `get_admin()` succeeds and the cluster metadata reports
+/// an available server. Panics once 20 seconds have elapsed without the cluster becoming ready.
+pub async fn wait_for_cluster_ready(cluster: &FlussTestingCluster) {
+    let timeout = Duration::from_secs(20);
+    let poll_interval = Duration::from_millis(500);
+    let start = std::time::Instant::now();
+
+    loop {
+        let connection = cluster.get_fluss_connection().await;
+        if connection.get_admin().await.is_ok()
+            && connection
+                .get_metadata()
+                .get_cluster()
+                .get_one_available_server()
+                .is_some()
+        {
+            return;
+        }
+
+        if start.elapsed() >= timeout {
+            panic!(
+                "Server readiness check timed out after {} seconds. \
+                 CoordinatorEventProcessor may not be initialized or TabletServer may not be available.",
+                timeout.as_secs()
+            );
+        }
+
+        tokio::time::sleep(poll_interval).await;
+    }
+}
 
 pub async fn create_table(
     admin: &FlussAdmin,
@@ -28,3 +63,42 @@ pub async fn create_table(
         .await
         .expect("Failed to create table");
 }
+
+pub fn start_cluster(name: &str, cluster_lock: Arc<RwLock<Option<FlussTestingCluster>>>) {
+    let name = name.to_string();
+    std::thread::spawn(move || {
+        let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
+        rt.block_on(async {
+            let cluster = FlussTestingClusterBuilder::new(&name).build().await;
+            wait_for_cluster_ready(&cluster).await;
+            let mut guard = cluster_lock.write();
+            *guard = Some(cluster);
+        });
+    })
+    .join()
+    .expect("Failed to create cluster");
+}
+
+pub fn stop_cluster(cluster_lock: Arc<RwLock<Option<FlussTestingCluster>>>) {
+    std::thread::spawn(move || {
+        let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
+        rt.block_on(async {
+            let cluster = cluster_lock.write().take(); // guard dropped before the await
+            if let Some(cluster) = cluster {
+                cluster.stop().await;
+            }
+        });
+    })
+    .join()
+    .expect("Failed to cleanup cluster");
+}
+
+pub fn get_cluster(cluster_lock: &RwLock<Option<FlussTestingCluster>>) -> Arc<FlussTestingCluster> {
+    let guard = cluster_lock.read();
+    Arc::new(
+        guard
+            .as_ref()
+            .expect("Fluss cluster not initialized. Make sure before_all() was called.")
+            .clone(),
+    )
+}
diff --git a/fluss-rust/crates/fluss/tests/test_fluss.rs b/fluss-rust/crates/fluss/tests/test_fluss.rs
index 65111af218..f3987e62db 100644
--- a/fluss-rust/crates/fluss/tests/test_fluss.rs
+++ b/fluss-rust/crates/fluss/tests/test_fluss.rs
@@ -22,6 +22,7 @@ extern crate fluss;
 mod integration {
     mod admin;
     mod fluss_cluster;
+    mod kv_table;
     mod table;
 
     mod utils;

From add9dd72e9af1ed020f2bafa3f347ed3363efa74 Mon Sep 17 00:00:00 2001
From: SkylerLin <44233950+linguoxuan@users.noreply.github.com>
Date: Sat, 24 Jan 2026 10:37:34 +0800
Subject: [PATCH 083/287] test: add it test for put & get kv for all supported
 datatypes (#204)

---
 .../fluss/tests/integration/kv_table.rs       | 248 ++++++++++++++++++
 1 file changed, 248 insertions(+)

diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index efd7957549..3f46f9f6eb 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -441,4 +441,252 @@ mod kv_table_test {
             .await
             .expect("Failed to drop table");
     }
+
+    /// Integration test covering put and get operations for all supported datatypes.
+    #[tokio::test]
+    async fn all_supported_datatypes() {
+        use fluss::row::{Date, Datum, Decimal, Time, TimestampLtz, TimestampNtz};
+
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss".to_string(), "test_all_datatypes".to_string());
+
+        // Create a table with all supported primitive datatypes
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    // Primary key column
+                    .column("pk_int", DataTypes::int())
+                    // Boolean type
+                    .column("col_boolean", DataTypes::boolean())
+                    // Integer types
+                    .column("col_tinyint", DataTypes::tinyint())
+                    .column("col_smallint", DataTypes::smallint())
+                    .column("col_int", DataTypes::int())
+                    .column("col_bigint", DataTypes::bigint())
+                    // Floating point types
+                    .column("col_float", DataTypes::float())
+                    .column("col_double", DataTypes::double())
+                    // String types
+                    .column("col_char", DataTypes::char(10))
+                    .column("col_string", DataTypes::string())
+                    // Decimal type
+                    .column("col_decimal", DataTypes::decimal(10, 2))
+                    // Date and time types
+                    .column("col_date", DataTypes::date())
+                    .column("col_time", DataTypes::time())
+                    .column("col_timestamp", DataTypes::timestamp())
+                    .column("col_timestamp_ltz", DataTypes::timestamp_ltz())
+                    // Binary types
+                    .column("col_bytes", DataTypes::bytes())
+                    .column("col_binary", DataTypes::binary(20))
+                    .primary_key(vec!["pk_int".to_string()])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+        let mut upsert_writer = table_upsert
+            .create_writer()
+            .expect("Failed to create writer");
+
+        // Test data for all datatypes
+        let pk_int = 1i32;
+        let col_boolean = true;
+        let col_tinyint = 127i8;
+        let col_smallint = 32767i16;
+        let col_int = 2147483647i32;
+        let col_bigint = 9223372036854775807i64;
+        let col_float = 3.14f32;
+        let col_double = 2.718281828459045f64;
+        let col_char = "hello";
+        let col_string = "world of fluss rust client";
+        let col_decimal = Decimal::from_unscaled_long(12345, 10, 2).unwrap(); // 123.45
+        let col_date = Date::new(20476); // 2026-01-23
+        let col_time = Time::new(36827123); // 10:13:47.123
+        let col_timestamp = TimestampNtz::new(1769163227123); // 2026-01-23 10:13:47.123 UTC
+        let col_timestamp_ltz = TimestampLtz::new(1769163227123); // 2026-01-23 10:13:47.123 UTC
+        let col_bytes: &[u8] = b"binary data";
+        let col_binary: &[u8] = b"fixed binary data!!!";
+
+        // Upsert a row with all datatypes
+        let mut row = GenericRow::new();
+        row.set_field(0, pk_int);
+        row.set_field(1, col_boolean);
+        row.set_field(2, col_tinyint);
+        row.set_field(3, col_smallint);
+        row.set_field(4, col_int);
+        row.set_field(5, col_bigint);
+        row.set_field(6, col_float);
+        row.set_field(7, col_double);
+        row.set_field(8, col_char);
+        row.set_field(9, col_string);
+        row.set_field(10, col_decimal.clone());
+        row.set_field(11, col_date);
+        row.set_field(12, col_time);
+        row.set_field(13, col_timestamp);
+        row.set_field(14, col_timestamp_ltz);
+        row.set_field(15, col_bytes);
+        row.set_field(16, col_binary);
+
+        upsert_writer
+            .upsert(&row)
+            .await
+            .expect("Failed to upsert row with all datatypes");
+
+        // Lookup the record
+        let mut lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .create_lookuper()
+            .expect("Failed to create lookuper");
+
+        let mut key = GenericRow::new();
+        key.set_field(0, pk_int);
+
+        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+        let found_row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+
+        // Verify all datatypes
+        assert_eq!(found_row.get_int(0), pk_int, "pk_int mismatch");
+        assert_eq!(
+            found_row.get_boolean(1),
+            col_boolean,
+            "col_boolean mismatch"
+        );
+        assert_eq!(found_row.get_byte(2), col_tinyint, "col_tinyint mismatch");
+        assert_eq!(
+            found_row.get_short(3),
+            col_smallint,
+            "col_smallint mismatch"
+        );
+        assert_eq!(found_row.get_int(4), col_int, "col_int mismatch");
+        assert_eq!(found_row.get_long(5), col_bigint, "col_bigint mismatch");
+        assert!(
+            (found_row.get_float(6) - col_float).abs() < f32::EPSILON,
+            "col_float mismatch: expected {}, got {}",
+            col_float,
+            found_row.get_float(6)
+        );
+        assert!(
+            (found_row.get_double(7) - col_double).abs() < f64::EPSILON,
+            "col_double mismatch: expected {}, got {}",
+            col_double,
+            found_row.get_double(7)
+        );
+        assert_eq!(found_row.get_char(8, 10), col_char, "col_char mismatch");
+        assert_eq!(found_row.get_string(9), col_string, "col_string mismatch");
+        assert_eq!(
+            found_row.get_decimal(10, 10, 2),
+            col_decimal,
+            "col_decimal mismatch"
+        );
+        assert_eq!(
+            found_row.get_date(11).get_inner(),
+            col_date.get_inner(),
+            "col_date mismatch"
+        );
+        assert_eq!(
+            found_row.get_time(12).get_inner(),
+            col_time.get_inner(),
+            "col_time mismatch"
+        );
+        assert_eq!(
+            found_row.get_timestamp_ntz(13, 6).get_millisecond(),
+            col_timestamp.get_millisecond(),
+            "col_timestamp mismatch"
+        );
+        assert_eq!(
+            found_row.get_timestamp_ltz(14, 6).get_epoch_millisecond(),
+            col_timestamp_ltz.get_epoch_millisecond(),
+            "col_timestamp_ltz mismatch"
+        );
+        assert_eq!(found_row.get_bytes(15), col_bytes, "col_bytes mismatch");
+        assert_eq!(
+            found_row.get_binary(16, 20),
+            col_binary,
+            "col_binary mismatch"
+        );
+
+        // Test with null values for nullable columns
+        let pk_int_2 = 2i32;
+        let mut row_with_nulls = GenericRow::new();
+        row_with_nulls.set_field(0, pk_int_2);
+        row_with_nulls.set_field(1, Datum::Null); // col_boolean
+        row_with_nulls.set_field(2, Datum::Null); // col_tinyint
+        row_with_nulls.set_field(3, Datum::Null); // col_smallint
+        row_with_nulls.set_field(4, Datum::Null); // col_int
+        row_with_nulls.set_field(5, Datum::Null); // col_bigint
+        row_with_nulls.set_field(6, Datum::Null); // col_float
+        row_with_nulls.set_field(7, Datum::Null); // col_double
+        row_with_nulls.set_field(8, Datum::Null); // col_char
+        row_with_nulls.set_field(9, Datum::Null); // col_string
+        row_with_nulls.set_field(10, Datum::Null); // col_decimal
+        row_with_nulls.set_field(11, Datum::Null); // col_date
+        row_with_nulls.set_field(12, Datum::Null); // col_time
+        row_with_nulls.set_field(13, Datum::Null); // col_timestamp
+        row_with_nulls.set_field(14, Datum::Null); // col_timestamp_ltz
+        row_with_nulls.set_field(15, Datum::Null); // col_bytes
+        row_with_nulls.set_field(16, Datum::Null); // col_binary
+
+        upsert_writer
+            .upsert(&row_with_nulls)
+            .await
+            .expect("Failed to upsert row with nulls");
+
+        // Lookup row with nulls
+        let mut key2 = GenericRow::new();
+        key2.set_field(0, pk_int_2);
+
+        let result = lookuper.lookup(&key2).await.expect("Failed to lookup");
+        let found_row_nulls = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+
+        // Verify all nullable columns are null
+        assert_eq!(found_row_nulls.get_int(0), pk_int_2, "pk_int mismatch");
+        assert!(found_row_nulls.is_null_at(1), "col_boolean should be null");
+        assert!(found_row_nulls.is_null_at(2), "col_tinyint should be null");
+        assert!(found_row_nulls.is_null_at(3), "col_smallint should be null");
+        assert!(found_row_nulls.is_null_at(4), "col_int should be null");
+        assert!(found_row_nulls.is_null_at(5), "col_bigint should be null");
+        assert!(found_row_nulls.is_null_at(6), "col_float should be null");
+        assert!(found_row_nulls.is_null_at(7), "col_double should be null");
+        assert!(found_row_nulls.is_null_at(8), "col_char should be null");
+        assert!(found_row_nulls.is_null_at(9), "col_string should be null");
+        assert!(found_row_nulls.is_null_at(10), "col_decimal should be null");
+        assert!(found_row_nulls.is_null_at(11), "col_date should be null");
+        assert!(found_row_nulls.is_null_at(12), "col_time should be null");
+        assert!(
+            found_row_nulls.is_null_at(13),
+            "col_timestamp should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(14),
+            "col_timestamp_ltz should be null"
+        );
+        assert!(found_row_nulls.is_null_at(15), "col_bytes should be null");
+        assert!(found_row_nulls.is_null_at(16), "col_binary should be null");
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
 }

From eda19e2230015095818bb0022e6fbabf6aca31a7 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 25 Jan 2026 01:09:12 +0000
Subject: [PATCH 084/287] feat: introduce priority queue for downloading remote
 segments (#187)

---
 .../crates/fluss/src/client/connection.rs     |    4 +
 .../src/client/table/log_fetch_buffer.rs      |  195 ++-
 .../crates/fluss/src/client/table/mod.rs      |    3 +
 .../fluss/src/client/table/remote_log.rs      | 1087 +++++++++++++++--
 .../crates/fluss/src/client/table/scanner.rs  |   44 +-
 fluss-rust/crates/fluss/src/config.rs         |   12 +
 .../crates/fluss/src/proto/fluss_api.proto    |    1 +
 fluss-rust/crates/fluss/src/record/arrow.rs   |  432 ++++++-
 fluss-rust/crates/fluss/src/util/mod.rs       |    9 +-
 9 files changed, 1611 insertions(+), 176 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 595daf55f5..0e41bbe756 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -59,6 +59,10 @@ impl FlussConnection {
         self.network_connects.clone()
     }
 
+    pub fn config(&self) -> &Config {
+        &self.args
+    }
+
     pub async fn get_admin(&self) -> Result<FlussAdmin> {
         FlussAdmin::new(self.network_connects.clone(), self.metadata.clone()).await
     }
diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index 214a79cd7d..4a64eda25a 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -18,15 +18,22 @@
 use arrow::array::RecordBatch;
 use parking_lot::Mutex;
 
+use crate::client::table::remote_log::{
+    PrefetchPermit, RemoteLogDownloadFuture, RemoteLogFile, RemoteLogSegment,
+};
 use crate::error::{ApiError, Error, Result};
 use crate::metadata::TableBucket;
 use crate::record::{
     LogRecordBatch, LogRecordIterator, LogRecordsBatches, ReadContext, ScanRecord,
 };
-use std::collections::{HashMap, VecDeque};
-use std::sync::Arc;
-use std::sync::atomic::{AtomicBool, Ordering};
-use std::time::Duration;
+use std::{
+    collections::{HashMap, VecDeque},
+    sync::{
+        Arc,
+        atomic::{AtomicBool, Ordering},
+    },
+    time::{Duration, Instant},
+};
 use tokio::sync::Notify;
 
 #[derive(Clone, Copy, Debug, PartialEq, Eq)]
@@ -106,7 +113,7 @@ impl LogFetchBuffer {
     /// Wait for the buffer to become non-empty, with timeout.
     /// Returns true if data became available, false if timeout.
     pub async fn await_not_empty(&self, timeout: Duration) -> Result<bool> {
-        let deadline = std::time::Instant::now() + timeout;
+        let deadline = Instant::now() + timeout;
 
         loop {
             // Check if buffer is not empty
@@ -122,7 +129,7 @@ impl LogFetchBuffer {
             }
 
             // Check if timeout
-            let now = std::time::Instant::now();
+            let now = Instant::now();
             if now >= deadline {
                 return Ok(false);
             }
@@ -325,6 +332,7 @@ impl PendingFetch for CompletedPendingFetch {
 }
 
 /// Default implementation of CompletedFetch for in-memory log records
+/// Used for local fetches from tablet server
 pub struct DefaultCompletedFetch {
     table_bucket: TableBucket,
     api_error: Option<ApiError>,
@@ -441,7 +449,8 @@ impl DefaultCompletedFetch {
                 if record.offset() >= self.next_fetch_offset {
                     return Ok(Some(record));
                 }
-            } else if let Some(batch) = self.log_record_batch.next() {
+            } else if let Some(batch_result) = self.log_record_batch.next() {
+                let batch = batch_result?;
                 self.current_record_iterator = Some(batch.records(&self.read_context)?);
                 self.current_record_batch = Some(batch);
             } else {
@@ -470,11 +479,12 @@ impl DefaultCompletedFetch {
     /// Get the next batch directly without row iteration
     fn next_fetched_batch(&mut self) -> Result<Option<RecordBatch>> {
         loop {
-            let Some(log_batch) = self.log_record_batch.next() else {
+            let Some(log_batch_result) = self.log_record_batch.next() else {
                 self.drain();
                 return Ok(None);
             };
 
+            let log_batch = log_batch_result?;
             let mut record_batch = log_batch.record_batch(&self.read_context)?;
 
             // Skip empty batches
@@ -644,6 +654,174 @@ impl CompletedFetch for DefaultCompletedFetch {
     }
 }
 
+/// Completed fetch for a remote log segment; record access is delegated to `inner`.
+/// Matches Java's RemoteCompletedFetch design - separate class for remote vs local
+/// Holds the prefetch permit until `drain()` takes it or this struct is dropped.
+pub struct RemoteCompletedFetch {
+    inner: DefaultCompletedFetch,
+    permit: Option<PrefetchPermit>,
+}
+
+impl RemoteCompletedFetch {
+    pub fn new(inner: DefaultCompletedFetch, permit: PrefetchPermit) -> Self {
+        Self {
+            inner,
+            permit: Some(permit),
+        }
+    }
+}
+
+impl CompletedFetch for RemoteCompletedFetch {
+    fn table_bucket(&self) -> &TableBucket {
+        self.inner.table_bucket()
+    }
+
+    fn api_error(&self) -> Option<&ApiError> {
+        self.inner.api_error()
+    }
+
+    fn fetch_error_context(&self) -> Option<&FetchErrorContext> {
+        self.inner.fetch_error_context()
+    }
+
+    fn take_error(&mut self) -> Option<Error> {
+        self.inner.take_error()
+    }
+
+    fn fetch_records(&mut self, max_records: usize) -> Result<Vec<ScanRecord>> {
+        self.inner.fetch_records(max_records)
+    }
+
+    fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<RecordBatch>> {
+        self.inner.fetch_batches(max_batches)
+    }
+
+    fn is_consumed(&self) -> bool {
+        self.inner.is_consumed()
+    }
+
+    fn records_read(&self) -> usize {
+        self.inner.records_read()
+    }
+
+    fn drain(&mut self) {
+        self.inner.drain();
+        // Release permit immediately (don't wait for struct drop)
+        // Critical: allows prefetch to continue even if Box<dyn CompletedFetch> kept around
+        self.permit.take(); // drops permit here, triggers recycle notification
+    }
+
+    fn size_in_bytes(&self) -> usize {
+        self.inner.size_in_bytes()
+    }
+
+    fn high_watermark(&self) -> i64 {
+        self.inner.high_watermark()
+    }
+
+    fn is_initialized(&self) -> bool {
+        self.inner.is_initialized()
+    }
+
+    fn set_initialized(&mut self) {
+        self.inner.set_initialized()
+    }
+
+    fn next_fetch_offset(&self) -> i64 {
+        self.inner.next_fetch_offset()
+    }
+}
+// Permit released explicitly in drain() or automatically when struct drops
+
+/// Pending fetch that waits for remote log file to be downloaded
+pub struct RemotePendingFetch {
+    segment: RemoteLogSegment,
+    download_future: RemoteLogDownloadFuture,
+    pos_in_log_segment: i32,
+    fetch_offset: i64,
+    high_watermark: i64,
+    read_context: ReadContext,
+}
+
+impl RemotePendingFetch {
+    pub fn new(
+        segment: RemoteLogSegment,
+        download_future: RemoteLogDownloadFuture,
+        pos_in_log_segment: i32,
+        fetch_offset: i64,
+        high_watermark: i64,
+        read_context: ReadContext,
+    ) -> Self {
+        Self {
+            segment,
+            download_future,
+            pos_in_log_segment,
+            fetch_offset,
+            high_watermark,
+            read_context,
+        }
+    }
+}
+
+impl PendingFetch for RemotePendingFetch {
+    fn table_bucket(&self) -> &TableBucket {
+        &self.segment.table_bucket
+    }
+
+    fn is_completed(&self) -> bool {
+        self.download_future.is_done()
+    }
+
+    fn to_completed_fetch(self: Box<Self>) -> Result<Box<dyn CompletedFetch>> {
+        // Take the RemoteLogFile and destructure
+        let remote_log_file = self.download_future.take_remote_log_file()?;
+        let RemoteLogFile {
+            file_path,
+            file_size: _,
+            permit,
+        } = remote_log_file;
+
+        // Open file for streaming (no memory allocation for entire file)
+        let file = std::fs::File::open(&file_path)?;
+        let file_size = file.metadata()?.len() as usize;
+
+        // Create file-backed LogRecordsBatches with cleanup (streaming!)
+        // Data will be read batch-by-batch on-demand, not all at once
+        // FileSource will delete the file when dropped (after file is closed)
+        let log_record_batch =
+            LogRecordsBatches::from_file(file, self.pos_in_log_segment as usize, file_path)?;
+
+        // Calculate size based on position offset
+        let size_in_bytes = if self.pos_in_log_segment > 0 {
+            let pos = self.pos_in_log_segment as usize;
+            if pos >= file_size {
+                return Err(Error::UnexpectedError {
+                    message: format!("Position {} exceeds file size {}", pos, file_size),
+                    source: None,
+                });
+            }
+            file_size - pos
+        } else {
+            file_size
+        };
+
+        // Create DefaultCompletedFetch
+        let inner_fetch = DefaultCompletedFetch::new(
+            self.segment.table_bucket.clone(),
+            log_record_batch,
+            size_in_bytes,
+            self.read_context,
+            self.fetch_offset,
+            self.high_watermark,
+        );
+
+        // Wrap it with RemoteCompletedFetch to hold the permit
+        // Permit manages the prefetch slot (releases semaphore and notifies coordinator) when dropped;
+        // file deletion is handled by FileCleanupGuard in the file-backed source created via from_file
+        Ok(Box::new(RemoteCompletedFetch::new(inner_fetch, permit)))
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -655,7 +833,6 @@ mod tests {
     use crate::record::{MemoryLogRecordsArrowBuilder, ReadContext, to_arrow_schema};
     use crate::row::GenericRow;
     use std::sync::Arc;
-    use std::time::Duration;
 
     fn test_read_context() -> Result<ReadContext> {
         let row_type = RowType::new(vec![DataField::new(
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 2bfa054105..2dc56d52d2 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -36,6 +36,9 @@ mod writer;
 use crate::client::table::upsert::TableUpsert;
 pub use append::{AppendWriter, TableAppend};
 pub use lookup::{LookupResult, Lookuper, TableLookup};
+pub use remote_log::{
+    DEFAULT_SCANNER_REMOTE_LOG_DOWNLOAD_THREADS, DEFAULT_SCANNER_REMOTE_LOG_PREFETCH_NUM,
+};
 pub use scanner::{LogScanner, RecordBatchLogScanner, TableScan};
 pub use writer::{TableWriter, UpsertWriter};
 
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index 0142515783..c39056db11 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -14,21 +14,84 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
-use crate::client::table::log_fetch_buffer::{CompletedFetch, DefaultCompletedFetch, PendingFetch};
 use crate::error::{Error, Result};
 use crate::io::{FileIO, Storage};
 use crate::metadata::TableBucket;
 use crate::proto::{PbRemoteLogFetchInfo, PbRemoteLogSegment};
-use crate::record::{LogRecordsBatches, ReadContext};
-use crate::util::delete_file;
 use parking_lot::{Mutex, RwLock};
-use std::collections::HashMap;
-use std::io;
-use std::path::{Path, PathBuf};
-use std::sync::Arc;
+use std::{
+    cmp::{Ordering, Reverse, min},
+    collections::{BinaryHeap, HashMap},
+    future::Future,
+    io, mem,
+    path::{Path, PathBuf},
+    pin::Pin,
+    sync::Arc,
+    time::Duration,
+};
+
+#[cfg(test)]
+use std::{
+    env,
+    time::{SystemTime, UNIX_EPOCH},
+};
 use tempfile::TempDir;
 use tokio::io::AsyncWriteExt;
-use tokio::sync::oneshot;
+use tokio::sync::{Notify, OwnedSemaphorePermit, Semaphore, mpsc, oneshot};
+use tokio::task::JoinSet;
+
+/// Default maximum number of remote log segments to prefetch
+/// Matches Java's CLIENT_SCANNER_REMOTE_LOG_PREFETCH_NUM (default: 4)
+pub const DEFAULT_SCANNER_REMOTE_LOG_PREFETCH_NUM: usize = 4;
+
+/// Default maximum concurrent remote log downloads
+/// Matches Java's REMOTE_FILE_DOWNLOAD_THREAD_NUM (default: 3)
+pub const DEFAULT_SCANNER_REMOTE_LOG_DOWNLOAD_THREADS: usize = 3;
+
+/// Initial retry backoff delay (milliseconds)
+/// Prevents hot-spin retry loops on persistent failures
+const RETRY_BACKOFF_BASE_MS: u64 = 100;
+
+/// Maximum retry backoff delay (milliseconds)
+/// Caps exponential backoff to avoid excessive delays
+const RETRY_BACKOFF_MAX_MS: u64 = 5_000;
+
+/// Maximum number of retries before giving up
+/// After this many retries, the download will fail permanently
+const MAX_RETRY_COUNT: u32 = 10;
+
+/// Computes the delay before retry number `retry_count`: exponential growth from
+/// `RETRY_BACKOFF_BASE_MS`, clamped to `RETRY_BACKOFF_MAX_MS`, then scaled by random jitter.
+fn calculate_backoff_delay(retry_count: u32) -> tokio::time::Duration {
+    use rand::Rng;
+
+    // The shift amount is clamped to 10 so `1 << n` can never overflow.
+    let multiplier = 1u64 << retry_count.min(10);
+    // base * 2^retry_count, saturating, then clamped to the configured ceiling.
+    let bounded_ms = RETRY_BACKOFF_BASE_MS
+        .saturating_mul(multiplier)
+        .min(RETRY_BACKOFF_MAX_MS);
+
+    // Scale by a random factor in [0.75, 1.25] so concurrent retries do not fire in lockstep.
+    let factor = rand::rng().random_range(0.75..=1.25);
+    let jittered_ms = ((bounded_ms as f64) * factor) as u64;
+    tokio::time::Duration::from_millis(jittered_ms)
+}
+
+/// Result of a fetch operation containing file path and size
+#[derive(Debug)]
+pub struct FetchResult {
+    pub file_path: PathBuf,
+    pub file_size: usize,
+}
+
+/// Trait for fetching remote log segments (allows dependency injection for testing)
+pub trait RemoteLogFetcher: Send + Sync {
+    fn fetch(
+        &self,
+        request: &RemoteLogDownloadRequest,
+    ) -> Pin<Box<dyn Future<Output = Result<FetchResult>> + Send>>;
+}
 
 /// Represents a remote log segment that needs to be downloaded
 #[derive(Debug, Clone)]
@@ -40,6 +103,7 @@ pub struct RemoteLogSegment {
     #[allow(dead_code)]
     pub size_in_bytes: i32,
     pub table_bucket: TableBucket,
+    pub max_timestamp: i64,
 }
 
 impl RemoteLogSegment {
@@ -50,6 +114,9 @@ impl RemoteLogSegment {
             end_offset: segment.remote_log_end_offset,
             size_in_bytes: segment.segment_size_in_bytes,
             table_bucket,
+            // Match Java's behavior: use -1 for missing timestamp
+            // (Java: CommonRpcMessageUtils.java:171-174)
+            max_timestamp: segment.max_timestamp.unwrap_or(-1),
         }
     }
 
@@ -88,17 +155,473 @@ impl RemoteLogFetchInfo {
     }
 }
 
+/// RAII guard for prefetch permit that notifies coordinator on drop
+///
+/// NOTE: File deletion is now handled by FileSource::drop(), not here.
+/// This ensures the file is closed before deletion
+#[derive(Debug)]
+pub struct PrefetchPermit {
+    permit: Option<OwnedSemaphorePermit>,
+    recycle_notify: Arc<Notify>,
+}
+
+impl PrefetchPermit {
+    fn new(permit: OwnedSemaphorePermit, recycle_notify: Arc<Notify>) -> Self {
+        Self {
+            permit: Some(permit),
+            recycle_notify,
+        }
+    }
+}
+
+impl Drop for PrefetchPermit {
+    /// Returns the semaphore slot first, then signals `recycle_notify`.
+    fn drop(&mut self) {
+        // Order matters: the slot has to be free again before anything is woken up,
+        // otherwise the woken task could still find the semaphore exhausted.
+        drop(self.permit.take());
+        self.recycle_notify.notify_one();
+    }
+}
+
+/// Downloaded remote log file with prefetch permit
+/// File remains on disk for memory efficiency; file deletion is handled by FileCleanupGuard in FileSource
+#[derive(Debug)]
+pub struct RemoteLogFile {
+    /// Path to the downloaded file on local disk
+    pub file_path: PathBuf,
+    /// Size of the file in bytes
+    /// Currently unused but kept for potential future use (logging, metrics, etc.)
+    #[allow(dead_code)]
+    pub file_size: usize,
+    /// RAII permit that releases prefetch semaphore slot and notifies coordinator when dropped
+    pub permit: PrefetchPermit,
+}
+
+/// Represents a request to download a remote log segment with priority ordering
+#[derive(Debug)]
+pub struct RemoteLogDownloadRequest {
+    segment: RemoteLogSegment,
+    remote_log_tablet_dir: String,
+    result_sender: oneshot::Sender<Result<RemoteLogFile>>,
+    retry_count: u32,
+    next_retry_at: Option<tokio::time::Instant>,
+}
+
+impl RemoteLogDownloadRequest {
+    /// Get the segment (used by test fetcher implementations)
+    #[cfg(test)]
+    pub fn segment(&self) -> &RemoteLogSegment {
+        &self.segment
+    }
+}
+
+// Priority order for the download queue. The queue is a `BinaryHeap<Reverse<_>>`, so the
+// request that compares smallest here is popped first. `PartialEq` below is derived from
+// `cmp`, which is why every branch ends in tie-breakers down to `segment_id`.
+// NOTE(review): two different criteria are mixed (offset vs. timestamp); this is only a
+// consistent order if timestamps grow with offsets inside a bucket - confirm.
+impl Ord for RemoteLogDownloadRequest {
+    /// Compares two requests by download priority (smaller = downloaded earlier).
+    fn cmp(&self, other: &Self) -> Ordering {
+        let (lhs, rhs) = (&self.segment, &other.segment);
+
+        // Same bucket: the lower start_offset sorts first, segment_id breaks ties.
+        if lhs.table_bucket == rhs.table_bucket {
+            return lhs
+                .start_offset
+                .cmp(&rhs.start_offset)
+                .then_with(|| lhs.segment_id.cmp(&rhs.segment_id));
+        }
+
+        // Different buckets: the lower max_timestamp sorts first; table id, partition id,
+        // bucket id and finally segment_id break ties. Tuples compare field by field.
+        let lhs_key = (
+            lhs.max_timestamp,
+            lhs.table_bucket.table_id(),
+            lhs.table_bucket.partition_id(),
+            lhs.table_bucket.bucket_id(),
+        );
+        let rhs_key = (
+            rhs.max_timestamp,
+            rhs.table_bucket.table_id(),
+            rhs.table_bucket.partition_id(),
+            rhs.table_bucket.bucket_id(),
+        );
+
+        // Lexicographic comparison of the keys, then segment_id as the last resort.
+        lhs_key
+            .cmp(&rhs_key)
+            .then_with(|| lhs.segment_id.cmp(&rhs.segment_id))
+    }
+}
+
+impl PartialOrd for RemoteLogDownloadRequest {
+    fn partial_cmp(&self, other: &Self) -> Option<Ordering> {
+        Some(self.cmp(other))
+    }
+}
+
+impl PartialEq for RemoteLogDownloadRequest {
+    fn eq(&self, other: &Self) -> bool {
+        self.cmp(other) == Ordering::Equal
+    }
+}
+
+impl Eq for RemoteLogDownloadRequest {}
+
+/// Result of a download task
+enum DownloadResult {
+    /// Successful download - deliver result to future
+    Success {
+        result: RemoteLogFile,
+        result_sender: oneshot::Sender<Result<RemoteLogFile>>,
+    },
+    /// Download failed - re-queue request for retry (Java pattern)
+    FailedRetry { request: RemoteLogDownloadRequest },
+    /// Download failed permanently after max retries - fail the future
+    FailedPermanently {
+        error: Error,
+        result_sender: oneshot::Sender<Result<RemoteLogFile>>,
+    },
+    /// Cancelled - don't deliver, don't re-queue
+    Cancelled,
+}
+
+/// Production implementation of RemoteLogFetcher that downloads from actual storage
+struct ProductionFetcher {
+    remote_fs_props: Arc<RwLock<HashMap<String, String>>>,
+    local_log_dir: Arc<TempDir>,
+}
+
+impl RemoteLogFetcher for ProductionFetcher {
+    /// Downloads the requested segment into the local log directory and reports the
+    /// resulting path and size. Everything the future needs is cloned up front so the
+    /// returned future does not borrow from `self` or `request`.
+    fn fetch(
+        &self,
+        request: &RemoteLogDownloadRequest,
+    ) -> Pin<Box<dyn Future<Output = Result<FetchResult>> + Send>> {
+        let segment = request.segment.clone();
+        let tablet_dir = request.remote_log_tablet_dir.clone();
+        let fs_props = Arc::clone(&self.remote_fs_props);
+        let log_dir = Arc::clone(&self.local_log_dir);
+
+        Box::pin(async move {
+            // Remote layout:
+            // <tablet dir>/<segment id>/<start offset, zero-padded to 20 digits>.log
+            let offset_prefix = format!("{:020}", segment.start_offset);
+            let remote_path = format!(
+                "{}/{}/{}.log",
+                tablet_dir, segment.segment_id, offset_prefix
+            );
+            let local_path = log_dir.path().join(&segment.local_file_name());
+
+            // Snapshot the properties; the lock guard is released at the end of this statement.
+            let props_snapshot = fs_props.read().clone();
+
+            // Stream the remote object to local disk.
+            let file_path = RemoteLogDownloader::download_file(
+                &tablet_dir,
+                &remote_path,
+                &local_path,
+                &props_snapshot,
+            )
+            .await?;
+
+            // The size is read back from the file that was actually written.
+            let file_size = tokio::fs::metadata(&file_path).await?.len() as usize;
+
+            // The file is left on disk; nothing in this function removes it.
+            Ok(FetchResult {
+                file_path,
+                file_size,
+            })
+        })
+    }
+}
+
+/// Coordinator that owns all download state and orchestrates downloads
+struct DownloadCoordinator {
+    download_queue: BinaryHeap<Reverse<RemoteLogDownloadRequest>>,
+    active_downloads: JoinSet<DownloadResult>,
+    in_flight: usize,
+    prefetch_semaphore: Arc<Semaphore>,
+    max_concurrent_downloads: usize,
+    recycle_notify: Arc<Notify>,
+    fetcher: Arc<dyn RemoteLogFetcher>,
+}
+
+impl DownloadCoordinator {
+    /// Whether the loop should listen for a recycled prefetch permit: true only when
+    /// requests are queued, a download slot is free, and the semaphore is exhausted.
+    fn should_wait_for_recycle(&self) -> bool {
+        let has_pending = !self.download_queue.is_empty();
+        let slot_free = self.in_flight < self.max_concurrent_downloads;
+        let out_of_permits = self.prefetch_semaphore.available_permits() == 0;
+        has_pending && slot_free && out_of_permits
+    }
+
+    /// Earliest `next_retry_at` over all queued requests, or `None` if no queued
+    /// request carries a retry deadline.
+    fn next_retry_deadline(&self) -> Option<tokio::time::Instant> {
+        let deadlines = self.download_queue.iter().filter_map(|entry| entry.0.next_retry_at);
+        deadlines.min()
+    }
+}
+
+impl DownloadCoordinator {
+    /// Starts queued downloads until a limit is hit. Called by the coordinator loop
+    /// at the top of every iteration.
+    ///
+    /// The loop stops when the queue is empty, `max_concurrent_downloads` tasks are
+    /// in flight, no prefetch permit can be acquired, or the scan budget is used up.
+    fn drain(&mut self) {
+        // Requests still inside their backoff window; re-queued once the scan is over
+        // so that a single pass never pops the same request twice.
+        let mut not_yet_due = Vec::new();
+        // At most one pass over the queue as it is right now, and never more than
+        // 100 entries, so a request in backoff at the head cannot stall the others.
+        let scan_budget = self.download_queue.len().min(100);
+        let mut popped = 0;
+
+        while popped < scan_budget
+            && self.in_flight < self.max_concurrent_downloads
+            && !self.download_queue.is_empty()
+        {
+            // Reserve a prefetch slot without blocking; none left means nothing can start.
+            let Ok(permit) = self.prefetch_semaphore.clone().try_acquire_owned() else {
+                break;
+            };
+
+            // Take the highest-priority request (smallest under `Ord`, via `Reverse`).
+            let request = match self.download_queue.pop() {
+                Some(Reverse(request)) => request,
+                None => {
+                    drop(permit);
+                    break;
+                }
+            };
+            popped += 1;
+
+            // Backoff: a retry whose time has not come gives its slot back and is set aside.
+            let in_backoff = request
+                .next_retry_at
+                .is_some_and(|retry_at| retry_at > tokio::time::Instant::now());
+            if in_backoff {
+                drop(permit);
+                not_yet_due.push(request);
+                continue;
+            }
+
+            // Cancellation: nobody is waiting for the result any more, so discard it.
+            if request.result_sender.is_closed() {
+                drop(permit);
+                continue;
+            }
+
+            // Hand the request and its permit to a task tracked in `active_downloads`.
+            let fetcher = Arc::clone(&self.fetcher);
+            let recycle_notify = Arc::clone(&self.recycle_notify);
+            self.active_downloads
+                .spawn(spawn_download_task(request, permit, fetcher, recycle_notify));
+            self.in_flight += 1;
+        }
+
+        // Put the set-aside requests back; the heap restores their priority order.
+        for request in not_yet_due {
+            self.download_queue.push(Reverse(request));
+        }
+    }
+}
+
+/// Body of one download task: performs a single fetch attempt and reports the outcome.
+/// Matches Java's RemoteLogDownloader.java
+///
+/// Retries are not performed here. A failed attempt releases its prefetch permit and is
+/// returned as `FailedRetry` (with `retry_count` and `next_retry_at` updated) so the
+/// coordinator can re-queue it, or as `FailedPermanently` once `MAX_RETRY_COUNT` is
+/// exceeded. If the receiver is already gone the attempt is reported as `Cancelled`.
+async fn spawn_download_task(
+    request: RemoteLogDownloadRequest,
+    permit: tokio::sync::OwnedSemaphorePermit,
+    fetcher: Arc<dyn RemoteLogFetcher>,
+    recycle_notify: Arc<Notify>,
+) -> DownloadResult {
+    // Check if receiver still alive (early cancellation check)
+    if request.result_sender.is_closed() {
+        drop(permit);
+        return DownloadResult::Cancelled;
+    }
+
+    // Try download ONCE
+    let download_result = fetcher.fetch(&request).await;
+
+    match download_result {
+        Ok(fetch_result) => {
+            // Success - the permit travels with the file and is released when it is dropped
+            DownloadResult::Success {
+                result: RemoteLogFile {
+                    file_path: fetch_result.file_path,
+                    file_size: fetch_result.file_size,
+                    permit: PrefetchPermit::new(permit, recycle_notify),
+                },
+                result_sender: request.result_sender,
+            }
+        }
+        Err(_) if request.result_sender.is_closed() => {
+            // Receiver dropped (cancelled) - release permit, don't re-queue
+            drop(permit);
+            DownloadResult::Cancelled
+        }
+        Err(e) => {
+            // Download failed - check if we should retry or give up
+            let retry_count = request.retry_count + 1;
+
+            if retry_count > MAX_RETRY_COUNT {
+                // Too many retries - give up and fail the future
+                log::error!(
+                    "Failed to download remote log segment {} after {} retries: {}. Giving up.",
+                    request.segment.segment_id,
+                    retry_count,
+                    e
+                );
+                drop(permit); // Release immediately
+
+                DownloadResult::FailedPermanently {
+                    error: Error::UnexpectedError {
+                        message: format!(
+                            "Failed to download remote log segment after {} retries: {}",
+                            retry_count, e
+                        ),
+                        source: Some(Box::new(e)),
+                    },
+                    result_sender: request.result_sender,
+                }
+            } else {
+                // Retry with exponential backoff
+                let backoff_delay = calculate_backoff_delay(retry_count);
+                let next_retry_at = tokio::time::Instant::now() + backoff_delay;
+
+                log::warn!(
+                    "Failed to download remote log segment {}: {}. Retry {}/{} after {:?}",
+                    request.segment.segment_id,
+                    e,
+                    retry_count,
+                    MAX_RETRY_COUNT,
+                    backoff_delay
+                );
+                drop(permit); // Release immediately - critical!
+
+                // Update retry state
+                let mut retry_request = request;
+                retry_request.retry_count = retry_count;
+                retry_request.next_retry_at = Some(next_retry_at);
+
+                // Hand the request back to the coordinator for re-queueing.
+                // The result_sender stays with the request, so the caller's future is not completed yet.
+                DownloadResult::FailedRetry {
+                    request: retry_request,
+                }
+            }
+        }
+    }
+}
+
+/// Coordinator event loop - owns all download state and reacts to events
+async fn coordinator_loop(
+    mut coordinator: DownloadCoordinator,
+    mut request_receiver: mpsc::UnboundedReceiver<RemoteLogDownloadRequest>,
+) {
+    loop {
+        // Drain once at start of iteration to process ready work
+        coordinator.drain();
+
+        // Time until the earliest retry deadline among queued requests (zero if already due)
+        let next_retry_sleep = coordinator
+            .next_retry_deadline()
+            .map(|deadline| deadline.saturating_duration_since(tokio::time::Instant::now()));
+        // Arm the retry timer only while drain() could start a download. With every download
+        // slot or prefetch permit taken, an already-due retry would otherwise yield a zero
+        // sleep on each iteration and busy-spin; events 2 and 3 wake the loop in that state.
+        let has_capacity = coordinator.in_flight < coordinator.max_concurrent_downloads
+            && coordinator.prefetch_semaphore.available_permits() > 0;
+
+        tokio::select! {
+            // Event 1: NewRequest
+            Some(request) = request_receiver.recv() => {
+                coordinator.download_queue.push(Reverse(request));
+                // Immediately try to start this download
+                continue;
+            }
+
+            // Event 2: DownloadFinished
+            Some(result) = coordinator.active_downloads.join_next() => {
+                coordinator.in_flight -= 1;
+
+                match result {
+                    Ok(DownloadResult::Success { result, result_sender }) => {
+                        // Success - deliver result to future
+                        if !result_sender.is_closed() {
+                            let _ = result_sender.send(Ok(result));
+                        }
+                        // Permit held in RemoteLogFile until consumed
+                    }
+                    Ok(DownloadResult::FailedRetry { request }) => {
+                        // Re-queue immediately (don't block coordinator with sleep)
+                        // The retry time will be checked in drain() before processing
+                        // (Java line 177: segmentsToFetch.add(request))
+                        // Permit already released (Java line 174)
+                        coordinator.download_queue.push(Reverse(request));
+                    }
+                    Ok(DownloadResult::FailedPermanently { error, result_sender }) => {
+                        // Permanent failure - deliver error to future
+                        if !result_sender.is_closed() {
+                            let _ = result_sender.send(Err(error));
+                        }
+                        // Permit already released
+                    }
+                    Ok(DownloadResult::Cancelled) => {
+                        // Cancelled - permit already released, nothing to do
+                    }
+                    Err(e) => {
+                        log::error!("Download task panicked: {:?}", e);
+                        // Permit already released via RAII
+                    }
+                }
+                // Immediately try to start another download
+                continue;
+            }
+
+            // Event 3: Recycled (only wait when blocked on permits with pending work)
+            _ = coordinator.recycle_notify.notified(),
+                if coordinator.should_wait_for_recycle() => {
+                // Wake up to try draining
+                continue;
+            }
+
+            // Event 4: Retry timer - wake up when next retry is ready
+            _ = tokio::time::sleep(next_retry_sleep.unwrap_or(tokio::time::Duration::from_secs(3600))),
+                if next_retry_sleep.is_some() && has_capacity => {
+                // Wake up to retry deferred requests
+                continue;
+            }
+
+            else => break,  // All channels closed AND no work pending
+        }
+    }
+}
+
 type CompletionCallback = Box<dyn Fn() + Send + Sync>;
 
 /// Future for a remote log download request
 pub struct RemoteLogDownloadFuture {
-    result: Arc<Mutex<Option<Result<Vec<u8>>>>>,
+    result: Arc<Mutex<Option<Result<RemoteLogFile>>>>,
     completion_callbacks: Arc<Mutex<Vec<CompletionCallback>>>,
-    // todo: add recycleCallback
 }
 
 impl RemoteLogDownloadFuture {
-    pub fn new(receiver: oneshot::Receiver<Result<Vec<u8>>>) -> Self {
+    pub fn new(receiver: oneshot::Receiver<Result<RemoteLogFile>>) -> Self {
         let result = Arc::new(Mutex::new(None));
         let result_clone = Arc::clone(&result);
         let completion_callbacks: Arc<Mutex<Vec<CompletionCallback>>> =
@@ -123,7 +646,7 @@ impl RemoteLogDownloadFuture {
             // This also ensures that any callbacks registered after this point will be called immediately
             let callbacks: Vec<CompletionCallback> = {
                 let mut callbacks_guard = callbacks_clone.lock();
-                std::mem::take(&mut *callbacks_guard)
+                mem::take(&mut *callbacks_guard)
             };
             for callback in callbacks {
                 callback();
@@ -172,40 +695,90 @@ impl RemoteLogDownloadFuture {
         self.result.lock().is_some()
     }
 
-    /// Get the downloaded file path (synchronous, only works after is_done() returns true)
-    pub fn get_remote_log_bytes(&self) -> Result<Vec<u8>> {
-        // todo: handle download fail
-        let guard = self.result.lock();
-        match guard.as_ref() {
-            Some(Ok(path)) => Ok(path.clone()),
-            Some(Err(e)) => Err(Error::IoUnexpectedError {
-                message: format!("Fail to get remote log bytes: {e}"),
-                source: io::Error::other(format!("{e:?}")),
-            }),
+    /// Take the RemoteLogFile (including the permit) from this future
+    /// This should only be called when the download is complete
+    /// This is the correct way to consume the download - it transfers permit ownership
+    pub fn take_remote_log_file(&self) -> Result<RemoteLogFile> {
+        let mut guard = self.result.lock();
+        match guard.take() {
+            Some(Ok(remote_log_file)) => Ok(remote_log_file),
+            Some(Err(e)) => {
+                let error_msg = format!("{e}");
+                Err(Error::IoUnexpectedError {
+                    message: format!("Fail to get remote log file: {error_msg}"),
+                    source: io::Error::other(error_msg),
+                })
+            }
             None => Err(Error::IoUnexpectedError {
-                message: "Get remote log bytes not completed yet".to_string(),
-                source: io::Error::other("Get remote log bytes not completed yet"),
+                message: "Remote log file already taken or not ready".to_string(),
+                source: io::Error::other("Remote log file already taken or not ready"),
             }),
         }
     }
 }
 
-/// Downloader for remote log segment files
+/// Downloader for remote log segment files.
+///
+/// # Shutdown behavior
+///
+/// When the downloader is dropped, the request channel closes, signaling the coordinator
+/// to stop accepting new work. The coordinator will finish any in-flight downloads but
+/// won't wait for completion. Pending futures will fail.
 pub struct RemoteLogDownloader {
-    local_log_dir: TempDir,
-    remote_fs_props: RwLock<HashMap<String, String>>,
+    request_sender: Option<mpsc::UnboundedSender<RemoteLogDownloadRequest>>,
+    remote_fs_props: Option<Arc<RwLock<HashMap<String, String>>>>,
 }
 
 impl RemoteLogDownloader {
-    pub fn new(local_log_dir: TempDir) -> Result<Self> {
+    pub fn new(
+        local_log_dir: TempDir,
+        max_prefetch_segments: usize,
+        max_concurrent_downloads: usize,
+    ) -> Result<Self> {
+        let remote_fs_props = Arc::new(RwLock::new(HashMap::new()));
+        let fetcher = Arc::new(ProductionFetcher {
+            remote_fs_props: remote_fs_props.clone(),
+            local_log_dir: Arc::new(local_log_dir),
+        });
+
+        let mut downloader =
+            Self::new_with_fetcher(fetcher, max_prefetch_segments, max_concurrent_downloads)?;
+        downloader.remote_fs_props = Some(remote_fs_props);
+        Ok(downloader)
+    }
+
+    /// Create a RemoteLogDownloader with a custom fetcher (for testing).
+    /// The remote_fs_props will be None since custom fetchers typically don't need S3 credentials.
+    pub fn new_with_fetcher(
+        fetcher: Arc<dyn RemoteLogFetcher>,
+        max_prefetch_segments: usize,
+        max_concurrent_downloads: usize,
+    ) -> Result<Self> {
+        let (request_sender, request_receiver) = mpsc::unbounded_channel();
+
+        let coordinator = DownloadCoordinator {
+            download_queue: BinaryHeap::new(),
+            active_downloads: JoinSet::new(),
+            in_flight: 0,
+            prefetch_semaphore: Arc::new(Semaphore::new(max_prefetch_segments)),
+            max_concurrent_downloads,
+            recycle_notify: Arc::new(Notify::new()),
+            fetcher,
+        };
+
+        // Spawn coordinator task - it will exit when request_sender is dropped
+        tokio::spawn(coordinator_loop(coordinator, request_receiver));
+
         Ok(Self {
-            local_log_dir,
-            remote_fs_props: RwLock::new(HashMap::new()),
+            request_sender: Some(request_sender),
+            remote_fs_props: None,
         })
     }
 
     pub fn set_remote_fs_props(&self, props: HashMap<String, String>) {
-        *self.remote_fs_props.write() = props;
+        if let Some(ref remote_fs_props) = self.remote_fs_props {
+            *remote_fs_props.write() = props;
+        }
     }
 
     /// Request to fetch a remote log segment to local. This method is non-blocking.
@@ -214,49 +787,44 @@ impl RemoteLogDownloader {
         remote_log_tablet_dir: &str,
         segment: &RemoteLogSegment,
     ) -> RemoteLogDownloadFuture {
-        let (sender, receiver) = oneshot::channel();
-        let local_file_name = segment.local_file_name();
-        let local_file_path = self.local_log_dir.path().join(&local_file_name);
-        let remote_path = self.build_remote_path(remote_log_tablet_dir, segment);
-        let remote_log_tablet_dir = remote_log_tablet_dir.to_string();
-        let remote_fs_props = self.remote_fs_props.read().clone();
-        // Spawn async download & read task
-        tokio::spawn(async move {
-            let result = async {
-                let file_path = Self::download_file(
-                    &remote_log_tablet_dir,
-                    &remote_path,
-                    &local_file_path,
-                    &remote_fs_props,
-                )
-                .await?;
-                let bytes = tokio::fs::read(&file_path).await?;
-
-                // Delete the downloaded local file to free disk (async, but we'll do it in background)
-                let file_path_clone = file_path.clone();
-                tokio::spawn(async move {
-                    let _ = delete_file(file_path_clone).await;
-                });
-
-                Ok(bytes)
+        let (result_sender, result_receiver) = oneshot::channel();
+
+        let request = RemoteLogDownloadRequest {
+            segment: segment.clone(),
+            remote_log_tablet_dir: remote_log_tablet_dir.to_string(),
+            result_sender,
+            retry_count: 0,
+            next_retry_at: None,
+        };
+
+        // Send to coordinator (non-blocking)
+        if let Some(ref sender) = self.request_sender {
+            if sender.send(request).is_err() {
+                // Coordinator is gone - immediately fail the future
+                let (error_sender, error_receiver) = oneshot::channel();
+                let _ = error_sender.send(Err(Error::UnexpectedError {
+                    message: "RemoteLogDownloader coordinator has shut down".to_string(),
+                    source: None,
+                }));
+                return RemoteLogDownloadFuture::new(error_receiver);
             }
-            .await;
+        }
 
-            let _ = sender.send(result);
-        });
-        RemoteLogDownloadFuture::new(receiver)
+        RemoteLogDownloadFuture::new(result_receiver)
     }
+}
 
-    /// Build the remote path for a log segment
-    fn build_remote_path(&self, remote_log_tablet_dir: &str, segment: &RemoteLogSegment) -> String {
-        // Format: ${remote_log_tablet_dir}/${segment_id}/${offset_prefix}.log
-        let offset_prefix = format!("{:020}", segment.start_offset);
-        format!(
-            "{}/{}/{}.log",
-            remote_log_tablet_dir, segment.segment_id, offset_prefix
-        )
+impl Drop for RemoteLogDownloader {
+    fn drop(&mut self) {
+        // Drop the request sender to signal coordinator shutdown.
+        // This causes request_receiver.recv() to return None, allowing the
+        // coordinator to exit gracefully after processing pending work.
+        // The coordinator task will finish on its own when it sees the channel closed.
+        drop(self.request_sender.take());
     }
+}
 
+impl RemoteLogDownloader {
     /// Download a file from remote storage to local using streaming read/write
     async fn download_file(
         remote_log_tablet_dir: &str,
@@ -293,7 +861,7 @@ impl RemoteLogDownloader {
         let (op, relative_path) = storage.create(remote_path)?;
 
         // Timeout for remote storage operations (30 seconds)
-        const REMOTE_OP_TIMEOUT: std::time::Duration = std::time::Duration::from_secs(30);
+        const REMOTE_OP_TIMEOUT: Duration = Duration::from_secs(30);
 
         // Get file metadata to know the size with timeout
         let meta = op.stat(relative_path).await?;
@@ -310,7 +878,7 @@ impl RemoteLogDownloader {
         let total_chunks = file_size.div_ceil(CHUNK_SIZE);
 
         while offset < file_size {
-            let end = std::cmp::min(offset + CHUNK_SIZE, file_size);
+            let end = min(offset + CHUNK_SIZE, file_size);
             let range = offset..end;
             chunk_count += 1;
 
@@ -347,70 +915,349 @@ impl RemoteLogDownloader {
     }
 }
 
-/// Pending fetch that waits for remote log file to be downloaded
-pub struct RemotePendingFetch {
-    segment: RemoteLogSegment,
-    download_future: RemoteLogDownloadFuture,
-    pos_in_log_segment: i32,
-    fetch_offset: i64,
-    high_watermark: i64,
-    read_context: ReadContext,
-}
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use std::sync::atomic::{AtomicUsize, Ordering};
 
-impl RemotePendingFetch {
-    pub fn new(
-        segment: RemoteLogSegment,
-        download_future: RemoteLogDownloadFuture,
-        pos_in_log_segment: i32,
-        fetch_offset: i64,
-        high_watermark: i64,
-        read_context: ReadContext,
-    ) -> Self {
-        Self {
+    /// Helper function to create a TableBucket for testing
+    fn create_table_bucket(table_id: i64, bucket_id: i32) -> TableBucket {
+        TableBucket::new(table_id, bucket_id)
+    }
+
+    /// Simplified fake fetcher for testing
+    struct FakeFetcher {
+        completion_gate: Arc<Notify>,
+        in_flight: Arc<AtomicUsize>,
+        max_seen_in_flight: Arc<AtomicUsize>,
+        fail_count: Arc<Mutex<usize>>,
+        auto_complete: bool,
+    }
+
+    impl FakeFetcher {
+        fn new(fail_count: usize, auto_complete: bool) -> Self {
+            Self {
+                completion_gate: Arc::new(Notify::new()),
+                in_flight: Arc::new(AtomicUsize::new(0)),
+                max_seen_in_flight: Arc::new(AtomicUsize::new(0)),
+                fail_count: Arc::new(Mutex::new(fail_count)),
+                auto_complete,
+            }
+        }
+
+        fn max_seen_in_flight(&self) -> usize {
+            self.max_seen_in_flight.load(Ordering::SeqCst)
+        }
+
+        fn in_flight(&self) -> usize {
+            self.in_flight.load(Ordering::SeqCst)
+        }
+
+        fn release_one(&self) {
+            self.completion_gate.notify_one();
+        }
+
+        fn release_all(&self) {
+            self.completion_gate.notify_waiters();
+        }
+    }
+
+    impl RemoteLogFetcher for FakeFetcher {
+        fn fetch(
+            &self,
+            request: &RemoteLogDownloadRequest,
+        ) -> Pin<Box<dyn Future<Output = Result<FetchResult>> + Send>> {
+            let gate = self.completion_gate.clone();
+            let in_flight = self.in_flight.clone();
+            let max_seen = self.max_seen_in_flight.clone();
+            let fail_count = self.fail_count.clone();
+            let segment_id = request.segment().segment_id.clone();
+            let auto_complete = self.auto_complete;
+
+            Box::pin(async move {
+                // Track in-flight
+                let current = in_flight.fetch_add(1, Ordering::SeqCst) + 1;
+                max_seen.fetch_max(current, Ordering::SeqCst);
+
+                // Wait for gate (or auto-complete)
+                if !auto_complete {
+                    gate.notified().await;
+                } else {
+                    tokio::task::yield_now().await;
+                }
+
+                // Check if should fail
+                let should_fail = {
+                    let mut count = fail_count.lock();
+                    if *count > 0 {
+                        *count -= 1;
+                        true
+                    } else {
+                        false
+                    }
+                };
+
+                in_flight.fetch_sub(1, Ordering::SeqCst);
+
+                if should_fail {
+                    Err(Error::UnexpectedError {
+                        message: format!("Fake fetch failed for {}", segment_id),
+                        source: None,
+                    })
+                } else {
+                    let fake_data = vec![1, 2, 3, 4];
+                    let temp_dir = env::temp_dir();
+                    let timestamp = SystemTime::now()
+                        .duration_since(UNIX_EPOCH)
+                        .unwrap()
+                        .as_nanos();
+                    let file_path =
+                        temp_dir.join(format!("fake_segment_{}_{}.log", segment_id, timestamp));
+                    tokio::fs::write(&file_path, &fake_data).await?;
+
+                    Ok(FetchResult {
+                        file_path,
+                        file_size: fake_data.len(),
+                    })
+                }
+            })
+        }
+    }
+
+    /// Helper function to create a RemoteLogSegment for testing
+    fn create_segment(
+        segment_id: &str,
+        start_offset: i64,
+        max_timestamp: i64,
+        table_bucket: TableBucket,
+    ) -> RemoteLogSegment {
+        RemoteLogSegment {
+            segment_id: segment_id.to_string(),
+            start_offset,
+            end_offset: start_offset + 1000,
+            size_in_bytes: 1024,
+            table_bucket,
+            max_timestamp,
+        }
+    }
+
+    /// Helper function to create a RemoteLogDownloadRequest for testing
+    fn create_request(segment: RemoteLogSegment) -> RemoteLogDownloadRequest {
+        let (result_sender, _) = oneshot::channel();
+        RemoteLogDownloadRequest {
+            remote_log_tablet_dir: "test_dir".to_string(),
             segment,
-            download_future,
-            pos_in_log_segment,
-            fetch_offset,
-            high_watermark,
-            read_context,
+            result_sender,
+            retry_count: 0,
+            next_retry_at: None,
         }
     }
-}
 
-impl PendingFetch for RemotePendingFetch {
-    fn table_bucket(&self) -> &TableBucket {
-        &self.segment.table_bucket
+    #[test]
+    fn test_priority_ordering_matching_java_test_case() {
+        // Test priority ordering: timestamp across buckets, offset within bucket
+        // Does NOT test tie-breakers (segment_id) - those are implementation details
+
+        let bucket1 = create_table_bucket(1, 0);
+        let bucket2 = create_table_bucket(1, 1);
+        let bucket3 = create_table_bucket(1, 2);
+        let bucket4 = create_table_bucket(1, 3);
+
+        // Create segments with distinct timestamps/offsets (no ties)
+        let seg_negative = create_segment("seg_neg", 0, -1, bucket1.clone());
+        let seg_zero = create_segment("seg_zero", 0, 0, bucket2.clone());
+        let seg_1000 = create_segment("seg_1000", 0, 1000, bucket3.clone());
+        let seg_2000 = create_segment("seg_2000", 0, 2000, bucket4.clone());
+        let seg_same_bucket_100 = create_segment("seg_sb_100", 100, 5000, bucket1.clone());
+        let seg_same_bucket_50 = create_segment("seg_sb_50", 50, 5000, bucket1.clone());
+
+        let mut heap = BinaryHeap::new();
+        heap.push(Reverse(create_request(seg_2000)));
+        heap.push(Reverse(create_request(seg_same_bucket_100)));
+        heap.push(Reverse(create_request(seg_1000)));
+        heap.push(Reverse(create_request(seg_zero)));
+        heap.push(Reverse(create_request(seg_negative)));
+        heap.push(Reverse(create_request(seg_same_bucket_50)));
+
+        // Verify ordering by timestamp/offset, not segment_id
+        let first = heap.pop().unwrap().0;
+        assert_eq!(first.segment.max_timestamp, -1, "Lowest timestamp first");
+
+        let second = heap.pop().unwrap().0;
+        assert_eq!(second.segment.max_timestamp, 0);
+
+        let third = heap.pop().unwrap().0;
+        assert_eq!(third.segment.max_timestamp, 1000);
+
+        let fourth = heap.pop().unwrap().0;
+        assert_eq!(fourth.segment.max_timestamp, 2000);
+
+        // Last two are same bucket (ts=5000), ordered by offset
+        let fifth = heap.pop().unwrap().0;
+        assert_eq!(fifth.segment.max_timestamp, 5000);
+        assert_eq!(
+            fifth.segment.start_offset, 50,
+            "Lower offset first within bucket"
+        );
+
+        let sixth = heap.pop().unwrap().0;
+        assert_eq!(sixth.segment.max_timestamp, 5000);
+        assert_eq!(sixth.segment.start_offset, 100);
     }
 
-    fn is_completed(&self) -> bool {
-        self.download_future.is_done()
+    #[tokio::test]
+    async fn test_concurrency_and_priority() {
+        // Test concurrency limiting: at most 2 fetches in flight (priority order is not asserted)
+        let fake_fetcher = Arc::new(FakeFetcher::new(0, false)); // Manual control
+
+        let downloader = RemoteLogDownloader::new_with_fetcher(
+            fake_fetcher.clone(),
+            10, // High prefetch limit
+            2,  // Max concurrent downloads = 2
+        )
+        .unwrap();
+
+        let bucket = create_table_bucket(1, 0);
+
+        // Request 4 segments with same priority (to isolate concurrency limiting from priority)
+        let segs: Vec<_> = (0..4)
+            .map(|i| create_segment(&format!("seg{}", i), i * 100, 1000, bucket.clone()))
+            .collect();
+
+        let _futures: Vec<_> = segs
+            .iter()
+            .map(|seg| downloader.request_remote_log("dir", seg))
+            .collect();
+
+        // Wait for exactly 2 to start
+        tokio::time::sleep(Duration::from_millis(50)).await;
+        assert_eq!(
+            fake_fetcher.in_flight(),
+            2,
+            "Concurrency limit: exactly 2 should be in-flight"
+        );
+
+        // Release one
+        fake_fetcher.release_one();
+        tokio::time::sleep(Duration::from_millis(50)).await;
+
+        // Max should never exceed 2
+        assert_eq!(
+            fake_fetcher.max_seen_in_flight(),
+            2,
+            "Max concurrent should not exceed 2"
+        );
+
+        // Release all
+        fake_fetcher.release_all();
     }
 
-    fn to_completed_fetch(self: Box<Self>) -> Result<Box<dyn CompletedFetch>> {
-        // Get the file path (this should only be called when is_completed() returns true)
-        let mut data = self.download_future.get_remote_log_bytes()?;
+    #[tokio::test]
+    async fn test_prefetch_limit() {
+        // Test that prefetch semaphore limits outstanding downloads
+        let fake_fetcher = Arc::new(FakeFetcher::new(0, true)); // Auto-complete
 
-        // Slice the data if needed
-        let data = if self.pos_in_log_segment > 0 {
-            data.split_off(self.pos_in_log_segment as usize)
-        } else {
-            data
-        };
+        let downloader = RemoteLogDownloader::new_with_fetcher(
+            fake_fetcher,
+            2,  // Max prefetch = 2
+            10, // High concurrent limit
+        )
+        .unwrap();
+
+        let bucket = create_table_bucket(1, 0);
 
-        let size_in_bytes = data.len();
+        // Request 4 downloads
+        let segs: Vec<_> = (0..4)
+            .map(|i| create_segment(&format!("seg{}", i), i * 100, 1000, bucket.clone()))
+            .collect();
 
-        let log_record_batch = LogRecordsBatches::new(data);
+        let mut futures: Vec<_> = segs
+            .iter()
+            .map(|seg| downloader.request_remote_log("dir", seg))
+            .collect();
 
-        // Create DefaultCompletedFetch from the data
-        let completed_fetch = DefaultCompletedFetch::new(
-            self.segment.table_bucket,
-            log_record_batch,
-            size_in_bytes,
-            self.read_context,
-            self.fetch_offset,
-            self.high_watermark,
+        // Wait for first 2 to complete
+        let deadline = tokio::time::Instant::now() + Duration::from_secs(2);
+        loop {
+            if futures.iter().filter(|f| f.is_done()).count() >= 2 {
+                break;
+            }
+            if tokio::time::Instant::now() > deadline {
+                panic!("Timeout waiting for first 2 downloads");
+            }
+            tokio::time::sleep(Duration::from_millis(10)).await;
+        }
+
+        // Verify 3rd and 4th are blocked (prefetch limit)
+        tokio::time::sleep(Duration::from_millis(50)).await;
+        assert_eq!(
+            futures.iter().filter(|f| f.is_done()).count(),
+            2,
+            "Prefetch limit: only 2 should complete"
         );
 
-        Ok(Box::new(completed_fetch))
+        // Drop first 2 (releases permits)
+        let f4 = futures.pop().unwrap();
+        let f3 = futures.pop().unwrap();
+        drop(futures);
+
+        // 3rd and 4th should now complete
+        let deadline = tokio::time::Instant::now() + Duration::from_secs(2);
+        loop {
+            if f3.is_done() && f4.is_done() {
+                break;
+            }
+            if tokio::time::Instant::now() > deadline {
+                panic!("Timeout after permit release");
+            }
+            tokio::time::sleep(Duration::from_millis(10)).await;
+        }
+    }
+
+    #[tokio::test]
+    async fn test_retry_and_cancellation() {
+        // Test retry with exponential backoff
+        let fake_fetcher = Arc::new(FakeFetcher::new(2, true)); // Fail twice, succeed third time
+
+        let downloader =
+            RemoteLogDownloader::new_with_fetcher(fake_fetcher.clone(), 10, 1).unwrap();
+
+        let bucket = create_table_bucket(1, 0);
+        let seg = create_segment("seg1", 0, 1000, bucket);
+
+        let future = downloader.request_remote_log("dir", &seg);
+
+        // Should succeed after retries
+        let deadline = tokio::time::Instant::now() + Duration::from_secs(5);
+        loop {
+            if future.is_done() {
+                break;
+            }
+            if tokio::time::Instant::now() > deadline {
+                panic!("Timeout waiting for retry to succeed");
+            }
+            tokio::time::sleep(Duration::from_millis(50)).await;
+        }
+
+        assert!(future.is_done(), "Should succeed after retries");
+
+        // Test cancellation
+        let seg2 = create_segment("seg2", 100, 1000, create_table_bucket(1, 0));
+        let fake_fetcher2 = Arc::new(FakeFetcher::new(100, true)); // Fail the first 100 attempts
+        let downloader2 =
+            RemoteLogDownloader::new_with_fetcher(fake_fetcher2.clone(), 10, 1).unwrap();
+
+        let future2 = downloader2.request_remote_log("dir", &seg2);
+        tokio::time::sleep(Duration::from_millis(50)).await;
+
+        // Drop to cancel
+        drop(future2);
+        tokio::time::sleep(Duration::from_millis(50)).await;
+
+        assert_eq!(
+            fake_fetcher2.in_flight(),
+            0,
+            "Cancellation should release resources"
+        );
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index afa44f350b..8712650e6a 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -19,10 +19,12 @@ use arrow::array::RecordBatch;
 use arrow_schema::SchemaRef;
 use log::{debug, warn};
 use parking_lot::{Mutex, RwLock};
-use std::collections::{HashMap, HashSet};
-use std::slice::from_ref;
-use std::sync::Arc;
-use std::time::Duration;
+use std::{
+    collections::{HashMap, HashSet},
+    slice::from_ref,
+    sync::Arc,
+    time::{Duration, Instant},
+};
 use tempfile::TempDir;
 
 use crate::client::connection::FlussConnection;
@@ -30,11 +32,9 @@ use crate::client::credentials::CredentialsCache;
 use crate::client::metadata::Metadata;
 use crate::client::table::log_fetch_buffer::{
     CompletedFetch, DefaultCompletedFetch, FetchErrorAction, FetchErrorContext, FetchErrorLogLevel,
-    LogFetchBuffer,
-};
-use crate::client::table::remote_log::{
-    RemoteLogDownloader, RemoteLogFetchInfo, RemotePendingFetch,
+    LogFetchBuffer, RemotePendingFetch,
 };
+use crate::client::table::remote_log::{RemoteLogDownloader, RemoteLogFetchInfo};
 use crate::error::{ApiError, Error, FlussError, Result};
 use crate::metadata::{PhysicalTablePath, TableBucket, TableInfo, TablePath};
 use crate::proto::{ErrorResponse, FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
@@ -223,6 +223,7 @@ impl<'a> TableScan<'a> {
             &self.table_info,
             self.metadata.clone(),
             self.conn.get_connections(),
+            self.conn.config(),
             self.projected_fields,
         )?;
         Ok(LogScanner {
@@ -235,6 +236,7 @@ impl<'a> TableScan<'a> {
             &self.table_info,
             self.metadata.clone(),
             self.conn.get_connections(),
+            self.conn.config(),
             self.projected_fields,
         )?;
         Ok(RecordBatchLogScanner {
@@ -273,6 +275,7 @@ impl LogScannerInner {
         table_info: &TableInfo,
         metadata: Arc<Metadata>,
         connections: Arc<RpcClient>,
+        config: &crate::config::Config,
         projected_fields: Option<Vec<usize>>,
     ) -> Result<Self> {
         let log_scanner_status = Arc::new(LogScannerStatus::new());
@@ -286,13 +289,14 @@ impl LogScannerInner {
                 connections.clone(),
                 metadata.clone(),
                 log_scanner_status.clone(),
+                config,
                 projected_fields,
             )?,
         })
     }
 
     async fn poll_records(&self, timeout: Duration) -> Result<ScanRecords> {
-        let start = std::time::Instant::now();
+        let start = Instant::now();
         let deadline = start + timeout;
 
         loop {
@@ -307,7 +311,7 @@ impl LogScannerInner {
             }
 
             // No data available, check if we should wait
-            let now = std::time::Instant::now();
+            let now = Instant::now();
             if now >= deadline {
                 // Timeout reached, return empty result
                 return Ok(ScanRecords::new(HashMap::new()));
@@ -376,7 +380,7 @@ impl LogScannerInner {
     }
 
     async fn poll_batches(&self, timeout: Duration) -> Result<Vec<RecordBatch>> {
-        let start = std::time::Instant::now();
+        let start = Instant::now();
         let deadline = start + timeout;
 
         loop {
@@ -387,7 +391,7 @@ impl LogScannerInner {
                 return Ok(batches);
             }
 
-            let now = std::time::Instant::now();
+            let now = Instant::now();
             if now >= deadline {
                 return Ok(Vec::new());
             }
@@ -478,6 +482,7 @@ impl LogFetcher {
         conns: Arc<RpcClient>,
         metadata: Arc<Metadata>,
         log_scanner_status: Arc<LogScannerStatus>,
+        config: &crate::config::Config,
         projected_fields: Option<Vec<usize>>,
     ) -> Result<Self> {
         let full_arrow_schema = to_arrow_schema(table_info.get_row_type())?;
@@ -497,7 +502,11 @@ impl LogFetcher {
             log_scanner_status,
             read_context,
             remote_read_context,
-            remote_log_downloader: Arc::new(RemoteLogDownloader::new(tmp_dir)?),
+            remote_log_downloader: Arc::new(RemoteLogDownloader::new(
+                tmp_dir,
+                config.scanner_remote_log_prefetch_num,
+                config.scanner_remote_log_download_threads,
+            )?),
             credentials_cache: Arc::new(CredentialsCache::new(conns.clone(), metadata.clone())),
             log_fetch_buffer,
             nodes_with_pending_fetch_requests: Arc::new(Mutex::new(HashSet::new())),
@@ -1510,6 +1519,7 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata,
             status.clone(),
+            &crate::config::Config::default(),
             None,
         )?;
 
@@ -1529,8 +1539,8 @@ mod tests {
         Ok(())
     }
 
-    #[test]
-    fn fetch_records_from_fetch_drains_unassigned_bucket() -> Result<()> {
+    #[tokio::test]
+    async fn fetch_records_from_fetch_drains_unassigned_bucket() -> Result<()> {
         let table_path = TablePath::new("db".to_string(), "tbl".to_string());
         let table_info = build_table_info(table_path.clone(), 1, 1);
         let cluster = build_cluster_arc(&table_path, 1, 1);
@@ -1541,6 +1551,7 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata,
             status,
+            &crate::config::Config::default(),
             None,
         )?;
 
@@ -1576,6 +1587,7 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata,
             status,
+            &crate::config::Config::default(),
             None,
         )?;
 
@@ -1599,6 +1611,7 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata.clone(),
             status.clone(),
+            &crate::config::Config::default(),
             None,
         )?;
 
@@ -1649,6 +1662,7 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata.clone(),
             status.clone(),
+            &crate::config::Config::default(),
             None,
         )?;
 
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 92f600e62a..705e241da0 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -36,6 +36,16 @@ pub struct Config {
 
     #[arg(long, default_value_t = 2 * 1024 * 1024)]
     pub writer_batch_size: i32,
+
+    /// Maximum number of remote log segments to prefetch
+    /// Default: 4 (matching Java CLIENT_SCANNER_REMOTE_LOG_PREFETCH_NUM)
+    #[arg(long, default_value_t = 4)]
+    pub scanner_remote_log_prefetch_num: usize,
+
+    /// Maximum concurrent remote log downloads
+    /// Default: 3 (matching Java REMOTE_FILE_DOWNLOAD_THREAD_NUM)
+    #[arg(long, default_value_t = 3)]
+    pub scanner_remote_log_download_threads: usize,
 }
 
 impl Default for Config {
@@ -46,6 +56,8 @@ impl Default for Config {
             writer_acks: String::from("all"),
             writer_retries: i32::MAX,
             writer_batch_size: 2 * 1024 * 1024,
+            scanner_remote_log_prefetch_num: 4,
+            scanner_remote_log_download_threads: 3,
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index eaee94c36c..65eddce71e 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -306,6 +306,7 @@ message PbRemoteLogSegment {
   required int64 remote_log_start_offset = 2;
   required int64 remote_log_end_offset = 3;
   required int32 segment_size_in_bytes = 4;
+  optional int64 max_timestamp = 5;
 }
 
 message PbListOffsetsRespForBucket {
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 39114d3273..4bfdc71c99 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -46,7 +46,10 @@ use byteorder::{ByteOrder, LittleEndian};
 use bytes::Bytes;
 use crc32c::crc32c;
 use std::{
-    io::{Cursor, Write},
+    collections::HashMap,
+    fs::File,
+    io::{Cursor, Read, Seek, SeekFrom, Write},
+    path::PathBuf,
     sync::Arc,
 };
 
@@ -82,6 +85,11 @@ pub const RECORD_BATCH_HEADER_SIZE: usize = RECORDS_OFFSET;
 pub const ARROW_CHANGETYPE_OFFSET: usize = RECORD_BATCH_HEADER_SIZE;
 pub const LOG_OVERHEAD: usize = LENGTH_OFFSET + LENGTH_LENGTH;
 
+/// Maximum batch size matches Java's Integer.MAX_VALUE limit.
+/// Java uses int type for batch size, so max value is 2^31 - 1 = 2,147,483,647 bytes (~2GB).
+/// This is the implicit limit in FileLogRecords.java and other Java components.
+pub const MAX_BATCH_SIZE: usize = i32::MAX as usize; // 2,147,483,647 bytes (~2GB)
+
 /// const for record
 /// The "magic" values.
 #[derive(Debug, Clone, Copy)]
@@ -89,6 +97,49 @@ pub enum LogMagicValue {
     V0 = 0,
 }
 
+/// Validate the i32 batch length read from a batch header and return the total batch size.
+///
+/// Returns `batch_size_bytes + LOG_OVERHEAD` as `usize` after checking that:
+/// - batch_size_bytes is non-negative
+/// - batch_size_bytes + LOG_OVERHEAD doesn't overflow
+/// - the resulting total does not exceed MAX_BATCH_SIZE
+fn validate_batch_size(batch_size_bytes: i32) -> Result<usize> {
+    // Check for negative size (corrupted data)
+    if batch_size_bytes < 0 {
+        return Err(Error::UnexpectedError {
+            message: format!("Invalid negative batch size: {}", batch_size_bytes),
+            source: None,
+        });
+    }
+
+    let batch_size_u = batch_size_bytes as usize;
+
+    // Check for overflow when adding LOG_OVERHEAD
+    let total_size =
+        batch_size_u
+            .checked_add(LOG_OVERHEAD)
+            .ok_or_else(|| Error::UnexpectedError {
+                message: format!(
+                    "Batch size {} + LOG_OVERHEAD {} would overflow",
+                    batch_size_u, LOG_OVERHEAD
+                ),
+                source: None,
+            })?;
+
+    // Sanity check: reject unreasonably large batches
+    if total_size > MAX_BATCH_SIZE {
+        return Err(Error::UnexpectedError {
+            message: format!(
+                "Batch size {} exceeds maximum allowed size {}",
+                total_size, MAX_BATCH_SIZE
+            ),
+            source: None,
+        });
+    }
+
+    Ok(total_size)
+}
+
 // NOTE: Rust layout/offsets currently match Java only for V0.
 // TODO: Add V1 layout/offsets to keep parity with Java's V1 format.
 pub const CURRENT_LOG_MAGIC_VALUE: u8 = LogMagicValue::V0 as u8;
@@ -441,53 +492,280 @@ pub trait ToArrow {
     fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()>;
 }
 
-pub struct LogRecordsBatches {
+/// In-memory log record source.
+/// Used for local tablet server fetches (existing path).
+struct MemorySource {
     data: Bytes,
+}
+
+impl MemorySource {
+    fn new(data: Vec<u8>) -> Self {
+        Self {
+            data: Bytes::from(data),
+        }
+    }
+
+    fn read_batch_header(&mut self, pos: usize) -> Result<(i64, usize)> {
+        if pos + LOG_OVERHEAD > self.data.len() {
+            return Err(Error::UnexpectedError {
+                message: format!(
+                    "Position {} + LOG_OVERHEAD {} exceeds data size {}",
+                    pos,
+                    LOG_OVERHEAD,
+                    self.data.len()
+                ),
+                source: None,
+            });
+        }
+
+        let base_offset = LittleEndian::read_i64(&self.data[pos + BASE_OFFSET_OFFSET..]);
+        let batch_size_bytes = LittleEndian::read_i32(&self.data[pos + LENGTH_OFFSET..]);
+
+        // Validate batch size to prevent integer overflow and corruption
+        let batch_size = validate_batch_size(batch_size_bytes)?;
+
+        Ok((base_offset, batch_size))
+    }
+
+    fn read_batch_data(&mut self, pos: usize, size: usize) -> Result<Bytes> {
+        if pos + size > self.data.len() {
+            return Err(Error::UnexpectedError {
+                message: format!(
+                    "Read beyond data size: {} + {} > {}",
+                    pos,
+                    size,
+                    self.data.len()
+                ),
+                source: None,
+            });
+        }
+        // Zero-copy slice (Bytes is Arc-based)
+        Ok(self.data.slice(pos..pos + size))
+    }
+
+    fn total_size(&self) -> usize {
+        self.data.len()
+    }
+}
+
+/// RAII guard that deletes a file when dropped.
+/// Used to ensure file deletion happens AFTER the file handle is closed.
+struct FileCleanupGuard {
+    file_path: PathBuf,
+}
+
+impl Drop for FileCleanupGuard {
+    fn drop(&mut self) {
+        // File handle is already closed (this guard drops after the file field)
+        if let Err(e) = std::fs::remove_file(&self.file_path) {
+            log::warn!(
+                "Failed to delete remote log file {}: {}",
+                self.file_path.display(),
+                e
+            );
+        } else {
+            log::debug!("Deleted remote log file: {}", self.file_path.display());
+        }
+    }
+}
+
+/// File-backed log record source.
+/// Used for remote log segments downloaded to local disk.
+/// Streams data on-demand instead of loading entire file into memory.
+///
+/// Uses seek + read_exact for cross-platform compatibility.
+/// Access pattern is sequential iteration (single consumer).
+struct FileSource {
+    file: File,
+    file_size: usize,
+    base_offset: usize,
+    _cleanup: Option<FileCleanupGuard>, // Drops AFTER file (field order matters!)
+}
+
+impl FileSource {
+    /// Create a new FileSource.
+    ///
+    /// The file at `file_path` will be deleted when this FileSource is dropped.
+    fn new(file: File, base_offset: usize, file_path: PathBuf) -> Result<Self> {
+        let file_size = file.metadata()?.len() as usize;
+
+        // Validate base_offset to prevent underflow in total_size()
+        if base_offset > file_size {
+            return Err(Error::UnexpectedError {
+                message: format!(
+                    "base_offset ({}) exceeds file_size ({})",
+                    base_offset, file_size
+                ),
+                source: None,
+            });
+        }
+
+        Ok(Self {
+            file,
+            file_size,
+            base_offset,
+            _cleanup: Some(FileCleanupGuard { file_path }),
+        })
+    }
+
+    /// Read data at a specific position using seek + read_exact.
+    /// This is cross-platform and adequate for sequential access patterns.
+    fn read_at(&mut self, pos: u64, buf: &mut [u8]) -> Result<()> {
+        self.file.seek(SeekFrom::Start(pos))?;
+        self.file.read_exact(buf)?;
+        Ok(())
+    }
+
+    fn read_batch_header(&mut self, pos: usize) -> Result<(i64, usize)> {
+        let actual_pos = self.base_offset + pos;
+        if actual_pos + LOG_OVERHEAD > self.file_size {
+            return Err(Error::UnexpectedError {
+                message: format!(
+                    "Position {} exceeds file size {}",
+                    actual_pos, self.file_size
+                ),
+                source: None,
+            });
+        }
+
+        // Read only the header to extract base_offset and batch_size
+        let mut header_buf = vec![0u8; LOG_OVERHEAD];
+        self.read_at(actual_pos as u64, &mut header_buf)?;
+
+        let base_offset = LittleEndian::read_i64(&header_buf[BASE_OFFSET_OFFSET..]);
+        let batch_size_bytes = LittleEndian::read_i32(&header_buf[LENGTH_OFFSET..]);
+
+        // Validate batch size to prevent integer overflow and corruption
+        let batch_size = validate_batch_size(batch_size_bytes)?;
+
+        Ok((base_offset, batch_size))
+    }
+
+    fn read_batch_data(&mut self, pos: usize, size: usize) -> Result<Bytes> {
+        let actual_pos = self.base_offset + pos;
+        if actual_pos + size > self.file_size {
+            return Err(Error::UnexpectedError {
+                message: format!(
+                    "Read beyond file size: {} + {} > {}",
+                    actual_pos, size, self.file_size
+                ),
+                source: None,
+            });
+        }
+
+        // Read the full batch data
+        let mut batch_buf = vec![0u8; size];
+        self.read_at(actual_pos as u64, &mut batch_buf)?;
+
+        Ok(Bytes::from(batch_buf))
+    }
+
+    fn total_size(&self) -> usize {
+        self.file_size - self.base_offset
+    }
+}
+
+/// Enum for different log record sources.
+enum LogRecordsSource {
+    Memory(MemorySource),
+    File(FileSource),
+}
+
+impl LogRecordsSource {
+    fn read_batch_header(&mut self, pos: usize) -> Result<(i64, usize)> {
+        match self {
+            Self::Memory(s) => s.read_batch_header(pos),
+            Self::File(s) => s.read_batch_header(pos),
+        }
+    }
+
+    fn read_batch_data(&mut self, pos: usize, size: usize) -> Result<Bytes> {
+        match self {
+            Self::Memory(s) => s.read_batch_data(pos, size),
+            Self::File(s) => s.read_batch_data(pos, size),
+        }
+    }
+
+    fn total_size(&self) -> usize {
+        match self {
+            Self::Memory(s) => s.total_size(),
+            Self::File(s) => s.total_size(),
+        }
+    }
+}
+
+pub struct LogRecordsBatches {
+    source: LogRecordsSource,
     current_pos: usize,
     remaining_bytes: usize,
 }
 
 impl LogRecordsBatches {
+    /// Create from in-memory Vec (existing path - backward compatible).
     pub fn new(data: Vec<u8>) -> Self {
-        let remaining_bytes: usize = data.len();
+        let source = LogRecordsSource::Memory(MemorySource::new(data));
+        let remaining_bytes = source.total_size();
         Self {
-            data: Bytes::from(data),
+            source,
             current_pos: 0,
             remaining_bytes,
         }
     }
 
-    pub fn next_batch_size(&self) -> Option<usize> {
+    /// Create from file.
+    /// Enables streaming without loading entire file into memory.
+    ///
+    /// The file at `file_path` will be deleted when dropped.
+    /// This ensures the file is closed before deletion.
+    pub fn from_file(file: File, base_offset: usize, file_path: PathBuf) -> Result<Self> {
+        let source = FileSource::new(file, base_offset, file_path)?;
+        let remaining_bytes = source.total_size();
+        Ok(Self {
+            source: LogRecordsSource::File(source),
+            current_pos: 0,
+            remaining_bytes,
+        })
+    }
+
+    /// Try to get the size of the next batch.
+    fn next_batch_size(&mut self) -> Result<Option<usize>> {
         if self.remaining_bytes < LOG_OVERHEAD {
-            return None;
+            return Ok(None);
         }
 
-        let batch_size_bytes =
-            LittleEndian::read_i32(self.data.get(self.current_pos + LENGTH_OFFSET..).unwrap());
-        let batch_size = batch_size_bytes as usize + LOG_OVERHEAD;
-        if batch_size > self.remaining_bytes {
-            return None;
+        // Read only header to get size
+        match self.source.read_batch_header(self.current_pos) {
+            Ok((_base_offset, batch_size)) => {
+                if batch_size > self.remaining_bytes {
+                    Ok(None)
+                } else {
+                    Ok(Some(batch_size))
+                }
+            }
+            Err(e) => Err(e),
         }
-        Some(batch_size)
     }
 }
 
 impl Iterator for LogRecordsBatches {
-    type Item = LogRecordBatch;
+    type Item = Result<LogRecordBatch>;
 
     fn next(&mut self) -> Option<Self::Item> {
         match self.next_batch_size() {
-            Some(batch_size) => {
-                let start = self.current_pos;
-                let end = start + batch_size;
-                // Since LogRecordsBatches owns the Vec<u8>, the slice is valid
-                // as long as the mutable reference exists, which is 'a
-                let record_batch = LogRecordBatch::new(self.data.slice(start..end));
-                self.current_pos += batch_size;
-                self.remaining_bytes -= batch_size;
-                Some(record_batch)
+            Ok(Some(batch_size)) => {
+                // Read full batch data on-demand
+                match self.source.read_batch_data(self.current_pos, batch_size) {
+                    Ok(data) => {
+                        let record_batch = LogRecordBatch::new(data);
+                        self.current_pos += batch_size;
+                        self.remaining_bytes -= batch_size;
+                        Some(Ok(record_batch))
+                    }
+                    Err(e) => Some(Err(e)),
+                }
             }
-            None => None,
+            Ok(None) => None,
+            Err(e) => Some(Err(e)),
         }
     }
 }
@@ -1012,7 +1290,7 @@ impl ReadContext {
             &body_buffer,
             batch_metadata,
             resolve_schema,
-            &std::collections::HashMap::new(),
+            &HashMap::new(),
             None,
             &version,
         )?;
@@ -1052,7 +1330,7 @@ impl ReadContext {
             &body_buffer,
             batch_metadata,
             self.full_schema.clone(),
-            &std::collections::HashMap::new(),
+            &HashMap::new(),
             None,
             &version,
         )?;
@@ -1157,7 +1435,7 @@ pub struct MyVec<T>(pub StreamReader<T>);
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::{DataField, DataTypes};
+    use crate::metadata::{DataField, DataTypes, RowType};
 
     #[test]
     fn test_to_array_type() {
@@ -1456,6 +1734,49 @@ mod tests {
         Ok(())
     }
 
+    // Tests for file-backed streaming
+
+    #[test]
+    fn test_file_source_streaming() -> Result<()> {
+        use tempfile::NamedTempFile;
+
+        // Test 1: Basic file reads work
+        let test_data = vec![1, 2, 3, 4, 5, 6, 7, 8, 9, 10];
+        let mut tmp_file = NamedTempFile::new()?;
+        tmp_file.write_all(&test_data)?;
+        tmp_file.flush()?;
+
+        let file_path = tmp_file.path().to_path_buf();
+        let file = File::open(&file_path)?;
+        let mut source = FileSource::new(file, 0, file_path)?;
+
+        // Read full data
+        let data = source.read_batch_data(0, 10)?;
+        assert_eq!(data.to_vec(), test_data);
+
+        // Read partial data
+        let partial = source.read_batch_data(2, 5)?;
+        assert_eq!(partial.to_vec(), vec![3, 4, 5, 6, 7]);
+
+        // Test 2: base_offset works (critical for remote logs with pos_in_log_segment)
+        let prefix = vec![0xFF; 100];
+        let actual_data = vec![1, 2, 3, 4, 5];
+        let mut tmp_file2 = NamedTempFile::new()?;
+        tmp_file2.write_all(&prefix)?;
+        tmp_file2.write_all(&actual_data)?;
+        tmp_file2.flush()?;
+
+        let file_path2 = tmp_file2.path().to_path_buf();
+        let file2 = File::open(&file_path2)?;
+        let mut source2 = FileSource::new(file2, 100, file_path2)?; // Skip first 100 bytes
+
+        assert_eq!(source2.total_size(), 5); // Only counts data after offset
+        let data2 = source2.read_batch_data(0, 5)?;
+        assert_eq!(data2.to_vec(), actual_data);
+
+        Ok(())
+    }
+
     #[test]
     fn test_all_types_end_to_end() -> Result<()> {
         use crate::row::{Date, Datum, Decimal, GenericRow, Time, TimestampLtz, TimestampNtz};
@@ -1590,4 +1911,63 @@ mod tests {
 
         Ok(())
     }
+
+    #[test]
+    fn test_log_records_batches_from_file() -> Result<()> {
+        use crate::client::WriteRecord;
+        use crate::compression::{
+            ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+        };
+        use crate::metadata::TablePath;
+        use crate::row::GenericRow;
+        use tempfile::NamedTempFile;
+
+        // Integration test: Real log record batch streamed from file
+        let row_type = RowType::new(vec![
+            DataField::new("id".to_string(), DataTypes::int(), None),
+            DataField::new("name".to_string(), DataTypes::string(), None),
+        ]);
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+
+        let mut builder = MemoryLogRecordsArrowBuilder::new(
+            1,
+            &row_type,
+            false,
+            ArrowCompressionInfo {
+                compression_type: ArrowCompressionType::None,
+                compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+            },
+        )?;
+
+        let mut row = GenericRow::new();
+        row.set_field(0, 1_i32);
+        row.set_field(1, "alice");
+        let record = WriteRecord::for_append(table_path.clone(), 1, row);
+        builder.append(&record)?;
+
+        let mut row2 = GenericRow::new();
+        row2.set_field(0, 2_i32);
+        row2.set_field(1, "bob");
+        let record2 = WriteRecord::for_append(table_path, 2, row2);
+        builder.append(&record2)?;
+
+        let data = builder.build()?;
+
+        // Write to file
+        let mut tmp_file = NamedTempFile::new()?;
+        tmp_file.write_all(&data)?;
+        tmp_file.flush()?;
+
+        // Create file-backed LogRecordsBatches (should stream, not load all into memory)
+        let file_path = tmp_file.path().to_path_buf();
+        let file = File::open(&file_path)?;
+        let mut batches = LogRecordsBatches::from_file(file, 0, file_path)?;
+
+        // Iterate through batches (should work just like in-memory)
+        let batch = batches.next().expect("Should have at least one batch")?;
+        assert!(batch.size_in_bytes() > 0);
+        assert_eq!(batch.record_count(), 2);
+
+        Ok(())
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
index 30424e5d16..156ef04956 100644
--- a/fluss-rust/crates/fluss/src/util/mod.rs
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -22,7 +22,6 @@ use crate::metadata::TableBucket;
 use linked_hash_map::LinkedHashMap;
 use std::collections::{HashMap, HashSet};
 use std::hash::Hash;
-use std::path::PathBuf;
 use std::sync::Arc;
 use std::time::{SystemTime, UNIX_EPOCH};
 
@@ -33,11 +32,9 @@ pub fn current_time_ms() -> i64 {
         .as_millis() as i64
 }
 
-pub async fn delete_file(file_path: PathBuf) {
-    tokio::fs::remove_file(&file_path)
-        .await
-        .unwrap_or_else(|err| log::warn!("Could not delete file: {file_path:?}, error: {err:?}"));
-}
+// Removed: delete_file() is no longer used.
+// File cleanup is now handled via RAII with FileCleanupGuard in arrow.rs
+// which uses Rust's drop order to ensure files are closed before deletion.
 
 pub struct FairBucketStatusMap<S> {
     map: LinkedHashMap<TableBucket, Arc<S>>,

From d695cb803509bd00f7f725afac278b026e6ff227 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sun, 25 Jan 2026 01:18:59 +0000
Subject: [PATCH 085/287] feat: Implement Admin APIs for partitioning (#208)

---
 fluss-rust/crates/fluss/src/client/admin.rs   |  76 ++-
 .../crates/fluss/src/client/table/scanner.rs  |   3 +-
 .../fluss/src/client/write/accumulator.rs     |   2 +-
 .../crates/fluss/src/client/write/sender.rs   |   3 +-
 fluss-rust/crates/fluss/src/lib.rs            |   4 +-
 fluss-rust/crates/fluss/src/metadata/mod.rs   |   2 +
 .../crates/fluss/src/metadata/partition.rs    | 469 ++++++++++++++++++
 fluss-rust/crates/fluss/src/metadata/table.rs |  66 ++-
 .../crates/fluss/src/proto/fluss_api.proto    |  36 +-
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |  12 +
 .../fluss/src/rpc/message/create_partition.rs |  59 +++
 .../fluss/src/rpc/message/drop_partition.rs   |  59 +++
 .../fluss/src/rpc/message/list_offsets.rs     |  10 +-
 .../src/rpc/message/list_partition_infos.rs   |  63 +++
 .../crates/fluss/src/rpc/message/mod.rs       |   6 +
 fluss-rust/crates/fluss/src/util/mod.rs       |   3 +-
 .../crates/fluss/tests/integration/admin.rs   | 145 +++++-
 17 files changed, 983 insertions(+), 35 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/metadata/partition.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/create_partition.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/drop_partition.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/list_partition_infos.rs

diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 6646f97cf8..bffe0f5141 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -17,20 +17,21 @@
 
 use crate::client::metadata::Metadata;
 use crate::metadata::{
-    DatabaseDescriptor, DatabaseInfo, JsonSerde, LakeSnapshot, TableBucket, TableDescriptor,
-    TableInfo, TablePath,
+    DatabaseDescriptor, DatabaseInfo, JsonSerde, LakeSnapshot, PartitionInfo, PartitionSpec,
+    TableBucket, TableDescriptor, TableInfo, TablePath,
 };
 use crate::rpc::message::{
-    CreateDatabaseRequest, CreateTableRequest, DatabaseExistsRequest, DropDatabaseRequest,
-    DropTableRequest, GetDatabaseInfoRequest, GetLatestLakeSnapshotRequest, GetTableRequest,
-    ListDatabasesRequest, ListTablesRequest, TableExistsRequest,
+    CreateDatabaseRequest, CreatePartitionRequest, CreateTableRequest, DatabaseExistsRequest,
+    DropDatabaseRequest, DropPartitionRequest, DropTableRequest, GetDatabaseInfoRequest,
+    GetLatestLakeSnapshotRequest, GetTableRequest, ListDatabasesRequest, ListPartitionInfosRequest,
+    ListTablesRequest, TableExistsRequest,
 };
 use crate::rpc::message::{ListOffsetsRequest, OffsetSpec};
 use crate::rpc::{RpcClient, ServerConnection};
 
-use crate::BucketId;
 use crate::error::{Error, Result};
 use crate::proto::GetTableInfoResponse;
+use crate::{BucketId, PartitionId, TableId};
 use std::collections::HashMap;
 use std::slice::from_ref;
 use std::sync::Arc;
@@ -138,6 +139,63 @@ impl FlussAdmin {
         Ok(response.table_name)
     }
 
+    /// List all partitions in the given table.
+    pub async fn list_partition_infos(&self, table_path: &TablePath) -> Result<Vec<PartitionInfo>> {
+        self.list_partition_infos_with_spec(table_path, None).await
+    }
+
+    /// List partitions in the given table that match the partial partition spec.
+    pub async fn list_partition_infos_with_spec(
+        &self,
+        table_path: &TablePath,
+        partial_partition_spec: Option<&PartitionSpec>,
+    ) -> Result<Vec<PartitionInfo>> {
+        let response = self
+            .admin_gateway
+            .request(ListPartitionInfosRequest::new(
+                table_path,
+                partial_partition_spec,
+            ))
+            .await?;
+        Ok(response.get_partitions_info())
+    }
+
+    /// Create a new partition for a partitioned table.
+    pub async fn create_partition(
+        &self,
+        table_path: &TablePath,
+        partition_spec: &PartitionSpec,
+        ignore_if_exists: bool,
+    ) -> Result<()> {
+        let _response = self
+            .admin_gateway
+            .request(CreatePartitionRequest::new(
+                table_path,
+                partition_spec,
+                ignore_if_exists,
+            ))
+            .await?;
+        Ok(())
+    }
+
+    /// Drop a partition from a partitioned table.
+    pub async fn drop_partition(
+        &self,
+        table_path: &TablePath,
+        partition_spec: &PartitionSpec,
+        ignore_if_not_exists: bool,
+    ) -> Result<()> {
+        let _response = self
+            .admin_gateway
+            .request(DropPartitionRequest::new(
+                table_path,
+                partition_spec,
+                ignore_if_not_exists,
+            ))
+            .await?;
+        Ok(())
+    }
+
     /// Check if a table exists
     pub async fn table_exists(&self, table_path: &TablePath) -> Result<bool> {
         let response = self
@@ -263,13 +321,13 @@ impl FlussAdmin {
 
     fn prepare_list_offsets_requests(
         &self,
-        table_id: i64,
-        partition_id: Option<i64>,
+        table_id: TableId,
+        partition_id: Option<PartitionId>,
         buckets: &[BucketId],
         offset_spec: OffsetSpec,
     ) -> Result<HashMap<i32, ListOffsetsRequest>> {
         let cluster = self.metadata.get_cluster();
-        let mut node_for_bucket_list: HashMap<i32, Vec<i32>> = HashMap::new();
+        let mut node_for_bucket_list: HashMap<i32, Vec<BucketId>> = HashMap::new();
 
         for bucket_id in buckets {
             let table_bucket = TableBucket::new(table_id, *bucket_id);
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 8712650e6a..61ed56e1df 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -27,6 +27,7 @@ use std::{
 };
 use tempfile::TempDir;
 
+use crate::TableId;
 use crate::client::connection::FlussConnection;
 use crate::client::credentials::CredentialsCache;
 use crate::client::metadata::Metadata;
@@ -264,7 +265,7 @@ pub struct RecordBatchLogScanner {
 /// Private shared implementation for both scanner types
 struct LogScannerInner {
     table_path: TablePath,
-    table_id: i64,
+    table_id: TableId,
     metadata: Arc<Metadata>,
     log_scanner_status: Arc<LogScannerStatus>,
     log_fetcher: LogFetcher,
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 46c822c1a2..96114fb015 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -401,7 +401,7 @@ impl RecordAccumulator {
         ready_write_batch.write_batch.re_enqueued();
         let table_path = ready_write_batch.write_batch.table_path().clone();
         let bucket_id = ready_write_batch.table_bucket.bucket_id();
-        let table_id = u64::try_from(ready_write_batch.table_bucket.table_id()).unwrap_or(0);
+        let table_id = ready_write_batch.table_bucket.table_id();
 
         let dq = {
             let mut binding =
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index ceed245621..1ffda58230 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -15,6 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::TableId;
 use crate::client::broadcast;
 use crate::client::metadata::Metadata;
 use crate::client::write::batch::WriteBatch;
@@ -144,7 +145,7 @@ impl Sender {
             return Ok(());
         }
         let mut records_by_bucket = HashMap::new();
-        let mut write_batch_by_table: HashMap<i64, Vec<TableBucket>> = HashMap::new();
+        let mut write_batch_by_table: HashMap<TableId, Vec<TableBucket>> = HashMap::new();
 
         for batch in batches {
             let table_bucket = batch.table_bucket.clone();
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index e8d822fb77..f079db2808 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -34,8 +34,8 @@ mod util;
 #[cfg(test)]
 mod test_utils;
 
-pub type TableId = u64;
-pub type PartitionId = u64;
+pub type TableId = i64;
+pub type PartitionId = i64;
 pub type BucketId = i32;
 
 pub mod proto {
diff --git a/fluss-rust/crates/fluss/src/metadata/mod.rs b/fluss-rust/crates/fluss/src/metadata/mod.rs
index 9c0b1b472c..0ca654a6b1 100644
--- a/fluss-rust/crates/fluss/src/metadata/mod.rs
+++ b/fluss-rust/crates/fluss/src/metadata/mod.rs
@@ -19,10 +19,12 @@ mod data_lake_format;
 mod database;
 mod datatype;
 mod json_serde;
+mod partition;
 mod table;
 
 pub use data_lake_format::*;
 pub use database::*;
 pub use datatype::*;
 pub use json_serde::*;
+pub use partition::*;
 pub use table::*;
diff --git a/fluss-rust/crates/fluss/src/metadata/partition.rs b/fluss-rust/crates/fluss/src/metadata/partition.rs
new file mode 100644
index 0000000000..1ecc0dcd9e
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/metadata/partition.rs
@@ -0,0 +1,469 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::PartitionId;
+use crate::error::{Error, Result};
+use crate::proto::{PbKeyValue, PbPartitionInfo, PbPartitionSpec};
+use std::collections::HashMap;
+use std::fmt::{Display, Formatter};
+
+/// Represents a partition spec in fluss. Partition columns and values are NOT of strict order, and
+/// they need to be re-arranged to the correct order by comparing with a list of strictly ordered
+/// partition keys.
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub struct PartitionSpec {
+    partition_spec: HashMap<String, String>,
+}
+
+impl PartitionSpec {
+    pub fn new(partition_spec: HashMap<String, String>) -> Self {
+        Self { partition_spec }
+    }
+
+    pub fn get_spec_map(&self) -> &HashMap<String, String> {
+        &self.partition_spec
+    }
+
+    pub fn to_pb(&self) -> PbPartitionSpec {
+        PbPartitionSpec {
+            partition_key_values: self
+                .partition_spec
+                .iter()
+                .map(|(k, v)| PbKeyValue {
+                    key: k.clone(),
+                    value: v.clone(),
+                })
+                .collect(),
+        }
+    }
+
+    pub fn from_pb(pb: &PbPartitionSpec) -> Self {
+        let partition_spec = pb
+            .partition_key_values
+            .iter()
+            .map(|kv| (kv.key.clone(), kv.value.clone()))
+            .collect();
+        Self { partition_spec }
+    }
+}
+
+impl Display for PartitionSpec {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "PartitionSpec{{{:?}}}", self.partition_spec)
+    }
+}
+
+/// Represents a partition, which is the resolved version of PartitionSpec. The partition
+/// spec is re-arranged into the correct order by comparing it with a list of strictly ordered
+/// partition keys.
+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
+pub struct ResolvedPartitionSpec {
+    partition_keys: Vec<String>,
+    partition_values: Vec<String>,
+}
+
+pub const PARTITION_SPEC_SEPARATOR: &str = "$";
+
+impl ResolvedPartitionSpec {
+    pub fn new(partition_keys: Vec<String>, partition_values: Vec<String>) -> Result<Self> {
+        if partition_keys.len() != partition_values.len() {
+            return Err(Error::IllegalArgument {
+                message: "The number of partition keys and partition values should be the same."
+                    .to_string(),
+            });
+        }
+        Ok(Self {
+            partition_keys,
+            partition_values,
+        })
+    }
+
+    pub fn from_partition_spec(
+        partition_keys: Vec<String>,
+        partition_spec: &PartitionSpec,
+    ) -> Self {
+        let partition_values =
+            Self::get_reordered_partition_values(&partition_keys, partition_spec);
+        Self {
+            partition_keys,
+            partition_values,
+        }
+    }
+
+    pub fn from_partition_value(partition_key: String, partition_value: String) -> Self {
+        Self {
+            partition_keys: vec![partition_key],
+            partition_values: vec![partition_value],
+        }
+    }
+
+    pub fn from_partition_name(partition_keys: Vec<String>, partition_name: &str) -> Self {
+        let partition_values: Vec<String> = partition_name
+            .split(PARTITION_SPEC_SEPARATOR)
+            .map(|s| s.to_string())
+            .collect();
+        Self {
+            partition_keys,
+            partition_values,
+        }
+    }
+
+    pub fn from_partition_qualified_name(qualified_partition_name: &str) -> Result<Self> {
+        let mut keys = Vec::new();
+        let mut values = Vec::new();
+
+        for pair in qualified_partition_name.split('/') {
+            let parts: Vec<&str> = pair.splitn(2, '=').collect();
+            if parts.len() != 2 {
+                return Err(Error::IllegalArgument {
+                    message: format!(
+                        "Invalid partition name format. Expected key=value, got: {}",
+                        pair
+                    ),
+                });
+            }
+            keys.push(parts[0].to_string());
+            values.push(parts[1].to_string());
+        }
+
+        Ok(Self {
+            partition_keys: keys,
+            partition_values: values,
+        })
+    }
+
+    pub fn get_partition_keys(&self) -> &[String] {
+        &self.partition_keys
+    }
+
+    pub fn get_partition_values(&self) -> &[String] {
+        &self.partition_values
+    }
+
+    /// Converts this resolved spec back into an unordered key -> value `PartitionSpec`.
+    ///
+    /// Keys and values are paired positionally with `zip`, as `to_pb` does, not by indexing.
+    pub fn to_partition_spec(&self) -> PartitionSpec {
+        let pairs = self.partition_keys.iter().zip(&self.partition_values);
+        PartitionSpec::new(pairs.map(|(k, v)| (k.clone(), v.clone())).collect())
+    }
+
+    /// Generate the partition name for a partition table with specified partition values.
+    ///
+    /// The partition name is in the following format: value1$value2$...$valueN
+    pub fn get_partition_name(&self) -> String {
+        self.partition_values.join(PARTITION_SPEC_SEPARATOR)
+    }
+
+    /// Returns the qualified partition name for a partition spec.
+    /// The format is: key1=value1/key2=value2/.../keyN=valueN
+    ///
+    /// Keys and values are paired positionally; pairing with `zip` (as `to_pb` does) avoids
+    /// an out-of-bounds panic if a spec was built with fewer values than keys, e.g. by
+    /// `from_partition_name`, which does not check lengths.
+    pub fn get_partition_qualified_name(&self) -> String {
+        self.partition_keys
+            .iter()
+            .zip(self.partition_values.iter())
+            .map(|(key, value)| format!("{key}={value}"))
+            .collect::<Vec<_>>()
+            .join("/")
+    }
+
+    /// Checks whether every key of `other` is present in this spec with the same value.
+    /// Values are compared one by one rather than as `$`-joined names, so a value containing
+    /// the separator cannot cause a false match. Errors if `other` has a key this spec lacks.
+    pub fn contains(&self, other: &ResolvedPartitionSpec) -> Result<bool> {
+        let other_partition_keys = other.get_partition_keys();
+        let other_partition_values = other.get_partition_values();
+
+        let mut expected_values = Vec::with_capacity(other_partition_keys.len());
+        for other_partition_key in other_partition_keys {
+            let key_index = self
+                .partition_keys
+                .iter()
+                .position(|k| k == other_partition_key);
+            match key_index {
+                Some(idx) => expected_values.push(&self.partition_values[idx]),
+                None => {
+                    return Err(Error::IllegalArgument {
+                        message: format!(
+                            "table does not contain partitionKey: {}",
+                            other_partition_key
+                        ),
+                    });
+                }
+            }
+        }
+
+        Ok(expected_values.into_iter().eq(other_partition_values))
+    }
+
+    pub fn to_pb(&self) -> PbPartitionSpec {
+        PbPartitionSpec {
+            partition_key_values: self
+                .partition_keys
+                .iter()
+                .zip(self.partition_values.iter())
+                .map(|(k, v)| PbKeyValue {
+                    key: k.clone(),
+                    value: v.clone(),
+                })
+                .collect(),
+        }
+    }
+
+    pub fn from_pb(pb: &PbPartitionSpec) -> Self {
+        let partition_keys = pb
+            .partition_key_values
+            .iter()
+            .map(|kv| kv.key.clone())
+            .collect();
+        let partition_values = pb
+            .partition_key_values
+            .iter()
+            .map(|kv| kv.value.clone())
+            .collect();
+        Self {
+            partition_keys,
+            partition_values,
+        }
+    }
+
+    fn get_reordered_partition_values(
+        partition_keys: &[String],
+        partition_spec: &PartitionSpec,
+    ) -> Vec<String> {
+        let partition_spec_map = partition_spec.get_spec_map();
+        partition_keys
+            .iter()
+            .map(|key| partition_spec_map.get(key).cloned().unwrap_or_default())
+            .collect()
+    }
+}
+
+impl Display for ResolvedPartitionSpec {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(f, "{}", self.get_partition_qualified_name())
+    }
+}
+
+/// Metadata of a partition: its resolved partition spec, from which the partition name is
+/// derived, and the partition id that uniquely identifies the partition.
+#[derive(Debug, Clone, PartialEq, Eq, Hash)]
+pub struct PartitionInfo {
+    partition_id: PartitionId,
+    partition_spec: ResolvedPartitionSpec,
+}
+
+impl PartitionInfo {
+    pub fn new(partition_id: PartitionId, partition_spec: ResolvedPartitionSpec) -> Self {
+        Self {
+            partition_id,
+            partition_spec,
+        }
+    }
+
+    /// Get the partition id. The id is globally unique in the Fluss cluster.
+    pub fn get_partition_id(&self) -> PartitionId {
+        self.partition_id
+    }
+
+    /// Get the partition name.
+    pub fn get_partition_name(&self) -> String {
+        self.partition_spec.get_partition_name()
+    }
+
+    pub fn get_resolved_partition_spec(&self) -> &ResolvedPartitionSpec {
+        &self.partition_spec
+    }
+
+    pub fn get_partition_spec(&self) -> PartitionSpec {
+        self.partition_spec.to_partition_spec()
+    }
+
+    pub fn to_pb(&self) -> PbPartitionInfo {
+        PbPartitionInfo {
+            partition_id: self.partition_id,
+            partition_spec: self.partition_spec.to_pb(),
+        }
+    }
+
+    pub fn from_pb(pb: &PbPartitionInfo) -> Self {
+        Self {
+            partition_id: pb.partition_id,
+            partition_spec: ResolvedPartitionSpec::from_pb(&pb.partition_spec),
+        }
+    }
+}
+
+impl Display for PartitionInfo {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(
+            f,
+            "Partition{{name='{}', id={}}}",
+            self.get_partition_name(),
+            self.partition_id
+        )
+    }
+}
+
+/// Identifies a table partition by its table id and partition id.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+pub struct TablePartition {
+    table_id: i64,
+    partition_id: PartitionId,
+}
+
+impl TablePartition {
+    pub fn new(table_id: i64, partition_id: PartitionId) -> Self {
+        Self {
+            table_id,
+            partition_id,
+        }
+    }
+
+    pub fn get_table_id(&self) -> i64 {
+        self.table_id
+    }
+
+    pub fn get_partition_id(&self) -> PartitionId {
+        self.partition_id
+    }
+}
+
+impl Display for TablePartition {
+    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+        write!(
+            f,
+            "TablePartition{{tableId={}, partitionId={}}}",
+            self.table_id, self.partition_id
+        )
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_resolved_partition_spec_name() {
+        let spec = ResolvedPartitionSpec::new(
+            vec!["date".to_string(), "region".to_string()],
+            vec!["2024-01-15".to_string(), "US".to_string()],
+        )
+        .unwrap();
+
+        assert_eq!(spec.get_partition_name(), "2024-01-15$US");
+        assert_eq!(
+            spec.get_partition_qualified_name(),
+            "date=2024-01-15/region=US"
+        );
+    }
+
+    #[test]
+    fn test_resolved_partition_spec_from_partition_name() {
+        let spec = ResolvedPartitionSpec::from_partition_name(
+            vec!["date".to_string(), "region".to_string()],
+            "2024-01-15$US",
+        );
+
+        assert_eq!(spec.get_partition_values(), &["2024-01-15", "US"]);
+    }
+
+    #[test]
+    fn test_resolved_partition_spec_from_qualified_name() {
+        let spec =
+            ResolvedPartitionSpec::from_partition_qualified_name("date=2024-01-15/region=US")
+                .unwrap();
+
+        assert_eq!(spec.get_partition_keys(), &["date", "region"]);
+        assert_eq!(spec.get_partition_values(), &["2024-01-15", "US"]);
+    }
+
+    #[test]
+    fn test_resolved_partition_spec_mismatched_lengths() {
+        let result = ResolvedPartitionSpec::new(
+            vec!["date".to_string(), "region".to_string()],
+            vec!["2024-01-15".to_string()],
+        );
+
+        assert!(result.is_err());
+    }
+
+    #[test]
+    fn test_partition_info() {
+        let spec =
+            ResolvedPartitionSpec::new(vec!["date".to_string()], vec!["2024-01-15".to_string()])
+                .unwrap();
+
+        let info = PartitionInfo::new(42, spec);
+        assert_eq!(info.get_partition_id(), 42);
+        assert_eq!(info.get_partition_name(), "2024-01-15");
+    }
+
+    #[test]
+    fn test_table_partition() {
+        let tp = TablePartition::new(100, 42);
+        assert_eq!(tp.get_table_id(), 100);
+        assert_eq!(tp.get_partition_id(), 42);
+    }
+
+    #[test]
+    fn test_partition_spec_pb_roundtrip() {
+        let mut map = HashMap::new();
+        map.insert("date".to_string(), "2024-01-15".to_string());
+        let spec = PartitionSpec::new(map);
+
+        let pb = spec.to_pb();
+        let restored = PartitionSpec::from_pb(&pb);
+
+        assert_eq!(
+            spec.get_spec_map().get("date"),
+            restored.get_spec_map().get("date")
+        );
+    }
+
+    #[test]
+    fn test_partition_info_pb_roundtrip() {
+        let spec =
+            ResolvedPartitionSpec::new(vec!["date".to_string()], vec!["2024-01-15".to_string()])
+                .unwrap();
+        let info = PartitionInfo::new(42, spec);
+
+        let pb = info.to_pb();
+        let restored = PartitionInfo::from_pb(&pb);
+
+        assert_eq!(info.get_partition_id(), restored.get_partition_id());
+        assert_eq!(info.get_partition_name(), restored.get_partition_name());
+    }
+
+    #[test]
+    fn test_contains() {
+        let full_spec = ResolvedPartitionSpec::new(
+            vec!["date".to_string(), "region".to_string()],
+            vec!["2024-01-15".to_string(), "US".to_string()],
+        )
+        .unwrap();
+
+        let partial_spec =
+            ResolvedPartitionSpec::new(vec!["date".to_string()], vec!["2024-01-15".to_string()])
+                .unwrap();
+
+        assert!(full_spec.contains(&partial_spec).unwrap());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index f4cf972d26..c4a9195403 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -20,6 +20,7 @@ use crate::error::Error::{IllegalArgument, InvalidTableError};
 use crate::error::{Error, Result};
 use crate::metadata::DataLakeFormat;
 use crate::metadata::datatype::{DataField, DataType, RowType};
+use crate::{BucketId, PartitionId, TableId};
 use core::fmt;
 use serde::{Deserialize, Serialize};
 use std::collections::{HashMap, HashSet};
@@ -697,32 +698,71 @@ impl TablePath {
     }
 }
 
+/// A database name, table name and partition name combo. It's used to represent the physical path of
+/// a bucket. If the bucket belongs to a partition (i.e., the table is a partitioned table),
+/// `partition_name` will be `Some(...)`; otherwise, it will be `None`.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
 pub struct PhysicalTablePath {
     table_path: TablePath,
-    #[allow(dead_code)]
-    partition: Option<String>,
+    partition_name: Option<String>,
 }
 
 impl PhysicalTablePath {
     pub fn of(table_path: TablePath) -> Self {
         Self {
             table_path,
-            partition: None,
+            partition_name: None,
         }
     }
 
-    // TODO: support partition
+    pub fn of_partitioned(table_path: TablePath, partition_name: Option<String>) -> Self {
+        Self {
+            table_path,
+            partition_name,
+        }
+    }
+
+    pub fn of_with_names(
+        database_name: String,
+        table_name: String,
+        partition_name: Option<String>,
+    ) -> Self {
+        Self {
+            table_path: TablePath::new(database_name, table_name),
+            partition_name,
+        }
+    }
 
     pub fn get_table_path(&self) -> &TablePath {
         &self.table_path
     }
+
+    pub fn get_database_name(&self) -> &str {
+        self.table_path.database()
+    }
+
+    pub fn get_table_name(&self) -> &str {
+        self.table_path.table()
+    }
+
+    pub fn get_partition_name(&self) -> Option<&String> {
+        self.partition_name.as_ref()
+    }
+}
+
+impl Display for PhysicalTablePath {
+    fn fmt(&self, f: &mut Formatter<'_>) -> fmt::Result {
+        match &self.partition_name {
+            Some(partition) => write!(f, "{}(p={})", self.table_path, partition),
+            None => write!(f, "{}", self.table_path),
+        }
+    }
 }
 
 #[derive(Debug, Clone)]
 pub struct TableInfo {
     pub table_path: TablePath,
-    pub table_id: i64,
+    pub table_id: TableId,
     pub schema_id: i32,
     pub schema: Schema,
     pub row_type: RowType,
@@ -819,7 +859,7 @@ impl TableInfo {
     #[allow(clippy::too_many_arguments)]
     pub fn new(
         table_path: TablePath,
-        table_id: i64,
+        table_id: TableId,
         schema_id: i32,
         schema: Schema,
         bucket_keys: Vec<String>,
@@ -1000,13 +1040,13 @@ impl Display for TableInfo {
 
 #[derive(Debug, Clone, Serialize, Deserialize, Hash, PartialEq, Eq)]
 pub struct TableBucket {
-    table_id: i64,
-    partition_id: Option<i64>,
-    bucket: i32,
+    table_id: TableId,
+    partition_id: Option<PartitionId>,
+    bucket: BucketId,
 }
 
 impl TableBucket {
-    pub fn new(table_id: i64, bucket: i32) -> Self {
+    pub fn new(table_id: TableId, bucket: BucketId) -> Self {
         TableBucket {
             table_id,
             partition_id: None,
@@ -1014,15 +1054,15 @@ impl TableBucket {
         }
     }
 
-    pub fn table_id(&self) -> i64 {
+    pub fn table_id(&self) -> TableId {
         self.table_id
     }
 
-    pub fn bucket_id(&self) -> i32 {
+    pub fn bucket_id(&self) -> BucketId {
         self.bucket
     }
 
-    pub fn partition_id(&self) -> Option<i64> {
+    pub fn partition_id(&self) -> Option<PartitionId> {
         self.partition_id
     }
 }
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index 65eddce71e..eca4cf3846 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -374,4 +374,38 @@ message PbLookupRespForBucket {
 
 message PbValue {
   optional bytes values = 1;
-}
\ No newline at end of file
+}
+
+message PbPartitionSpec {
+  repeated PbKeyValue partition_key_values = 1;
+}
+
+message PbPartitionInfo {
+  required int64 partition_id = 1;
+  required PbPartitionSpec partition_spec = 2;
+}
+
+message ListPartitionInfosRequest {
+  required PbTablePath table_path = 1;
+  optional PbPartitionSpec partial_partition_spec = 2;
+}
+
+message ListPartitionInfosResponse {
+  repeated PbPartitionInfo partitions_info = 1;
+}
+
+message CreatePartitionRequest {
+  required PbTablePath table_path = 1;
+  required PbPartitionSpec partition_spec = 2;
+  required bool ignore_if_exists = 3;
+}
+
+message CreatePartitionResponse {}
+
+message DropPartitionRequest {
+  required PbTablePath table_path = 1;
+  required PbPartitionSpec partition_spec = 2;
+  required bool ignore_if_not_exists = 3;
+}
+
+message DropPartitionResponse {}
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index 66e4beb8e4..f6009c071e 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -27,6 +27,7 @@ pub enum ApiKey {
     DropTable,
     GetTable,
     ListTables,
+    ListPartitionInfos,
     TableExists,
     MetaData,
     ProduceLog,
@@ -37,6 +38,8 @@ pub enum ApiKey {
     GetFileSystemSecurityToken,
     GetDatabaseInfo,
     GetLatestLakeSnapshot,
+    CreatePartition,
+    DropPartition,
     Unknown(i16),
 }
 
@@ -51,6 +54,7 @@ impl From<i16> for ApiKey {
             1006 => ApiKey::DropTable,
             1007 => ApiKey::GetTable,
             1008 => ApiKey::ListTables,
+            1009 => ApiKey::ListPartitionInfos,
             1010 => ApiKey::TableExists,
             1012 => ApiKey::MetaData,
             1014 => ApiKey::ProduceLog,
@@ -61,6 +65,8 @@ impl From<i16> for ApiKey {
             1025 => ApiKey::GetFileSystemSecurityToken,
             1032 => ApiKey::GetLatestLakeSnapshot,
             1035 => ApiKey::GetDatabaseInfo,
+            1036 => ApiKey::CreatePartition,
+            1037 => ApiKey::DropPartition,
             _ => Unknown(key),
         }
     }
@@ -77,6 +83,7 @@ impl From<ApiKey> for i16 {
             ApiKey::DropTable => 1006,
             ApiKey::GetTable => 1007,
             ApiKey::ListTables => 1008,
+            ApiKey::ListPartitionInfos => 1009,
             ApiKey::TableExists => 1010,
             ApiKey::MetaData => 1012,
             ApiKey::ProduceLog => 1014,
@@ -87,6 +94,8 @@ impl From<ApiKey> for i16 {
             ApiKey::GetFileSystemSecurityToken => 1025,
             ApiKey::GetLatestLakeSnapshot => 1032,
             ApiKey::GetDatabaseInfo => 1035,
+            ApiKey::CreatePartition => 1036,
+            ApiKey::DropPartition => 1037,
             Unknown(x) => x,
         }
     }
@@ -107,6 +116,7 @@ mod tests {
             (1006, ApiKey::DropTable),
             (1007, ApiKey::GetTable),
             (1008, ApiKey::ListTables),
+            (1009, ApiKey::ListPartitionInfos),
             (1010, ApiKey::TableExists),
             (1012, ApiKey::MetaData),
             (1014, ApiKey::ProduceLog),
@@ -117,6 +127,8 @@ mod tests {
             (1025, ApiKey::GetFileSystemSecurityToken),
             (1032, ApiKey::GetLatestLakeSnapshot),
             (1035, ApiKey::GetDatabaseInfo),
+            (1036, ApiKey::CreatePartition),
+            (1037, ApiKey::DropPartition),
         ];
 
         for (raw, key) in cases {
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs b/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs
new file mode 100644
index 0000000000..93dbf70d3b
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs
@@ -0,0 +1,72 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::{PartitionSpec, TablePath};
+use crate::proto::CreatePartitionResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::convert::to_table_path;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+/// Request body for the `CreatePartition` API.
+///
+/// Wraps the protobuf message [`proto::CreatePartitionRequest`].
+#[derive(Debug)]
+pub struct CreatePartitionRequest {
+    /// The underlying protobuf message.
+    pub inner_request: proto::CreatePartitionRequest,
+}
+
+impl CreatePartitionRequest {
+    /// Builds the request from a table path, a partition spec and the
+    /// `ignore_if_exists` flag. The path and spec are converted to their
+    /// protobuf forms; the flag is copied as-is.
+    ///
+    /// NOTE(review): presumably `ignore_if_exists` asks the server not to fail
+    /// when the partition already exists; confirm against the server contract.
+    pub fn new(
+        table_path: &TablePath,
+        partition_spec: &PartitionSpec,
+        ignore_if_exists: bool,
+    ) -> Self {
+        CreatePartitionRequest {
+            inner_request: proto::CreatePartitionRequest {
+                table_path: to_table_path(table_path),
+                partition_spec: partition_spec.to_pb(),
+                ignore_if_exists,
+            },
+        }
+    }
+}
+
+/// Binds the request to its response type, API key and request version.
+impl RequestBody for CreatePartitionRequest {
+    type ResponseBody = CreatePartitionResponse;
+
+    const API_KEY: ApiKey = ApiKey::CreatePartition;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+// NOTE(review): these macros presumably provide the versioned write/read
+// implementations for the request and response; see their definitions.
+impl_write_version_type!(CreatePartitionRequest);
+impl_read_version_type!(CreatePartitionResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/drop_partition.rs b/fluss-rust/crates/fluss/src/rpc/message/drop_partition.rs
new file mode 100644
index 0000000000..ddc97d8300
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/drop_partition.rs
@@ -0,0 +1,72 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::{PartitionSpec, TablePath};
+use crate::proto::DropPartitionResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::convert::to_table_path;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+/// Request body for the `DropPartition` API.
+///
+/// Wraps the protobuf message [`proto::DropPartitionRequest`].
+#[derive(Debug)]
+pub struct DropPartitionRequest {
+    /// The underlying protobuf message.
+    pub inner_request: proto::DropPartitionRequest,
+}
+
+impl DropPartitionRequest {
+    /// Builds the request from a table path, a partition spec and the
+    /// `ignore_if_not_exists` flag. The path and spec are converted to their
+    /// protobuf forms; the flag is copied as-is.
+    ///
+    /// NOTE(review): presumably `ignore_if_not_exists` asks the server not to
+    /// fail when the partition is absent; confirm against the server contract.
+    pub fn new(
+        table_path: &TablePath,
+        partition_spec: &PartitionSpec,
+        ignore_if_not_exists: bool,
+    ) -> Self {
+        DropPartitionRequest {
+            inner_request: proto::DropPartitionRequest {
+                table_path: to_table_path(table_path),
+                partition_spec: partition_spec.to_pb(),
+                ignore_if_not_exists,
+            },
+        }
+    }
+}
+
+/// Binds the request to its response type, API key and request version.
+impl RequestBody for DropPartitionRequest {
+    type ResponseBody = DropPartitionResponse;
+
+    const API_KEY: ApiKey = ApiKey::DropPartition;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+// NOTE(review): these macros presumably provide the versioned write/read
+// implementations for the request and response; see their definitions.
+impl_write_version_type!(DropPartitionRequest);
+impl_read_version_type!(DropPartitionResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
index fcecb4188c..262645a6d9 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
@@ -15,7 +15,9 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::{
+    BucketId, PartitionId, TableId, impl_read_version_type, impl_write_version_type, proto,
+};
 
 use crate::error::Result as FlussResult;
 use crate::error::{Error, FlussError};
@@ -74,9 +76,9 @@ pub struct ListOffsetsRequest {
 
 impl ListOffsetsRequest {
     pub fn new(
-        table_id: i64,
-        partition_id: Option<i64>,
-        bucket_ids: Vec<i32>,
+        table_id: TableId,
+        partition_id: Option<PartitionId>,
+        bucket_ids: Vec<BucketId>,
         offset_spec: OffsetSpec,
     ) -> Self {
         ListOffsetsRequest {
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_partition_infos.rs b/fluss-rust/crates/fluss/src/rpc/message/list_partition_infos.rs
new file mode 100644
index 0000000000..ab693671e5
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_partition_infos.rs
@@ -0,0 +1,78 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::{PartitionInfo, PartitionSpec, TablePath};
+use crate::proto::ListPartitionInfosResponse;
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::convert::to_table_path;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+/// Request body for the `ListPartitionInfos` API.
+///
+/// Wraps the protobuf message [`proto::ListPartitionInfosRequest`].
+#[derive(Debug)]
+pub struct ListPartitionInfosRequest {
+    /// The underlying protobuf message.
+    pub inner_request: proto::ListPartitionInfosRequest,
+}
+
+impl ListPartitionInfosRequest {
+    /// Builds the request for `table_path`. When `partial_partition_spec` is
+    /// `Some`, it is converted to protobuf and attached; when `None`, the
+    /// optional field is left unset.
+    ///
+    /// NOTE(review): presumably the partial spec restricts the listing to
+    /// partitions matching the given key/value pairs; confirm server-side.
+    pub fn new(table_path: &TablePath, partial_partition_spec: Option<&PartitionSpec>) -> Self {
+        ListPartitionInfosRequest {
+            inner_request: proto::ListPartitionInfosRequest {
+                table_path: to_table_path(table_path),
+                partial_partition_spec: partial_partition_spec.map(|s| s.to_pb()),
+            },
+        }
+    }
+}
+
+/// Binds the request to its response type, API key and request version.
+impl RequestBody for ListPartitionInfosRequest {
+    type ResponseBody = ListPartitionInfosResponse;
+
+    const API_KEY: ApiKey = ApiKey::ListPartitionInfos;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+// NOTE(review): these macros presumably provide the versioned write/read
+// implementations for the request and response; see their definitions.
+impl_write_version_type!(ListPartitionInfosRequest);
+impl_read_version_type!(ListPartitionInfosResponse);
+
+impl ListPartitionInfosResponse {
+    /// Converts every protobuf entry in `partitions_info` into a
+    /// [`PartitionInfo`] and returns them as a new vector.
+    pub fn get_partitions_info(&self) -> Vec<PartitionInfo> {
+        self.partitions_info
+            .iter()
+            .map(PartitionInfo::from_pb)
+            .collect()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 881a64f687..addb97a15f 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -21,9 +21,11 @@ use crate::rpc::frame::{ReadError, WriteError};
 use bytes::{Buf, BufMut};
 
 mod create_database;
+mod create_partition;
 mod create_table;
 mod database_exists;
 mod drop_database;
+mod drop_partition;
 mod drop_table;
 mod fetch;
 mod get_database_info;
@@ -33,6 +35,7 @@ mod get_table;
 mod header;
 mod list_databases;
 mod list_offsets;
+mod list_partition_infos;
 mod list_tables;
 mod lookup;
 mod produce_log;
@@ -42,9 +45,11 @@ mod update_metadata;
 
 pub use crate::rpc::RpcError;
 pub use create_database::*;
+pub use create_partition::*;
 pub use create_table::*;
 pub use database_exists::*;
 pub use drop_database::*;
+pub use drop_partition::*;
 pub use drop_table::*;
 pub use fetch::*;
 pub use get_database_info::*;
@@ -54,6 +59,7 @@ pub use get_table::*;
 pub use header::*;
 pub use list_databases::*;
 pub use list_offsets::*;
+pub use list_partition_infos::*;
 pub use list_tables::*;
 pub use lookup::*;
 pub use produce_log::*;
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
index 156ef04956..3760487d42 100644
--- a/fluss-rust/crates/fluss/src/util/mod.rs
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -18,6 +18,7 @@
 pub mod murmur_hash;
 pub mod varint;
 
+use crate::TableId;
 use crate::metadata::TableBucket;
 use linked_hash_map::LinkedHashMap;
 use std::collections::{HashMap, HashSet};
@@ -151,7 +152,7 @@ impl<S> FairBucketStatusMap<S> {
         self.map.clear();
 
         // Group buckets by table ID
-        let mut table_to_buckets: LinkedHashMap<i64, Vec<TableBucket>> = LinkedHashMap::new();
+        let mut table_to_buckets: LinkedHashMap<TableId, Vec<TableBucket>> = LinkedHashMap::new();
         for bucket in bucket_to_status.keys() {
             table_to_buckets
                 .entry(bucket.table_id())
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index fbdb295d40..9842a5aa7e 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -37,9 +37,10 @@ mod admin_test {
     use crate::integration::utils::{get_cluster, start_cluster, stop_cluster};
     use fluss::error::FlussError;
     use fluss::metadata::{
-        DataTypes, DatabaseDescriptorBuilder, KvFormat, LogFormat, Schema, TableDescriptor,
-        TablePath,
+        DataTypes, DatabaseDescriptorBuilder, KvFormat, LogFormat, PartitionSpec, Schema,
+        TableDescriptor, TablePath,
     };
+    use std::collections::HashMap;
     use std::sync::Arc;
 
     fn before_all() {
@@ -223,6 +224,146 @@ mod admin_test {
         assert_eq!(admin.database_exists(test_db_name).await.unwrap(), false);
     }
 
+    #[tokio::test]
+    async fn test_partition_apis() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection
+            .get_admin()
+            .await
+            .expect("Failed to get admin client");
+
+        let test_db_name = "test_partition_apis_db";
+        let db_descriptor = DatabaseDescriptorBuilder::default()
+            .comment("Database for test_partition_apis")
+            .build();
+
+        admin
+            .create_database(test_db_name, true, Some(&db_descriptor))
+            .await
+            .expect("Failed to create test database");
+
+        let test_table_name = "partitioned_table";
+        let table_path = TablePath::new(test_db_name.to_string(), test_table_name.to_string());
+
+        let table_schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .column("dt", DataTypes::string())
+            .column("region", DataTypes::string())
+            .primary_key(vec![
+                "id".to_string(),
+                "dt".to_string(),
+                "region".to_string(),
+            ])
+            .build()
+            .expect("Failed to build table schema");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(table_schema)
+            .distributed_by(Some(3), vec!["id".to_string()])
+            .partitioned_by(vec!["dt".to_string(), "region".to_string()])
+            .property("table.replication.factor", "1")
+            .log_format(LogFormat::ARROW)
+            .kv_format(KvFormat::COMPACTED)
+            .build()
+            .expect("Failed to build table descriptor");
+
+        admin
+            .create_table(&table_path, &table_descriptor, true)
+            .await
+            .expect("Failed to create partitioned table");
+
+        let partitions = admin
+            .list_partition_infos(&table_path)
+            .await
+            .expect("Failed to list partitions");
+        assert!(
+            partitions.is_empty(),
+            "Expected no partitions initially, found {}",
+            partitions.len()
+        );
+
+        let mut partition_values = HashMap::new();
+        partition_values.insert("dt".to_string(), "2024-01-15".to_string());
+        partition_values.insert("region".to_string(), "EMEA".to_string());
+        let partition_spec = PartitionSpec::new(partition_values);
+
+        admin
+            .create_partition(&table_path, &partition_spec, false)
+            .await
+            .expect("Failed to create partition");
+
+        let partitions = admin
+            .list_partition_infos(&table_path)
+            .await
+            .expect("Failed to list partitions");
+        assert_eq!(
+            partitions.len(),
+            1,
+            "Expected exactly one partition after creation"
+        );
+        assert_eq!(
+            partitions[0].get_partition_name(),
+            "2024-01-15$EMEA",
+            "Partition name mismatch"
+        );
+
+        // list with partial spec filter - should find the partition
+        let mut partition_values = HashMap::new();
+        partition_values.insert("dt".to_string(), "2024-01-15".to_string());
+        let partial_partition_spec = PartitionSpec::new(partition_values);
+
+        let partitions_with_spec = admin
+            .list_partition_infos_with_spec(&table_path, Some(&partial_partition_spec))
+            .await
+            .expect("Failed to list partitions with spec");
+        assert_eq!(
+            partitions_with_spec.len(),
+            1,
+            "Expected one partition matching the spec"
+        );
+        assert_eq!(
+            partitions_with_spec[0].get_partition_name(),
+            "2024-01-15$EMEA",
+            "Partition name mismatch with spec filter"
+        );
+
+        // list with non-matching spec - should find no partitions
+        let mut non_matching_values = HashMap::new();
+        non_matching_values.insert("dt".to_string(), "2024-01-16".to_string());
+        let non_matching_spec = PartitionSpec::new(non_matching_values);
+        let partitions_non_matching = admin
+            .list_partition_infos_with_spec(&table_path, Some(&non_matching_spec))
+            .await
+            .expect("Failed to list partitions with non-matching spec");
+        assert!(
+            partitions_non_matching.is_empty(),
+            "Expected no partitions for non-matching spec"
+        );
+
+        admin
+            .drop_partition(&table_path, &partition_spec, false)
+            .await
+            .expect("Failed to drop partition");
+
+        let partitions = admin
+            .list_partition_infos(&table_path)
+            .await
+            .expect("Failed to list partitions");
+        assert!(
+            partitions.is_empty(),
+            "Expected no partitions after drop, found {}",
+            partitions.len()
+        );
+
+        admin
+            .drop_table(&table_path, true)
+            .await
+            .expect("Failed to drop table");
+        let _ = admin.drop_database(test_db_name, true, true).await; // best-effort cleanup
+    }
+
     #[tokio::test]
     async fn test_fluss_error_response() {
         let cluster = get_fluss_cluster();

From 8406db0ee42caf00c55ec33b13b834860ae49998 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 25 Jan 2026 08:31:08 +0000
Subject: [PATCH 086/287] chore: add more info for RecordBatches (#211)

---
 .../src/client/table/log_fetch_buffer.rs      | 28 ++++---
 .../crates/fluss/src/client/table/scanner.rs  | 44 +++++++----
 fluss-rust/crates/fluss/src/record/mod.rs     | 77 +++++++++++++++++++
 .../crates/fluss/tests/integration/table.rs   | 20 +++--
 4 files changed, 133 insertions(+), 36 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index 4a64eda25a..b529806f84 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -65,7 +65,7 @@ pub trait CompletedFetch: Send + Sync {
     fn fetch_error_context(&self) -> Option<&FetchErrorContext>;
     fn take_error(&mut self) -> Option<Error>;
     fn fetch_records(&mut self, max_records: usize) -> Result<Vec<ScanRecord>>;
-    fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<RecordBatch>>;
+    fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<(RecordBatch, i64)>>;
     fn is_consumed(&self) -> bool;
     fn records_read(&self) -> usize;
     fn drain(&mut self);
@@ -476,8 +476,9 @@ impl DefaultCompletedFetch {
             source: None,
         }
     }
-    /// Get the next batch directly without row iteration
-    fn next_fetched_batch(&mut self) -> Result<Option<RecordBatch>> {
+    /// Get the next batch with its base offset.
+    /// Returns (RecordBatch, base_offset) where base_offset is the offset of the first record.
+    fn next_fetched_batch(&mut self) -> Result<Option<(RecordBatch, i64)>> {
         loop {
             let Some(log_batch_result) = self.log_record_batch.next() else {
                 self.drain();
@@ -492,20 +493,23 @@ impl DefaultCompletedFetch {
                 continue;
             }
 
-            // Truncate batch
-            let base_offset = log_batch.base_log_offset();
-            if self.next_fetch_offset > base_offset {
-                let skip_count = (self.next_fetch_offset - base_offset) as usize;
+            // Calculate the effective base offset for this batch
+            let log_base_offset = log_batch.base_log_offset();
+            let effective_base_offset = if self.next_fetch_offset > log_base_offset {
+                let skip_count = (self.next_fetch_offset - log_base_offset) as usize;
                 if skip_count >= record_batch.num_rows() {
                     continue;
                 }
                 // Slice the batch to skip the first skip_count rows
                 record_batch = record_batch.slice(skip_count, record_batch.num_rows() - skip_count);
-            }
+                self.next_fetch_offset
+            } else {
+                log_base_offset
+            };
 
             self.next_fetch_offset = log_batch.next_log_offset();
             self.records_read += record_batch.num_rows();
-            return Ok(Some(record_batch));
+            return Ok(Some((record_batch, effective_base_offset)));
         }
     }
 }
@@ -585,7 +589,7 @@ impl CompletedFetch for DefaultCompletedFetch {
         Ok(scan_records)
     }
 
-    fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<RecordBatch>> {
+    fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<(RecordBatch, i64)>> {
         if let Some(error) = self.error.take() {
             return Err(error);
         }
@@ -607,7 +611,7 @@ impl CompletedFetch for DefaultCompletedFetch {
 
         for _ in 0..max_batches {
             match self.next_fetched_batch()? {
-                Some(batch) => batches.push(batch),
+                Some(batch_with_offset) => batches.push(batch_with_offset),
                 None => break,
             }
         }
@@ -692,7 +696,7 @@ impl CompletedFetch for RemoteCompletedFetch {
         self.inner.fetch_records(max_records)
     }
 
-    fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<RecordBatch>> {
+    fn fetch_batches(&mut self, max_batches: usize) -> Result<Vec<(RecordBatch, i64)>> {
         self.inner.fetch_batches(max_batches)
     }
 
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 61ed56e1df..dbebe1aca4 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -15,7 +15,6 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use arrow::array::RecordBatch;
 use arrow_schema::SchemaRef;
 use log::{debug, warn};
 use parking_lot::{Mutex, RwLock};
@@ -39,7 +38,9 @@ use crate::client::table::remote_log::{RemoteLogDownloader, RemoteLogFetchInfo};
 use crate::error::{ApiError, Error, FlussError, Result};
 use crate::metadata::{PhysicalTablePath, TableBucket, TableInfo, TablePath};
 use crate::proto::{ErrorResponse, FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
-use crate::record::{LogRecordsBatches, ReadContext, ScanRecord, ScanRecords, to_arrow_schema};
+use crate::record::{
+    LogRecordsBatches, ReadContext, ScanBatch, ScanRecord, ScanRecords, to_arrow_schema,
+};
 use crate::rpc::{RpcClient, RpcError, message};
 use crate::util::FairBucketStatusMap;
 
@@ -380,7 +381,7 @@ impl LogScannerInner {
         self.log_fetcher.collect_fetches()
     }
 
-    async fn poll_batches(&self, timeout: Duration) -> Result<Vec<RecordBatch>> {
+    async fn poll_batches(&self, timeout: Duration) -> Result<Vec<ScanBatch>> {
         let start = Instant::now();
         let deadline = start + timeout;
 
@@ -410,7 +411,7 @@ impl LogScannerInner {
         }
     }
 
-    async fn poll_for_batches(&self) -> Result<Vec<RecordBatch>> {
+    async fn poll_for_batches(&self) -> Result<Vec<ScanBatch>> {
         let result = self.log_fetcher.collect_batches()?;
         if !result.is_empty() {
             return Ok(result);
@@ -438,7 +439,8 @@ impl LogScanner {
 
 // Implementation for RecordBatchLogScanner (batches mode)
 impl RecordBatchLogScanner {
-    pub async fn poll(&self, timeout: Duration) -> Result<Vec<RecordBatch>> {
+    /// Poll for batches with metadata (bucket and offset information).
+    pub async fn poll(&self, timeout: Duration) -> Result<Vec<ScanBatch>> {
         self.inner.poll_batches(timeout).await
     }
 
@@ -1134,13 +1136,13 @@ impl LogFetcher {
         }
     }
 
-    /// Collect completed fetches as RecordBatches
-    fn collect_batches(&self) -> Result<Vec<RecordBatch>> {
+    /// Collect completed fetches as ScanBatches (with bucket and offset metadata)
+    fn collect_batches(&self) -> Result<Vec<ScanBatch>> {
         // Limit memory usage with both batch count and byte size constraints.
         // Max 100 batches per poll, but also check total bytes (soft cap ~64MB).
         const MAX_BATCHES: usize = 100;
         const MAX_BYTES: usize = 64 * 1024 * 1024; // 64MB soft cap
-        let mut result: Vec<RecordBatch> = Vec::new();
+        let mut result: Vec<ScanBatch> = Vec::new();
         let mut batches_remaining = MAX_BATCHES;
         let mut bytes_consumed: usize = 0;
 
@@ -1150,17 +1152,19 @@ impl LogFetcher {
 
                 match next_in_line {
                     Some(mut next_fetch) if !next_fetch.is_consumed() => {
-                        let batches =
+                        let scan_batches =
                             self.fetch_batches_from_fetch(&mut next_fetch, batches_remaining)?;
-                        let batch_count = batches.len();
+                        let batch_count = scan_batches.len();
 
-                        if !batches.is_empty() {
+                        if !scan_batches.is_empty() {
                             // Track bytes consumed (soft cap - may exceed by one fetch)
-                            let batch_bytes: usize =
-                                batches.iter().map(|b| b.get_array_memory_size()).sum();
+                            let batch_bytes: usize = scan_batches
+                                .iter()
+                                .map(|sb| sb.batch().get_array_memory_size())
+                                .sum();
                             bytes_consumed += batch_bytes;
 
-                            result.extend(batches);
+                            result.extend(scan_batches);
                             batches_remaining = batches_remaining.saturating_sub(batch_count);
                         }
 
@@ -1214,7 +1218,7 @@ impl LogFetcher {
         &self,
         next_in_line_fetch: &mut Box<dyn CompletedFetch>,
         max_batches: usize,
-    ) -> Result<Vec<RecordBatch>> {
+    ) -> Result<Vec<ScanBatch>> {
         let table_bucket = next_in_line_fetch.table_bucket().clone();
         let current_offset = self.log_scanner_status.get_bucket_offset(&table_bucket);
 
@@ -1230,7 +1234,7 @@ impl LogFetcher {
         let fetch_offset = next_in_line_fetch.next_fetch_offset();
 
         if fetch_offset == current_offset {
-            let batches = next_in_line_fetch.fetch_batches(max_batches)?;
+            let batches_with_offsets = next_in_line_fetch.fetch_batches(max_batches)?;
             let next_fetch_offset = next_in_line_fetch.next_fetch_offset();
 
             if next_fetch_offset > current_offset {
@@ -1238,7 +1242,13 @@ impl LogFetcher {
                     .update_offset(&table_bucket, next_fetch_offset);
             }
 
-            Ok(batches)
+            // Convert to ScanBatch with bucket info
+            Ok(batches_with_offsets
+                .into_iter()
+                .map(|(batch, base_offset)| {
+                    ScanBatch::new(table_bucket.clone(), batch, base_offset)
+                })
+                .collect())
         } else {
             warn!(
                 "Ignoring fetched batches for {table_bucket:?} at offset {fetch_offset} since the current offset is {current_offset}"
diff --git a/fluss-rust/crates/fluss/src/record/mod.rs b/fluss-rust/crates/fluss/src/record/mod.rs
index 94997e8d80..8438b16d54 100644
--- a/fluss-rust/crates/fluss/src/record/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/mod.rs
@@ -17,6 +17,7 @@
 
 use crate::metadata::TableBucket;
 use crate::row::ColumnarRow;
+use ::arrow::array::RecordBatch;
 use core::fmt;
 use std::collections::HashMap;
 
@@ -170,6 +171,60 @@ impl ScanRecords {
     }
 }
 
+/// A batch of records with metadata about bucket and offsets.
+///
+/// This is the batch-level equivalent of [`ScanRecord`], providing efficient
+/// access to Arrow RecordBatches while preserving the bucket and offset information
+/// needed for tracking consumption progress.
+#[derive(Debug, Clone)]
+pub struct ScanBatch {
+    /// The bucket this batch belongs to
+    bucket: TableBucket,
+    /// The Arrow RecordBatch containing the data
+    batch: RecordBatch,
+    /// Offset of the first record in this batch
+    base_offset: i64,
+}
+
+impl ScanBatch {
+    pub fn new(bucket: TableBucket, batch: RecordBatch, base_offset: i64) -> Self {
+        Self {
+            bucket,
+            batch,
+            base_offset,
+        }
+    }
+
+    pub fn bucket(&self) -> &TableBucket {
+        &self.bucket
+    }
+
+    pub fn batch(&self) -> &RecordBatch {
+        &self.batch
+    }
+
+    pub fn into_batch(self) -> RecordBatch {
+        self.batch
+    }
+
+    pub fn base_offset(&self) -> i64 {
+        self.base_offset
+    }
+
+    pub fn num_records(&self) -> usize {
+        self.batch.num_rows()
+    }
+
+    /// Returns the offset of the last record, or `base_offset - 1` when the batch has no rows.
+    pub fn last_offset(&self) -> i64 {
+        if self.batch.num_rows() == 0 {
+            self.base_offset - 1
+        } else {
+            self.base_offset + self.batch.num_rows() as i64 - 1
+        }
+    }
+}
+
 impl IntoIterator for ScanRecords {
     type Item = ScanRecord;
     type IntoIter = std::vec::IntoIter<ScanRecord>;
@@ -243,4 +298,26 @@ mod tests {
         assert_eq!(record.timestamp(), -1);
         assert_eq!(record.change_type(), &ChangeType::Insert);
     }
+
+    #[test]
+    fn scan_batch_last_offset() {
+        let schema = Arc::new(Schema::new(vec![Field::new("v", DataType::Int32, false)]));
+        let bucket = TableBucket::new(1, 0);
+
+        // Batch with 3 records starting at offset 100 -> last_offset = 102
+        let batch = RecordBatch::try_new(
+            schema.clone(),
+            vec![Arc::new(Int32Array::from(vec![1, 2, 3]))],
+        )
+        .unwrap();
+        let scan_batch = ScanBatch::new(bucket.clone(), batch, 100);
+        assert_eq!(scan_batch.num_records(), 3);
+        assert_eq!(scan_batch.last_offset(), 102);
+
+        // Empty batch -> last_offset = base_offset - 1
+        let empty_batch = RecordBatch::new_empty(schema);
+        let empty_scan_batch = ScanBatch::new(bucket, empty_batch, 100);
+        assert_eq!(empty_scan_batch.num_records(), 0);
+        assert_eq!(empty_scan_batch.last_offset(), 99);
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index ef73b5685f..046ec02388 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -498,8 +498,10 @@ mod table_test {
         let all_ids: Vec<i32> = batches
             .iter()
             .flat_map(|b| {
-                (0..b.num_rows()).map(|i| {
-                    b.column(0)
+                let batch = b.batch();
+                (0..batch.num_rows()).map(move |i| {
+                    batch
+                        .column(0)
                         .as_any()
                         .downcast_ref::<Int32Array>()
                         .unwrap()
@@ -523,8 +525,10 @@ mod table_test {
         let new_ids: Vec<i32> = more
             .iter()
             .flat_map(|b| {
-                (0..b.num_rows()).map(|i| {
-                    b.column(0)
+                let batch = b.batch();
+                (0..batch.num_rows()).map(move |i| {
+                    batch
+                        .column(0)
                         .as_any()
                         .downcast_ref::<Int32Array>()
                         .unwrap()
@@ -544,8 +548,10 @@ mod table_test {
         let trunc_ids: Vec<i32> = trunc_batches
             .iter()
             .flat_map(|b| {
-                (0..b.num_rows()).map(|i| {
-                    b.column(0)
+                let batch = b.batch();
+                (0..batch.num_rows()).map(move |i| {
+                    batch
+                        .column(0)
                         .as_any()
                         .downcast_ref::<Int32Array>()
                         .unwrap()
@@ -568,6 +574,6 @@ mod table_test {
         let proj_batches = proj.poll(Duration::from_secs(10)).await.unwrap();
 
         // Projected batch should have 1 column (id), not 2 (id, name)
-        assert_eq!(proj_batches[0].num_columns(), 1);
+        assert_eq!(proj_batches[0].batch().num_columns(), 1);
     }
 }

From 9408a03ef70810bf7496843f68ac7d01aea0b60a Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 25 Jan 2026 08:31:55 +0000
Subject: [PATCH 087/287] feat: Support Arrow append operations for decimals,
 temporal types in Python (#206)

---
 fluss-rust/bindings/python/Cargo.toml         |   1 +
 fluss-rust/bindings/python/example/example.py |  59 ++-
 fluss-rust/bindings/python/src/table.rs       | 448 +++++++++++++++++-
 fluss-rust/bindings/python/src/utils.rs       |  35 +-
 4 files changed, 528 insertions(+), 15 deletions(-)

diff --git a/fluss-rust/bindings/python/Cargo.toml b/fluss-rust/bindings/python/Cargo.toml
index 4da8bf835e..ff4d687d80 100644
--- a/fluss-rust/bindings/python/Cargo.toml
+++ b/fluss-rust/bindings/python/Cargo.toml
@@ -36,3 +36,4 @@ arrow-schema = "57.0.0"
 arrow-array = "57.0.0"
 pyo3-async-runtimes = { version = "0.26.0", features = ["tokio-runtime"] }
 jiff = { workspace = true }
+bigdecimal = "0.4"
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index f1f20d1503..730416bb6f 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -17,6 +17,8 @@
 
 import asyncio
 import time
+from datetime import date, time as dt_time, datetime
+from decimal import Decimal
 
 import pandas as pd
 import pyarrow as pa
@@ -45,6 +47,11 @@ async def main():
         pa.field("name", pa.string()),
         pa.field("score", pa.float32()),
         pa.field("age", pa.int32()),
+        pa.field("birth_date", pa.date32()),
+        pa.field("check_in_time", pa.time32("ms")),
+        pa.field("created_at", pa.timestamp("us")),  # TIMESTAMP (NTZ)
+        pa.field("updated_at", pa.timestamp("us", tz="UTC")),  # TIMESTAMP_LTZ
+        pa.field("salary", pa.decimal128(10, 2)),
     ]
 
     # Create a PyArrow schema
@@ -60,7 +67,7 @@ async def main():
     admin = await conn.get_admin()
 
     # Create a Fluss table
-    table_path = fluss.TablePath("fluss", "sample_table")
+    table_path = fluss.TablePath("fluss", "sample_table_types")
 
     try:
         await admin.create_table(table_path, table_descriptor, True)
@@ -96,6 +103,11 @@ async def main():
                 pa.array(["Alice", "Bob", "Charlie"], type=pa.string()),
                 pa.array([95.2, 87.2, 92.1], type=pa.float32()),
                 pa.array([25, 30, 35], type=pa.int32()),
+                pa.array([date(1999, 5, 15), date(1994, 3, 20), date(1989, 11, 8)], type=pa.date32()),
+                pa.array([dt_time(9, 0, 0), dt_time(9, 30, 0), dt_time(10, 0, 0)], type=pa.time32("ms")),
+                pa.array([datetime(2024, 1, 15, 10, 30), datetime(2024, 1, 15, 11, 0), datetime(2024, 1, 15, 11, 30)], type=pa.timestamp("us")),
+                pa.array([datetime(2024, 1, 15, 10, 30), datetime(2024, 1, 15, 11, 0), datetime(2024, 1, 15, 11, 30)], type=pa.timestamp("us", tz="UTC")),
+                pa.array([Decimal("75000.00"), Decimal("82000.50"), Decimal("95000.75")], type=pa.decimal128(10, 2)),
             ],
             schema=schema,
         )
@@ -111,6 +123,11 @@ async def main():
                 pa.array(["David", "Eve"], type=pa.string()),
                 pa.array([88.5, 91.0], type=pa.float32()),
                 pa.array([28, 32], type=pa.int32()),
+                pa.array([date(1996, 7, 22), date(1992, 12, 1)], type=pa.date32()),
+                pa.array([dt_time(14, 15, 0), dt_time(8, 45, 0)], type=pa.time32("ms")),
+                pa.array([datetime(2024, 1, 16, 9, 0), datetime(2024, 1, 16, 9, 30)], type=pa.timestamp("us")),
+                pa.array([datetime(2024, 1, 16, 9, 0), datetime(2024, 1, 16, 9, 30)], type=pa.timestamp("us", tz="UTC")),
+                pa.array([Decimal("68000.00"), Decimal("72500.25")], type=pa.decimal128(10, 2)),
             ],
             schema=schema,
         )
@@ -118,15 +135,32 @@ async def main():
         append_writer.write_arrow_batch(pa_record_batch)
         print("Successfully wrote PyArrow RecordBatch")
 
-        # Test 3: Append single rows
-        print("\n--- Testing single row append ---")
-        # Dict input
-        await append_writer.append({"id": 8, "name": "Helen", "score": 93.5, "age": 26})
-        print("Successfully appended row (dict)")
-
-        # List input
-        await append_writer.append([9, "Ivan", 90.0, 31])
-        print("Successfully appended row (list)")
+        # Test 3: Append single rows with Date, Time, Timestamp, Decimal
+        print("\n--- Testing single row append with temporal/decimal types ---")
+        # Dict input with all types including Date, Time, Timestamp, Decimal
+        await append_writer.append({
+            "id": 8,
+            "name": "Helen",
+            "score": 93.5,
+            "age": 26,
+            "birth_date": date(1998, 4, 10),
+            "check_in_time": dt_time(11, 30, 45),
+            "created_at": datetime(2024, 1, 17, 14, 0, 0),
+            "updated_at": datetime(2024, 1, 17, 14, 0, 0),
+            "salary": Decimal("88000.00"),
+        })
+        print("Successfully appended row (dict with Date, Time, Timestamp, Decimal)")
+
+        # List input with all types
+        await append_writer.append([
+            9, "Ivan", 90.0, 31,
+            date(1993, 8, 25),
+            dt_time(16, 45, 0),
+            datetime(2024, 1, 17, 15, 30, 0),
+            datetime(2024, 1, 17, 15, 30, 0),
+            Decimal("91500.50"),
+        ])
+        print("Successfully appended row (list with Date, Time, Timestamp, Decimal)")
 
         # Test 4: Write Pandas DataFrame
         print("\n--- Testing Pandas DataFrame write ---")
@@ -136,6 +170,11 @@ async def main():
                 "name": ["Frank", "Grace"],
                 "score": [89.3, 94.7],
                 "age": [29, 27],
+                "birth_date": [date(1995, 2, 14), date(1997, 9, 30)],
+                "check_in_time": [dt_time(10, 0, 0), dt_time(10, 30, 0)],
+                "created_at": [datetime(2024, 1, 18, 8, 0), datetime(2024, 1, 18, 8, 30)],
+                "updated_at": [datetime(2024, 1, 18, 8, 0), datetime(2024, 1, 18, 8, 30)],
+                "salary": [Decimal("79000.00"), Decimal("85500.75")],
             }
         )
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 773354e8d8..b56a29dbf4 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -18,12 +18,22 @@
 use crate::TOKIO_RUNTIME;
 use crate::*;
 use arrow::array::RecordBatch;
-use arrow_pyarrow::FromPyArrow;
+use arrow_pyarrow::{FromPyArrow, ToPyArrow};
 use fluss::client::EARLIEST_OFFSET;
 use fluss::rpc::message::OffsetSpec;
+use pyo3::types::IntoPyDict;
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::sync::Arc;
 
+// Time conversion constants
+const MILLIS_PER_SECOND: i64 = 1_000;
+const MILLIS_PER_MINUTE: i64 = 60_000;
+const MILLIS_PER_HOUR: i64 = 3_600_000;
+const MICROS_PER_MILLI: i64 = 1_000;
+const MICROS_PER_SECOND: i64 = 1_000_000;
+const MICROS_PER_DAY: i64 = 86_400_000_000;
+const NANOS_PER_MILLI: i64 = 1_000_000;
+
 /// Represents a Fluss table for data operations
 #[pyclass]
 pub struct FlussTable {
@@ -246,14 +256,29 @@ impl AppendWriter {
 
     /// Write Pandas DataFrame data
     pub fn write_pandas(&self, py: Python, df: Py<PyAny>) -> PyResult<()> {
+        // Get the expected Arrow schema from the Fluss table
+        let row_type = self.table_info.get_row_type();
+        let expected_schema = fcore::record::to_arrow_schema(row_type)
+            .map_err(|e| FlussError::new_err(format!("Failed to get table schema: {}", e)))?;
+
+        // Convert Arrow schema to PyArrow schema
+        let py_schema = expected_schema
+            .as_ref()
+            .to_pyarrow(py)
+            .map_err(|e| FlussError::new_err(format!("Failed to convert schema: {}", e)))?;
+
         // Import pyarrow module
         let pyarrow = py.import("pyarrow")?;
 
         // Get the Table class from pyarrow module
         let table_class = pyarrow.getattr("Table")?;
 
-        // Call Table.from_pandas(df) - from_pandas is a class method
-        let pa_table = table_class.call_method1("from_pandas", (df,))?;
+        // Call Table.from_pandas(df, schema=expected_schema) to ensure proper type casting
+        let pa_table = table_class.call_method(
+            "from_pandas",
+            (df,),
+            Some(&[("schema", py_schema)].into_py_dict(py)?),
+        )?;
 
         // Then call write_arrow with the converted table
         self.write_arrow(py, pa_table.into())
@@ -473,12 +498,393 @@ fn python_value_to_datum(
                 )))
             }
         }
+        fcore::metadata::DataType::Decimal(decimal_type) => {
+            python_decimal_to_datum(value, decimal_type.precision(), decimal_type.scale())
+        }
+        fcore::metadata::DataType::Date(_) => python_date_to_datum(value),
+        fcore::metadata::DataType::Time(_) => python_time_to_datum(value),
+        fcore::metadata::DataType::Timestamp(_) => python_datetime_to_timestamp_ntz(value),
+        fcore::metadata::DataType::TimestampLTz(_) => python_datetime_to_timestamp_ltz(value),
         _ => Err(FlussError::new_err(format!(
             "Unsupported data type for row-level operations: {data_type}"
         ))),
     }
 }
 
+/// Cached decimal.Decimal type
+/// Uses PyOnceLock for thread-safety and subinterpreter compatibility.
+static DECIMAL_TYPE: pyo3::sync::PyOnceLock<Py<pyo3::types::PyType>> =
+    pyo3::sync::PyOnceLock::new();
+
+/// Cached Python object for the UTC epoch; filled lazily by `get_utc_epoch`.
+static UTC_EPOCH: pyo3::sync::PyOnceLock<Py<PyAny>> = pyo3::sync::PyOnceLock::new();
+
+/// Get the cached decimal.Decimal type, importing it once per interpreter.
+fn get_decimal_type(py: Python) -> PyResult<Bound<pyo3::types::PyType>> {
+    let ty = DECIMAL_TYPE.get_or_try_init(py, || -> PyResult<_> {
+        let decimal_mod = py.import("decimal")?;
+        let decimal_ty = decimal_mod
+            .getattr("Decimal")?
+            .downcast_into::<pyo3::types::PyType>()?;
+        Ok(decimal_ty.unbind())
+    })?;
+    Ok(ty.bind(py).clone())
+}
+
+/// Get the cached UTC epoch datetime, creating it once per interpreter.
+fn get_utc_epoch(py: Python) -> PyResult<Bound<PyAny>> {
+    let epoch = UTC_EPOCH.get_or_try_init(py, || -> PyResult<_> {
+        let datetime_mod = py.import("datetime")?;
+        let timezone = datetime_mod.getattr("timezone")?;
+        let utc = timezone.getattr("utc")?;
+        let epoch = datetime_mod
+            .getattr("datetime")?
+            .call1((1970, 1, 1, 0, 0, 0, 0, &utc))?;
+        Ok(epoch.unbind())
+    })?;
+    Ok(epoch.bind(py).clone())
+}
+
+/// Validate that value is a decimal.Decimal instance.
+fn ensure_is_decimal(value: &Bound<PyAny>) -> PyResult<()> {
+    let decimal_ty = get_decimal_type(value.py())?;
+    if !value.is_instance(&decimal_ty.into_any())? {
+        return Err(FlussError::new_err(format!(
+            "Expected decimal.Decimal, got {}",
+            get_type_name(value)
+        )));
+    }
+    Ok(())
+}
+
+/// Convert Python decimal.Decimal to Datum::Decimal.
+/// Only accepts decimal.Decimal
+fn python_decimal_to_datum(
+    value: &Bound<PyAny>,
+    precision: u32,
+    scale: u32,
+) -> PyResult<fcore::row::Datum<'static>> {
+    use std::str::FromStr;
+
+    ensure_is_decimal(value)?;
+
+    let decimal_str: String = value.str()?.extract()?;
+    let bd = bigdecimal::BigDecimal::from_str(&decimal_str).map_err(|e| {
+        FlussError::new_err(format!("Failed to parse decimal '{}': {}", decimal_str, e))
+    })?;
+
+    let decimal = fcore::row::Decimal::from_big_decimal(bd, precision, scale).map_err(|e| {
+        FlussError::new_err(format!(
+            "Failed to convert decimal '{}' to DECIMAL({}, {}): {}",
+            decimal_str, precision, scale, e
+        ))
+    })?;
+
+    Ok(fcore::row::Datum::Decimal(decimal))
+}
+
+/// Convert Python datetime.date to Datum::Date.
+fn python_date_to_datum(value: &Bound<PyAny>) -> PyResult<fcore::row::Datum<'static>> {
+    use pyo3::types::{PyDate, PyDateAccess, PyDateTime};
+
+    // Reject datetime.datetime (subclass of date) - use timestamp columns for those
+    if value.downcast::<PyDateTime>().is_ok() {
+        return Err(FlussError::new_err(
+            "Expected datetime.date, got datetime.datetime. Use a TIMESTAMP column for datetime values.",
+        ));
+    }
+
+    let date = value.downcast::<PyDate>().map_err(|_| {
+        FlussError::new_err(format!(
+            "Expected datetime.date, got {}",
+            get_type_name(value)
+        ))
+    })?;
+
+    let year = date.get_year();
+    let month = date.get_month();
+    let day = date.get_day();
+
+    // Calculate days since Unix epoch (1970-01-01)
+    let civil_date = jiff::civil::date(year as i16, month as i8, day as i8);
+    let epoch = jiff::civil::date(1970, 1, 1);
+    let days_since_epoch = (civil_date - epoch).get_days();
+
+    Ok(fcore::row::Datum::Date(fcore::row::Date::new(
+        days_since_epoch,
+    )))
+}
+
+/// Convert Python datetime.time to Datum::Time.
+/// Uses PyO3's native PyTime type for efficient access.
+///
+/// Note: Fluss TIME is always stored as milliseconds since midnight (i32) regardless
+/// of the schema's precision setting. This matches the Java Fluss wire protocol.
+/// Sub-millisecond precision (microseconds not divisible by 1000) will raise an error
+/// to prevent silent data loss and ensure fail-fast behavior.
+fn python_time_to_datum(value: &Bound<PyAny>) -> PyResult<fcore::row::Datum<'static>> {
+    use pyo3::types::{PyTime, PyTimeAccess};
+
+    let time = value.downcast::<PyTime>().map_err(|_| {
+        FlussError::new_err(format!(
+            "Expected datetime.time, got {}",
+            get_type_name(value)
+        ))
+    })?;
+
+    let hour = time.get_hour() as i32;
+    let minute = time.get_minute() as i32;
+    let second = time.get_second() as i32;
+    let microsecond = time.get_microsecond() as i32;
+
+    // Strict validation: reject sub-millisecond precision
+    if microsecond % MICROS_PER_MILLI as i32 != 0 {
+        return Err(FlussError::new_err(format!(
+            "TIME values with sub-millisecond precision are not supported. \
+             Got time with {} microseconds (not divisible by 1000). \
+             Fluss stores TIME as milliseconds since midnight. \
+             Please round to milliseconds before insertion.",
+            microsecond
+        )));
+    }
+
+    // Convert to milliseconds since midnight
+    let millis = hour * MILLIS_PER_HOUR as i32
+        + minute * MILLIS_PER_MINUTE as i32
+        + second * MILLIS_PER_SECOND as i32
+        + microsecond / MICROS_PER_MILLI as i32;
+
+    Ok(fcore::row::Datum::Time(fcore::row::Time::new(millis)))
+}
+
+/// Convert Python datetime-like object to Datum::TimestampNtz.
+/// Accepts naive datetime.datetime, naive pd.Timestamp, or an object whose to_pydatetime() yields one.
+fn python_datetime_to_timestamp_ntz(value: &Bound<PyAny>) -> PyResult<fcore::row::Datum<'static>> {
+    let (epoch_millis, nano_of_milli) = extract_datetime_components_ntz(value)?;
+
+    let ts = fcore::row::TimestampNtz::from_millis_nanos(epoch_millis, nano_of_milli)
+        .map_err(|e| FlussError::new_err(format!("Failed to create TimestampNtz: {}", e)))?;
+
+    Ok(fcore::row::Datum::TimestampNtz(ts))
+}
+
+/// Convert Python datetime-like object to Datum::TimestampLtz.
+/// For naive datetimes, assumes UTC. For aware datetimes, converts to UTC.
+/// Accepts datetime.datetime, pd.Timestamp, or an object whose to_pydatetime() yields a datetime.
+fn python_datetime_to_timestamp_ltz(value: &Bound<PyAny>) -> PyResult<fcore::row::Datum<'static>> {
+    let (epoch_millis, nano_of_milli) = extract_datetime_components_ltz(value)?;
+
+    let ts = fcore::row::TimestampLtz::from_millis_nanos(epoch_millis, nano_of_milli)
+        .map_err(|e| FlussError::new_err(format!("Failed to create TimestampLtz: {}", e)))?;
+
+    Ok(fcore::row::Datum::TimestampLtz(ts))
+}
+
+/// Extract (epoch_millis, nano_of_milli) for TimestampNtz (wall-clock time, no timezone conversion).
+/// Uses integer arithmetic to avoid float precision issues.
+/// For clarity, tz-aware datetimes are rejected - use TimestampLtz for those.
+fn extract_datetime_components_ntz(value: &Bound<PyAny>) -> PyResult<(i64, i32)> {
+    use pyo3::types::PyDateTime;
+
+    // Try PyDateTime first (presumably also matches datetime subclasses such as pd.Timestamp)
+    if let Ok(dt) = value.downcast::<PyDateTime>() {
+        // Reject tz-aware datetime for NTZ - it's ambiguous what the user wants
+        let tzinfo = dt.getattr("tzinfo")?;
+        if !tzinfo.is_none() {
+            return Err(FlussError::new_err(
+                "TIMESTAMP (without timezone) requires a naive datetime. \
+                 Got timezone-aware datetime. Either remove tzinfo or use TIMESTAMP_LTZ column.",
+            ));
+        }
+        return datetime_to_epoch_millis_as_utc(dt);
+    }
+
+    // pandas path (by module name). NOTE(review): may be shadowed by the PyDateTime branch - confirm
+    if is_pandas_timestamp(value) {
+        // For NTZ, reject tz-aware pandas Timestamps for consistency with datetime behavior
+        if let Ok(tz) = value.getattr("tz") {
+            if !tz.is_none() {
+                return Err(FlussError::new_err(
+                    "TIMESTAMP (without timezone) requires a naive pd.Timestamp. \
+                     Got timezone-aware Timestamp. Either use tz_localize(None) or use TIMESTAMP_LTZ column.",
+                ));
+            }
+        }
+        // Naive pandas Timestamp: .value is nanoseconds since epoch (wall-clock as UTC)
+        let nanos: i64 = value.getattr("value")?.extract()?;
+        return Ok(nanos_to_millis_and_submillis(nanos));
+    }
+
+    // Try to_pydatetime() for objects that support it
+    if let Ok(py_dt) = value.call_method0("to_pydatetime") {
+        if let Ok(dt) = py_dt.downcast::<PyDateTime>() {
+            let tzinfo = dt.getattr("tzinfo")?;
+            if !tzinfo.is_none() {
+                return Err(FlussError::new_err(
+                    "TIMESTAMP (without timezone) requires a naive datetime. \
+                     Got timezone-aware value. Use TIMESTAMP_LTZ column instead.",
+                ));
+            }
+            return datetime_to_epoch_millis_as_utc(dt);
+        }
+    }
+
+    Err(FlussError::new_err(format!(
+        "Expected naive datetime.datetime or pd.Timestamp, got {}",
+        get_type_name(value)
+    )))
+}
+
+/// Extract (epoch_millis, nano_of_milli) for TimestampLtz (instant in time, UTC-based).
+/// For naive datetimes, assumes UTC. For aware datetimes, converts to UTC.
+fn extract_datetime_components_ltz(value: &Bound<PyAny>) -> PyResult<(i64, i32)> {
+    use pyo3::types::PyDateTime;
+
+    // Try PyDateTime first (presumably also matches datetime subclasses such as pd.Timestamp)
+    if let Ok(dt) = value.downcast::<PyDateTime>() {
+        // Check if timezone-aware
+        let tzinfo = dt.getattr("tzinfo")?;
+        if tzinfo.is_none() {
+            // Naive datetime: assume UTC (treat components as UTC time)
+            return datetime_to_epoch_millis_as_utc(dt);
+        } else {
+            // Aware datetime: use timedelta from epoch to get correct UTC instant
+            return datetime_to_epoch_millis_utc_aware(dt);
+        }
+    }
+
+    // pandas path (by module name). NOTE(review): may be shadowed by the PyDateTime branch - confirm
+    if is_pandas_timestamp(value) {
+        // pandas Timestamp.value is always nanoseconds since UTC epoch
+        let nanos: i64 = value.getattr("value")?.extract()?;
+        return Ok(nanos_to_millis_and_submillis(nanos));
+    }
+
+    // Try to_pydatetime()
+    if let Ok(py_dt) = value.call_method0("to_pydatetime") {
+        if let Ok(dt) = py_dt.downcast::<PyDateTime>() {
+            let tzinfo = dt.getattr("tzinfo")?;
+            if tzinfo.is_none() {
+                return datetime_to_epoch_millis_as_utc(dt);
+            } else {
+                return datetime_to_epoch_millis_utc_aware(dt);
+            }
+        }
+    }
+
+    Err(FlussError::new_err(format!(
+        "Expected datetime.datetime or pd.Timestamp, got {}",
+        get_type_name(value)
+    )))
+}
+
+/// Convert datetime fields to (epoch_millis, nano_of_milli) as UTC; tzinfo is not consulted.
+fn datetime_to_epoch_millis_as_utc(
+    dt: &pyo3::Bound<'_, pyo3::types::PyDateTime>,
+) -> PyResult<(i64, i32)> {
+    use pyo3::types::{PyDateAccess, PyTimeAccess};
+
+    let year = dt.get_year();
+    let month = dt.get_month();
+    let day = dt.get_day();
+    let hour = dt.get_hour();
+    let minute = dt.get_minute();
+    let second = dt.get_second();
+    let microsecond = dt.get_microsecond();
+
+    // Create jiff civil datetime and convert to UTC timestamp
+    // Safe casts: hour (0-23), minute (0-59), second (0-59) all fit in i8
+    let civil_dt = jiff::civil::date(year as i16, month as i8, day as i8).at(
+        hour as i8,
+        minute as i8,
+        second as i8,
+        microsecond as i32 * 1000,
+    );
+
+    let timestamp = jiff::tz::Offset::UTC
+        .to_timestamp(civil_dt)
+        .map_err(|e| FlussError::new_err(format!("Invalid datetime: {}", e)))?;
+
+    // jiff reports pre-1970 instants with a negative sub-second part; floor-split the
+    // total nanoseconds so nano_of_milli always lands in 0..NANOS_PER_MILLI.
+    let (nanos, per_milli) = (timestamp.as_nanosecond(), NANOS_PER_MILLI as i128);
+    Ok((nanos.div_euclid(per_milli) as i64, nanos.rem_euclid(per_milli) as i32))
+}
+
+/// Convert timezone-aware datetime to epoch milliseconds using Python's timedelta.
+/// This correctly handles timezone conversions by computing (dt - UTC_EPOCH).
+/// The UTC epoch is cached for performance.
+fn datetime_to_epoch_millis_utc_aware(
+    dt: &pyo3::Bound<'_, pyo3::types::PyDateTime>,
+) -> PyResult<(i64, i32)> {
+    use pyo3::types::{PyDelta, PyDeltaAccess};
+
+    let py = dt.py();
+    let epoch = get_utc_epoch(py)?;
+
+    // Compute delta = dt - epoch (this handles timezone conversion correctly)
+    let delta = dt.call_method1("__sub__", (epoch,))?;
+    let delta = delta.downcast::<PyDelta>()?;
+
+    // Extract components using integer arithmetic
+    let days = delta.get_days() as i64;
+    let seconds = delta.get_seconds() as i64;
+    let microseconds = delta.get_microseconds() as i64;
+
+    // Total microseconds; the remainder is scaled by 1000 ns/us (same value as MICROS_PER_MILLI)
+    let total_micros = days * MICROS_PER_DAY + seconds * MICROS_PER_SECOND + microseconds;
+    let millis = total_micros / MICROS_PER_MILLI;
+    let nano_of_milli = ((total_micros % MICROS_PER_MILLI) * MICROS_PER_MILLI) as i32;
+
+    // Truncating division leaves a negative remainder before the epoch; borrow one millisecond
+    let (millis, nano_of_milli) = if nano_of_milli < 0 {
+        (millis - 1, nano_of_milli + NANOS_PER_MILLI as i32)
+    } else {
+        (millis, nano_of_milli)
+    };
+
+    Ok((millis, nano_of_milli))
+}
+
+/// Convert nanoseconds to (milliseconds, nano_of_millisecond)
+fn nanos_to_millis_and_submillis(nanos: i64) -> (i64, i32) {
+    let millis = nanos / NANOS_PER_MILLI;
+    let nano_of_milli = (nanos % NANOS_PER_MILLI) as i32;
+
+    // Handle negative nanoseconds correctly (Euclidean remainder)
+    if nano_of_milli < 0 {
+        (millis - 1, nano_of_milli + NANOS_PER_MILLI as i32)
+    } else {
+        (millis, nano_of_milli)
+    }
+}
+
+/// Check if value is a pandas Timestamp by examining its type.
+fn is_pandas_timestamp(value: &Bound<PyAny>) -> bool {
+    // Check module and class name to avoid importing pandas
+    if let Ok(cls) = value.get_type().getattr("__module__") {
+        if let Ok(module) = cls.extract::<&str>() {
+            if module.starts_with("pandas") {
+                if let Ok(name) = value.get_type().getattr("__name__") {
+                    if let Ok(name_str) = name.extract::<&str>() {
+                        return name_str == "Timestamp";
+                    }
+                }
+            }
+        }
+    }
+    false
+}
+
+/// Get type name
+fn get_type_name(value: &Bound<PyAny>) -> String {
+    value
+        .get_type()
+        .name()
+        .map(|s| s.to_string())
+        .unwrap_or_else(|_| "unknown".to_string())
+}
+
 /// Scanner for reading log data from a Fluss table
 #[pyclass]
 pub struct LogScanner {
@@ -621,3 +1027,39 @@ impl LogScanner {
         }
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_nanos_to_millis_and_submillis() {
+        // Table of (input nanoseconds, expected (millis, nano_of_milli)).
+        // The sub-millisecond part must never be negative, so negative
+        // inputs borrow from the millisecond component.
+        let cases: [(i64, (i64, i32)); 8] = [
+            // Simple positive case
+            (1_500_000, (1, 500_000)),
+            // Exact millisecond boundary
+            (2_000_000, (2, 0)),
+            // Zero
+            (0, (0, 0)),
+            // Large value: one day in nanoseconds
+            (86_400_000_000_000, (86_400_000, 0)),
+            // Negative: -1.5 ms floors to -2 ms,
+            // because -1_500_000 ns = -2 ms + 500_000 ns
+            (-1_500_000, (-2, 500_000)),
+            // Negative exact boundary
+            (-2_000_000, (-2, 0)),
+            // Small negative
+            (-1, (-1, 999_999)),
+            // Negative with sub-millisecond part
+            (-500_000, (-1, 500_000)),
+        ];
+
+        // Check every row; the expected tuple printed on failure identifies it.
+        for (nanos, expected) in cases {
+            assert_eq!(nanos_to_millis_and_submillis(nanos), expected);
+        }
+    }
+}
diff --git a/fluss-rust/bindings/python/src/utils.rs b/fluss-rust/bindings/python/src/utils.rs
index 09e6b5f589..ee32c9c133 100644
--- a/fluss-rust/bindings/python/src/utils.rs
+++ b/fluss-rust/bindings/python/src/utils.rs
@@ -59,8 +59,39 @@ impl Utils {
             ArrowDataType::Binary | ArrowDataType::LargeBinary => DataTypes::bytes(),
             ArrowDataType::Date32 => DataTypes::date(),
             ArrowDataType::Date64 => DataTypes::date(),
-            ArrowDataType::Time32(_) | ArrowDataType::Time64(_) => DataTypes::time(),
-            ArrowDataType::Timestamp(_, _) => DataTypes::timestamp(),
+            ArrowDataType::Time32(unit) => match unit {
+                arrow_schema::TimeUnit::Second => DataTypes::time_with_precision(0),
+                arrow_schema::TimeUnit::Millisecond => DataTypes::time_with_precision(3),
+                _ => {
+                    return Err(FlussError::new_err(format!(
+                        "Unsupported Time32 unit: {unit:?}"
+                    )));
+                }
+            },
+            ArrowDataType::Time64(unit) => match unit {
+                arrow_schema::TimeUnit::Microsecond => DataTypes::time_with_precision(6),
+                arrow_schema::TimeUnit::Nanosecond => DataTypes::time_with_precision(9),
+                _ => {
+                    return Err(FlussError::new_err(format!(
+                        "Unsupported Time64 unit: {unit:?}"
+                    )));
+                }
+            },
+            ArrowDataType::Timestamp(unit, tz) => {
+                let precision = match unit {
+                    arrow_schema::TimeUnit::Second => 0,
+                    arrow_schema::TimeUnit::Millisecond => 3,
+                    arrow_schema::TimeUnit::Microsecond => 6,
+                    arrow_schema::TimeUnit::Nanosecond => 9,
+                };
+                // Arrow Timestamp with timezone -> Fluss TimestampLtz
+                // Arrow Timestamp without timezone -> Fluss Timestamp (NTZ)
+                if tz.is_some() {
+                    DataTypes::timestamp_ltz_with_precision(precision)
+                } else {
+                    DataTypes::timestamp_with_precision(precision)
+                }
+            }
             ArrowDataType::Decimal128(precision, scale) => {
                 DataTypes::decimal(*precision as u32, *scale as u32)
             }

From 54ef268e1224c3ab785446265377d58cdd384dc5 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 25 Jan 2026 21:37:20 +0800
Subject: [PATCH 088/287] chore: introduce new with capacity to align generic
 row with java side (#212)

---
 fluss-rust/bindings/cpp/src/types.rs          |  2 +-
 fluss-rust/bindings/python/src/table.rs       | 20 ++---
 .../crates/examples/src/example_kv_table.rs   | 13 ++-
 .../crates/examples/src/example_table.rs      |  4 +-
 .../src/client/table/log_fetch_buffer.rs      |  4 +-
 .../fluss/src/client/table/remote_log.rs      | 15 ++--
 .../crates/fluss/src/client/table/upsert.rs   |  6 +-
 .../crates/fluss/src/metadata/json_serde.rs   | 12 +--
 .../crates/fluss/src/metadata/partition.rs    |  6 +-
 fluss-rust/crates/fluss/src/metadata/table.rs |  3 +-
 fluss-rust/crates/fluss/src/record/arrow.rs   | 36 +++-----
 fluss-rust/crates/fluss/src/row/column.rs     |  5 +-
 .../src/row/compacted/compacted_row_reader.rs |  7 +-
 fluss-rust/crates/fluss/src/row/datum.rs      | 48 ++++------
 fluss-rust/crates/fluss/src/row/decimal.rs    | 15 ++--
 fluss-rust/crates/fluss/src/row/mod.rs        | 90 +++++++++++++------
 .../fluss/tests/integration/kv_table.rs       | 34 ++++---
 .../tests/integration/table_remote_scan.rs    |  2 +-
 18 files changed, 151 insertions(+), 171 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index fef73ceaf0..726e3d1220 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -209,7 +209,7 @@ pub fn empty_table_info() -> ffi::FfiTableInfo {
 pub fn ffi_row_to_core(row: &ffi::FfiGenericRow) -> fcore::row::GenericRow<'_> {
     use fcore::row::Datum;
 
-    let mut generic_row = fcore::row::GenericRow::new();
+    let mut generic_row = fcore::row::GenericRow::new(row.fields.len());
 
     for (idx, field) in row.fields.iter().enumerate() {
         let datum = match field.datum_type {
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index b56a29dbf4..0ae7186403 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -259,13 +259,13 @@ impl AppendWriter {
         // Get the expected Arrow schema from the Fluss table
         let row_type = self.table_info.get_row_type();
         let expected_schema = fcore::record::to_arrow_schema(row_type)
-            .map_err(|e| FlussError::new_err(format!("Failed to get table schema: {}", e)))?;
+            .map_err(|e| FlussError::new_err(format!("Failed to get table schema: {e}")))?;
 
         // Convert Arrow schema to PyArrow schema
         let py_schema = expected_schema
             .as_ref()
             .to_pyarrow(py)
-            .map_err(|e| FlussError::new_err(format!("Failed to convert schema: {}", e)))?;
+            .map_err(|e| FlussError::new_err(format!("Failed to convert schema: {e}")))?;
 
         // Import pyarrow module
         let pyarrow = py.import("pyarrow")?;
@@ -570,13 +570,12 @@ fn python_decimal_to_datum(
 
     let decimal_str: String = value.str()?.extract()?;
     let bd = bigdecimal::BigDecimal::from_str(&decimal_str).map_err(|e| {
-        FlussError::new_err(format!("Failed to parse decimal '{}': {}", decimal_str, e))
+        FlussError::new_err(format!("Failed to parse decimal '{decimal_str}': {e}"))
     })?;
 
     let decimal = fcore::row::Decimal::from_big_decimal(bd, precision, scale).map_err(|e| {
         FlussError::new_err(format!(
-            "Failed to convert decimal '{}' to DECIMAL({}, {}): {}",
-            decimal_str, precision, scale, e
+            "Failed to convert decimal '{decimal_str}' to DECIMAL({precision}, {scale}): {e}"
         ))
     })?;
 
@@ -641,10 +640,9 @@ fn python_time_to_datum(value: &Bound<PyAny>) -> PyResult<fcore::row::Datum<'sta
     if microsecond % MICROS_PER_MILLI as i32 != 0 {
         return Err(FlussError::new_err(format!(
             "TIME values with sub-millisecond precision are not supported. \
-             Got time with {} microseconds (not divisible by 1000). \
+             Got time with {microsecond} microseconds (not divisible by 1000). \
              Fluss stores TIME as milliseconds since midnight. \
-             Please round to milliseconds before insertion.",
-            microsecond
+             Please round to milliseconds before insertion."
         )));
     }
 
@@ -663,7 +661,7 @@ fn python_datetime_to_timestamp_ntz(value: &Bound<PyAny>) -> PyResult<fcore::row
     let (epoch_millis, nano_of_milli) = extract_datetime_components_ntz(value)?;
 
     let ts = fcore::row::TimestampNtz::from_millis_nanos(epoch_millis, nano_of_milli)
-        .map_err(|e| FlussError::new_err(format!("Failed to create TimestampNtz: {}", e)))?;
+        .map_err(|e| FlussError::new_err(format!("Failed to create TimestampNtz: {e}")))?;
 
     Ok(fcore::row::Datum::TimestampNtz(ts))
 }
@@ -675,7 +673,7 @@ fn python_datetime_to_timestamp_ltz(value: &Bound<PyAny>) -> PyResult<fcore::row
     let (epoch_millis, nano_of_milli) = extract_datetime_components_ltz(value)?;
 
     let ts = fcore::row::TimestampLtz::from_millis_nanos(epoch_millis, nano_of_milli)
-        .map_err(|e| FlussError::new_err(format!("Failed to create TimestampLtz: {}", e)))?;
+        .map_err(|e| FlussError::new_err(format!("Failed to create TimestampLtz: {e}")))?;
 
     Ok(fcore::row::Datum::TimestampLtz(ts))
 }
@@ -803,7 +801,7 @@ fn datetime_to_epoch_millis_as_utc(
 
     let timestamp = jiff::tz::Offset::UTC
         .to_timestamp(civil_dt)
-        .map_err(|e| FlussError::new_err(format!("Invalid datetime: {}", e)))?;
+        .map_err(|e| FlussError::new_err(format!("Invalid datetime: {e}")))?;
 
     let millis = timestamp.as_millisecond();
     let nano_of_milli = (timestamp.subsec_nanosecond() % NANOS_PER_MILLI as i32) as i32;
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index dcf7db8f05..032691e0a1 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -58,7 +58,7 @@ pub async fn main() -> Result<()> {
 
     println!("\n=== Upserting ===");
     for (id, name, age) in [(1, "Verso", 32i64), (2, "Noco", 25), (3, "Esquie", 35)] {
-        let mut row = GenericRow::new();
+        let mut row = GenericRow::new(3);
         row.set_field(0, id);
         row.set_field(1, name);
         row.set_field(2, age);
@@ -80,7 +80,7 @@ pub async fn main() -> Result<()> {
     }
 
     println!("\n=== Updating ===");
-    let mut row = GenericRow::new();
+    let mut row = GenericRow::new(3);
     row.set_field(0, 1);
     row.set_field(1, "Verso");
     row.set_field(2, 33i64);
@@ -96,12 +96,11 @@ pub async fn main() -> Result<()> {
     );
 
     println!("\n=== Deleting ===");
-    let mut row = GenericRow::new();
+    // For delete, only primary key field needs to be set; other fields can remain null
+    let mut row = GenericRow::new(3);
     row.set_field(0, 2);
-    row.set_field(1, "");
-    row.set_field(2, 0i64);
     upsert_writer.delete(&row).await?;
-    println!("Deleted: {row:?}");
+    println!("Deleted row with id=2");
 
     let result = lookuper.lookup(&make_key(2)).await?;
     if result.get_single_row()?.is_none() {
@@ -112,7 +111,7 @@ pub async fn main() -> Result<()> {
 }
 
 fn make_key(id: i32) -> GenericRow<'static> {
-    let mut row = GenericRow::new();
+    let mut row = GenericRow::new(1);
     row.set_field(0, id);
     row
 }
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index 7333056feb..ca6b942861 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -56,7 +56,7 @@ pub async fn main() -> Result<()> {
     print!("Get created table:\n {table_info}\n");
 
     // write row
-    let mut row = GenericRow::new();
+    let mut row = GenericRow::new(3);
     row.set_field(0, 22222);
     row.set_field(1, "t2t");
     row.set_field(2, 123_456_789_123i64);
@@ -64,7 +64,7 @@ pub async fn main() -> Result<()> {
     let table = conn.get_table(&table_path).await?;
     let append_writer = table.new_append()?.create_writer();
     let f1 = append_writer.append(row);
-    row = GenericRow::new();
+    row = GenericRow::new(3);
     row.set_field(0, 233333);
     row.set_field(1, "tt44");
     row.set_field(2, 987_654_321_987i64);
diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index b529806f84..7ece34b478 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -800,7 +800,7 @@ impl PendingFetch for RemotePendingFetch {
             let pos = self.pos_in_log_segment as usize;
             if pos >= file_size {
                 return Err(Error::UnexpectedError {
-                    message: format!("Position {} exceeds file size {}", pos, file_size),
+                    message: format!("Position {pos} exceeds file size {file_size}"),
                     source: None,
                 });
             }
@@ -911,7 +911,7 @@ mod tests {
             },
         )?;
 
-        let mut row = GenericRow::new();
+        let mut row = GenericRow::new(2);
         row.set_field(0, 1_i32);
         row.set_field(1, "alice");
         let record = WriteRecord::for_append(table_path, 1, row);
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index c39056db11..a2e19d4901 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -469,7 +469,7 @@ async fn spawn_download_task(
                 result_sender: request.result_sender,
             }
         }
-        Err(e) if request.result_sender.is_closed() => {
+        Err(_e) if request.result_sender.is_closed() => {
             // Receiver dropped (cancelled) - release permit, don't re-queue
             drop(permit);
             DownloadResult::Cancelled
@@ -491,8 +491,7 @@ async fn spawn_download_task(
                 DownloadResult::FailedPermanently {
                     error: Error::UnexpectedError {
                         message: format!(
-                            "Failed to download remote log segment after {} retries: {}",
-                            retry_count, e
+                            "Failed to download remote log segment after {retry_count} retries: {e}"
                         ),
                         source: Some(Box::new(e)),
                     },
@@ -585,7 +584,7 @@ async fn coordinator_loop(
                         // Cancelled - permit already released, nothing to do
                     }
                     Err(e) => {
-                        log::error!("Download task panicked: {:?}", e);
+                        log::error!("Download task panicked: {e:?}");
                         // Permit already released via RAII
                     }
                 }
@@ -1001,7 +1000,7 @@ mod tests {
 
                 if should_fail {
                     Err(Error::UnexpectedError {
-                        message: format!("Fake fetch failed for {}", segment_id),
+                        message: format!("Fake fetch failed for {segment_id}"),
                         source: None,
                     })
                 } else {
@@ -1012,7 +1011,7 @@ mod tests {
                         .unwrap()
                         .as_nanos();
                     let file_path =
-                        temp_dir.join(format!("fake_segment_{}_{}.log", segment_id, timestamp));
+                        temp_dir.join(format!("fake_segment_{segment_id}_{timestamp}.log"));
                     tokio::fs::write(&file_path, &fake_data).await?;
 
                     Ok(FetchResult {
@@ -1121,7 +1120,7 @@ mod tests {
 
         // Request 4 segments with same priority (to isolate concurrency limiting from priority)
         let segs: Vec<_> = (0..4)
-            .map(|i| create_segment(&format!("seg{}", i), i * 100, 1000, bucket.clone()))
+            .map(|i| create_segment(&format!("seg{i}"), i * 100, 1000, bucket.clone()))
             .collect();
 
         let _futures: Vec<_> = segs
@@ -1168,7 +1167,7 @@ mod tests {
 
         // Request 4 downloads
         let segs: Vec<_> = (0..4)
-            .map(|i| create_segment(&format!("seg{}", i), i * 100, 1000, bucket.clone()))
+            .map(|i| create_segment(&format!("seg{i}"), i * 100, 1000, bucket.clone()))
             .collect();
 
         let mut futures: Vec<_> = segs
diff --git a/fluss-rust/crates/fluss/src/client/table/upsert.rs b/fluss-rust/crates/fluss/src/client/table/upsert.rs
index a3909e7258..984592d06e 100644
--- a/fluss-rust/crates/fluss/src/client/table/upsert.rs
+++ b/fluss-rust/crates/fluss/src/client/table/upsert.rs
@@ -232,8 +232,7 @@ impl UpsertWriterFactory {
                 None => {
                     return Err(IllegalArgument {
                         message: format!(
-                            "The specified primary key {} is not in row type {}",
-                            primary_key, row_type
+                            "The specified primary key {primary_key} is not in row type {row_type}"
                         ),
                     });
                 }
@@ -250,8 +249,7 @@ impl UpsertWriterFactory {
                 if target_column_set[index] {
                     return Err(IllegalArgument {
                         message: format!(
-                            "Explicitly specifying values for the auto increment column {} is not allowed.",
-                            auto_increment_col_name
+                            "Explicitly specifying values for the auto increment column {auto_increment_col_name} is not allowed."
                         ),
                     });
                 }
diff --git a/fluss-rust/crates/fluss/src/metadata/json_serde.rs b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
index faa5583bed..d0d56ef286 100644
--- a/fluss-rust/crates/fluss/src/metadata/json_serde.rs
+++ b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
@@ -205,7 +205,7 @@ impl JsonSerde for DataType {
                 DataType::Decimal(
                     crate::metadata::datatype::DecimalType::with_nullable(true, precision, scale)
                         .map_err(|e| Error::JsonSerdeError {
-                        message: format!("Invalid DECIMAL parameters: {}", e),
+                        message: format!("Invalid DECIMAL parameters: {e}"),
                     })?,
                 )
             }
@@ -218,7 +218,7 @@ impl JsonSerde for DataType {
                 DataType::Time(
                     crate::metadata::datatype::TimeType::with_nullable(true, precision).map_err(
                         |e| Error::JsonSerdeError {
-                            message: format!("Invalid TIME_WITHOUT_TIME_ZONE precision: {}", e),
+                            message: format!("Invalid TIME_WITHOUT_TIME_ZONE precision: {e}"),
                         },
                     )?,
                 )
@@ -231,10 +231,7 @@ impl JsonSerde for DataType {
                 DataType::Timestamp(
                     crate::metadata::datatype::TimestampType::with_nullable(true, precision)
                         .map_err(|e| Error::JsonSerdeError {
-                            message: format!(
-                                "Invalid TIMESTAMP_WITHOUT_TIME_ZONE precision: {}",
-                                e
-                            ),
+                            message: format!("Invalid TIMESTAMP_WITHOUT_TIME_ZONE precision: {e}"),
                         })?,
                 )
             }
@@ -247,8 +244,7 @@ impl JsonSerde for DataType {
                     crate::metadata::datatype::TimestampLTzType::with_nullable(true, precision)
                         .map_err(|e| Error::JsonSerdeError {
                             message: format!(
-                                "Invalid TIMESTAMP_WITH_LOCAL_TIME_ZONE precision: {}",
-                                e
+                                "Invalid TIMESTAMP_WITH_LOCAL_TIME_ZONE precision: {e}"
                             ),
                         })?,
                 )
diff --git a/fluss-rust/crates/fluss/src/metadata/partition.rs b/fluss-rust/crates/fluss/src/metadata/partition.rs
index 1ecc0dcd9e..e40fbf9e4a 100644
--- a/fluss-rust/crates/fluss/src/metadata/partition.rs
+++ b/fluss-rust/crates/fluss/src/metadata/partition.rs
@@ -131,8 +131,7 @@ impl ResolvedPartitionSpec {
             if parts.len() != 2 {
                 return Err(Error::IllegalArgument {
                     message: format!(
-                        "Invalid partition name format. Expected key=value, got: {}",
-                        pair
+                        "Invalid partition name format. Expected key=value, got: {pair}"
                     ),
                 });
             }
@@ -199,8 +198,7 @@ impl ResolvedPartitionSpec {
                 None => {
                     return Err(Error::IllegalArgument {
                         message: format!(
-                            "table does not contain partitionKey: {}",
-                            other_partition_key
+                            "table does not contain partitionKey: {other_partition_key}"
                         ),
                     });
                 }
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index c4a9195403..3b9da7d99a 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -227,8 +227,7 @@ impl SchemaBuilder {
             if !column_names.contains(auto_inc_col) {
                 return Err(IllegalArgument {
                     message: format!(
-                        "Auto increment column '{}' is not found in the schema columns.",
-                        auto_inc_col
+                        "Auto increment column '{auto_inc_col}' is not found in the schema columns."
                     ),
                 });
             }
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 4bfdc71c99..63df6de67c 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -107,7 +107,7 @@ fn validate_batch_size(batch_size_bytes: i32) -> Result<usize> {
     // Check for negative size (corrupted data)
     if batch_size_bytes < 0 {
         return Err(Error::UnexpectedError {
-            message: format!("Invalid negative batch size: {}", batch_size_bytes),
+            message: format!("Invalid negative batch size: {batch_size_bytes}"),
             source: None,
         });
     }
@@ -120,8 +120,7 @@ fn validate_batch_size(batch_size_bytes: i32) -> Result<usize> {
             .checked_add(LOG_OVERHEAD)
             .ok_or_else(|| Error::UnexpectedError {
                 message: format!(
-                    "Batch size {} + LOG_OVERHEAD {} would overflow",
-                    batch_size_u, LOG_OVERHEAD
+                    "Batch size {batch_size_u} + LOG_OVERHEAD {LOG_OVERHEAD} would overflow"
                 ),
                 source: None,
             })?;
@@ -130,8 +129,7 @@ fn validate_batch_size(batch_size_bytes: i32) -> Result<usize> {
     if total_size > MAX_BATCH_SIZE {
         return Err(Error::UnexpectedError {
             message: format!(
-                "Batch size {} exceeds maximum allowed size {}",
-                total_size, MAX_BATCH_SIZE
+                "Batch size {total_size} exceeds maximum allowed size {MAX_BATCH_SIZE}"
             ),
             source: None,
         });
@@ -259,8 +257,7 @@ impl RowAppendRecordBatchBuilder {
                     .with_precision_and_scale(*precision, *scale)
                     .map_err(|e| Error::IllegalArgument {
                         message: format!(
-                            "Invalid decimal precision {} or scale {}: {}",
-                            precision, scale, e
+                            "Invalid decimal precision {precision} or scale {scale}: {e}"
                         ),
                     })?;
                 Ok(Box::new(builder))
@@ -273,8 +270,7 @@ impl RowAppendRecordBatchBuilder {
                 }
                 _ => Err(Error::IllegalArgument {
                     message: format!(
-                        "Time32 only supports Second and Millisecond units, got: {:?}",
-                        unit
+                        "Time32 only supports Second and Millisecond units, got: {unit:?}"
                     ),
                 }),
             },
@@ -285,8 +281,7 @@ impl RowAppendRecordBatchBuilder {
                 arrow_schema::TimeUnit::Nanosecond => Ok(Box::new(Time64NanosecondBuilder::new())),
                 _ => Err(Error::IllegalArgument {
                     message: format!(
-                        "Time64 only supports Microsecond and Nanosecond units, got: {:?}",
-                        unit
+                        "Time64 only supports Microsecond and Nanosecond units, got: {unit:?}"
                     ),
                 }),
             },
@@ -592,10 +587,7 @@ impl FileSource {
         // Validate base_offset to prevent underflow in total_size()
         if base_offset > file_size {
             return Err(Error::UnexpectedError {
-                message: format!(
-                    "base_offset ({}) exceeds file_size ({})",
-                    base_offset, file_size
-                ),
+                message: format!("base_offset ({base_offset}) exceeds file_size ({file_size})"),
                 source: None,
             });
         }
@@ -1044,7 +1036,7 @@ pub fn to_arrow_type(fluss_type: &DataType) -> Result<ArrowDataType> {
             7..=9 => ArrowDataType::Time64(arrow_schema::TimeUnit::Nanosecond),
             invalid => {
                 return Err(Error::IllegalArgument {
-                    message: format!("Invalid precision {} for TimeType (must be 0-9)", invalid),
+                    message: format!("Invalid precision {invalid} for TimeType (must be 0-9)"),
                 });
             }
         },
@@ -1055,10 +1047,7 @@ pub fn to_arrow_type(fluss_type: &DataType) -> Result<ArrowDataType> {
             7..=9 => ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, None),
             invalid => {
                 return Err(Error::IllegalArgument {
-                    message: format!(
-                        "Invalid precision {} for TimestampType (must be 0-9)",
-                        invalid
-                    ),
+                    message: format!("Invalid precision {invalid} for TimestampType (must be 0-9)"),
                 });
             }
         },
@@ -1070,8 +1059,7 @@ pub fn to_arrow_type(fluss_type: &DataType) -> Result<ArrowDataType> {
             invalid => {
                 return Err(Error::IllegalArgument {
                     message: format!(
-                        "Invalid precision {} for TimestampLTzType (must be 0-9)",
-                        invalid
+                        "Invalid precision {invalid} for TimestampLTzType (must be 0-9)"
                     ),
                 });
             }
@@ -1939,13 +1927,13 @@ mod tests {
             },
         )?;
 
-        let mut row = GenericRow::new();
+        let mut row = GenericRow::new(2);
         row.set_field(0, 1_i32);
         row.set_field(1, "alice");
         let record = WriteRecord::for_append(table_path.clone(), 1, row);
         builder.append(&record)?;
 
-        let mut row2 = GenericRow::new();
+        let mut row2 = GenericRow::new(2);
         row2.set_field(0, 2_i32);
         row2.set_field(1, "bob");
         let record2 = WriteRecord::for_append(table_path, 2, row2);
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 615e038454..46c25b247d 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -199,10 +199,7 @@ impl InternalRow for ColumnarRow {
         let field = schema.field(pos);
         let arrow_scale = match field.data_type() {
             DataType::Decimal128(_p, s) => *s as i64,
-            dt => panic!(
-                "Expected Decimal128 data type at column {}, found: {:?}",
-                pos, dt
-            ),
+            dt => panic!("Expected Decimal128 data type at column {pos}, found: {dt:?}"),
         };
 
         let i128_val = array.value(self.row_id);
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index 40470db170..00e53aa142 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -50,7 +50,7 @@ impl<'a> CompactedRowDeserializer<'a> {
     }
 
     pub fn deserialize(&self, reader: &CompactedRowReader<'a>) -> GenericRow<'a> {
-        let mut row = GenericRow::new();
+        let mut row = GenericRow::new(self.row_type.fields().len());
         let mut cursor = reader.initial_position();
         for (col_pos, data_field) in self.row_type.fields().iter().enumerate() {
             let dtype = &data_field.data_type;
@@ -161,10 +161,7 @@ impl<'a> CompactedRowDeserializer<'a> {
                     }
                 }
                 _ => {
-                    panic!(
-                        "Unsupported DataType in CompactedRowDeserializer: {:?}",
-                        dtype
-                    );
+                    panic!("Unsupported DataType in CompactedRowDeserializer: {dtype:?}");
                 }
             };
             cursor = next_cursor;
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 7b3850f880..b808373084 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -407,8 +407,7 @@ fn millis_nanos_to_micros(millis: i64, nanos: i32) -> Result<i64> {
         .checked_mul(MICROS_PER_MILLI)
         .ok_or_else(|| RowConvertError {
             message: format!(
-                "Timestamp milliseconds {} overflows when converting to microseconds",
-                millis
+                "Timestamp milliseconds {millis} overflows when converting to microseconds"
             ),
         })?;
     let nanos_micros = (nanos as i64) / MICROS_PER_MILLI;
@@ -416,8 +415,7 @@ fn millis_nanos_to_micros(millis: i64, nanos: i32) -> Result<i64> {
         .checked_add(nanos_micros)
         .ok_or_else(|| RowConvertError {
             message: format!(
-                "Timestamp overflow when adding microseconds: {} + {}",
-                millis_micros, nanos_micros
+                "Timestamp overflow when adding microseconds: {millis_micros} + {nanos_micros}"
             ),
         })
 }
@@ -429,16 +427,14 @@ fn millis_nanos_to_nanos(millis: i64, nanos: i32) -> Result<i64> {
         .checked_mul(NANOS_PER_MILLI)
         .ok_or_else(|| RowConvertError {
             message: format!(
-                "Timestamp milliseconds {} overflows when converting to nanoseconds",
-                millis
+                "Timestamp milliseconds {millis} overflows when converting to nanoseconds"
             ),
         })?;
     millis_nanos
         .checked_add(nanos as i64)
         .ok_or_else(|| RowConvertError {
             message: format!(
-                "Timestamp overflow when adding nanoseconds: {} + {}",
-                millis_nanos, nanos
+                "Timestamp overflow when adding nanoseconds: {millis_nanos} + {nanos}"
             ),
         })
 }
@@ -504,10 +500,7 @@ impl Datum<'_> {
                     arrow_schema::DataType::Decimal128(p, s) => (*p, *s),
                     _ => {
                         return Err(RowConvertError {
-                            message: format!(
-                                "Expected Decimal128 Arrow type, got: {:?}",
-                                data_type
-                            ),
+                            message: format!("Expected Decimal128 Arrow type, got: {data_type:?}"),
                         });
                     }
                 };
@@ -515,7 +508,7 @@ impl Datum<'_> {
                 // Validate scale is non-negative (Fluss doesn't support negative scales)
                 if s < 0 {
                     return Err(RowConvertError {
-                        message: format!("Negative decimal scale {} is not supported", s),
+                        message: format!("Negative decimal scale {s} is not supported"),
                     });
                 }
 
@@ -535,8 +528,7 @@ impl Datum<'_> {
                     if actual_precision > target_precision as usize {
                         return Err(RowConvertError {
                             message: format!(
-                                "Decimal precision overflow: value has {} digits but Arrow expects {} (value: {})",
-                                actual_precision, target_precision, rescaled
+                                "Decimal precision overflow: value has {actual_precision} digits but Arrow expects {target_precision} (value: {rescaled})"
                             ),
                         });
                     }
@@ -546,7 +538,7 @@ impl Datum<'_> {
                         Ok(v) => v,
                         Err(_) => {
                             return Err(RowConvertError {
-                                message: format!("Decimal value exceeds i128 range: {}", rescaled),
+                                message: format!("Decimal value exceeds i128 range: {rescaled}"),
                             });
                         }
                     };
@@ -575,8 +567,7 @@ impl Datum<'_> {
                             if millis % MILLIS_PER_SECOND as i32 != 0 {
                                 return Err(RowConvertError {
                                     message: format!(
-                                        "Time value {} ms has sub-second precision but schema expects seconds only",
-                                        millis
+                                        "Time value {millis} ms has sub-second precision but schema expects seconds only"
                                     ),
                                 });
                             }
@@ -602,8 +593,7 @@ impl Datum<'_> {
                                 .checked_mul(MICROS_PER_MILLI)
                                 .ok_or_else(|| RowConvertError {
                                     message: format!(
-                                        "Time value {} ms overflows when converting to microseconds",
-                                        millis
+                                        "Time value {millis} ms overflows when converting to microseconds"
                                     ),
                                 })?;
                             b.append_value(micros);
@@ -618,8 +608,7 @@ impl Datum<'_> {
                             let nanos = (millis as i64).checked_mul(NANOS_PER_MILLI).ok_or_else(
                                 || RowConvertError {
                                     message: format!(
-                                        "Time value {} ms overflows when converting to nanoseconds",
-                                        millis
+                                        "Time value {millis} ms overflows when converting to nanoseconds"
                                     ),
                                 },
                             )?;
@@ -630,8 +619,7 @@ impl Datum<'_> {
                     _ => {
                         return Err(RowConvertError {
                             message: format!(
-                                "Expected Time32/Time64 Arrow type, got: {:?}",
-                                data_type
+                                "Expected Time32/Time64 Arrow type, got: {data_type:?}"
                             ),
                         });
                     }
@@ -808,8 +796,7 @@ impl TimestampNtz {
         if !(0..=MAX_NANO_OF_MILLISECOND).contains(&nano_of_millisecond) {
             return Err(crate::error::Error::IllegalArgument {
                 message: format!(
-                    "nanoOfMillisecond must be in range [0, {}], got: {}",
-                    MAX_NANO_OF_MILLISECOND, nano_of_millisecond
+                    "nanoOfMillisecond must be in range [0, {MAX_NANO_OF_MILLISECOND}], got: {nano_of_millisecond}"
                 ),
             });
         }
@@ -856,8 +843,7 @@ impl TimestampLtz {
         if !(0..=MAX_NANO_OF_MILLISECOND).contains(&nano_of_millisecond) {
             return Err(crate::error::Error::IllegalArgument {
                 message: format!(
-                    "nanoOfMillisecond must be in range [0, {}], got: {}",
-                    MAX_NANO_OF_MILLISECOND, nano_of_millisecond
+                    "nanoOfMillisecond must be in range [0, {MAX_NANO_OF_MILLISECOND}], got: {nano_of_millisecond}"
                 ),
             });
         }
@@ -1030,10 +1016,8 @@ mod timestamp_tests {
     #[test]
     fn test_timestamp_nanos_out_of_range() {
         // Test that both TimestampNtz and TimestampLtz reject invalid nanos
-        let expected_msg = format!(
-            "nanoOfMillisecond must be in range [0, {}]",
-            MAX_NANO_OF_MILLISECOND
-        );
+        let expected_msg =
+            format!("nanoOfMillisecond must be in range [0, {MAX_NANO_OF_MILLISECOND}]");
 
         // Too large (1,000,000 is just beyond the valid range)
         let result_ntz = TimestampNtz::from_millis_nanos(1000, MAX_NANO_OF_MILLISECOND + 1);
diff --git a/fluss-rust/crates/fluss/src/row/decimal.rs b/fluss-rust/crates/fluss/src/row/decimal.rs
index b14bde50a4..fd21b82968 100644
--- a/fluss-rust/crates/fluss/src/row/decimal.rs
+++ b/fluss-rust/crates/fluss/src/row/decimal.rs
@@ -129,16 +129,14 @@ impl Decimal {
         // Sanity check that scale matches
         debug_assert_eq!(
             exp, scale as i64,
-            "Scaled decimal exponent ({}) != expected scale ({})",
-            exp, scale
+            "Scaled decimal exponent ({exp}) != expected scale ({scale})"
         );
 
         let actual_precision = Self::compute_precision(&unscaled);
         if actual_precision > precision as usize {
             return Err(Error::IllegalArgument {
                 message: format!(
-                    "Decimal precision overflow: value has {} digits but precision is {} (value: {})",
-                    actual_precision, precision, scaled
+                    "Decimal precision overflow: value has {actual_precision} digits but precision is {precision} (value: {scaled})"
                 ),
             });
         }
@@ -147,8 +145,7 @@ impl Decimal {
         let long_val = if precision <= MAX_COMPACT_PRECISION {
             Some(i64::try_from(&unscaled).map_err(|_| Error::IllegalArgument {
                 message: format!(
-                    "Decimal mantissa exceeds i64 range for compact precision {}: unscaled={} (value={})",
-                    precision, unscaled, scaled
+                    "Decimal mantissa exceeds i64 range for compact precision {precision}: unscaled={unscaled} (value={scaled})"
                 ),
             })?)
         } else {
@@ -168,8 +165,7 @@ impl Decimal {
         if precision > MAX_COMPACT_PRECISION {
             return Err(Error::IllegalArgument {
                 message: format!(
-                    "Precision {} exceeds MAX_COMPACT_PRECISION ({})",
-                    precision, MAX_COMPACT_PRECISION
+                    "Precision {precision} exceeds MAX_COMPACT_PRECISION ({MAX_COMPACT_PRECISION})"
                 ),
             });
         }
@@ -178,8 +174,7 @@ impl Decimal {
         if actual_precision > precision as usize {
             return Err(Error::IllegalArgument {
                 message: format!(
-                    "Decimal precision overflow: unscaled value has {} digits but precision is {}",
-                    actual_precision, precision
+                    "Decimal precision overflow: unscaled value has {actual_precision} digits but precision is {precision}"
                 ),
             });
         }
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 81a425408f..f7c8bec5dc 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -159,6 +159,23 @@ impl<'a> InternalRow for GenericRow<'a> {
         self.values.get(_pos).unwrap().try_into().unwrap()
     }
 
+    fn get_float(&self, pos: usize) -> f32 {
+        self.values.get(pos).unwrap().try_into().unwrap()
+    }
+
+    fn get_double(&self, pos: usize) -> f64 {
+        self.values.get(pos).unwrap().try_into().unwrap()
+    }
+
+    fn get_char(&self, pos: usize, _length: usize) -> &str {
+        // don't check length, following java client
+        self.get_string(pos)
+    }
+
+    fn get_string(&self, pos: usize) -> &str {
+        self.values.get(pos).unwrap().try_into().unwrap()
+    }
+
     fn get_decimal(&self, pos: usize, _precision: usize, _scale: usize) -> Decimal {
         match self.values.get(pos).unwrap() {
             Datum::Decimal(d) => d.clone(),
@@ -196,23 +213,6 @@ impl<'a> InternalRow for GenericRow<'a> {
         }
     }
 
-    fn get_float(&self, pos: usize) -> f32 {
-        self.values.get(pos).unwrap().try_into().unwrap()
-    }
-
-    fn get_double(&self, pos: usize) -> f64 {
-        self.values.get(pos).unwrap().try_into().unwrap()
-    }
-
-    fn get_char(&self, pos: usize, _length: usize) -> &str {
-        // don't check length, following java client
-        self.get_string(pos)
-    }
-
-    fn get_string(&self, pos: usize) -> &str {
-        self.values.get(pos).unwrap().try_into().unwrap()
-    }
-
     fn get_binary(&self, pos: usize, _length: usize) -> &[u8] {
         self.values.get(pos).unwrap().as_blob()
     }
@@ -222,24 +222,39 @@ impl<'a> InternalRow for GenericRow<'a> {
     }
 }
 
-impl<'a> Default for GenericRow<'a> {
-    fn default() -> Self {
-        Self::new()
-    }
-}
-
 impl<'a> GenericRow<'a> {
     pub fn from_data(data: Vec<impl Into<Datum<'a>>>) -> GenericRow<'a> {
         GenericRow {
             values: data.into_iter().map(Into::into).collect(),
         }
     }
-    pub fn new() -> GenericRow<'a> {
-        GenericRow { values: vec![] }
+
+    /// Creates a GenericRow with the specified number of fields, all initialized to null.
+    ///
+    /// This is useful when you need to create a row with a specific field count
+    /// but only want to set some fields (e.g., for KV delete operations where
+    /// only primary key fields need to be set).
+    ///
+    /// # Example
+    /// ```
+    /// use fluss::row::GenericRow;
+    ///
+    /// let mut row = GenericRow::new(3);
+    /// row.set_field(0, 42); // Only set the primary key
+    /// // Fields 1 and 2 remain null
+    /// ```
+    pub fn new(field_count: usize) -> GenericRow<'a> {
+        GenericRow {
+            values: vec![Datum::Null; field_count],
+        }
     }
 
+    /// Sets the field at the given position to the specified value.
+    ///
+    /// # Panics
+    /// Panics if `pos` is out of bounds (>= field count).
     pub fn set_field(&mut self, pos: usize, value: impl Into<Datum<'a>>) {
-        self.values.insert(pos, value.into());
+        self.values[pos] = value.into();
     }
 }
 
@@ -249,11 +264,32 @@ mod tests {
 
     #[test]
     fn is_null_at_checks_datum_nullity() {
-        let mut row = GenericRow::new();
+        let mut row = GenericRow::new(2);
         row.set_field(0, Datum::Null);
         row.set_field(1, 42_i32);
 
         assert!(row.is_null_at(0));
         assert!(!row.is_null_at(1));
     }
+
+    #[test]
+    fn new_initializes_nulls() {
+        let row = GenericRow::new(3);
+        assert_eq!(row.get_field_count(), 3);
+        assert!(row.is_null_at(0));
+        assert!(row.is_null_at(1));
+        assert!(row.is_null_at(2));
+    }
+
+    #[test]
+    fn partial_row_for_delete() {
+        // Simulates delete scenario: only primary key (field 0) is set
+        let mut row = GenericRow::new(3);
+        row.set_field(0, 123_i32);
+        // Fields 1 and 2 remain null
+        assert_eq!(row.get_field_count(), 3);
+        assert_eq!(row.get_int(0), 123);
+        assert!(row.is_null_at(1));
+        assert!(row.is_null_at(2));
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index 3f46f9f6eb..a4f2961760 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -53,10 +53,8 @@ mod kv_table_test {
     }
 
     fn make_key(id: i32) -> GenericRow<'static> {
-        let mut row = GenericRow::new();
+        let mut row = GenericRow::new(3);
         row.set_field(0, id);
-        row.set_field(1, "");
-        row.set_field(2, 0i64);
         row
     }
 
@@ -98,7 +96,7 @@ mod kv_table_test {
 
         // Upsert rows
         for (id, name, age) in &test_data {
-            let mut row = GenericRow::new();
+            let mut row = GenericRow::new(3);
             row.set_field(0, *id);
             row.set_field(1, *name);
             row.set_field(2, *age);
@@ -132,7 +130,7 @@ mod kv_table_test {
         }
 
         // Update the record with new age
-        let mut updated_row = GenericRow::new();
+        let mut updated_row = GenericRow::new(3);
         updated_row.set_field(0, 1);
         updated_row.set_field(1, "Verso");
         updated_row.set_field(2, 33i64);
@@ -162,10 +160,8 @@ mod kv_table_test {
         );
 
         // Delete record with id=1
-        let mut delete_row = GenericRow::new();
+        let mut delete_row = GenericRow::new(3);
         delete_row.set_field(0, 1);
-        delete_row.set_field(1, "");
-        delete_row.set_field(2, 0i64);
         upsert_writer
             .delete(&delete_row)
             .await
@@ -262,7 +258,7 @@ mod kv_table_test {
         ];
 
         for (region, user_id, score) in &test_data {
-            let mut row = GenericRow::new();
+            let mut row = GenericRow::new(3);
             row.set_field(0, *region);
             row.set_field(1, *user_id);
             row.set_field(2, *score);
@@ -277,7 +273,7 @@ mod kv_table_test {
             .expect("Failed to create lookuper");
 
         // Lookup (US, 1) - should return score 100
-        let mut key = GenericRow::new();
+        let mut key = GenericRow::new(3);
         key.set_field(0, "US");
         key.set_field(1, 1);
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
@@ -288,7 +284,7 @@ mod kv_table_test {
         assert_eq!(row.get_long(2), 100, "Score for (US, 1) should be 100");
 
         // Lookup (EU, 2) - should return score 250
-        let mut key = GenericRow::new();
+        let mut key = GenericRow::new(3);
         key.set_field(0, "EU");
         key.set_field(1, 2);
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
@@ -299,7 +295,7 @@ mod kv_table_test {
         assert_eq!(row.get_long(2), 250, "Score for (EU, 2) should be 250");
 
         // Update (US, 1) score
-        let mut update_row = GenericRow::new();
+        let mut update_row = GenericRow::new(3);
         update_row.set_field(0, "US");
         update_row.set_field(1, 1);
         update_row.set_field(2, 500i64);
@@ -309,7 +305,7 @@ mod kv_table_test {
             .expect("Failed to update");
 
         // Verify update
-        let mut key = GenericRow::new();
+        let mut key = GenericRow::new(3);
         key.set_field(0, "US");
         key.set_field(1, 1);
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
@@ -367,7 +363,7 @@ mod kv_table_test {
             .create_writer()
             .expect("Failed to create writer");
 
-        let mut row = GenericRow::new();
+        let mut row = GenericRow::new(4);
         row.set_field(0, 1);
         row.set_field(1, "Verso");
         row.set_field(2, 32i64);
@@ -407,7 +403,7 @@ mod kv_table_test {
             .expect("Failed to create UpsertWriter with partial write");
 
         // Update only the score column
-        let mut partial_row = GenericRow::new();
+        let mut partial_row = GenericRow::new(4);
         partial_row.set_field(0, 1);
         partial_row.set_field(1, Datum::Null); // not in partial update column
         partial_row.set_field(2, Datum::Null); // not in partial update column
@@ -522,7 +518,7 @@ mod kv_table_test {
         let col_binary: &[u8] = b"fixed binary data!!!";
 
         // Upsert a row with all datatypes
-        let mut row = GenericRow::new();
+        let mut row = GenericRow::new(17);
         row.set_field(0, pk_int);
         row.set_field(1, col_boolean);
         row.set_field(2, col_tinyint);
@@ -553,7 +549,7 @@ mod kv_table_test {
             .create_lookuper()
             .expect("Failed to create lookuper");
 
-        let mut key = GenericRow::new();
+        let mut key = GenericRow::new(17);
         key.set_field(0, pk_int);
 
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
@@ -625,7 +621,7 @@ mod kv_table_test {
 
         // Test with null values for nullable columns
         let pk_int_2 = 2i32;
-        let mut row_with_nulls = GenericRow::new();
+        let mut row_with_nulls = GenericRow::new(17);
         row_with_nulls.set_field(0, pk_int_2);
         row_with_nulls.set_field(1, Datum::Null); // col_boolean
         row_with_nulls.set_field(2, Datum::Null); // col_tinyint
@@ -650,7 +646,7 @@ mod kv_table_test {
             .expect("Failed to upsert row with nulls");
 
         // Lookup row with nulls
-        let mut key2 = GenericRow::new();
+        let mut key2 = GenericRow::new(17);
         key2.set_field(0, pk_int_2);
 
         let result = lookuper.lookup(&key2).await.expect("Failed to lookup");
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index e28a8362e0..c83da0f23c 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -146,7 +146,7 @@ mod table_remote_scan_test {
         // append 20 rows, there must be some tiered to remote
         let record_count = 20;
         for i in 0..record_count {
-            let mut row = GenericRow::new();
+            let mut row = GenericRow::new(2);
             row.set_field(0, i as i32);
             let v = format!("v{}", i);
             row.set_field(1, v.as_str());

From 24c46340f7cd69460cdc911d1edeac57ed494226 Mon Sep 17 00:00:00 2001
From: SkylerLin <44233950+linguoxuan@users.noreply.github.com>
Date: Mon, 26 Jan 2026 12:12:10 +0800
Subject: [PATCH 089/287] test: add it for produce & scan log for all supported
 datatypes (#205)

---
 fluss-rust/crates/fluss/src/row/column.rs     | 164 +++++---
 .../crates/fluss/tests/integration/table.rs   | 391 ++++++++++++++++++
 2 files changed, 507 insertions(+), 48 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 46c25b247d..f48075b369 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -17,8 +17,11 @@
 
 use crate::row::InternalRow;
 use arrow::array::{
-    Array, AsArray, BinaryArray, Decimal128Array, FixedSizeBinaryArray, Float32Array, Float64Array,
-    Int8Array, Int16Array, Int32Array, Int64Array, RecordBatch, StringArray,
+    Array, AsArray, BinaryArray, Date32Array, Decimal128Array, FixedSizeBinaryArray, Float32Array,
+    Float64Array, Int8Array, Int16Array, Int32Array, Int64Array, RecordBatch, StringArray,
+    Time32MillisecondArray, Time32SecondArray, Time64MicrosecondArray, Time64NanosecondArray,
+    TimestampMicrosecondArray, TimestampMillisecondArray, TimestampNanosecondArray,
+    TimestampSecondArray,
 };
 use arrow::datatypes::{DataType as ArrowDataType, TimeUnit};
 use std::sync::Arc;
@@ -67,35 +70,110 @@ impl ColumnarRow {
     ) -> T {
         let schema = self.record_batch.schema();
         let arrow_field = schema.field(pos);
-        let value = self.get_long(pos);
+        let column = self.record_batch.column(pos);
 
-        match arrow_field.data_type() {
-            ArrowDataType::Timestamp(time_unit, _) => {
-                // Convert based on Arrow TimeUnit
-                let (millis, nanos) = match time_unit {
-                    TimeUnit::Second => (value * 1000, 0),
-                    TimeUnit::Millisecond => (value, 0),
-                    TimeUnit::Microsecond => {
-                        let millis = value / 1000;
-                        let nanos = ((value % 1000) * 1000) as i32;
-                        (millis, nanos)
-                    }
-                    TimeUnit::Nanosecond => {
-                        let millis = value / 1_000_000;
-                        let nanos = (value % 1_000_000) as i32;
-                        (millis, nanos)
-                    }
-                };
-
-                if nanos == 0 {
-                    construct_compact(millis)
-                } else {
-                    // nanos is guaranteed to be in valid range [0, 999_999] by arithmetic
-                    construct_with_nanos(millis, nanos)
-                        .expect("nanos in valid range by construction")
+        // Read value based on the actual Arrow timestamp type
+        let value = match arrow_field.data_type() {
+            ArrowDataType::Timestamp(TimeUnit::Second, _) => column
+                .as_any()
+                .downcast_ref::<TimestampSecondArray>()
+                .expect("Expected TimestampSecondArray")
+                .value(self.row_id),
+            ArrowDataType::Timestamp(TimeUnit::Millisecond, _) => column
+                .as_any()
+                .downcast_ref::<TimestampMillisecondArray>()
+                .expect("Expected TimestampMillisecondArray")
+                .value(self.row_id),
+            ArrowDataType::Timestamp(TimeUnit::Microsecond, _) => column
+                .as_any()
+                .downcast_ref::<TimestampMicrosecondArray>()
+                .expect("Expected TimestampMicrosecondArray")
+                .value(self.row_id),
+            ArrowDataType::Timestamp(TimeUnit::Nanosecond, _) => column
+                .as_any()
+                .downcast_ref::<TimestampNanosecondArray>()
+                .expect("Expected TimestampNanosecondArray")
+                .value(self.row_id),
+            other => panic!("Expected Timestamp column at position {pos}, got {other:?}"),
+        };
+
+        // Split the raw value into (millis, nanos-of-millisecond) based on the Arrow TimeUnit
+        let (millis, nanos) = match arrow_field.data_type() {
+            ArrowDataType::Timestamp(time_unit, _) => match time_unit {
+                TimeUnit::Second => (value * 1000, 0),
+                TimeUnit::Millisecond => (value, 0),
+                TimeUnit::Microsecond => {
+                    // Use Euclidean division so that nanos is always non-negative,
+                    // even for timestamps before the Unix epoch.
+                    let millis = value.div_euclid(1000);
+                    let nanos = (value.rem_euclid(1000) * 1000) as i32;
+                    (millis, nanos)
+                }
+                TimeUnit::Nanosecond => {
+                    // Use Euclidean division so that nanos is always in [0, 999_999].
+                    let millis = value.div_euclid(1_000_000);
+                    let nanos = value.rem_euclid(1_000_000) as i32;
+                    (millis, nanos)
                 }
+            },
+            _ => unreachable!(),
+        };
+
+        if nanos == 0 {
+            construct_compact(millis)
+        } else {
+            // rem_euclid above keeps nanos non-negative, so it is within [0, 999_999]
+            construct_with_nanos(millis, nanos).expect("nanos in valid range by construction")
+        }
+    }
+
+    /// Read date value from Arrow Date32Array
+    fn read_date_from_arrow(&self, pos: usize) -> i32 {
+        self.record_batch
+            .column(pos)
+            .as_any()
+            .downcast_ref::<Date32Array>()
+            .expect("Expected Date32Array")
+            .value(self.row_id)
+    }
+
+    /// Read time from Arrow Time32/Time64 arrays as milliseconds, truncating finer precision
+    fn read_time_from_arrow(&self, pos: usize) -> i32 {
+        let schema = self.record_batch.schema();
+        let arrow_field = schema.field(pos);
+        let column = self.record_batch.column(pos);
+
+        match arrow_field.data_type() {
+            ArrowDataType::Time32(TimeUnit::Second) => {
+                let value = column
+                    .as_any()
+                    .downcast_ref::<Time32SecondArray>()
+                    .expect("Expected Time32SecondArray")
+                    .value(self.row_id);
+                value * 1000 // Convert seconds to milliseconds
             }
-            other => panic!("Expected Timestamp column at position {pos}, got {other:?}"),
+            ArrowDataType::Time32(TimeUnit::Millisecond) => column
+                .as_any()
+                .downcast_ref::<Time32MillisecondArray>()
+                .expect("Expected Time32MillisecondArray")
+                .value(self.row_id),
+            ArrowDataType::Time64(TimeUnit::Microsecond) => {
+                let value = column
+                    .as_any()
+                    .downcast_ref::<Time64MicrosecondArray>()
+                    .expect("Expected Time64MicrosecondArray")
+                    .value(self.row_id);
+                (value / 1000) as i32 // Convert microseconds to milliseconds
+            }
+            ArrowDataType::Time64(TimeUnit::Nanosecond) => {
+                let value = column
+                    .as_any()
+                    .downcast_ref::<Time64NanosecondArray>()
+                    .expect("Expected Time64NanosecondArray")
+                    .value(self.row_id);
+                (value / 1_000_000) as i32 // Convert nanoseconds to milliseconds
+            }
+            other => panic!("Expected Time column at position {pos}, got {other:?}"),
         }
     }
 }
@@ -220,11 +298,11 @@ impl InternalRow for ColumnarRow {
     }
 
     fn get_date(&self, pos: usize) -> crate::row::datum::Date {
-        crate::row::datum::Date::new(self.get_int(pos))
+        crate::row::datum::Date::new(self.read_date_from_arrow(pos))
     }
 
     fn get_time(&self, pos: usize) -> crate::row::datum::Time {
-        crate::row::datum::Time::new(self.get_int(pos))
+        crate::row::datum::Time::new(self.read_time_from_arrow(pos))
     }
 
     fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampNtz {
@@ -250,16 +328,12 @@ impl InternalRow for ColumnarRow {
     }
 
     fn get_char(&self, pos: usize, _length: usize) -> &str {
-        let array = self
-            .record_batch
+        self.record_batch
             .column(pos)
             .as_any()
-            .downcast_ref::<FixedSizeBinaryArray>()
-            .expect("Expected fixed-size binary array for char type");
-
-        let bytes = array.value(self.row_id);
-        // don't check length, following java client
-        std::str::from_utf8(bytes).expect("Invalid UTF-8 in char field")
+            .downcast_ref::<StringArray>()
+            .expect("Expected String array for char type")
+            .value(self.row_id)
     }
 
     fn get_string(&self, pos: usize) -> &str {
@@ -294,8 +368,8 @@ impl InternalRow for ColumnarRow {
 mod tests {
     use super::*;
     use arrow::array::{
-        BinaryArray, BooleanArray, FixedSizeBinaryArray, Float32Array, Float64Array, Int8Array,
-        Int16Array, Int32Array, Int64Array, StringArray,
+        BinaryArray, BooleanArray, Float32Array, Float64Array, Int8Array, Int16Array, Int32Array,
+        Int64Array, StringArray,
     };
     use arrow::datatypes::{DataType, Field, Schema};
 
@@ -311,7 +385,7 @@ mod tests {
             Field::new("f64", DataType::Float64, false),
             Field::new("s", DataType::Utf8, false),
             Field::new("bin", DataType::Binary, false),
-            Field::new("char", DataType::FixedSizeBinary(2), false),
+            Field::new("char", DataType::Utf8, false),
         ]));
 
         let batch = RecordBatch::try_new(
@@ -326,13 +400,7 @@ mod tests {
                 Arc::new(Float64Array::from(vec![2.5])),
                 Arc::new(StringArray::from(vec!["hello"])),
                 Arc::new(BinaryArray::from(vec![b"data".as_slice()])),
-                Arc::new(
-                    FixedSizeBinaryArray::try_from_sparse_iter_with_size(
-                        vec![Some(b"ab".as_slice())].into_iter(),
-                        2,
-                    )
-                    .expect("fixed array"),
-                ),
+                Arc::new(StringArray::from(vec!["ab"])),
             ],
         )
         .expect("record batch");
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/table.rs
index 046ec02388..6a15674076 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table.rs
@@ -576,4 +576,395 @@ mod table_test {
         // Projected batch should have 1 column (id), not 2 (id, name)
         assert_eq!(proj_batches[0].batch().num_columns(), 1);
     }
+
+    /// Integration test covering produce and scan operations for all supported datatypes
+    /// in log tables.
+    #[tokio::test]
+    async fn all_supported_datatypes() {
+        use fluss::row::{Date, Datum, Decimal, GenericRow, Time, TimestampLtz, TimestampNtz};
+
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss".to_string(), "test_log_all_datatypes".to_string());
+
+        // Create a log table with all supported datatypes for append/scan
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    // Integer types
+                    .column("col_tinyint", DataTypes::tinyint())
+                    .column("col_smallint", DataTypes::smallint())
+                    .column("col_int", DataTypes::int())
+                    .column("col_bigint", DataTypes::bigint())
+                    // Floating point types
+                    .column("col_float", DataTypes::float())
+                    .column("col_double", DataTypes::double())
+                    // Boolean type
+                    .column("col_boolean", DataTypes::boolean())
+                    // Char type
+                    .column("col_char", DataTypes::char(10))
+                    // String type
+                    .column("col_string", DataTypes::string())
+                    // Decimal type
+                    .column("col_decimal", DataTypes::decimal(10, 2))
+                    // Date type
+                    .column("col_date", DataTypes::date())
+                    // Time types
+                    .column("col_time_s", DataTypes::time_with_precision(0))
+                    .column("col_time_ms", DataTypes::time_with_precision(3))
+                    .column("col_time_us", DataTypes::time_with_precision(6))
+                    .column("col_time_ns", DataTypes::time_with_precision(9))
+                    // Timestamp types
+                    .column("col_timestamp_s", DataTypes::timestamp_with_precision(0))
+                    .column("col_timestamp_ms", DataTypes::timestamp_with_precision(3))
+                    .column("col_timestamp_us", DataTypes::timestamp_with_precision(6))
+                    .column("col_timestamp_ns", DataTypes::timestamp_with_precision(9))
+                    // Timestamp_ltz types
+                    .column(
+                        "col_timestamp_ltz_s",
+                        DataTypes::timestamp_ltz_with_precision(0),
+                    )
+                    .column(
+                        "col_timestamp_ltz_ms",
+                        DataTypes::timestamp_ltz_with_precision(3),
+                    )
+                    .column(
+                        "col_timestamp_ltz_us",
+                        DataTypes::timestamp_ltz_with_precision(6),
+                    )
+                    .column(
+                        "col_timestamp_ltz_ns",
+                        DataTypes::timestamp_ltz_with_precision(9),
+                    )
+                    // Bytes type
+                    .column("col_bytes", DataTypes::bytes())
+                    // Timestamp types with negative values (before Unix epoch)
+                    .column(
+                        "col_timestamp_us_neg",
+                        DataTypes::timestamp_with_precision(6),
+                    )
+                    .column(
+                        "col_timestamp_ns_neg",
+                        DataTypes::timestamp_with_precision(9),
+                    )
+                    .column(
+                        "col_timestamp_ltz_us_neg",
+                        DataTypes::timestamp_ltz_with_precision(6),
+                    )
+                    .column(
+                        "col_timestamp_ltz_ns_neg",
+                        DataTypes::timestamp_ltz_with_precision(9),
+                    )
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let field_count = table.table_info().schema.columns().len();
+
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer();
+
+        // Test data for all datatypes
+        let col_tinyint = 127i8;
+        let col_smallint = 32767i16;
+        let col_int = 2147483647i32;
+        let col_bigint = 9223372036854775807i64;
+        let col_float = 3.14f32;
+        let col_double = 2.718281828459045f64;
+        let col_boolean = true;
+        let col_char = "hello";
+        let col_string = "world of fluss rust client";
+        let col_decimal = Decimal::from_unscaled_long(12345, 10, 2).unwrap(); // 123.45
+        let col_date = Date::new(20476); // 2026-01-23
+        let col_time_s = Time::new(36827000); // 10:13:47
+        let col_time_ms = Time::new(36827123); // 10:13:47.123
+        let col_time_us = Time::new(86399999); // 23:59:59.999
+        let col_time_ns = Time::new(1); // 00:00:00.001
+        // 2026-01-23 10:13:47 UTC
+        let col_timestamp_s = TimestampNtz::new(1769163227000);
+        // 2026-01-23 10:13:47.123 UTC
+        let col_timestamp_ms = TimestampNtz::new(1769163227123);
+        // 2026-01-23 10:13:47.123456 UTC
+        let col_timestamp_us = TimestampNtz::from_millis_nanos(1769163227123, 456000).unwrap();
+        // 2026-01-23 10:13:47.123999999 UTC
+        let col_timestamp_ns = TimestampNtz::from_millis_nanos(1769163227123, 999_999).unwrap();
+        let col_timestamp_ltz_s = TimestampLtz::new(1769163227000);
+        let col_timestamp_ltz_ms = TimestampLtz::new(1769163227123);
+        let col_timestamp_ltz_us = TimestampLtz::from_millis_nanos(1769163227123, 456000).unwrap();
+        let col_timestamp_ltz_ns = TimestampLtz::from_millis_nanos(1769163227123, 999_999).unwrap();
+        let col_bytes: Vec<u8> = b"binary data".to_vec();
+
+        // 1960-06-15 11:50:45.123456 UTC (before 1970)
+        let col_timestamp_us_neg = TimestampNtz::from_millis_nanos(-301234154877, 456000).unwrap();
+        // 1960-06-15 11:50:45.123999999 UTC (before 1970)
+        let col_timestamp_ns_neg = TimestampNtz::from_millis_nanos(-301234154877, 999_999).unwrap();
+        let col_timestamp_ltz_us_neg =
+            TimestampLtz::from_millis_nanos(-301234154877, 456000).unwrap();
+        let col_timestamp_ltz_ns_neg =
+            TimestampLtz::from_millis_nanos(-301234154877, 999_999).unwrap();
+
+        // Append a row with all datatypes
+        let mut row = GenericRow::new(field_count);
+        row.set_field(0, col_tinyint);
+        row.set_field(1, col_smallint);
+        row.set_field(2, col_int);
+        row.set_field(3, col_bigint);
+        row.set_field(4, col_float);
+        row.set_field(5, col_double);
+        row.set_field(6, col_boolean);
+        row.set_field(7, col_char);
+        row.set_field(8, col_string);
+        row.set_field(9, col_decimal.clone());
+        row.set_field(10, col_date);
+        row.set_field(11, col_time_s);
+        row.set_field(12, col_time_ms);
+        row.set_field(13, col_time_us);
+        row.set_field(14, col_time_ns);
+        row.set_field(15, col_timestamp_s);
+        row.set_field(16, col_timestamp_ms);
+        row.set_field(17, col_timestamp_us.clone());
+        row.set_field(18, col_timestamp_ns.clone());
+        row.set_field(19, col_timestamp_ltz_s);
+        row.set_field(20, col_timestamp_ltz_ms);
+        row.set_field(21, col_timestamp_ltz_us.clone());
+        row.set_field(22, col_timestamp_ltz_ns.clone());
+        row.set_field(23, col_bytes.as_slice());
+        row.set_field(24, col_timestamp_us_neg.clone());
+        row.set_field(25, col_timestamp_ns_neg.clone());
+        row.set_field(26, col_timestamp_ltz_us_neg.clone());
+        row.set_field(27, col_timestamp_ltz_ns_neg.clone());
+
+        append_writer
+            .append(row)
+            .await
+            .expect("Failed to append row with all datatypes");
+
+        // Append a row with null values for all columns
+        let mut row_with_nulls = GenericRow::new(field_count);
+        for i in 0..field_count {
+            row_with_nulls.set_field(i, Datum::Null);
+        }
+
+        append_writer
+            .append(row_with_nulls)
+            .await
+            .expect("Failed to append row with nulls");
+
+        append_writer.flush().await.expect("Failed to flush");
+
+        // Scan the records
+        let records = scan_table(&table, |scan| scan).await;
+
+        assert_eq!(records.len(), 2, "Expected 2 records");
+
+        let found_row = records[0].row();
+        assert_eq!(found_row.get_byte(0), col_tinyint, "col_tinyint mismatch");
+        assert_eq!(
+            found_row.get_short(1),
+            col_smallint,
+            "col_smallint mismatch"
+        );
+        assert_eq!(found_row.get_int(2), col_int, "col_int mismatch");
+        assert_eq!(found_row.get_long(3), col_bigint, "col_bigint mismatch");
+        assert!(
+            (found_row.get_float(4) - col_float).abs() < f32::EPSILON,
+            "col_float mismatch: expected {}, got {}",
+            col_float,
+            found_row.get_float(4)
+        );
+        assert!(
+            (found_row.get_double(5) - col_double).abs() < f64::EPSILON,
+            "col_double mismatch: expected {}, got {}",
+            col_double,
+            found_row.get_double(5)
+        );
+        assert_eq!(
+            found_row.get_boolean(6),
+            col_boolean,
+            "col_boolean mismatch"
+        );
+        assert_eq!(found_row.get_char(7, 10), col_char, "col_char mismatch");
+        assert_eq!(found_row.get_string(8), col_string, "col_string mismatch");
+        assert_eq!(
+            found_row.get_decimal(9, 10, 2),
+            col_decimal,
+            "col_decimal mismatch"
+        );
+        assert_eq!(
+            found_row.get_date(10).get_inner(),
+            col_date.get_inner(),
+            "col_date mismatch"
+        );
+
+        assert_eq!(
+            found_row.get_time(11).get_inner(),
+            col_time_s.get_inner(),
+            "col_time_s mismatch"
+        );
+
+        assert_eq!(
+            found_row.get_time(12).get_inner(),
+            col_time_ms.get_inner(),
+            "col_time_ms mismatch"
+        );
+
+        assert_eq!(
+            found_row.get_time(13).get_inner(),
+            col_time_us.get_inner(),
+            "col_time_us mismatch"
+        );
+
+        assert_eq!(
+            found_row.get_time(14).get_inner(),
+            col_time_ns.get_inner(),
+            "col_time_ns mismatch"
+        );
+
+        assert_eq!(
+            found_row.get_timestamp_ntz(15, 0).get_millisecond(),
+            col_timestamp_s.get_millisecond(),
+            "col_timestamp_s mismatch"
+        );
+
+        assert_eq!(
+            found_row.get_timestamp_ntz(16, 3).get_millisecond(),
+            col_timestamp_ms.get_millisecond(),
+            "col_timestamp_ms mismatch"
+        );
+
+        let read_ts_us = found_row.get_timestamp_ntz(17, 6);
+        assert_eq!(
+            read_ts_us.get_millisecond(),
+            col_timestamp_us.get_millisecond(),
+            "col_timestamp_us millis mismatch"
+        );
+        assert_eq!(
+            read_ts_us.get_nano_of_millisecond(),
+            col_timestamp_us.get_nano_of_millisecond(),
+            "col_timestamp_us nanos mismatch"
+        );
+
+        let read_ts_ns = found_row.get_timestamp_ntz(18, 9);
+        assert_eq!(
+            read_ts_ns.get_millisecond(),
+            col_timestamp_ns.get_millisecond(),
+            "col_timestamp_ns millis mismatch"
+        );
+        assert_eq!(
+            read_ts_ns.get_nano_of_millisecond(),
+            col_timestamp_ns.get_nano_of_millisecond(),
+            "col_timestamp_ns nanos mismatch"
+        );
+
+        assert_eq!(
+            found_row.get_timestamp_ltz(19, 0).get_epoch_millisecond(),
+            col_timestamp_ltz_s.get_epoch_millisecond(),
+            "col_timestamp_ltz_s mismatch"
+        );
+
+        assert_eq!(
+            found_row.get_timestamp_ltz(20, 3).get_epoch_millisecond(),
+            col_timestamp_ltz_ms.get_epoch_millisecond(),
+            "col_timestamp_ltz_ms mismatch"
+        );
+
+        let read_ts_ltz_us = found_row.get_timestamp_ltz(21, 6);
+        assert_eq!(
+            read_ts_ltz_us.get_epoch_millisecond(),
+            col_timestamp_ltz_us.get_epoch_millisecond(),
+            "col_timestamp_ltz_us millis mismatch"
+        );
+        assert_eq!(
+            read_ts_ltz_us.get_nano_of_millisecond(),
+            col_timestamp_ltz_us.get_nano_of_millisecond(),
+            "col_timestamp_ltz_us nanos mismatch"
+        );
+
+        let read_ts_ltz_ns = found_row.get_timestamp_ltz(22, 9);
+        assert_eq!(
+            read_ts_ltz_ns.get_epoch_millisecond(),
+            col_timestamp_ltz_ns.get_epoch_millisecond(),
+            "col_timestamp_ltz_ns millis mismatch"
+        );
+        assert_eq!(
+            read_ts_ltz_ns.get_nano_of_millisecond(),
+            col_timestamp_ltz_ns.get_nano_of_millisecond(),
+            "col_timestamp_ltz_ns nanos mismatch"
+        );
+        assert_eq!(found_row.get_bytes(23), col_bytes, "col_bytes mismatch");
+
+        // Verify timestamps before Unix epoch (negative timestamps)
+        let read_ts_us_neg = found_row.get_timestamp_ntz(24, 6);
+        assert_eq!(
+            read_ts_us_neg.get_millisecond(),
+            col_timestamp_us_neg.get_millisecond(),
+            "col_timestamp_us_neg millis mismatch"
+        );
+        assert_eq!(
+            read_ts_us_neg.get_nano_of_millisecond(),
+            col_timestamp_us_neg.get_nano_of_millisecond(),
+            "col_timestamp_us_neg nanos mismatch"
+        );
+
+        let read_ts_ns_neg = found_row.get_timestamp_ntz(25, 9);
+        assert_eq!(
+            read_ts_ns_neg.get_millisecond(),
+            col_timestamp_ns_neg.get_millisecond(),
+            "col_timestamp_ns_neg millis mismatch"
+        );
+        assert_eq!(
+            read_ts_ns_neg.get_nano_of_millisecond(),
+            col_timestamp_ns_neg.get_nano_of_millisecond(),
+            "col_timestamp_ns_neg nanos mismatch"
+        );
+
+        let read_ts_ltz_us_neg = found_row.get_timestamp_ltz(26, 6);
+        assert_eq!(
+            read_ts_ltz_us_neg.get_epoch_millisecond(),
+            col_timestamp_ltz_us_neg.get_epoch_millisecond(),
+            "col_timestamp_ltz_us_neg millis mismatch"
+        );
+        assert_eq!(
+            read_ts_ltz_us_neg.get_nano_of_millisecond(),
+            col_timestamp_ltz_us_neg.get_nano_of_millisecond(),
+            "col_timestamp_ltz_us_neg nanos mismatch"
+        );
+
+        let read_ts_ltz_ns_neg = found_row.get_timestamp_ltz(27, 9);
+        assert_eq!(
+            read_ts_ltz_ns_neg.get_epoch_millisecond(),
+            col_timestamp_ltz_ns_neg.get_epoch_millisecond(),
+            "col_timestamp_ltz_ns_neg millis mismatch"
+        );
+        assert_eq!(
+            read_ts_ltz_ns_neg.get_nano_of_millisecond(),
+            col_timestamp_ltz_ns_neg.get_nano_of_millisecond(),
+            "col_timestamp_ltz_ns_neg nanos mismatch"
+        );
+
+        // Verify row with all nulls (record index 1)
+        let found_row_nulls = records[1].row();
+        for i in 0..field_count {
+            assert!(found_row_nulls.is_null_at(i), "column {} should be null", i);
+        }
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
 }

From bf72035a391e6caa823a156b4bbfe3f1c2ba8071 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Mon, 26 Jan 2026 19:29:12 +0800
Subject: [PATCH 090/287] chore: introduce SecurityTokenManager to update token
 in the background (#213)

---
 .../crates/fluss/src/client/credentials.rs    | 392 +++++++++++++-----
 .../fluss/src/client/table/remote_log.rs      |  64 ++-
 .../crates/fluss/src/client/table/scanner.rs  |  45 +-
 3 files changed, 366 insertions(+), 135 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/credentials.rs b/fluss-rust/crates/fluss/src/client/credentials.rs
index c520b4416d..93a536695a 100644
--- a/fluss-rust/crates/fluss/src/client/credentials.rs
+++ b/fluss-rust/crates/fluss/src/client/credentials.rs
@@ -19,13 +19,30 @@ use crate::client::metadata::Metadata;
 use crate::error::{Error, Result};
 use crate::rpc::RpcClient;
 use crate::rpc::message::GetSecurityTokenRequest;
+use log::{debug, info, warn};
 use parking_lot::RwLock;
 use serde::Deserialize;
 use std::collections::HashMap;
 use std::sync::Arc;
-use std::time::{Duration, Instant};
+use std::time::{Duration, SystemTime, UNIX_EPOCH};
+use tokio::sync::{oneshot, watch};
+use tokio::task::JoinHandle;
 
-const CACHE_TTL: Duration = Duration::from_secs(3600);
+/// Default renewal time ratio - refresh at 80% of token lifetime
+const DEFAULT_TOKEN_RENEWAL_RATIO: f64 = 0.8;
+/// Default retry backoff when token fetch fails
+const DEFAULT_RENEWAL_RETRY_BACKOFF: Duration = Duration::from_secs(30);
+/// Minimum delay between refreshes
+const MIN_RENEWAL_DELAY: Duration = Duration::from_secs(1);
+/// Maximum delay between refreshes (7 days) - prevents overflow and ensures periodic refresh
+const MAX_RENEWAL_DELAY: Duration = Duration::from_secs(7 * 24 * 60 * 60);
+/// Default refresh interval for tokens that carry no expiration time (treated as never expiring)
+const DEFAULT_NON_EXPIRING_REFRESH_INTERVAL: Duration = Duration::from_secs(7 * 24 * 60 * 60); // 7 days
+
+/// Type alias for credentials properties receiver
+/// - `None` = not yet fetched, should wait
+/// - `Some(HashMap)` = fetched (may be empty if no auth needed)
+pub type CredentialsReceiver = watch::Receiver<Option<HashMap<String, String>>>;
 
 #[derive(Debug, Deserialize)]
 struct Credentials {
@@ -34,48 +51,6 @@ struct Credentials {
     security_token: Option<String>,
 }
 
-struct CachedToken {
-    access_key_id: String,
-    secret_access_key: String,
-    security_token: Option<String>,
-    addition_infos: HashMap<String, String>,
-    cached_at: Instant,
-}
-
-impl CachedToken {
-    fn to_remote_fs_props(&self) -> HashMap<String, String> {
-        let mut props = HashMap::new();
-
-        props.insert("access_key_id".to_string(), self.access_key_id.clone());
-        props.insert(
-            "secret_access_key".to_string(),
-            self.secret_access_key.clone(),
-        );
-
-        if let Some(token) = &self.security_token {
-            props.insert("security_token".to_string(), token.clone());
-        }
-
-        for (key, value) in &self.addition_infos {
-            if let Some((opendal_key, transform)) = convert_hadoop_key_to_opendal(key) {
-                let final_value = if transform {
-                    // Invert boolean value (path_style_access -> enable_virtual_host_style)
-                    if value == "true" {
-                        "false".to_string()
-                    } else {
-                        "true".to_string()
-                    }
-                } else {
-                    value.clone()
-                };
-                props.insert(opendal_key, final_value);
-            }
-        }
-
-        props
-    }
-}
-
 /// Returns (opendal_key, needs_inversion)
 /// needs_inversion is true for path_style_access -> enable_virtual_host_style conversion
 fn convert_hadoop_key_to_opendal(hadoop_key: &str) -> Option<(String, bool)> {
@@ -88,53 +63,230 @@ fn convert_hadoop_key_to_opendal(hadoop_key: &str) -> Option<(String, bool)> {
     }
 }
 
-pub struct CredentialsCache {
-    inner: RwLock<Option<CachedToken>>,
+/// Build remote filesystem props from credentials and additional info
+fn build_remote_fs_props(
+    credentials: &Credentials,
+    addition_infos: &HashMap<String, String>,
+) -> HashMap<String, String> {
+    let mut props = HashMap::new();
+
+    props.insert(
+        "access_key_id".to_string(),
+        credentials.access_key_id.clone(),
+    );
+    props.insert(
+        "secret_access_key".to_string(),
+        credentials.access_key_secret.clone(),
+    );
+
+    if let Some(token) = &credentials.security_token {
+        props.insert("security_token".to_string(), token.clone());
+    }
+
+    for (key, value) in addition_infos {
+        if let Some((opendal_key, transform)) = convert_hadoop_key_to_opendal(key) {
+            let final_value = if transform {
+                // Invert boolean value (path_style_access -> enable_virtual_host_style)
+                if value == "true" {
+                    "false".to_string()
+                } else {
+                    "true".to_string()
+                }
+            } else {
+                value.clone()
+            };
+            props.insert(opendal_key, final_value);
+        }
+    }
+
+    props
+}
+
+/// Manager for security tokens that refreshes tokens in a background task.
+///
+/// This follows the pattern from Java's `DefaultSecurityTokenManager`, where
+/// a background thread periodically refreshes tokens based on their expiration time.
+///
+/// Uses `tokio::sync::watch` channel to broadcast token updates to consumers.
+/// Consumers can subscribe by calling `subscribe()` to get a receiver.
+///
+/// The channel value is `Option<HashMap>`:
+/// - `None` = not yet fetched, consumers should wait
+/// - `Some(HashMap)` = fetched (may be empty if no auth needed)
+///
+/// # Example
+/// ```ignore
+/// let manager = SecurityTokenManager::new(rpc_client, metadata);
+/// let credentials_rx = manager.subscribe();
+/// manager.start();
+///
+/// // Consumer can get latest credentials via:
+/// let props = credentials_rx.borrow().clone();
+/// ```
+pub struct SecurityTokenManager {
     rpc_client: Arc<RpcClient>,
     metadata: Arc<Metadata>,
+    token_renewal_ratio: f64,
+    renewal_retry_backoff: Duration,
+    /// Watch channel sender for broadcasting token updates
+    credentials_tx: watch::Sender<Option<HashMap<String, String>>>,
+    /// Watch channel receiver (kept to allow cloning for new subscribers)
+    credentials_rx: watch::Receiver<Option<HashMap<String, String>>>,
+    /// Handle to the background refresh task
+    task_handle: RwLock<Option<JoinHandle<()>>>,
+    /// Sender to signal shutdown
+    shutdown_tx: RwLock<Option<oneshot::Sender<()>>>,
 }
 
-impl CredentialsCache {
+impl SecurityTokenManager {
     pub fn new(rpc_client: Arc<RpcClient>, metadata: Arc<Metadata>) -> Self {
+        let (credentials_tx, credentials_rx) = watch::channel(None);
         Self {
-            inner: RwLock::new(None),
             rpc_client,
             metadata,
+            token_renewal_ratio: DEFAULT_TOKEN_RENEWAL_RATIO,
+            renewal_retry_backoff: DEFAULT_RENEWAL_RETRY_BACKOFF,
+            credentials_tx,
+            credentials_rx,
+            task_handle: RwLock::new(None),
+            shutdown_tx: RwLock::new(None),
+        }
+    }
+
+    /// Subscribe to credential updates.
+    /// Returns a receiver that always contains the latest credentials.
+    /// Consumers can call `receiver.borrow()` to get the current value.
+    pub fn subscribe(&self) -> CredentialsReceiver {
+        self.credentials_rx.clone()
+    }
+
+    /// Start the background token refresh task.
+    /// This should be called once after creating the manager.
+    pub fn start(&self) {
+        if self.task_handle.read().is_some() {
+            warn!("SecurityTokenManager is already started");
+            return;
+        }
+
+        let (shutdown_tx, shutdown_rx) = oneshot::channel();
+        *self.shutdown_tx.write() = Some(shutdown_tx);
+
+        let rpc_client = Arc::clone(&self.rpc_client);
+        let metadata = Arc::clone(&self.metadata);
+        let token_renewal_ratio = self.token_renewal_ratio;
+        let renewal_retry_backoff = self.renewal_retry_backoff;
+        let credentials_tx = self.credentials_tx.clone();
+
+        let handle = tokio::spawn(async move {
+            Self::token_refresh_loop(
+                rpc_client,
+                metadata,
+                token_renewal_ratio,
+                renewal_retry_backoff,
+                credentials_tx,
+                shutdown_rx,
+            )
+            .await;
+        });
+
+        *self.task_handle.write() = Some(handle);
+        info!("SecurityTokenManager started");
+    }
+
+    /// Stop the background token refresh task.
+    pub fn stop(&self) {
+        if let Some(tx) = self.shutdown_tx.write().take() {
+            let _ = tx.send(());
         }
+        // Take and drop the task handle so the task can finish gracefully
+        let _ = self.task_handle.write().take();
+        info!("SecurityTokenManager stopped");
     }
 
-    pub async fn get_or_refresh(&self) -> Result<HashMap<String, String>> {
-        {
-            let guard = self.inner.read();
-            if let Some(cached) = guard.as_ref() {
-                if cached.cached_at.elapsed() < CACHE_TTL {
-                    return Ok(cached.to_remote_fs_props());
+    /// Background task that periodically refreshes tokens.
+    async fn token_refresh_loop(
+        rpc_client: Arc<RpcClient>,
+        metadata: Arc<Metadata>,
+        token_renewal_ratio: f64,
+        renewal_retry_backoff: Duration,
+        credentials_tx: watch::Sender<Option<HashMap<String, String>>>,
+        mut shutdown_rx: oneshot::Receiver<()>,
+    ) {
+        info!("Starting token refresh loop");
+
+        loop {
+            // Fetch token and send to channel
+            let result = Self::fetch_token(&rpc_client, &metadata).await;
+
+            let next_delay = match result {
+                Ok((props, expiration_time)) => {
+                    // Send credentials via watch channel (Some indicates fetched)
+                    if let Err(e) = credentials_tx.send(Some(props)) {
+                        debug!("No active subscribers for credentials update: {e:?}");
+                    }
+
+                    // Calculate next renewal delay based on expiration time
+                    if let Some(exp_time) = expiration_time {
+                        Self::calculate_renewal_delay(exp_time, token_renewal_ratio)
+                    } else {
+                        // No expiration time - token never expires, use long refresh interval
+                        info!(
+                            "Token has no expiration time (never expires), next refresh in {DEFAULT_NON_EXPIRING_REFRESH_INTERVAL:?}"
+                        );
+                        DEFAULT_NON_EXPIRING_REFRESH_INTERVAL
+                    }
+                }
+                Err(e) => {
+                    warn!(
+                        "Failed to obtain security token: {e:?}, will retry in {renewal_retry_backoff:?}"
+                    );
+                    renewal_retry_backoff
+                }
+            };
+
+            debug!("Next token refresh in {next_delay:?}");
+
+            // Wait for either the delay to elapse or shutdown signal
+            tokio::select! {
+                _ = tokio::time::sleep(next_delay) => {
+                    // Continue to next iteration to refresh
+                }
+                _ = &mut shutdown_rx => {
+                     info!("Token refresh loop received shutdown signal");
+                    break;
                 }
             }
         }
-
-        self.refresh_from_server().await
     }
 
-    async fn refresh_from_server(&self) -> Result<HashMap<String, String>> {
-        let cluster = self.metadata.get_cluster();
-        let server_node = cluster
-            .get_one_available_server()
-            .expect("no tablet server available");
-        let conn = self.rpc_client.get_connection(server_node).await?;
+    /// Fetch token from server.
+    /// Returns the props and expiration time if available.
+    async fn fetch_token(
+        rpc_client: &Arc<RpcClient>,
+        metadata: &Arc<Metadata>,
+    ) -> Result<(HashMap<String, String>, Option<i64>)> {
+        let cluster = metadata.get_cluster();
+        let server_node =
+            cluster
+                .get_one_available_server()
+                .ok_or_else(|| Error::UnexpectedError {
+                    message: "No tablet server available for token refresh".to_string(),
+                    source: None,
+                })?;
 
+        let conn = rpc_client.get_connection(server_node).await?;
         let request = GetSecurityTokenRequest::new();
         let response = conn.request(request).await?;
 
-        // the token may be empty if the remote filesystem
-        // doesn't require token to access
+        // The token may be empty if remote filesystem doesn't require authentication
         if response.token.is_empty() {
-            return Ok(HashMap::new());
+            info!("Empty token received, remote filesystem may not require authentication");
+            return Ok((HashMap::new(), response.expiration_time));
         }
 
         let credentials: Credentials =
             serde_json::from_slice(&response.token).map_err(|e| Error::JsonSerdeError {
-                message: format!("Error when parse token from server: {e}"),
+                message: format!("Error when parsing token from server: {e}"),
             })?;
 
         let mut addition_infos = HashMap::new();
@@ -142,26 +294,51 @@ impl CredentialsCache {
             addition_infos.insert(kv.key.clone(), kv.value.clone());
         }
 
-        let cached = CachedToken {
-            access_key_id: credentials.access_key_id,
-            secret_access_key: credentials.access_key_secret,
-            security_token: credentials.security_token,
-            addition_infos,
-            cached_at: Instant::now(),
-        };
+        let props = build_remote_fs_props(&credentials, &addition_infos);
+        debug!("Security token fetched successfully");
+
+        Ok((props, response.expiration_time))
+    }
+
+    /// Calculate the delay before next token renewal.
+    /// Uses the renewal ratio to refresh before actual expiration.
+    /// Caps the delay to MAX_RENEWAL_DELAY to prevent overflow and ensure periodic refresh.
+    fn calculate_renewal_delay(expiration_time: i64, renewal_ratio: f64) -> Duration {
+        let now = SystemTime::now()
+            .duration_since(UNIX_EPOCH)
+            .unwrap()
+            .as_millis() as i64;
+
+        let time_until_expiry = expiration_time - now;
+        if time_until_expiry <= 0 {
+            // Token already expired: refresh again after the minimum delay
+            return MIN_RENEWAL_DELAY;
+        }
 
-        let props = cached.to_remote_fs_props();
-        *self.inner.write() = Some(cached);
+        // Cap time_until_expiry to prevent overflow when casting to f64 and back
+        let max_delay_ms = MAX_RENEWAL_DELAY.as_millis() as i64;
+        let capped_time = time_until_expiry.min(max_delay_ms);
 
-        Ok(props)
+        let delay_ms = (capped_time as f64 * renewal_ratio) as u64;
+        let delay = Duration::from_millis(delay_ms);
+
+        debug!(
+            "Calculated renewal delay: {delay:?} (expiration: {expiration_time}, now: {now}, ratio: {renewal_ratio})"
+        );
+
+        delay.clamp(MIN_RENEWAL_DELAY, MAX_RENEWAL_DELAY)
+    }
+}
+
+impl Drop for SecurityTokenManager {
+    fn drop(&mut self) {
+        self.stop();
     }
 }
 
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::client::metadata::Metadata;
-    use crate::cluster::Cluster;
 
     #[test]
     fn convert_hadoop_key_to_opendal_maps_known_keys() {
@@ -177,26 +354,52 @@ mod tests {
         assert!(convert_hadoop_key_to_opendal("unknown.key").is_none());
     }
 
-    #[tokio::test]
-    async fn credentials_cache_returns_cached_props() -> Result<()> {
-        let cached = CachedToken {
+    #[test]
+    fn calculate_renewal_delay_returns_correct_delay() {
+        let now = SystemTime::now()
+            .duration_since(UNIX_EPOCH)
+            .unwrap()
+            .as_millis() as i64;
+
+        // Token expires in 1 hour
+        let expiration = now + 3600 * 1000;
+        let delay = SecurityTokenManager::calculate_renewal_delay(expiration, 0.8);
+
+        // Should be approximately 48 minutes (80% of 1 hour)
+        let expected_min = Duration::from_secs(2800); // ~46.7 minutes
+        let expected_max = Duration::from_secs(2900); // ~48.3 minutes
+        assert!(
+            delay >= expected_min && delay <= expected_max,
+            "Expected delay between {expected_min:?} and {expected_max:?}, got {delay:?}"
+        );
+    }
+
+    #[test]
+    fn calculate_renewal_delay_handles_expired_token() {
+        let now = SystemTime::now()
+            .duration_since(UNIX_EPOCH)
+            .unwrap()
+            .as_millis() as i64;
+
+        // Token already expired
+        let expiration = now - 1000;
+        let delay = SecurityTokenManager::calculate_renewal_delay(expiration, 0.8);
+
+        // Should return minimum delay
+        assert_eq!(delay, MIN_RENEWAL_DELAY);
+    }
+
+    #[test]
+    fn build_remote_fs_props_includes_all_fields() {
+        let credentials = Credentials {
             access_key_id: "ak".to_string(),
-            secret_access_key: "sk".to_string(),
+            access_key_secret: "sk".to_string(),
             security_token: Some("token".to_string()),
-            addition_infos: HashMap::from([(
-                "fs.s3a.path.style.access".to_string(),
-                "true".to_string(),
-            )]),
-            cached_at: Instant::now(),
-        };
-
-        let cache = CredentialsCache {
-            inner: RwLock::new(Some(cached)),
-            rpc_client: Arc::new(RpcClient::new()),
-            metadata: Arc::new(Metadata::new_for_test(Arc::new(Cluster::default()))),
         };
+        let addition_infos =
+            HashMap::from([("fs.s3a.path.style.access".to_string(), "true".to_string())]);
 
-        let props = cache.get_or_refresh().await?;
+        let props = build_remote_fs_props(&credentials, &addition_infos);
         assert_eq!(props.get("access_key_id"), Some(&"ak".to_string()));
         assert_eq!(props.get("secret_access_key"), Some(&"sk".to_string()));
         assert_eq!(props.get("security_token"), Some(&"token".to_string()));
@@ -204,6 +407,5 @@ mod tests {
             props.get("enable_virtual_host_style"),
             Some(&"false".to_string())
         );
-        Ok(())
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index a2e19d4901..df747710f6 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -14,11 +14,12 @@
 // See the License for the specific language governing permissions and
 // limitations under the License.
 
+use crate::client::credentials::CredentialsReceiver;
 use crate::error::{Error, Result};
 use crate::io::{FileIO, Storage};
 use crate::metadata::TableBucket;
 use crate::proto::{PbRemoteLogFetchInfo, PbRemoteLogSegment};
-use parking_lot::{Mutex, RwLock};
+use parking_lot::Mutex;
 use std::{
     cmp::{Ordering, Reverse, min},
     collections::{BinaryHeap, HashMap},
@@ -290,7 +291,7 @@ enum DownloadResult {
 
 /// Production implementation of RemoteLogFetcher that downloads from actual storage
 struct ProductionFetcher {
-    remote_fs_props: Arc<RwLock<HashMap<String, String>>>,
+    credentials_rx: CredentialsReceiver,
     local_log_dir: Arc<TempDir>,
 }
 
@@ -299,7 +300,7 @@ impl RemoteLogFetcher for ProductionFetcher {
         &self,
         request: &RemoteLogDownloadRequest,
     ) -> Pin<Box<dyn Future<Output = Result<FetchResult>> + Send>> {
-        let remote_fs_props = self.remote_fs_props.clone();
+        let mut credentials_rx = self.credentials_rx.clone();
         let local_log_dir = self.local_log_dir.clone();
 
         // Clone data needed for async operation to avoid lifetime issues
@@ -317,14 +318,49 @@ impl RemoteLogFetcher for ProductionFetcher {
                 remote_log_tablet_dir, segment.segment_id, offset_prefix
             );
 
-            let remote_fs_props_map = remote_fs_props.read().clone();
+            // Get credentials from watch channel, waiting if not yet fetched
+            // - None = not yet fetched, wait
+            // - Some(props) = fetched (may be empty if no auth needed)
+            let remote_fs_props = {
+                let maybe_props = credentials_rx.borrow().clone();
+                match maybe_props {
+                    Some(props) => props,
+                    None => {
+                        // Credentials not yet fetched, wait for first update
+                        log::info!("Waiting for credentials to be available...");
+                        // If the sender side has been dropped (e.g. during shutdown),
+                        // this will return an error. Surface that as a proper error
+                        // instead of silently falling back to empty credentials.
+                        if let Err(e) = credentials_rx.changed().await {
+                            let io_err = io::Error::new(
+                                io::ErrorKind::BrokenPipe,
+                                format!(
+                                    "credentials manager shut down before credentials were obtained: {e}"
+                                ),
+                            );
+                            return Err(io_err.into());
+                        }
+                        // After a successful change notification, credentials should be set.
+                        // If they are still missing, treat this as an error instead of
+                        // defaulting to an empty map (which could break auth flows).
+                        credentials_rx
+                            .borrow()
+                            .clone()
+                            .ok_or_else(|| Error::UnexpectedError {
+                                message: "credentials not available after watch notification"
+                                    .to_string(),
+                                source: None,
+                            })?
+                    }
+                }
+            };
 
             // Download file to disk (streaming, no memory spike)
             let file_path = RemoteLogDownloader::download_file(
                 &remote_log_tablet_dir,
                 &remote_path,
                 &local_file_path,
-                &remote_fs_props_map,
+                &remote_fs_props,
             )
             .await?;
 
@@ -725,7 +761,6 @@ impl RemoteLogDownloadFuture {
 /// won't wait for completion. Pending futures will fail.
 pub struct RemoteLogDownloader {
     request_sender: Option<mpsc::UnboundedSender<RemoteLogDownloadRequest>>,
-    remote_fs_props: Option<Arc<RwLock<HashMap<String, String>>>>,
 }
 
 impl RemoteLogDownloader {
@@ -733,21 +768,17 @@ impl RemoteLogDownloader {
         local_log_dir: TempDir,
         max_prefetch_segments: usize,
         max_concurrent_downloads: usize,
+        credentials_rx: CredentialsReceiver,
     ) -> Result<Self> {
-        let remote_fs_props = Arc::new(RwLock::new(HashMap::new()));
         let fetcher = Arc::new(ProductionFetcher {
-            remote_fs_props: remote_fs_props.clone(),
+            credentials_rx,
             local_log_dir: Arc::new(local_log_dir),
         });
 
-        let mut downloader =
-            Self::new_with_fetcher(fetcher, max_prefetch_segments, max_concurrent_downloads)?;
-        downloader.remote_fs_props = Some(remote_fs_props);
-        Ok(downloader)
+        Self::new_with_fetcher(fetcher, max_prefetch_segments, max_concurrent_downloads)
     }
 
     /// Create a RemoteLogDownloader with a custom fetcher (for testing).
-    /// The remote_fs_props will be None since custom fetchers typically don't need S3 credentials.
     pub fn new_with_fetcher(
         fetcher: Arc<dyn RemoteLogFetcher>,
         max_prefetch_segments: usize,
@@ -770,16 +801,9 @@ impl RemoteLogDownloader {
 
         Ok(Self {
             request_sender: Some(request_sender),
-            remote_fs_props: None,
         })
     }
 
-    pub fn set_remote_fs_props(&self, props: HashMap<String, String>) {
-        if let Some(ref remote_fs_props) = self.remote_fs_props {
-            *remote_fs_props.write() = props;
-        }
-    }
-
     /// Request to fetch a remote log segment to local. This method is non-blocking.
     pub fn request_remote_log(
         &self,
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index dbebe1aca4..356ba1cdb4 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -28,7 +28,7 @@ use tempfile::TempDir;
 
 use crate::TableId;
 use crate::client::connection::FlussConnection;
-use crate::client::credentials::CredentialsCache;
+use crate::client::credentials::SecurityTokenManager;
 use crate::client::metadata::Metadata;
 use crate::client::table::log_fetch_buffer::{
     CompletedFetch, DefaultCompletedFetch, FetchErrorAction, FetchErrorContext, FetchErrorLogLevel,
@@ -462,9 +462,10 @@ struct LogFetcher {
     read_context: ReadContext,
     remote_read_context: ReadContext,
     remote_log_downloader: Arc<RemoteLogDownloader>,
-    // todo: consider schedule a background thread to update
-    // token instead of update in fetch phase
-    credentials_cache: Arc<CredentialsCache>,
+    /// Background security token manager for remote filesystem access.
+    /// Kept alive to run the background refresh task; stopped on drop.
+    #[allow(dead_code)]
+    security_token_manager: Arc<SecurityTokenManager>,
     log_fetch_buffer: Arc<LogFetchBuffer>,
     nodes_with_pending_fetch_requests: Arc<Mutex<HashSet<i32>>>,
 }
@@ -476,7 +477,6 @@ struct FetchResponseContext {
     read_context: ReadContext,
     remote_read_context: ReadContext,
     remote_log_downloader: Arc<RemoteLogDownloader>,
-    credentials_cache: Arc<CredentialsCache>,
 }
 
 impl LogFetcher {
@@ -497,6 +497,23 @@ impl LogFetcher {
         let tmp_dir = TempDir::with_prefix("fluss-remote-logs")?;
         let log_fetch_buffer = Arc::new(LogFetchBuffer::new(read_context.clone()));
 
+        // Create security token manager for background token refresh
+        let security_token_manager =
+            Arc::new(SecurityTokenManager::new(conns.clone(), metadata.clone()));
+
+        // Subscribe to credentials updates and pass to remote log downloader
+        let credentials_rx = security_token_manager.subscribe();
+
+        let remote_log_downloader = Arc::new(RemoteLogDownloader::new(
+            tmp_dir,
+            config.scanner_remote_log_prefetch_num,
+            config.scanner_remote_log_download_threads,
+            credentials_rx,
+        )?);
+
+        // Start the background token refresh task
+        security_token_manager.start();
+
         Ok(LogFetcher {
             conns: conns.clone(),
             metadata: metadata.clone(),
@@ -505,12 +522,8 @@ impl LogFetcher {
             log_scanner_status,
             read_context,
             remote_read_context,
-            remote_log_downloader: Arc::new(RemoteLogDownloader::new(
-                tmp_dir,
-                config.scanner_remote_log_prefetch_num,
-                config.scanner_remote_log_download_threads,
-            )?),
-            credentials_cache: Arc::new(CredentialsCache::new(conns.clone(), metadata.clone())),
+            remote_log_downloader,
+            security_token_manager,
             log_fetch_buffer,
             nodes_with_pending_fetch_requests: Arc::new(Mutex::new(HashSet::new())),
         })
@@ -670,7 +683,6 @@ impl LogFetcher {
             let read_context = self.read_context.clone();
             let remote_read_context = self.remote_read_context.clone();
             let remote_log_downloader = Arc::clone(&self.remote_log_downloader);
-            let creds_cache = self.credentials_cache.clone();
             let nodes_with_pending = self.nodes_with_pending_fetch_requests.clone();
             let metadata = self.metadata.clone();
             let response_context = FetchResponseContext {
@@ -680,7 +692,6 @@ impl LogFetcher {
                 read_context,
                 remote_read_context,
                 remote_log_downloader,
-                credentials_cache: creds_cache,
             };
             // Spawn async task to handle the fetch request
             // Note: These tasks are not explicitly tracked or cancelled when LogFetcher is dropped.
@@ -755,7 +766,6 @@ impl LogFetcher {
             read_context,
             remote_read_context,
             remote_log_downloader,
-            credentials_cache,
         } = context;
 
         for pb_fetch_log_resp in fetch_response.tables_resp {
@@ -825,10 +835,7 @@ impl LogFetcher {
                 // Check if this is a remote log fetch
                 if let Some(ref remote_log_fetch_info) = fetch_log_for_bucket.remote_log_fetch_info
                 {
-                    // set remote fs props
-                    let remote_fs_props = credentials_cache.get_or_refresh().await.unwrap();
-                    remote_log_downloader.set_remote_fs_props(remote_fs_props);
-
+                    // Remote fs props are supplied to the downloader by the background SecurityTokenManager
                     let remote_fetch_info =
                         RemoteLogFetchInfo::from_proto(remote_log_fetch_info, table_bucket.clone());
 
@@ -1649,7 +1656,6 @@ mod tests {
             read_context: fetcher.read_context.clone(),
             remote_read_context: fetcher.remote_read_context.clone(),
             remote_log_downloader: fetcher.remote_log_downloader.clone(),
-            credentials_cache: fetcher.credentials_cache.clone(),
         };
 
         LogFetcher::handle_fetch_response(response, response_context).await;
@@ -1703,7 +1709,6 @@ mod tests {
             read_context: fetcher.read_context.clone(),
             remote_read_context: fetcher.remote_read_context.clone(),
             remote_log_downloader: fetcher.remote_log_downloader.clone(),
-            credentials_cache: fetcher.credentials_cache.clone(),
         };
 
         LogFetcher::handle_fetch_response(response, response_context).await;

From c80d0aa2569942b3360bf4936384166e9ed47d30 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Tue, 27 Jan 2026 02:37:13 +0100
Subject: [PATCH 091/287] chore: Add blocking poll into python bindings (#154)

---
 fluss-rust/bindings/python/example/example.py |  22 +++
 fluss-rust/bindings/python/src/table.rs       | 175 ++++++++++++------
 2 files changed, 145 insertions(+), 52 deletions(-)

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 730416bb6f..5d0302efea 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -224,6 +224,28 @@ async def main():
 
         # TODO: support to_duckdb()
 
+        # Test the new poll() method for incremental reading
+        print("\n--- Testing poll() method ---")
+        # Reset subscription to start from the beginning
+        log_scanner.subscribe(None, None)
+
+        # Poll with a timeout of 5000ms (5 seconds)
+        # Note: poll() returns an empty table (not an error) on timeout
+        try:
+            poll_result = log_scanner.poll(5000)
+            print(f"Number of rows: {poll_result.num_rows}")
+
+            if poll_result.num_rows > 0:
+                poll_df = poll_result.to_pandas()
+                print(f"Polled data:\n{poll_df}")
+            else:
+                print("Empty result (no records available)")
+                # Empty table still has schema
+                print(f"Schema: {poll_result.schema}")
+
+        except Exception as e:
+            print(f"Error during poll: {e}")
+
     except Exception as e:
         print(f"Error during scanning: {e}")
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 0ae7186403..404335058b 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -20,10 +20,13 @@ use crate::*;
 use arrow::array::RecordBatch;
 use arrow_pyarrow::{FromPyArrow, ToPyArrow};
 use fluss::client::EARLIEST_OFFSET;
+use fluss::record::to_arrow_schema;
 use fluss::rpc::message::OffsetSpec;
 use pyo3::types::IntoPyDict;
 use pyo3_async_runtimes::tokio::future_into_py;
+use std::collections::HashMap;
 use std::sync::Arc;
+use std::time::Duration;
 
 // Time conversion constants
 const MILLIS_PER_SECOND: i64 = 1_000;
@@ -186,7 +189,7 @@ impl FlussTable {
             }
 
             let rust_scanner = table_scan
-                .create_log_scanner()
+                .create_record_batch_log_scanner()
                 .map_err(|e| FlussError::new_err(format!("Failed to create log scanner: {e}")))?;
 
             let admin = conn
@@ -886,7 +889,7 @@ fn get_type_name(value: &Bound<PyAny>) -> String {
 /// Scanner for reading log data from a Fluss table
 #[pyclass]
 pub struct LogScanner {
-    inner: fcore::client::LogScanner,
+    inner: fcore::client::RecordBatchLogScanner,
     admin: fcore::client::FlussAdmin,
     table_info: fcore::metadata::TableInfo,
     #[allow(dead_code)]
@@ -931,63 +934,78 @@ impl LogScanner {
 
     /// Convert all data to Arrow Table
     fn to_arrow(&self, py: Python) -> PyResult<Py<PyAny>> {
-        use std::collections::HashMap;
-        use std::time::Duration;
-
         let mut all_batches = Vec::new();
 
         let num_buckets = self.table_info.get_num_buckets();
         let bucket_ids: Vec<i32> = (0..num_buckets).collect();
 
         // todo: after supporting list_offsets with timestamp, we can use start_timestamp and end_timestamp here
-        let mut stopping_offsets: HashMap<i32, i64> = TOKIO_RUNTIME
-            .block_on(async {
-                self.admin
-                    .list_offsets(
-                        &self.table_info.table_path,
-                        bucket_ids.as_slice(),
-                        OffsetSpec::Latest,
-                    )
-                    .await
+        let mut stopping_offsets: HashMap<i32, i64> = py
+            .detach(|| {
+                TOKIO_RUNTIME.block_on(async {
+                    self.admin
+                        .list_offsets(
+                            &self.table_info.table_path,
+                            bucket_ids.as_slice(),
+                            OffsetSpec::Latest,
+                        )
+                        .await
+                })
             })
             .map_err(|e| FlussError::new_err(e.to_string()))?;
 
-        if !stopping_offsets.is_empty() {
-            loop {
-                let batch_result = TOKIO_RUNTIME
-                    .block_on(async { self.inner.poll(Duration::from_millis(500)).await });
-
-                match batch_result {
-                    Ok(scan_records) => {
-                        let mut result_records: Vec<fcore::record::ScanRecord> = vec![];
-                        for (bucket, records) in scan_records.into_records_by_buckets() {
-                            let stopping_offset = stopping_offsets.get(&bucket.bucket_id());
-
-                            if stopping_offset.is_none() {
-                                // not to include this bucket, skip records for this bucket
-                                // since we already reach end offset for this bucket
-                                continue;
-                            }
-                            if let Some(last_record) = records.last() {
-                                let offset = last_record.offset();
-                                result_records.extend(records);
-                                if offset >= stopping_offset.unwrap() - 1 {
-                                    stopping_offsets.remove(&bucket.bucket_id());
-                                }
-                            }
-                        }
-
-                        if !result_records.is_empty() {
-                            let arrow_batch = Utils::convert_scan_records_to_arrow(result_records);
-                            all_batches.extend(arrow_batch);
-                        }
-
-                        // we have reach end offsets of all bucket
-                        if stopping_offsets.is_empty() {
-                            break;
-                        }
-                    }
-                    Err(e) => return Err(FlussError::new_err(e.to_string())),
+        // Filter out buckets with no records to read (stop_at <= 0)
+        stopping_offsets.retain(|_, &mut v| v > 0);
+
+        while !stopping_offsets.is_empty() {
+            let scan_batches = py
+                .detach(|| {
+                    TOKIO_RUNTIME
+                        .block_on(async { self.inner.poll(Duration::from_millis(500)).await })
+                })
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+            if scan_batches.is_empty() {
+                continue;
+            }
+
+            for scan_batch in scan_batches {
+                let bucket_id = scan_batch.bucket().bucket_id();
+
+                // Check if this bucket is still being tracked; if not, ignore the batch
+                let Some(&stop_at) = stopping_offsets.get(&bucket_id) else {
+                    continue;
+                };
+
+                let base_offset = scan_batch.base_offset();
+                let last_offset = scan_batch.last_offset();
+
+                // If the batch starts at or after the stop_at offset, the bucket is exhausted
+                if base_offset >= stop_at {
+                    stopping_offsets.remove(&bucket_id);
+                    continue;
+                }
+
+                let batch = if last_offset >= stop_at {
+                    // This batch contains the target offset; slice it to keep only records
+                    // where offset < stop_at.
+                    let num_to_keep = (stop_at - base_offset) as usize;
+                    let b = scan_batch.into_batch();
+
+                    // Safety check: ensure we don't attempt to slice more rows than the batch contains
+                    let limit = num_to_keep.min(b.num_rows());
+                    b.slice(0, limit)
+                } else {
+                    // The entire batch is within the desired range (all offsets < stop_at)
+                    scan_batch.into_batch()
+                };
+
+                all_batches.push(Arc::new(batch));
+
+                // If the batch's last offset reached or passed the inclusive limit (stop_at - 1),
+                // we are done with this bucket.
+                if last_offset >= stop_at - 1 {
+                    stopping_offsets.remove(&bucket_id);
                 }
             }
         }
@@ -1004,15 +1022,68 @@ impl LogScanner {
         Ok(df)
     }
 
+    /// Poll for new records with the specified timeout
+    ///
+    /// Args:
+    ///     timeout_ms: Timeout in milliseconds to wait for records
+    ///
+    /// Returns:
+    ///     PyArrow Table containing the polled records
+    ///
+    /// Note:
+    ///     - Returns an empty table (with correct schema) if no records are available
+    ///     - When timeout expires, returns an empty table (NOT an error)
+    fn poll(&self, py: Python, timeout_ms: i64) -> PyResult<Py<PyAny>> {
+        if timeout_ms < 0 {
+            return Err(FlussError::new_err(format!(
+                "timeout_ms must be non-negative, got: {timeout_ms}"
+            )));
+        }
+
+        let timeout = Duration::from_millis(timeout_ms as u64);
+        let scan_batches = py
+            .detach(|| TOKIO_RUNTIME.block_on(async { self.inner.poll(timeout).await }))
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+        // Convert ScanBatch to Arrow batches
+        if scan_batches.is_empty() {
+            return self.create_empty_table(py);
+        }
+
+        let arrow_batches: Vec<_> = scan_batches
+            .into_iter()
+            .map(|scan_batch| Arc::new(scan_batch.into_batch()))
+            .collect();
+
+        Utils::combine_batches_to_table(py, arrow_batches)
+    }
+
+    /// Create an empty PyArrow table with the correct schema
+    fn create_empty_table(&self, py: Python) -> PyResult<Py<PyAny>> {
+        let arrow_schema = to_arrow_schema(self.table_info.get_row_type())
+            .map_err(|e| FlussError::new_err(format!("Failed to get arrow schema: {e}")))?;
+        let py_schema = arrow_schema
+            .as_ref()
+            .to_pyarrow(py)
+            .map_err(|e| FlussError::new_err(format!("Failed to convert schema: {e}")))?;
+
+        let pyarrow = py.import("pyarrow")?;
+        let empty_table = pyarrow
+            .getattr("Table")?
+            .call_method1("from_batches", (vec![] as Vec<Py<PyAny>>, py_schema))?;
+
+        Ok(empty_table.into())
+    }
+
     fn __repr__(&self) -> String {
         format!("LogScanner(table={})", self.table_info.table_path)
     }
 }
 
 impl LogScanner {
-    /// Create LogScanner from core LogScanner
+    /// Create LogScanner from core RecordBatchLogScanner
     pub fn from_core(
-        inner_scanner: fcore::client::LogScanner,
+        inner_scanner: fcore::client::RecordBatchLogScanner,
         admin: fcore::client::FlussAdmin,
         table_info: fcore::metadata::TableInfo,
     ) -> Self {

From bc7efea50c6b4e829434026f7a5e63e6bc00aa98 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Tue, 27 Jan 2026 13:17:52 +0000
Subject: [PATCH 092/287] chore: Introduce PartitionGetter and Partition utils
 (#214)

---
 .../src/client/table/partition_getter.rs      | 177 +++++-
 fluss-rust/crates/fluss/src/error.rs          |   6 +
 .../crates/fluss/src/metadata/partition.rs    |  62 +-
 fluss-rust/crates/fluss/src/metadata/table.rs | 110 ++++
 fluss-rust/crates/fluss/src/row/datum.rs      |  10 +-
 fluss-rust/crates/fluss/src/util/mod.rs       |   1 +
 fluss-rust/crates/fluss/src/util/partition.rs | 532 ++++++++++++++++++
 7 files changed, 847 insertions(+), 51 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/util/partition.rs

diff --git a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
index 4529d8684f..887c0a4fd7 100644
--- a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
+++ b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
@@ -17,40 +17,191 @@
 
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::{DataType, RowType};
+use crate::metadata::{DataType, ResolvedPartitionSpec, RowType};
+use crate::row::InternalRow;
 use crate::row::field_getter::FieldGetter;
+use crate::util::partition;
+use std::sync::Arc;
 
+/// Extracts the partition name (or resolved partition spec) from a row.
 #[allow(dead_code)]
-pub struct PartitionGetter<'a> {
-    partitions: Vec<(&'a String, &'a DataType, FieldGetter)>,
+pub struct PartitionGetter {
+    partition_keys: Arc<[String]>,
+    partitions: Vec<(DataType, FieldGetter)>,
 }
 
 #[allow(dead_code)]
-impl<'a> PartitionGetter<'a> {
-    pub fn new(row_type: &'a RowType, partition_keys: &'a Vec<String>) -> Result<Self> {
+impl PartitionGetter {
+    pub fn new(row_type: &RowType, partition_keys: Arc<[String]>) -> Result<Self> {
         let mut partitions = Vec::with_capacity(partition_keys.len());
 
-        for partition_key in partition_keys {
+        for partition_key in partition_keys.iter() {
             if let Some(partition_col_index) = row_type.get_field_index(partition_key.as_str()) {
-                let data_type = &row_type
+                let data_type = row_type
                     .fields()
                     .get(partition_col_index)
                     .unwrap()
-                    .data_type;
-                let field_getter = FieldGetter::create(data_type, partition_col_index);
+                    .data_type
+                    .clone();
+                let field_getter = FieldGetter::create(&data_type, partition_col_index);
 
-                partitions.push((partition_key, data_type, field_getter));
+                partitions.push((data_type, field_getter));
             } else {
                 return Err(IllegalArgument {
                     message: format!(
-                        "The partition column {partition_key} is not in the row {row_type}."
+                        "The partition column {} is not in the row {}.",
+                        partition_key, row_type
                     ),
                 });
             };
         }
 
-        Ok(Self { partitions })
+        Ok(Self {
+            partition_keys,
+            partitions,
+        })
     }
 
-    // TODO Implement get partition
+    pub fn get_partition(&self, row: &dyn InternalRow) -> Result<String> {
+        self.get_partition_spec(row)
+            .map(|ps| ps.get_partition_name())
+    }
+
+    pub fn get_partition_spec(&self, row: &dyn InternalRow) -> Result<ResolvedPartitionSpec> {
+        let mut partition_values = Vec::with_capacity(self.partitions.len());
+
+        for (data_type, field_getter) in &self.partitions {
+            let value = field_getter.get_field(row);
+            if value.is_null() {
+                return Err(IllegalArgument {
+                    message: "Partition value shouldn't be null.".to_string(),
+                });
+            }
+            partition_values.push(partition::convert_value_of_type(&value, data_type)?);
+        }
+
+        ResolvedPartitionSpec::new(Arc::clone(&self.partition_keys), partition_values)
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{DataField, IntType, StringType};
+    use crate::row::{Datum, GenericRow};
+
+    #[test]
+    fn test_partition_getter_single_key() {
+        let row_type = RowType::new(vec![
+            DataField::new("id".to_string(), DataType::Int(IntType::new()), None),
+            DataField::new(
+                "region".to_string(),
+                DataType::String(StringType::new()),
+                None,
+            ),
+        ]);
+
+        let getter = PartitionGetter::new(&row_type, Arc::from(["region".to_string()]))
+            .expect("should succeed");
+
+        let row = GenericRow::from_data(vec![Datum::Int32(42), Datum::from("US")]);
+        let partition_name = getter.get_partition(&row).expect("should succeed");
+        assert_eq!(partition_name, "US");
+    }
+
+    #[test]
+    fn test_partition_getter_multiple_keys() {
+        let row_type = RowType::new(vec![
+            DataField::new("id".to_string(), DataType::Int(IntType::new()), None),
+            DataField::new(
+                "date".to_string(),
+                DataType::String(StringType::new()),
+                None,
+            ),
+            DataField::new(
+                "region".to_string(),
+                DataType::String(StringType::new()),
+                None,
+            ),
+        ]);
+
+        let getter = PartitionGetter::new(
+            &row_type,
+            Arc::from(["date".to_string(), "region".to_string()]),
+        )
+        .expect("should succeed");
+
+        let row = GenericRow::from_data(vec![
+            Datum::Int32(42),
+            Datum::from("2024-01-15"),
+            Datum::from("US"),
+        ]);
+        let partition_name = getter.get_partition(&row).expect("should succeed");
+        assert_eq!(partition_name, "2024-01-15$US");
+    }
+
+    #[test]
+    fn test_partition_getter_invalid_column() {
+        let row_type = RowType::new(vec![DataField::new(
+            "id".to_string(),
+            DataType::Int(IntType::new()),
+            None,
+        )]);
+
+        let result = PartitionGetter::new(&row_type, Arc::from(["nonexistent".to_string()]));
+        assert!(result.is_err());
+    }
+
+    #[test]
+    fn test_partition_getter_null_value() {
+        let row_type = RowType::new(vec![
+            DataField::new("id".to_string(), DataType::Int(IntType::new()), None),
+            DataField::new(
+                "region".to_string(),
+                DataType::String(StringType::new()),
+                None,
+            ),
+        ]);
+
+        let getter = PartitionGetter::new(&row_type, Arc::from(["region".to_string()]))
+            .expect("should succeed");
+
+        let row = GenericRow::from_data(vec![Datum::Int32(42), Datum::Null]);
+        let result = getter.get_partition(&row);
+        assert!(result.is_err());
+    }
+
+    #[test]
+    fn test_get_partition_spec() {
+        let row_type = RowType::new(vec![
+            DataField::new("id".to_string(), DataType::Int(IntType::new()), None),
+            DataField::new(
+                "date".to_string(),
+                DataType::String(StringType::new()),
+                None,
+            ),
+            DataField::new(
+                "region".to_string(),
+                DataType::String(StringType::new()),
+                None,
+            ),
+        ]);
+
+        let getter = PartitionGetter::new(
+            &row_type,
+            Arc::from(["date".to_string(), "region".to_string()]),
+        )
+        .expect("should succeed");
+
+        let row = GenericRow::from_data(vec![
+            Datum::Int32(42),
+            Datum::from("2024-01-15"),
+            Datum::from("US"),
+        ]);
+        let spec = getter.get_partition_spec(&row).expect("should succeed");
+
+        assert_eq!(spec.get_partition_keys(), &["date", "region"]);
+        assert_eq!(spec.get_partition_values(), &["2024-01-15", "US"]);
+        assert_eq!(spec.get_partition_name(), "2024-01-15$US");
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index 368d8abc80..68426d7c28 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -93,6 +93,12 @@ pub enum Error {
     )]
     IllegalArgument { message: String },
 
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting invalid partition error {}.", message)
+    )]
+    InvalidPartition { message: String },
+
     #[snafu(
         visibility(pub(crate)),
         display("Fluss hitting IO not supported error {}.", message)
diff --git a/fluss-rust/crates/fluss/src/metadata/partition.rs b/fluss-rust/crates/fluss/src/metadata/partition.rs
index e40fbf9e4a..bc1935c3c8 100644
--- a/fluss-rust/crates/fluss/src/metadata/partition.rs
+++ b/fluss-rust/crates/fluss/src/metadata/partition.rs
@@ -15,11 +15,12 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::PartitionId;
 use crate::error::{Error, Result};
 use crate::proto::{PbKeyValue, PbPartitionInfo, PbPartitionSpec};
+use crate::{PartitionId, TableId};
 use std::collections::HashMap;
 use std::fmt::{Display, Formatter};
+use std::sync::Arc;
 
 /// Represents a partition spec in fluss. Partition columns and values are NOT of strict order, and
 /// they need to be re-arranged to the correct order by comparing with a list of strictly ordered
@@ -72,20 +73,21 @@ impl Display for PartitionSpec {
 /// partition keys.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
 pub struct ResolvedPartitionSpec {
-    partition_keys: Vec<String>,
+    partition_keys: Arc<[String]>,
     partition_values: Vec<String>,
 }
 
 pub const PARTITION_SPEC_SEPARATOR: &str = "$";
 
 impl ResolvedPartitionSpec {
-    pub fn new(partition_keys: Vec<String>, partition_values: Vec<String>) -> Result<Self> {
+    pub fn new(partition_keys: Arc<[String]>, partition_values: Vec<String>) -> Result<Self> {
         if partition_keys.len() != partition_values.len() {
             return Err(Error::IllegalArgument {
                 message: "The number of partition keys and partition values should be the same."
                     .to_string(),
             });
         }
+
         Ok(Self {
             partition_keys,
             partition_values,
@@ -93,7 +95,7 @@ impl ResolvedPartitionSpec {
     }
 
     pub fn from_partition_spec(
-        partition_keys: Vec<String>,
+        partition_keys: Arc<[String]>,
         partition_spec: &PartitionSpec,
     ) -> Self {
         let partition_values =
@@ -104,14 +106,7 @@ impl ResolvedPartitionSpec {
         }
     }
 
-    pub fn from_partition_value(partition_key: String, partition_value: String) -> Self {
-        Self {
-            partition_keys: vec![partition_key],
-            partition_values: vec![partition_value],
-        }
-    }
-
-    pub fn from_partition_name(partition_keys: Vec<String>, partition_name: &str) -> Self {
+    pub fn from_partition_name(partition_keys: Arc<[String]>, partition_name: &str) -> Self {
         let partition_values: Vec<String> = partition_name
             .split(PARTITION_SPEC_SEPARATOR)
             .map(|s| s.to_string())
@@ -140,7 +135,7 @@ impl ResolvedPartitionSpec {
         }
 
         Ok(Self {
-            partition_keys: keys,
+            partition_keys: Arc::from(keys),
             partition_values: values,
         })
     }
@@ -236,6 +231,7 @@ impl ResolvedPartitionSpec {
             .iter()
             .map(|kv| kv.value.clone())
             .collect();
+
         Self {
             partition_keys,
             partition_values,
@@ -243,7 +239,7 @@ impl ResolvedPartitionSpec {
     }
 
     fn get_reordered_partition_values(
-        partition_keys: &[String],
+        partition_keys: &Arc<[String]>,
         partition_spec: &PartitionSpec,
     ) -> Vec<String> {
         let partition_spec_map = partition_spec.get_spec_map();
@@ -310,7 +306,7 @@ impl PartitionInfo {
 }
 
 impl Display for PartitionInfo {
-    fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
+    fn fmt(&self, f: &mut Formatter) -> std::fmt::Result {
         write!(
             f,
             "Partition{{name='{}', id={}}}",
@@ -323,12 +319,12 @@ impl Display for PartitionInfo {
 /// A class to identify a table partition, containing the table id and the partition id.
 #[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
 pub struct TablePartition {
-    table_id: i64,
+    table_id: TableId,
     partition_id: PartitionId,
 }
 
 impl TablePartition {
-    pub fn new(table_id: i64, partition_id: PartitionId) -> Self {
+    pub fn new(table_id: TableId, partition_id: PartitionId) -> Self {
         Self {
             table_id,
             partition_id,
@@ -361,7 +357,7 @@ mod tests {
     #[test]
     fn test_resolved_partition_spec_name() {
         let spec = ResolvedPartitionSpec::new(
-            vec!["date".to_string(), "region".to_string()],
+            Arc::from(["date".to_string(), "region".to_string()]),
             vec!["2024-01-15".to_string(), "US".to_string()],
         )
         .unwrap();
@@ -376,7 +372,7 @@ mod tests {
     #[test]
     fn test_resolved_partition_spec_from_partition_name() {
         let spec = ResolvedPartitionSpec::from_partition_name(
-            vec!["date".to_string(), "region".to_string()],
+            Arc::from(["date".to_string(), "region".to_string()]),
             "2024-01-15$US",
         );
 
@@ -396,7 +392,7 @@ mod tests {
     #[test]
     fn test_resolved_partition_spec_mismatched_lengths() {
         let result = ResolvedPartitionSpec::new(
-            vec!["date".to_string(), "region".to_string()],
+            Arc::from(["date".to_string(), "region".to_string()]),
             vec!["2024-01-15".to_string()],
         );
 
@@ -405,9 +401,11 @@ mod tests {
 
     #[test]
     fn test_partition_info() {
-        let spec =
-            ResolvedPartitionSpec::new(vec!["date".to_string()], vec!["2024-01-15".to_string()])
-                .unwrap();
+        let spec = ResolvedPartitionSpec::new(
+            Arc::from(["date".to_string()]),
+            vec!["2024-01-15".to_string()],
+        )
+        .unwrap();
 
         let info = PartitionInfo::new(42, spec);
         assert_eq!(info.get_partition_id(), 42);
@@ -438,9 +436,11 @@ mod tests {
 
     #[test]
     fn test_partition_info_pb_roundtrip() {
-        let spec =
-            ResolvedPartitionSpec::new(vec!["date".to_string()], vec!["2024-01-15".to_string()])
-                .unwrap();
+        let spec = ResolvedPartitionSpec::new(
+            Arc::from(["date".to_string()]),
+            vec!["2024-01-15".to_string()],
+        )
+        .unwrap();
         let info = PartitionInfo::new(42, spec);
 
         let pb = info.to_pb();
@@ -453,14 +453,16 @@ mod tests {
     #[test]
     fn test_contains() {
         let full_spec = ResolvedPartitionSpec::new(
-            vec!["date".to_string(), "region".to_string()],
+            Arc::from(["date".to_string(), "region".to_string()]),
             vec!["2024-01-15".to_string(), "US".to_string()],
         )
         .unwrap();
 
-        let partial_spec =
-            ResolvedPartitionSpec::new(vec!["date".to_string()], vec!["2024-01-15".to_string()])
-                .unwrap();
+        let partial_spec = ResolvedPartitionSpec::new(
+            Arc::from(["date".to_string()]),
+            vec!["2024-01-15".to_string()],
+        )
+        .unwrap();
 
         assert!(full_spec.contains(&partial_spec).unwrap());
     }
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 3b9da7d99a..0c0cdf5152 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -678,6 +678,10 @@ impl Display for TablePath {
     }
 }
 
+const MAX_NAME_LENGTH: usize = 200;
+
+const INTERNAL_NAME_PREFIX: &str = "__";
+
 impl TablePath {
     pub fn new(db: String, tbl: String) -> Self {
         TablePath {
@@ -695,6 +699,52 @@ impl TablePath {
     pub fn table(&self) -> &str {
         &self.table
     }
+
+    pub fn detect_invalid_name(identifier: &str) -> Option<String> {
+        if identifier.is_empty() {
+            return Some("the empty string is not allowed".to_string());
+        }
+        if identifier == "." {
+            return Some("'.' is not allowed".to_string());
+        }
+        if identifier == ".." {
+            return Some("'..' is not allowed".to_string());
+        }
+        if identifier.len() > MAX_NAME_LENGTH {
+            return Some(format!(
+                "the length of '{}' is longer than the max allowed length {}",
+                identifier, MAX_NAME_LENGTH
+            ));
+        }
+        if Self::contains_invalid_pattern(identifier) {
+            return Some(format!(
+                "'{}' contains one or more characters other than ASCII alphanumerics, '_' and '-'",
+                identifier
+            ));
+        }
+        None
+    }
+
+    pub fn validate_prefix(identifier: &str) -> Option<String> {
+        if identifier.starts_with(INTERNAL_NAME_PREFIX) {
+            return Some(format!(
+                "'{}' is not allowed as prefix, since it is reserved for internal databases/internal tables/internal partitions in Fluss server",
+                INTERNAL_NAME_PREFIX
+            ));
+        }
+        None
+    }
+
+    /// Reports whether `identifier` contains a character that is not allowed in names.
+    ///
+    /// The allowed characters are the ASCII alphanumerics, `_` and `-`. An empty
+    /// `identifier` contains no offending character, so the result is `false`.
+    fn contains_invalid_pattern(identifier: &str) -> bool {
+        let is_allowed = |ch: char| ch.is_ascii_alphanumeric() || matches!(ch, '_' | '-');
+
+        // `any` stops scanning at the first disallowed character.
+        identifier.chars().any(|ch| !is_allowed(ch))
+    }
 }
 
 /// A database name, table name and partition name combo. It's used to represent the physical path of
@@ -1106,3 +1156,63 @@ impl LakeSnapshot {
         &self.table_buckets_offset
     }
 }
+
+/// Tests for [`TablePath`].
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_validate() {
+        // assert valid name
+        let path = TablePath::new("db_2-abc3".to_string(), "table-1_abc_2".to_string());
+        assert!(TablePath::detect_invalid_name(path.database()).is_none());
+        assert!(TablePath::detect_invalid_name(path.table()).is_none());
+        assert_eq!(path.to_string(), "db_2-abc3.table-1_abc_2");
+
+        // assert invalid name prefix
+        assert!(
+            TablePath::validate_prefix("__table-1")
+                .unwrap()
+                .contains("'__' is not allowed as prefix")
+        );
+
+        // check max length
+        let long_name = "a".repeat(200);
+        assert!(TablePath::detect_invalid_name(&long_name).is_none());
+
+        // assert invalid names
+        assert_invalid_name("*abc", "'*abc' contains one or more characters other than");
+        assert_invalid_name(
+            "table.abc",
+            "'table.abc' contains one or more characters other than",
+        );
+        assert_invalid_name("", "the empty string is not allowed");
+        assert_invalid_name(" ", "' ' contains one or more characters other than");
+        assert_invalid_name(".", "'.' is not allowed");
+        assert_invalid_name("..", "'..' is not allowed");
+        let invalid_long_name = "a".repeat(201);
+        assert_invalid_name(
+            &invalid_long_name,
+            &format!(
+                "the length of '{}' is longer than the max allowed length {}",
+                invalid_long_name, MAX_NAME_LENGTH
+            ),
+        );
+    }
+
+    fn assert_invalid_name(name: &str, expected_message: &str) {
+        let result = TablePath::detect_invalid_name(name);
+        assert!(
+            result.is_some(),
+            "Expected '{}' to be invalid, but it was valid",
+            name
+        );
+        assert!(
+            result.as_ref().unwrap().contains(expected_message),
+            "Expected message containing '{}', but got '{}'",
+            expected_message,
+            result.unwrap()
+        );
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index b808373084..e1b70adca2 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -789,10 +789,7 @@ impl TimestampNtz {
         }
     }
 
-    pub fn from_millis_nanos(
-        millisecond: i64,
-        nano_of_millisecond: i32,
-    ) -> crate::error::Result<Self> {
+    pub fn from_millis_nanos(millisecond: i64, nano_of_millisecond: i32) -> Result<Self> {
         if !(0..=MAX_NANO_OF_MILLISECOND).contains(&nano_of_millisecond) {
             return Err(crate::error::Error::IllegalArgument {
                 message: format!(
@@ -836,10 +833,7 @@ impl TimestampLtz {
         }
     }
 
-    pub fn from_millis_nanos(
-        epoch_millisecond: i64,
-        nano_of_millisecond: i32,
-    ) -> crate::error::Result<Self> {
+    pub fn from_millis_nanos(epoch_millisecond: i64, nano_of_millisecond: i32) -> Result<Self> {
         if !(0..=MAX_NANO_OF_MILLISECOND).contains(&nano_of_millisecond) {
             return Err(crate::error::Error::IllegalArgument {
                 message: format!(
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
index 3760487d42..b987fe255d 100644
--- a/fluss-rust/crates/fluss/src/util/mod.rs
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 pub mod murmur_hash;
+pub mod partition;
 pub mod varint;
 
 use crate::TableId;
diff --git a/fluss-rust/crates/fluss/src/util/partition.rs b/fluss-rust/crates/fluss/src/util/partition.rs
new file mode 100644
index 0000000000..036cac46e2
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/util/partition.rs
@@ -0,0 +1,532 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Utilities for converting partition column values into partition name strings.
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::DataType;
+use crate::row::{Date, Datum, Time, TimestampLtz, TimestampNtz};
+use jiff::ToSpan;
+use std::fmt::Write;
+
+fn hex_string(bytes: &[u8]) -> String {
+    let mut hex = String::with_capacity(bytes.len() * 2);
+    for &b in bytes {
+        write!(hex, "{:02x}", b).unwrap();
+    }
+    hex
+}
+
+/// Renders an `f32` for use in a partition name: `NaN`, `Inf` or `-Inf` for the
+/// non-finite values, otherwise the `Display` text with `.` replaced by `_`.
+// NOTE(review): `Display` prints 5.0 as `5` and never switches to exponent notation;
+// confirm this yields the same names as the other Fluss clients for such values.
+fn reformat_float(value: f32) -> String {
+    let special = match value {
+        v if v.is_nan() => "NaN",
+        v if v.is_infinite() && v > 0.0 => "Inf",
+        v if v.is_infinite() => "-Inf",
+        finite => return finite.to_string().replace('.', "_"),
+    };
+    special.to_string()
+}
+
+/// Renders an `f64` for use in a partition name: `NaN`, `Inf` or `-Inf` for the
+/// non-finite values, otherwise the `Display` text with `.` replaced by `_`.
+// NOTE(review): `Display` prints 5.0 as `5` and never switches to exponent notation;
+// confirm this yields the same names as the other Fluss clients for such values.
+fn reformat_double(value: f64) -> String {
+    let special = match value {
+        v if v.is_nan() => "NaN",
+        v if v.is_infinite() && v > 0.0 => "Inf",
+        v if v.is_infinite() => "-Inf",
+        finite => return finite.to_string().replace('.', "_"),
+    };
+    special.to_string()
+}
+
+const UNIX_EPOCH_DATE: jiff::civil::Date = jiff::civil::date(1970, 1, 1);
+/// Formats `days`, an offset from `UNIX_EPOCH_DATE`, as zero-padded `YYYY-MM-DD`.
+fn day_to_string(days: i32) -> String {
+    let date = UNIX_EPOCH_DATE + days.days();
+    format!("{:04}-{:02}-{:02}", date.year(), date.month(), date.day())
+}
+/// Formats `date` by handing its inner day count to `day_to_string`.
+fn date_to_string(date: Date) -> String {
+    day_to_string(date.get_inner())
+}
+
+const MILLIS_PER_SECOND: i64 = 1_000;
+const MILLIS_PER_MINUTE: i64 = 60 * MILLIS_PER_SECOND;
+const MILLIS_PER_HOUR: i64 = 60 * MILLIS_PER_MINUTE;
+
+fn milli_to_string(milli: i32) -> String {
+    let hour = milli.div_euclid(MILLIS_PER_HOUR as i32);
+    let min = milli
+        .rem_euclid(MILLIS_PER_HOUR as i32)
+        .div_euclid(MILLIS_PER_MINUTE as i32);
+    let sec = milli
+        .rem_euclid(MILLIS_PER_MINUTE as i32)
+        .div_euclid(MILLIS_PER_SECOND as i32);
+    let ms = milli.rem_euclid(MILLIS_PER_SECOND as i32);
+
+    format!("{:02}-{:02}-{:02}_{:03}", hour, min, sec, ms)
+}
+
+fn time_to_string(time: Time) -> String {
+    milli_to_string(time.get_inner())
+}
+
+trait Timestamp {
+    fn get_milli(&self) -> i64; // millisecond value, read as an offset from the Unix epoch
+    fn get_nano_of_milli(&self) -> i32; // nanoseconds within that millisecond
+}
+// Lets `timestamp_to_string` accept a `TimestampNtz` by forwarding to its own getters.
+impl Timestamp for TimestampNtz {
+    fn get_milli(&self) -> i64 {
+        self.get_millisecond()
+    }
+    // Forwards the nano-of-millisecond component unchanged.
+    fn get_nano_of_milli(&self) -> i32 {
+        self.get_nano_of_millisecond()
+    }
+}
+// Lets `timestamp_to_string` accept a `TimestampLtz` by forwarding to its own getters.
+impl Timestamp for TimestampLtz {
+    fn get_milli(&self) -> i64 {
+        self.get_epoch_millisecond()
+    }
+    // Forwards the nano-of-millisecond component unchanged.
+    fn get_nano_of_milli(&self) -> i32 {
+        self.get_nano_of_millisecond()
+    }
+}
+
+/// Renders a timestamp as a partition-name fragment.
+///
+/// The millisecond value is treated as an offset from the Unix epoch and broken down
+/// into UTC calendar fields; the layout is meant to follow the Java side's behaviour.
+/// The text always starts with `YYYY-MM-DD-HH-MM-SS_`, and what follows the underscore
+/// depends on the sub-second parts:
+///
+/// * nano-of-millisecond above zero: three millisecond-of-second digits, then six
+///   nano-of-millisecond digits, e.g. `2025-05-31-03-42-35_428099988`;
+/// * otherwise, millisecond-of-second above zero: the three millisecond digits only,
+///   e.g. `2025-05-31-03-42-35_428`;
+/// * both zero: nothing, so the text ends with the underscore, e.g.
+///   `2025-05-31-03-42-35_`.
+///
+/// Values before the epoch are split with Euclidean division, which keeps the
+/// millisecond-of-second in `0..1000`.
+// NOTE(review): the `jiff` span construction and timestamp addition look like they can
+// panic for millisecond values far outside jiff's supported range -- confirm.
+fn timestamp_to_string<T: Timestamp>(ts: T) -> String {
+    let epoch_millis = ts.get_milli();
+    let nano_of_milli = ts.get_nano_of_milli();
+
+    let whole_seconds = epoch_millis.div_euclid(MILLIS_PER_SECOND);
+    let milli_of_second = epoch_millis.rem_euclid(MILLIS_PER_SECOND);
+
+    let instant = jiff::Timestamp::UNIX_EPOCH + jiff::Span::new().seconds(whole_seconds);
+    let utc = instant.to_zoned(jiff::tz::TimeZone::UTC).datetime();
+
+    // Every variant shares this prefix, trailing underscore included.
+    let mut text = format!(
+        "{:04}-{:02}-{:02}-{:02}-{:02}-{:02}_",
+        utc.year(),
+        utc.month(),
+        utc.day(),
+        utc.hour(),
+        utc.minute(),
+        utc.second(),
+    );
+
+    // Append only the sub-second digits that the value actually needs.
+    if nano_of_milli > 0 {
+        write!(text, "{milli_of_second:03}{nano_of_milli:06}").unwrap();
+    } else if milli_of_second > 0 {
+        write!(text, "{milli_of_second:03}").unwrap();
+    }
+
+    text
+}
+
+/// Converts a Datum value to its string representation for partition naming.
+pub fn convert_value_of_type(value: &Datum, data_type: &DataType) -> Result<String> {
+    match (value, data_type) {
+        (Datum::String(s), DataType::Char(_) | DataType::String(_)) => Ok(s.to_string()),
+        (Datum::Bool(b), DataType::Boolean(_)) => Ok(b.to_string()),
+        (Datum::Blob(bytes), DataType::Binary(_) | DataType::Bytes(_)) => Ok(hex_string(bytes)),
+        (Datum::Int8(v), DataType::TinyInt(_)) => Ok(v.to_string()),
+        (Datum::Int16(v), DataType::SmallInt(_)) => Ok(v.to_string()),
+        (Datum::Int32(v), DataType::Int(_)) => Ok(v.to_string()),
+        (Datum::Int64(v), DataType::BigInt(_)) => Ok(v.to_string()),
+        (Datum::Date(d), DataType::Date(_)) => Ok(date_to_string(*d)),
+        (Datum::Time(t), DataType::Time(_)) => Ok(time_to_string(*t)),
+        (Datum::Float32(f), DataType::Float(_)) => Ok(reformat_float(f.into_inner())),
+        (Datum::Float64(f), DataType::Double(_)) => Ok(reformat_double(f.into_inner())),
+        (Datum::TimestampLtz(ts), DataType::TimestampLTz(_)) => Ok(timestamp_to_string(*ts)),
+        (Datum::TimestampNtz(ts), DataType::Timestamp(_)) => Ok(timestamp_to_string(*ts)),
+        _ => Err(IllegalArgument {
+            message: format!(
+                "Unsupported conversion to partition key from data type: {data_type:?}, value: {value:?}"
+            ),
+        }),
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{
+        BigIntType, BinaryType, BooleanType, BytesType, CharType, DateType, DoubleType, FloatType,
+        IntType, SmallIntType, StringType, TimeType, TimestampLTzType, TimestampType, TinyIntType,
+    };
+    use crate::row::{Date, Time, TimestampLtz, TimestampNtz};
+    use std::borrow::Cow;
+
+    use crate::metadata::TablePath;
+
+    #[test]
+    fn test_string() {
+        // A STRING value is passed through unchanged and is a legal partition name.
+        let value = Datum::String(Cow::Borrowed("Fluss"));
+        let data_type = DataType::String(StringType::new());
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "Fluss");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_char() {
+        // A CHAR value is passed through unchanged, just like STRING.
+        let value = Datum::String(Cow::Borrowed("F"));
+        let data_type = DataType::Char(CharType::new(1));
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "F");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_boolean() {
+        // A BOOLEAN value is rendered through its `to_string` text.
+        let value = Datum::Bool(true);
+        let data_type = DataType::Boolean(BooleanType::new());
+
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "true");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_byte() {
+        // BYTES content is rendered as lowercase hexadecimal, two digits per byte.
+        let value = Datum::Blob(Cow::Borrowed(&[0x10, 0x20, 0x30, 0x40, 0x50, 0xFF]));
+        let data_type = DataType::Bytes(BytesType::new());
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "1020304050ff");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_binary() {
+        // BINARY content is rendered the same way as BYTES: lowercase hexadecimal.
+        let value = Datum::Blob(Cow::Borrowed(&[0x10, 0x20, 0x30, 0x40, 0x50, 0xFF]));
+        let data_type = DataType::Binary(BinaryType::new(6));
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "1020304050ff");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_tiny_int() {
+        // A TINYINT value is rendered as its decimal text.
+        let value = Datum::Int8(100);
+        let data_type = DataType::TinyInt(TinyIntType::new());
+
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "100");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_small_int() {
+        // A negative SMALLINT keeps its leading `-`, which is a legal name character.
+        let value = Datum::Int16(-32760);
+        let data_type = DataType::SmallInt(SmallIntType::new());
+
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "-32760");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_int() {
+        // An INT value is rendered as its decimal text.
+        let value = Datum::Int32(299000);
+        let data_type = DataType::Int(IntType::new());
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "299000");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_big_int() {
+        // A BIGINT value is rendered as its decimal text.
+        let value = Datum::Int64(1748662955428);
+        let data_type = DataType::BigInt(BigIntType::new());
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "1748662955428");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_date() {
+        // Day 20235 counted from 1970-01-01 is expected to render as 2025-05-27.
+        let value = Datum::Date(Date::new(20235));
+        let data_type = DataType::Date(DateType::new());
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "2025-05-27");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_time() {
+        // 5_402_199 ms into the day is 01:30:02.199, rendered as `HH-MM-SS_mmm`.
+        let value = Datum::Time(Time::new(5402199));
+        let data_type = DataType::Time(TimeType::new(3).unwrap());
+
+        let partition_name = convert_value_of_type(&value, &data_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "01-30-02_199");
+        assert!(TablePath::detect_invalid_name(&partition_name).is_none());
+    }
+
+    #[test]
+    fn test_float() {
+        let float_type = DataType::Float(FloatType::new());
+
+        // Finite value: the decimal point becomes an underscore.
+        let finite = convert_value_of_type(&Datum::Float32(5.73.into()), &float_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(finite, "5_73");
+        assert!(TablePath::detect_invalid_name(&finite).is_none());
+
+        let not_a_number = Datum::Float32(f32::NAN.into());
+        assert_eq!(
+            convert_value_of_type(&not_a_number, &float_type)
+                .expect("datum conversion to partition string failed"),
+            "NaN"
+        );
+
+        let positive_infinity = Datum::Float32(f32::INFINITY.into());
+        assert_eq!(
+            convert_value_of_type(&positive_infinity, &float_type)
+                .expect("datum conversion to partition string failed"),
+            "Inf"
+        );
+
+        let negative_infinity = Datum::Float32(f32::NEG_INFINITY.into());
+        assert_eq!(
+            convert_value_of_type(&negative_infinity, &float_type)
+                .expect("datum conversion to partition string failed"),
+            "-Inf"
+        );
+    }
+
+    #[test]
+    fn test_double() {
+        let double_type = DataType::Double(DoubleType::new());
+
+        // Finite value: the decimal point becomes an underscore.
+        let finite = convert_value_of_type(&Datum::Float64(5.73737.into()), &double_type)
+            .expect("datum conversion to partition string failed");
+        assert_eq!(finite, "5_73737");
+        assert!(TablePath::detect_invalid_name(&finite).is_none());
+
+        let not_a_number = Datum::Float64(f64::NAN.into());
+        assert_eq!(
+            convert_value_of_type(&not_a_number, &double_type)
+                .expect("datum conversion to partition string failed"),
+            "NaN"
+        );
+
+        let positive_infinity = Datum::Float64(f64::INFINITY.into());
+        assert_eq!(
+            convert_value_of_type(&positive_infinity, &double_type)
+                .expect("datum conversion to partition string failed"),
+            "Inf"
+        );
+
+        let negative_infinity = Datum::Float64(f64::NEG_INFINITY.into());
+        assert_eq!(
+            convert_value_of_type(&negative_infinity, &double_type)
+                .expect("datum conversion to partition string failed"),
+            "-Inf"
+        );
+    }
+
+    #[test]
+    fn test_timestamp_ntz() {
+        let value = Datum::TimestampNtz(
+            TimestampNtz::from_millis_nanos(1748662955428, 99988)
+                .expect("TimestampNtz init failed"),
+        );
+        // Millis and nanos both non-zero: nine sub-second digits follow the underscore.
+        let partition_name =
+            convert_value_of_type(&value, &DataType::Timestamp(TimestampType::new(9).unwrap()))
+                .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "2025-05-31-03-42-35_428099988");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+
+        // Nanos are zero: only the three millisecond digits follow the underscore.
+        let value = Datum::TimestampNtz(
+            TimestampNtz::from_millis_nanos(1748662955428, 0).expect("TimestampNtz init failed"),
+        );
+
+        let partition_name =
+            convert_value_of_type(&value, &DataType::Timestamp(TimestampType::new(9).unwrap()))
+                .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "2025-05-31-03-42-35_428");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+
+        // Millisecond-of-second is zero but nanos are not: `000` is still printed.
+        let value = Datum::TimestampNtz(
+            TimestampNtz::from_millis_nanos(1748662955000, 99988)
+                .expect("TimestampNtz init failed"),
+        );
+
+        let partition_name =
+            convert_value_of_type(&value, &DataType::Timestamp(TimestampType::new(9).unwrap()))
+                .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "2025-05-31-03-42-35_000099988");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+
+        // Both sub-second parts are zero: the name ends with the underscore.
+        let value = Datum::TimestampNtz(
+            TimestampNtz::from_millis_nanos(1748662955000, 0).expect("TimestampNtz init failed"),
+        );
+
+        let partition_name =
+            convert_value_of_type(&value, &DataType::Timestamp(TimestampType::new(9).unwrap()))
+                .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "2025-05-31-03-42-35_");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+
+        // Millisecond value before the Unix epoch.
+        let value = Datum::TimestampNtz(
+            TimestampNtz::from_millis_nanos(-1748662955428, 99988)
+                .expect("TimestampNtz init failed"),
+        );
+
+        let partition_name =
+            convert_value_of_type(&value, &DataType::Timestamp(TimestampType::new(9).unwrap()))
+                .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "1914-08-03-20-17-24_572099988");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+    }
+
+    #[test]
+    fn test_timestamp_ltz() {
+        let value = Datum::TimestampLtz(
+            TimestampLtz::from_millis_nanos(1748662955428, 99988)
+                .expect("TimestampLtz init failed"),
+        );
+        // Millis and nanos both non-zero: nine sub-second digits follow the underscore.
+        let partition_name = convert_value_of_type(
+            &value,
+            &DataType::TimestampLTz(TimestampLTzType::new(9).unwrap()),
+        )
+        .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "2025-05-31-03-42-35_428099988");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+
+        // Nanos are zero: only the three millisecond digits follow the underscore.
+        let value = Datum::TimestampLtz(
+            TimestampLtz::from_millis_nanos(1748662955428, 0).expect("TimestampLtz init failed"),
+        );
+
+        let partition_name = convert_value_of_type(
+            &value,
+            &DataType::TimestampLTz(TimestampLTzType::new(9).unwrap()),
+        )
+        .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "2025-05-31-03-42-35_428");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+
+        // Millisecond-of-second is zero but nanos are not: `000` is still printed.
+        let value = Datum::TimestampLtz(
+            TimestampLtz::from_millis_nanos(1748662955000, 99988)
+                .expect("TimestampLtz init failed"),
+        );
+
+        let partition_name = convert_value_of_type(
+            &value,
+            &DataType::TimestampLTz(TimestampLTzType::new(9).unwrap()),
+        )
+        .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "2025-05-31-03-42-35_000099988");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+
+        // Both sub-second parts are zero: the name ends with the underscore.
+        let value = Datum::TimestampLtz(
+            TimestampLtz::from_millis_nanos(1748662955000, 0).expect("TimestampLtz init failed"),
+        );
+
+        let partition_name = convert_value_of_type(
+            &value,
+            &DataType::TimestampLTz(TimestampLTzType::new(9).unwrap()),
+        )
+        .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "2025-05-31-03-42-35_");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+
+        // Millisecond value before the Unix epoch.
+        let value = Datum::TimestampLtz(
+            TimestampLtz::from_millis_nanos(-1748662955428, 99988)
+                .expect("TimestampLtz init failed"),
+        );
+
+        let partition_name = convert_value_of_type(
+            &value,
+            &DataType::TimestampLTz(TimestampLTzType::new(9).unwrap()),
+        )
+        .expect("datum conversion to partition string failed");
+        assert_eq!(partition_name, "1914-08-03-20-17-24_572099988");
+        let invalid_reason = TablePath::detect_invalid_name(&partition_name);
+        assert!(invalid_reason.is_none());
+    }
+}

From 9371dcc313acf27b9eb53763867d5592b3b0ede4 Mon Sep 17 00:00:00 2001
From: Junbo Wang <beryllwang@gmail.com>
Date: Wed, 28 Jan 2026 13:28:27 +0800
Subject: [PATCH 093/287] [chore] Implement is_auto_partitioned method in
 table.rs (#48)

---
 .../src/client/table/partition_getter.rs      |   3 +-
 fluss-rust/crates/fluss/src/metadata/table.rs | 188 +++++++++++++++++-
 fluss-rust/crates/fluss/src/util/partition.rs |   4 +-
 3 files changed, 180 insertions(+), 15 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
index 887c0a4fd7..1a76106867 100644
--- a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
+++ b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
@@ -49,8 +49,7 @@ impl PartitionGetter {
             } else {
                 return Err(IllegalArgument {
                     message: format!(
-                        "The partition column {} is not in the row {}.",
-                        partition_key, row_type
+                        "The partition column {partition_key} is not in the row {row_type}."
                     ),
                 });
             };
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 0c0cdf5152..7b93acae14 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -712,14 +712,12 @@ impl TablePath {
         }
         if identifier.len() > MAX_NAME_LENGTH {
             return Some(format!(
-                "the length of '{}' is longer than the max allowed length {}",
-                identifier, MAX_NAME_LENGTH
+                "the length of '{identifier}' is longer than the max allowed length {MAX_NAME_LENGTH}"
             ));
         }
         if Self::contains_invalid_pattern(identifier) {
             return Some(format!(
-                "'{}' contains one or more characters other than ASCII alphanumerics, '_' and '-'",
-                identifier
+                "'{identifier}' contains one or more characters other than ASCII alphanumerics, '_' and '-'"
             ));
         }
         None
@@ -728,8 +726,7 @@ impl TablePath {
     pub fn validate_prefix(identifier: &str) -> Option<String> {
         if identifier.starts_with(INTERNAL_NAME_PREFIX) {
             return Some(format!(
-                "'{}' is not allowed as prefix, since it is reserved for internal databases/internal tables/internal partitions in Fluss server",
-                INTERNAL_NAME_PREFIX
+                "'{INTERNAL_NAME_PREFIX}' is not allowed as prefix, since it is reserved for internal databases/internal tables/internal partitions in Fluss server"
             ));
         }
         None
@@ -834,6 +831,75 @@ impl TableInfo {
     }
 }
 
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+pub struct AutoPartitionStrategy {
+    auto_partition_enabled: bool,
+    auto_partition_key: Option<String>,
+    auto_partition_time_unit: String,
+    auto_partition_num_precreate: i32,
+    auto_partition_num_retention: i32,
+    auto_partition_timezone: String,
+}
+
+impl AutoPartitionStrategy {
+    pub fn from(properties: &HashMap<String, String>) -> Self {
+        Self {
+            auto_partition_enabled: properties
+                .get("table.auto-partition.enabled")
+                .and_then(|s| s.parse().ok())
+                .unwrap_or(false),
+            auto_partition_key: properties
+                .get("table.auto-partition.key")
+                .map(|s| s.to_string()),
+            auto_partition_time_unit: properties
+                .get("table.auto-partition.time-unit")
+                .map(|s| s.to_string())
+                .unwrap_or_else(|| "DAY".to_string()),
+            auto_partition_num_precreate: properties
+                .get("table.auto-partition.num-precreate")
+                .and_then(|s| s.parse().ok())
+                .unwrap_or(2),
+            auto_partition_num_retention: properties
+                .get("table.auto-partition.num-retention")
+                .and_then(|s| s.parse().ok())
+                .unwrap_or(7),
+            auto_partition_timezone: properties
+                .get("table.auto-partition.time-zone")
+                .map(|s| s.to_string())
+                .unwrap_or_else(|| {
+                    jiff::tz::TimeZone::system()
+                        .iana_name()
+                        .unwrap_or("UTC")
+                        .to_string()
+                }),
+        }
+    }
+
+    pub fn is_auto_partition_enabled(&self) -> bool {
+        self.auto_partition_enabled
+    }
+
+    pub fn key(&self) -> Option<&str> {
+        self.auto_partition_key.as_deref()
+    }
+
+    pub fn time_unit(&self) -> &str {
+        &self.auto_partition_time_unit
+    }
+
+    pub fn num_precreate(&self) -> i32 {
+        self.auto_partition_num_precreate
+    }
+
+    pub fn num_retention(&self) -> i32 {
+        self.auto_partition_num_retention
+    }
+
+    pub fn timezone(&self) -> &str {
+        &self.auto_partition_timezone
+    }
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
 pub struct TableConfig {
     pub properties: HashMap<String, String>,
@@ -866,6 +932,10 @@ impl TableConfig {
             .unwrap_or(DEFAULT_KV_FORMAT);
         kv_format.parse().map_err(Into::into)
     }
+
+    pub fn get_auto_partition_strategy(&self) -> AutoPartitionStrategy {
+        AutoPartitionStrategy::from(&self.properties)
+    }
 }
 
 impl TableInfo {
@@ -1003,7 +1073,11 @@ impl TableInfo {
     }
 
     pub fn is_auto_partitioned(&self) -> bool {
-        self.is_partitioned() && todo!()
+        self.is_partitioned()
+            && self
+                .table_config
+                .get_auto_partition_strategy()
+                .is_auto_partition_enabled()
     }
 
     pub fn get_partition_keys(&self) -> &[String] {
@@ -1161,6 +1235,7 @@ impl LakeSnapshot {
 #[cfg(test)]
 mod tests {
     use super::*;
+    use crate::metadata::DataTypes;
 
     #[test]
     fn test_validate() {
@@ -1195,8 +1270,7 @@ mod tests {
         assert_invalid_name(
             &invalid_long_name,
             &format!(
-                "the length of '{}' is longer than the max allowed length {}",
-                invalid_long_name, MAX_NAME_LENGTH
+                "the length of '{invalid_long_name}' is longer than the max allowed length {MAX_NAME_LENGTH}"
             ),
         );
     }
@@ -1205,8 +1279,7 @@ mod tests {
         let result = TablePath::detect_invalid_name(name);
         assert!(
             result.is_some(),
-            "Expected '{}' to be invalid, but it was valid",
-            name
+            "Expected '{name}' to be invalid, but it was valid"
         );
         assert!(
             result.as_ref().unwrap().contains(expected_message),
@@ -1215,4 +1288,97 @@ mod tests {
             result.unwrap()
         );
     }
+
+    #[test]
+    fn test_is_auto_partitioned() {
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .primary_key(vec!["id".to_string()])
+            .build()
+            .unwrap();
+
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+
+        // 1. Not partitioned, auto partition disabled
+        let mut properties = HashMap::new();
+        let table_info = TableInfo::new(
+            table_path.clone(),
+            1,
+            1,
+            schema.clone(),
+            vec!["id".to_string()],
+            vec![], // No partition keys
+            1,
+            properties.clone(),
+            HashMap::new(),
+            None,
+            0,
+            0,
+        );
+        assert!(!table_info.is_auto_partitioned());
+
+        // 2. Not partitioned, auto partition enabled
+        properties.insert(
+            "table.auto-partition.enabled".to_string(),
+            "true".to_string(),
+        );
+        let table_info = TableInfo::new(
+            table_path.clone(),
+            1,
+            1,
+            schema.clone(),
+            vec!["id".to_string()],
+            vec![], // No partition keys
+            1,
+            properties.clone(),
+            HashMap::new(),
+            None,
+            0,
+            0,
+        );
+        assert!(!table_info.is_auto_partitioned());
+
+        // 3. Partitioned, auto partition disabled
+        properties.insert(
+            "table.auto-partition.enabled".to_string(),
+            "false".to_string(),
+        );
+        let table_info = TableInfo::new(
+            table_path.clone(),
+            1,
+            1,
+            schema.clone(),
+            vec!["id".to_string()],
+            vec!["name".to_string()], // Partition keys
+            1,
+            properties.clone(),
+            HashMap::new(),
+            None,
+            0,
+            0,
+        );
+        assert!(!table_info.is_auto_partitioned());
+
+        // 4. Partitioned, auto partition enabled
+        properties.insert(
+            "table.auto-partition.enabled".to_string(),
+            "true".to_string(),
+        );
+        let table_info = TableInfo::new(
+            table_path.clone(),
+            1,
+            1,
+            schema.clone(),
+            vec!["id".to_string()],
+            vec!["name".to_string()], // Partition keys
+            1,
+            properties.clone(),
+            HashMap::new(),
+            None,
+            0,
+            0,
+        );
+        assert!(table_info.is_auto_partitioned());
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/util/partition.rs b/fluss-rust/crates/fluss/src/util/partition.rs
index 036cac46e2..ccc71a6b08 100644
--- a/fluss-rust/crates/fluss/src/util/partition.rs
+++ b/fluss-rust/crates/fluss/src/util/partition.rs
@@ -26,7 +26,7 @@ use std::fmt::Write;
 fn hex_string(bytes: &[u8]) -> String {
     let mut hex = String::with_capacity(bytes.len() * 2);
     for &b in bytes {
-        write!(hex, "{:02x}", b).unwrap();
+        write!(hex, "{b:02x}").unwrap();
     }
     hex
 }
@@ -84,7 +84,7 @@ fn milli_to_string(milli: i32) -> String {
         .div_euclid(MILLIS_PER_SECOND as i32);
     let ms = milli.rem_euclid(MILLIS_PER_SECOND as i32);
 
-    format!("{:02}-{:02}-{:02}_{:03}", hour, min, sec, ms)
+    format!("{hour:02}-{min:02}-{sec:02}_{ms:03}")
 }
 
 fn time_to_string(time: Time) -> String {

From 0fe410e163714b6a6f5b3c67c08ac445fcdd97d3 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Wed, 28 Jan 2026 21:52:02 +0800
Subject: [PATCH 094/287] chore: minor fix for rust code (#218)

---
 fluss-rust/crates/fluss/src/client/admin.rs   | 24 +++----
 .../crates/fluss/src/client/connection.rs     | 22 +++++--
 .../crates/fluss/src/client/metadata.rs       |  9 ++-
 .../fluss/src/client/write/accumulator.rs     | 18 ++---
 .../crates/fluss/src/client/write/sender.rs   |  2 +-
 .../crates/fluss/src/cluster/cluster.rs       | 27 ++++++--
 fluss-rust/crates/fluss/src/io/file_io.rs     |  4 +-
 .../src/record/kv/kv_record_batch_builder.rs  |  3 +-
 fluss-rust/crates/fluss/src/row/encode/mod.rs | 14 ++--
 .../crates/fluss/src/rpc/server_connection.rs | 65 +++++++++++++------
 fluss-rust/crates/fluss/src/util/mod.rs       |  2 +-
 .../crates/fluss/tests/integration/admin.rs   | 15 ++++-
 12 files changed, 136 insertions(+), 69 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index bffe0f5141..286c46c26a 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -47,14 +47,15 @@ pub struct FlussAdmin {
 
 impl FlussAdmin {
     pub async fn new(connections: Arc<RpcClient>, metadata: Arc<Metadata>) -> Result<Self> {
-        let admin_con = connections
-            .get_connection(
-                metadata
-                    .get_cluster()
-                    .get_coordinator_server()
-                    .expect("Couldn't coordinator server"),
-            )
-            .await?;
+        let admin_con =
+            connections
+                .get_connection(metadata.get_cluster().get_coordinator_server().ok_or_else(
+                    || Error::UnexpectedError {
+                        message: "Coordinator server not found in cluster metadata".to_string(),
+                        source: None,
+                    },
+                )?)
+                .await?;
 
         Ok(FlussAdmin {
             admin_gateway: admin_con,
@@ -211,7 +212,7 @@ impl FlussAdmin {
         database_name: &str,
         ignore_if_not_exists: bool,
         cascade: bool,
-    ) {
+    ) -> Result<()> {
         let _response = self
             .admin_gateway
             .request(DropDatabaseRequest::new(
@@ -219,7 +220,8 @@ impl FlussAdmin {
                 ignore_if_not_exists,
                 cascade,
             ))
-            .await;
+            .await?;
+        Ok(())
     }
 
     /// List all databases
@@ -298,7 +300,7 @@ impl FlussAdmin {
         }
 
         let cluster = self.metadata.get_cluster();
-        let table_id = cluster.get_table(table_path).table_id;
+        let table_id = cluster.get_table(table_path)?.table_id;
 
         // Prepare requests
         let requests_by_server =
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 0e41bbe756..a19dbd2f60 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -68,19 +68,31 @@ impl FlussConnection {
     }
 
     pub fn get_or_create_writer_client(&self) -> Result<Arc<WriterClient>> {
+        // 1. Fast path: Attempt to acquire a read lock to check if the client already exists.
         if let Some(client) = self.writer_client.read().as_ref() {
             return Ok(client.clone());
         }
 
-        // If not exists, create new one
-        let client = Arc::new(WriterClient::new(self.args.clone(), self.metadata.clone())?);
-        *self.writer_client.write() = Some(client.clone());
-        Ok(client)
+        // 2. Slow path: Acquire the write lock.
+        let mut writer_guard = self.writer_client.write();
+
+        // 3. Double-check: Another thread might have initialized the client
+        // while this thread was waiting for the write lock.
+        if let Some(client) = writer_guard.as_ref() {
+            return Ok(client.clone());
+        }
+
+        // 4. Initialize the client since we are certain it doesn't exist yet.
+        let new_client = Arc::new(WriterClient::new(self.args.clone(), self.metadata.clone())?);
+
+        // 5. Store and return the newly created client.
+        *writer_guard = Some(new_client.clone());
+        Ok(new_client)
     }
 
     pub async fn get_table(&self, table_path: &TablePath) -> Result<FlussTable<'_>> {
         self.metadata.update_table_metadata(table_path).await?;
-        let table_info = self.metadata.get_cluster().get_table(table_path).clone();
+        let table_info = self.metadata.get_cluster().get_table(table_path)?.clone();
         if table_info.is_partitioned() {
             return Err(crate::error::Error::UnsupportedOperation {
                 message: "Partitioned tables are not supported".to_string(),
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index 3c6730b545..614f6e7880 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -16,7 +16,7 @@
 // under the License.
 
 use crate::cluster::{Cluster, ServerNode, ServerType};
-use crate::error::Result;
+use crate::error::{Error, Result};
 use crate::metadata::{PhysicalTablePath, TableBucket, TablePath};
 use crate::proto::MetadataResponse;
 use crate::rpc::message::UpdateMetadataRequest;
@@ -45,7 +45,12 @@ impl Metadata {
     }
 
     async fn init_cluster(boot_strap: &str, connections: Arc<RpcClient>) -> Result<Cluster> {
-        let socket_address = boot_strap.parse::<SocketAddr>().unwrap();
+        let socket_address =
+            boot_strap
+                .parse::<SocketAddr>()
+                .map_err(|e| Error::IllegalArgument {
+                    message: format!("Invalid bootstrap address '{boot_strap}': {e}"),
+                })?;
         let server_node = ServerNode::new(
             -1,
             socket_address.ip().to_string(),
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 96114fb015..624e7c447b 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -96,9 +96,9 @@ impl RecordAccumulator {
         }
 
         let table_path = &record.table_path;
-        let table_info = cluster.get_table(table_path);
+        let table_info = cluster.get_table(table_path)?;
         let arrow_compression_info = table_info.get_table_config().get_arrow_compression_info()?;
-        let row_type = &cluster.get_table(table_path).row_type;
+        let row_type = &table_info.row_type;
 
         let schema_id = table_info.schema_id;
 
@@ -188,7 +188,7 @@ impl RecordAccumulator {
         self.append_new_batch(cluster, record, bucket_id, &mut dq_guard)
     }
 
-    pub async fn ready(&self, cluster: &Arc<Cluster>) -> ReadyCheckResult {
+    pub async fn ready(&self, cluster: &Arc<Cluster>) -> Result<ReadyCheckResult> {
         // Snapshot just the Arcs we need, avoiding cloning the entire BucketAndWriteBatches struct
         let entries: Vec<(TablePath, BucketBatches)> = self
             .write_batches
@@ -219,14 +219,14 @@ impl RecordAccumulator {
                     cluster,
                     next_ready_check_delay_ms,
                 )
-                .await
+                .await?
         }
 
-        ReadyCheckResult {
+        Ok(ReadyCheckResult {
             ready_nodes,
             next_ready_check_delay_ms,
             unknown_leader_tables,
-        }
+        })
     }
 
     async fn bucket_ready(
@@ -237,7 +237,7 @@ impl RecordAccumulator {
         unknown_leader_tables: &mut HashSet<TablePath>,
         cluster: &Cluster,
         next_ready_check_delay_ms: i64,
-    ) -> i64 {
+    ) -> Result<i64> {
         let mut next_delay = next_ready_check_delay_ms;
 
         for (bucket_id, batch) in bucket_batches {
@@ -250,7 +250,7 @@ impl RecordAccumulator {
             let waited_time_ms = batch.waited_time_ms(current_time_ms());
             let deque_size = batch_guard.len();
             let full = deque_size > 1 || batch.is_closed();
-            let table_bucket = cluster.get_table_bucket(table_path, bucket_id);
+            let table_bucket = cluster.get_table_bucket(table_path, bucket_id)?;
             if let Some(leader) = cluster.leader_for(&table_bucket) {
                 next_delay =
                     self.batch_ready(leader, waited_time_ms, full, ready_nodes, next_delay);
@@ -258,7 +258,7 @@ impl RecordAccumulator {
                 unknown_leader_tables.insert(table_path.clone());
             }
         }
-        next_delay
+        Ok(next_delay)
     }
 
     fn batch_ready(
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index 1ffda58230..905ef8052b 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -78,7 +78,7 @@ impl Sender {
 
     async fn run_once(&self) -> Result<()> {
         let cluster = self.metadata.get_cluster();
-        let ready_check_result = self.accumulator.ready(&cluster).await;
+        let ready_check_result = self.accumulator.ready(&cluster).await?;
 
         // Update metadata if needed
         if !ready_check_result.unknown_leader_tables.is_empty() {
diff --git a/fluss-rust/crates/fluss/src/cluster/cluster.rs b/fluss-rust/crates/fluss/src/cluster/cluster.rs
index 2484026a98..0b14fe67fd 100644
--- a/fluss-rust/crates/fluss/src/cluster/cluster.rs
+++ b/fluss-rust/crates/fluss/src/cluster/cluster.rs
@@ -17,7 +17,7 @@
 
 use crate::BucketId;
 use crate::cluster::{BucketLocation, ServerNode, ServerType};
-use crate::error::Result;
+use crate::error::{Error, Result};
 use crate::metadata::{
     JsonSerde, PhysicalTablePath, TableBucket, TableDescriptor, TableInfo, TablePath,
 };
@@ -188,7 +188,14 @@ impl Cluster {
             let table_id = table_metadata.table_id;
             let table_path = from_pb_table_path(&table_metadata.table_path);
             let table_descriptor = TableDescriptor::deserialize_json(
-                &serde_json::from_slice(table_metadata.table_json.as_slice()).unwrap(),
+                &serde_json::from_slice(table_metadata.table_json.as_slice()).map_err(|e| {
+                    Error::JsonSerdeError {
+                        message: format!(
+                            "Error deserializing table_json into TableDescriptor for table_id {} and table_path {}: {}",
+                            table_id, table_path, e
+                        )
+                    }
+                })?,
             )?;
             let table_info = TableInfo::of(
                 table_path.clone(),
@@ -261,9 +268,13 @@ impl Cluster {
         self.alive_tablet_servers_by_id.get(&id)
     }
 
-    pub fn get_table_bucket(&self, table_path: &TablePath, bucket_id: BucketId) -> TableBucket {
-        let table_info = self.get_table(table_path);
-        TableBucket::new(table_info.table_id, bucket_id)
+    pub fn get_table_bucket(
+        &self,
+        table_path: &TablePath,
+        bucket_id: BucketId,
+    ) -> Result<TableBucket> {
+        let table_info = self.get_table(table_path)?;
+        Ok(TableBucket::new(table_info.table_id, bucket_id))
     }
 
     pub fn get_bucket_locations_by_path(&self) -> &HashMap<TablePath, Vec<BucketLocation>> {
@@ -306,10 +317,12 @@ impl Cluster {
             .num_buckets
     }
 
-    pub fn get_table(&self, table_path: &TablePath) -> &TableInfo {
+    pub fn get_table(&self, table_path: &TablePath) -> Result<&TableInfo> {
         self.table_info_by_path
             .get(table_path)
-            .unwrap_or_else(|| panic!("can't find table info by path {table_path}"))
+            .ok_or_else(|| Error::InvalidTableError {
+                message: format!("Table info not found for {table_path}"),
+            })
     }
 
     pub fn opt_get_table(&self, table_path: &TablePath) -> Option<&TableInfo> {
diff --git a/fluss-rust/crates/fluss/src/io/file_io.rs b/fluss-rust/crates/fluss/src/io/file_io.rs
index e7b026df55..adca333f6b 100644
--- a/fluss-rust/crates/fluss/src/io/file_io.rs
+++ b/fluss-rust/crates/fluss/src/io/file_io.rs
@@ -39,8 +39,8 @@ pub struct FileIO {
 impl FileIO {
     /// Try to infer file io scheme from path.
     pub fn from_url(path: &str) -> Result<FileIOBuilder> {
-        let url = Url::parse(path).map_err(|_| Error::IllegalArgument {
-            message: format!("Invalid URL: {path}"),
+        let url = Url::parse(path).map_err(|e| Error::IllegalArgument {
+            message: format!("Invalid URL '{path}': {e}"),
         })?;
         Ok(FileIOBuilder::new(url.scheme()))
     }
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
index 0b65500fd4..837076482e 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
@@ -29,6 +29,7 @@ use crate::record::kv::kv_record_batch::{
 };
 use crate::record::kv::{CURRENT_KV_MAGIC_VALUE, NO_BATCH_SEQUENCE, NO_WRITER_ID};
 use bytes::{Bytes, BytesMut};
+use log::warn;
 use std::io;
 
 /// Builder for KvRecordBatch.
@@ -305,7 +306,7 @@ impl Drop for KvRecordBatchBuilder {
     fn drop(&mut self) {
         // Warn if the builder has records but was never built or was aborted
         if self.current_record_number > 0 && !self.aborted && self.built_buffer.is_none() {
-            eprintln!(
+            warn!(
                 "Warning: KvRecordBatchBuilder dropped with {} record(s) that were never built. \
                  Call build() to serialize the batch before dropping.",
                 self.current_record_number
diff --git a/fluss-rust/crates/fluss/src/row/encode/mod.rs b/fluss-rust/crates/fluss/src/row/encode/mod.rs
index 468d4d182b..d5cf8ace85 100644
--- a/fluss-rust/crates/fluss/src/row/encode/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/mod.rs
@@ -18,7 +18,7 @@
 mod compacted_key_encoder;
 mod compacted_row_encoder;
 
-use crate::error::Result;
+use crate::error::{Error, Result};
 use crate::metadata::{DataLakeFormat, KvFormat, RowType};
 use crate::row::encode::compacted_key_encoder::CompactedKeyEncoder;
 use crate::row::encode::compacted_row_encoder::CompactedRowEncoder;
@@ -48,15 +48,15 @@ impl KeyEncoderFactory {
         data_lake_format: &Option<DataLakeFormat>,
     ) -> Result<Box<dyn KeyEncoder>> {
         match data_lake_format {
-            Some(DataLakeFormat::Paimon) => {
-                unimplemented!("KeyEncoder for Paimon format is currently unimplemented")
-            }
+            Some(DataLakeFormat::Paimon) => Err(Error::UnsupportedOperation {
+                message: "KeyEncoder for Paimon format is not yet implemented".to_string(),
+            }),
             Some(DataLakeFormat::Lance) => Ok(Box::new(CompactedKeyEncoder::create_key_encoder(
                 row_type, key_fields,
             )?)),
-            Some(DataLakeFormat::Iceberg) => {
-                unimplemented!("KeyEncoder for Iceberg format is currently unimplemented")
-            }
+            Some(DataLakeFormat::Iceberg) => Err(Error::UnsupportedOperation {
+                message: "KeyEncoder for Iceberg format is not yet implemented".to_string(),
+            }),
             None => Ok(Box::new(CompactedKeyEncoder::create_key_encoder(
                 row_type, key_fields,
             )?)),
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index 441b175a24..7504e2a43b 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -26,6 +26,7 @@ use crate::rpc::message::{
 };
 use crate::rpc::transport::Transport;
 use futures::future::BoxFuture;
+use log::warn;
 use parking_lot::{Mutex, RwLock};
 use std::collections::HashMap;
 use std::io::Cursor;
@@ -66,29 +67,25 @@ impl RpcClient {
         server_node: &ServerNode,
     ) -> Result<ServerConnection, RpcError> {
         let server_id = server_node.uid();
-        let connection = {
+        {
             let connections = self.connections.read();
-            connections.get(server_id).cloned()
-        };
-
-        if let Some(conn) = connection {
-            if !conn.is_poisoned() {
-                return Ok(conn);
+            if let Some(conn) = connections.get(server_id).cloned() {
+                if !conn.is_poisoned() {
+                    return Ok(conn);
+                }
             }
         }
-
-        let new_server = match self.connect(server_node).await {
-            Ok(new_server) => new_server,
-            Err(e) => {
-                self.connections.write().remove(server_id);
-                return Err(e);
+        let new_server = self.connect(server_node).await?;
+        {
+            let mut connections = self.connections.write();
+            if let Some(race_conn) = connections.get(server_id) {
+                if !race_conn.is_poisoned() {
+                    return Ok(race_conn.clone());
+                }
             }
-        };
-
-        self.connections
-            .write()
-            .insert(server_id.clone(), new_server.clone());
 
+            connections.insert(server_id.clone(), new_server.clone());
+        }
         Ok(new_server)
     }
 
@@ -253,7 +250,7 @@ where
         R: RequestBody + Send + WriteVersionedType<Vec<u8>>,
         R::ResponseBody: ReadVersionedType<Cursor<Vec<u8>>>,
     {
-        let request_id = self.request_id.fetch_add(1, Ordering::SeqCst);
+        let request_id = self.request_id.fetch_add(1, Ordering::SeqCst) & 0x7FFFFFFF;
         let header = RequestHeader {
             request_api_key: R::API_KEY,
             request_api_version: ApiVersion(0),
@@ -290,7 +287,10 @@ where
 
         self.send_message(buf).await?;
         _cleanup_on_cancel.message_sent();
-        let mut response = rx.await.expect("Who closed this channel?!")?;
+        let mut response = rx.await.map_err(|e| Error::UnexpectedError {
+            message: "Got recvError, some one close the channel".to_string(),
+            source: Some(Box::new(e)),
+        })??;
 
         if let Some(error_response) = response.header.error_response {
             return Err(Error::FlussAPIError {
@@ -395,6 +395,31 @@ where
     }
 }
 
+impl<F> Drop for CancellationSafeFuture<F>
+where
+    F: Future + Send + 'static,
+{
+    fn drop(&mut self) {
+        // If the future hasn't finished yet, we must ensure it completes in the background.
+        // This prevents leaving half-sent messages on the wire if the caller cancels the request.
+        if let Some(fut) = self.inner.take() {
+            // Attempt to get a handle to the current Tokio runtime.
+            // This avoids a panic if the runtime has already shut down.
+            if let Ok(handle) = tokio::runtime::Handle::try_current() {
+                handle.spawn(async move {
+                    let _ = fut.await;
+                });
+            } else {
+                // Fallback: If no runtime is active, we cannot spawn.
+                // At this point, the future 'fut' will be dropped.
+                // Since the runtime is likely shutting down anyway,
+                // the underlying connection is probably being closed.
+                warn!("Tokio runtime not found during drop; background task cancelled.");
+            }
+        }
+    }
+}
+
 /// Helper that ensures that a request is removed when a request is cancelled before it was actually sent out.
 struct CleanupRequestStateOnCancel {
     state: Arc<Mutex<ConnectionState>>,
diff --git a/fluss-rust/crates/fluss/src/util/mod.rs b/fluss-rust/crates/fluss/src/util/mod.rs
index b987fe255d..ee8dde4a41 100644
--- a/fluss-rust/crates/fluss/src/util/mod.rs
+++ b/fluss-rust/crates/fluss/src/util/mod.rs
@@ -30,7 +30,7 @@ use std::time::{SystemTime, UNIX_EPOCH};
 pub fn current_time_ms() -> i64 {
     SystemTime::now()
         .duration_since(UNIX_EPOCH)
-        .unwrap()
+        .unwrap_or(std::time::Duration::ZERO)
         .as_millis() as i64
 }
 
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index 9842a5aa7e..e94b67c510 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -96,7 +96,10 @@ mod admin_test {
         assert_eq!(db_info.database_descriptor(), &db_descriptor);
 
         // drop database
-        admin.drop_database(db_name, false, true).await;
+        admin
+            .drop_database(db_name, false, true)
+            .await
+            .expect("should drop_database");
 
         // database shouldn't exist now
         assert_eq!(admin.database_exists(db_name).await.unwrap(), false);
@@ -218,7 +221,10 @@ mod admin_test {
         assert_eq!(admin.table_exists(&table_path).await.unwrap(), false);
 
         // drop database
-        admin.drop_database(test_db_name, false, true).await;
+        admin
+            .drop_database(test_db_name, false, true)
+            .await
+            .expect("Should drop database");
 
         // database shouldn't exist now
         assert_eq!(admin.database_exists(test_db_name).await.unwrap(), false);
@@ -361,7 +367,10 @@ mod admin_test {
             .drop_table(&table_path, true)
             .await
             .expect("Failed to drop table");
-        admin.drop_database(test_db_name, true, true).await;
+        admin
+            .drop_database(test_db_name, true, true)
+            .await
+            .expect("Should drop database");
     }
 
     #[tokio::test]

From 06b30c2a75a242cadf0e90a3e52fe162d3aa5078 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Thu, 29 Jan 2026 00:04:47 +0800
Subject: [PATCH 095/287] chore:  Fix async fn panic in CancellationSafeFuture
 when future completes

---
 fluss-rust/crates/fluss/src/rpc/server_connection.rs | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index 7504e2a43b..c8fe9ae393 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -385,9 +385,15 @@ where
         mut self: std::pin::Pin<&mut Self>,
         cx: &mut std::task::Context<'_>,
     ) -> Poll<Self::Output> {
-        match self.inner.as_mut().expect("no dropped").as_mut().poll(cx) {
+        let inner = self
+            .inner
+            .as_mut()
+            .expect("CancellationSafeFuture polled after completion");
+
+        match inner.as_mut().poll(cx) {
             Poll::Ready(res) => {
                 self.done = true;
+                self.inner = None; // Prevent re-polling
                 Poll::Ready(res)
             }
             Poll::Pending => Poll::Pending,

From 9ccf598226c746be3f708946f7ad7411aa5f5f56 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Thu, 29 Jan 2026 09:35:04 +0800
Subject: [PATCH 096/287] chore: support estimated_size_in_bytes for write
 batch (#219)

---
 .../fluss/src/client/write/accumulator.rs     |   4 +-
 .../crates/fluss/src/client/write/batch.rs    | 172 +++++++++++++++++-
 .../crates/fluss/src/cluster/cluster.rs       |   3 +-
 fluss-rust/crates/fluss/src/record/arrow.rs   |  26 +++
 4 files changed, 198 insertions(+), 7 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 624e7c447b..a5b983277f 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -311,7 +311,7 @@ impl RecordAccumulator {
         node: &ServerNode,
         max_size: i32,
     ) -> Result<Vec<ReadyWriteBatch>> {
-        let mut size = 0;
+        let mut size: usize = 0;
         let buckets = self.get_all_buckets_in_current_node(node, cluster);
         let mut ready = Vec::new();
 
@@ -354,7 +354,7 @@ impl RecordAccumulator {
                     if !batch_lock.is_empty() {
                         let first_batch = batch_lock.front().unwrap();
 
-                        if size + first_batch.estimated_size_in_bytes() > max_size as i64
+                        if size + first_batch.estimated_size_in_bytes() > max_size as usize
                             && !ready.is_empty()
                         {
                             // there is a rare case that a single batch size is larger than the request size
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index 78381c6e76..41561d4ac7 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -132,9 +132,11 @@ impl WriteBatch {
         }
     }
 
-    pub fn estimated_size_in_bytes(&self) -> i64 {
-        0
-        // todo: calculate estimated_size_in_bytes
+    pub fn estimated_size_in_bytes(&self) -> usize {
+        match self {
+            WriteBatch::ArrowLog(batch) => batch.estimated_size_in_bytes(),
+            WriteBatch::Kv(batch) => batch.estimated_size_in_bytes(),
+        }
     }
 
     pub fn is_closed(&self) -> bool {
@@ -245,6 +247,18 @@ impl ArrowLogWriteBatch {
     pub fn close(&mut self) {
         self.arrow_builder.close()
     }
+
+    /// Estimates how many bytes this batch occupies in the underlying buffer.
+    /// Once the batch has been built, the value is the exact length of the built bytes.
+    /// Before that, the estimate is delegated to the arrow builder.
+    pub fn estimated_size_in_bytes(&self) -> usize {
+        match self.built_records.as_ref() {
+            // Already built: report the real length of the built bytes.
+            Some(built) => built.len(),
+            // Not built yet: fall back to the arrow builder's estimate.
+            None => self.arrow_builder.estimated_size_in_bytes(),
+        }
+    }
 }
 
 pub struct KvWriteBatch {
@@ -340,11 +354,18 @@ impl KvWriteBatch {
     pub fn target_columns(&self) -> Option<&Arc<Vec<usize>>> {
         self.target_columns.as_ref()
     }
+
+    /// Get an estimate of the number of bytes written to the underlying buffer.
+    /// This returns the current size including header and all appended records.
+    pub fn estimated_size_in_bytes(&self) -> usize {
+        self.kv_batch_builder.get_size_in_bytes()
+    }
 }
 
 #[cfg(test)]
 mod tests {
     use super::*;
+    use crate::client::{RowBytes, WriteFormat};
     use crate::metadata::TablePath;
 
     #[test]
@@ -363,4 +384,149 @@ mod tests {
         batch.re_enqueued();
         assert_eq!(batch.attempts(), 1);
     }
+
+    #[test]
+    fn test_arrow_log_write_batch_estimated_size() {
+        use crate::client::WriteRecord;
+        use crate::compression::{
+            ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+        };
+        use crate::metadata::{DataField, DataTypes, RowType};
+        use crate::row::GenericRow;
+        use arrow::array::{Int32Array, RecordBatch, StringArray};
+        use std::sync::Arc;
+
+        let row_type = RowType::new(vec![
+            DataField::new("id".to_string(), DataTypes::int(), None),
+            DataField::new("name".to_string(), DataTypes::string(), None),
+        ]);
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+
+        // Case 1: row-by-row appends (to_append_record_batch=false)
+        {
+            let mut batch = ArrowLogWriteBatch::new(
+                1,
+                table_path.clone(),
+                1,
+                ArrowCompressionInfo {
+                    compression_type: ArrowCompressionType::None,
+                    compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+                },
+                &row_type,
+                0,
+                0,
+                false,
+            )
+            .unwrap();
+
+            // Append 200 identical rows so the batch holds a non-trivial payload
+            for _ in 0..200 {
+                let mut row = GenericRow::new(2);
+                row.set_field(0, 1_i32);
+                row.set_field(1, "hello");
+                let record = WriteRecord::for_append(Arc::new(table_path.clone()), 1, row);
+                batch.try_append(&record).unwrap();
+            }
+
+            let estimated_size = batch.estimated_size_in_bytes();
+            assert!(estimated_size > 0);
+
+            let built_data = batch.build().unwrap();
+            let actual_size = built_data.len();
+            // The estimate may over- or undershoot, so compare the absolute difference.
+            let diff = actual_size.abs_diff(estimated_size);
+            let threshold = actual_size / 10; // 10% tolerance relative to the built size
+            assert!(
+                diff <= threshold,
+                "RowAppend: estimated_size {estimated_size} and actual_size {actual_size} differ by more than 10%"
+            );
+        }
+
+        // Case 2: a single pre-built RecordBatch (to_append_record_batch=true)
+        {
+            let mut batch = ArrowLogWriteBatch::new(
+                1,
+                table_path.clone(),
+                1,
+                ArrowCompressionInfo {
+                    compression_type: ArrowCompressionType::None,
+                    compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+                },
+                &row_type,
+                0,
+                0,
+                true,
+            )
+            .unwrap();
+
+            // Create a pre-built RecordBatch with 200 rows matching `row_type`
+            let schema = crate::record::to_arrow_schema(&row_type).unwrap();
+            let ids: Vec<i32> = (0..200).collect();
+            let names: Vec<&str> = (0..200).map(|_| "hello").collect();
+            let record_batch = RecordBatch::try_new(
+                schema,
+                vec![
+                    Arc::new(Int32Array::from(ids)),
+                    Arc::new(StringArray::from(names)),
+                ],
+            )
+            .unwrap();
+
+            let record =
+                WriteRecord::for_append_record_batch(Arc::new(table_path.clone()), 1, record_batch);
+            batch.try_append(&record).unwrap();
+
+            let estimated_size = batch.estimated_size_in_bytes();
+            assert!(estimated_size > 0);
+
+            let built_data = batch.build().unwrap();
+            let actual_size = built_data.len();
+            // The estimate may over- or undershoot, so compare the absolute difference.
+            let diff = actual_size.abs_diff(estimated_size);
+            let threshold = actual_size / 10; // 10% tolerance relative to the built size
+            assert!(
+                diff <= threshold,
+                "Prebuilt: estimated_size {estimated_size} and actual_size {actual_size} differ by more than 10%"
+            );
+        }
+    }
+
+    #[test]
+    fn test_kv_write_batch_estimated_size() {
+        use crate::metadata::KvFormat;
+
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+
+        let mut batch = KvWriteBatch::new(
+            1,
+            table_path.clone(),
+            1,
+            KvWriteBatch::DEFAULT_WRITE_LIMIT,
+            KvFormat::COMPACTED,
+            0,
+            None,
+            0,
+        );
+
+        for _ in 0..200 {
+            let record = WriteRecord::for_upsert(
+                Arc::new(table_path.clone()),
+                1,
+                Bytes::from(vec![1_u8, 2_u8, 3_u8]),
+                None,
+                WriteFormat::CompactedKv,
+                None,
+                Some(RowBytes::Owned(Bytes::from(vec![1_u8, 2_u8, 3_u8]))),
+            );
+            batch.try_append(&record).unwrap();
+        }
+
+        let estimated_size = batch.estimated_size_in_bytes();
+        let actual_size = batch.build().unwrap().len();
+
+        assert_eq!(
+            actual_size, estimated_size,
+            "estimated size {estimated_size} is not equal to actual size"
+        );
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/cluster/cluster.rs b/fluss-rust/crates/fluss/src/cluster/cluster.rs
index 0b14fe67fd..d6fe0ae5d1 100644
--- a/fluss-rust/crates/fluss/src/cluster/cluster.rs
+++ b/fluss-rust/crates/fluss/src/cluster/cluster.rs
@@ -191,8 +191,7 @@ impl Cluster {
                 &serde_json::from_slice(table_metadata.table_json.as_slice()).map_err(|e| {
                     Error::JsonSerdeError {
                         message: format!(
-                            "Error deserializing table_json into TableDescriptor for table_id {} and table_path {}: {}",
-                            table_id, table_path, e
+                            "Error deserializing table_json into TableDescriptor for table_id {table_id} and table_path {table_path}: {e}"
                         )
                     }
                 })?,
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 63df6de67c..6340dc8022 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -175,6 +175,9 @@ pub trait ArrowRecordBatchInnerBuilder: Send + Sync {
     fn records_count(&self) -> i32;
 
     fn is_full(&self) -> bool;
+
+    /// Get an estimate of the size in bytes of the arrow data.
+    fn estimated_size_in_bytes(&self) -> usize;
 }
 
 #[derive(Default)]
@@ -214,6 +217,13 @@ impl ArrowRecordBatchInnerBuilder for PrebuiltRecordBatchBuilder {
         // full if has one record batch
         self.arrow_record_batch.is_some()
     }
+
+    fn estimated_size_in_bytes(&self) -> usize {
+        self.arrow_record_batch
+            .as_ref()
+            .map(|batch| batch.get_array_memory_size())
+            .unwrap_or(0)
+    }
 }
 
 pub struct RowAppendRecordBatchBuilder {
@@ -361,6 +371,16 @@ impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
     fn is_full(&self) -> bool {
         self.records_count() >= DEFAULT_MAX_RECORD
     }
+
+    fn estimated_size_in_bytes(&self) -> usize {
+        // Returns the uncompressed Arrow array memory size (same as Java's arrowWriter.estimatedSizeInBytes()).
+        // Note: This is the size before compression. After build(), the actual size may be smaller
+        // if compression is enabled.
+        self.arrow_column_builders
+            .iter()
+            .map(|builder| builder.finish_cloned().get_array_memory_size())
+            .sum()
+    }
 }
 
 impl MemoryLogRecordsArrowBuilder {
@@ -481,6 +501,12 @@ impl MemoryLogRecordsArrowBuilder {
         cursor.write_i32::<LittleEndian>(record_count)?;
         Ok(())
     }
+
+    /// Get an estimate of the number of bytes written to the underlying buffer.
+    /// This includes the batch header size plus the estimated arrow data size.
+    pub fn estimated_size_in_bytes(&self) -> usize {
+        RECORD_BATCH_HEADER_SIZE + self.arrow_record_batch_builder.estimated_size_in_bytes()
+    }
 }
 
 pub trait ToArrow {

From 2db8982a158972b2194400feb1684c6d537ba088 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 30 Jan 2026 09:34:55 +0800
Subject: [PATCH 097/287] feat: support scan from oss (#217)

---
 fluss-rust/crates/fluss/Cargo.toml            |  5 ++-
 .../crates/fluss/src/client/credentials.rs    | 28 +++++++++++-
 .../fluss/src/client/table/remote_log.rs      |  1 +
 fluss-rust/crates/fluss/src/io/mod.rs         |  5 +++
 fluss-rust/crates/fluss/src/io/storage.rs     | 15 ++++++-
 fluss-rust/crates/fluss/src/io/storage_oss.rs | 45 +++++++++++++++++++
 6 files changed, 95 insertions(+), 4 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/io/storage_oss.rs

diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 9aeee72db4..6b2707bee3 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -22,12 +22,13 @@ version = { workspace = true }
 name = "fluss"
 
 [features]
-default = ["storage-memory", "storage-fs", "storage-s3"]
-storage-all = ["storage-memory", "storage-fs", "storage-s3"]
+default = ["storage-memory", "storage-fs"]
+storage-all = ["storage-memory", "storage-fs", "storage-s3", "storage-oss"]
 
 storage-memory = ["opendal/services-memory"]
 storage-fs = ["opendal/services-fs"]
 storage-s3 = ["opendal/services-s3"]
+storage-oss = ["opendal/services-oss"]
 integration_tests = []
 
 [dependencies]
diff --git a/fluss-rust/crates/fluss/src/client/credentials.rs b/fluss-rust/crates/fluss/src/client/credentials.rs
index 93a536695a..a954e2a916 100644
--- a/fluss-rust/crates/fluss/src/client/credentials.rs
+++ b/fluss-rust/crates/fluss/src/client/credentials.rs
@@ -55,10 +55,14 @@ struct Credentials {
 /// needs_inversion is true for path_style_access -> enable_virtual_host_style conversion
 fn convert_hadoop_key_to_opendal(hadoop_key: &str) -> Option<(String, bool)> {
     match hadoop_key {
+        // S3 specific configurations
         "fs.s3a.endpoint" => Some(("endpoint".to_string(), false)),
         "fs.s3a.endpoint.region" => Some(("region".to_string(), false)),
         "fs.s3a.path.style.access" => Some(("enable_virtual_host_style".to_string(), true)),
         "fs.s3a.connection.ssl.enabled" => None,
+        // OSS specific configurations
+        "fs.oss.endpoint" => Some(("endpoint".to_string(), false)),
+        "fs.oss.region" => Some(("region".to_string(), false)),
         _ => None,
     }
 }
@@ -74,11 +78,20 @@ fn build_remote_fs_props(
         "access_key_id".to_string(),
         credentials.access_key_id.clone(),
     );
+
+    // S3 specific configurations
     props.insert(
         "secret_access_key".to_string(),
         credentials.access_key_secret.clone(),
     );
 
+    // OSS specific configurations, todo: consider refactor it
+    // to handle different conversion for different scheme in different method
+    props.insert(
+        "access_key_secret".to_string(),
+        credentials.access_key_secret.clone(),
+    );
+
     if let Some(token) = &credentials.security_token {
         props.insert("security_token".to_string(), token.clone());
     }
@@ -342,6 +355,7 @@ mod tests {
 
     #[test]
     fn convert_hadoop_key_to_opendal_maps_known_keys() {
+        // S3 keys
         let (key, invert) = convert_hadoop_key_to_opendal("fs.s3a.endpoint").expect("key");
         assert_eq!(key, "endpoint");
         assert!(!invert);
@@ -351,6 +365,17 @@ mod tests {
         assert!(invert);
 
         assert!(convert_hadoop_key_to_opendal("fs.s3a.connection.ssl.enabled").is_none());
+
+        // OSS keys
+        let (key, invert) = convert_hadoop_key_to_opendal("fs.oss.endpoint").expect("key");
+        assert_eq!(key, "endpoint");
+        assert!(!invert);
+
+        let (key, invert) = convert_hadoop_key_to_opendal("fs.oss.region").expect("key");
+        assert_eq!(key, "region");
+        assert!(!invert);
+
+        // Unknown key
         assert!(convert_hadoop_key_to_opendal("unknown.key").is_none());
     }
 
@@ -401,7 +426,8 @@ mod tests {
 
         let props = build_remote_fs_props(&credentials, &addition_infos);
         assert_eq!(props.get("access_key_id"), Some(&"ak".to_string()));
-        assert_eq!(props.get("secret_access_key"), Some(&"sk".to_string()));
+        assert_eq!(props.get("secret_access_key"), Some(&"sk".to_string())); // S3 key name
+        assert_eq!(props.get("access_key_secret"), Some(&"sk".to_string())); // OSS key name
         assert_eq!(props.get("security_token"), Some(&"token".to_string()));
         assert_eq!(
             props.get("enable_virtual_host_style"),
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index df747710f6..5583f89d5a 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -869,6 +869,7 @@ impl RemoteLogDownloader {
         // For S3/S3A URLs, inject S3 credentials from props
         let file_io_builder = if remote_log_tablet_dir.starts_with("s3://")
             || remote_log_tablet_dir.starts_with("s3a://")
+            || remote_log_tablet_dir.starts_with("oss://")
         {
             file_io_builder.with_props(
                 remote_fs_props
diff --git a/fluss-rust/crates/fluss/src/io/mod.rs b/fluss-rust/crates/fluss/src/io/mod.rs
index a03a394529..74265017aa 100644
--- a/fluss-rust/crates/fluss/src/io/mod.rs
+++ b/fluss-rust/crates/fluss/src/io/mod.rs
@@ -37,3 +37,8 @@ use storage_memory::*;
 mod storage_s3;
 #[cfg(feature = "storage-s3")]
 use storage_s3::*;
+
+#[cfg(feature = "storage-oss")]
+mod storage_oss;
+#[cfg(feature = "storage-oss")]
+use storage_oss::*;
diff --git a/fluss-rust/crates/fluss/src/io/storage.rs b/fluss-rust/crates/fluss/src/io/storage.rs
index d90eaa5711..a370861094 100644
--- a/fluss-rust/crates/fluss/src/io/storage.rs
+++ b/fluss-rust/crates/fluss/src/io/storage.rs
@@ -19,7 +19,6 @@ use crate::error;
 use crate::error::Result;
 use crate::io::FileIOBuilder;
 use opendal::{Operator, Scheme};
-use std::collections::HashMap;
 
 /// The storage carries all supported storage services in fluss
 #[derive(Debug)]
@@ -30,9 +29,12 @@ pub enum Storage {
     LocalFs,
     #[cfg(feature = "storage-s3")]
     S3 { props: HashMap<String, String> },
+    #[cfg(feature = "storage-oss")]
+    Oss { props: HashMap<String, String> },
 }
 
 impl Storage {
+    #[allow(unused_variables)]
     pub(crate) fn build(file_io_builder: FileIOBuilder) -> Result<Self> {
         let (scheme_str, props) = file_io_builder.into_parts();
         let scheme = Self::parse_scheme(&scheme_str)?;
@@ -44,6 +46,8 @@ impl Storage {
             Scheme::Fs => Ok(Self::LocalFs),
             #[cfg(feature = "storage-s3")]
             Scheme::S3 => Ok(Self::S3 { props }),
+            #[cfg(feature = "storage-oss")]
+            Scheme::Oss => Ok(Self::Oss { props }),
             _ => Err(error::Error::IoUnsupported {
                 message: format!("Unsupported storage feature {scheme_str}"),
             }),
@@ -79,6 +83,14 @@ impl Storage {
                 let op = super::s3_config_build(&s3_props)?;
                 Ok((op, key))
             }
+            #[cfg(feature = "storage-oss")]
+            Storage::Oss { props } => {
+                let (bucket, key) = super::parse_oss_path(path);
+                let mut oss_props = props.clone();
+                oss_props.insert("bucket".to_string(), bucket.to_string());
+                let op = super::oss_config_build(&oss_props)?;
+                Ok((op, key))
+            }
         }
     }
 
@@ -87,6 +99,7 @@ impl Storage {
             "memory" => Ok(Scheme::Memory),
             "file" | "" => Ok(Scheme::Fs),
             "s3" | "s3a" => Ok(Scheme::S3),
+            "oss" => Ok(Scheme::Oss),
             s => Ok(s.parse::<Scheme>()?),
         }
     }
diff --git a/fluss-rust/crates/fluss/src/io/storage_oss.rs b/fluss-rust/crates/fluss/src/io/storage_oss.rs
new file mode 100644
index 0000000000..3d5d05499a
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/io/storage_oss.rs
@@ -0,0 +1,45 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::Result;
+use opendal::Configurator;
+use opendal::Operator;
+use opendal::layers::TimeoutLayer;
+use opendal::services::OssConfig;
+use std::collections::HashMap;
+use std::time::Duration;
+
+pub(crate) fn oss_config_build(props: &HashMap<String, String>) -> Result<Operator> {
+    let config = OssConfig::from_iter(props.clone())?;
+    let op = Operator::from_config(config)?.finish();
+
+    // Add timeout layer to prevent hanging on OSS operations
+    let timeout_layer = TimeoutLayer::new()
+        .with_timeout(Duration::from_secs(10))
+        .with_io_timeout(Duration::from_secs(30));
+
+    Ok(op.layer(timeout_layer))
+}
+
+/// Splits `oss://bucket/key` into `(bucket, key)`; the key is empty when no `/` follows the bucket.
+pub(crate) fn parse_oss_path(path: &str) -> (&str, &str) {
+    // A path without the `oss://` scheme prefix is parsed as-is.
+    let rest = path.strip_prefix("oss://").unwrap_or(path);
+
+    // Cut at the first `/`: the left part is the bucket, the right part the object key.
+    rest.split_once('/').unwrap_or((rest, ""))
+}

From 80ac6fd47ba35009ad82b9498b1b902592ab295f Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Fri, 30 Jan 2026 08:08:25 +0000
Subject: [PATCH 098/287] feat: Implement partitioning in Upsert / Lookup
 (#220)

---
 fluss-rust/crates/examples/Cargo.toml         |   6 +-
 .../src/example_partitioned_kv_table.rs       | 153 +++++++++++++
 .../crates/examples/src/example_table.rs      |   1 +
 fluss-rust/crates/fluss/src/bucketing/mod.rs  |   1 -
 fluss-rust/crates/fluss/src/client/admin.rs   |   8 +-
 .../crates/fluss/src/client/connection.rs     |   5 -
 .../crates/fluss/src/client/metadata.rs       |  81 ++++++-
 .../crates/fluss/src/client/table/append.rs   |  23 +-
 .../src/client/table/log_fetch_buffer.rs      |   9 +-
 .../crates/fluss/src/client/table/lookup.rs   |  95 +++++---
 .../crates/fluss/src/client/table/mod.rs      |   2 +-
 .../crates/fluss/src/client/table/scanner.rs  |  19 +-
 .../crates/fluss/src/client/table/upsert.rs   |  39 +++-
 .../crates/fluss/src/client/table/writer.rs   |  55 -----
 .../fluss/src/client/write/accumulator.rs     | 128 +++++++----
 .../crates/fluss/src/client/write/batch.rs    |  72 ++++---
 .../fluss/src/client/write/bucket_assigner.rs |  16 +-
 .../crates/fluss/src/client/write/mod.rs      |  33 ++-
 .../crates/fluss/src/client/write/sender.rs   | 118 +++++++---
 .../fluss/src/client/write/writer_client.rs   |  47 ++--
 .../crates/fluss/src/cluster/cluster.rs       | 204 +++++++++++++-----
 fluss-rust/crates/fluss/src/cluster/mod.rs    |  13 +-
 fluss-rust/crates/fluss/src/error.rs          |   6 +
 .../crates/fluss/src/metadata/datatype.rs     |   9 +
 fluss-rust/crates/fluss/src/metadata/table.rs |  45 ++--
 fluss-rust/crates/fluss/src/record/arrow.rs   |  13 +-
 .../fluss/src/rpc/message/update_metadata.rs  |  26 ++-
 fluss-rust/crates/fluss/src/test_utils.rs     |  11 +-
 .../fluss/tests/integration/kv_table.rs       | 175 ++++++++++++++-
 29 files changed, 1071 insertions(+), 342 deletions(-)
 create mode 100644 fluss-rust/crates/examples/src/example_partitioned_kv_table.rs

diff --git a/fluss-rust/crates/examples/Cargo.toml b/fluss-rust/crates/examples/Cargo.toml
index 117ceb2708..16629bed16 100644
--- a/fluss-rust/crates/examples/Cargo.toml
+++ b/fluss-rust/crates/examples/Cargo.toml
@@ -33,4 +33,8 @@ path = "src/example_table.rs"
 
 [[example]]
 name = "example-upsert-lookup"
-path = "src/example_kv_table.rs"
\ No newline at end of file
+path = "src/example_kv_table.rs"
+
+[[example]]
+name = "example-partitioned-upsert-lookup"
+path = "src/example_partitioned_kv_table.rs"
\ No newline at end of file
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
new file mode 100644
index 0000000000..a5e76fa38e
--- /dev/null
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -0,0 +1,153 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use clap::Parser;
+use fluss::client::{FlussAdmin, FlussConnection, UpsertWriter};
+use fluss::config::Config;
+use fluss::error::Result;
+use fluss::metadata::{DataTypes, PartitionSpec, Schema, TableDescriptor, TablePath};
+use fluss::row::{GenericRow, InternalRow};
+use std::collections::HashMap;
+
+#[tokio::main]
+#[allow(dead_code)]
+pub async fn main() -> Result<()> {
+    let mut config = Config::parse();
+    config.bootstrap_server = Some("127.0.0.1:9123".to_string());
+
+    let conn = FlussConnection::new(config).await?;
+
+    let table_descriptor = TableDescriptor::builder()
+        .schema(
+            Schema::builder()
+                .column("id", DataTypes::int())
+                .column("region", DataTypes::string())
+                .column("zone", DataTypes::bigint())
+                .column("score", DataTypes::bigint())
+                .primary_key(vec![
+                    "id".to_string(),
+                    "region".to_string(),
+                    "zone".to_string(),
+                ])
+                .build()?,
+        )
+        .partitioned_by(vec!["region".to_string(), "zone".to_string()])
+        .build()?;
+
+    let table_path = TablePath::new("fluss".to_owned(), "partitioned_kv_example".to_owned());
+
+    let mut admin = conn.get_admin().await?;
+    admin
+        .create_table(&table_path, &table_descriptor, true)
+        .await?;
+    println!(
+        "Created KV Table:\n {}\n",
+        admin.get_table(&table_path).await?
+    );
+
+    create_partition(&table_path, &mut admin, "APAC", 1).await;
+    create_partition(&table_path, &mut admin, "EMEA", 2).await;
+    create_partition(&table_path, &mut admin, "US", 3).await;
+
+    let table = conn.get_table(&table_path).await?;
+    let table_upsert = table.new_upsert()?;
+    let mut upsert_writer = table_upsert.create_writer()?;
+
+    println!("\n=== Upserting ===");
+    for (id, region, zone, score) in [
+        (1001, "APAC", 1i64, 1234i64),
+        (1002, "EMEA", 2, 2234),
+        (1003, "US", 3, 3234),
+    ] {
+        let mut row = GenericRow::new(4);
+        row.set_field(0, id);
+        row.set_field(1, region);
+        row.set_field(2, zone);
+        row.set_field(3, score);
+        upsert_writer.upsert(&row).await?;
+        println!("Upserted: {row:?}");
+    }
+
+    println!("\n=== Looking up ===");
+    let mut lookuper = table.new_lookup()?.create_lookuper()?;
+
+    for (id, region, zone) in [(1001, "APAC", 1i64), (1002, "EMEA", 2), (1003, "US", 3)] {
+        let result = lookuper
+            .lookup(&make_key(id, region, zone))
+            .await
+            .expect("lookup");
+        let row = result.get_single_row()?.unwrap();
+        println!(
+            "Found id={id}: region={}, zone={}, score={}",
+            row.get_string(1),
+            row.get_long(2),
+            row.get_long(3)
+        );
+    }
+
+    println!("\n=== Updating ===");
+    let mut row = GenericRow::new(4);
+    row.set_field(0, 1001);
+    row.set_field(1, "APAC");
+    row.set_field(2, 1i64);
+    row.set_field(3, 4321i64);
+    upsert_writer.upsert(&row).await?;
+    println!("Updated: {row:?}");
+
+    let result = lookuper.lookup(&make_key(1001, "APAC", 1)).await?;
+    let row = result.get_single_row()?.unwrap();
+    println!(
+        "Verified update: region={}, zone={}",
+        row.get_string(1),
+        row.get_long(2)
+    );
+
+    println!("\n=== Deleting ===");
+    let mut row = GenericRow::new(4);
+    row.set_field(0, 1002);
+    row.set_field(1, "EMEA");
+    row.set_field(2, 2i64);
+    upsert_writer.delete(&row).await?;
+    println!("Deleted: {row:?}");
+
+    let result = lookuper.lookup(&make_key(1002, "EMEA", 2)).await?;
+    if result.get_single_row()?.is_none() {
+        println!("Verified deletion");
+    }
+
+    Ok(())
+}
+
+async fn create_partition(table_path: &TablePath, admin: &mut FlussAdmin, region: &str, zone: i64) {
+    let mut partition_values = HashMap::new();
+    partition_values.insert("region".to_string(), region.to_string());
+    partition_values.insert("zone".to_string(), zone.to_string());
+    let partition_spec = PartitionSpec::new(partition_values);
+
+    admin
+        .create_partition(table_path, &partition_spec, true)
+        .await
+        .unwrap();
+}
+
+fn make_key(id: i32, region: &str, zone: i64) -> GenericRow<'static> {
+    let mut row = GenericRow::new(4);
+    row.set_field(0, id);
+    row.set_field(1, region.to_string());
+    row.set_field(2, zone);
+    row
+}
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index ca6b942861..92055a702b 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 mod example_kv_table;
+mod example_partitioned_kv_table;
 
 use clap::Parser;
 use fluss::client::FlussConnection;
diff --git a/fluss-rust/crates/fluss/src/bucketing/mod.rs b/fluss-rust/crates/fluss/src/bucketing/mod.rs
index 2611ac7ecf..1b43d12a23 100644
--- a/fluss-rust/crates/fluss/src/bucketing/mod.rs
+++ b/fluss-rust/crates/fluss/src/bucketing/mod.rs
@@ -24,7 +24,6 @@ pub trait BucketingFunction: Sync + Send {
     fn bucketing(&self, bucket_key: &[u8], num_buckets: i32) -> Result<i32>;
 }
 
-#[allow(dead_code)]
 impl dyn BucketingFunction {
     /// Provides the bucketing function for a given [DataLakeFormat]
     ///
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 286c46c26a..ea1efc3810 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -32,7 +32,7 @@ use crate::rpc::{RpcClient, ServerConnection};
 use crate::error::{Error, Result};
 use crate::proto::GetTableInfoResponse;
 use crate::{BucketId, PartitionId, TableId};
-use std::collections::HashMap;
+use std::collections::{HashMap, HashSet};
 use std::slice::from_ref;
 use std::sync::Arc;
 use tokio::task::JoinHandle;
@@ -111,6 +111,12 @@ impl FlussAdmin {
             .admin_gateway
             .request(GetTableRequest::new(table_path))
             .await?;
+
+        // force update to avoid stale data in cache
+        self.metadata
+            .update_tables_metadata(&HashSet::from([table_path]), &HashSet::new(), vec![])
+            .await?;
+
         let GetTableInfoResponse {
             table_id,
             schema_id,
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index a19dbd2f60..e021011807 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -93,11 +93,6 @@ impl FlussConnection {
     pub async fn get_table(&self, table_path: &TablePath) -> Result<FlussTable<'_>> {
         self.metadata.update_table_metadata(table_path).await?;
         let table_info = self.metadata.get_cluster().get_table(table_path)?.clone();
-        if table_info.is_partitioned() {
-            return Err(crate::error::Error::UnsupportedOperation {
-                message: "Partitioned tables are not supported".to_string(),
-            });
-        }
         Ok(FlussTable::new(self, self.metadata.clone(), table_info))
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index 614f6e7880..52ccd62e43 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -58,7 +58,14 @@ impl Metadata {
             ServerType::CoordinatorServer,
         );
         let con = connections.get_connection(&server_node).await?;
-        let response = con.request(UpdateMetadataRequest::new(&[])).await?;
+
+        let response = con
+            .request(UpdateMetadataRequest::new(
+                &HashSet::default(),
+                &HashSet::new(),
+                vec![],
+            ))
+            .await?;
         Cluster::from_metadata_response(response, None)
     }
 
@@ -95,7 +102,12 @@ impl Metadata {
         Ok(())
     }
 
-    pub async fn update_tables_metadata(&self, table_paths: &HashSet<&TablePath>) -> Result<()> {
+    pub async fn update_tables_metadata(
+        &self,
+        table_paths: &HashSet<&TablePath>,
+        physical_table_paths: &HashSet<&Arc<PhysicalTablePath>>,
+        partition_ids: Vec<i64>,
+    ) -> Result<()> {
         let maybe_server = {
             let guard = self.cluster.read();
             guard.get_one_available_server().cloned()
@@ -114,16 +126,19 @@ impl Metadata {
 
         let conn = self.connections.get_connection(&server).await?;
 
-        let update_table_paths: Vec<&TablePath> = table_paths.iter().copied().collect();
         let response = conn
-            .request(UpdateMetadataRequest::new(update_table_paths.as_slice()))
+            .request(UpdateMetadataRequest::new(
+                table_paths,
+                physical_table_paths,
+                partition_ids,
+            ))
             .await?;
         self.update(response).await?;
         Ok(())
     }
 
     pub async fn update_table_metadata(&self, table_path: &TablePath) -> Result<()> {
-        self.update_tables_metadata(&HashSet::from([table_path]))
+        self.update_tables_metadata(&HashSet::from([table_path]), &HashSet::new(), vec![])
             .await
     }
 
@@ -133,8 +148,9 @@ impl Metadata {
             .iter()
             .filter(|table_path| cluster_binding.opt_get_table(table_path).is_none())
             .collect();
+
         if !need_update_table_paths.is_empty() {
-            self.update_tables_metadata(&need_update_table_paths)
+            self.update_tables_metadata(&need_update_table_paths, &HashSet::new(), vec![])
                 .await?;
         }
         Ok(())
@@ -150,7 +166,48 @@ impl Metadata {
         guard.clone()
     }
 
-    pub fn leader_for(&self, table_bucket: &TableBucket) -> Option<ServerNode> {
+    /// Upper bound on metadata refreshes attempted by `leader_for` on a cache miss.
+    const MAX_RETRY_TIMES: u8 = 3;
+
+    /// Resolves the leader of `table_bucket`, refreshing metadata when it is not cached.
+    ///
+    /// The cached cluster is consulted first. On a miss, metadata for `table_path`
+    /// (plus the bucket's partition id, if it has one) is re-requested up to
+    /// `MAX_RETRY_TIMES` times, re-checking the cluster after every refresh.
+    ///
+    /// Returns `Ok(None)` if no leader is known after the last refresh; a failed
+    /// metadata update is propagated as `Err` immediately.
+    pub async fn leader_for(
+        &self,
+        table_path: &TablePath,
+        table_bucket: &TableBucket,
+    ) -> Result<Option<ServerNode>> {
+        // Fast path: the leader is already present in the cached cluster.
+        if let Some(cached) = self.get_leader_for(table_bucket) {
+            return Ok(Some(cached));
+        }
+
+        for _ in 0..Self::MAX_RETRY_TIMES {
+            // Only a bucket that carries a partition id contributes one to the request.
+            let partition_ids: Vec<_> = table_bucket.partition_id().into_iter().collect();
+            self.update_tables_metadata(
+                &HashSet::from([table_path]),
+                &HashSet::new(),
+                partition_ids,
+            )
+            .await?;
+
+            // Look the bucket up again now that the metadata update has completed.
+            if let Some(refreshed) = self.get_leader_for(table_bucket) {
+                return Ok(Some(refreshed));
+            }
+        }
+
+        // Every refresh came back without a leader for this bucket.
+        Ok(None)
+    }
+
+    fn get_leader_for(&self, table_bucket: &TableBucket) -> Option<ServerNode> {
         let cluster = self.cluster.read();
         cluster.leader_for(table_bucket).cloned()
     }
@@ -173,14 +230,16 @@ mod tests {
     use crate::metadata::{TableBucket, TablePath};
     use crate::test_utils::build_cluster_arc;
 
-    #[test]
-    fn leader_for_returns_server() {
+    #[tokio::test]
+    async fn leader_for_returns_server() {
         let table_path = TablePath::new("db".to_string(), "tbl".to_string());
         let cluster = build_cluster_arc(&table_path, 1, 1);
         let metadata = Metadata::new_for_test(cluster);
         let leader = metadata
-            .leader_for(&TableBucket::new(1, 0))
-            .expect("leader");
+            .leader_for(&table_path, &TableBucket::new(1, 0))
+            .await
+            .expect("leader request should be Ok")
+            .expect("leader should exist");
         assert_eq!(leader.id(), 1);
     }
 
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
index 6d76f28b32..7fe2023bbb 100644
--- a/fluss-rust/crates/fluss/src/client/table/append.rs
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -17,7 +17,7 @@
 
 use crate::client::{WriteRecord, WriterClient};
 use crate::error::Result;
-use crate::metadata::{TableInfo, TablePath};
+use crate::metadata::{PhysicalTablePath, TableInfo, TablePath};
 use crate::row::GenericRow;
 use arrow::array::RecordBatch;
 use std::sync::Arc;
@@ -25,14 +25,14 @@ use std::sync::Arc;
 #[allow(dead_code)]
 pub struct TableAppend {
     table_path: TablePath,
-    table_info: TableInfo,
+    table_info: Arc<TableInfo>,
     writer_client: Arc<WriterClient>,
 }
 
 impl TableAppend {
     pub(super) fn new(
         table_path: TablePath,
-        table_info: TableInfo,
+        table_info: Arc<TableInfo>,
         writer_client: Arc<WriterClient>,
     ) -> Self {
         Self {
@@ -44,23 +44,27 @@ impl TableAppend {
 
     pub fn create_writer(&self) -> AppendWriter {
         AppendWriter {
-            table_path: Arc::new(self.table_path.clone()),
+            physical_table_path: Arc::new(PhysicalTablePath::of(Arc::new(self.table_path.clone()))),
             writer_client: self.writer_client.clone(),
-            table_info: Arc::new(self.table_info.clone()),
+            table_info: Arc::clone(&self.table_info),
         }
     }
 }
 
 pub struct AppendWriter {
-    table_path: Arc<TablePath>,
+    physical_table_path: Arc<PhysicalTablePath>,
     writer_client: Arc<WriterClient>,
     table_info: Arc<TableInfo>,
 }
 
 impl AppendWriter {
     pub async fn append(&self, row: GenericRow<'_>) -> Result<()> {
-        let record =
-            WriteRecord::for_append(self.table_path.clone(), self.table_info.schema_id, row);
+        let record = WriteRecord::for_append(
+            Arc::clone(&self.table_info),
+            Arc::clone(&self.physical_table_path),
+            self.table_info.schema_id,
+            row,
+        );
         let result_handle = self.writer_client.send(&record).await?;
         let result = result_handle.wait().await?;
         result_handle.result(result)
@@ -68,7 +72,8 @@ impl AppendWriter {
 
     pub async fn append_arrow_batch(&self, batch: RecordBatch) -> Result<()> {
         let record = WriteRecord::for_append_record_batch(
-            self.table_path.clone(),
+            Arc::clone(&self.table_info),
+            Arc::clone(&self.physical_table_path),
             self.table_info.schema_id,
             batch,
         );
diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index 7ece34b478..78ee065a4d 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -833,9 +833,10 @@ mod tests {
     use crate::compression::{
         ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
     };
-    use crate::metadata::{DataField, DataTypes, RowType, TablePath};
+    use crate::metadata::{DataField, DataTypes, PhysicalTablePath, RowType, TablePath};
     use crate::record::{MemoryLogRecordsArrowBuilder, ReadContext, to_arrow_schema};
     use crate::row::GenericRow;
+    use crate::test_utils::build_table_info;
     use std::sync::Arc;
 
     fn test_read_context() -> Result<ReadContext> {
@@ -899,7 +900,9 @@ mod tests {
             DataField::new("id".to_string(), DataTypes::int(), None),
             DataField::new("name".to_string(), DataTypes::string(), None),
         ]);
-        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path)));
 
         let mut builder = MemoryLogRecordsArrowBuilder::new(
             1,
@@ -914,7 +917,7 @@ mod tests {
         let mut row = GenericRow::new(2);
         row.set_field(0, 1_i32);
         row.set_field(1, "alice");
-        let record = WriteRecord::for_append(table_path, 1, row);
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, row);
         builder.append(&record)?;
 
         let data = builder.build()?;
diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index 4e89176a61..69cb91efa7 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -18,8 +18,9 @@
 use crate::bucketing::BucketingFunction;
 use crate::client::connection::FlussConnection;
 use crate::client::metadata::Metadata;
+use crate::client::table::partition_getter::PartitionGetter;
 use crate::error::{Error, Result};
-use crate::metadata::{RowType, TableBucket, TableInfo};
+use crate::metadata::{PhysicalTablePath, RowType, TableBucket, TableInfo, TablePath};
 use crate::record::kv::SCHEMA_ID_LENGTH;
 use crate::row::InternalRow;
 use crate::row::compacted::CompactedRow;
@@ -133,20 +134,43 @@ impl<'a> TableLookup<'a> {
         let data_lake_format = self.table_info.get_table_config().get_datalake_format()?;
         let bucketing_function = <dyn BucketingFunction>::of(data_lake_format.as_ref());
 
-        // Create key encoder for the primary key fields
-        let pk_fields = self.table_info.get_physical_primary_keys().to_vec();
-        let key_encoder = KeyEncoderFactory::of(
-            self.table_info.row_type(),
-            pk_fields.as_slice(),
-            &data_lake_format,
-        )?;
+        let row_type = self.table_info.row_type();
+        let primary_keys = self.table_info.get_primary_keys();
+        let lookup_row_type = row_type.project_with_field_names(primary_keys)?;
+
+        let physical_primary_keys = self.table_info.get_physical_primary_keys().to_vec();
+        let primary_key_encoder =
+            KeyEncoderFactory::of(&lookup_row_type, &physical_primary_keys, &data_lake_format)?;
+
+        let bucket_key_encoder = if self.table_info.is_default_bucket_key() {
+            None
+        } else {
+            let bucket_keys = self.table_info.get_bucket_keys().to_vec();
+            Some(KeyEncoderFactory::of(
+                &lookup_row_type,
+                &bucket_keys,
+                &data_lake_format,
+            )?)
+        };
+
+        let partition_getter = if self.table_info.is_partitioned() {
+            Some(PartitionGetter::new(
+                &lookup_row_type,
+                Arc::clone(self.table_info.get_partition_keys()),
+            )?)
+        } else {
+            None
+        };
 
         Ok(Lookuper {
             conn: self.conn,
+            table_path: Arc::new(self.table_info.table_path.clone()),
             table_info: self.table_info,
             metadata: self.metadata,
             bucketing_function,
-            key_encoder,
+            primary_key_encoder,
+            bucket_key_encoder,
+            partition_getter,
             num_buckets,
         })
     }
@@ -163,13 +187,15 @@ impl<'a> TableLookup<'a> {
 /// let row = GenericRow::new(vec![Datum::Int32(42)]); // lookup key
 /// let result = lookuper.lookup(&row).await?;
 /// ```
-// TODO: Support partitioned tables (extract partition from key)
 pub struct Lookuper<'a> {
     conn: &'a FlussConnection,
     table_info: TableInfo,
+    table_path: Arc<TablePath>,
     metadata: Arc<Metadata>,
     bucketing_function: Box<dyn BucketingFunction>,
-    key_encoder: Box<dyn KeyEncoder>,
+    primary_key_encoder: Box<dyn KeyEncoder>,
+    bucket_key_encoder: Option<Box<dyn KeyEncoder>>,
+    partition_getter: Option<PartitionGetter>,
     num_buckets: i32,
 }
 
@@ -187,26 +213,47 @@ impl<'a> Lookuper<'a> {
     /// * `Err(Error)` - If the lookup fails
     pub async fn lookup(&mut self, row: &dyn InternalRow) -> Result<LookupResult<'_>> {
         // todo: support batch lookup
-        // Encode the key from the row
-        let encoded_key = self.key_encoder.encode_key(row)?;
-        let key_bytes = encoded_key.to_vec();
+        let pk_bytes = self.primary_key_encoder.encode_key(row)?;
+        let pk_bytes_vec = pk_bytes.to_vec();
+        let bk_bytes = match &mut self.bucket_key_encoder {
+            Some(encoder) => &encoder.encode_key(row)?,
+            None => &pk_bytes,
+        };
+
+        let partition_id = if let Some(ref partition_getter) = self.partition_getter {
+            let partition_name = partition_getter.get_partition(row)?;
+            let physical_table_path = PhysicalTablePath::of_partitioned(
+                Arc::clone(&self.table_path),
+                Some(partition_name),
+            );
+            let cluster = self.metadata.get_cluster();
+            match cluster.get_partition_id(&physical_table_path) {
+                Some(id) => Some(id),
+                None => {
+                    // Partition doesn't exist, return empty result (like Java)
+                    return Ok(LookupResult::empty(self.table_info.row_type()));
+                }
+            }
+        } else {
+            None
+        };
 
-        // Compute bucket from encoded key
         let bucket_id = self
             .bucketing_function
-            .bucketing(&key_bytes, self.num_buckets)?;
+            .bucketing(bk_bytes, self.num_buckets)?;
 
         let table_id = self.table_info.get_table_id();
-        let table_bucket = TableBucket::new(table_id, bucket_id);
+        let table_bucket = TableBucket::new_with_partition(table_id, partition_id, bucket_id);
 
         // Find the leader for this bucket
         let cluster = self.metadata.get_cluster();
-        let leader =
-            cluster
-                .leader_for(&table_bucket)
-                .ok_or_else(|| Error::LeaderNotAvailable {
-                    message: format!("No leader found for table bucket: {table_bucket}"),
-                })?;
+        let leader = self
+            .metadata
+            .leader_for(self.table_path.as_ref(), &table_bucket)
+            .await?
+            .ok_or_else(|| Error::LeaderNotAvailable {
+                message: format!("No leader found for table bucket: {table_bucket}"),
+            })?;
 
         // Get connection to the tablet server
         let tablet_server =
@@ -223,7 +270,7 @@ impl<'a> Lookuper<'a> {
         let connection = connections.get_connection(tablet_server).await?;
 
         // Send lookup request
-        let request = LookupRequest::new(table_id, None, bucket_id, vec![key_bytes]);
+        let request = LookupRequest::new(table_id, partition_id, bucket_id, vec![pk_bytes_vec]);
         let response = connection.request(request).await?;
 
         // Extract the values from response
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 2dc56d52d2..2fbbbc917f 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -69,7 +69,7 @@ impl<'a> FlussTable<'a> {
     pub fn new_append(&self) -> Result<TableAppend> {
         Ok(TableAppend::new(
             self.table_path.clone(),
-            self.table_info.clone(),
+            Arc::new(self.table_info.clone()),
             self.conn.get_or_create_writer_client()?,
         ))
     }
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 356ba1cdb4..14d2841124 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -630,7 +630,7 @@ impl LogFetcher {
         if self.is_partitioned {
             // Fallback to full table metadata refresh until partition-aware updates are available.
             self.metadata
-                .update_tables_metadata(&HashSet::from([&self.table_path]))
+                .update_tables_metadata(&HashSet::from([&self.table_path]), &HashSet::new(), vec![])
                 .await
                 .or_else(|e| {
                     if let Error::RpcError { source, .. } = &e
@@ -649,7 +649,7 @@ impl LogFetcher {
 
         // TODO: Handle PartitionNotExist error
         self.metadata
-            .update_tables_metadata(&HashSet::from([&self.table_path]))
+            .update_tables_metadata(&HashSet::from([&self.table_path]), &HashSet::new(), vec![])
             .await
             .or_else(|e| {
                 if let Error::RpcError { source, .. } = &e
@@ -799,8 +799,9 @@ impl LogFetcher {
                         let table_id = table_bucket.table_id();
                         let cluster = metadata.get_cluster();
                         if let Some(table_path) = cluster.get_table_path_by_id(table_id) {
-                            let physical_tables =
-                                HashSet::from([PhysicalTablePath::of(table_path.clone())]);
+                            let physical_tables = HashSet::from([PhysicalTablePath::of(Arc::new(
+                                table_path.clone(),
+                            ))]);
                             metadata.invalidate_physical_table_meta(&physical_tables);
                         } else {
                             warn!(
@@ -1498,7 +1499,7 @@ mod tests {
     use crate::compression::{
         ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
     };
-    use crate::metadata::{TableInfo, TablePath};
+    use crate::metadata::{PhysicalTablePath, TableInfo, TablePath};
     use crate::record::MemoryLogRecordsArrowBuilder;
     use crate::row::{Datum, GenericRow};
     use crate::rpc::FlussError;
@@ -1514,8 +1515,10 @@ mod tests {
                 compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
             },
         )?;
+        let physical_table_path = Arc::new(PhysicalTablePath::of(table_path));
         let record = WriteRecord::for_append(
-            table_path,
+            Arc::new(table_info.clone()),
+            physical_table_path,
             1,
             GenericRow {
                 values: vec![Datum::Int32(1)],
@@ -1684,7 +1687,7 @@ mod tests {
         )?;
 
         let bucket = TableBucket::new(1, 0);
-        assert!(metadata.leader_for(&bucket).is_some());
+        assert!(metadata.leader_for(&table_path, &bucket).await?.is_some());
 
         let response = crate::proto::FetchLogResponse {
             tables_resp: vec![crate::proto::PbFetchLogRespForTable {
@@ -1713,7 +1716,7 @@ mod tests {
 
         LogFetcher::handle_fetch_response(response, response_context).await;
 
-        assert!(metadata.leader_for(&bucket).is_none());
+        assert!(metadata.get_cluster().leader_for(&bucket).is_none());
         Ok(())
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/table/upsert.rs b/fluss-rust/crates/fluss/src/client/table/upsert.rs
index 984592d06e..269d5258f8 100644
--- a/fluss-rust/crates/fluss/src/client/table/upsert.rs
+++ b/fluss-rust/crates/fluss/src/client/table/upsert.rs
@@ -19,12 +19,13 @@ use crate::client::table::writer::{DeleteResult, TableWriter, UpsertResult, Upse
 use crate::client::{RowBytes, WriteFormat, WriteRecord, WriterClient};
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::{KvFormat, RowType, TableInfo, TablePath};
+use crate::metadata::{PhysicalTablePath, RowType, TableInfo, TablePath};
 use crate::row::InternalRow;
 use crate::row::encode::{KeyEncoder, KeyEncoderFactory, RowEncoder, RowEncoderFactory};
 use crate::row::field_getter::FieldGetter;
 use std::sync::Arc;
 
+use crate::client::table::partition_getter::PartitionGetter;
 use bitvec::prelude::bitvec;
 use bytes::Bytes;
 
@@ -107,30 +108,25 @@ impl TableUpsert {
     }
 }
 
-#[allow(dead_code)]
 struct UpsertWriterImpl<RE>
 where
     RE: RowEncoder,
 {
     table_path: Arc<TablePath>,
     writer_client: Arc<WriterClient>,
-    // TODO: Partitioning
-    // partition_field_getter: Option<Box<dyn KeyEncoder>>,
+    partition_field_getter: Option<PartitionGetter>,
     primary_key_encoder: Box<dyn KeyEncoder>,
     target_columns: Option<Arc<Vec<usize>>>,
     // Use primary key encoder as bucket key encoder when None
     bucket_key_encoder: Option<Box<dyn KeyEncoder>>,
-    kv_format: KvFormat,
     write_format: WriteFormat,
     row_encoder: RE,
     field_getters: Box<[FieldGetter]>,
     table_info: Arc<TableInfo>,
 }
 
-#[allow(dead_code)]
 struct UpsertWriterFactory;
 
-#[allow(dead_code)]
 impl UpsertWriterFactory {
     pub fn create(
         table_path: Arc<TablePath>,
@@ -168,13 +164,22 @@ impl UpsertWriterFactory {
 
         let field_getters = FieldGetter::create_field_getters(row_type);
 
+        let partition_field_getter = if table_info.is_partitioned() {
+            Some(PartitionGetter::new(
+                row_type,
+                Arc::clone(table_info.get_partition_keys()),
+            )?)
+        } else {
+            None
+        };
+
         Ok(UpsertWriterImpl {
             table_path,
+            partition_field_getter,
             writer_client,
             primary_key_encoder,
             target_columns: partial_update_columns,
             bucket_key_encoder,
-            kv_format: kv_format.clone(),
             write_format,
             row_encoder: RowEncoderFactory::create(kv_format, row_type.clone())?,
             field_getters,
@@ -311,6 +316,18 @@ impl<RE: RowEncoder> UpsertWriterImpl<RE> {
         }
         self.row_encoder.finish_row()
     }
+
+    /// Physical table path for `row`; partitioned tables add the partition extracted from it.
+    fn get_physical_path<R: InternalRow>(&self, row: &R) -> Result<PhysicalTablePath> {
+        let table_path = Arc::clone(&self.table_path);
+        match &self.partition_field_getter {
+            None => Ok(PhysicalTablePath::of(table_path)),
+            Some(getter) => Ok(PhysicalTablePath::of_partitioned(
+                table_path,
+                Some(getter.get_partition(row)?),
+            )),
+        }
+    }
 }
 
 impl<RE: RowEncoder> TableWriter for UpsertWriterImpl<RE> {
@@ -343,7 +360,8 @@ impl<RE: RowEncoder> UpsertWriter for UpsertWriterImpl<RE> {
         };
 
         let write_record = WriteRecord::for_upsert(
-            Arc::clone(&self.table_path),
+            Arc::clone(&self.table_info),
+            Arc::new(self.get_physical_path(row)?),
             self.table_info.schema_id,
             key,
             bucket_key,
@@ -372,7 +390,8 @@ impl<RE: RowEncoder> UpsertWriter for UpsertWriterImpl<RE> {
         let (key, bucket_key) = self.get_keys(row)?;
 
         let write_record = WriteRecord::for_upsert(
-            Arc::clone(&self.table_path),
+            Arc::clone(&self.table_info),
+            Arc::new(self.get_physical_path(row)?),
             self.table_info.schema_id,
             key,
             bucket_key,
diff --git a/fluss-rust/crates/fluss/src/client/table/writer.rs b/fluss-rust/crates/fluss/src/client/table/writer.rs
index 8276545703..ec26ec63dd 100644
--- a/fluss-rust/crates/fluss/src/client/table/writer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/writer.rs
@@ -15,12 +15,9 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::client::{WriteRecord, WriterClient};
 use crate::row::{GenericRow, InternalRow};
-use std::sync::Arc;
 
 use crate::error::Result;
-use crate::metadata::{TableInfo, TablePath};
 
 #[allow(dead_code, async_fn_in_trait)]
 pub trait TableWriter {
@@ -47,55 +44,3 @@ pub struct UpsertResult;
 /// Currently this is an empty struct to allow for compatible evolution in the future
 #[derive(Default)]
 pub struct DeleteResult;
-
-#[allow(dead_code)]
-pub struct AbstractTableWriter {
-    table_path: Arc<TablePath>,
-    writer_client: Arc<WriterClient>,
-    field_count: i32,
-    schema_id: i32,
-}
-
-#[allow(dead_code)]
-impl AbstractTableWriter {
-    pub fn new(
-        table_path: TablePath,
-        table_info: &TableInfo,
-        writer_client: Arc<WriterClient>,
-    ) -> Self {
-        // todo: partition
-        Self {
-            table_path: Arc::new(table_path),
-            writer_client,
-            field_count: table_info.row_type().fields().len() as i32,
-            schema_id: table_info.schema_id,
-        }
-    }
-
-    pub async fn send(&self, write_record: &WriteRecord<'_>) -> Result<()> {
-        let result_handle = self.writer_client.send(write_record).await?;
-        let result = result_handle.wait().await?;
-        result_handle.result(result)
-    }
-}
-
-impl TableWriter for AbstractTableWriter {
-    async fn flush(&self) -> Result<()> {
-        todo!()
-    }
-}
-
-// Append writer implementation
-#[allow(dead_code)]
-pub struct AppendWriterImpl {
-    base: AbstractTableWriter,
-}
-
-#[allow(dead_code)]
-impl AppendWriterImpl {
-    pub async fn append(&self, row: GenericRow<'_>) -> Result<()> {
-        let record =
-            WriteRecord::for_append(self.base.table_path.clone(), self.base.schema_id, row);
-        self.base.send(&record).await
-    }
-}
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index a5b983277f..2a45517306 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -21,7 +21,7 @@ use crate::client::{LogWriteRecord, Record, ResultHandle, WriteRecord};
 use crate::cluster::{BucketLocation, Cluster, ServerNode};
 use crate::config::Config;
 use crate::error::Result;
-use crate::metadata::{TableBucket, TablePath};
+use crate::metadata::{PhysicalTablePath, TableBucket};
 use crate::util::current_time_ms;
 use crate::{BucketId, PartitionId, TableId};
 use dashmap::DashMap;
@@ -37,7 +37,7 @@ type BucketBatches = Vec<(BucketId, Arc<Mutex<VecDeque<WriteBatch>>>)>;
 #[allow(dead_code)]
 pub struct RecordAccumulator {
     config: Config,
-    write_batches: DashMap<TablePath, BucketAndWriteBatches>,
+    write_batches: DashMap<Arc<PhysicalTablePath>, BucketAndWriteBatches>,
     // batch_id -> complete callback
     incomplete_batches: RwLock<HashMap<i64, ResultHandle>>,
     batch_timeout_ms: i64,
@@ -88,14 +88,14 @@ impl RecordAccumulator {
         &self,
         cluster: &Cluster,
         record: &WriteRecord,
-        bucket_id: BucketId,
         dq: &mut VecDeque<WriteBatch>,
     ) -> Result<RecordAppendResult> {
         if let Some(append_result) = self.try_append(record, dq)? {
             return Ok(append_result);
         }
 
-        let table_path = &record.table_path;
+        let physical_table_path = &record.physical_table_path;
+        let table_path = physical_table_path.get_table_path();
         let table_info = cluster.get_table(table_path)?;
         let arrow_compression_info = table_info.get_table_config().get_arrow_compression_info()?;
         let row_type = &table_info.row_type;
@@ -105,22 +105,20 @@ impl RecordAccumulator {
         let mut batch: WriteBatch = match record.record() {
             Record::Log(_) => ArrowLog(ArrowLogWriteBatch::new(
                 self.batch_id.fetch_add(1, Ordering::Relaxed),
-                table_path.as_ref().clone(),
+                Arc::clone(physical_table_path),
                 schema_id,
                 arrow_compression_info,
                 row_type,
-                bucket_id,
                 current_time_ms(),
                 matches!(&record.record, Record::Log(LogWriteRecord::RecordBatch(_))),
             )?),
             Record::Kv(kv_record) => Kv(KvWriteBatch::new(
                 self.batch_id.fetch_add(1, Ordering::Relaxed),
-                table_path.as_ref().clone(),
+                Arc::clone(physical_table_path),
                 schema_id,
                 // TODO: Decide how to derive write limit in the absence of java's equivalent of PreAllocatedPagedOutputView
                 KvWriteBatch::DEFAULT_WRITE_LIMIT,
                 record.write_format.to_kv_format()?,
-                bucket_id,
                 kv_record.target_columns.clone(),
                 current_time_ms(),
             )),
@@ -153,18 +151,25 @@ impl RecordAccumulator {
         cluster: &Cluster,
         abort_if_batch_full: bool,
     ) -> Result<RecordAppendResult> {
-        let table_path = &record.table_path;
+        let physical_table_path = &record.physical_table_path;
+        let table_path = physical_table_path.get_table_path();
+        let table_info = cluster.get_table(table_path)?;
+        let is_partitioned_table = table_info.is_partitioned();
 
-        // TODO: Implement partitioning
+        let partition_id = if is_partitioned_table {
+            cluster.get_partition_id(physical_table_path)
+        } else {
+            None
+        };
 
         let dq = {
             let mut binding = self
                 .write_batches
-                .entry(table_path.as_ref().clone())
+                .entry(Arc::clone(physical_table_path))
                 .or_insert_with(|| BucketAndWriteBatches {
-                    table_id: 0,
-                    is_partitioned_table: false,
-                    partition_id: None,
+                    table_id: table_info.table_id,
+                    is_partitioned_table,
+                    partition_id,
                     batches: Default::default(),
                 });
             let bucket_and_batches = binding.value_mut();
@@ -185,23 +190,24 @@ impl RecordAccumulator {
                 true, false, true,
             ));
         }
-        self.append_new_batch(cluster, record, bucket_id, &mut dq_guard)
+        self.append_new_batch(cluster, record, &mut dq_guard)
     }
 
     pub async fn ready(&self, cluster: &Arc<Cluster>) -> Result<ReadyCheckResult> {
         // Snapshot just the Arcs we need, avoiding cloning the entire BucketAndWriteBatches struct
-        let entries: Vec<(TablePath, BucketBatches)> = self
+        let entries: Vec<(Arc<PhysicalTablePath>, Option<PartitionId>, BucketBatches)> = self
             .write_batches
             .iter()
             .map(|entry| {
-                let table_path = entry.key().clone();
+                let physical_table_path = Arc::clone(entry.key());
+                let partition_id = entry.value().partition_id;
                 let bucket_batches: Vec<_> = entry
                     .value()
                     .batches
                     .iter()
                     .map(|(bucket_id, batch_arc)| (*bucket_id, batch_arc.clone()))
                     .collect();
-                (table_path, bucket_batches)
+                (physical_table_path, partition_id, bucket_batches)
             })
             .collect();
 
@@ -209,10 +215,12 @@ impl RecordAccumulator {
         let mut next_ready_check_delay_ms = self.batch_timeout_ms;
         let mut unknown_leader_tables = HashSet::new();
 
-        for (table_path, bucket_batches) in entries {
+        for (physical_table_path, mut partition_id, bucket_batches) in entries {
             next_ready_check_delay_ms = self
                 .bucket_ready(
-                    &table_path,
+                    &physical_table_path,
+                    physical_table_path.get_partition_name().is_some(),
+                    &mut partition_id,
                     bucket_batches,
                     &mut ready_nodes,
                     &mut unknown_leader_tables,
@@ -229,17 +237,42 @@ impl RecordAccumulator {
         })
     }
 
+    #[allow(clippy::too_many_arguments)]
     async fn bucket_ready(
         &self,
-        table_path: &TablePath,
+        physical_table_path: &Arc<PhysicalTablePath>,
+        is_partitioned_table: bool,
+        partition_id: &mut Option<PartitionId>,
         bucket_batches: BucketBatches,
         ready_nodes: &mut HashSet<ServerNode>,
-        unknown_leader_tables: &mut HashSet<TablePath>,
+        unknown_leader_tables: &mut HashSet<Arc<PhysicalTablePath>>,
         cluster: &Cluster,
         next_ready_check_delay_ms: i64,
     ) -> Result<i64> {
         let mut next_delay = next_ready_check_delay_ms;
 
+        // First check this table has partitionId.
+        if is_partitioned_table && partition_id.is_none() {
+            let partition_id = cluster.get_partition_id(physical_table_path);
+
+            if partition_id.is_some() {
+                // Update the cached partition_id
+                if let Some(mut entry) = self.write_batches.get_mut(physical_table_path) {
+                    entry.partition_id = partition_id;
+                }
+            } else {
+                log::debug!(
+                    "Partition does not exist for {}, bucket will not be set to ready",
+                    physical_table_path.as_ref()
+                );
+
+                // TODO: we shouldn't add unready partitions to unknownLeaderTables,
+                // because it causes PartitionNotExistException later
+                unknown_leader_tables.insert(Arc::clone(physical_table_path));
+                return Ok(next_delay);
+            }
+        }
+
         for (bucket_id, batch) in bucket_batches {
             let batch_guard = batch.lock().await;
             if batch_guard.is_empty() {
@@ -250,12 +283,12 @@ impl RecordAccumulator {
             let waited_time_ms = batch.waited_time_ms(current_time_ms());
             let deque_size = batch_guard.len();
             let full = deque_size > 1 || batch.is_closed();
-            let table_bucket = cluster.get_table_bucket(table_path, bucket_id)?;
+            let table_bucket = cluster.get_table_bucket(physical_table_path, bucket_id)?;
             if let Some(leader) = cluster.leader_for(&table_bucket) {
                 next_delay =
                     self.batch_ready(leader, waited_time_ms, full, ready_nodes, next_delay);
             } else {
-                unknown_leader_tables.insert(table_path.clone());
+                unknown_leader_tables.insert(Arc::clone(physical_table_path));
             }
         }
         Ok(next_delay)
@@ -332,14 +365,14 @@ impl RecordAccumulator {
 
         loop {
             let bucket = &buckets[current_index];
-            let table_path = bucket.table_path.clone();
+            let table_path = bucket.physical_table_path();
             let table_bucket = bucket.table_bucket.clone();
             last_processed_index = current_index;
             current_index = (current_index + 1) % buckets.len();
 
             let deque = self
                 .write_batches
-                .get(&table_path)
+                .get(table_path)
                 .and_then(|bucket_and_write_batches| {
                     bucket_and_write_batches
                         .batches
@@ -399,20 +432,22 @@ impl RecordAccumulator {
 
     pub async fn re_enqueue(&self, ready_write_batch: ReadyWriteBatch) {
         ready_write_batch.write_batch.re_enqueued();
-        let table_path = ready_write_batch.write_batch.table_path().clone();
+        let physical_table_path = ready_write_batch.write_batch.physical_table_path();
         let bucket_id = ready_write_batch.table_bucket.bucket_id();
         let table_id = ready_write_batch.table_bucket.table_id();
+        let partition_id = ready_write_batch.table_bucket.partition_id();
+        let is_partitioned_table = partition_id.is_some();
 
         let dq = {
-            let mut binding =
-                self.write_batches
-                    .entry(table_path)
-                    .or_insert_with(|| BucketAndWriteBatches {
-                        table_id,
-                        is_partitioned_table: false,
-                        partition_id: None,
-                        batches: Default::default(),
-                    });
+            let mut binding = self
+                .write_batches
+                .entry(Arc::clone(physical_table_path))
+                .or_insert_with(|| BucketAndWriteBatches {
+                    table_id,
+                    is_partitioned_table,
+                    partition_id,
+                    batches: Default::default(),
+                });
             let bucket_and_batches = binding.value_mut();
             bucket_and_batches
                 .batches
@@ -478,6 +513,12 @@ pub struct ReadyWriteBatch {
     pub write_batch: WriteBatch,
 }
 
+impl ReadyWriteBatch {
+    pub fn write_batch(&self) -> &WriteBatch {
+        &self.write_batch
+    }
+}
+
 #[allow(dead_code)]
 struct BucketAndWriteBatches {
     table_id: TableId,
@@ -525,14 +566,14 @@ impl RecordAppendResult {
 pub struct ReadyCheckResult {
     pub ready_nodes: HashSet<ServerNode>,
     pub next_ready_check_delay_ms: i64,
-    pub unknown_leader_tables: HashSet<TablePath>,
+    pub unknown_leader_tables: HashSet<Arc<PhysicalTablePath>>,
 }
 
 impl ReadyCheckResult {
     pub fn new(
         ready_nodes: HashSet<ServerNode>,
         next_ready_check_delay_ms: i64,
-        unknown_leader_tables: HashSet<TablePath>,
+        unknown_leader_tables: HashSet<Arc<PhysicalTablePath>>,
     ) -> Self {
         ReadyCheckResult {
             ready_nodes,
@@ -547,17 +588,20 @@ mod tests {
     use super::*;
     use crate::metadata::TablePath;
     use crate::row::{Datum, GenericRow};
-    use crate::test_utils::build_cluster;
+    use crate::test_utils::{build_cluster, build_table_info};
     use std::sync::Arc;
 
     #[tokio::test]
     async fn re_enqueue_increments_attempts() -> Result<()> {
         let config = Config::default();
         let accumulator = RecordAccumulator::new(config);
-        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
-        let cluster = Arc::new(build_cluster(table_path.as_ref(), 1, 1));
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let cluster = Arc::new(build_cluster(&table_path, 1, 1));
         let record = WriteRecord::for_append(
-            table_path.clone(),
+            table_info,
+            physical_table_path,
             1,
             GenericRow {
                 values: vec![Datum::Int32(1)],
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index 41561d4ac7..da30c8aca4 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -15,12 +15,11 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::BucketId;
 use crate::client::broadcast::{BatchWriteResult, BroadcastOnce};
 use crate::client::{Record, ResultHandle, WriteRecord};
 use crate::compression::ArrowCompressionInfo;
 use crate::error::{Error, Result};
-use crate::metadata::{KvFormat, RowType, TablePath};
+use crate::metadata::{KvFormat, PhysicalTablePath, RowType};
 use crate::record::MemoryLogRecordsArrowBuilder;
 use crate::record::kv::KvRecordBatchBuilder;
 use bytes::Bytes;
@@ -28,12 +27,10 @@ use std::cmp::max;
 use std::sync::Arc;
 use std::sync::atomic::{AtomicBool, AtomicI32, Ordering};
 
-#[allow(dead_code)]
 pub struct InnerWriteBatch {
     batch_id: i64,
-    table_path: TablePath,
+    physical_table_path: Arc<PhysicalTablePath>,
     create_ms: i64,
-    bucket_id: BucketId,
     results: BroadcastOnce<BatchWriteResult>,
     completed: AtomicBool,
     attempts: AtomicI32,
@@ -41,12 +38,11 @@ pub struct InnerWriteBatch {
 }
 
 impl InnerWriteBatch {
-    fn new(batch_id: i64, table_path: TablePath, create_ms: i64, bucket_id: BucketId) -> Self {
+    fn new(batch_id: i64, physical_table_path: Arc<PhysicalTablePath>, create_ms: i64) -> Self {
         InnerWriteBatch {
             batch_id,
-            table_path,
+            physical_table_path,
             create_ms,
-            bucket_id,
             results: Default::default(),
             completed: AtomicBool::new(false),
             attempts: AtomicI32::new(0),
@@ -74,8 +70,8 @@ impl InnerWriteBatch {
         self.drained_ms = max(self.drained_ms, now_ms);
     }
 
-    fn table_path(&self) -> &TablePath {
-        &self.table_path
+    fn physical_table_path(&self) -> &Arc<PhysicalTablePath> {
+        &self.physical_table_path
     }
 
     fn attempts(&self) -> i32 {
@@ -165,8 +161,8 @@ impl WriteBatch {
         self.inner_batch().batch_id
     }
 
-    pub fn table_path(&self) -> &TablePath {
-        self.inner_batch().table_path()
+    pub fn physical_table_path(&self) -> &Arc<PhysicalTablePath> {
+        self.inner_batch().physical_table_path()
     }
 
     pub fn attempts(&self) -> i32 {
@@ -192,15 +188,14 @@ impl ArrowLogWriteBatch {
     #[allow(clippy::too_many_arguments)]
     pub fn new(
         batch_id: i64,
-        table_path: TablePath,
+        physical_table_path: Arc<PhysicalTablePath>,
         schema_id: i32,
         arrow_compression_info: ArrowCompressionInfo,
         row_type: &RowType,
-        bucket_id: BucketId,
         create_ms: i64,
         to_append_record_batch: bool,
     ) -> Result<Self> {
-        let base = InnerWriteBatch::new(batch_id, table_path, create_ms, bucket_id);
+        let base = InnerWriteBatch::new(batch_id, physical_table_path, create_ms);
         Ok(Self {
             write_batch: base,
             arrow_builder: MemoryLogRecordsArrowBuilder::new(
@@ -273,15 +268,14 @@ impl KvWriteBatch {
     #[allow(clippy::too_many_arguments)]
     pub fn new(
         batch_id: i64,
-        table_path: TablePath,
+        physical_table_path: Arc<PhysicalTablePath>,
         schema_id: i32,
         write_limit: usize,
         kv_format: KvFormat,
-        bucket_id: BucketId,
         target_columns: Option<Arc<Vec<usize>>>,
         create_ms: i64,
     ) -> Self {
-        let base = InnerWriteBatch::new(batch_id, table_path, create_ms, bucket_id);
+        let base = InnerWriteBatch::new(batch_id, physical_table_path, create_ms);
         Self {
             write_batch: base,
             kv_batch_builder: KvRecordBatchBuilder::new(schema_id, write_limit, kv_format),
@@ -367,19 +361,22 @@ mod tests {
     use super::*;
     use crate::client::{RowBytes, WriteFormat};
     use crate::metadata::TablePath;
+    use crate::test_utils::build_table_info;
 
     #[test]
     fn complete_only_once() {
-        let batch =
-            InnerWriteBatch::new(1, TablePath::new("db".to_string(), "tbl".to_string()), 0, 0);
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let physical_path = PhysicalTablePath::of(Arc::new(table_path));
+        let batch = InnerWriteBatch::new(1, Arc::new(physical_path), 0);
         assert!(batch.complete(Ok(())));
         assert!(!batch.complete(Err(crate::client::broadcast::Error::Dropped)));
     }
 
     #[test]
     fn attempts_increment_on_reenqueue() {
-        let batch =
-            InnerWriteBatch::new(1, TablePath::new("db".to_string(), "tbl".to_string()), 0, 0);
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let physical_path = PhysicalTablePath::of(Arc::new(table_path));
+        let batch = InnerWriteBatch::new(1, Arc::new(physical_path), 0);
         assert_eq!(batch.attempts(), 0);
         batch.re_enqueued();
         assert_eq!(batch.attempts(), 1);
@@ -401,12 +398,14 @@ mod tests {
             DataField::new("name".to_string(), DataTypes::string(), None),
         ]);
         let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path)));
 
         // Test 1: RowAppendRecordBatchBuilder (to_append_record_batch=false)
         {
             let mut batch = ArrowLogWriteBatch::new(
                 1,
-                table_path.clone(),
+                Arc::clone(&physical_table_path),
                 1,
                 ArrowCompressionInfo {
                     compression_type: ArrowCompressionType::None,
@@ -414,7 +413,6 @@ mod tests {
                 },
                 &row_type,
                 0,
-                0,
                 false,
             )
             .unwrap();
@@ -424,7 +422,12 @@ mod tests {
                 let mut row = GenericRow::new(2);
                 row.set_field(0, 1_i32);
                 row.set_field(1, "hello");
-                let record = WriteRecord::for_append(Arc::new(table_path.clone()), 1, row);
+                let record = WriteRecord::for_append(
+                    Arc::clone(&table_info),
+                    Arc::clone(&physical_table_path),
+                    1,
+                    row,
+                );
                 batch.try_append(&record).unwrap();
             }
 
@@ -446,7 +449,7 @@ mod tests {
         {
             let mut batch = ArrowLogWriteBatch::new(
                 1,
-                table_path.clone(),
+                physical_table_path.clone(),
                 1,
                 ArrowCompressionInfo {
                     compression_type: ArrowCompressionType::None,
@@ -454,7 +457,6 @@ mod tests {
                 },
                 &row_type,
                 0,
-                0,
                 true,
             )
             .unwrap();
@@ -472,8 +474,12 @@ mod tests {
             )
             .unwrap();
 
-            let record =
-                WriteRecord::for_append_record_batch(Arc::new(table_path.clone()), 1, record_batch);
+            let record = WriteRecord::for_append_record_batch(
+                Arc::clone(&table_info),
+                Arc::clone(&physical_table_path),
+                1,
+                record_batch,
+            );
             batch.try_append(&record).unwrap();
 
             let estimated_size = batch.estimated_size_in_bytes();
@@ -496,21 +502,23 @@ mod tests {
         use crate::metadata::KvFormat;
 
         let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path)));
 
         let mut batch = KvWriteBatch::new(
             1,
-            table_path.clone(),
+            Arc::clone(&physical_path),
             1,
             KvWriteBatch::DEFAULT_WRITE_LIMIT,
             KvFormat::COMPACTED,
-            0,
             None,
             0,
         );
 
         for _ in 0..200 {
             let record = WriteRecord::for_upsert(
-                Arc::new(table_path.clone()),
+                Arc::clone(&table_info),
+                Arc::clone(&physical_path),
                 1,
                 Bytes::from(vec![1_u8, 2_u8, 3_u8]),
                 None,
diff --git a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
index 817101a41a..7fcd20ba54 100644
--- a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
+++ b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
@@ -19,9 +19,10 @@ use crate::bucketing::BucketingFunction;
 use crate::cluster::Cluster;
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::TablePath;
+use crate::metadata::PhysicalTablePath;
 use bytes::Bytes;
 use rand::Rng;
+use std::sync::Arc;
 use std::sync::atomic::{AtomicI32, Ordering};
 
 pub trait BucketAssigner: Sync + Send {
@@ -34,12 +35,12 @@ pub trait BucketAssigner: Sync + Send {
 
 #[derive(Debug)]
 pub struct StickyBucketAssigner {
-    table_path: TablePath,
+    table_path: Arc<PhysicalTablePath>,
     current_bucket_id: AtomicI32,
 }
 
 impl StickyBucketAssigner {
-    pub fn new(table_path: TablePath) -> Self {
+    pub fn new(table_path: Arc<PhysicalTablePath>) -> Self {
         Self {
             table_path,
             current_bucket_id: AtomicI32::new(-1),
@@ -55,7 +56,7 @@ impl StickyBucketAssigner {
                 let mut rng = rand::rng();
                 let mut random: i32 = rng.random();
                 random &= i32::MAX;
-                new_bucket = random % cluster.get_bucket_count(&self.table_path);
+                new_bucket = random % cluster.get_bucket_count(self.table_path.get_table_path());
             } else if available_buckets.len() == 1 {
                 new_bucket = available_buckets[0].table_bucket.bucket_id();
             } else {
@@ -155,12 +156,15 @@ mod tests {
     use crate::cluster::Cluster;
     use crate::metadata::TablePath;
     use crate::test_utils::build_cluster;
+    use std::sync::Arc;
 
     #[test]
     fn sticky_bucket_assigner_picks_available_bucket() {
         let table_path = TablePath::new("db".to_string(), "tbl".to_string());
         let cluster = build_cluster(&table_path, 1, 2);
-        let assigner = StickyBucketAssigner::new(table_path);
+        let assigner = StickyBucketAssigner::new(Arc::new(PhysicalTablePath::of(Arc::new(
+            table_path.clone(),
+        ))));
         let bucket = assigner.assign_bucket(None, &cluster).expect("bucket");
         assert!((0..2).contains(&bucket));
 
@@ -174,7 +178,7 @@ mod tests {
         let assigner = HashBucketAssigner::new(3, <dyn BucketingFunction>::of(None));
         let cluster = Cluster::default();
         let err = assigner.assign_bucket(None, &cluster).unwrap_err();
-        assert!(matches!(err, crate::error::Error::IllegalArgument { .. }));
+        assert!(matches!(err, IllegalArgument { .. }));
     }
 
     #[test]
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index dcc6795996..868b582c2a 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -20,7 +20,8 @@ mod batch;
 
 use crate::client::broadcast::{self as client_broadcast, BatchWriteResult, BroadcastOnceReceiver};
 use crate::error::Error;
-use crate::metadata::TablePath;
+use crate::metadata::{PhysicalTablePath, TableInfo};
+
 use crate::row::GenericRow;
 pub use accumulator::*;
 use arrow::array::RecordBatch;
@@ -40,16 +41,21 @@ pub use writer_client::WriterClient;
 #[allow(dead_code)]
 pub struct WriteRecord<'a> {
     record: Record<'a>,
-    table_path: Arc<TablePath>,
+    physical_table_path: Arc<PhysicalTablePath>,
     bucket_key: Option<Bytes>,
     schema_id: i32,
     write_format: WriteFormat,
+    table_info: Arc<TableInfo>,
 }
 
 impl<'a> WriteRecord<'a> {
     pub fn record(&self) -> &Record<'a> {
         &self.record
     }
+
+    pub fn physical_table_path(&self) -> &Arc<PhysicalTablePath> {
+        &self.physical_table_path
+    }
 }
 
 pub enum Record<'a> {
@@ -102,10 +108,16 @@ impl<'a> KvWriteRecord<'a> {
 }
 
 impl<'a> WriteRecord<'a> {
-    pub fn for_append(table_path: Arc<TablePath>, schema_id: i32, row: GenericRow<'a>) -> Self {
+    pub fn for_append(
+        table_info: Arc<TableInfo>,
+        physical_table_path: Arc<PhysicalTablePath>,
+        schema_id: i32,
+        row: GenericRow<'a>,
+    ) -> Self {
         Self {
+            table_info,
             record: Record::Log(LogWriteRecord::Generic(row)),
-            table_path,
+            physical_table_path,
             bucket_key: None,
             schema_id,
             write_format: WriteFormat::ArrowLog,
@@ -113,21 +125,25 @@ impl<'a> WriteRecord<'a> {
     }
 
     pub fn for_append_record_batch(
-        table_path: Arc<TablePath>,
+        table_info: Arc<TableInfo>,
+        physical_table_path: Arc<PhysicalTablePath>,
         schema_id: i32,
         row: RecordBatch,
     ) -> Self {
         Self {
+            table_info,
             record: Record::Log(LogWriteRecord::RecordBatch(Arc::new(row))),
-            table_path,
+            physical_table_path,
             bucket_key: None,
             schema_id,
             write_format: WriteFormat::ArrowLog,
         }
     }
 
+    #[allow(clippy::too_many_arguments)]
     pub fn for_upsert(
-        table_path: Arc<TablePath>,
+        table_info: Arc<TableInfo>,
+        physical_table_path: Arc<PhysicalTablePath>,
         schema_id: i32,
         key: Bytes,
         bucket_key: Option<Bytes>,
@@ -136,8 +152,9 @@ impl<'a> WriteRecord<'a> {
         row_bytes: Option<RowBytes<'a>>,
     ) -> Self {
         Self {
+            table_info,
             record: Record::Kv(KvWriteRecord::new(key, target_columns, row_bytes)),
-            table_path,
+            physical_table_path,
             bucket_key,
             schema_id,
             write_format,
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index 905ef8052b..6a7dad002c 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -15,20 +15,20 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::TableId;
 use crate::client::broadcast;
 use crate::client::metadata::Metadata;
 use crate::client::write::batch::WriteBatch;
 use crate::client::{ReadyWriteBatch, RecordAccumulator};
 use crate::error::Error::UnexpectedError;
 use crate::error::{FlussError, Result};
-use crate::metadata::{TableBucket, TablePath};
+use crate::metadata::{PhysicalTablePath, TableBucket, TablePath};
 use crate::proto::{
     PbProduceLogRespForBucket, PbPutKvRespForBucket, ProduceLogResponse, PutKvResponse,
 };
 use crate::rpc::ServerConnection;
 use crate::rpc::message::{ProduceLogRequest, PutKvRequest};
-use log::warn;
+use crate::{PartitionId, TableId};
+use log::{debug, warn};
 use parking_lot::Mutex;
 use std::collections::{HashMap, HashSet};
 use std::sync::Arc;
@@ -82,9 +82,39 @@ impl Sender {
 
         // Update metadata if needed
         if !ready_check_result.unknown_leader_tables.is_empty() {
-            self.metadata
-                .update_tables_metadata(&ready_check_result.unknown_leader_tables.iter().collect())
-                .await?;
+            let mut table_paths: HashSet<&TablePath> = HashSet::new();
+            let mut physical_table_paths: HashSet<&Arc<PhysicalTablePath>> = HashSet::new();
+
+            for unknown_paths in ready_check_result.unknown_leader_tables.iter() {
+                if unknown_paths.get_partition_name().is_some() {
+                    physical_table_paths.insert(unknown_paths);
+                } else {
+                    table_paths.insert(unknown_paths.get_table_path());
+                }
+            }
+
+            if let Err(e) = self
+                .metadata
+                .update_tables_metadata(&table_paths, &physical_table_paths, vec![])
+                .await
+            {
+                match &e {
+                    crate::error::Error::FlussAPIError { api_error }
+                        if api_error.code == FlussError::PartitionNotExists.code() =>
+                    {
+                        warn!(
+                            "Partition does not exist during metadata update, continuing: {}",
+                            api_error
+                        );
+                    }
+                    _ => return Err(e),
+                }
+            }
+
+            debug!(
+                "Client update metadata due to unknown leader tables from the batched records: {:?}",
+                ready_check_result.unknown_leader_tables
+            );
         }
 
         if ready_check_result.ready_nodes.is_empty() {
@@ -327,10 +357,15 @@ impl Sender {
         response: R,
     ) -> Result<()> {
         let mut invalid_metadata_tables: HashSet<TablePath> = HashSet::new();
+        let mut invalid_physical_table_paths: HashSet<Arc<PhysicalTablePath>> = HashSet::new();
         let mut pending_buckets: HashSet<TableBucket> = request_buckets.iter().cloned().collect();
 
         for bucket_resp in response.buckets_resp() {
-            let tb = TableBucket::new(table_id, bucket_resp.bucket_id());
+            let tb = TableBucket::new_with_partition(
+                table_id,
+                bucket_resp.partition_id(),
+                bucket_resp.bucket_id(),
+            );
             let Some(ready_batch) = records_by_bucket.remove(&tb) else {
                 panic!("Missing ready batch for table bucket {tb}");
             };
@@ -343,11 +378,13 @@ impl Sender {
                         .error_message()
                         .cloned()
                         .unwrap_or_else(|| error.message().to_string());
-                    if let Some(table_path) = self
+                    if let Some(physical_table_path) = self
                         .handle_write_batch_error(ready_batch, error, message)
                         .await?
                     {
-                        invalid_metadata_tables.insert(table_path);
+                        invalid_metadata_tables
+                            .insert(physical_table_path.get_table_path().clone());
+                        invalid_physical_table_paths.insert(physical_table_path);
                     }
                 }
                 _ => self.complete_batch(ready_batch),
@@ -356,7 +393,7 @@ impl Sender {
 
         for bucket in pending_buckets {
             if let Some(ready_batch) = records_by_bucket.remove(&bucket) {
-                if let Some(table_path) = self
+                if let Some(physical_table_path) = self
                     .handle_write_batch_error(
                         ready_batch,
                         FlussError::UnknownServerError,
@@ -364,12 +401,13 @@ impl Sender {
                     )
                     .await?
                 {
-                    invalid_metadata_tables.insert(table_path);
+                    invalid_metadata_tables.insert(physical_table_path.get_table_path().clone());
+                    invalid_physical_table_paths.insert(physical_table_path);
                 }
             }
         }
 
-        self.update_metadata_if_needed(invalid_metadata_tables)
+        self.update_metadata_if_needed(invalid_metadata_tables, invalid_physical_table_paths)
             .await;
         Ok(())
     }
@@ -398,15 +436,18 @@ impl Sender {
         message: String,
     ) -> Result<()> {
         let mut invalid_metadata_tables: HashSet<TablePath> = HashSet::new();
+        let mut invalid_physical_table_paths: HashSet<Arc<PhysicalTablePath>> = HashSet::new();
+
         for batch in batches {
-            if let Some(table_path) = self
+            if let Some(physical_table_path) = self
                 .handle_write_batch_error(batch, error, message.clone())
                 .await?
             {
-                invalid_metadata_tables.insert(table_path);
+                invalid_metadata_tables.insert(physical_table_path.get_table_path().clone());
+                invalid_physical_table_paths.insert(physical_table_path);
             }
         }
-        self.update_metadata_if_needed(invalid_metadata_tables)
+        self.update_metadata_if_needed(invalid_metadata_tables, invalid_physical_table_paths)
             .await;
         Ok(())
     }
@@ -432,20 +473,22 @@ impl Sender {
         ready_write_batch: ReadyWriteBatch,
         error: FlussError,
         message: String,
-    ) -> Result<Option<TablePath>> {
-        let table_path = ready_write_batch.write_batch.table_path().clone();
+    ) -> Result<Option<Arc<PhysicalTablePath>>> {
+        let physical_table_path = Arc::clone(ready_write_batch.write_batch.physical_table_path());
         if self.can_retry(&ready_write_batch, error) {
             warn!(
-                "Retrying write batch for {table_path} on bucket {} after error {error:?}: {message}",
+                "Retrying write batch for {} on bucket {} after error {error:?}: {message}",
+                physical_table_path.as_ref(),
                 ready_write_batch.table_bucket.bucket_id()
             );
             self.re_enqueue_batch(ready_write_batch).await;
-            return Ok(Self::is_invalid_metadata_error(error).then_some(table_path));
+            return Ok(Self::is_invalid_metadata_error(error).then_some(physical_table_path));
         }
 
         if error == FlussError::DuplicateSequenceException {
             warn!(
-                "Duplicate sequence for {table_path} on bucket {}: {message}",
+                "Duplicate sequence for {} on bucket {}: {message}",
+                physical_table_path.as_ref(),
                 ready_write_batch.table_bucket.bucket_id()
             );
             self.complete_batch(ready_write_batch);
@@ -459,7 +502,7 @@ impl Sender {
                 message,
             },
         );
-        Ok(Self::is_invalid_metadata_error(error).then_some(table_path))
+        Ok(Self::is_invalid_metadata_error(error).then_some(physical_table_path))
     }
 
     async fn re_enqueue_batch(&self, ready_write_batch: ReadyWriteBatch) {
@@ -484,12 +527,22 @@ impl Sender {
             && Self::is_retriable_error(error)
     }
 
-    async fn update_metadata_if_needed(&self, table_paths: HashSet<TablePath>) {
+    async fn update_metadata_if_needed(
+        &self,
+        table_paths: HashSet<TablePath>,
+        physical_table_path: HashSet<Arc<PhysicalTablePath>>,
+    ) {
         if table_paths.is_empty() {
             return;
         }
         let table_path_refs: HashSet<&TablePath> = table_paths.iter().collect();
-        if let Err(e) = self.metadata.update_tables_metadata(&table_path_refs).await {
+        let physical_table_path_refs: HashSet<&Arc<PhysicalTablePath>> =
+            physical_table_path.iter().collect();
+        if let Err(e) = self
+            .metadata
+            .update_tables_metadata(&table_path_refs, &physical_table_path_refs, vec![])
+            .await
+        {
             warn!("Failed to update metadata after write error: {e:?}");
         }
     }
@@ -536,6 +589,8 @@ trait BucketResponse {
     fn bucket_id(&self) -> i32;
     fn error_code(&self) -> Option<i32>;
     fn error_message(&self) -> Option<&String>;
+
+    fn partition_id(&self) -> Option<PartitionId>;
 }
 
 impl BucketResponse for PbProduceLogRespForBucket {
@@ -548,6 +603,10 @@ impl BucketResponse for PbProduceLogRespForBucket {
     fn error_message(&self) -> Option<&String> {
         self.error_message.as_ref()
     }
+
+    fn partition_id(&self) -> Option<PartitionId> {
+        self.partition_id
+    }
 }
 
 impl BucketResponse for PbPutKvRespForBucket {
@@ -560,6 +619,10 @@ impl BucketResponse for PbPutKvRespForBucket {
     fn error_message(&self) -> Option<&String> {
         self.error_message.as_ref()
     }
+
+    fn partition_id(&self) -> Option<PartitionId> {
+        self.partition_id
+    }
 }
 
 trait WriteResponse {
@@ -587,11 +650,11 @@ mod tests {
     use crate::client::WriteRecord;
     use crate::cluster::Cluster;
     use crate::config::Config;
-    use crate::metadata::TablePath;
+    use crate::metadata::{PhysicalTablePath, TablePath};
     use crate::proto::{PbProduceLogRespForBucket, ProduceLogResponse};
     use crate::row::{Datum, GenericRow};
     use crate::rpc::FlussError;
-    use crate::test_utils::build_cluster_arc;
+    use crate::test_utils::{build_cluster_arc, build_table_info};
     use std::collections::{HashMap, HashSet};
 
     async fn build_ready_batch(
@@ -599,8 +662,11 @@ mod tests {
         cluster: Arc<Cluster>,
         table_path: Arc<TablePath>,
     ) -> Result<(ReadyWriteBatch, crate::client::ResultHandle)> {
+        let table_info = Arc::new(build_table_info(table_path.as_ref().clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(table_path));
         let record = WriteRecord::for_append(
-            table_path,
+            table_info,
+            physical_table_path,
             1,
             GenericRow {
                 values: vec![Datum::Int32(1)],
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index 65b04f5621..c386adf70e 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -15,20 +15,23 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::BucketId;
+use crate::bucketing::BucketingFunction;
 use crate::client::metadata::Metadata;
-use crate::client::write::bucket_assigner::{BucketAssigner, StickyBucketAssigner};
+use crate::client::write::bucket_assigner::{
+    BucketAssigner, HashBucketAssigner, StickyBucketAssigner,
+};
 use crate::client::write::sender::Sender;
 use crate::client::{RecordAccumulator, ResultHandle, WriteRecord};
 use crate::config::Config;
-use crate::metadata::TablePath;
+use crate::error::{Error, Result};
+use crate::metadata::{PhysicalTablePath, TableInfo};
 use bytes::Bytes;
 use dashmap::DashMap;
 use std::sync::Arc;
 use tokio::sync::mpsc;
 use tokio::task::JoinHandle;
 
-use crate::error::{Error, Result};
-
 #[allow(dead_code)]
 pub struct WriterClient {
     config: Config,
@@ -37,7 +40,7 @@ pub struct WriterClient {
     shutdown_tx: mpsc::Sender<()>,
     sender_join_handle: JoinHandle<()>,
     metadata: Arc<Metadata>,
-    bucket_assigners: DashMap<TablePath, Arc<Box<dyn BucketAssigner>>>,
+    bucket_assigners: DashMap<Arc<PhysicalTablePath>, Arc<dyn BucketAssigner>>,
 }
 
 impl WriterClient {
@@ -89,11 +92,12 @@ impl WriterClient {
     }
 
     pub async fn send(&self, record: &WriteRecord<'_>) -> Result<ResultHandle> {
-        let table_path = &record.table_path;
+        let physical_table_path = &record.physical_table_path;
         let cluster = self.metadata.get_cluster();
         let bucket_key = record.bucket_key.as_ref();
 
-        let (bucket_assigner, bucket_id) = self.assign_bucket(bucket_key, table_path)?;
+        let (bucket_assigner, bucket_id) =
+            self.assign_bucket(&record.table_info, bucket_key, physical_table_path)?;
 
         let mut result = self
             .accumulate
@@ -118,17 +122,19 @@ impl WriterClient {
     }
     fn assign_bucket(
         &self,
+        table_info: &Arc<TableInfo>,
         bucket_key: Option<&Bytes>,
-        table_path: &Arc<TablePath>,
-    ) -> Result<(Arc<Box<dyn BucketAssigner>>, i32)> {
+        table_path: &Arc<PhysicalTablePath>,
+    ) -> Result<(Arc<dyn BucketAssigner>, BucketId)> {
         let cluster = self.metadata.get_cluster();
         let bucket_assigner = {
             if let Some(assigner) = self.bucket_assigners.get(table_path) {
                 assigner.clone()
             } else {
-                let assigner = Arc::new(Self::create_bucket_assigner(table_path.as_ref()));
+                let assigner =
+                    Self::create_bucket_assigner(table_info, Arc::clone(table_path), bucket_key)?;
                 self.bucket_assigners
-                    .insert(table_path.as_ref().clone(), assigner.clone());
+                    .insert(Arc::clone(table_path), Arc::clone(&assigner.clone()));
                 assigner
             }
         };
@@ -160,8 +166,21 @@ impl WriterClient {
         Ok(())
     }
 
-    pub fn create_bucket_assigner(table_path: &TablePath) -> Box<dyn BucketAssigner> {
-        // always sticky
-        Box::new(StickyBucketAssigner::new(table_path.clone()))
+    pub fn create_bucket_assigner(
+        table_info: &Arc<TableInfo>,
+        table_path: Arc<PhysicalTablePath>,
+        bucket_key: Option<&Bytes>,
+    ) -> Result<Arc<dyn BucketAssigner>> {
+        if bucket_key.is_some() {
+            let datalake_format = table_info.get_table_config().get_datalake_format()?;
+            let function = <dyn BucketingFunction>::of(datalake_format.as_ref());
+            Ok(Arc::new(HashBucketAssigner::new(
+                table_info.num_buckets,
+                function,
+            )))
+        } else {
+            // TODO: Wire up to use round robin/sticky according to ConfigOptions.CLIENT_WRITER_BUCKET_NO_KEY_ASSIGNER
+            Ok(Arc::new(StickyBucketAssigner::new(table_path)))
+        }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/cluster/cluster.rs b/fluss-rust/crates/fluss/src/cluster/cluster.rs
index d6fe0ae5d1..1f950ad6b9 100644
--- a/fluss-rust/crates/fluss/src/cluster/cluster.rs
+++ b/fluss-rust/crates/fluss/src/cluster/cluster.rs
@@ -15,16 +15,18 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::BucketId;
 use crate::cluster::{BucketLocation, ServerNode, ServerType};
+use crate::error::Error::PartitionNotExist;
 use crate::error::{Error, Result};
 use crate::metadata::{
     JsonSerde, PhysicalTablePath, TableBucket, TableDescriptor, TableInfo, TablePath,
 };
-use crate::proto::MetadataResponse;
+use crate::proto::{MetadataResponse, PbBucketMetadata};
 use crate::rpc::{from_pb_server_node, from_pb_table_path};
+use crate::{BucketId, PartitionId, TableId};
 use rand::random_range;
 use std::collections::{HashMap, HashSet};
+use std::sync::Arc;
 
 static EMPTY: Vec<BucketLocation> = Vec::new();
 
@@ -33,27 +35,35 @@ pub struct Cluster {
     coordinator_server: Option<ServerNode>,
     alive_tablet_servers_by_id: HashMap<i32, ServerNode>,
     alive_tablet_servers: Vec<ServerNode>,
-    available_locations_by_path: HashMap<TablePath, Vec<BucketLocation>>,
+    available_locations_by_path: HashMap<Arc<PhysicalTablePath>, Vec<BucketLocation>>,
     available_locations_by_bucket: HashMap<TableBucket, BucketLocation>,
-    table_id_by_path: HashMap<TablePath, i64>,
-    table_path_by_id: HashMap<i64, TablePath>,
+    table_id_by_path: HashMap<TablePath, TableId>,
+    table_path_by_id: HashMap<TableId, TablePath>,
     table_info_by_path: HashMap<TablePath, TableInfo>,
+    partitions_id_by_path: HashMap<Arc<PhysicalTablePath>, PartitionId>,
+    partition_name_by_id: HashMap<PartitionId, String>,
 }
 
 impl Cluster {
+    #[allow(clippy::too_many_arguments)]
     pub fn new(
         coordinator_server: Option<ServerNode>,
         alive_tablet_servers_by_id: HashMap<i32, ServerNode>,
-        available_locations_by_path: HashMap<TablePath, Vec<BucketLocation>>,
+        available_locations_by_path: HashMap<Arc<PhysicalTablePath>, Vec<BucketLocation>>,
         available_locations_by_bucket: HashMap<TableBucket, BucketLocation>,
-        table_id_by_path: HashMap<TablePath, i64>,
+        table_id_by_path: HashMap<TablePath, TableId>,
         table_info_by_path: HashMap<TablePath, TableInfo>,
+        partitions_id_by_path: HashMap<Arc<PhysicalTablePath>, PartitionId>,
     ) -> Self {
         let alive_tablet_servers = alive_tablet_servers_by_id.values().cloned().collect();
         let table_path_by_id = table_id_by_path
             .iter()
             .map(|(path, table_id)| (*table_id, path.clone()))
             .collect();
+        let partition_name_by_id = partitions_id_by_path
+            .iter()
+            .filter_map(|(path, id)| path.get_partition_name().map(|name| (*id, name.clone())))
+            .collect();
         Cluster {
             coordinator_server,
             alive_tablet_servers_by_id,
@@ -63,10 +73,12 @@ impl Cluster {
             table_id_by_path,
             table_path_by_id,
             table_info_by_path,
+            partitions_id_by_path,
+            partition_name_by_id,
         }
     }
 
-    pub fn invalidate_server(&self, server_id: &i32, table_ids: Vec<i64>) -> Self {
+    pub fn invalidate_server(&self, server_id: &i32, table_ids: Vec<TableId>) -> Self {
         let alive_tablet_servers_by_id = self
             .alive_tablet_servers_by_id
             .iter()
@@ -89,6 +101,7 @@ impl Cluster {
             available_locations_by_bucket,
             self.table_id_by_path.clone(),
             self.table_info_by_path.clone(),
+            self.partitions_id_by_path.clone(),
         )
     }
 
@@ -110,6 +123,7 @@ impl Cluster {
             available_locations_by_bucket,
             self.table_id_by_path.clone(),
             self.table_info_by_path.clone(),
+            self.partitions_id_by_path.clone(),
         )
     }
 
@@ -123,6 +137,8 @@ impl Cluster {
             table_id_by_path,
             table_path_by_id,
             table_info_by_path,
+            partitions_id_by_path,
+            partition_name_by_id,
         } = cluster;
         self.coordinator_server = coordinator_server;
         self.alive_tablet_servers_by_id = alive_tablet_servers_by_id;
@@ -132,26 +148,30 @@ impl Cluster {
         self.table_id_by_path = table_id_by_path;
         self.table_path_by_id = table_path_by_id;
         self.table_info_by_path = table_info_by_path;
+        self.partitions_id_by_path = partitions_id_by_path;
+        self.partition_name_by_id = partition_name_by_id;
     }
 
     fn filter_bucket_locations_by_path(
         &self,
         table_paths: &HashSet<&TablePath>,
     ) -> (
-        HashMap<TablePath, Vec<BucketLocation>>,
+        HashMap<Arc<PhysicalTablePath>, Vec<BucketLocation>>,
         HashMap<TableBucket, BucketLocation>,
     ) {
         let available_locations_by_path = self
             .available_locations_by_path
             .iter()
-            .filter(|&(path, _)| !table_paths.contains(path))
+            .filter(|&(path, _)| !table_paths.contains(path.get_table_path()))
             .map(|(path, locations)| (path.clone(), locations.clone()))
             .collect();
 
         let available_locations_by_bucket = self
             .available_locations_by_bucket
             .iter()
-            .filter(|&(_bucket, location)| !table_paths.contains(&location.table_path))
+            .filter(|&(_bucket, location)| {
+                !table_paths.contains(&location.physical_table_path.get_table_path())
+            })
             .map(|(bucket, location)| (bucket.clone(), location.clone()))
             .collect();
 
@@ -175,15 +195,19 @@ impl Cluster {
 
         let mut table_id_by_path = HashMap::new();
         let mut table_info_by_path = HashMap::new();
+        let mut partitions_id_by_path = HashMap::new();
+        let mut tmp_available_locations_by_path = HashMap::new();
+        let mut tmp_available_location_by_bucket = HashMap::new();
+
         if let Some(origin) = origin_cluster {
             table_info_by_path.extend(origin.get_table_info_by_path().clone());
             table_id_by_path.extend(origin.get_table_id_by_path().clone());
+            partitions_id_by_path.extend(origin.partitions_id_by_path.clone());
+            tmp_available_locations_by_path.extend(origin.available_locations_by_path.clone());
+            tmp_available_location_by_bucket.extend(origin.available_locations_by_bucket.clone());
         }
 
-        // Index the bucket locations by table path, and index bucket location by bucket
-        let mut tmp_available_location_by_bucket = HashMap::new();
-        let mut tmp_available_locations_by_path = HashMap::new();
-
+        // iterate all table metadata
         for table_metadata in metadata_response.table_metadata {
             let table_id = table_metadata.table_id;
             let table_path = from_pb_table_path(&table_metadata.table_path);
@@ -207,39 +231,56 @@ impl Cluster {
             table_info_by_path.insert(table_path.clone(), table_info);
             table_id_by_path.insert(table_path.clone(), table_id);
 
-            // now, get bucket matadata
-            let mut found_unavailable_bucket = false;
-            let mut available_bucket_for_table = vec![];
-            let mut bucket_for_table = vec![];
-            for bucket_metadata in table_metadata.bucket_metadata {
-                let bucket_id = bucket_metadata.bucket_id;
-                let bucket = TableBucket::new(table_id, bucket_id);
-                let bucket_location;
-                if let Some(leader_id) = bucket_metadata.leader_id
-                    && let Some(server_node) = servers.get(&leader_id)
-                {
-                    bucket_location = BucketLocation::new(
-                        bucket.clone(),
-                        Some(server_node.clone()),
-                        table_path.clone(),
-                    );
-                    available_bucket_for_table.push(bucket_location.clone());
-                    tmp_available_location_by_bucket
-                        .insert(bucket.clone(), bucket_location.clone());
-                } else {
-                    found_unavailable_bucket = true;
-                    bucket_location = BucketLocation::new(bucket.clone(), None, table_path.clone());
-                }
-                bucket_for_table.push(bucket_location.clone());
+            let bucket_metadata = table_metadata.bucket_metadata;
+            let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+
+            let bucket_locations = get_bucket_locations(
+                &mut servers,
+                bucket_metadata.as_slice(),
+                table_id,
+                None,
+                &physical_table_path,
+            );
+            tmp_available_locations_by_path.insert(physical_table_path, bucket_locations);
+        }
+
+        // iterate all partition metadata
+        for partition_metadata in metadata_response.partition_metadata {
+            let table_id = partition_metadata.table_id;
+
+            if let Some(cluster) = origin_cluster {
+                let partition_name = partition_metadata.partition_name;
+                let table_path = cluster.get_table_path_by_id(table_id).unwrap();
+                let partition_id = partition_metadata.partition_id;
+
+                let physical_table_path = Arc::new(PhysicalTablePath::of_partitioned(
+                    Arc::new(table_path.clone()),
+                    Some(partition_name),
+                ));
+
+                partitions_id_by_path.insert(Arc::clone(&physical_table_path), partition_id);
+
+                let bucket_locations = get_bucket_locations(
+                    &mut servers,
+                    partition_metadata.bucket_metadata.as_slice(),
+                    table_id,
+                    Some(partition_id),
+                    &physical_table_path,
+                );
+
+                tmp_available_locations_by_path.insert(physical_table_path, bucket_locations);
             }
+        }
 
-            if found_unavailable_bucket {
-                tmp_available_locations_by_path
-                    .insert(table_path.clone(), available_bucket_for_table.clone());
-            } else {
-                tmp_available_locations_by_path.insert(table_path.clone(), bucket_for_table);
+        for bucket_locations in &mut tmp_available_locations_by_path.values() {
+            for location in bucket_locations {
+                if location.leader().is_some() {
+                    tmp_available_location_by_bucket
+                        .insert(location.table_bucket.clone(), location.clone());
+                }
             }
         }
+
         Ok(Cluster::new(
             coordinator_server,
             servers,
@@ -247,6 +288,7 @@ impl Cluster {
             tmp_available_location_by_bucket,
             table_id_by_path,
             table_info_by_path,
+            partitions_id_by_path,
         ))
     }
 
@@ -269,14 +311,43 @@ impl Cluster {
 
     pub fn get_table_bucket(
         &self,
-        table_path: &TablePath,
+        physical_table_path: &PhysicalTablePath,
         bucket_id: BucketId,
     ) -> Result<TableBucket> {
-        let table_info = self.get_table(table_path)?;
-        Ok(TableBucket::new(table_info.table_id, bucket_id))
+        let table_info = self.get_table(physical_table_path.get_table_path())?;
+        let partition_id = self.get_partition_id(physical_table_path);
+
+        if physical_table_path.get_partition_name().is_some() && partition_id.is_none() {
+            return Err(PartitionNotExist {
+                message: format!(
+                    "The partition {} is not found in cluster",
+                    physical_table_path.get_partition_name().unwrap()
+                ),
+            });
+        }
+
+        Ok(TableBucket::new_with_partition(
+            table_info.table_id,
+            partition_id,
+            bucket_id,
+        ))
     }
 
-    pub fn get_bucket_locations_by_path(&self) -> &HashMap<TablePath, Vec<BucketLocation>> {
+    pub fn get_partition_id(&self, physical_table_path: &PhysicalTablePath) -> Option<PartitionId> {
+        self.partitions_id_by_path.get(physical_table_path).copied()
+    }
+
+    pub fn get_partition_name(&self, partition_id: PartitionId) -> Option<&String> {
+        self.partition_name_by_id.get(&partition_id)
+    }
+
+    pub fn get_table_id(&self, table_path: &TablePath) -> Option<i64> {
+        self.table_id_by_path.get(table_path).copied()
+    }
+
+    pub fn get_bucket_locations_by_path(
+        &self,
+    ) -> &HashMap<Arc<PhysicalTablePath>, Vec<BucketLocation>> {
         &self.available_locations_by_path
     }
 
@@ -288,13 +359,13 @@ impl Cluster {
         &self.table_id_by_path
     }
 
-    pub fn get_table_path_by_id(&self, table_id: i64) -> Option<&TablePath> {
+    pub fn get_table_path_by_id(&self, table_id: TableId) -> Option<&TablePath> {
         self.table_path_by_id.get(&table_id)
     }
 
     pub fn get_available_buckets_for_table_path(
         &self,
-        table_path: &TablePath,
+        table_path: &PhysicalTablePath,
     ) -> &Vec<BucketLocation> {
         self.available_locations_by_path
             .get(table_path)
@@ -327,4 +398,37 @@ impl Cluster {
     pub fn opt_get_table(&self, table_path: &TablePath) -> Option<&TableInfo> {
         self.table_info_by_path.get(table_path)
     }
+
+    pub fn get_partition_id_by_path(&self) -> &HashMap<Arc<PhysicalTablePath>, PartitionId> {
+        &self.partitions_id_by_path
+    }
+}
+
+/// Builds the [`BucketLocation`] list for one physical table (or partition).
+///
+/// Every entry of `bucket_metadata` yields exactly one location, in input order.
+/// A location's leader is `Some` only when the metadata carries a leader id that
+/// is present in `servers`; otherwise it is `None`, so an entry may have no
+/// leader.
+///
+/// `servers` is only read here; it stays `&mut` so the existing call sites,
+/// which pass `&mut servers`, are unaffected.
+fn get_bucket_locations(
+    servers: &mut HashMap<i32, ServerNode>,
+    bucket_metadata: &[PbBucketMetadata],
+    table_id: TableId,
+    partition_id: Option<PartitionId>,
+    physical_table_path: &Arc<PhysicalTablePath>,
+) -> Vec<BucketLocation> {
+    bucket_metadata
+        .iter()
+        .map(|meta| {
+            // Resolve the leader id to a known server; unknown ids yield `None`.
+            let leader = meta
+                .leader_id
+                .and_then(|leader_id| servers.get(&leader_id).cloned());
+            let bucket = TableBucket::new_with_partition(table_id, partition_id, meta.bucket_id);
+            BucketLocation::new(bucket, leader, Arc::clone(physical_table_path))
+        })
+        .collect()
 }
diff --git a/fluss-rust/crates/fluss/src/cluster/mod.rs b/fluss-rust/crates/fluss/src/cluster/mod.rs
index f9d42e4453..58e80c00b0 100644
--- a/fluss-rust/crates/fluss/src/cluster/mod.rs
+++ b/fluss-rust/crates/fluss/src/cluster/mod.rs
@@ -16,7 +16,8 @@
 // under the License.
 
 use crate::BucketId;
-use crate::metadata::{TableBucket, TablePath};
+use crate::metadata::{PhysicalTablePath, TableBucket};
+use std::sync::Arc;
 
 #[allow(clippy::module_inception)]
 mod cluster;
@@ -69,19 +70,19 @@ pub enum ServerType {
 pub struct BucketLocation {
     pub table_bucket: TableBucket,
     leader: Option<ServerNode>,
-    pub table_path: TablePath,
+    physical_table_path: Arc<PhysicalTablePath>,
 }
 
 impl BucketLocation {
     pub fn new(
         table_bucket: TableBucket,
         leader: Option<ServerNode>,
-        table_path: TablePath,
+        physical_table_path: Arc<PhysicalTablePath>,
     ) -> BucketLocation {
         BucketLocation {
             table_bucket,
             leader,
-            table_path,
+            physical_table_path,
         }
     }
 
@@ -96,4 +97,8 @@ impl BucketLocation {
     pub fn bucket_id(&self) -> BucketId {
         self.table_bucket.bucket_id()
     }
+
+    pub fn physical_table_path(&self) -> &Arc<PhysicalTablePath> {
+        &self.physical_table_path
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index 68426d7c28..ef86530833 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -99,6 +99,12 @@ pub enum Error {
     )]
     InvalidPartition { message: String },
 
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss hitting partition not exist error {}.", message)
+    )]
+    PartitionNotExist { message: String },
+
     #[snafu(
         visibility(pub(crate)),
         display("Fluss hitting IO not supported error {}.", message)
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index e365237030..6431d3a97d 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -930,6 +930,15 @@ impl RowType {
         self.fields.iter().map(|f| f.name.as_str()).collect()
     }
 
+    pub fn project_with_field_names(&self, field_names: &[String]) -> Result<RowType> {
+        let indices: Vec<usize> = field_names
+            .iter()
+            .filter_map(|pk| self.get_field_index(pk))
+            .collect();
+
+        self.project(indices.as_slice())
+    }
+
     pub fn project(&self, project_field_positions: &[usize]) -> Result<RowType> {
         Ok(RowType::with_nullable(
             self.nullable,
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 7b93acae14..ce362c43be 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -25,6 +25,7 @@ use core::fmt;
 use serde::{Deserialize, Serialize};
 use std::collections::{HashMap, HashSet};
 use std::fmt::{Display, Formatter};
+use std::sync::Arc;
 use strum_macros::EnumString;
 
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
@@ -172,7 +173,7 @@ impl SchemaBuilder {
                 self
             }
             _ => {
-                panic!("data type msut be row type")
+                panic!("data type must be row type")
             }
         }
     }
@@ -325,7 +326,7 @@ pub struct TableDescriptorBuilder {
     schema: Option<Schema>,
     properties: HashMap<String, String>,
     custom_properties: HashMap<String, String>,
-    partition_keys: Vec<String>,
+    partition_keys: Arc<[String]>,
     comment: Option<String>,
     table_distribution: Option<TableDistribution>,
 }
@@ -374,7 +375,7 @@ impl TableDescriptorBuilder {
     }
 
     pub fn partitioned_by(mut self, partition_keys: Vec<String>) -> Self {
-        self.partition_keys = partition_keys;
+        self.partition_keys = Arc::from(partition_keys);
         self
     }
 
@@ -413,7 +414,7 @@ impl TableDescriptorBuilder {
 pub struct TableDescriptor {
     schema: Schema,
     comment: Option<String>,
-    partition_keys: Vec<String>,
+    partition_keys: Arc<[String]>,
     table_distribution: Option<TableDistribution>,
     properties: HashMap<String, String>,
     custom_properties: HashMap<String, String>,
@@ -749,19 +750,19 @@ impl TablePath {
 /// `partition_name` will be `Some(...)`; otherwise, it will be `None`.
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
 pub struct PhysicalTablePath {
-    table_path: TablePath,
+    table_path: Arc<TablePath>,
     partition_name: Option<String>,
 }
 
 impl PhysicalTablePath {
-    pub fn of(table_path: TablePath) -> Self {
+    pub fn of(table_path: Arc<TablePath>) -> Self {
         Self {
             table_path,
             partition_name: None,
         }
     }
 
-    pub fn of_partitioned(table_path: TablePath, partition_name: Option<String>) -> Self {
+    pub fn of_partitioned(table_path: Arc<TablePath>, partition_name: Option<String>) -> Self {
         Self {
             table_path,
             partition_name,
@@ -774,7 +775,7 @@ impl PhysicalTablePath {
         partition_name: Option<String>,
     ) -> Self {
         Self {
-            table_path: TablePath::new(database_name, table_name),
+            table_path: Arc::new(TablePath::new(database_name, table_name)),
             partition_name,
         }
     }
@@ -815,7 +816,7 @@ pub struct TableInfo {
     pub primary_keys: Vec<String>,
     pub physical_primary_keys: Vec<String>,
     pub bucket_keys: Vec<String>,
-    pub partition_keys: Vec<String>,
+    pub partition_keys: Arc<[String]>,
     pub num_buckets: i32,
     pub properties: HashMap<String, String>,
     pub table_config: TableConfig,
@@ -982,7 +983,7 @@ impl TableInfo {
         schema_id: i32,
         schema: Schema,
         bucket_keys: Vec<String>,
-        partition_keys: Vec<String>,
+        partition_keys: Arc<[String]>,
         num_buckets: i32,
         properties: HashMap<String, String>,
         custom_properties: HashMap<String, String>,
@@ -1080,7 +1081,7 @@ impl TableInfo {
                 .is_auto_partition_enabled()
     }
 
-    pub fn get_partition_keys(&self) -> &[String] {
+    pub fn get_partition_keys(&self) -> &Arc<[String]> {
         &self.partition_keys
     }
 
@@ -1115,7 +1116,7 @@ impl TableInfo {
     pub fn to_table_descriptor(&self) -> Result<TableDescriptor> {
         let mut builder = TableDescriptor::builder()
             .schema(self.schema.clone())
-            .partitioned_by(self.partition_keys.clone())
+            .partitioned_by(self.partition_keys.to_vec())
             .distributed_by(Some(self.num_buckets), self.bucket_keys.clone())
             .properties(self.properties.clone())
             .custom_properties(self.custom_properties.clone());
@@ -1177,6 +1178,18 @@ impl TableBucket {
         }
     }
 
+    pub fn new_with_partition(
+        table_id: TableId,
+        partition_id: Option<PartitionId>,
+        bucket: BucketId,
+    ) -> Self {
+        TableBucket {
+            table_id,
+            partition_id,
+            bucket,
+        }
+    }
+
     pub fn table_id(&self) -> TableId {
         self.table_id
     }
@@ -1308,7 +1321,7 @@ mod tests {
             1,
             schema.clone(),
             vec!["id".to_string()],
-            vec![], // No partition keys
+            Arc::from(vec![]), // No partition keys
             1,
             properties.clone(),
             HashMap::new(),
@@ -1329,7 +1342,7 @@ mod tests {
             1,
             schema.clone(),
             vec!["id".to_string()],
-            vec![], // No partition keys
+            Arc::from(vec![]), // No partition keys
             1,
             properties.clone(),
             HashMap::new(),
@@ -1350,7 +1363,7 @@ mod tests {
             1,
             schema.clone(),
             vec!["id".to_string()],
-            vec!["name".to_string()], // Partition keys
+            Arc::from(vec!["name".to_string()]), // Partition keys
             1,
             properties.clone(),
             HashMap::new(),
@@ -1371,7 +1384,7 @@ mod tests {
             1,
             schema.clone(),
             vec!["id".to_string()],
-            vec!["name".to_string()], // Partition keys
+            Arc::from(vec!["name".to_string()]), // Partition keys
             1,
             properties.clone(),
             HashMap::new(),
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 6340dc8022..726106b701 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -1450,6 +1450,7 @@ pub struct MyVec<T>(pub StreamReader<T>);
 mod tests {
     use super::*;
     use crate::metadata::{DataField, DataTypes, RowType};
+    use crate::test_utils::build_table_info;
 
     #[test]
     fn test_to_array_type() {
@@ -1932,7 +1933,7 @@ mod tests {
         use crate::compression::{
             ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
         };
-        use crate::metadata::TablePath;
+        use crate::metadata::{PhysicalTablePath, TablePath};
         use crate::row::GenericRow;
         use tempfile::NamedTempFile;
 
@@ -1941,7 +1942,9 @@ mod tests {
             DataField::new("id".to_string(), DataTypes::int(), None),
             DataField::new("name".to_string(), DataTypes::string(), None),
         ]);
-        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path)));
 
         let mut builder = MemoryLogRecordsArrowBuilder::new(
             1,
@@ -1956,13 +1959,15 @@ mod tests {
         let mut row = GenericRow::new(2);
         row.set_field(0, 1_i32);
         row.set_field(1, "alice");
-        let record = WriteRecord::for_append(table_path.clone(), 1, row);
+        let record =
+            WriteRecord::for_append(Arc::clone(&table_info), physical_table_path.clone(), 1, row);
         builder.append(&record)?;
 
         let mut row2 = GenericRow::new(2);
         row2.set_field(0, 2_i32);
         row2.set_field(1, "bob");
-        let record2 = WriteRecord::for_append(table_path, 2, row2);
+        let record2 =
+            WriteRecord::for_append(Arc::clone(&table_info), physical_table_path, 2, row2);
         builder.append(&record2)?;
 
         let data = builder.build()?;
diff --git a/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs b/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
index a6e6288609..1f0d88c2ae 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
@@ -15,14 +15,15 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::proto::{MetadataResponse, PbTablePath};
+use crate::metadata::{PhysicalTablePath, TablePath};
+use crate::proto::{MetadataResponse, PbPhysicalTablePath, PbTablePath};
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::ReadError;
 use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-
-use crate::metadata::TablePath;
-use crate::rpc::frame::ReadError;
+use std::collections::HashSet;
+use std::sync::Arc;
 
 use crate::{impl_read_version_type, impl_write_version_type, proto};
 use bytes::{Buf, BufMut};
@@ -33,7 +34,11 @@ pub struct UpdateMetadataRequest {
 }
 
 impl UpdateMetadataRequest {
-    pub fn new(table_paths: &[&TablePath]) -> Self {
+    pub fn new(
+        table_paths: &HashSet<&TablePath>,
+        physical_table_paths: &HashSet<&Arc<PhysicalTablePath>>,
+        partition_ids: Vec<i64>,
+    ) -> Self {
         UpdateMetadataRequest {
             inner_request: proto::MetadataRequest {
                 table_path: table_paths
@@ -43,8 +48,15 @@ impl UpdateMetadataRequest {
                         table_name: path.table().to_string(),
                     })
                     .collect(),
-                partitions_path: vec![],
-                partitions_id: vec![],
+                partitions_path: physical_table_paths
+                    .iter()
+                    .map(|path| PbPhysicalTablePath {
+                        database_name: path.get_database_name().to_string(),
+                        table_name: path.get_table_name().to_string(),
+                        partition_name: path.get_partition_name().map(|pn| pn.to_string()),
+                    })
+                    .collect(),
+                partitions_id: partition_ids,
             },
         }
     }
diff --git a/fluss-rust/crates/fluss/src/test_utils.rs b/fluss-rust/crates/fluss/src/test_utils.rs
index d1cd3ec712..8e8fbe4884 100644
--- a/fluss-rust/crates/fluss/src/test_utils.rs
+++ b/fluss-rust/crates/fluss/src/test_utils.rs
@@ -17,7 +17,8 @@
 
 use crate::cluster::{BucketLocation, Cluster, ServerNode, ServerType};
 use crate::metadata::{
-    DataField, DataTypes, Schema, TableBucket, TableDescriptor, TableInfo, TablePath,
+    DataField, DataTypes, PhysicalTablePath, Schema, TableBucket, TableDescriptor, TableInfo,
+    TablePath,
 };
 use std::collections::HashMap;
 use std::sync::Arc;
@@ -53,12 +54,15 @@ pub(crate) fn build_cluster(table_path: &TablePath, table_id: i64, buckets: i32)
         let bucket_location = BucketLocation::new(
             table_bucket.clone(),
             Some(server.clone()),
-            table_path.clone(),
+            Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone()))),
         );
         bucket_locations.push(bucket_location.clone());
         locations_by_bucket.insert(table_bucket, bucket_location);
     }
-    locations_by_path.insert(table_path.clone(), bucket_locations);
+    locations_by_path.insert(
+        Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone()))),
+        bucket_locations,
+    );
 
     let mut table_id_by_path = HashMap::new();
     table_id_by_path.insert(table_path.clone(), table_id);
@@ -76,6 +80,7 @@ pub(crate) fn build_cluster(table_path: &TablePath, table_id: i64, buckets: i32)
         locations_by_bucket,
         table_id_by_path,
         table_info_by_path,
+        HashMap::new(),
     )
 }
 
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index a4f2961760..b2263c2955 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -36,7 +36,7 @@ mod kv_table_test {
     use crate::integration::fluss_cluster::FlussTestingCluster;
     use crate::integration::utils::{create_table, get_cluster, start_cluster, stop_cluster};
     use fluss::client::UpsertWriter;
-    use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+    use fluss::metadata::{DataTypes, PartitionSpec, Schema, TableDescriptor, TablePath};
     use fluss::row::{GenericRow, InternalRow};
     use std::sync::Arc;
 
@@ -438,6 +438,179 @@ mod kv_table_test {
             .expect("Failed to drop table");
     }
 
+    #[tokio::test]
+    async fn partitioned_table_upsert_and_lookup() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path =
+            TablePath::new("fluss".to_string(), "test_partitioned_kv_table".to_string());
+
+        // Create a partitioned KV table with region as partition key
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("region", DataTypes::string())
+                    .column("user_id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .column("score", DataTypes::bigint())
+                    .primary_key(vec!["region".to_string(), "user_id".to_string()])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .partitioned_by(vec!["region".to_string()])
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        // Create partitions for each region before inserting data
+        for region in &["US", "EU", "APAC"] {
+            let mut partition_map = std::collections::HashMap::new();
+            partition_map.insert("region".to_string(), region.to_string());
+            let partition_spec = PartitionSpec::new(partition_map);
+            admin
+                .create_partition(&table_path, &partition_spec, false)
+                .await
+                .expect("Failed to create partition");
+        }
+
+        let connection = cluster.get_fluss_connection().await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+
+        let mut upsert_writer = table_upsert
+            .create_writer()
+            .expect("Failed to create writer");
+
+        // Insert records with different partitions
+        let test_data = [
+            ("US", 1, "Gustave", 100i64),
+            ("US", 2, "Lune", 200i64),
+            ("EU", 1, "Sciel", 150i64),
+            ("EU", 2, "Maelle", 250i64),
+            ("APAC", 1, "Noco", 300i64),
+        ];
+
+        for (region, user_id, name, score) in &test_data {
+            let mut row = GenericRow::new(4);
+            row.set_field(0, *region);
+            row.set_field(1, *user_id);
+            row.set_field(2, *name);
+            row.set_field(3, *score);
+            upsert_writer.upsert(&row).await.expect("Failed to upsert");
+        }
+
+        // Create lookuper
+        let mut lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .create_lookuper()
+            .expect("Failed to create lookuper");
+
+        // Lookup records - the lookup key includes partition key columns
+        for (region, user_id, expected_name, expected_score) in &test_data {
+            let mut key = GenericRow::new(4);
+            key.set_field(0, *region);
+            key.set_field(1, *user_id);
+
+            let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+            let row = result
+                .get_single_row()
+                .expect("Failed to get row")
+                .expect("Row should exist");
+
+            assert_eq!(row.get_string(0), *region, "region mismatch");
+            assert_eq!(row.get_int(1), *user_id, "user_id mismatch");
+            assert_eq!(row.get_string(2), *expected_name, "name mismatch");
+            assert_eq!(row.get_long(3), *expected_score, "score mismatch");
+        }
+
+        // Test update within a partition
+        let mut updated_row = GenericRow::new(4);
+        updated_row.set_field(0, "US");
+        updated_row.set_field(1, 1);
+        updated_row.set_field(2, "Gustave Updated");
+        updated_row.set_field(3, 999i64);
+        upsert_writer
+            .upsert(&updated_row)
+            .await
+            .expect("Failed to upsert updated row");
+
+        // Verify the update
+        let mut key = GenericRow::new(4);
+        key.set_field(0, "US");
+        key.set_field(1, 1);
+        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+        let row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+        assert_eq!(row.get_string(2), "Gustave Updated");
+        assert_eq!(row.get_long(3), 999);
+
+        // Lookup in non-existent partition should return empty result
+        let mut non_existent_key = GenericRow::new(4);
+        non_existent_key.set_field(0, "UNKNOWN_REGION");
+        non_existent_key.set_field(1, 1);
+        let result = lookuper
+            .lookup(&non_existent_key)
+            .await
+            .expect("Failed to lookup non-existent partition");
+        assert!(
+            result
+                .get_single_row()
+                .expect("Failed to get row")
+                .is_none(),
+            "Lookup in non-existent partition should return None"
+        );
+
+        // Delete a record within a partition
+        let mut delete_key = GenericRow::new(4);
+        delete_key.set_field(0, "EU");
+        delete_key.set_field(1, 1);
+        upsert_writer
+            .delete(&delete_key)
+            .await
+            .expect("Failed to delete");
+
+        // Verify deletion
+        let mut key = GenericRow::new(4);
+        key.set_field(0, "EU");
+        key.set_field(1, 1);
+        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+        assert!(
+            result
+                .get_single_row()
+                .expect("Failed to get row")
+                .is_none(),
+            "Deleted record should not exist"
+        );
+
+        // Verify other records in the same partition still exist
+        let mut key = GenericRow::new(4);
+        key.set_field(0, "EU");
+        key.set_field(1, 2);
+        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+        let row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+        assert_eq!(row.get_string(2), "Maelle");
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
     /// Integration test covering put and get operations for all supported datatypes.
     #[tokio::test]
     async fn all_supported_datatypes() {

From 9a61576136a9a5be37cf599cec399f779d5cb1d1 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sat, 31 Jan 2026 07:54:29 +0800
Subject: [PATCH 099/287] feat: support produce partitioned table (#228)

---
 fluss-rust/bindings/cpp/src/lib.rs            |   7 +-
 fluss-rust/bindings/python/src/table.rs       |   6 +-
 .../crates/examples/src/example_kv_table.rs   |   2 +-
 .../src/example_partitioned_kv_table.rs       |   2 +-
 .../crates/examples/src/example_table.rs      |   8 +-
 .../crates/fluss/src/client/table/append.rs   |  55 ++++++--
 .../src/client/table/log_fetch_buffer.rs      |   2 +-
 .../crates/fluss/src/client/table/mod.rs      |   4 +-
 .../src/client/table/partition_getter.rs      |  19 ++-
 .../crates/fluss/src/client/table/scanner.rs  |  13 +-
 .../crates/fluss/src/client/table/upsert.rs   |  67 +++++----
 .../crates/fluss/src/client/table/writer.rs   |  46 -------
 .../fluss/src/client/write/accumulator.rs     |  12 +-
 .../crates/fluss/src/client/write/batch.rs    |   2 +-
 .../crates/fluss/src/client/write/mod.rs      |   8 +-
 .../crates/fluss/src/client/write/sender.rs   |  15 +-
 fluss-rust/crates/fluss/src/io/storage.rs     |   2 +
 fluss-rust/crates/fluss/src/record/arrow.rs   |  54 +++++---
 fluss-rust/crates/fluss/src/row/column.rs     |  36 ++---
 .../fluss/src/row/compacted/compacted_row.rs  |  17 ++-
 fluss-rust/crates/fluss/src/row/mod.rs        |   2 +-
 .../fluss/tests/integration/kv_table.rs       |  17 +--
 .../integration/{table.rs => log_table.rs}    | 128 ++++++++++++++++--
 .../tests/integration/table_remote_scan.rs    |   7 +-
 .../crates/fluss/tests/integration/utils.rs   |  26 +++-
 fluss-rust/crates/fluss/tests/test_fluss.rs   |   2 +-
 26 files changed, 350 insertions(+), 209 deletions(-)
 delete mode 100644 fluss-rust/crates/fluss/src/client/table/writer.rs
 rename fluss-rust/crates/fluss/tests/integration/{table.rs => log_table.rs} (90%)

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 2d37763673..bd38a03963 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -508,7 +508,10 @@ impl Table {
             Err(e) => return Err(format!("Failed to create append: {e}")),
         };
 
-        let writer = table_append.create_writer();
+        let writer = match table_append.create_writer() {
+            Ok(w) => w,
+            Err(e) => return Err(format!("Failed to create writer: {e}")),
+        };
         let writer = Box::into_raw(Box::new(AppendWriter { inner: writer }));
         Ok(writer)
     }
@@ -580,7 +583,7 @@ impl AppendWriter {
     fn append(&mut self, row: &ffi::FfiGenericRow) -> ffi::FfiResult {
         let generic_row = types::ffi_row_to_core(row);
 
-        let result = RUNTIME.block_on(async { self.inner.append(generic_row).await });
+        let result = RUNTIME.block_on(async { self.inner.append(&generic_row).await });
 
         match result {
             Ok(_) => ok_result(),
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 404335058b..48f09e7ac1 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -68,7 +68,9 @@ impl FlussTable {
                 .new_append()
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
 
-            let rust_writer = table_append.create_writer();
+            let rust_writer = table_append
+                .create_writer()
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
 
             let py_writer = AppendWriter::from_core(rust_writer, table_info);
 
@@ -251,7 +253,7 @@ impl AppendWriter {
 
         future_into_py(py, async move {
             inner
-                .append(generic_row)
+                .append(&generic_row)
                 .await
                 .map_err(|e| FlussError::new_err(e.to_string()))
         })
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 032691e0a1..437da06b4c 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -16,7 +16,7 @@
 // under the License.
 
 use clap::Parser;
-use fluss::client::{FlussConnection, UpsertWriter};
+use fluss::client::FlussConnection;
 use fluss::config::Config;
 use fluss::error::Result;
 use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index a5e76fa38e..1b0c3035c4 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -16,7 +16,7 @@
 // under the License.
 
 use clap::Parser;
-use fluss::client::{FlussAdmin, FlussConnection, UpsertWriter};
+use fluss::client::{FlussAdmin, FlussConnection};
 use fluss::config::Config;
 use fluss::error::Result;
 use fluss::metadata::{DataTypes, PartitionSpec, Schema, TableDescriptor, TablePath};
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index 92055a702b..6c74e635ac 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -63,13 +63,13 @@ pub async fn main() -> Result<()> {
     row.set_field(2, 123_456_789_123i64);
 
     let table = conn.get_table(&table_path).await?;
-    let append_writer = table.new_append()?.create_writer();
-    let f1 = append_writer.append(row);
-    row = GenericRow::new(3);
+    let append_writer = table.new_append()?.create_writer()?;
+    let f1 = append_writer.append(&row);
+    let mut row = GenericRow::new(3);
     row.set_field(0, 233333);
     row.set_field(1, "tt44");
     row.set_field(2, 987_654_321_987i64);
-    let f2 = append_writer.append(row);
+    let f2 = append_writer.append(&row);
     try_join!(f1, f2, append_writer.flush())?;
 
     // scan rows
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
index 7fe2023bbb..ace91a607c 100644
--- a/fluss-rust/crates/fluss/src/client/table/append.rs
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -15,16 +15,16 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::client::table::partition_getter::{PartitionGetter, get_physical_path};
 use crate::client::{WriteRecord, WriterClient};
 use crate::error::Result;
 use crate::metadata::{PhysicalTablePath, TableInfo, TablePath};
-use crate::row::GenericRow;
+use crate::row::{ColumnarRow, InternalRow};
 use arrow::array::RecordBatch;
 use std::sync::Arc;
 
-#[allow(dead_code)]
 pub struct TableAppend {
-    table_path: TablePath,
+    table_path: Arc<TablePath>,
     table_info: Arc<TableInfo>,
     writer_client: Arc<WriterClient>,
 }
@@ -36,32 +36,48 @@ impl TableAppend {
         writer_client: Arc<WriterClient>,
     ) -> Self {
         Self {
-            table_path,
+            table_path: Arc::new(table_path),
             table_info,
             writer_client,
         }
     }
 
-    pub fn create_writer(&self) -> AppendWriter {
-        AppendWriter {
-            physical_table_path: Arc::new(PhysicalTablePath::of(Arc::new(self.table_path.clone()))),
+    pub fn create_writer(&self) -> Result<AppendWriter> {
+        let partition_getter = if self.table_info.is_partitioned() {
+            Some(PartitionGetter::new(
+                self.table_info.row_type(),
+                Arc::clone(self.table_info.get_partition_keys()),
+            )?)
+        } else {
+            None
+        };
+
+        Ok(AppendWriter {
+            table_path: Arc::clone(&self.table_path),
+            partition_getter,
             writer_client: self.writer_client.clone(),
             table_info: Arc::clone(&self.table_info),
-        }
+        })
     }
 }
 
 pub struct AppendWriter {
-    physical_table_path: Arc<PhysicalTablePath>,
+    table_path: Arc<TablePath>,
+    partition_getter: Option<PartitionGetter>,
     writer_client: Arc<WriterClient>,
     table_info: Arc<TableInfo>,
 }
 
 impl AppendWriter {
-    pub async fn append(&self, row: GenericRow<'_>) -> Result<()> {
+    pub async fn append<R: InternalRow>(&self, row: &R) -> Result<()> {
+        let physical_table_path = Arc::new(get_physical_path(
+            &self.table_path,
+            self.partition_getter.as_ref(),
+            row,
+        )?);
         let record = WriteRecord::for_append(
             Arc::clone(&self.table_info),
-            Arc::clone(&self.physical_table_path),
+            physical_table_path,
             self.table_info.schema_id,
             row,
         );
@@ -70,10 +86,25 @@ impl AppendWriter {
         result_handle.result(result)
     }
 
+    /// Appends an Arrow RecordBatch to the table.
+    ///
+    /// For partitioned tables, the partition is derived from the **first row** of the batch.
+    /// Callers must ensure all rows in the batch belong to the same partition.
     pub async fn append_arrow_batch(&self, batch: RecordBatch) -> Result<()> {
+        let physical_table_path = if self.partition_getter.is_some() && batch.num_rows() > 0 {
+            let first_row = ColumnarRow::new(Arc::new(batch.clone()));
+            Arc::new(get_physical_path(
+                &self.table_path,
+                self.partition_getter.as_ref(),
+                &first_row,
+            )?)
+        } else {
+            Arc::new(PhysicalTablePath::of(Arc::clone(&self.table_path)))
+        };
+
         let record = WriteRecord::for_append_record_batch(
             Arc::clone(&self.table_info),
-            Arc::clone(&self.physical_table_path),
+            physical_table_path,
             self.table_info.schema_id,
             batch,
         );
diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index 78ee065a4d..b622f19a08 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -917,7 +917,7 @@ mod tests {
         let mut row = GenericRow::new(2);
         row.set_field(0, 1_i32);
         row.set_field(1, "alice");
-        let record = WriteRecord::for_append(table_info, physical_table_path, 1, row);
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
         builder.append(&record)?;
 
         let data = builder.build()?;
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 2fbbbc917f..6d54933abc 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -31,16 +31,14 @@ mod partition_getter;
 mod remote_log;
 mod scanner;
 mod upsert;
-mod writer;
 
-use crate::client::table::upsert::TableUpsert;
 pub use append::{AppendWriter, TableAppend};
 pub use lookup::{LookupResult, Lookuper, TableLookup};
 pub use remote_log::{
     DEFAULT_SCANNER_REMOTE_LOG_DOWNLOAD_THREADS, DEFAULT_SCANNER_REMOTE_LOG_PREFETCH_NUM,
 };
 pub use scanner::{LogScanner, RecordBatchLogScanner, TableScan};
-pub use writer::{TableWriter, UpsertWriter};
+pub use upsert::{TableUpsert, UpsertWriter};
 
 #[allow(dead_code)]
 pub struct FlussTable<'a> {
diff --git a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
index 1a76106867..913680198d 100644
--- a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
+++ b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
@@ -17,12 +17,29 @@
 
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::{DataType, ResolvedPartitionSpec, RowType};
+use crate::metadata::{DataType, PhysicalTablePath, ResolvedPartitionSpec, RowType, TablePath};
 use crate::row::InternalRow;
 use crate::row::field_getter::FieldGetter;
 use crate::util::partition;
 use std::sync::Arc;
 
+/// Resolves the physical table path for `row`: the partition extracted from the row when a
+/// partition getter is given, otherwise the plain (non-partitioned) path of the table.
+pub fn get_physical_path<R: InternalRow>(
+    table_path: &Arc<TablePath>,
+    partition_getter: Option<&PartitionGetter>,
+    row: &R,
+) -> Result<PhysicalTablePath> {
+    let Some(getter) = partition_getter else {
+        return Ok(PhysicalTablePath::of(Arc::clone(table_path)));
+    };
+    let partition = getter.get_partition(row)?;
+    Ok(PhysicalTablePath::of_partitioned(
+        Arc::clone(table_path),
+        Some(partition),
+    ))
+}
+
 /// A getter to get partition name from a row.
 #[allow(dead_code)]
 pub struct PartitionGetter {
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 14d2841124..10e7fff5bf 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -1516,14 +1516,11 @@ mod tests {
             },
         )?;
         let physical_table_path = Arc::new(PhysicalTablePath::of(table_path));
-        let record = WriteRecord::for_append(
-            Arc::new(table_info.clone()),
-            physical_table_path,
-            1,
-            GenericRow {
-                values: vec![Datum::Int32(1)],
-            },
-        );
+        let row = GenericRow {
+            values: vec![Datum::Int32(1)],
+        };
+        let record =
+            WriteRecord::for_append(Arc::new(table_info.clone()), physical_table_path, 1, &row);
         builder.append(&record)?;
         builder.build()
     }
diff --git a/fluss-rust/crates/fluss/src/client/table/upsert.rs b/fluss-rust/crates/fluss/src/client/table/upsert.rs
index 269d5258f8..05953971af 100644
--- a/fluss-rust/crates/fluss/src/client/table/upsert.rs
+++ b/fluss-rust/crates/fluss/src/client/table/upsert.rs
@@ -15,17 +15,16 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::client::table::writer::{DeleteResult, TableWriter, UpsertResult, UpsertWriter};
 use crate::client::{RowBytes, WriteFormat, WriteRecord, WriterClient};
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::{PhysicalTablePath, RowType, TableInfo, TablePath};
+use crate::metadata::{RowType, TableInfo, TablePath};
 use crate::row::InternalRow;
 use crate::row::encode::{KeyEncoder, KeyEncoderFactory, RowEncoder, RowEncoderFactory};
 use crate::row::field_getter::FieldGetter;
 use std::sync::Arc;
 
-use crate::client::table::partition_getter::PartitionGetter;
+use crate::client::table::partition_getter::{PartitionGetter, get_physical_path};
 use bitvec::prelude::bitvec;
 use bytes::Bytes;
 
@@ -98,7 +97,7 @@ impl TableUpsert {
         self.partial_update(Some(valid_col_indices))
     }
 
-    pub fn create_writer(&self) -> Result<impl UpsertWriter> {
+    pub fn create_writer(&self) -> Result<UpsertWriter> {
         UpsertWriterFactory::create(
             Arc::new(self.table_path.clone()),
             Arc::new(self.table_info.clone()),
@@ -108,10 +107,7 @@ impl TableUpsert {
     }
 }
 
-struct UpsertWriterImpl<RE>
-where
-    RE: RowEncoder,
-{
+pub struct UpsertWriter {
     table_path: Arc<TablePath>,
     writer_client: Arc<WriterClient>,
     partition_field_getter: Option<PartitionGetter>,
@@ -120,7 +116,7 @@ where
     // Use primary key encoder as bucket key encoder when None
     bucket_key_encoder: Option<Box<dyn KeyEncoder>>,
     write_format: WriteFormat,
-    row_encoder: RE,
+    row_encoder: Box<dyn RowEncoder>,
     field_getters: Box<[FieldGetter]>,
     table_info: Arc<TableInfo>,
 }
@@ -133,7 +129,7 @@ impl UpsertWriterFactory {
         table_info: Arc<TableInfo>,
         partial_update_columns: Option<Arc<Vec<usize>>>,
         writer_client: Arc<WriterClient>,
-    ) -> Result<impl UpsertWriter> {
+    ) -> Result<UpsertWriter> {
         let data_lake_format = &table_info.table_config.get_datalake_format()?;
         let row_type = table_info.row_type();
         let physical_pks = table_info.get_physical_primary_keys();
@@ -173,7 +169,7 @@ impl UpsertWriterFactory {
             None
         };
 
-        Ok(UpsertWriterImpl {
+        Ok(UpsertWriter {
             table_path,
             partition_field_getter,
             writer_client,
@@ -181,7 +177,7 @@ impl UpsertWriterFactory {
             target_columns: partial_update_columns,
             bucket_key_encoder,
             write_format,
-            row_encoder: RowEncoderFactory::create(kv_format, row_type.clone())?,
+            row_encoder: Box::new(RowEncoderFactory::create(kv_format, row_type.clone())?),
             field_getters,
             table_info: table_info.clone(),
         })
@@ -283,8 +279,7 @@ impl UpsertWriterFactory {
     }
 }
 
-#[allow(dead_code)]
-impl<RE: RowEncoder> UpsertWriterImpl<RE> {
+impl UpsertWriter {
     fn check_field_count<R: InternalRow>(&self, row: &R) -> Result<()> {
         let expected = self.table_info.get_row_type().fields().len();
         if row.get_field_count() != expected {
@@ -317,31 +312,15 @@ impl<RE: RowEncoder> UpsertWriterImpl<RE> {
         self.row_encoder.finish_row()
     }
 
-    fn get_physical_path<R: InternalRow>(&self, row: &R) -> Result<PhysicalTablePath> {
-        if let Some(partition_getter) = &self.partition_field_getter {
-            let partition = partition_getter.get_partition(row);
-            Ok(PhysicalTablePath::of_partitioned(
-                Arc::clone(&self.table_path),
-                Some(partition?),
-            ))
-        } else {
-            Ok(PhysicalTablePath::of(Arc::clone(&self.table_path)))
-        }
-    }
-}
-
-impl<RE: RowEncoder> TableWriter for UpsertWriterImpl<RE> {
     /// Flush data written that have not yet been sent to the server, forcing the client to send the
     /// requests to server and blocks on the completion of the requests associated with these
     /// records. A request is considered completed when it is successfully acknowledged according to
     /// the CLIENT_WRITER_ACKS configuration option you have specified or else it
     /// results in an error.
-    async fn flush(&self) -> Result<()> {
+    pub async fn flush(&self) -> Result<()> {
         self.writer_client.flush().await
     }
-}
 
-impl<RE: RowEncoder> UpsertWriter for UpsertWriterImpl<RE> {
     /// Inserts row into Fluss table if they do not already exist, or updates them if they do exist.
     ///
     /// # Arguments
@@ -349,7 +328,7 @@ impl<RE: RowEncoder> UpsertWriter for UpsertWriterImpl<RE> {
     ///
     /// # Returns
     /// Ok(UpsertResult) when completed normally
-    async fn upsert<R: InternalRow>(&mut self, row: &R) -> Result<UpsertResult> {
+    pub async fn upsert<R: InternalRow>(&mut self, row: &R) -> Result<UpsertResult> {
         self.check_field_count(row)?;
 
         let (key, bucket_key) = self.get_keys(row)?;
@@ -361,7 +340,11 @@ impl<RE: RowEncoder> UpsertWriter for UpsertWriterImpl<RE> {
 
         let write_record = WriteRecord::for_upsert(
             Arc::clone(&self.table_info),
-            Arc::new(self.get_physical_path(row)?),
+            Arc::new(get_physical_path(
+                &self.table_path,
+                self.partition_field_getter.as_ref(),
+                row,
+            )?),
             self.table_info.schema_id,
             key,
             bucket_key,
@@ -384,14 +367,18 @@ impl<RE: RowEncoder> UpsertWriter for UpsertWriterImpl<RE> {
     ///
     /// # Returns
     /// Ok(DeleteResult) when completed normally
-    async fn delete<R: InternalRow>(&mut self, row: &R) -> Result<DeleteResult> {
+    pub async fn delete<R: InternalRow>(&mut self, row: &R) -> Result<DeleteResult> {
         self.check_field_count(row)?;
 
         let (key, bucket_key) = self.get_keys(row)?;
 
         let write_record = WriteRecord::for_upsert(
             Arc::clone(&self.table_info),
-            Arc::new(self.get_physical_path(row)?),
+            Arc::new(get_physical_path(
+                &self.table_path,
+                self.partition_field_getter.as_ref(),
+                row,
+            )?),
             self.table_info.schema_id,
             key,
             bucket_key,
@@ -537,3 +524,13 @@ mod tests {
         ));
     }
 }
+
+/// The result of upserting a record.
+/// Currently this is an empty struct to allow for compatible evolution in the future.
+#[derive(Default)]
+pub struct UpsertResult;
+
+/// The result of deleting a record.
+/// Currently this is an empty struct to allow for compatible evolution in the future.
+#[derive(Default)]
+pub struct DeleteResult;
diff --git a/fluss-rust/crates/fluss/src/client/table/writer.rs b/fluss-rust/crates/fluss/src/client/table/writer.rs
deleted file mode 100644
index ec26ec63dd..0000000000
--- a/fluss-rust/crates/fluss/src/client/table/writer.rs
+++ /dev/null
@@ -1,46 +0,0 @@
-// Licensed to the Apache Software Foundation (ASF) under one
-// or more contributor license agreements.  See the NOTICE file
-// distributed with this work for additional information
-// regarding copyright ownership.  The ASF licenses this file
-// to you under the Apache License, Version 2.0 (the
-// "License"); you may not use this file except in compliance
-// with the License.  You may obtain a copy of the License at
-//
-//   http://www.apache.org/licenses/LICENSE-2.0
-//
-// Unless required by applicable law or agreed to in writing,
-// software distributed under the License is distributed on an
-// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-// KIND, either express or implied.  See the License for the
-// specific language governing permissions and limitations
-// under the License.
-
-use crate::row::{GenericRow, InternalRow};
-
-use crate::error::Result;
-
-#[allow(dead_code, async_fn_in_trait)]
-pub trait TableWriter {
-    async fn flush(&self) -> Result<()>;
-}
-
-#[allow(dead_code)]
-pub trait AppendWriter: TableWriter {
-    async fn append(&self, row: GenericRow) -> Result<()>;
-}
-
-#[allow(dead_code, async_fn_in_trait)]
-pub trait UpsertWriter: TableWriter {
-    async fn upsert<R: InternalRow>(&mut self, row: &R) -> Result<UpsertResult>;
-    async fn delete<R: InternalRow>(&mut self, row: &R) -> Result<DeleteResult>;
-}
-
-/// The result of upserting a record
-/// Currently this is an empty struct to allow for compatible evolution in the future
-#[derive(Default)]
-pub struct UpsertResult;
-
-/// The result of deleting a record
-/// Currently this is an empty struct to allow for compatible evolution in the future
-#[derive(Default)]
-pub struct DeleteResult;
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 2a45517306..5eae868dd7 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -599,14 +599,10 @@ mod tests {
         let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
         let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
         let cluster = Arc::new(build_cluster(&table_path, 1, 1));
-        let record = WriteRecord::for_append(
-            table_info,
-            physical_table_path,
-            1,
-            GenericRow {
-                values: vec![Datum::Int32(1)],
-            },
-        );
+        let row = GenericRow {
+            values: vec![Datum::Int32(1)],
+        };
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
 
         accumulator.append(&record, 0, &cluster, false).await?;
 
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index da30c8aca4..c765473096 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -426,7 +426,7 @@ mod tests {
                     Arc::clone(&table_info),
                     Arc::clone(&physical_table_path),
                     1,
-                    row,
+                    &row,
                 );
                 batch.try_append(&record).unwrap();
             }
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index 868b582c2a..25a0db61b2 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -22,7 +22,7 @@ use crate::client::broadcast::{self as client_broadcast, BatchWriteResult, Broad
 use crate::error::Error;
 use crate::metadata::{PhysicalTablePath, TableInfo};
 
-use crate::row::GenericRow;
+use crate::row::InternalRow;
 pub use accumulator::*;
 use arrow::array::RecordBatch;
 use bytes::Bytes;
@@ -64,7 +64,7 @@ pub enum Record<'a> {
 }
 
 pub enum LogWriteRecord<'a> {
-    Generic(GenericRow<'a>),
+    InternalRow(&'a dyn InternalRow),
     RecordBatch(Arc<RecordBatch>),
 }
 
@@ -112,11 +112,11 @@ impl<'a> WriteRecord<'a> {
         table_info: Arc<TableInfo>,
         physical_table_path: Arc<PhysicalTablePath>,
         schema_id: i32,
-        row: GenericRow<'a>,
+        row: &'a dyn InternalRow,
     ) -> Self {
         Self {
             table_info,
-            record: Record::Log(LogWriteRecord::Generic(row)),
+            record: Record::Log(LogWriteRecord::InternalRow(row)),
             physical_table_path,
             bucket_key: None,
             schema_id,
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index 6a7dad002c..f336d0cdca 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -103,8 +103,7 @@ impl Sender {
                         if api_error.code == FlussError::PartitionNotExists.code() =>
                     {
                         warn!(
-                            "Partition does not exist during metadata update, continuing: {}",
-                            api_error
+                            "Partition does not exist during metadata update, continuing: {api_error}"
                         );
                     }
                     _ => return Err(e),
@@ -664,14 +663,10 @@ mod tests {
     ) -> Result<(ReadyWriteBatch, crate::client::ResultHandle)> {
         let table_info = Arc::new(build_table_info(table_path.as_ref().clone(), 1, 1));
         let physical_table_path = Arc::new(PhysicalTablePath::of(table_path));
-        let record = WriteRecord::for_append(
-            table_info,
-            physical_table_path,
-            1,
-            GenericRow {
-                values: vec![Datum::Int32(1)],
-            },
-        );
+        let row = GenericRow {
+            values: vec![Datum::Int32(1)],
+        };
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
         let result = accumulator.append(&record, 0, &cluster, false).await?;
         let result_handle = result.result_handle.expect("result handle");
         let server = cluster.get_tablet_server(1).expect("server");
diff --git a/fluss-rust/crates/fluss/src/io/storage.rs b/fluss-rust/crates/fluss/src/io/storage.rs
index a370861094..a57351783e 100644
--- a/fluss-rust/crates/fluss/src/io/storage.rs
+++ b/fluss-rust/crates/fluss/src/io/storage.rs
@@ -19,6 +19,8 @@ use crate::error;
 use crate::error::Result;
 use crate::io::FileIOBuilder;
 use opendal::{Operator, Scheme};
+#[cfg(any(feature = "storage-s3", feature = "storage-oss"))]
+use std::collections::HashMap;
 
 /// The storage carries all supported storage services in fluss
 #[derive(Debug)]
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 726106b701..b798896ace 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -20,7 +20,8 @@ use crate::compression::ArrowCompressionInfo;
 use crate::error::{Error, Result};
 use crate::metadata::{DataType, RowType};
 use crate::record::{ChangeType, ScanRecord};
-use crate::row::{ColumnarRow, GenericRow};
+use crate::row::field_getter::FieldGetter;
+use crate::row::{ColumnarRow, InternalRow};
 use arrow::array::{
     ArrayBuilder, ArrayRef, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
     Float32Builder, Float64Builder, Int8Builder, Int16Builder, Int32Builder, Int64Builder,
@@ -166,7 +167,7 @@ pub struct MemoryLogRecordsArrowBuilder {
 pub trait ArrowRecordBatchInnerBuilder: Send + Sync {
     fn build_arrow_record_batch(&mut self) -> Result<Arc<RecordBatch>>;
 
-    fn append(&mut self, row: &GenericRow) -> Result<bool>;
+    fn append(&mut self, row: &dyn InternalRow) -> Result<bool>;
 
     fn append_batch(&mut self, record_batch: Arc<RecordBatch>) -> Result<bool>;
 
@@ -191,7 +192,7 @@ impl ArrowRecordBatchInnerBuilder for PrebuiltRecordBatchBuilder {
         Ok(self.arrow_record_batch.as_ref().unwrap().clone())
     }
 
-    fn append(&mut self, _row: &GenericRow) -> Result<bool> {
+    fn append(&mut self, _row: &dyn InternalRow) -> Result<bool> {
         // append one single row is not supported, return false directly
         Ok(false)
     }
@@ -229,6 +230,7 @@ impl ArrowRecordBatchInnerBuilder for PrebuiltRecordBatchBuilder {
 pub struct RowAppendRecordBatchBuilder {
     table_schema: SchemaRef,
     arrow_column_builders: Vec<Box<dyn ArrayBuilder>>,
+    field_getters: Box<[FieldGetter]>,
     records_count: i32,
 }
 
@@ -240,9 +242,11 @@ impl RowAppendRecordBatchBuilder {
             .iter()
             .map(|field| Self::create_builder(field.data_type()))
             .collect();
+        let field_getters = FieldGetter::create_field_getters(row_type);
         Ok(Self {
             table_schema: schema_ref.clone(),
             arrow_column_builders: builders?,
+            field_getters,
             records_count: 0,
         })
     }
@@ -346,11 +350,18 @@ impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
         )?))
     }
 
-    fn append(&mut self, row: &GenericRow) -> Result<bool> {
-        for (idx, value) in row.values.iter().enumerate() {
+    fn append(&mut self, row: &dyn InternalRow) -> Result<bool> {
+        for (idx, getter) in self.field_getters.iter().enumerate() {
+            let datum = getter.get_field(row);
             let field_type = self.table_schema.field(idx).data_type();
-            let builder = self.arrow_column_builders.get_mut(idx).unwrap();
-            value.append_to(builder.as_mut(), field_type)?;
+            let builder =
+                self.arrow_column_builders
+                    .get_mut(idx)
+                    .ok_or_else(|| Error::UnexpectedError {
+                        message: format!("Column builder at index {idx} not found."),
+                        source: None,
+                    })?;
+            datum.append_to(builder, field_type)?;
         }
         self.records_count += 1;
         Ok(true)
@@ -412,7 +423,9 @@ impl MemoryLogRecordsArrowBuilder {
     pub fn append(&mut self, record: &WriteRecord) -> Result<bool> {
         match &record.record() {
             Record::Log(log_write_record) => match log_write_record {
-                LogWriteRecord::Generic(row) => Ok(self.arrow_record_batch_builder.append(row)?),
+                LogWriteRecord::InternalRow(row) => {
+                    Ok(self.arrow_record_batch_builder.append(*row)?)
+                }
                 LogWriteRecord::RecordBatch(record_batch) => Ok(self
                     .arrow_record_batch_builder
                     .append_batch(record_batch.clone())?),
@@ -1715,9 +1728,10 @@ mod tests {
         )]);
         let mut builder = RowAppendRecordBatchBuilder::new(&row_type)?;
         let decimal = Decimal::from_big_decimal(BigDecimal::from_str("123.456").unwrap(), 10, 3)?;
-        builder.append(&GenericRow {
+        let row = GenericRow {
             values: vec![Datum::Decimal(decimal)],
-        })?;
+        };
+        builder.append(&row)?;
         let batch = builder.build_arrow_record_batch()?;
         let array = batch
             .column(0)
@@ -1735,9 +1749,10 @@ mod tests {
         )]);
         let mut builder = RowAppendRecordBatchBuilder::new(&row_type)?;
         let decimal = Decimal::from_big_decimal(BigDecimal::from_str("123456.78").unwrap(), 10, 2)?;
-        let result = builder.append(&GenericRow {
+        let row = GenericRow {
             values: vec![Datum::Decimal(decimal)],
-        });
+        };
+        let result = builder.append(&row);
         assert!(result.is_err());
         assert!(
             result
@@ -1832,7 +1847,7 @@ mod tests {
         let mut builder = RowAppendRecordBatchBuilder::new(&row_type)?;
 
         // Append rows with various data types
-        builder.append(&GenericRow {
+        let row = GenericRow {
             values: vec![
                 Datum::Int32(1),
                 Datum::Decimal(Decimal::from_big_decimal(
@@ -1851,7 +1866,8 @@ mod tests {
                 // 1609459200000 ms = 2021-01-01 00:00:00 UTC, with 987654 additional nanoseconds
                 Datum::TimestampLtz(TimestampLtz::from_millis_nanos(1609459200000, 987654)?),
             ],
-        })?;
+        };
+        builder.append(&row)?;
 
         let batch = builder.build_arrow_record_batch()?;
 
@@ -1959,15 +1975,19 @@ mod tests {
         let mut row = GenericRow::new(2);
         row.set_field(0, 1_i32);
         row.set_field(1, "alice");
-        let record =
-            WriteRecord::for_append(Arc::clone(&table_info), physical_table_path.clone(), 1, row);
+        let record = WriteRecord::for_append(
+            Arc::clone(&table_info),
+            physical_table_path.clone(),
+            1,
+            &row,
+        );
         builder.append(&record)?;
 
         let mut row2 = GenericRow::new(2);
         row2.set_field(0, 2_i32);
         row2.set_field(1, "bob");
         let record2 =
-            WriteRecord::for_append(Arc::clone(&table_info), physical_table_path, 2, row2);
+            WriteRecord::for_append(Arc::clone(&table_info), physical_table_path, 2, &row2);
         builder.append(&record2)?;
 
         let data = builder.build()?;
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index f48075b369..50db32b14d 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -248,6 +248,24 @@ impl InternalRow for ColumnarRow {
             .value(self.row_id)
     }
 
+    fn get_char(&self, pos: usize, _length: usize) -> &str {
+        self.record_batch
+            .column(pos)
+            .as_any()
+            .downcast_ref::<StringArray>()
+            .expect("Expected String array for char type")
+            .value(self.row_id)
+    }
+
+    fn get_string(&self, pos: usize) -> &str {
+        self.record_batch
+            .column(pos)
+            .as_any()
+            .downcast_ref::<StringArray>()
+            .expect("Expected String array.")
+            .value(self.row_id)
+    }
+
     fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> crate::row::Decimal {
         use arrow::datatypes::DataType;
 
@@ -327,24 +345,6 @@ impl InternalRow for ColumnarRow {
         )
     }
 
-    fn get_char(&self, pos: usize, _length: usize) -> &str {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<StringArray>()
-            .expect("Expected String array for char type")
-            .value(self.row_id)
-    }
-
-    fn get_string(&self, pos: usize) -> &str {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<StringArray>()
-            .expect("Expected String array.")
-            .value(self.row_id)
-    }
-
     fn get_binary(&self, pos: usize, _length: usize) -> &[u8] {
         self.record_batch
             .column(pos)
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index 35d684db6f..232220720c 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -76,7 +76,6 @@ impl<'a> CompactedRow<'a> {
     }
 }
 
-#[allow(dead_code)]
 impl<'a> InternalRow for CompactedRow<'a> {
     fn get_field_count(&self) -> usize {
         self.arity
@@ -125,14 +124,6 @@ impl<'a> InternalRow for CompactedRow<'a> {
         self.decoded_row().get_string(pos)
     }
 
-    fn get_binary(&self, pos: usize, length: usize) -> &[u8] {
-        self.decoded_row().get_binary(pos, length)
-    }
-
-    fn get_bytes(&self, pos: usize) -> &[u8] {
-        self.decoded_row().get_bytes(pos)
-    }
-
     fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> crate::row::Decimal {
         self.decoded_row().get_decimal(pos, precision, scale)
     }
@@ -153,6 +144,14 @@ impl<'a> InternalRow for CompactedRow<'a> {
         self.decoded_row().get_timestamp_ltz(pos, precision)
     }
 
+    fn get_binary(&self, pos: usize, length: usize) -> &[u8] {
+        self.decoded_row().get_binary(pos, length)
+    }
+
+    fn get_bytes(&self, pos: usize) -> &[u8] {
+        self.decoded_row().get_bytes(pos)
+    }
+
     fn as_encoded_bytes(&self, write_format: WriteFormat) -> Option<&[u8]> {
         match write_format {
             WriteFormat::CompactedKv => Some(self.as_bytes()),
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index f7c8bec5dc..276dcca38e 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -55,7 +55,7 @@ impl<'a> BinaryRow<'a> {
 }
 
 // TODO make functions return Result<?> for better error handling
-pub trait InternalRow {
+pub trait InternalRow: Send + Sync {
     /// Returns the number of fields in this row
     fn get_field_count(&self) -> usize;
 
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index b2263c2955..3691d655a4 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -34,9 +34,10 @@ static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>>
 mod kv_table_test {
     use super::SHARED_FLUSS_CLUSTER;
     use crate::integration::fluss_cluster::FlussTestingCluster;
-    use crate::integration::utils::{create_table, get_cluster, start_cluster, stop_cluster};
-    use fluss::client::UpsertWriter;
-    use fluss::metadata::{DataTypes, PartitionSpec, Schema, TableDescriptor, TablePath};
+    use crate::integration::utils::{
+        create_partitions, create_table, get_cluster, start_cluster, stop_cluster,
+    };
+    use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
     use fluss::row::{GenericRow, InternalRow};
     use std::sync::Arc;
 
@@ -467,15 +468,7 @@ mod kv_table_test {
         create_table(&admin, &table_path, &table_descriptor).await;
 
         // Create partitions for each region before inserting data
-        for region in &["US", "EU", "APAC"] {
-            let mut partition_map = std::collections::HashMap::new();
-            partition_map.insert("region".to_string(), region.to_string());
-            let partition_spec = PartitionSpec::new(partition_map);
-            admin
-                .create_partition(&table_path, &partition_spec, false)
-                .await
-                .expect("Failed to create partition");
-        }
+        create_partitions(&admin, &table_path, "region", &["US", "EU", "APAC"]).await;
 
         let connection = cluster.get_fluss_connection().await;
 
diff --git a/fluss-rust/crates/fluss/tests/integration/table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
similarity index 90%
rename from fluss-rust/crates/fluss/tests/integration/table.rs
rename to fluss-rust/crates/fluss/tests/integration/log_table.rs
index 6a15674076..64e6289cee 100644
--- a/fluss-rust/crates/fluss/tests/integration/table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -34,7 +34,9 @@ static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>>
 mod table_test {
     use super::SHARED_FLUSS_CLUSTER;
     use crate::integration::fluss_cluster::FlussTestingCluster;
-    use crate::integration::utils::{create_table, get_cluster, start_cluster, stop_cluster};
+    use crate::integration::utils::{
+        create_partitions, create_table, get_cluster, start_cluster, stop_cluster,
+    };
     use arrow::array::record_batch;
     use fluss::client::{FlussTable, TableScan};
     use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
@@ -44,6 +46,8 @@ mod table_test {
     use jiff::Timestamp;
     use std::collections::HashMap;
     use std::sync::Arc;
+    use std::sync::atomic::AtomicUsize;
+    use std::sync::atomic::Ordering;
     use std::time::Duration;
 
     fn before_all() {
@@ -91,7 +95,8 @@ mod table_test {
         let append_writer = table
             .new_append()
             .expect("Failed to create append")
-            .create_writer();
+            .create_writer()
+            .expect("Failed to create writer");
 
         let batch1 =
             record_batch!(("c1", Int32, [1, 2, 3]), ("c2", Utf8, ["a1", "a2", "a3"])).unwrap();
@@ -217,7 +222,8 @@ mod table_test {
             .expect("Failed to get table")
             .new_append()
             .expect("Failed to create append")
-            .create_writer();
+            .create_writer()
+            .expect("Failed to create writer");
 
         let batch = record_batch!(
             ("id", Int32, [1, 2, 3]),
@@ -314,7 +320,8 @@ mod table_test {
         let append_writer = table
             .new_append()
             .expect("Failed to create append")
-            .create_writer();
+            .create_writer()
+            .expect("Failed to create writer");
 
         let batch = record_batch!(
             ("col_a", Int32, [1, 2, 3]),
@@ -472,7 +479,7 @@ mod table_test {
                 .is_empty()
         );
 
-        let writer = table.new_append().unwrap().create_writer();
+        let writer = table.new_append().unwrap().create_writer().unwrap();
         writer
             .append_arrow_batch(
                 record_batch!(("id", Int32, [1, 2]), ("name", Utf8, ["a", "b"])).unwrap(),
@@ -676,7 +683,8 @@ mod table_test {
         let append_writer = table
             .new_append()
             .expect("Failed to create append")
-            .create_writer();
+            .create_writer()
+            .expect("Failed to create writer");
 
         // Test data for all datatypes
         let col_tinyint = 127i8;
@@ -749,7 +757,7 @@ mod table_test {
         row.set_field(27, col_timestamp_ltz_ns_neg.clone());
 
         append_writer
-            .append(row)
+            .append(&row)
             .await
             .expect("Failed to append row with all datatypes");
 
@@ -760,7 +768,7 @@ mod table_test {
         }
 
         append_writer
-            .append(row_with_nulls)
+            .append(&row_with_nulls)
             .await
             .expect("Failed to append row with nulls");
 
@@ -967,4 +975,108 @@ mod table_test {
             .await
             .expect("Failed to drop table");
     }
+
+    #[tokio::test]
+    async fn partitioned_table_append() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new(
+            "fluss".to_string(),
+            "test_partitioned_log_append".to_string(),
+        );
+
+        // Create a partitioned log table
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("region", DataTypes::string())
+                    .column("value", DataTypes::bigint())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .partitioned_by(vec!["region".to_string()])
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        // Create partitions
+        create_partitions(&admin, &table_path, "region", &["US", "EU"]).await;
+
+        // Wait for partitions to be available
+        tokio::time::sleep(Duration::from_secs(2)).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        // Create append writer - this should now work for partitioned tables
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        // Append records with different partitions
+        let test_data = [
+            (1, "US", 100i64),
+            (2, "US", 200i64),
+            (3, "EU", 300i64),
+            (4, "EU", 400i64),
+        ];
+
+        for (id, region, value) in &test_data {
+            let mut row = fluss::row::GenericRow::new(3);
+            row.set_field(0, *id);
+            row.set_field(1, *region);
+            row.set_field(2, *value);
+            append_writer
+                .append(&row)
+                .await
+                .expect("Failed to append row");
+        }
+
+        append_writer.flush().await.expect("Failed to flush");
+
+        // Test append_arrow_batch for partitioned tables
+        // Each batch must contain rows from the same partition
+        let us_batch = record_batch!(
+            ("id", Int32, [5, 6]),
+            ("region", Utf8, ["US", "US"]),
+            ("value", Int64, [500, 600])
+        )
+        .unwrap();
+        append_writer
+            .append_arrow_batch(us_batch)
+            .await
+            .expect("Failed to append US batch");
+
+        let eu_batch = record_batch!(
+            ("id", Int32, [7, 8]),
+            ("region", Utf8, ["EU", "EU"]),
+            ("value", Int64, [700, 800])
+        )
+        .unwrap();
+        append_writer
+            .append_arrow_batch(eu_batch)
+            .await
+            .expect("Failed to append EU batch");
+
+        append_writer
+            .flush()
+            .await
+            .expect("Failed to flush batches");
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+
+        // todo: add scan test in 203
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index c83da0f23c..ce0c1371c0 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -40,10 +40,10 @@ mod table_remote_scan_test {
     use fluss::row::{GenericRow, InternalRow};
     use std::collections::HashMap;
     use std::sync::Arc;
+    use std::sync::atomic::AtomicUsize;
     use std::thread;
     use std::time::Duration;
     use uuid::Uuid;
-
     fn before_all() {
         // Create a new tokio runtime in a separate thread
         let cluster_lock = SHARED_FLUSS_CLUSTER.clone();
@@ -141,7 +141,8 @@ mod table_remote_scan_test {
         let append_writer = table
             .new_append()
             .expect("Failed to create append")
-            .create_writer();
+            .create_writer()
+            .expect("Failed to create writer");
 
         // append 20 rows, there must be some tiered to remote
         let record_count = 20;
@@ -151,7 +152,7 @@ mod table_remote_scan_test {
             let v = format!("v{}", i);
             row.set_field(1, v.as_str());
             append_writer
-                .append(row)
+                .append(&row)
                 .await
                 .expect("Failed to append row");
         }
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index 4d0c349f0c..fd5145a73c 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -17,8 +17,9 @@
  */
 use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
 use fluss::client::FlussAdmin;
-use fluss::metadata::{TableDescriptor, TablePath};
+use fluss::metadata::{PartitionSpec, TableDescriptor, TablePath};
 use parking_lot::RwLock;
+use std::collections::HashMap;
 use std::sync::Arc;
 use std::time::Duration;
 
@@ -102,3 +103,26 @@ pub fn get_cluster(cluster_lock: &RwLock<Option<FlussTestingCluster>>) -> Arc<Fl
             .clone(),
     )
 }
+
+/// Creates partitions for a partitioned table.
+///
+/// # Arguments
+/// * `admin` - The FlussAdmin instance
+/// * `table_path` - The table path
+/// * `partition_column` - The partition column name
+/// * `partition_values` - The partition values to create
+pub async fn create_partitions(
+    admin: &FlussAdmin,
+    table_path: &TablePath,
+    partition_column: &str,
+    partition_values: &[&str],
+) {
+    for value in partition_values {
+        let mut partition_map = HashMap::new();
+        partition_map.insert(partition_column.to_string(), value.to_string());
+        admin
+            .create_partition(table_path, &PartitionSpec::new(partition_map), true)
+            .await
+            .expect("Failed to create partition");
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/test_fluss.rs b/fluss-rust/crates/fluss/tests/test_fluss.rs
index f3987e62db..a6cc27a952 100644
--- a/fluss-rust/crates/fluss/tests/test_fluss.rs
+++ b/fluss-rust/crates/fluss/tests/test_fluss.rs
@@ -23,7 +23,7 @@ mod integration {
     mod admin;
     mod fluss_cluster;
     mod kv_table;
-    mod table;
+    mod log_table;
 
     mod utils;
 

From b7d511dc797c456fc54c42aff7e2bda878f74903 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 1 Feb 2026 19:59:37 +0800
Subject: [PATCH 100/287] feat: support list offset for partitioned table
 (#229)

---
 fluss-rust/crates/fluss/src/client/admin.rs   | 63 ++++++++++++++++---
 .../crates/fluss/src/client/metadata.rs       | 21 +++++++
 .../fluss/tests/integration/log_table.rs      | 32 ++++++++++
 3 files changed, 107 insertions(+), 9 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index ea1efc3810..9061169d2a 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -18,7 +18,7 @@
 use crate::client::metadata::Metadata;
 use crate::metadata::{
     DatabaseDescriptor, DatabaseInfo, JsonSerde, LakeSnapshot, PartitionInfo, PartitionSpec,
-    TableBucket, TableDescriptor, TableInfo, TablePath,
+    PhysicalTablePath, TableBucket, TableDescriptor, TableInfo, TablePath,
 };
 use crate::rpc::message::{
     CreateDatabaseRequest, CreatePartitionRequest, CreateTableRequest, DatabaseExistsRequest,
@@ -33,7 +33,6 @@ use crate::error::{Error, Result};
 use crate::proto::GetTableInfoResponse;
 use crate::{BucketId, PartitionId, TableId};
 use std::collections::{HashMap, HashSet};
-use std::slice::from_ref;
 use std::sync::Arc;
 use tokio::task::JoinHandle;
 
@@ -294,23 +293,69 @@ impl FlussAdmin {
         buckets_id: &[BucketId],
         offset_spec: OffsetSpec,
     ) -> Result<HashMap<i32, i64>> {
-        self.metadata
-            .check_and_update_table_metadata(from_ref(table_path))
-            .await?;
+        self.do_list_offsets(table_path, None, buckets_id, offset_spec)
+            .await
+    }
+
+    /// List offsets for the specified buckets of a partition. This operation makes it possible
+    /// to find the beginning offset, the end offset, or the offset matching a timestamp per bucket.
+    pub async fn list_partition_offsets(
+        &self,
+        table_path: &TablePath,
+        partition_name: &str,
+        buckets_id: &[BucketId],
+        offset_spec: OffsetSpec,
+    ) -> Result<HashMap<i32, i64>> {
+        self.do_list_offsets(table_path, Some(partition_name), buckets_id, offset_spec)
+            .await
+    }
 
+    async fn do_list_offsets(
+        &self,
+        table_path: &TablePath,
+        partition_name: Option<&str>,
+        buckets_id: &[BucketId],
+        offset_spec: OffsetSpec,
+    ) -> Result<HashMap<i32, i64>> {
         if buckets_id.is_empty() {
-            return Err(Error::UnexpectedError {
+            return Err(Error::IllegalArgument {
                 message: "Buckets are empty.".to_string(),
-                source: None,
             });
         }
 
+        // Force a table metadata refresh, as the Java client does
+        self.metadata.update_table_metadata(table_path).await?;
+
         let cluster = self.metadata.get_cluster();
         let table_id = cluster.get_table(table_path)?.table_id;
 
+        // Resolve partition_id from partition_name if provided
+        let partition_id = if let Some(name) = partition_name {
+            let physical_table_path = Arc::new(PhysicalTablePath::of_partitioned(
+                Arc::new(table_path.clone()),
+                Some(name.to_string()),
+            ));
+
+            // Refresh the partition metadata too, as the Java client does
+            self.metadata
+                .update_physical_table_metadata(std::slice::from_ref(&physical_table_path))
+                .await?;
+
+            let cluster = self.metadata.get_cluster();
+            Some(
+                cluster
+                    .get_partition_id(&physical_table_path)
+                    .ok_or_else(|| Error::PartitionNotExist {
+                        message: format!("Partition '{name}' not found for table '{table_path}'"),
+                    })?,
+            )
+        } else {
+            None
+        };
+
         // Prepare requests
         let requests_by_server =
-            self.prepare_list_offsets_requests(table_id, None, buckets_id, offset_spec)?;
+            self.prepare_list_offsets_requests(table_id, partition_id, buckets_id, offset_spec)?;
 
         // Send Requests
         let response_futures = self.send_list_offsets_request(requests_by_server).await?;
@@ -338,7 +383,7 @@ impl FlussAdmin {
         let mut node_for_bucket_list: HashMap<i32, Vec<BucketId>> = HashMap::new();
 
         for bucket_id in buckets {
-            let table_bucket = TableBucket::new(table_id, *bucket_id);
+            let table_bucket = TableBucket::new_with_partition(table_id, partition_id, *bucket_id);
             let leader = cluster.leader_for(&table_bucket).ok_or_else(|| {
                 // todo: consider retry?
                 Error::UnexpectedError {
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index 52ccd62e43..c6244cd797 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -142,6 +142,27 @@ impl Metadata {
             .await
     }
 
+    pub async fn update_physical_table_metadata(
+        &self,
+        physical_table_paths: &[Arc<PhysicalTablePath>],
+    ) -> Result<()> {
+        let mut update_table_paths = HashSet::new();
+        let mut update_partition_paths = HashSet::new();
+        for physical_table_path in physical_table_paths {
+            match physical_table_path.get_partition_name() {
+                Some(_) => {
+                    update_partition_paths.insert(physical_table_path);
+                }
+                None => {
+                    update_table_paths.insert(physical_table_path.get_table_path());
+                }
+            }
+        }
+
+        self.update_tables_metadata(&update_table_paths, &update_partition_paths, vec![])
+            .await
+    }
+
     pub async fn check_and_update_table_metadata(&self, table_paths: &[TablePath]) -> Result<()> {
         let cluster_binding = self.cluster.read().clone();
         let need_update_table_paths: HashSet<&TablePath> = table_paths
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 64e6289cee..27b4d8313f 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -1072,6 +1072,38 @@ mod table_test {
             .await
             .expect("Failed to flush batches");
 
+        // Test list_partition_offsets
+        // US partition has 4 records: 2 from row append + 2 from batch append
+        let us_offsets = admin
+            .list_partition_offsets(&table_path, "US", &[0], OffsetSpec::Latest)
+            .await
+            .expect("Failed to list offsets for US partition");
+        assert_eq!(
+            us_offsets.get(&0),
+            Some(&4),
+            "US partition should have 4 records"
+        );
+
+        // EU partition has 4 records: 2 from row append + 2 from batch append
+        let eu_offsets = admin
+            .list_partition_offsets(&table_path, "EU", &[0], OffsetSpec::Latest)
+            .await
+            .expect("Failed to list offsets for EU partition");
+        assert_eq!(
+            eu_offsets.get(&0),
+            Some(&4),
+            "EU partition should have 4 records"
+        );
+
+        // Listing offsets for a non-existent partition should return an error
+        let result = admin
+            .list_partition_offsets(&table_path, "NOT Exists", &[0], OffsetSpec::Latest)
+            .await;
+        assert!(result.is_err());
+        assert!(result.unwrap_err().to_string().contains(
+            "Table partition 'fluss.test_partitioned_log_append(p=NOT Exists)' does not exist."
+        ));
+
         admin
             .drop_table(&table_path, false)
             .await

From 17ba9d12202a28856f365973dad1bee276681d95 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Tue, 3 Feb 2026 20:42:28 +0800
Subject: [PATCH 101/287] feat: support list partition offset in cpp binding
 (#231)

---
 fluss-rust/.gitignore                     |  5 ++-
 fluss-rust/bindings/cpp/include/fluss.hpp | 12 +++++++
 fluss-rust/bindings/cpp/src/admin.cpp     | 32 ++++++++++++++---
 fluss-rust/bindings/cpp/src/lib.rs        | 42 ++++++++++++++++++++---
 4 files changed, 81 insertions(+), 10 deletions(-)

diff --git a/fluss-rust/.gitignore b/fluss-rust/.gitignore
index 8202bbca02..9c585d8632 100644
--- a/fluss-rust/.gitignore
+++ b/fluss-rust/.gitignore
@@ -26,4 +26,7 @@ __pycache__/
 *.so
 *.egg-info/
 dist/
-build/
\ No newline at end of file
+build/
+
+# CPP
+*CMakeFiles/
\ No newline at end of file
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 479adf97a9..4ef3fe1808 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -407,7 +407,19 @@ class Admin {
                        const OffsetQuery& offset_query,
                        std::unordered_map<int32_t, int64_t>& out);
 
+    Result ListPartitionOffsets(const TablePath& table_path,
+                              const std::string& partition_name,
+                              const std::vector<int32_t>& bucket_ids,
+                              const OffsetQuery& offset_query,
+                              std::unordered_map<int32_t, int64_t>& out);
+
 private:
+    Result DoListOffsets(const TablePath& table_path,
+                       const std::vector<int32_t>& bucket_ids,
+                       const OffsetQuery& offset_query,
+                       std::unordered_map<int32_t, int64_t>& out,
+                       const std::string* partition_name = nullptr);
+
     friend class Connection;
     Admin(ffi::Admin* admin) noexcept;
 
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index bf9c712f4e..e4106146ee 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -108,10 +108,12 @@ Result Admin::GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& o
     return result;
 }
 
-Result Admin::ListOffsets(const TablePath& table_path,
-                          const std::vector<int32_t>& bucket_ids,
-                          const OffsetQuery& offset_query,
-                          std::unordered_map<int32_t, int64_t>& out) {
+// Shared implementation of ListOffsets and ListPartitionOffsets (partition_name may be nullptr)
+Result Admin::DoListOffsets(const TablePath& table_path,
+                         const std::vector<int32_t>& bucket_ids,
+                         const OffsetQuery& offset_query,
+                         std::unordered_map<int32_t, int64_t>& out,
+                         const std::string* partition_name) {
     if (!Available()) {
         return utils::make_error(1, "Admin not available");
     }
@@ -127,7 +129,12 @@ Result Admin::ListOffsets(const TablePath& table_path,
     ffi_query.offset_type = static_cast<int32_t>(offset_query.spec);
     ffi_query.timestamp = offset_query.timestamp;
 
-    auto ffi_result = admin_->list_offsets(ffi_path, std::move(rust_bucket_ids), ffi_query);
+    ffi::FfiListOffsetsResult ffi_result;
+    if (partition_name != nullptr) {
+        ffi_result = admin_->list_partition_offsets(ffi_path, rust::String(*partition_name), std::move(rust_bucket_ids), ffi_query);
+    } else {
+        ffi_result = admin_->list_offsets(ffi_path, std::move(rust_bucket_ids), ffi_query);
+    }
     
     auto result = utils::from_ffi_result(ffi_result.result);
     if (result.Ok()) {
@@ -140,4 +147,19 @@ Result Admin::ListOffsets(const TablePath& table_path,
     return result;
 }
 
+Result Admin::ListOffsets(const TablePath& table_path,
+                          const std::vector<int32_t>& bucket_ids,
+                          const OffsetQuery& offset_query,
+                          std::unordered_map<int32_t, int64_t>& out) {
+    return DoListOffsets(table_path, bucket_ids, offset_query, out);
+}
+
+Result Admin::ListPartitionOffsets(const TablePath& table_path,
+                                const std::string& partition_name,
+                                const std::vector<int32_t>& bucket_ids,
+                                const OffsetQuery& offset_query,
+                                std::unordered_map<int32_t, int64_t>& out) {
+    return DoListOffsets(table_path, bucket_ids, offset_query, out, &partition_name);
+}
+
 }  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index bd38a03963..b327ba550b 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -193,6 +193,13 @@ mod ffi {
             bucket_ids: Vec<i32>,
             offset_query: &FfiOffsetQuery,
         ) -> FfiListOffsetsResult;
+        fn list_partition_offsets(
+            self: &Admin,
+            table_path: &FfiTablePath,
+            partition_name: String,
+            bucket_ids: Vec<i32>,
+            offset_query: &FfiOffsetQuery,
+        ) -> FfiListOffsetsResult;
 
         // Table
         unsafe fn delete_table(table: *mut Table);
@@ -431,9 +438,11 @@ impl Admin {
         }
     }
 
-    fn list_offsets(
+    // Helper function for common list offsets functionality
+    fn do_list_offsets(
         &self,
         table_path: &ffi::FfiTablePath,
+        partition_name: Option<&str>,
         bucket_ids: Vec<i32>,
         offset_query: &ffi::FfiOffsetQuery,
     ) -> ffi::FfiListOffsetsResult {
@@ -460,9 +469,15 @@ impl Admin {
         };
 
         let result = RUNTIME.block_on(async {
-            self.inner
-                .list_offsets(&path, &bucket_ids, offset_spec)
-                .await
+            if let Some(part_name) = partition_name {
+                self.inner
+                    .list_partition_offsets(&path, part_name, &bucket_ids, offset_spec)
+                    .await
+            } else {
+                self.inner
+                    .list_offsets(&path, &bucket_ids, offset_spec)
+                    .await
+            }
         });
 
         match result {
@@ -482,6 +497,25 @@ impl Admin {
             },
         }
     }
+
+    fn list_offsets(
+        &self,
+        table_path: &ffi::FfiTablePath,
+        bucket_ids: Vec<i32>,
+        offset_query: &ffi::FfiOffsetQuery,
+    ) -> ffi::FfiListOffsetsResult {
+        self.do_list_offsets(table_path, None, bucket_ids, offset_query)
+    }
+
+    fn list_partition_offsets(
+        &self,
+        table_path: &ffi::FfiTablePath,
+        partition_name: String,
+        bucket_ids: Vec<i32>,
+        offset_query: &ffi::FfiOffsetQuery,
+    ) -> ffi::FfiListOffsetsResult {
+        self.do_list_offsets(table_path, Some(&partition_name), bucket_ids, offset_query)
+    }
 }
 
 // Table implementation

From da22ac85d01b8886287b4aed181fb8413bd1df2a Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Tue, 3 Feb 2026 22:08:17 +0800
Subject: [PATCH 102/287] feat: introduce scan record batch in cpp (#230)

---
 fluss-rust/bindings/cpp/.gitignore           |   1 +
 fluss-rust/bindings/cpp/CMakeLists.txt       |   8 +-
 fluss-rust/bindings/cpp/Cargo.toml           |   2 +-
 fluss-rust/bindings/cpp/examples/example.cpp |  58 ++++-
 fluss-rust/bindings/cpp/include/fluss.hpp    |  55 +++-
 fluss-rust/bindings/cpp/src/lib.rs           | 250 +++++++++++++++----
 fluss-rust/bindings/cpp/src/table.cpp        | 127 ++++++++++
 fluss-rust/bindings/cpp/src/types.rs         |  31 +++
 8 files changed, 479 insertions(+), 53 deletions(-)

diff --git a/fluss-rust/bindings/cpp/.gitignore b/fluss-rust/bindings/cpp/.gitignore
index 43f761c951..da15a58b53 100644
--- a/fluss-rust/bindings/cpp/.gitignore
+++ b/fluss-rust/bindings/cpp/.gitignore
@@ -1,5 +1,6 @@
 build/
 cmake-build-*/
+CMakeFiles/
 .idea/
 *.o
 *.a
diff --git a/fluss-rust/bindings/cpp/CMakeLists.txt b/fluss-rust/bindings/cpp/CMakeLists.txt
index 629f3f076d..93cfc413fe 100644
--- a/fluss-rust/bindings/cpp/CMakeLists.txt
+++ b/fluss-rust/bindings/cpp/CMakeLists.txt
@@ -29,6 +29,8 @@ set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
 
 find_package(Threads REQUIRED)
 
+find_package(Arrow REQUIRED)
+
 if (NOT CMAKE_BUILD_TYPE)
     set(CMAKE_BUILD_TYPE Debug)
 endif()
@@ -88,12 +90,16 @@ target_sources(fluss_cpp PRIVATE ${RUST_HEADER_FILE})
 target_include_directories(fluss_cpp PUBLIC ${CPP_INCLUDE_DIR})
 target_link_libraries(fluss_cpp PUBLIC ${RUST_LIB})
 target_link_libraries(fluss_cpp PRIVATE ${CMAKE_DL_LIBS} Threads::Threads)
+target_link_libraries(fluss_cpp PUBLIC Arrow::arrow_shared)
+target_compile_definitions(fluss_cpp PRIVATE ARROW_FOUND)
 if(APPLE)
     target_link_libraries(fluss_cpp PUBLIC "-framework CoreFoundation" "-framework Security")
 endif()
 
 add_executable(fluss_cpp_example examples/example.cpp)
-target_link_libraries(fluss_cpp_example fluss_cpp)
+target_link_libraries(fluss_cpp_example PRIVATE fluss_cpp)
+target_link_libraries(fluss_cpp_example PRIVATE Arrow::arrow_shared)
+target_compile_definitions(fluss_cpp_example PRIVATE ARROW_FOUND)
 target_include_directories(fluss_cpp_example PUBLIC ${CPP_INCLUDE_DIR})
 
 set_target_properties(fluss_cpp
diff --git a/fluss-rust/bindings/cpp/Cargo.toml b/fluss-rust/bindings/cpp/Cargo.toml
index 2d3d913550..0bbcbf0d95 100644
--- a/fluss-rust/bindings/cpp/Cargo.toml
+++ b/fluss-rust/bindings/cpp/Cargo.toml
@@ -27,7 +27,7 @@ crate-type = ["staticlib"]
 
 [dependencies]
 anyhow = "1.0"
-arrow = { workspace = true }
+arrow = { workspace = true, features = ["ffi"] }
 cxx = "1.0"
 fluss = { path = "../../crates/fluss" }
 tokio = { version = "1.27", features = ["rt-multi-thread", "macros"] }
diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 6ff2b9b7e3..45f7f9ea9c 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -15,12 +15,14 @@
 // specific language governing permissions and limitations
 // under the License.
 
-#include "fluss.hpp"
+#include <arrow/record_batch.h>
 
+#include <chrono>
 #include <iostream>
-#include <vector>
 #include <unordered_map>
-#include <chrono>
+#include <vector>
+
+#include "fluss.hpp"
 
 static void check(const char* step, const fluss::Result& r) {
     if (!r.Ok()) {
@@ -179,6 +181,7 @@ int main() {
     
     // 8.1) Query earliest offsets for all buckets
     std::vector<int32_t> all_bucket_ids;
+    all_bucket_ids.reserve(buckets);
     for (int b = 0; b < buckets; ++b) {
         all_bucket_ids.push_back(b);
     }
@@ -250,5 +253,54 @@ int main() {
         std::cout << "  ... and " << (batch_records.Size() - 5) << " more records" << std::endl;
     }
 
+    // 9) Test the new Arrow record batch polling functionality
+    std::cout << "\n=== Testing Arrow Record Batch Polling ===" << std::endl;
+    
+    fluss::LogScanner arrow_scanner;
+    check("new_record_batch_log_scanner", table.NewRecordBatchLogScanner(arrow_scanner));
+    
+    // Subscribe to all buckets starting from offset 0
+    for (int b = 0; b < buckets; ++b) {
+        check("subscribe_arrow", arrow_scanner.Subscribe(b, 0));
+    }
+    
+    fluss::ArrowRecordBatches arrow_batches;
+    check("poll_record_batch", arrow_scanner.PollRecordBatch(5000, arrow_batches));
+    
+    std::cout << "Polled " << arrow_batches.Size() << " Arrow record batches" << std::endl;
+    for (size_t i = 0; i < arrow_batches.Size(); ++i) {
+        const auto& batch = arrow_batches[i];
+        if (batch->Available()) {
+            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows() << " rows. " << std::endl;
+        } else {
+            std::cout << "  Batch " << i << ": not available" << std::endl;
+        }
+    }
+    
+    // 10) Test the new Arrow record batch polling with projection
+    std::cout << "\n=== Testing Arrow Record Batch Polling with Projection ===" << std::endl;
+    
+    fluss::LogScanner projected_arrow_scanner;
+    check("new_record_batch_log_scanner_with_projection", 
+          table.NewRecordBatchLogScannerWithProjection(projected_columns, projected_arrow_scanner));
+    
+    // Subscribe to all buckets starting from offset 0
+    for (int b = 0; b < buckets; ++b) {
+        check("subscribe_projected_arrow", projected_arrow_scanner.Subscribe(b, 0));
+    }
+    
+    fluss::ArrowRecordBatches projected_arrow_batches;
+    check("poll_projected_record_batch", projected_arrow_scanner.PollRecordBatch(5000, projected_arrow_batches));
+    
+    std::cout << "Polled " << projected_arrow_batches.Size() << " projected Arrow record batches" << std::endl;
+    for (size_t i = 0; i < projected_arrow_batches.Size(); ++i) {
+        const auto& batch = projected_arrow_batches[i];
+        if (batch->Available()) {
+            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows() << " rows " << std::endl;
+        } else {
+            std::cout << "  Batch " << i << ": not available" << std::endl;
+        }
+    }
+
     return 0;
 }
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 4ef3fe1808..968cb06509 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -19,13 +19,17 @@
 
 #pragma once
 
-#include <cstdint>
 #include <memory>
 #include <optional>
 #include <string>
 #include <unordered_map>
 #include <vector>
 
+// Forward declare Arrow classes to avoid including heavy Arrow headers in header
+namespace arrow {
+    class RecordBatch;
+}
+
 namespace fluss {
 
 namespace ffi {
@@ -336,6 +340,52 @@ struct ScanRecords {
     auto end() const { return records.end(); }
 };
 
+class ArrowRecordBatch {
+public:
+
+    std::shared_ptr<arrow::RecordBatch> GetArrowRecordBatch() const { return batch_; }
+
+    bool Available() const;
+
+    // Get number of rows in the batch
+    int64_t NumRows() const;
+    
+    // Get ScanBatch metadata
+    int64_t GetTableId() const;
+    int64_t GetPartitionId() const;
+    int32_t GetBucketId() const;
+    int64_t GetBaseOffset() const;
+    int64_t GetLastOffset() const;
+
+private:
+    friend class LogScanner;
+    explicit ArrowRecordBatch(
+        std::shared_ptr<arrow::RecordBatch> batch,
+        int64_t table_id,
+        int64_t partition_id,
+        int32_t bucket_id,
+        int64_t base_offset) noexcept;
+
+    std::shared_ptr<arrow::RecordBatch> batch_{nullptr};
+
+    int64_t table_id_;
+    int64_t partition_id_;
+    int32_t bucket_id_;
+    int64_t base_offset_;
+};
+
+
+struct ArrowRecordBatches {
+    std::vector<std::unique_ptr<ArrowRecordBatch>> batches;
+
+    size_t Size() const { return batches.size(); }
+    bool Empty() const { return batches.empty(); }
+    const std::unique_ptr<ArrowRecordBatch>& operator[](size_t idx) const { return batches[idx]; }
+
+    auto begin() const { return batches.begin(); }
+    auto end() const { return batches.end(); }
+};
+
 struct BucketOffset {
     int64_t table_id;
     int64_t partition_id;
@@ -442,6 +492,8 @@ class Table {
     Result NewAppendWriter(AppendWriter& out);
     Result NewLogScanner(LogScanner& out);
     Result NewLogScannerWithProjection(const std::vector<size_t>& column_indices, LogScanner& out);
+    Result NewRecordBatchLogScanner(LogScanner& out);
+    Result NewRecordBatchLogScannerWithProjection(const std::vector<size_t>& column_indices, LogScanner& out);
 
     TableInfo GetTableInfo() const;
     TablePath GetTablePath() const;
@@ -493,6 +545,7 @@ class LogScanner {
     Result Subscribe(int32_t bucket_id, int64_t start_offset);
     Result Subscribe(const std::vector<BucketSubscription>& bucket_offsets);
     Result Poll(int64_t timeout_ms, ScanRecords& out);
+    Result PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out);
 
 private:
     friend class Table;
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index b327ba550b..e0835985e2 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -119,6 +119,24 @@ mod ffi {
         scan_records: FfiScanRecords,
     }
 
+    struct FfiArrowRecordBatch {
+        array_ptr: usize,
+        schema_ptr: usize,
+        table_id: i64,
+        partition_id: i64,
+        bucket_id: i32,
+        base_offset: i64,
+    }
+
+    struct FfiArrowRecordBatches {
+        batches: Vec<FfiArrowRecordBatch>,
+    }
+
+    struct FfiArrowRecordBatchesResult {
+        result: FfiResult,
+        arrow_batches: FfiArrowRecordBatches,
+    }
+
     struct FfiLakeSnapshot {
         snapshot_id: i64,
         bucket_offsets: Vec<FfiBucketOffset>,
@@ -209,6 +227,11 @@ mod ffi {
             self: &Table,
             column_indices: Vec<usize>,
         ) -> Result<*mut LogScanner>;
+        fn new_record_batch_log_scanner(self: &Table) -> Result<*mut LogScanner>;
+        fn new_record_batch_log_scanner_with_projection(
+            self: &Table,
+            column_indices: Vec<usize>,
+        ) -> Result<*mut LogScanner>;
         fn get_table_info_from_table(self: &Table) -> FfiTableInfo;
         fn get_table_path(self: &Table) -> FfiTablePath;
         fn has_primary_key(self: &Table) -> bool;
@@ -226,6 +249,8 @@ mod ffi {
             subscriptions: Vec<FfiBucketSubscription>,
         ) -> FfiResult;
         fn poll(self: &LogScanner, timeout_ms: i64) -> FfiScanRecordsResult;
+        fn poll_record_batch(self: &LogScanner, timeout_ms: i64) -> FfiArrowRecordBatchesResult;
+        fn free_arrow_ffi_structures(array_ptr: usize, schema_ptr: usize);
     }
 }
 
@@ -252,7 +277,8 @@ pub struct AppendWriter {
 }
 
 pub struct LogScanner {
-    inner: fcore::client::LogScanner,
+    inner: Option<fcore::client::LogScanner>,
+    inner_batch: Option<fcore::client::RecordBatchLogScanner>,
 }
 
 fn ok_result() -> ffi::FfiResult {
@@ -551,41 +577,101 @@ impl Table {
     }
 
     fn new_log_scanner(&self) -> Result<*mut LogScanner, String> {
-        let fluss_table = fcore::client::FlussTable::new(
-            &self.connection,
-            self.metadata.clone(),
-            self.table_info.clone(),
-        );
+        RUNTIME.block_on(async {
+            let fluss_table = fcore::client::FlussTable::new(
+                &self.connection,
+                self.metadata.clone(),
+                self.table_info.clone(),
+            );
+
+            let scanner = match fluss_table.new_scan().create_log_scanner() {
+                Ok(a) => a,
+                Err(e) => return Err(format!("Failed to create log scanner: {e}")),
+            };
+
+            let scanner_ptr = Box::into_raw(Box::new(LogScanner {
+                inner: Some(scanner),
+                inner_batch: None,
+            }));
 
-        let scanner = match fluss_table.new_scan().create_log_scanner() {
-            Ok(a) => a,
-            Err(e) => return Err(format!("Failed to create log scanner: {e}")),
-        };
-        let scanner = Box::into_raw(Box::new(LogScanner { inner: scanner }));
-        Ok(scanner)
+            Ok(scanner_ptr)
+        })
     }
 
     fn new_log_scanner_with_projection(
         &self,
         column_indices: Vec<usize>,
     ) -> Result<*mut LogScanner, String> {
-        let fluss_table = fcore::client::FlussTable::new(
-            &self.connection,
-            self.metadata.clone(),
-            self.table_info.clone(),
-        );
+        RUNTIME.block_on(async {
+            let fluss_table = fcore::client::FlussTable::new(
+                &self.connection,
+                self.metadata.clone(),
+                self.table_info.clone(),
+            );
+
+            let scan = fluss_table.new_scan();
+            let scan = match scan.project(&column_indices) {
+                Ok(s) => s,
+                Err(e) => return Err(format!("Failed to project columns: {e}")),
+            };
+            let scanner = match scan.create_log_scanner() {
+                Ok(a) => a,
+                Err(e) => return Err(format!("Failed to create log scanner: {e}")),
+            };
+            let scanner = Box::into_raw(Box::new(LogScanner {
+                inner: Some(scanner),
+                inner_batch: None,
+            }));
+            Ok(scanner)
+        })
+    }
+
+    fn new_record_batch_log_scanner(&self) -> Result<*mut LogScanner, String> {
+        RUNTIME.block_on(async {
+            let fluss_table = fcore::client::FlussTable::new(
+                &self.connection,
+                self.metadata.clone(),
+                self.table_info.clone(),
+            );
+
+            let scanner = match fluss_table.new_scan().create_record_batch_log_scanner() {
+                Ok(a) => a,
+                Err(e) => return Err(format!("Failed to create record batch log scanner: {e}")),
+            };
+            let scanner = Box::into_raw(Box::new(LogScanner {
+                inner: None,
+                inner_batch: Some(scanner),
+            }));
+            Ok(scanner)
+        })
+    }
 
-        let scan = fluss_table.new_scan();
-        let scan = match scan.project(&column_indices) {
-            Ok(s) => s,
-            Err(e) => return Err(format!("Failed to project columns: {e}")),
-        };
-        let scanner = match scan.create_log_scanner() {
-            Ok(a) => a,
-            Err(e) => return Err(format!("Failed to create log scanner: {e}")),
-        };
-        let scanner = Box::into_raw(Box::new(LogScanner { inner: scanner }));
-        Ok(scanner)
+    fn new_record_batch_log_scanner_with_projection(
+        &self,
+        column_indices: Vec<usize>,
+    ) -> Result<*mut LogScanner, String> {
+        RUNTIME.block_on(async {
+            let fluss_table = fcore::client::FlussTable::new(
+                &self.connection,
+                self.metadata.clone(),
+                self.table_info.clone(),
+            );
+
+            let scan = fluss_table.new_scan();
+            let scan = match scan.project(&column_indices) {
+                Ok(s) => s,
+                Err(e) => return Err(format!("Failed to project columns: {e}")),
+            };
+            let scanner = match scan.create_record_batch_log_scanner() {
+                Ok(a) => a,
+                Err(e) => return Err(format!("Failed to create record batch log scanner: {e}")),
+            };
+            let scanner = Box::into_raw(Box::new(LogScanner {
+                inner: None,
+                inner_batch: Some(scanner),
+            }));
+            Ok(scanner)
+        })
     }
 
     fn get_table_info_from_table(&self) -> ffi::FfiTableInfo {
@@ -644,14 +730,36 @@ unsafe fn delete_log_scanner(scanner: *mut LogScanner) {
     }
 }
 
+// Helper function to free the Arrow FFI structures separately (for use after ImportRecordBatch)
+pub extern "C" fn free_arrow_ffi_structures(array_ptr: usize, schema_ptr: usize) {
+    use arrow::ffi::{FFI_ArrowArray, FFI_ArrowSchema};
+    if array_ptr != 0 {
+        let _array = unsafe { Box::from_raw(array_ptr as *mut FFI_ArrowArray) };
+    }
+    if schema_ptr != 0 {
+        let _schema = unsafe { Box::from_raw(schema_ptr as *mut FFI_ArrowSchema) };
+    }
+}
+
 impl LogScanner {
     fn subscribe(&self, bucket_id: i32, start_offset: i64) -> ffi::FfiResult {
-        let result =
-            RUNTIME.block_on(async { self.inner.subscribe(bucket_id, start_offset).await });
+        if let Some(ref inner) = self.inner {
+            let result = RUNTIME.block_on(async { inner.subscribe(bucket_id, start_offset).await });
 
-        match result {
-            Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
+            match result {
+                Ok(_) => ok_result(),
+                Err(e) => err_result(1, e.to_string()),
+            }
+        } else if let Some(ref inner_batch) = self.inner_batch {
+            let result =
+                RUNTIME.block_on(async { inner_batch.subscribe(bucket_id, start_offset).await });
+
+            match result {
+                Ok(_) => ok_result(),
+                Err(e) => err_result(1, e.to_string()),
+            }
+        } else {
+            err_result(1, "LogScanner not initialized".to_string())
         }
     }
 
@@ -662,27 +770,75 @@ impl LogScanner {
             bucket_offsets.insert(sub.bucket_id, sub.offset);
         }
 
-        let result = RUNTIME.block_on(async { self.inner.subscribe_batch(&bucket_offsets).await });
+        if let Some(ref inner) = self.inner {
+            let result = RUNTIME.block_on(async { inner.subscribe_batch(&bucket_offsets).await });
 
-        match result {
-            Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
+            match result {
+                Ok(_) => ok_result(),
+                Err(e) => err_result(1, e.to_string()),
+            }
+        } else if let Some(ref inner_batch) = self.inner_batch {
+            let result =
+                RUNTIME.block_on(async { inner_batch.subscribe_batch(&bucket_offsets).await });
+
+            match result {
+                Ok(_) => ok_result(),
+                Err(e) => err_result(1, e.to_string()),
+            }
+        } else {
+            err_result(1, "LogScanner not initialized".to_string())
         }
     }
 
     fn poll(&self, timeout_ms: i64) -> ffi::FfiScanRecordsResult {
-        let timeout = Duration::from_millis(timeout_ms as u64);
-        let result = RUNTIME.block_on(async { self.inner.poll(timeout).await });
+        if let Some(ref inner) = self.inner { // only the record-based scanner can serve this call
+            let timeout = Duration::from_millis(timeout_ms.max(0) as u64); // clamp: a negative i64 would wrap in the cast
+            let result = RUNTIME.block_on(async { inner.poll(timeout).await });
 
-        match result {
-            Ok(records) => ffi::FfiScanRecordsResult {
-                result: ok_result(),
-                scan_records: types::core_scan_records_to_ffi(&records),
-            },
-            Err(e) => ffi::FfiScanRecordsResult {
-                result: err_result(1, e.to_string()),
+            match result {
+                Ok(records) => ffi::FfiScanRecordsResult {
+                    result: ok_result(),
+                    scan_records: types::core_scan_records_to_ffi(&records),
+                },
+                Err(e) => ffi::FfiScanRecordsResult {
+                    result: err_result(1, e.to_string()),
+                    scan_records: ffi::FfiScanRecords { records: vec![] },
+                },
+            }
+        } else { // scanner was created in batch mode (or not at all): report an error with no records
+            ffi::FfiScanRecordsResult {
+                result: err_result(1, "Record-based scanner not available".to_string()),
                 scan_records: ffi::FfiScanRecords { records: vec![] },
-            },
+            }
+        }
+    }
+
+    fn poll_record_batch(&self, timeout_ms: i64) -> ffi::FfiArrowRecordBatchesResult {
+        if let Some(ref inner_batch) = self.inner_batch { // only the batch-based scanner can serve this call
+            let timeout = Duration::from_millis(timeout_ms.max(0) as u64); // clamp: a negative i64 would wrap in the cast
+            let result = RUNTIME.block_on(async { inner_batch.poll(timeout).await });
+
+            match result {
+                Ok(batches) => match types::core_scan_batches_to_ffi(&batches) { // conversion to FFI form can fail too
+                    Ok(arrow_batches) => ffi::FfiArrowRecordBatchesResult {
+                        result: ok_result(),
+                        arrow_batches,
+                    },
+                    Err(e) => ffi::FfiArrowRecordBatchesResult {
+                        result: err_result(1, e),
+                        arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
+                    },
+                },
+                Err(e) => ffi::FfiArrowRecordBatchesResult {
+                    result: err_result(1, e.to_string()),
+                    arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
+                },
+            }
+        } else { // scanner was created in record mode (or not at all): report an error with no batches
+            ffi::FfiArrowRecordBatchesResult {
+                result: err_result(1, "Batch-based scanner not available".to_string()),
+                arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
+            }
         }
     }
 }
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index d42e1a2299..118ca3c276 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -21,6 +21,10 @@
 #include "lib.rs.h"
 #include "ffi_converter.hpp"
 #include "rust/cxx.h"
+#include <arrow/c/bridge.h>
+// TODO: bindings/cpp/BUILD.bazel still doesn't declare Arrow include/link dependencies.
+// In environments where Bazel does not already have Arrow available, this will fail at compile/link time.
+#include <arrow/record_batch.h>
 
 namespace fluss {
 
@@ -101,6 +105,40 @@ Result Table::NewLogScannerWithProjection(const std::vector<size_t>& column_indi
     }
 }
 
+Result Table::NewRecordBatchLogScanner(LogScanner& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Table not available");
+    }
+
+    try {
+        out.scanner_ = table_->new_record_batch_log_scanner();  // NOTE(review): overwrites any scanner `out` already held — confirm ownership
+        return utils::make_ok();
+    } catch (const rust::Error& e) {  // failures are reported through the returned Result, not rethrown
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
+Result Table::NewRecordBatchLogScannerWithProjection(const std::vector<size_t>& column_indices, LogScanner& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Table not available");
+    }
+
+    try {
+        rust::Vec<size_t> rust_indices;  // copy of column_indices in the vector type the bridge call takes
+        for (size_t idx : column_indices) {
+            rust_indices.push_back(idx);
+        }
+        out.scanner_ = table_->new_record_batch_log_scanner_with_projection(std::move(rust_indices));  // NOTE(review): overwrites any scanner `out` already held — confirm ownership
+        return utils::make_ok();
+    } catch (const rust::Error& e) {  // failures are reported through the returned Result, not rethrown
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
 TableInfo Table::GetTableInfo() const {
     if (!Available()) {
         return TableInfo{};
@@ -242,4 +280,93 @@ Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
     return utils::make_ok();
 }
 
+ArrowRecordBatch::ArrowRecordBatch(
+    std::shared_ptr<arrow::RecordBatch> batch,
+    int64_t table_id,
+    int64_t partition_id,
+    int32_t bucket_id,
+    int64_t base_offset) noexcept
+    : batch_(std::move(batch)),  // keep the shared_ptr passed by the caller
+      table_id_(table_id),
+      partition_id_(partition_id),
+      bucket_id_(bucket_id),
+      base_offset_(base_offset) {}
+
+bool ArrowRecordBatch::Available() const { return batch_ != nullptr; }  // true when a batch is wrapped
+
+int64_t ArrowRecordBatch::NumRows() const {
+    if (!Available()) return 0;  // no wrapped batch: report zero rows
+    return batch_->num_rows();
+}
+
+
+int64_t ArrowRecordBatch::GetTableId() const {
+    if (!Available()) return 0;  // note: 0 here, whereas the other id getters return -1
+    return this->table_id_;
+}
+
+int64_t ArrowRecordBatch::GetPartitionId() const {
+    if (!Available()) return -1;  // sentinel when no batch is wrapped
+    return this->partition_id_;
+}
+
+int32_t ArrowRecordBatch::GetBucketId() const {
+    if (!Available()) return -1;  // sentinel when no batch is wrapped
+    return this->bucket_id_;
+}
+
+int64_t ArrowRecordBatch::GetBaseOffset() const {
+    if (!Available()) return -1;  // sentinel when no batch is wrapped
+    return this->base_offset_;
+}
+
+int64_t ArrowRecordBatch::GetLastOffset() const {
+    if (!Available()) return -1;  // sentinel when no batch is wrapped
+    return this->base_offset_ + this->NumRows() - 1;  // inclusive; equals base_offset_ - 1 for a zero-row batch
+}
+
+Result LogScanner::PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out) {
+    if (!Available()) {
+        return utils::make_error(1, "LogScanner not available");
+    }
+
+    auto ffi_result = scanner_->poll_record_batch(timeout_ms);
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (!result.Ok()) {
+        return result;
+    }
+
+    // Convert the FFI Arrow record batches to C++ ArrowRecordBatch objects.
+    // Each entry carries the addresses of two containers allocated on the Rust side
+    // (array_ptr / schema_ptr). The loop therefore visits every entry even after an
+    // import failure: returning early would leave the remaining containers unfreed.
+    out.batches.clear();
+    std::string first_error;
+    for (const auto& ffi_batch : ffi_result.arrow_batches.batches) {
+        auto* c_array = reinterpret_cast<struct ArrowArray*>(ffi_batch.array_ptr);
+        auto* c_schema = reinterpret_cast<struct ArrowSchema*>(ffi_batch.schema_ptr);
+
+        // After the first failure, later batches are no longer imported, only freed.
+        if (first_error.empty()) {
+            auto import_result = arrow::ImportRecordBatch(c_array, c_schema);
+            if (import_result.ok()) {
+                out.batches.push_back(std::unique_ptr<ArrowRecordBatch>(new ArrowRecordBatch(
+                    import_result.ValueOrDie(), ffi_batch.table_id, ffi_batch.partition_id,
+                    ffi_batch.bucket_id, ffi_batch.base_offset)));
+            } else {
+                first_error =
+                    "Failed to import Arrow record batch: " + import_result.status().ToString();
+            }
+        }
+
+        // Free the container structures that were allocated in Rust, imported or not.
+        ffi::free_arrow_ffi_structures(ffi_batch.array_ptr, ffi_batch.schema_ptr);
+    }
+
+    if (!first_error.empty()) {
+        return utils::make_error(1, first_error);
+    }
+    return utils::make_ok();
+}
+
 }  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 726e3d1220..91d6e260ba 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -23,10 +23,13 @@ use arrow::array::{
     TimestampMillisecondArray, TimestampNanosecondArray, TimestampSecondArray,
 };
 use arrow::datatypes::{DataType as ArrowDataType, TimeUnit};
+use arrow::ffi::{FFI_ArrowArray, FFI_ArrowSchema};
 use fcore::row::InternalRow;
 use fluss as fcore;
 use std::borrow::Cow;
 
+use arrow::array::Array;
+
 pub const DATA_TYPE_BOOLEAN: i32 = 1;
 pub const DATA_TYPE_TINYINT: i32 = 2;
 pub const DATA_TYPE_SMALLINT: i32 = 3;
@@ -478,3 +481,31 @@ pub fn core_lake_snapshot_to_ffi(snapshot: &fcore::metadata::LakeSnapshot) -> ff
         bucket_offsets,
     }
 }
+
+pub fn core_scan_batches_to_ffi(
+    batches: &[fcore::record::ScanBatch],
+) -> Result<ffi::FfiArrowRecordBatches, String> {
+    // Keep each FFI struct boxed until all conversions succeed, so an early `?` drops them.
+    let mut owned = Vec::with_capacity(batches.len());
+    for batch in batches {
+        let record_batch = batch.batch();
+        // Convert RecordBatch to StructArray first, then get the data
+        let struct_array = arrow::array::StructArray::from(record_batch.clone());
+        let ffi_array = Box::new(FFI_ArrowArray::new(&struct_array.into_data()));
+        let ffi_schema = FFI_ArrowSchema::try_from(record_batch.schema().as_ref());
+        owned.push((batch, ffi_array, Box::new(ffi_schema.map_err(|e| e.to_string())?)));
+    }
+    // Export as raw pointers; nothing below can fail, so no exported pointer is orphaned.
+    let mut exported = Vec::with_capacity(owned.len());
+    for (batch, ffi_array, ffi_schema) in owned {
+        exported.push(ffi::FfiArrowRecordBatch {
+            array_ptr: Box::into_raw(ffi_array) as usize,
+            schema_ptr: Box::into_raw(ffi_schema) as usize,
+            table_id: batch.bucket().table_id(),
+            partition_id: batch.bucket().partition_id().unwrap_or(-1),
+            bucket_id: batch.bucket().bucket_id(),
+            base_offset: batch.base_offset(),
+        });
+    }
+    Ok(ffi::FfiArrowRecordBatches { batches: exported })
+}

From 21585a56804679695eaee82da7c3faf3ae6ad1a8 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Tue, 3 Feb 2026 23:55:05 +0800
Subject: [PATCH 103/287] chore: make Config#bootstrap_server required (#233)

---
 fluss-rust/bindings/cpp/src/lib.rs            |  2 +-
 fluss-rust/bindings/python/src/config.rs      |  6 +--
 .../crates/examples/src/example_kv_table.rs   |  2 +-
 .../src/example_partitioned_kv_table.rs       |  2 +-
 .../crates/examples/src/example_table.rs      |  2 +-
 .../crates/fluss/src/client/connection.rs     |  6 +--
 .../crates/fluss/src/client/table/scanner.rs  |  8 ++--
 fluss-rust/crates/fluss/src/config.rs         | 38 +++++++++++--------
 .../fluss/tests/integration/fluss_cluster.rs  |  2 +-
 9 files changed, 36 insertions(+), 32 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index e0835985e2..11e9105af1 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -298,7 +298,7 @@ fn err_result(code: i32, msg: String) -> ffi::FfiResult {
 // Connection implementation
 fn new_connection(bootstrap_server: &str) -> Result<*mut Connection, String> {
     let config = fluss::config::Config {
-        bootstrap_server: Some(bootstrap_server.to_string()),
+        bootstrap_server: bootstrap_server.to_string(),
         ..Default::default()
     };
 
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index 70bd9cd770..1e80dbf3c9 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -40,7 +40,7 @@ impl Config {
 
                 match key.as_str() {
                     "bootstrap.servers" => {
-                        config.bootstrap_server = Some(value);
+                        config.bootstrap_server = value;
                     }
                     "request.max.size" => {
                         if let Ok(size) = value.parse::<i32>() {
@@ -72,14 +72,14 @@ impl Config {
 
     /// Get the bootstrap server
     #[getter]
-    fn bootstrap_server(&self) -> Option<String> {
+    fn bootstrap_server(&self) -> String {
         self.inner.bootstrap_server.clone()
     }
 
     /// Set the bootstrap server
     #[setter]
     fn set_bootstrap_server(&mut self, server: String) {
-        self.inner.bootstrap_server = Some(server);
+        self.inner.bootstrap_server = server;
     }
 
     /// Get the request max size
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 437da06b4c..325d842a58 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -26,7 +26,7 @@ use fluss::row::{GenericRow, InternalRow};
 #[allow(dead_code)]
 pub async fn main() -> Result<()> {
     let mut config = Config::parse();
-    config.bootstrap_server = Some("127.0.0.1:9123".to_string());
+    config.bootstrap_server = "127.0.0.1:9123".to_string();
 
     let conn = FlussConnection::new(config).await?;
 
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index 1b0c3035c4..ab28758043 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -27,7 +27,7 @@ use std::collections::HashMap;
 #[allow(dead_code)]
 pub async fn main() -> Result<()> {
     let mut config = Config::parse();
-    config.bootstrap_server = Some("127.0.0.1:9123".to_string());
+    config.bootstrap_server = "127.0.0.1:9123".to_string();
 
     let conn = FlussConnection::new(config).await?;
 
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index 6c74e635ac..ae21b1ba5c 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -30,7 +30,7 @@ use tokio::try_join;
 #[tokio::main]
 pub async fn main() -> Result<()> {
     let mut config = Config::parse();
-    config.bootstrap_server = Some("127.0.0.1:9123".to_string());
+    config.bootstrap_server = "127.0.0.1:9123".to_string();
 
     let conn = FlussConnection::new(config).await?;
 
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index e021011807..4dcefbb012 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -37,11 +37,7 @@ pub struct FlussConnection {
 impl FlussConnection {
     pub async fn new(arg: Config) -> Result<Self> {
         let connections = Arc::new(RpcClient::new());
-        let metadata = Metadata::new(
-            arg.bootstrap_server.as_ref().unwrap().as_str(),
-            connections.clone(),
-        )
-        .await?;
+        let metadata = Metadata::new(arg.bootstrap_server.as_str(), connections.clone()).await?;
 
         Ok(FlussConnection {
             metadata: Arc::new(metadata),
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 10e7fff5bf..d30c5d5554 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -87,8 +87,8 @@ impl<'a> TableScan<'a> {
     ///
     /// # pub async fn example() -> Result<()> {
     ///     let mut config = Config::default();
-    ///     config.bootstrap_server = Some("127.0.0.1:9123".to_string());
-    ///     let conn = FlussConnection::new(config).await?;
+    ///     config.bootstrap_server = "127.0.0.1:9123".to_string();
+    ///     let conn = FlussConnection::new(config).await?;
     ///
     ///     let table_descriptor = TableDescriptor::builder()
     ///         .schema(
@@ -163,8 +163,8 @@ impl<'a> TableScan<'a> {
     ///
     /// # pub async fn example() -> Result<()> {
     ///     let mut config = Config::default();
-    ///     config.bootstrap_server = Some("127.0.0.1:9123".to_string());
-    ///     let conn = FlussConnection::new(config).await?;
+    ///     config.bootstrap_server = "127.0.0.1:9123".to_string();
+    ///     let conn = FlussConnection::new(config).await?;
     ///
     ///     let table_descriptor = TableDescriptor::builder()
     ///         .schema(
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 705e241da0..972d15c622 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -18,46 +18,54 @@
 use clap::Parser;
 use serde::{Deserialize, Serialize};
 
+const DEFAULT_BOOTSTRAP_SERVER: &str = "127.0.0.1:9123";
+const DEFAULT_REQUEST_MAX_SIZE: i32 = 10 * 1024 * 1024; // 10 * 2^20 (presumably bytes — confirm)
+const DEFAULT_WRITER_BATCH_SIZE: i32 = 2 * 1024 * 1024; // 2 * 2^20 (presumably bytes — confirm)
+const DEFAULT_RETRIES: i32 = i32::MAX;
+const DEFAULT_PREFETCH_NUM: usize = 4; // remote log segments to prefetch
+const DEFAULT_DOWNLOAD_THREADS: usize = 3; // concurrent remote log downloads
+
+const DEFAULT_ACKS: &str = "all";
+
 #[derive(Parser, Debug, Clone, Deserialize, Serialize)]
 #[command(author, version, about, long_about = None)]
 pub struct Config {
-    #[arg(long)]
-    #[serde(skip_serializing_if = "Option::is_none")]
-    pub bootstrap_server: Option<String>,
+    #[arg(long, default_value_t = String::from(DEFAULT_BOOTSTRAP_SERVER))]
+    pub bootstrap_server: String, // no longer optional; the CLI default is DEFAULT_BOOTSTRAP_SERVER
 
-    #[arg(long, default_value_t = 10 * 1024 * 1024)]
+    #[arg(long, default_value_t = DEFAULT_REQUEST_MAX_SIZE)]
     pub request_max_size: i32,
 
-    #[arg(long, default_value_t = String::from("all"))]
+    #[arg(long, default_value_t = String::from(DEFAULT_ACKS))]
     pub writer_acks: String,
 
-    #[arg(long, default_value_t = i32::MAX)]
+    #[arg(long, default_value_t = DEFAULT_RETRIES)]
     pub writer_retries: i32,
 
-    #[arg(long, default_value_t = 2 * 1024 * 1024)]
+    #[arg(long, default_value_t = DEFAULT_WRITER_BATCH_SIZE)]
     pub writer_batch_size: i32,
 
     /// Maximum number of remote log segments to prefetch
     /// Default: 4 (matching Java CLIENT_SCANNER_REMOTE_LOG_PREFETCH_NUM)
-    #[arg(long, default_value_t = 4)]
+    #[arg(long, default_value_t = DEFAULT_PREFETCH_NUM)]
     pub scanner_remote_log_prefetch_num: usize,
 
     /// Maximum concurrent remote log downloads
     /// Default: 3 (matching Java REMOTE_FILE_DOWNLOAD_THREAD_NUM)
-    #[arg(long, default_value_t = 3)]
+    #[arg(long, default_value_t = DEFAULT_DOWNLOAD_THREADS)]
     pub scanner_remote_log_download_threads: usize,
 }
 
 impl Default for Config {
     fn default() -> Self {
         Self {
-            bootstrap_server: None,
-            request_max_size: 10 * 1024 * 1024,
-            writer_acks: String::from("all"),
-            writer_retries: i32::MAX,
-            writer_batch_size: 2 * 1024 * 1024,
-            scanner_remote_log_prefetch_num: 4,
-            scanner_remote_log_download_threads: 3,
+            bootstrap_server: String::from(DEFAULT_BOOTSTRAP_SERVER),
+            request_max_size: DEFAULT_REQUEST_MAX_SIZE,
+            writer_acks: String::from(DEFAULT_ACKS),
+            writer_retries: DEFAULT_RETRIES, // same constant as the clap default, so the two cannot drift
+            writer_batch_size: DEFAULT_WRITER_BATCH_SIZE,
+            scanner_remote_log_prefetch_num: DEFAULT_PREFETCH_NUM,
+            scanner_remote_log_download_threads: DEFAULT_DOWNLOAD_THREADS,
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
index 21422df6a0..a579303cf0 100644
--- a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
+++ b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
@@ -242,7 +242,7 @@ impl FlussTestingCluster {
     pub async fn get_fluss_connection(&self) -> FlussConnection {
         let mut config = Config::default();
         config.writer_acks = "all".to_string();
-        config.bootstrap_server = Some(self.bootstrap_servers.clone());
+        config.bootstrap_server = self.bootstrap_servers.clone();
 
         // Retry mechanism: retry for up to 1 minute
         let max_retries = 60; // 60 retry attempts

From b399e8e49fb4411160fe0b980dc6fc7c06f5c8a3 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Wed, 4 Feb 2026 07:43:24 +0800
Subject: [PATCH 104/287] chore: accept Into<String> to improve api usage
 (#234)

---
 fluss-rust/bindings/python/src/metadata.rs    |   6 +-
 .../crates/examples/src/example_kv_table.rs   |   4 +-
 .../src/example_partitioned_kv_table.rs       |  10 +-
 .../crates/examples/src/example_table.rs      |   2 +-
 .../src/client/table/log_fetch_buffer.rs      |  10 +-
 .../src/client/table/partition_getter.rs      |  46 ++-----
 .../crates/fluss/src/client/table/upsert.rs   |  30 ++---
 .../crates/fluss/src/metadata/database.rs     |  18 +--
 .../crates/fluss/src/metadata/datatype.rs     |  36 +++---
 .../crates/fluss/src/metadata/json_serde.rs   |  16 +--
 .../crates/fluss/src/metadata/partition.rs    |  10 +-
 fluss-rust/crates/fluss/src/metadata/table.rs | 117 ++++++++++++------
 fluss-rust/crates/fluss/src/record/arrow.rs   |  12 +-
 .../src/record/kv/kv_record_read_context.rs   |   2 +-
 fluss-rust/crates/fluss/src/test_utils.rs     |   6 +-
 .../crates/fluss/tests/integration/admin.rs   |  30 ++---
 .../fluss/tests/integration/kv_table.rs       |  23 ++--
 .../fluss/tests/integration/log_table.rs      |  20 ++-
 .../tests/integration/table_remote_scan.rs    |   5 +-
 .../crates/fluss/tests/integration/utils.rs   |   2 +-
 20 files changed, 194 insertions(+), 211 deletions(-)

diff --git a/fluss-rust/bindings/python/src/metadata.rs b/fluss-rust/bindings/python/src/metadata.rs
index bc5f288071..235df56ba7 100644
--- a/fluss-rust/bindings/python/src/metadata.rs
+++ b/fluss-rust/bindings/python/src/metadata.rs
@@ -218,11 +218,11 @@ impl TableDescriptor {
         schema: &Schema, // fluss schema
         kwargs: Option<&Bound<'_, PyDict>>,
     ) -> PyResult<Self> {
-        let mut partition_keys = Vec::new();
+        let mut partition_keys: Vec<String> = Vec::new();
         let mut bucket_count = None;
         let mut bucket_keys = Vec::new();
-        let mut properties = std::collections::HashMap::new();
-        let mut custom_properties = std::collections::HashMap::new();
+        let mut properties: HashMap<String, String> = HashMap::new();
+        let mut custom_properties: HashMap<String, String> = HashMap::new();
         let mut comment: Option<String> = None;
         let mut log_format = None;
         let mut kv_format = None;
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 325d842a58..042e38413d 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -36,12 +36,12 @@ pub async fn main() -> Result<()> {
                 .column("id", DataTypes::int())
                 .column("name", DataTypes::string())
                 .column("age", DataTypes::bigint())
-                .primary_key(vec!["id".to_string()])
+                .primary_key(vec!["id"])
                 .build()?,
         )
         .build()?;
 
-    let table_path = TablePath::new("fluss".to_owned(), "rust_upsert_lookup_example".to_owned());
+    let table_path = TablePath::new("fluss", "rust_upsert_lookup_example");
 
     let admin = conn.get_admin().await?;
     admin
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index ab28758043..d1b6814cbd 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -38,17 +38,13 @@ pub async fn main() -> Result<()> {
                 .column("region", DataTypes::string())
                 .column("zone", DataTypes::bigint())
                 .column("score", DataTypes::bigint())
-                .primary_key(vec![
-                    "id".to_string(),
-                    "region".to_string(),
-                    "zone".to_string(),
-                ])
+                .primary_key(vec!["id", "region", "zone"])
                 .build()?,
         )
-        .partitioned_by(vec!["region".to_string(), "zone".to_string()])
+        .partitioned_by(vec!["region", "zone"])
         .build()?;
 
-    let table_path = TablePath::new("fluss".to_owned(), "partitioned_kv_example".to_owned());
+    let table_path = TablePath::new("fluss", "partitioned_kv_example");
 
     let mut admin = conn.get_admin().await?;
     admin
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index ae21b1ba5c..733b13e447 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -44,7 +44,7 @@ pub async fn main() -> Result<()> {
         )
         .build()?;
 
-    let table_path = TablePath::new("fluss".to_owned(), "rust_test_long".to_owned());
+    let table_path = TablePath::new("fluss", "rust_test_long");
 
     let admin = conn.get_admin().await?;
 
diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index b622f19a08..edab91d5cf 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -840,11 +840,7 @@ mod tests {
     use std::sync::Arc;
 
     fn test_read_context() -> Result<ReadContext> {
-        let row_type = RowType::new(vec![DataField::new(
-            "id".to_string(),
-            DataTypes::int(),
-            None,
-        )]);
+        let row_type = RowType::new(vec![DataField::new("id", DataTypes::int(), None)]);
         Ok(ReadContext::new(to_arrow_schema(&row_type)?, false))
     }
 
@@ -897,8 +893,8 @@ mod tests {
     #[test]
     fn default_completed_fetch_reads_records() -> Result<()> {
         let row_type = RowType::new(vec![
-            DataField::new("id".to_string(), DataTypes::int(), None),
-            DataField::new("name".to_string(), DataTypes::string(), None),
+            DataField::new("id", DataTypes::int(), None),
+            DataField::new("name", DataTypes::string(), None),
         ]);
         let table_path = TablePath::new("db".to_string(), "tbl".to_string());
         let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
diff --git a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
index 913680198d..a1aad2d83e 100644
--- a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
+++ b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
@@ -109,12 +109,8 @@ mod tests {
     #[test]
     fn test_partition_getter_single_key() {
         let row_type = RowType::new(vec![
-            DataField::new("id".to_string(), DataType::Int(IntType::new()), None),
-            DataField::new(
-                "region".to_string(),
-                DataType::String(StringType::new()),
-                None,
-            ),
+            DataField::new("id", DataType::Int(IntType::new()), None),
+            DataField::new("region", DataType::String(StringType::new()), None),
         ]);
 
         let getter = PartitionGetter::new(&row_type, Arc::from(["region".to_string()]))
@@ -128,17 +124,9 @@ mod tests {
     #[test]
     fn test_partition_getter_multiple_keys() {
         let row_type = RowType::new(vec![
-            DataField::new("id".to_string(), DataType::Int(IntType::new()), None),
-            DataField::new(
-                "date".to_string(),
-                DataType::String(StringType::new()),
-                None,
-            ),
-            DataField::new(
-                "region".to_string(),
-                DataType::String(StringType::new()),
-                None,
-            ),
+            DataField::new("id", DataType::Int(IntType::new()), None),
+            DataField::new("date", DataType::String(StringType::new()), None),
+            DataField::new("region", DataType::String(StringType::new()), None),
         ]);
 
         let getter = PartitionGetter::new(
@@ -159,7 +147,7 @@ mod tests {
     #[test]
     fn test_partition_getter_invalid_column() {
         let row_type = RowType::new(vec![DataField::new(
-            "id".to_string(),
+            "id",
             DataType::Int(IntType::new()),
             None,
         )]);
@@ -171,12 +159,8 @@ mod tests {
     #[test]
     fn test_partition_getter_null_value() {
         let row_type = RowType::new(vec![
-            DataField::new("id".to_string(), DataType::Int(IntType::new()), None),
-            DataField::new(
-                "region".to_string(),
-                DataType::String(StringType::new()),
-                None,
-            ),
+            DataField::new("id", DataType::Int(IntType::new()), None),
+            DataField::new("region", DataType::String(StringType::new()), None),
         ]);
 
         let getter = PartitionGetter::new(&row_type, Arc::from(["region".to_string()]))
@@ -190,17 +174,9 @@ mod tests {
     #[test]
     fn test_get_partition_spec() {
         let row_type = RowType::new(vec![
-            DataField::new("id".to_string(), DataType::Int(IntType::new()), None),
-            DataField::new(
-                "date".to_string(),
-                DataType::String(StringType::new()),
-                None,
-            ),
-            DataField::new(
-                "region".to_string(),
-                DataType::String(StringType::new()),
-                None,
-            ),
+            DataField::new("id", DataType::Int(IntType::new()), None),
+            DataField::new("date", DataType::String(StringType::new()), None),
+            DataField::new("region", DataType::String(StringType::new()), None),
         ]);
 
         let getter = PartitionGetter::new(
diff --git a/fluss-rust/crates/fluss/src/client/table/upsert.rs b/fluss-rust/crates/fluss/src/client/table/upsert.rs
index 05953971af..bb6c651075 100644
--- a/fluss-rust/crates/fluss/src/client/table/upsert.rs
+++ b/fluss-rust/crates/fluss/src/client/table/upsert.rs
@@ -403,8 +403,8 @@ mod tests {
     fn sanity_check() {
         // No target columns specified but table has auto-increment column
         let fields = vec![
-            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
-            DataField::new("name".to_string(), DataTypes::string(), None),
+            DataField::new("id", DataTypes::int().as_non_nullable(), None),
+            DataField::new("name", DataTypes::string(), None),
         ];
         let row_type = RowType::new(fields);
         let primary_keys = vec!["id".to_string()];
@@ -424,9 +424,9 @@ mod tests {
 
         // Target columns do not contain primary key
         let fields = vec![
-            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
-            DataField::new("name".to_string(), DataTypes::string(), None),
-            DataField::new("value".to_string(), DataTypes::int(), None),
+            DataField::new("id", DataTypes::int().as_non_nullable(), None),
+            DataField::new("name", DataTypes::string(), None),
+            DataField::new("value", DataTypes::int(), None),
         ];
         let row_type = RowType::new(fields);
         let primary_keys = vec!["id".to_string()];
@@ -449,8 +449,8 @@ mod tests {
 
         // Primary key column not found in row type
         let fields = vec![
-            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
-            DataField::new("name".to_string(), DataTypes::string(), None),
+            DataField::new("id", DataTypes::int().as_non_nullable(), None),
+            DataField::new("name", DataTypes::string(), None),
         ];
         let row_type = RowType::new(fields);
         let primary_keys = vec!["nonexistent_pk".to_string()];
@@ -473,13 +473,9 @@ mod tests {
 
         // Target columns include auto-increment column
         let fields = vec![
-            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
-            DataField::new(
-                "seq".to_string(),
-                DataTypes::bigint().as_non_nullable(),
-                None,
-            ),
-            DataField::new("name".to_string(), DataTypes::string(), None),
+            DataField::new("id", DataTypes::int().as_non_nullable(), None),
+            DataField::new("seq", DataTypes::bigint().as_non_nullable(), None),
+            DataField::new("name", DataTypes::string(), None),
         ];
         let row_type = RowType::new(fields);
         let primary_keys = vec!["id".to_string()];
@@ -499,13 +495,13 @@ mod tests {
 
         // Non-nullable column not in target columns (partial update requires nullable)
         let fields = vec![
-            DataField::new("id".to_string(), DataTypes::int().as_non_nullable(), None),
+            DataField::new("id", DataTypes::int().as_non_nullable(), None),
             DataField::new(
-                "required_field".to_string(),
+                "required_field",
                 DataTypes::string().as_non_nullable(),
                 None,
             ),
-            DataField::new("optional_field".to_string(), DataTypes::int(), None),
+            DataField::new("optional_field", DataTypes::int(), None),
         ];
         let row_type = RowType::new(fields);
         let primary_keys = vec!["id".to_string()];
diff --git a/fluss-rust/crates/fluss/src/metadata/database.rs b/fluss-rust/crates/fluss/src/metadata/database.rs
index fad1498f58..15fefb5496 100644
--- a/fluss-rust/crates/fluss/src/metadata/database.rs
+++ b/fluss-rust/crates/fluss/src/metadata/database.rs
@@ -89,19 +89,23 @@ impl DatabaseDescriptor {
 }
 
 impl DatabaseDescriptorBuilder {
-    pub fn comment(mut self, comment: &str) -> Self {
-        self.comment = Some(comment.to_string());
+    pub fn comment<C: Into<String>>(mut self, comment: C) -> Self {
+        self.comment = Some(comment.into());
         self
     }
 
-    pub fn custom_properties(mut self, properties: HashMap<String, String>) -> Self {
-        self.custom_properties = properties;
+    pub fn custom_properties<K: Into<String>, V: Into<String>>(
+        mut self,
+        properties: HashMap<K, V>,
+    ) -> Self {
+        for (k, v) in properties {
+            self.custom_properties.insert(k.into(), v.into());
+        }
         self
     }
 
-    pub fn custom_property(mut self, key: &str, value: &str) -> Self {
-        self.custom_properties
-            .insert(key.to_string(), value.to_string());
+    pub fn custom_property<K: Into<String>, V: Into<String>>(mut self, key: K, value: V) -> Self {
+        self.custom_properties.insert(key.into(), value.into());
         self
     }
 
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 6431d3a97d..3da270bc6a 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -1114,13 +1114,13 @@ impl DataTypes {
     }
 
     /// Field definition with field name and data type.
-    pub fn field(name: String, data_type: DataType) -> DataField {
+    pub fn field<N: Into<String>>(name: N, data_type: DataType) -> DataField {
         DataField::new(name, data_type, None)
     }
 
     /// Field definition with field name, data type, and a description.
-    pub fn field_with_description(
-        name: String,
+    pub fn field_with_description<N: Into<String>>(
+        name: N,
         data_type: DataType,
         description: String,
     ) -> DataField {
@@ -1151,9 +1151,13 @@ pub struct DataField {
 }
 
 impl DataField {
-    pub fn new(name: String, data_type: DataType, description: Option<String>) -> DataField {
+    pub fn new<N: Into<String>>(
+        name: N,
+        data_type: DataType,
+        description: Option<String>,
+    ) -> DataField {
         DataField {
-            name,
+            name: name.into(),
             data_type,
             description,
         }
@@ -1318,13 +1322,13 @@ fn test_map_display() {
 #[test]
 fn test_row_display() {
     let fields = vec![
-        DataTypes::field("id".to_string(), DataTypes::int()),
-        DataTypes::field("name".to_string(), DataTypes::string()),
+        DataTypes::field("id", DataTypes::int()),
+        DataTypes::field("name", DataTypes::string()),
     ];
     let row_type = RowType::new(fields);
     assert_eq!(row_type.to_string(), "ROW<id INT, name STRING>");
 
-    let fields_non_null = vec![DataTypes::field("age".to_string(), DataTypes::bigint())];
+    let fields_non_null = vec![DataTypes::field("age", DataTypes::bigint())];
     let row_type_non_null = RowType::with_nullable(false, fields_non_null);
     assert_eq!(row_type_non_null.to_string(), "ROW<age BIGINT> NOT NULL");
 }
@@ -1354,23 +1358,23 @@ fn test_datatype_display() {
 
 #[test]
 fn test_datafield_display() {
-    let field = DataTypes::field("user_id".to_string(), DataTypes::bigint());
+    let field = DataTypes::field("user_id", DataTypes::bigint());
     assert_eq!(field.to_string(), "user_id BIGINT");
 
-    let field2 = DataTypes::field("email".to_string(), DataTypes::string());
+    let field2 = DataTypes::field("email", DataTypes::string());
     assert_eq!(field2.to_string(), "email STRING");
 
-    let field3 = DataTypes::field("score".to_string(), DataTypes::decimal(10, 2));
+    let field3 = DataTypes::field("score", DataTypes::decimal(10, 2));
     assert_eq!(field3.to_string(), "score DECIMAL(10, 2)");
 }
 
 #[test]
 fn test_complex_nested_display() {
     let row_type = DataTypes::row(vec![
-        DataTypes::field("id".to_string(), DataTypes::int()),
-        DataTypes::field("tags".to_string(), DataTypes::array(DataTypes::string())),
+        DataTypes::field("id", DataTypes::int()),
+        DataTypes::field("tags", DataTypes::array(DataTypes::string())),
         DataTypes::field(
-            "metadata".to_string(),
+            "metadata",
             DataTypes::map(DataTypes::string(), DataTypes::string()),
         ),
     ]);
@@ -1394,8 +1398,8 @@ fn test_deeply_nested_types() {
     let nested = DataTypes::array(DataTypes::map(
         DataTypes::string(),
         DataTypes::row(vec![
-            DataTypes::field("x".to_string(), DataTypes::int()),
-            DataTypes::field("y".to_string(), DataTypes::int()),
+            DataTypes::field("x", DataTypes::int()),
+            DataTypes::field("y", DataTypes::int()),
         ]),
     ));
     assert_eq!(nested.to_string(), "ARRAY<MAP<STRING, ROW<x INT, y INT>>>");
diff --git a/fluss-rust/crates/fluss/src/metadata/json_serde.rs b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
index d0d56ef286..d58fb7ee8e 100644
--- a/fluss-rust/crates/fluss/src/metadata/json_serde.rs
+++ b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
@@ -403,8 +403,7 @@ impl JsonSerde for Column {
             .and_then(|v| v.as_str())
             .ok_or_else(|| Error::JsonSerdeError {
                 message: format!("Missing required field: {}", Self::NAME),
-            })?
-            .to_string();
+            })?;
 
         let data_type_node = node
             .get(Self::DATA_TYPE)
@@ -414,7 +413,7 @@ impl JsonSerde for Column {
 
         let data_type = DataType::deserialize_json(data_type_node)?;
 
-        let mut column = Column::new(&name, data_type);
+        let mut column = Column::new(name, data_type);
 
         if let Some(comment) = node.get(Self::COMMENT).and_then(|v| v.as_str()) {
             column = column.with_comment(comment);
@@ -483,14 +482,9 @@ impl JsonSerde for Schema {
 
             let mut primary_keys = Vec::with_capacity(pk_array.len());
             for name_node in pk_array {
-                primary_keys.push(
-                    name_node
-                        .as_str()
-                        .ok_or_else(|| Error::InvalidTableError {
-                            message: "Primary key element must be a string".to_string(),
-                        })?
-                        .to_string(),
-                );
+                primary_keys.push(name_node.as_str().ok_or_else(|| Error::InvalidTableError {
+                    message: "Primary key element must be a string".to_string(),
+                })?);
             }
 
             schema_builder = schema_builder.primary_key(primary_keys);
diff --git a/fluss-rust/crates/fluss/src/metadata/partition.rs b/fluss-rust/crates/fluss/src/metadata/partition.rs
index bc1935c3c8..18402354a5 100644
--- a/fluss-rust/crates/fluss/src/metadata/partition.rs
+++ b/fluss-rust/crates/fluss/src/metadata/partition.rs
@@ -31,8 +31,14 @@ pub struct PartitionSpec {
 }
 
 impl PartitionSpec {
-    pub fn new(partition_spec: HashMap<String, String>) -> Self {
-        Self { partition_spec }
+    pub fn new<K: Into<String>, V: Into<String>>(partition_spec: HashMap<K, V>) -> Self {
+        let mut new_map = HashMap::new();
+        for (k, v) in partition_spec {
+            new_map.insert(k.into(), v.into());
+        }
+        Self {
+            partition_spec: new_map,
+        }
     }
 
     pub fn get_spec_map(&self) -> &HashMap<String, String> {
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index ce362c43be..908f446914 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -36,16 +36,16 @@ pub struct Column {
 }
 
 impl Column {
-    pub fn new(name: &str, data_type: DataType) -> Self {
+    pub fn new<N: Into<String>>(name: N, data_type: DataType) -> Self {
         Self {
-            name: name.to_string(),
+            name: name.into(),
             data_type,
             comment: None,
         }
     }
 
-    pub fn with_comment(mut self, comment: &str) -> Self {
-        self.comment = Some(comment.to_string());
+    pub fn with_comment<C: Into<String>>(mut self, comment: C) -> Self {
+        self.comment = Some(comment.into());
         self
     }
 
@@ -78,9 +78,9 @@ pub struct PrimaryKey {
 }
 
 impl PrimaryKey {
-    pub fn new(constraint_name: &str, column_names: Vec<String>) -> Self {
+    pub fn new<N: Into<String>>(constraint_name: N, column_names: Vec<String>) -> Self {
         Self {
-            constraint_name: constraint_name.to_string(),
+            constraint_name: constraint_name.into(),
             column_names,
         }
     }
@@ -178,8 +178,8 @@ impl SchemaBuilder {
         }
     }
 
-    pub fn column(mut self, name: &str, data_type: DataType) -> Self {
-        self.columns.push(Column::new(name, data_type));
+    pub fn column<N: Into<String>>(mut self, name: N, data_type: DataType) -> Self {
+        self.columns.push(Column::new(name.into(), data_type));
         self
     }
 
@@ -188,20 +188,34 @@ impl SchemaBuilder {
         self
     }
 
-    pub fn with_comment(mut self, comment: &str) -> Self {
+    pub fn with_comment<C: Into<String>>(mut self, comment: C) -> Self {
         if let Some(last) = self.columns.last_mut() {
-            *last = last.clone().with_comment(comment);
+            *last = last.clone().with_comment(comment.into());
         }
         self
     }
 
-    pub fn primary_key(self, column_names: Vec<String>) -> Self {
-        let constraint_name = format!("PK_{}", column_names.join("_"));
-        self.primary_key_named(&constraint_name, column_names)
+    pub fn primary_key<I, S>(self, column_names: I) -> Self
+    where
+        I: IntoIterator<Item = S>,
+        S: Into<String>,
+    {
+        let names: Vec<String> = column_names.into_iter().map(|s| s.into()).collect();
+
+        let constraint_name = format!("PK_{}", names.join("_"));
+
+        self.primary_key_named(&constraint_name, names)
     }
 
-    pub fn primary_key_named(mut self, constraint_name: &str, column_names: Vec<String>) -> Self {
-        self.primary_key = Some(PrimaryKey::new(constraint_name, column_names));
+    pub fn primary_key_named<N: Into<String>, P: Into<String>>(
+        mut self,
+        constraint_name: N,
+        column_names: Vec<P>,
+    ) -> Self {
+        self.primary_key = Some(PrimaryKey::new(
+            constraint_name.into(),
+            column_names.into_iter().map(|s| s.into()).collect(),
+        ));
         self
     }
 
@@ -209,14 +223,14 @@ impl SchemaBuilder {
     /// whenever a new row is inserted into the table, the new row will be assigned with the next
     /// available value from the auto-increment sequence. A table can have at most one auto
     /// increment column.
-    pub fn enable_auto_increment(mut self, column_name: &str) -> Result<Self> {
+    pub fn enable_auto_increment<N: Into<String>>(mut self, column_name: N) -> Result<Self> {
         if !self.auto_increment_col_names.is_empty() {
             return Err(IllegalArgument {
                 message: "Multiple auto increment columns are not supported yet.".to_string(),
             });
         }
 
-        self.auto_increment_col_names.push(column_name.to_string());
+        self.auto_increment_col_names.push(column_name.into());
         Ok(self)
     }
 
@@ -353,29 +367,43 @@ impl TableDescriptorBuilder {
         self
     }
 
-    pub fn property<T: ToString>(mut self, key: &str, value: T) -> Self {
-        self.properties.insert(key.to_string(), value.to_string());
+    pub fn property<K: Into<String>, V: Into<String>>(mut self, key: K, value: V) -> Self {
+        self.properties.insert(key.into(), value.into());
         self
     }
 
-    pub fn properties(mut self, properties: HashMap<String, String>) -> Self {
-        self.properties.extend(properties);
+    pub fn properties<K: Into<String>, V: Into<String>>(
+        mut self,
+        properties: HashMap<K, V>,
+    ) -> Self {
+        for (k, v) in properties {
+            self.properties.insert(k.into(), v.into());
+        }
         self
     }
 
-    pub fn custom_property(mut self, key: &str, value: &str) -> Self {
-        self.custom_properties
-            .insert(key.to_string(), value.to_string());
+    pub fn custom_property<K: Into<String>, V: Into<String>>(mut self, key: K, value: V) -> Self {
+        self.custom_properties.insert(key.into(), value.into());
         self
     }
 
-    pub fn custom_properties(mut self, custom_properties: HashMap<String, String>) -> Self {
-        self.custom_properties.extend(custom_properties);
+    pub fn custom_properties<K: Into<String>, V: Into<String>>(
+        mut self,
+        custom_properties: HashMap<K, V>,
+    ) -> Self {
+        for (k, v) in custom_properties {
+            self.custom_properties.insert(k.into(), v.into());
+        }
         self
     }
 
-    pub fn partitioned_by(mut self, partition_keys: Vec<String>) -> Self {
-        self.partition_keys = Arc::from(partition_keys);
+    pub fn partitioned_by<P: Into<String>>(mut self, partition_keys: Vec<P>) -> Self {
+        self.partition_keys = Arc::from(
+            partition_keys
+                .into_iter()
+                .map(|s| s.into())
+                .collect::<Vec<String>>(),
+        );
         self
     }
 
@@ -387,8 +415,8 @@ impl TableDescriptorBuilder {
         self
     }
 
-    pub fn comment(mut self, comment: &str) -> Self {
-        self.comment = Some(comment.to_string());
+    pub fn comment<S: Into<String>>(mut self, comment: S) -> Self {
+        self.comment = Some(comment.into());
         self
     }
 
@@ -487,9 +515,16 @@ impl TableDescriptor {
             })
     }
 
-    pub fn with_properties(&self, new_properties: HashMap<String, String>) -> Self {
+    pub fn with_properties<K: Into<String>, V: Into<String>>(
+        &self,
+        new_properties: HashMap<K, V>,
+    ) -> Self {
+        let mut properties = HashMap::new();
+        for (k, v) in new_properties {
+            properties.insert(k.into(), v.into());
+        }
         Self {
-            properties: new_properties,
+            properties,
             ..self.clone()
         }
     }
@@ -684,10 +719,10 @@ const MAX_NAME_LENGTH: usize = 200;
 const INTERNAL_NAME_PREFIX: &str = "__";
 
 impl TablePath {
-    pub fn new(db: String, tbl: String) -> Self {
+    pub fn new<D: Into<String>, T: Into<String>>(db: D, tbl: T) -> Self {
         TablePath {
-            database: db,
-            table: tbl,
+            database: db.into(),
+            table: tbl.into(),
         }
     }
 
@@ -769,14 +804,14 @@ impl PhysicalTablePath {
         }
     }
 
-    pub fn of_with_names(
-        database_name: String,
-        table_name: String,
-        partition_name: Option<String>,
+    pub fn of_with_names<D: Into<String>, T: Into<String>, P: Into<String>>(
+        database_name: D,
+        table_name: T,
+        partition_name: Option<P>,
     ) -> Self {
         Self {
             table_path: Arc::new(TablePath::new(database_name, table_name)),
-            partition_name,
+            partition_name: partition_name.map(|p| p.into()),
         }
     }
 
@@ -1122,7 +1157,7 @@ impl TableInfo {
             .custom_properties(self.custom_properties.clone());
 
         if let Some(comment) = &self.comment {
-            builder = builder.comment(&comment.clone());
+            builder = builder.comment(comment.clone());
         }
 
         builder.build()
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index b798896ace..fe2f2f4463 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -1590,8 +1590,8 @@ mod tests {
 
         assert_eq!(
             to_arrow_type(&DataTypes::row(vec![
-                DataTypes::field("f1".to_string(), DataTypes::int()),
-                DataTypes::field("f2".to_string(), DataTypes::string()),
+                DataTypes::field("f1", DataTypes::int()),
+                DataTypes::field("f2", DataTypes::string()),
             ]))
             .unwrap(),
             ArrowDataType::Struct(arrow_schema::Fields::from(vec![
@@ -1654,8 +1654,8 @@ mod tests {
     #[test]
     fn projection_rejects_out_of_bounds_index() {
         let row_type = RowType::new(vec![
-            DataField::new("id".to_string(), DataTypes::int(), None),
-            DataField::new("name".to_string(), DataTypes::string(), None),
+            DataField::new("id", DataTypes::int(), None),
+            DataField::new("name", DataTypes::string(), None),
         ]);
         let schema = to_arrow_schema(&row_type).unwrap();
         let result = ReadContext::with_projection_pushdown(schema, vec![0, 2], false);
@@ -1722,7 +1722,7 @@ mod tests {
 
         // Test 1: Rescaling from scale 3 to scale 2
         let row_type = RowType::new(vec![DataField::new(
-            "amount".to_string(),
+            "amount",
             DataTypes::decimal(10, 2),
             None,
         )]);
@@ -1743,7 +1743,7 @@ mod tests {
 
         // Test 2: Precision overflow (should error)
         let row_type = RowType::new(vec![DataField::new(
-            "amount".to_string(),
+            "amount",
             DataTypes::decimal(5, 2),
             None,
         )]);
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
index 9236321668..77cdbcb1b7 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
@@ -120,7 +120,7 @@ mod tests {
         fn new(data_types: Vec<crate::metadata::DataType>) -> Self {
             let mut builder = Schema::builder();
             for (i, dt) in data_types.iter().enumerate() {
-                builder = builder.column(&format!("field{i}"), dt.clone());
+                builder = builder.column(format!("field{i}"), dt.clone());
             }
             let schema = builder.build().expect("Failed to build schema");
 
diff --git a/fluss-rust/crates/fluss/src/test_utils.rs b/fluss-rust/crates/fluss/src/test_utils.rs
index 8e8fbe4884..752d42244e 100644
--- a/fluss-rust/crates/fluss/src/test_utils.rs
+++ b/fluss-rust/crates/fluss/src/test_utils.rs
@@ -24,11 +24,7 @@ use std::collections::HashMap;
 use std::sync::Arc;
 
 pub(crate) fn build_table_info(table_path: TablePath, table_id: i64, buckets: i32) -> TableInfo {
-    let row_type = DataTypes::row(vec![DataField::new(
-        "id".to_string(),
-        DataTypes::int(),
-        None,
-    )]);
+    let row_type = DataTypes::row(vec![DataField::new("id", DataTypes::int(), None)]);
     let mut schema_builder = Schema::builder().with_row_type(&row_type);
     let schema = schema_builder.build().expect("schema build");
     let table_descriptor = TableDescriptor::builder()
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index e94b67c510..c6c98b85d4 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -64,13 +64,7 @@ mod admin_test {
 
         let db_descriptor = DatabaseDescriptorBuilder::default()
             .comment("test_db")
-            .custom_properties(
-                [
-                    ("k1".to_string(), "v1".to_string()),
-                    ("k2".to_string(), "v2".to_string()),
-                ]
-                .into(),
-            )
+            .custom_properties([("k1", "v1"), ("k2", "v2")].into())
             .build();
 
         let db_name = "test_create_database";
@@ -128,7 +122,7 @@ mod admin_test {
             .expect("Failed to create test database");
 
         let test_table_name = "test_user_table";
-        let table_path = TablePath::new(test_db_name.to_string(), test_table_name.to_string());
+        let table_path = TablePath::new(test_db_name, test_table_name);
 
         // build table schema
         let table_schema = Schema::builder()
@@ -250,25 +244,21 @@ mod admin_test {
             .expect("Failed to create test database");
 
         let test_table_name = "partitioned_table";
-        let table_path = TablePath::new(test_db_name.to_string(), test_table_name.to_string());
+        let table_path = TablePath::new(test_db_name, test_table_name);
 
         let table_schema = Schema::builder()
             .column("id", DataTypes::int())
             .column("name", DataTypes::string())
             .column("dt", DataTypes::string())
             .column("region", DataTypes::string())
-            .primary_key(vec![
-                "id".to_string(),
-                "dt".to_string(),
-                "region".to_string(),
-            ])
+            .primary_key(vec!["id", "dt", "region"])
             .build()
             .expect("Failed to build table schema");
 
         let table_descriptor = TableDescriptor::builder()
             .schema(table_schema)
             .distributed_by(Some(3), vec!["id".to_string()])
-            .partitioned_by(vec!["dt".to_string(), "region".to_string()])
+            .partitioned_by(vec!["dt", "region"])
             .property("table.replication.factor", "1")
             .log_format(LogFormat::ARROW)
             .kv_format(KvFormat::COMPACTED)
@@ -291,8 +281,8 @@ mod admin_test {
         );
 
         let mut partition_values = HashMap::new();
-        partition_values.insert("dt".to_string(), "2024-01-15".to_string());
-        partition_values.insert("region".to_string(), "EMEA".to_string());
+        partition_values.insert("dt", "2024-01-15");
+        partition_values.insert("region", "EMEA");
         let partition_spec = PartitionSpec::new(partition_values);
 
         admin
@@ -317,7 +307,7 @@ mod admin_test {
 
         // list with partial spec filter - should find the partition
         let mut partition_values = HashMap::new();
-        partition_values.insert("dt".to_string(), "2024-01-15".to_string());
+        partition_values.insert("dt", "2024-01-15");
         let partial_partition_spec = PartitionSpec::new(partition_values);
 
         let partitions_with_spec = admin
@@ -337,7 +327,7 @@ mod admin_test {
 
         // list with non-matching spec - should find no partitions
         let mut non_matching_values = HashMap::new();
-        non_matching_values.insert("dt".to_string(), "2024-01-16".to_string());
+        non_matching_values.insert("dt", "2024-01-16");
         let non_matching_spec = PartitionSpec::new(non_matching_values);
         let partitions_non_matching = admin
             .list_partition_infos_with_spec(&table_path, Some(&non_matching_spec))
@@ -382,7 +372,7 @@ mod admin_test {
             .await
             .expect("Failed to get admin client");
 
-        let table_path = TablePath::new("fluss".to_string(), "not_exist".to_string());
+        let table_path = TablePath::new("fluss", "not_exist");
 
         let result = admin.get_table(&table_path).await;
         assert!(result.is_err(), "Expected error but got Ok");
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index 3691d655a4..c419ed900b 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -66,7 +66,7 @@ mod kv_table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss".to_string(), "test_upsert_and_lookup".to_string());
+        let table_path = TablePath::new("fluss", "test_upsert_and_lookup");
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
@@ -74,7 +74,7 @@ mod kv_table_test {
                     .column("id", DataTypes::int())
                     .column("name", DataTypes::string())
                     .column("age", DataTypes::bigint())
-                    .primary_key(vec!["id".to_string()])
+                    .primary_key(vec!["id"])
                     .build()
                     .expect("Failed to build schema"),
             )
@@ -223,7 +223,7 @@ mod kv_table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss".to_string(), "test_composite_pk".to_string());
+        let table_path = TablePath::new("fluss", "test_composite_pk");
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
@@ -231,7 +231,7 @@ mod kv_table_test {
                     .column("region", DataTypes::string())
                     .column("user_id", DataTypes::int())
                     .column("score", DataTypes::bigint())
-                    .primary_key(vec!["region".to_string(), "user_id".to_string()])
+                    .primary_key(vec!["region", "user_id"])
                     .build()
                     .expect("Failed to build schema"),
             )
@@ -335,7 +335,7 @@ mod kv_table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss".to_string(), "test_partial_update".to_string());
+        let table_path = TablePath::new("fluss", "test_partial_update");
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
@@ -344,7 +344,7 @@ mod kv_table_test {
                     .column("name", DataTypes::string())
                     .column("age", DataTypes::bigint())
                     .column("score", DataTypes::bigint())
-                    .primary_key(vec!["id".to_string()])
+                    .primary_key(vec!["id"])
                     .build()
                     .expect("Failed to build schema"),
             )
@@ -446,8 +446,7 @@ mod kv_table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path =
-            TablePath::new("fluss".to_string(), "test_partitioned_kv_table".to_string());
+        let table_path = TablePath::new("fluss", "test_partitioned_kv_table");
 
         // Create a partitioned KV table with region as partition key
         let table_descriptor = TableDescriptor::builder()
@@ -457,11 +456,11 @@ mod kv_table_test {
                     .column("user_id", DataTypes::int())
                     .column("name", DataTypes::string())
                     .column("score", DataTypes::bigint())
-                    .primary_key(vec!["region".to_string(), "user_id".to_string()])
+                    .primary_key(vec!["region", "user_id"])
                     .build()
                     .expect("Failed to build schema"),
             )
-            .partitioned_by(vec!["region".to_string()])
+            .partitioned_by(vec!["region"])
             .build()
             .expect("Failed to build table");
 
@@ -614,7 +613,7 @@ mod kv_table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss".to_string(), "test_all_datatypes".to_string());
+        let table_path = TablePath::new("fluss", "test_all_datatypes");
 
         // Create a table with all supported primitive datatypes
         let table_descriptor = TableDescriptor::builder()
@@ -645,7 +644,7 @@ mod kv_table_test {
                     // Binary types
                     .column("col_bytes", DataTypes::bytes())
                     .column("col_binary", DataTypes::binary(20))
-                    .primary_key(vec!["pk_int".to_string()])
+                    .primary_key(vec!["pk_int"])
                     .build()
                     .expect("Failed to build schema"),
             )
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 27b4d8313f..514df82802 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -69,10 +69,7 @@ mod table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new(
-            "fluss".to_string(),
-            "test_append_record_batch_and_scan".to_string(),
-        );
+        let table_path = TablePath::new("fluss", "test_append_record_batch_and_scan");
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
@@ -171,7 +168,7 @@ mod table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss".to_string(), "test_list_offsets".to_string());
+        let table_path = TablePath::new("fluss", "test_list_offsets");
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
@@ -295,7 +292,7 @@ mod table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss".to_string(), "test_project".to_string());
+        let table_path = TablePath::new("fluss", "test_project");
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
@@ -451,7 +448,7 @@ mod table_test {
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss".to_string(), "test_poll_batches".to_string());
+        let table_path = TablePath::new("fluss", "test_poll_batches");
         let schema = Schema::builder()
             .column("id", DataTypes::int())
             .column("name", DataTypes::string())
@@ -595,7 +592,7 @@ mod table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss".to_string(), "test_log_all_datatypes".to_string());
+        let table_path = TablePath::new("fluss", "test_log_all_datatypes");
 
         // Create a log table with all supported datatypes for append/scan
         let table_descriptor = TableDescriptor::builder()
@@ -983,10 +980,7 @@ mod table_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new(
-            "fluss".to_string(),
-            "test_partitioned_log_append".to_string(),
-        );
+        let table_path = TablePath::new("fluss", "test_partitioned_log_append");
 
         // Create a partitioned log table
         let table_descriptor = TableDescriptor::builder()
@@ -998,7 +992,7 @@ mod table_test {
                     .build()
                     .expect("Failed to build schema"),
             )
-            .partitioned_by(vec!["region".to_string()])
+            .partitioned_by(vec!["region"])
             .build()
             .expect("Failed to build table");
 
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index ce0c1371c0..0efe388247 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -115,10 +115,7 @@ mod table_remote_scan_test {
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new(
-            "fluss".to_string(),
-            "test_append_record_batch_and_scan".to_string(),
-        );
+        let table_path = TablePath::new("fluss", "test_append_record_batch_and_scan");
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index fd5145a73c..ae61d3ad68 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -119,7 +119,7 @@ pub async fn create_partitions(
 ) {
     for value in partition_values {
         let mut partition_map = HashMap::new();
-        partition_map.insert(partition_column.to_string(), value.to_string());
+        partition_map.insert(partition_column, *value);
         admin
             .create_partition(table_path, &PartitionSpec::new(partition_map), true)
             .await

From 9231fb4b2e4cebd13724d23344234396c8fabfc1 Mon Sep 17 00:00:00 2001
From: Miao <one.lemorage@gmail.com>
Date: Wed, 4 Feb 2026 12:06:55 +0800
Subject: [PATCH 105/287] feat: add table partition scanning (#222)

---
 fluss-rust/bindings/python/src/metadata.rs    |   6 +-
 fluss-rust/crates/fluss/src/client/admin.rs   |   6 +-
 .../crates/fluss/src/client/metadata.rs       |   4 +-
 .../crates/fluss/src/client/table/scanner.rs  | 153 +++++++++++++-----
 fluss-rust/crates/fluss/src/metadata/table.rs |   2 +-
 .../fluss/tests/integration/log_table.rs      |  66 +++++++-
 6 files changed, 185 insertions(+), 52 deletions(-)

diff --git a/fluss-rust/bindings/python/src/metadata.rs b/fluss-rust/bindings/python/src/metadata.rs
index 235df56ba7..f422696157 100644
--- a/fluss-rust/bindings/python/src/metadata.rs
+++ b/fluss-rust/bindings/python/src/metadata.rs
@@ -530,7 +530,11 @@ impl TableBucket {
 
     /// Convert to core TableBucket (internal use)
     pub fn to_core(&self) -> fcore::metadata::TableBucket {
-        fcore::metadata::TableBucket::new(self.table_id, self.bucket)
+        fcore::metadata::TableBucket::new_with_partition(
+            self.table_id,
+            self.partition_id,
+            self.bucket,
+        )
     }
 }
 
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 9061169d2a..737ead3d55 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -273,7 +273,11 @@ impl FlussAdmin {
         // Convert proto response to LakeSnapshot
         let mut table_buckets_offset = HashMap::new();
         for bucket_snapshot in response.bucket_snapshots {
-            let table_bucket = TableBucket::new(response.table_id, bucket_snapshot.bucket_id);
+            let table_bucket = TableBucket::new_with_partition(
+                response.table_id,
+                bucket_snapshot.partition_id,
+                bucket_snapshot.bucket_id,
+            );
             if let Some(log_offset) = bucket_snapshot.log_offset {
                 table_buckets_offset.insert(table_bucket, log_offset);
             }
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index c6244cd797..ce00ced2b5 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -259,8 +259,8 @@ mod tests {
         let leader = metadata
             .leader_for(&table_path, &TableBucket::new(1, 0))
             .await
-            .expect("leader request should be Ok")
-            .expect("leader should exist");
+            .unwrap()
+            .expect("leader");
         assert_eq!(leader.id(), 1);
     }
 
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index d30c5d5554..a88964ea97 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -26,7 +26,6 @@ use std::{
 };
 use tempfile::TempDir;
 
-use crate::TableId;
 use crate::client::connection::FlussConnection;
 use crate::client::credentials::SecurityTokenManager;
 use crate::client::metadata::Metadata;
@@ -43,6 +42,7 @@ use crate::record::{
 };
 use crate::rpc::{RpcClient, RpcError, message};
 use crate::util::FairBucketStatusMap;
+use crate::{PartitionId, TableId};
 
 const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
 #[allow(dead_code)]
@@ -88,7 +88,7 @@ impl<'a> TableScan<'a> {
     /// # pub async fn example() -> Result<()> {
     ///     let mut config = Config::default();
     ///     config.bootstrap_server = "127.0.0.1:9123".to_string();
-    ///     let conn = FlussConnection::new(config).await;
+    ///     let conn = FlussConnection::new(config).await?;
     ///
     ///     let table_descriptor = TableDescriptor::builder()
     ///         .schema(
@@ -164,7 +164,7 @@ impl<'a> TableScan<'a> {
     /// # pub async fn example() -> Result<()> {
     ///     let mut config = Config::default();
     ///     config.bootstrap_server = "127.0.0.1:9123".to_string();
-    ///     let conn = FlussConnection::new(config).await;
+    ///     let conn = FlussConnection::new(config).await?;
     ///
     ///     let table_descriptor = TableDescriptor::builder()
     ///         .schema(
@@ -270,6 +270,7 @@ struct LogScannerInner {
     metadata: Arc<Metadata>,
     log_scanner_status: Arc<LogScannerStatus>,
     log_fetcher: LogFetcher,
+    is_partitioned_table: bool,
 }
 
 impl LogScannerInner {
@@ -284,6 +285,7 @@ impl LogScannerInner {
         Ok(Self {
             table_path: table_info.table_path.clone(),
             table_id: table_info.table_id,
+            is_partitioned_table: table_info.is_partitioned(),
             metadata: metadata.clone(),
             log_scanner_status: log_scanner_status.clone(),
             log_fetcher: LogFetcher::new(
@@ -337,6 +339,13 @@ impl LogScannerInner {
     }
 
     async fn subscribe(&self, bucket: i32, offset: i64) -> Result<()> {
+        if self.is_partitioned_table {
+            return Err(Error::UnsupportedOperation {
+                message: "The table is a partitioned table, please use \"subscribe_partition\" to \
+                subscribe a partitioned bucket instead."
+                    .to_string(),
+            });
+        }
         let table_bucket = TableBucket::new(self.table_id, bucket);
         self.metadata
             .check_and_update_table_metadata(from_ref(&self.table_path))
@@ -347,6 +356,13 @@ impl LogScannerInner {
     }
 
     async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
+        if self.is_partitioned_table {
+            return Err(Error::UnsupportedOperation {
+                message:
+                    "The table is a partitioned table, subscribe_batch is not supported currently."
+                        .to_string(),
+            });
+        }
         self.metadata
             .check_and_update_table_metadata(from_ref(&self.table_path))
             .await?;
@@ -368,6 +384,29 @@ impl LogScannerInner {
         Ok(())
     }
 
+    async fn subscribe_partition(
+        &self,
+        partition_id: PartitionId,
+        bucket: i32,
+        offset: i64,
+    ) -> Result<()> {
+        if !self.is_partitioned_table {
+            return Err(Error::UnsupportedOperation {
+                message: "The table is not a partitioned table, please use \"subscribe\" to \
+                subscribe a non-partitioned bucket instead."
+                    .to_string(),
+            });
+        }
+        let table_bucket =
+            TableBucket::new_with_partition(self.table_id, Some(partition_id), bucket);
+        self.metadata
+            .check_and_update_table_metadata(from_ref(&self.table_path))
+            .await?;
+        self.log_scanner_status
+            .assign_scan_bucket(table_bucket, offset);
+        Ok(())
+    }
+
     async fn poll_for_fetches(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
         let result = self.log_fetcher.collect_fetches()?;
         if !result.is_empty() {
@@ -435,6 +474,17 @@ impl LogScanner {
     pub async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
         self.inner.subscribe_batch(bucket_offsets).await
     }
+
+    pub async fn subscribe_partition(
+        &self,
+        partition_id: PartitionId,
+        bucket: i32,
+        offset: i64,
+    ) -> Result<()> {
+        self.inner
+            .subscribe_partition(partition_id, bucket, offset)
+            .await
+    }
 }
 
 // Implementation for RecordBatchLogScanner (batches mode)
@@ -451,6 +501,17 @@ impl RecordBatchLogScanner {
     pub async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
         self.inner.subscribe_batch(bucket_offsets).await
     }
+
+    pub async fn subscribe_partition(
+        &self,
+        partition_id: PartitionId,
+        bucket: i32,
+        offset: i64,
+    ) -> Result<()> {
+        self.inner
+            .subscribe_partition(partition_id, bucket, offset)
+            .await
+    }
 }
 
 struct LogFetcher {
@@ -617,55 +678,55 @@ impl LogFetcher {
         )
     }
 
-    async fn check_and_update_metadata(&self) -> Result<()> {
-        let need_update = self
-            .fetchable_buckets()
-            .iter()
-            .any(|bucket| self.get_table_bucket_leader(bucket).is_none());
+    async fn check_and_update_metadata(&self, table_buckets: &[TableBucket]) -> Result<()> {
+        let mut partition_ids = Vec::new();
+        let mut need_update = false;
 
-        if !need_update {
-            return Ok(());
+        for tb in table_buckets {
+            if self.get_table_bucket_leader(tb).is_some() {
+                continue;
+            }
+
+            if self.is_partitioned {
+                partition_ids.push(tb.partition_id().unwrap());
+            } else {
+                need_update = true;
+                break;
+            }
         }
 
-        if self.is_partitioned {
-            // Fallback to full table metadata refresh until partition-aware updates are available.
+        let update_result = if self.is_partitioned && !partition_ids.is_empty() {
             self.metadata
-                .update_tables_metadata(&HashSet::from([&self.table_path]), &HashSet::new(), vec![])
+                .update_tables_metadata(
+                    &HashSet::from([&self.table_path]),
+                    &HashSet::new(),
+                    partition_ids,
+                )
                 .await
-                .or_else(|e| {
-                    if let Error::RpcError { source, .. } = &e
-                        && matches!(source, RpcError::ConnectionError(_) | RpcError::Poisoned(_))
-                    {
-                        warn!(
-                            "Retrying after encountering error while updating table metadata: {e}"
-                        );
-                        Ok(())
-                    } else {
-                        Err(e)
-                    }
-                })?;
-            return Ok(());
-        }
+        } else if need_update {
+            self.metadata.update_table_metadata(&self.table_path).await
+        } else {
+            Ok(())
+        };
 
-        // TODO: Handle PartitionNotExist error
-        self.metadata
-            .update_tables_metadata(&HashSet::from([&self.table_path]), &HashSet::new(), vec![])
-            .await
-            .or_else(|e| {
-                if let Error::RpcError { source, .. } = &e
-                    && matches!(source, RpcError::ConnectionError(_) | RpcError::Poisoned(_))
-                {
-                    warn!("Retrying after encountering error while updating table metadata: {e}");
-                    Ok(())
-                } else {
-                    Err(e)
-                }
-            })
+        // TODO: Handle PartitionNotExist error like java side
+        update_result.or_else(|e| {
+            if let Error::RpcError { source, .. } = &e
+                && matches!(source, RpcError::ConnectionError(_) | RpcError::Poisoned(_))
+            {
+                warn!("Retrying after encountering error while updating table metadata: {e}");
+                Ok(())
+            } else {
+                Err(e)
+            }
+        })?;
+        Ok(())
     }
 
     /// Send fetch requests asynchronously without waiting for responses
     async fn send_fetches(&self) -> Result<()> {
-        self.check_and_update_metadata().await?;
+        self.check_and_update_metadata(self.fetchable_buckets().as_slice())
+            .await?;
         let fetch_request = self.prepare_fetch_log_requests().await;
 
         for (leader, fetch_request) in fetch_request {
@@ -774,7 +835,11 @@ impl LogFetcher {
 
             for fetch_log_for_bucket in fetch_log_for_buckets {
                 let bucket: i32 = fetch_log_for_bucket.bucket_id;
-                let table_bucket = TableBucket::new(table_id, bucket);
+                let table_bucket = TableBucket::new_with_partition(
+                    table_id,
+                    fetch_log_for_bucket.partition_id,
+                    bucket,
+                );
 
                 // todo: check fetch result code for per-bucket
                 let Some(fetch_offset) = log_scanner_status.get_bucket_offset(&table_bucket) else {
@@ -1302,7 +1367,7 @@ impl LogFetcher {
                         )
                     } else {
                         let fetch_log_req_for_bucket = PbFetchLogReqForBucket {
-                            partition_id: None,
+                            partition_id: bucket.partition_id(),
                             bucket_id: bucket.bucket_id(),
                             fetch_offset: offset,
                             // 1M
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 908f446914..4e0a525620 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -1206,7 +1206,7 @@ pub struct TableBucket {
 
 impl TableBucket {
     pub fn new(table_id: TableId, bucket: BucketId) -> Self {
-        TableBucket {
+        Self {
             table_id,
             partition_id: None,
             bucket,
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 514df82802..cbfcbe58b8 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -974,7 +974,7 @@ mod table_test {
     }
 
     #[tokio::test]
-    async fn partitioned_table_append() {
+    async fn partitioned_table_append_scan() {
         let cluster = get_fluss_cluster();
         let connection = cluster.get_fluss_connection().await;
 
@@ -1098,11 +1098,71 @@ mod table_test {
             "Table partition 'fluss.test_partitioned_log_append(p=NOT Exists)' does not exist."
         ));
 
+        let log_scanner = table
+            .new_scan()
+            .create_log_scanner()
+            .expect("Failed to create log scanner");
+        let partition_info = admin
+            .list_partition_infos(&table_path)
+            .await
+            .expect("Failed to list partition infos");
+        for partition_info in partition_info {
+            log_scanner
+                .subscribe_partition(partition_info.get_partition_id(), 0, 0)
+                .await
+                .expect("Failed to subscribe to partition");
+        }
+
+        let expected_records = vec![
+            (1, "US", 100i64),
+            (2, "US", 200i64),
+            (3, "EU", 300i64),
+            (4, "EU", 400),
+            (5, "US", 500i64),
+            (6, "US", 600i64),
+            (7, "EU", 700i64),
+            (8, "EU", 800i64),
+        ];
+        let expected_records: Vec<(i32, String, i64)> = expected_records
+            .into_iter()
+            .map(|(id, region, val)| (id, region.to_string(), val))
+            .collect();
+
+        let mut collected_records: Vec<(i32, String, i64)> = Vec::new();
+        let start_time = std::time::Instant::now();
+        while collected_records.len() < expected_records.len()
+            && start_time.elapsed() < Duration::from_secs(10)
+        {
+            let records = log_scanner
+                .poll(Duration::from_millis(500))
+                .await
+                .expect("Failed to poll log scanner");
+            for rec in records {
+                let row = rec.row();
+                collected_records.push((
+                    row.get_int(0),
+                    row.get_string(1).to_string(),
+                    row.get_long(2),
+                ));
+            }
+        }
+
+        assert_eq!(
+            collected_records.len(),
+            expected_records.len(),
+            "Did not receive all records in time, expect receive {} records, but got {} records",
+            expected_records.len(),
+            collected_records.len()
+        );
+        collected_records.sort_by_key(|r| r.0);
+        assert_eq!(
+            collected_records, expected_records,
+            "Data mismatch between sent and received"
+        );
+
         admin
             .drop_table(&table_path, false)
             .await
             .expect("Failed to drop table");
-
-        // todo: add scan test in 203
     }
 }

From becde5511978e4fa9183f3f83eb8dd21cb26944f Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Wed, 4 Feb 2026 14:38:10 +0800
Subject: [PATCH 106/287] feat: support subscribe partition in cpp binding
 (#236)

---
 fluss-rust/bindings/cpp/include/fluss.hpp |  1 +
 fluss-rust/bindings/cpp/src/lib.rs        | 48 ++++++++++++++++++++---
 fluss-rust/bindings/cpp/src/table.cpp     |  9 +++++
 3 files changed, 53 insertions(+), 5 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 968cb06509..d35ece2cf5 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -544,6 +544,7 @@ class LogScanner {
 
     Result Subscribe(int32_t bucket_id, int64_t start_offset);
     Result Subscribe(const std::vector<BucketSubscription>& bucket_offsets);
+    Result SubscribePartition(int64_t partition_id, int32_t bucket_id, int64_t start_offset);
     Result Poll(int64_t timeout_ms, ScanRecords& out);
     Result PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out);
 
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 11e9105af1..7ae6416c3c 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -21,6 +21,7 @@ use std::sync::{Arc, LazyLock};
 use std::time::Duration;
 
 use fluss as fcore;
+use fluss::PartitionId;
 
 static RUNTIME: LazyLock<tokio::runtime::Runtime> = LazyLock::new(|| {
     tokio::runtime::Builder::new_multi_thread()
@@ -248,6 +249,12 @@ mod ffi {
             self: &LogScanner,
             subscriptions: Vec<FfiBucketSubscription>,
         ) -> FfiResult;
+        fn subscribe_partition(
+            self: &LogScanner,
+            partition_id: i64,
+            bucket_id: i32,
+            start_offset: i64,
+        ) -> FfiResult;
         fn poll(self: &LogScanner, timeout_ms: i64) -> FfiScanRecordsResult;
         fn poll_record_batch(self: &LogScanner, timeout_ms: i64) -> FfiArrowRecordBatchesResult;
         fn free_arrow_ffi_structures(array_ptr: usize, schema_ptr: usize);
@@ -743,17 +750,39 @@ pub extern "C" fn free_arrow_ffi_structures(array_ptr: usize, schema_ptr: usize)
 
 impl LogScanner {
     fn subscribe(&self, bucket_id: i32, start_offset: i64) -> ffi::FfiResult {
-        if let Some(ref inner) = self.inner {
-            let result = RUNTIME.block_on(async { inner.subscribe(bucket_id, start_offset).await });
+        self.do_subscribe(None, bucket_id, start_offset)
+    }
 
+    fn do_subscribe(
+        &self,
+        partition_id: Option<PartitionId>,
+        bucket_id: i32,
+        start_offset: i64,
+    ) -> ffi::FfiResult {
+        if let Some(ref inner) = self.inner {
+            let result = RUNTIME.block_on(async {
+                if let Some(partition_id) = partition_id {
+                    inner
+                        .subscribe_partition(partition_id, bucket_id, start_offset)
+                        .await
+                } else {
+                    inner.subscribe(bucket_id, start_offset).await
+                }
+            });
             match result {
                 Ok(_) => ok_result(),
                 Err(e) => err_result(1, e.to_string()),
             }
         } else if let Some(ref inner_batch) = self.inner_batch {
-            let result =
-                RUNTIME.block_on(async { inner_batch.subscribe(bucket_id, start_offset).await });
-
+            let result = RUNTIME.block_on(async {
+                if let Some(partition_id) = partition_id {
+                    inner_batch
+                        .subscribe_partition(partition_id, bucket_id, start_offset)
+                        .await
+                } else {
+                    inner_batch.subscribe(bucket_id, start_offset).await
+                }
+            });
             match result {
                 Ok(_) => ok_result(),
                 Err(e) => err_result(1, e.to_string()),
@@ -790,6 +819,15 @@ impl LogScanner {
         }
     }
 
+    fn subscribe_partition(
+        &self,
+        partition_id: PartitionId,
+        bucket_id: i32,
+        start_offset: i64,
+    ) -> ffi::FfiResult {
+        self.do_subscribe(Some(partition_id), bucket_id, start_offset)
+    }
+
     fn poll(&self, timeout_ms: i64) -> ffi::FfiScanRecordsResult {
         if let Some(ref inner) = self.inner {
             let timeout = Duration::from_millis(timeout_ms as u64);
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index 118ca3c276..b327dbacd8 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -265,6 +265,15 @@ Result LogScanner::Subscribe(const std::vector<BucketSubscription>& bucket_offse
     return utils::from_ffi_result(ffi_result);
 }
 
+Result LogScanner::SubscribePartition(int64_t partition_id, int32_t bucket_id, int64_t start_offset) {
+    if (!Available()) {
+        return utils::make_error(1, "LogScanner not available");
+    }
+
+    auto ffi_result = scanner_->subscribe_partition(partition_id, bucket_id, start_offset);
+    return utils::from_ffi_result(ffi_result);
+}
+
 Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
     if (!Available()) {
         return utils::make_error(1, "LogScanner not available");

From 2ad9dfe3d547dae3ab13eae627125e95210ab2a5 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Wed, 4 Feb 2026 12:45:08 +0000
Subject: [PATCH 107/287] chore: Reject table scan for INDEXED format or KV
 table (#238)

---
 fluss-rust/bindings/cpp/src/lib.rs            | 55 +++++------
 .../crates/fluss/src/client/table/scanner.rs  | 97 ++++++++++++++++++-
 fluss-rust/crates/fluss/src/metadata/table.rs | 11 +++
 3 files changed, 132 insertions(+), 31 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 7ae6416c3c..ab02c8d072 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -591,10 +591,10 @@ impl Table {
                 self.table_info.clone(),
             );
 
-            let scanner = match fluss_table.new_scan().create_log_scanner() {
-                Ok(a) => a,
-                Err(e) => return Err(format!("Failed to create log scanner: {e}")),
-            };
+            let scanner = fluss_table
+                .new_scan()
+                .create_log_scanner()
+                .map_err(|e| format!("Failed to create log scanner: {e}"))?;
 
             let scanner_ptr = Box::into_raw(Box::new(LogScanner {
                 inner: Some(scanner),
@@ -616,17 +616,15 @@ impl Table {
                 self.table_info.clone(),
             );
 
-            let scan = fluss_table.new_scan();
-            let scan = match scan.project(&column_indices) {
-                Ok(s) => s,
-                Err(e) => return Err(format!("Failed to project columns: {e}")),
-            };
-            let scanner = match scan.create_log_scanner() {
-                Ok(a) => a,
-                Err(e) => return Err(format!("Failed to create log scanner: {e}")),
-            };
+            let log_scanner = fluss_table
+                .new_scan()
+                .project(&column_indices)
+                .map_err(|e| format!("Failed to project columns: {e}"))?
+                .create_log_scanner()
+                .map_err(|e| format!("Failed to create log scanner: {e}"))?;
+
             let scanner = Box::into_raw(Box::new(LogScanner {
-                inner: Some(scanner),
+                inner: Some(log_scanner),
                 inner_batch: None,
             }));
             Ok(scanner)
@@ -641,13 +639,14 @@ impl Table {
                 self.table_info.clone(),
             );
 
-            let scanner = match fluss_table.new_scan().create_record_batch_log_scanner() {
-                Ok(a) => a,
-                Err(e) => return Err(format!("Failed to create record batch log scanner: {e}")),
-            };
+            let batch_scanner = fluss_table
+                .new_scan()
+                .create_record_batch_log_scanner()
+                .map_err(|e| format!("Failed to create record batch log scanner: {e}"))?;
+
             let scanner = Box::into_raw(Box::new(LogScanner {
                 inner: None,
-                inner_batch: Some(scanner),
+                inner_batch: Some(batch_scanner),
             }));
             Ok(scanner)
         })
@@ -664,18 +663,16 @@ impl Table {
                 self.table_info.clone(),
             );
 
-            let scan = fluss_table.new_scan();
-            let scan = match scan.project(&column_indices) {
-                Ok(s) => s,
-                Err(e) => return Err(format!("Failed to project columns: {e}")),
-            };
-            let scanner = match scan.create_record_batch_log_scanner() {
-                Ok(a) => a,
-                Err(e) => return Err(format!("Failed to create record batch log scanner: {e}")),
-            };
+            let batch_scanner = fluss_table
+                .new_scan()
+                .project(&column_indices)
+                .map_err(|e| format!("Failed to project columns: {e}"))?
+                .create_record_batch_log_scanner()
+                .map_err(|e| format!("Failed to create record batch log scanner: {e}"))?;
+
             let scanner = Box::into_raw(Box::new(LogScanner {
                 inner: None,
-                inner_batch: Some(scanner),
+                inner_batch: Some(batch_scanner),
             }));
             Ok(scanner)
         })
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index a88964ea97..422f9d32ab 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -34,8 +34,9 @@ use crate::client::table::log_fetch_buffer::{
     LogFetchBuffer, RemotePendingFetch,
 };
 use crate::client::table::remote_log::{RemoteLogDownloader, RemoteLogFetchInfo};
+use crate::error::Error::UnsupportedOperation;
 use crate::error::{ApiError, Error, FlussError, Result};
-use crate::metadata::{PhysicalTablePath, TableBucket, TableInfo, TablePath};
+use crate::metadata::{LogFormat, PhysicalTablePath, TableBucket, TableInfo, TablePath};
 use crate::proto::{ErrorResponse, FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
 use crate::record::{
     LogRecordsBatches, ReadContext, ScanBatch, ScanRecord, ScanRecords, to_arrow_schema,
@@ -221,6 +222,7 @@ impl<'a> TableScan<'a> {
     }
 
     pub fn create_log_scanner(self) -> Result<LogScanner> {
+        validate_scan_support(&self.table_info.table_path, &self.table_info)?;
         let inner = LogScannerInner::new(
             &self.table_info,
             self.metadata.clone(),
@@ -234,6 +236,7 @@ impl<'a> TableScan<'a> {
     }
 
     pub fn create_record_batch_log_scanner(self) -> Result<RecordBatchLogScanner> {
+        validate_scan_support(&self.table_info.table_path, &self.table_info)?;
         let inner = LogScannerInner::new(
             &self.table_info,
             self.metadata.clone(),
@@ -1556,6 +1559,25 @@ impl BucketScanStatus {
     }
 }
 
+fn validate_scan_support(table_path: &TablePath, table_info: &TableInfo) -> Result<()> {
+    if table_info.schema.primary_key().is_some() {
+        return Err(UnsupportedOperation {
+            message: format!("Table {table_path} is not a Log Table and doesn't support scan."),
+        });
+    }
+
+    let log_format = table_info.table_config.get_log_format()?;
+    if LogFormat::ARROW != log_format {
+        return Err(UnsupportedOperation {
+            message: format!(
+                "Scan is only supported for ARROW format and table {table_path} uses {log_format} format"
+            ),
+        });
+    }
+
+    Ok(())
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
@@ -1564,7 +1586,7 @@ mod tests {
     use crate::compression::{
         ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
     };
-    use crate::metadata::{PhysicalTablePath, TableInfo, TablePath};
+    use crate::metadata::{DataTypes, PhysicalTablePath, Schema, TableInfo, TablePath};
     use crate::record::MemoryLogRecordsArrowBuilder;
     use crate::row::{Datum, GenericRow};
     use crate::rpc::FlussError;
@@ -1781,4 +1803,75 @@ mod tests {
         assert!(metadata.get_cluster().leader_for(&bucket).is_none());
         Ok(())
     }
+
+    fn create_test_table_info(
+        has_primary_key: bool,
+        log_format: Option<&str>,
+    ) -> (TableInfo, TablePath) {
+        let mut schema_builder = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string());
+
+        if has_primary_key {
+            schema_builder = schema_builder.primary_key(vec!["id"]);
+        }
+
+        let schema = schema_builder.build().unwrap();
+        let table_path = TablePath::new("test_db", "test_table");
+
+        let mut properties = HashMap::new();
+        if let Some(format) = log_format {
+            properties.insert("table.log.format".to_string(), format.to_string());
+        }
+
+        let table_info = TableInfo::new(
+            table_path.clone(),
+            1,
+            1,
+            schema,
+            vec![],
+            Arc::from(vec![]),
+            1,
+            properties,
+            HashMap::new(),
+            None,
+            0,
+            0,
+        );
+
+        (table_info, table_path)
+    }
+
+    #[test]
+    fn test_validate_scan_support() {
+        // Primary key table
+        let (table_info, table_path) = create_test_table_info(true, Some("ARROW"));
+        let result = validate_scan_support(&table_path, &table_info);
+
+        assert!(result.is_err());
+        let err = result.unwrap_err();
+        assert!(matches!(err, UnsupportedOperation { .. }));
+        assert!(err.to_string().contains(
+            format!("Table {table_path} is not a Log Table and doesn't support scan.").as_str()
+        ));
+
+        // Indexed format
+        let (table_info, table_path) = create_test_table_info(false, Some("INDEXED"));
+        let result = validate_scan_support(&table_path, &table_info);
+
+        assert!(result.is_err());
+        let err = result.unwrap_err();
+        assert!(matches!(err, UnsupportedOperation { .. }));
+        assert!(err.to_string().contains(format!("Scan is only supported for ARROW format and table {table_path} uses INDEXED format").as_str()));
+
+        // Default format
+        let (table_info, table_path) = create_test_table_info(false, None);
+        let result = validate_scan_support(&table_path, &table_info);
+        assert!(result.is_ok());
+
+        // Arrow format
+        let (table_info, table_path) = create_test_table_info(false, Some("ARROW"));
+        let result = validate_scan_support(&table_path, &table_info);
+        assert!(result.is_ok());
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 4e0a525620..66de2a9488 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -969,6 +969,17 @@ impl TableConfig {
         kv_format.parse().map_err(Into::into)
     }
 
+    pub fn get_log_format(&self) -> Result<LogFormat> {
+        // TODO: Consolidate configurations logic, constants, defaults in a single place
+        const DEFAULT_LOG_FORMAT: &str = "ARROW";
+        let log_format = self
+            .properties
+            .get("table.log.format")
+            .map(String::as_str)
+            .unwrap_or(DEFAULT_LOG_FORMAT);
+        LogFormat::parse(log_format)
+    }
+
     pub fn get_auto_partition_strategy(&self) -> AutoPartitionStrategy {
         AutoPartitionStrategy::from(&self.properties)
     }

From f7fb74164525298b7de23f34e4cb9458623e0ed3 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Wed, 4 Feb 2026 15:15:26 +0000
Subject: [PATCH 108/287] feat: introduce kv tables support in python (#239)

---
 fluss-rust/bindings/python/example/example.py | 305 +++++++++++--
 fluss-rust/bindings/python/fluss/__init__.pyi |  81 +++-
 fluss-rust/bindings/python/src/lib.rs         |   6 +
 fluss-rust/bindings/python/src/lookup.rs      | 111 +++++
 fluss-rust/bindings/python/src/table.rs       | 417 +++++++++++++++++-
 fluss-rust/bindings/python/src/upsert.rs      | 188 ++++++++
 .../crates/fluss/src/client/table/lookup.rs   |  50 ++-
 .../crates/fluss/src/client/table/mod.rs      |   4 +-
 .../crates/fluss/src/client/table/scanner.rs  |   3 +-
 fluss-rust/crates/fluss/src/row/encode/mod.rs |   4 +-
 10 files changed, 1101 insertions(+), 68 deletions(-)
 create mode 100644 fluss-rust/bindings/python/src/lookup.rs
 create mode 100644 fluss-rust/bindings/python/src/upsert.rs

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 5d0302efea..c359425e13 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -16,8 +16,9 @@
 # under the License.
 
 import asyncio
-import time
-from datetime import date, time as dt_time, datetime
+import traceback
+from datetime import date, datetime
+from datetime import time as dt_time
 from decimal import Decimal
 
 import pandas as pd
@@ -103,11 +104,34 @@ async def main():
                 pa.array(["Alice", "Bob", "Charlie"], type=pa.string()),
                 pa.array([95.2, 87.2, 92.1], type=pa.float32()),
                 pa.array([25, 30, 35], type=pa.int32()),
-                pa.array([date(1999, 5, 15), date(1994, 3, 20), date(1989, 11, 8)], type=pa.date32()),
-                pa.array([dt_time(9, 0, 0), dt_time(9, 30, 0), dt_time(10, 0, 0)], type=pa.time32("ms")),
-                pa.array([datetime(2024, 1, 15, 10, 30), datetime(2024, 1, 15, 11, 0), datetime(2024, 1, 15, 11, 30)], type=pa.timestamp("us")),
-                pa.array([datetime(2024, 1, 15, 10, 30), datetime(2024, 1, 15, 11, 0), datetime(2024, 1, 15, 11, 30)], type=pa.timestamp("us", tz="UTC")),
-                pa.array([Decimal("75000.00"), Decimal("82000.50"), Decimal("95000.75")], type=pa.decimal128(10, 2)),
+                pa.array(
+                    [date(1999, 5, 15), date(1994, 3, 20), date(1989, 11, 8)],
+                    type=pa.date32(),
+                ),
+                pa.array(
+                    [dt_time(9, 0, 0), dt_time(9, 30, 0), dt_time(10, 0, 0)],
+                    type=pa.time32("ms"),
+                ),
+                pa.array(
+                    [
+                        datetime(2024, 1, 15, 10, 30),
+                        datetime(2024, 1, 15, 11, 0),
+                        datetime(2024, 1, 15, 11, 30),
+                    ],
+                    type=pa.timestamp("us"),
+                ),
+                pa.array(
+                    [
+                        datetime(2024, 1, 15, 10, 30),
+                        datetime(2024, 1, 15, 11, 0),
+                        datetime(2024, 1, 15, 11, 30),
+                    ],
+                    type=pa.timestamp("us", tz="UTC"),
+                ),
+                pa.array(
+                    [Decimal("75000.00"), Decimal("82000.50"), Decimal("95000.75")],
+                    type=pa.decimal128(10, 2),
+                ),
             ],
             schema=schema,
         )
@@ -125,9 +149,18 @@ async def main():
                 pa.array([28, 32], type=pa.int32()),
                 pa.array([date(1996, 7, 22), date(1992, 12, 1)], type=pa.date32()),
                 pa.array([dt_time(14, 15, 0), dt_time(8, 45, 0)], type=pa.time32("ms")),
-                pa.array([datetime(2024, 1, 16, 9, 0), datetime(2024, 1, 16, 9, 30)], type=pa.timestamp("us")),
-                pa.array([datetime(2024, 1, 16, 9, 0), datetime(2024, 1, 16, 9, 30)], type=pa.timestamp("us", tz="UTC")),
-                pa.array([Decimal("68000.00"), Decimal("72500.25")], type=pa.decimal128(10, 2)),
+                pa.array(
+                    [datetime(2024, 1, 16, 9, 0), datetime(2024, 1, 16, 9, 30)],
+                    type=pa.timestamp("us"),
+                ),
+                pa.array(
+                    [datetime(2024, 1, 16, 9, 0), datetime(2024, 1, 16, 9, 30)],
+                    type=pa.timestamp("us", tz="UTC"),
+                ),
+                pa.array(
+                    [Decimal("68000.00"), Decimal("72500.25")],
+                    type=pa.decimal128(10, 2),
+                ),
             ],
             schema=schema,
         )
@@ -138,28 +171,35 @@ async def main():
         # Test 3: Append single rows with Date, Time, Timestamp, Decimal
         print("\n--- Testing single row append with temporal/decimal types ---")
         # Dict input with all types including Date, Time, Timestamp, Decimal
-        await append_writer.append({
-            "id": 8,
-            "name": "Helen",
-            "score": 93.5,
-            "age": 26,
-            "birth_date": date(1998, 4, 10),
-            "check_in_time": dt_time(11, 30, 45),
-            "created_at": datetime(2024, 1, 17, 14, 0, 0),
-            "updated_at": datetime(2024, 1, 17, 14, 0, 0),
-            "salary": Decimal("88000.00"),
-        })
+        await append_writer.append(
+            {
+                "id": 8,
+                "name": "Helen",
+                "score": 93.5,
+                "age": 26,
+                "birth_date": date(1998, 4, 10),
+                "check_in_time": dt_time(11, 30, 45),
+                "created_at": datetime(2024, 1, 17, 14, 0, 0),
+                "updated_at": datetime(2024, 1, 17, 14, 0, 0),
+                "salary": Decimal("88000.00"),
+            }
+        )
         print("Successfully appended row (dict with Date, Time, Timestamp, Decimal)")
 
         # List input with all types
-        await append_writer.append([
-            9, "Ivan", 90.0, 31,
-            date(1993, 8, 25),
-            dt_time(16, 45, 0),
-            datetime(2024, 1, 17, 15, 30, 0),
-            datetime(2024, 1, 17, 15, 30, 0),
-            Decimal("91500.50"),
-        ])
+        await append_writer.append(
+            [
+                9,
+                "Ivan",
+                90.0,
+                31,
+                date(1993, 8, 25),
+                dt_time(16, 45, 0),
+                datetime(2024, 1, 17, 15, 30, 0),
+                datetime(2024, 1, 17, 15, 30, 0),
+                Decimal("91500.50"),
+            ]
+        )
         print("Successfully appended row (list with Date, Time, Timestamp, Decimal)")
 
         # Test 4: Write Pandas DataFrame
@@ -172,8 +212,14 @@ async def main():
                 "age": [29, 27],
                 "birth_date": [date(1995, 2, 14), date(1997, 9, 30)],
                 "check_in_time": [dt_time(10, 0, 0), dt_time(10, 30, 0)],
-                "created_at": [datetime(2024, 1, 18, 8, 0), datetime(2024, 1, 18, 8, 30)],
-                "updated_at": [datetime(2024, 1, 18, 8, 0), datetime(2024, 1, 18, 8, 30)],
+                "created_at": [
+                    datetime(2024, 1, 18, 8, 0),
+                    datetime(2024, 1, 18, 8, 30),
+                ],
+                "updated_at": [
+                    datetime(2024, 1, 18, 8, 0),
+                    datetime(2024, 1, 18, 8, 30),
+                ],
                 "salary": [Decimal("79000.00"), Decimal("85500.75")],
             }
         )
@@ -249,6 +295,199 @@ async def main():
     except Exception as e:
         print(f"Error during scanning: {e}")
 
+    # =====================================================
+    # Demo: Primary Key Table with Lookup and Upsert
+    # =====================================================
+    print("\n" + "=" * 60)
+    print("--- Testing Primary Key Table (Lookup & Upsert) ---")
+    print("=" * 60)
+
+    # Create a primary key table for lookup/upsert tests
+    # Include temporal and decimal types to test full conversion
+    pk_table_fields = [
+        pa.field("user_id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("email", pa.string()),
+        pa.field("age", pa.int32()),
+        pa.field("birth_date", pa.date32()),
+        pa.field("login_time", pa.time32("ms")),
+        pa.field("created_at", pa.timestamp("us")),  # TIMESTAMP (NTZ)
+        pa.field("updated_at", pa.timestamp("us", tz="UTC")),  # TIMESTAMP_LTZ
+        pa.field("balance", pa.decimal128(10, 2)),
+    ]
+    pk_schema = pa.schema(pk_table_fields)
+    fluss_pk_schema = fluss.Schema(pk_schema, primary_keys=["user_id"])
+
+    # Create table descriptor
+    pk_table_descriptor = fluss.TableDescriptor(
+        fluss_pk_schema,
+        bucket_count=3,
+    )
+
+    pk_table_path = fluss.TablePath("fluss", "users_pk_table_v3")
+
+    try:
+        await admin.create_table(pk_table_path, pk_table_descriptor, True)
+        print(f"Created PK table: {pk_table_path}")
+    except Exception as e:
+        print(f"PK Table creation failed (may already exist): {e}")
+
+    # Get the PK table
+    pk_table = await conn.get_table(pk_table_path)
+    print(f"Got PK table: {pk_table}")
+    print(f"Has primary key: {pk_table.has_primary_key()}")
+
+    # --- Test Upsert ---
+    print("\n--- Testing Upsert ---")
+    try:
+        upsert_writer = pk_table.new_upsert()
+        print(f"Created upsert writer: {upsert_writer}")
+
+        await upsert_writer.upsert(
+            {
+                "user_id": 1,
+                "name": "Alice",
+                "email": "alice@example.com",
+                "age": 25,
+                "birth_date": date(1999, 5, 15),
+                "login_time": dt_time(9, 30, 45, 123000),  # 09:30:45.123
+                "created_at": datetime(
+                    2024, 1, 15, 10, 30, 45, 123456
+                ),  # with microseconds
+                "updated_at": datetime(2024, 1, 15, 10, 30, 45, 123456),
+                "balance": Decimal("1234.56"),
+            }
+        )
+        print("Upserted user_id=1 (Alice)")
+
+        await upsert_writer.upsert(
+            {
+                "user_id": 2,
+                "name": "Bob",
+                "email": "bob@example.com",
+                "age": 30,
+                "birth_date": date(1994, 3, 20),
+                "login_time": dt_time(14, 15, 30, 500000),  # 14:15:30.500
+                "created_at": datetime(2024, 1, 16, 11, 22, 33, 444555),
+                "updated_at": datetime(2024, 1, 16, 11, 22, 33, 444555),
+                "balance": Decimal("5678.91"),
+            }
+        )
+        print("Upserted user_id=2 (Bob)")
+
+        await upsert_writer.upsert(
+            {
+                "user_id": 3,
+                "name": "Charlie",
+                "email": "charlie@example.com",
+                "age": 35,
+                "birth_date": date(1989, 11, 8),
+                "login_time": dt_time(16, 45, 59, 999000),  # 16:45:59.999
+                "created_at": datetime(2024, 1, 17, 23, 59, 59, 999999),
+                "updated_at": datetime(2024, 1, 17, 23, 59, 59, 999999),
+                "balance": Decimal("9876.54"),
+            }
+        )
+        print("Upserted user_id=3 (Charlie)")
+
+        # Update an existing row (same PK, different values)
+        await upsert_writer.upsert(
+            {
+                "user_id": 1,
+                "name": "Alice Updated",
+                "email": "alice.new@example.com",
+                "age": 26,
+                "birth_date": date(1999, 5, 15),
+                "login_time": dt_time(10, 11, 12, 345000),  # 10:11:12.345
+                "created_at": datetime(2024, 1, 15, 10, 30, 45, 123456),  # unchanged
+                "updated_at": datetime(
+                    2024, 1, 20, 15, 45, 30, 678901
+                ),  # new update time
+                "balance": Decimal("2345.67"),
+            }
+        )
+        print("Updated user_id=1 (Alice -> Alice Updated)")
+
+        # Explicit flush to ensure all upserts are acknowledged
+        await upsert_writer.flush()
+        print("Flushed all upserts")
+
+    except Exception as e:
+        print(f"Error during upsert: {e}")
+        traceback.print_exc()
+
+    # --- Test Lookup ---
+    print("\n--- Testing Lookup ---")
+    try:
+        lookuper = pk_table.new_lookup()
+        print(f"Created lookuper: {lookuper}")
+
+        result = await lookuper.lookup({"user_id": 1})
+        if result:
+            print("Lookup user_id=1: Found!")
+            print(f"  name: {result['name']}")
+            print(f"  email: {result['email']}")
+            print(f"  age: {result['age']}")
+            print(
+                f"  birth_date: {result['birth_date']} (type: {type(result['birth_date']).__name__})"
+            )
+            print(
+                f"  login_time: {result['login_time']} (type: {type(result['login_time']).__name__})"
+            )
+            print(
+                f"  created_at: {result['created_at']} (type: {type(result['created_at']).__name__})"
+            )
+            print(
+                f"  updated_at: {result['updated_at']} (type: {type(result['updated_at']).__name__})"
+            )
+            print(
+                f"  balance: {result['balance']} (type: {type(result['balance']).__name__})"
+            )
+        else:
+            print("Lookup user_id=1: Not found")
+
+        # Lookup another row
+        result = await lookuper.lookup({"user_id": 2})
+        if result:
+            print(f"Lookup user_id=2: Found! -> {result}")
+        else:
+            print("Lookup user_id=2: Not found")
+
+        # Lookup non-existent row
+        result = await lookuper.lookup({"user_id": 999})
+        if result:
+            print(f"Lookup user_id=999: Found! -> {result}")
+        else:
+            print("Lookup user_id=999: Not found (as expected)")
+
+    except Exception as e:
+        print(f"Error during lookup: {e}")
+        traceback.print_exc()
+
+    # --- Test Delete ---
+    print("\n--- Testing Delete ---")
+    try:
+        upsert_writer = pk_table.new_upsert()
+
+        # Delete only needs PK columns - much simpler API!
+        await upsert_writer.delete({"user_id": 3})
+        print("Deleted user_id=3")
+
+        # Explicit flush to ensure delete is acknowledged
+        await upsert_writer.flush()
+        print("Flushed delete")
+
+        lookuper = pk_table.new_lookup()
+        result = await lookuper.lookup({"user_id": 3})
+        if result:
+            print(f"Lookup user_id=3 after delete: Still found! -> {result}")
+        else:
+            print("Lookup user_id=3 after delete: Not found (deletion confirmed)")
+
+    except Exception as e:
+        print(f"Error during delete: {e}")
+        traceback.print_exc()
+
     # Demo: Column projection
     print("\n--- Testing Column Projection ---")
     try:
@@ -258,7 +497,9 @@ async def main():
         scanner_index.subscribe(None, None)
         df_projected = scanner_index.to_pandas()
         print(df_projected.head())
-        print(f"   Projected {df_projected.shape[1]} columns: {list(df_projected.columns)}")
+        print(
+            f"   Projected {df_projected.shape[1]} columns: {list(df_projected.columns)}"
+        )
 
         # Project specific columns by name (Pythonic!)
         print("\n2. Projection by name ['name', 'score'] (Pythonic):")
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 6073070c0d..c911ebedfc 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -45,7 +45,12 @@ class FlussConnection:
     async def get_table(self, table_path: TablePath) -> FlussTable: ...
     def close(self) -> None: ...
     def __enter__(self) -> FlussConnection: ...
-    def __exit__(self, exc_type: Optional[type], exc_value: Optional[BaseException], traceback: Optional[TracebackType]) -> bool: ...
+    def __exit__(
+        self,
+        exc_type: Optional[type],
+        exc_value: Optional[BaseException],
+        traceback: Optional[TracebackType],
+    ) -> bool: ...
     def __repr__(self) -> str: ...
 
 class FlussAdmin:
@@ -61,7 +66,17 @@ class FlussAdmin:
 
 class FlussTable:
     async def new_append_writer(self) -> AppendWriter: ...
-    async def new_log_scanner(self) -> LogScanner: ...
+    async def new_log_scanner(
+        self,
+        project: Optional[List[int]] = None,
+        columns: Optional[List[str]] = None,
+    ) -> LogScanner: ...
+    def new_upsert(
+        self,
+        columns: Optional[List[str]] = None,
+        column_indices: Optional[List[int]] = None,
+    ) -> UpsertWriter: ...
+    def new_lookup(self) -> Lookuper: ...
     def get_table_info(self) -> TableInfo: ...
     def get_table_path(self) -> TablePath: ...
     def has_primary_key(self) -> bool: ...
@@ -100,6 +115,49 @@ class AppendWriter:
     def flush(self) -> None: ...
     def __repr__(self) -> str: ...
 
+class UpsertWriter:
+    """Writer for upserting and deleting data in a Fluss primary key table."""
+
+    async def upsert(self, row: dict | list | tuple) -> None:
+        """Upsert a row into the table.
+
+        If a row with the same primary key exists, it will be updated.
+        Otherwise, a new row will be inserted.
+
+        Args:
+            row: Dictionary mapping field names to values, or
+                 list/tuple of values in schema order
+        """
+        ...
+    async def delete(self, pk: dict | list | tuple) -> None:
+        """Delete a row from the table by primary key.
+
+        Args:
+            pk: Dictionary with PK column names as keys, or
+                list/tuple of PK values in PK column order
+        """
+        ...
+    async def flush(self) -> None:
+        """Flush all pending upsert/delete operations to the server."""
+        ...
+    def __repr__(self) -> str: ...
+
+class Lookuper:
+    """Lookuper for performing primary key lookups on a Fluss table."""
+
+    async def lookup(self, pk: dict | list | tuple) -> Optional[Dict[str, object]]:
+        """Lookup a row by its primary key.
+
+        Args:
+            pk: Dictionary with PK column names as keys, or
+                list/tuple of PK values in PK column order
+
+        Returns:
+            A dict containing the row data if found, None otherwise.
+        """
+        ...
+    def __repr__(self) -> str: ...
+
 class LogScanner:
     def subscribe(
         self, start_timestamp: Optional[int], end_timestamp: Optional[int]
@@ -109,14 +167,27 @@ class LogScanner:
     def __repr__(self) -> str: ...
 
 class Schema:
-    def __init__(self, schema: pa.Schema, primary_keys: Optional[List[str]] = None) -> None: ...
+    def __init__(
+        self, schema: pa.Schema, primary_keys: Optional[List[str]] = None
+    ) -> None: ...
     def get_column_names(self) -> List[str]: ...
     def get_column_types(self) -> List[str]: ...
-    def get_columns(self) -> List[Tuple[str,str]]: ...
+    def get_columns(self) -> List[Tuple[str, str]]: ...
     def __str__(self) -> str: ...
 
 class TableDescriptor:
-    def __init__(self, schema: Schema, **kwargs: str) -> None: ...
+    def __init__(
+        self,
+        schema: Schema,
+        *,
+        partition_keys: Optional[List[str]] = None,
+        bucket_count: Optional[int] = None,
+        bucket_keys: Optional[List[str]] = None,
+        comment: Optional[str] = None,
+        log_format: Optional[str] = None,
+        kv_format: Optional[str] = None,
+        **properties: str,
+    ) -> None: ...
     def get_schema(self) -> Schema: ...
 
 class TablePath:
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 49d51794ca..3da0b251f6 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -25,16 +25,20 @@ mod admin;
 mod config;
 mod connection;
 mod error;
+mod lookup;
 mod metadata;
 mod table;
+mod upsert;
 mod utils;
 
 pub use admin::*;
 pub use config::*;
 pub use connection::*;
 pub use error::*;
+pub use lookup::*;
 pub use metadata::*;
 pub use table::*;
+pub use upsert::*;
 pub use utils::*;
 
 static TOKIO_RUNTIME: LazyLock<Runtime> = LazyLock::new(|| {
@@ -55,6 +59,8 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<FlussAdmin>()?;
     m.add_class::<FlussTable>()?;
     m.add_class::<AppendWriter>()?;
+    m.add_class::<UpsertWriter>()?;
+    m.add_class::<Lookuper>()?;
     m.add_class::<Schema>()?;
     m.add_class::<LogScanner>()?;
     m.add_class::<LakeSnapshot>()?;
diff --git a/fluss-rust/bindings/python/src/lookup.rs b/fluss-rust/bindings/python/src/lookup.rs
new file mode 100644
index 0000000000..8d91a6198b
--- /dev/null
+++ b/fluss-rust/bindings/python/src/lookup.rs
@@ -0,0 +1,111 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::table::{internal_row_to_dict, python_pk_to_generic_row};
+use crate::*;
+use pyo3_async_runtimes::tokio::future_into_py;
+use std::sync::Arc;
+use tokio::sync::Mutex;
+
+/// Lookuper for performing primary key lookups on a Fluss table.
+///
+/// The Lookuper caches key encoders and bucketing functions, making
+/// repeated lookups efficient. Create once and reuse for multiple lookups.
+///
+/// # Example:
+///     lookuper = table.new_lookup()
+///     result = await lookuper.lookup({"user_id": 1})
+///     result2 = await lookuper.lookup({"user_id": 2})  # Reuses cached encoders
+#[pyclass]
+pub struct Lookuper {
+    inner: Arc<Mutex<fcore::client::Lookuper>>,
+    table_info: Arc<fcore::metadata::TableInfo>,
+}
+
+#[pymethods]
+impl Lookuper {
+    /// Lookup a row by its primary key.
+    ///
+    /// Args:
+    ///     pk: A dict, list, or tuple containing only the primary key values.
+    ///         For dict: keys are PK column names.
+    ///         For list/tuple: values in PK column order.
+    ///
+    /// Returns:
+    ///     A dict containing the row data if found, None otherwise.
+    pub fn lookup<'py>(
+        &self,
+        py: Python<'py>,
+        pk: &Bound<'_, PyAny>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let generic_row = python_pk_to_generic_row(pk, &self.table_info)?;
+        let inner = self.inner.clone();
+        let table_info = self.table_info.clone();
+
+        future_into_py(py, async move {
+            // Perform async lookup
+            let result = {
+                let mut lookuper = inner.lock().await;
+                lookuper
+                    .lookup(&generic_row)
+                    .await
+                    .map_err(|e| FlussError::new_err(e.to_string()))?
+            };
+
+            // Extract row data
+            let row_opt = result
+                .get_single_row()
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+            // Convert to Python with GIL
+            Python::attach(|py| match row_opt {
+                Some(compacted_row) => internal_row_to_dict(py, &compacted_row, &table_info),
+                None => Ok(py.None()),
+            })
+        })
+    }
+
+    fn __repr__(&self) -> String {
+        "Lookuper()".to_string()
+    }
+}
+
+impl Lookuper {
+    /// Create a Lookuper from connection components.
+    ///
+    /// This creates the core Lookuper which caches encoders and bucketing functions.
+    pub fn new(
+        connection: &Arc<fcore::client::FlussConnection>,
+        metadata: Arc<fcore::client::Metadata>,
+        table_info: fcore::metadata::TableInfo,
+    ) -> PyResult<Self> {
+        let fluss_table = fcore::client::FlussTable::new(connection, metadata, table_info.clone());
+
+        let table_lookup = fluss_table
+            .new_lookup()
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+        let lookuper = table_lookup
+            .create_lookuper()
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+        Ok(Self {
+            inner: Arc::new(Mutex::new(lookuper)),
+            table_info: Arc::new(table_info),
+        })
+    }
+}
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 48f09e7ac1..4554ca17e5 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -36,6 +36,7 @@ const MICROS_PER_MILLI: i64 = 1_000;
 const MICROS_PER_SECOND: i64 = 1_000_000;
 const MICROS_PER_DAY: i64 = 86_400_000_000;
 const NANOS_PER_MILLI: i64 = 1_000_000;
+const NANOS_PER_MICRO: i64 = 1_000;
 
 /// Represents a Fluss table for data operations
 #[pyclass]
@@ -128,6 +129,70 @@ impl FlussTable {
         self.has_primary_key
     }
 
+    /// Create a new lookuper for primary key lookups.
+    ///
+    /// This is only available for tables with a primary key.
+    pub fn new_lookup(&self, _py: Python) -> PyResult<crate::Lookuper> {
+        if !self.has_primary_key {
+            return Err(FlussError::new_err(
+                "Lookup is only supported for primary key tables",
+            ));
+        }
+
+        crate::Lookuper::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        )
+    }
+
+    /// Create a new upsert writer for the table.
+    ///
+    /// This is only available for tables with a primary key.
+    ///
+    /// Args:
+    ///     columns: Optional list of column names for partial update.
+    ///              Only the specified columns will be updated.
+    ///     column_indices: Optional list of column indices (0-based) for partial update.
+    ///                     Alternative to `columns` parameter.
+    #[pyo3(signature = (columns=None, column_indices=None))]
+    pub fn new_upsert(
+        &self,
+        _py: Python,
+        columns: Option<Vec<String>>,
+        column_indices: Option<Vec<usize>>,
+    ) -> PyResult<crate::UpsertWriter> {
+        if !self.has_primary_key {
+            return Err(FlussError::new_err(
+                "Upsert is only supported for primary key tables",
+            ));
+        }
+
+        // Validate that at most one parameter is specified
+        if columns.is_some() && column_indices.is_some() {
+            return Err(FlussError::new_err(
+                "Specify only one of 'columns' or 'column_indices', not both",
+            ));
+        }
+
+        let fluss_table = fcore::client::FlussTable::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        );
+
+        let table_upsert = fluss_table
+            .new_upsert()
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+        crate::UpsertWriter::new(
+            table_upsert,
+            self.table_info.clone(),
+            columns,
+            column_indices,
+        )
+    }
+
     fn __repr__(&self) -> String {
         format!(
             "FlussTable(path={}.{})",
@@ -358,7 +423,7 @@ where
 }
 
 /// Convert Python row (dict/list/tuple) to GenericRow based on schema
-fn python_to_generic_row(
+pub fn python_to_generic_row(
     row: &Bound<PyAny>,
     table_info: &fcore::metadata::TableInfo,
 ) -> PyResult<fcore::row::GenericRow<'static>> {
@@ -423,6 +488,115 @@ fn python_to_generic_row(
     Ok(fcore::row::GenericRow { values: datums })
 }
 
+/// Convert Python primary key values (dict/list/tuple) to a full-width GenericRow.
+/// Only PK columns are required; every non-PK position is left as `Datum::Null`.
+/// For dict: keys must be PK column names (unknown or missing keys are errors).
+/// For list/tuple: exactly one value per PK column, in PK column order.
+pub fn python_pk_to_generic_row(
+    row: &Bound<PyAny>,
+    table_info: &fcore::metadata::TableInfo,
+) -> PyResult<fcore::row::GenericRow<'static>> {
+    let schema = table_info.get_schema();
+    let row_type = table_info.row_type();
+    let fields = row_type.fields();
+    let pk_indexes = schema.primary_key_indexes();
+    let pk_names: Vec<&str> = schema.primary_key_column_names();
+
+    if pk_indexes.is_empty() {
+        return Err(FlussError::new_err(
+            "Table has no primary key; cannot use PK-only row",
+        ));
+    }
+
+    // Start from an all-Null row as wide as the table schema; only PK slots get overwritten
+    let mut datums: Vec<fcore::row::Datum<'static>> = vec![fcore::row::Datum::Null; fields.len()];
+
+    // Accept dict/list/tuple only; otherwise report the offending Python type name
+    let row_input: RowInput = row.extract().map_err(|_| {
+        let type_name = row
+            .get_type()
+            .name()
+            .map(|n| n.to_string())
+            .unwrap_or_else(|_| "unknown".to_string());
+        FlussError::new_err(format!(
+            "PK row must be a dict, list, or tuple; got {type_name}"
+        ))
+    })?;
+
+    match row_input {
+        RowInput::Dict(dict) => {
+            // Reject non-string keys and keys that are not PK column names
+            for (k, _) in dict.iter() {
+                let key_str = k.extract::<&str>().map_err(|_| {
+                    let key_type = k
+                        .get_type()
+                        .name()
+                        .map(|n| n.to_string())
+                        .unwrap_or_else(|_| "unknown".to_string());
+                    FlussError::new_err(format!("PK dict keys must be strings; got {key_type}"))
+                })?;
+
+                if !pk_names.contains(&key_str) {
+                    return Err(FlussError::new_err(format!(
+                        "Unknown PK field '{}'. Expected PK fields: {}",
+                        key_str,
+                        pk_names.join(", ")
+                    )));
+                }
+            }
+
+            // Fill each PK slot; assumes pk_names[i] names the column at pk_indexes[i] — TODO confirm
+            for (i, pk_idx) in pk_indexes.iter().enumerate() {
+                let pk_name = pk_names[i];
+                let field: &fcore::metadata::DataField = &fields[*pk_idx];
+                let value = dict
+                    .get_item(pk_name)?
+                    .ok_or_else(|| FlussError::new_err(format!("Missing PK field: {}", pk_name)))?;
+                datums[*pk_idx] = python_value_to_datum(&value, field.data_type())
+                    .map_err(|e| FlussError::new_err(format!("PK field '{}': {}", pk_name, e)))?;
+            }
+        }
+
+        RowInput::List(list) => {
+            if list.len() != pk_indexes.len() {
+                return Err(FlussError::new_err(format!(
+                    "PK list must have {} elements (PK columns), got {}",
+                    pk_indexes.len(),
+                    list.len()
+                )));
+            }
+            for (i, pk_idx) in pk_indexes.iter().enumerate() {
+                let field: &fcore::metadata::DataField = &fields[*pk_idx];
+                let value = list.get_item(i)?;
+                datums[*pk_idx] =
+                    python_value_to_datum(&value, field.data_type()).map_err(|e| {
+                        FlussError::new_err(format!("PK field '{}': {}", field.name(), e))
+                    })?;
+            }
+        }
+
+        RowInput::Tuple(tuple) => {
+            if tuple.len() != pk_indexes.len() {
+                return Err(FlussError::new_err(format!(
+                    "PK tuple must have {} elements (PK columns), got {}",
+                    pk_indexes.len(),
+                    tuple.len()
+                )));
+            }
+            for (i, pk_idx) in pk_indexes.iter().enumerate() {
+                let field: &fcore::metadata::DataField = &fields[*pk_idx];
+                let value = tuple.get_item(i)?;
+                datums[*pk_idx] =
+                    python_value_to_datum(&value, field.data_type()).map_err(|e| {
+                        FlussError::new_err(format!("PK field '{}': {}", field.name(), e))
+                    })?;
+            }
+        }
+    }
+
+    Ok(fcore::row::GenericRow { values: datums })
+}
+
 /// Convert Python value to Datum based on data type
 fn python_value_to_datum(
     value: &Bound<PyAny>,
@@ -516,11 +690,237 @@ fn python_value_to_datum(
     }
 }
 
+/// Read the field at `pos` of `row` and convert it to a Python object according to `data_type`.
+/// Reverse of python_value_to_datum; null fields map to `None`, unsupported types raise FlussError.
+pub fn datum_to_python_value(
+    py: Python,
+    row: &dyn fcore::row::InternalRow,
+    pos: usize,
+    data_type: &fcore::metadata::DataType,
+) -> PyResult<Py<PyAny>> {
+    use fcore::metadata::DataType;
+
+    // Nulls short-circuit to Python None before any typed getter is called
+    if row.is_null_at(pos) {
+        return Ok(py.None());
+    }
+
+    match data_type {
+        DataType::Boolean(_) => Ok(row
+            .get_boolean(pos)
+            .into_pyobject(py)?
+            .to_owned()
+            .into_any()
+            .unbind()),
+        DataType::TinyInt(_) => Ok(row
+            .get_byte(pos)
+            .into_pyobject(py)?
+            .to_owned()
+            .into_any()
+            .unbind()),
+        DataType::SmallInt(_) => Ok(row
+            .get_short(pos)
+            .into_pyobject(py)?
+            .to_owned()
+            .into_any()
+            .unbind()),
+        DataType::Int(_) => Ok(row
+            .get_int(pos)
+            .into_pyobject(py)?
+            .to_owned()
+            .into_any()
+            .unbind()),
+        DataType::BigInt(_) => Ok(row
+            .get_long(pos)
+            .into_pyobject(py)?
+            .to_owned()
+            .into_any()
+            .unbind()),
+        DataType::Float(_) => Ok(row
+            .get_float(pos)
+            .into_pyobject(py)?
+            .to_owned()
+            .into_any()
+            .unbind()),
+        DataType::Double(_) => Ok(row
+            .get_double(pos)
+            .into_pyobject(py)?
+            .to_owned()
+            .into_any()
+            .unbind()),
+        DataType::String(_) => {
+            let s = row.get_string(pos);
+            Ok(s.into_pyobject(py)?.into_any().unbind())
+        }
+        DataType::Char(char_type) => {
+            let s = row.get_char(pos, char_type.length() as usize);
+            Ok(s.into_pyobject(py)?.into_any().unbind())
+        }
+        DataType::Bytes(_) => {
+            let b = row.get_bytes(pos);
+            Ok(pyo3::types::PyBytes::new(py, b).into_any().unbind())
+        }
+        DataType::Binary(binary_type) => {
+            let b = row.get_binary(pos, binary_type.length());
+            Ok(pyo3::types::PyBytes::new(py, b).into_any().unbind())
+        }
+        DataType::Decimal(decimal_type) => {
+            let decimal = row.get_decimal(
+                pos,
+                decimal_type.precision() as usize,
+                decimal_type.scale() as usize,
+            );
+            rust_decimal_to_python(py, &decimal)
+        }
+        DataType::Date(_) => {
+            let date = row.get_date(pos);
+            rust_date_to_python(py, date)
+        }
+        DataType::Time(_) => {
+            let time = row.get_time(pos);
+            rust_time_to_python(py, time)
+        }
+        DataType::Timestamp(ts_type) => {
+            let ts = row.get_timestamp_ntz(pos, ts_type.precision());
+            rust_timestamp_ntz_to_python(py, ts)
+        }
+        DataType::TimestampLTz(ts_type) => {
+            let ts = row.get_timestamp_ltz(pos, ts_type.precision());
+            rust_timestamp_ltz_to_python(py, ts)
+        }
+        _ => Err(FlussError::new_err(format!(
+            "Unsupported data type for conversion to Python: {data_type}"
+        ))),
+    }
+}
+
+/// Build a Python `decimal.Decimal` by passing the Rust decimal's string form to its constructor.
+fn rust_decimal_to_python(py: Python, decimal: &fcore::row::Decimal) -> PyResult<Py<PyAny>> {
+    let ctor = get_decimal_type(py)?;
+    // The value travels as text: `Decimal(str)` is called, never a float conversion.
+    let text = decimal.to_string();
+    ctor.call1((text,)).map(|obj| obj.into_any().unbind())
+}
+
+/// Convert Rust Date (days since epoch) to Python datetime.date.
+/// Day counts outside jiff's supported range yield a FlussError rather than a panic.
+fn rust_date_to_python(py: Python, date: fcore::row::Date) -> PyResult<Py<PyAny>> {
+    use pyo3::types::PyDate;
+
+    let out_of_range = |e: jiff::Error| FlussError::new_err(format!("Invalid date: {e}"));
+    // `Span::days` and `Date + Span` panic on overflow, so use their fallible counterparts.
+    let offset = jiff::Span::new()
+        .try_days(date.get_inner() as i64)
+        .map_err(out_of_range)?;
+    let epoch = jiff::civil::date(1970, 1, 1);
+    let civil_date = epoch.checked_add(offset).map_err(out_of_range)?;
+
+    let (year, month, day) = (civil_date.year(), civil_date.month(), civil_date.day());
+    Ok(PyDate::new(py, year as i32, month as u8, day as u8)?.into_any().unbind())
+}
+
+/// Turn a Fluss `Time` into a Python `datetime.time`.
+///
+/// The input is read as milliseconds since midnight and the result carries no tzinfo.
+/// Errors raised while constructing the Python object are propagated unchanged.
+fn rust_time_to_python(py: Python, time: fcore::row::Time) -> PyResult<Py<PyAny>> {
+    use pyo3::types::PyTime;
+
+    let ms_of_day = time.get_inner() as i64;
+
+    // Break the millisecond count into clock fields.
+    let hour = (ms_of_day / MILLIS_PER_HOUR) as u8;
+    let minute = ((ms_of_day % MILLIS_PER_HOUR) / MILLIS_PER_MINUTE) as u8;
+    let second = ((ms_of_day % MILLIS_PER_MINUTE) / MILLIS_PER_SECOND) as u8;
+    // The leftover milliseconds are scaled up because Python's time takes microseconds.
+    let micro = ((ms_of_day % MILLIS_PER_SECOND) * MICROS_PER_MILLI) as u32;
+
+    // `None` tzinfo: the resulting time object is timezone-naive.
+    let py_time = PyTime::new(py, hour, minute, second, micro, None)?;
+    Ok(py_time.into_any().unbind())
+}
+
+/// Convert Rust TimestampNtz to Python naive datetime; i64 overflow raises FlussError.
+fn rust_timestamp_ntz_to_python(py: Python, ts: fcore::row::TimestampNtz) -> PyResult<Py<PyAny>> {
+    use pyo3::types::PyDateTime;
+
+    // Checked math: extreme values must error out, not panic (debug) or wrap (release).
+    let millis = ts.get_millisecond();
+    let sub_micros = ts.get_nano_of_millisecond() as i64 / NANOS_PER_MICRO;
+    let overflow = || FlussError::new_err("Invalid timestamp: microsecond value overflows i64");
+    let scaled = millis.checked_mul(MICROS_PER_MILLI).ok_or_else(overflow)?;
+    let total_micros = scaled.checked_add(sub_micros).ok_or_else(overflow)?;
+    let timestamp = jiff::Timestamp::from_microsecond(total_micros)
+        .map_err(|e| FlussError::new_err(format!("Invalid timestamp: {e}")))?;
+    let civil_dt = timestamp.to_zoned(jiff::tz::TimeZone::UTC).datetime();
+    let py_dt = PyDateTime::new(
+        py,
+        civil_dt.year() as i32,
+        civil_dt.month() as u8,
+        civil_dt.day() as u8,
+        civil_dt.hour() as u8,
+        civil_dt.minute() as u8,
+        civil_dt.second() as u8,
+        (civil_dt.subsec_nanosecond() / 1000) as u32, // microseconds
+        None,
+    )?;
+    Ok(py_dt.into_any().unbind())
+}
+
+/// Convert Rust TimestampLtz to Python UTC-aware datetime; i64 overflow raises FlussError.
+fn rust_timestamp_ltz_to_python(py: Python, ts: fcore::row::TimestampLtz) -> PyResult<Py<PyAny>> {
+    use pyo3::types::PyDateTime;
+
+    // Checked math: extreme values must error out, not panic (debug) or wrap (release).
+    let millis = ts.get_epoch_millisecond();
+    let sub_micros = ts.get_nano_of_millisecond() as i64 / NANOS_PER_MICRO;
+    let overflow = || FlussError::new_err("Invalid timestamp: microsecond value overflows i64");
+    let scaled = millis.checked_mul(MICROS_PER_MILLI).ok_or_else(overflow)?;
+    let total_micros = scaled.checked_add(sub_micros).ok_or_else(overflow)?;
+    let timestamp = jiff::Timestamp::from_microsecond(total_micros)
+        .map_err(|e| FlussError::new_err(format!("Invalid timestamp: {e}")))?;
+    let civil_dt = timestamp.to_zoned(jiff::tz::TimeZone::UTC).datetime();
+    let utc = get_utc_timezone(py)?;
+    let py_dt = PyDateTime::new(
+        py,
+        civil_dt.year() as i32,
+        civil_dt.month() as u8,
+        civil_dt.day() as u8,
+        civil_dt.hour() as u8,
+        civil_dt.minute() as u8,
+        civil_dt.second() as u8,
+        (civil_dt.subsec_nanosecond() / 1000) as u32, // microseconds
+        Some(&utc),
+    )?;
+    Ok(py_dt.into_any().unbind())
+}
+
+/// Materialise `row` as a Python dict keyed by the column names from `table_info`.
+pub fn internal_row_to_dict(
+    py: Python,
+    row: &dyn fcore::row::InternalRow,
+    table_info: &fcore::metadata::TableInfo,
+) -> PyResult<Py<PyAny>> {
+    let out = pyo3::types::PyDict::new(py);
+    let columns = table_info.row_type().fields();
+
+    // Column i of the schema is read from position i of the row; the first failure aborts.
+    columns.iter().enumerate().try_for_each(|(idx, column)| {
+        let converted = datum_to_python_value(py, row, idx, column.data_type())?;
+        out.set_item(column.name(), converted)
+    })?;
+
+    Ok(out.into_any().unbind())
+}
+
 /// Cached decimal.Decimal type
 /// Uses PyOnceLock for thread-safety and subinterpreter compatibility.
 static DECIMAL_TYPE: pyo3::sync::PyOnceLock<Py<pyo3::types::PyType>> =
     pyo3::sync::PyOnceLock::new();
 
+/// Cached `datetime.timezone.utc` object; populated on first use by `get_utc_timezone`.
+static UTC_TIMEZONE: pyo3::sync::PyOnceLock<Py<PyAny>> = pyo3::sync::PyOnceLock::new();
+
 /// Cached UTC epoch type
 static UTC_EPOCH: pyo3::sync::PyOnceLock<Py<PyAny>> = pyo3::sync::PyOnceLock::new();
 
@@ -536,6 +936,21 @@ fn get_decimal_type(py: Python) -> PyResult<Bound<pyo3::types::PyType>> {
     Ok(ty.bind(py).clone())
 }
 
+/// Return `datetime.timezone.utc` as a `PyTzInfo`, importing and caching it on first call.
+fn get_utc_timezone(py: Python) -> PyResult<Bound<pyo3::types::PyTzInfo>> {
+    let load_utc = || -> PyResult<Py<PyAny>> {
+        let utc_attr = py.import("datetime")?.getattr("timezone")?.getattr("utc")?;
+        Ok(utc_attr.unbind())
+    };
+    let cached = UTC_TIMEZONE.get_or_try_init(py, load_utc)?;
+    // PyDateTime::new() wants a tzinfo handle, so narrow the cached PyAny accordingly.
+    let tzinfo = cached
+        .bind(py)
+        .clone()
+        .downcast_into::<pyo3::types::PyTzInfo>()?;
+    Ok(tzinfo)
+}
+
 /// Get the cached UTC epoch datetime, creating it once per interpreter.
 fn get_utc_epoch(py: Python) -> PyResult<Bound<PyAny>> {
     let epoch = UTC_EPOCH.get_or_try_init(py, || -> PyResult<_> {
diff --git a/fluss-rust/bindings/python/src/upsert.rs b/fluss-rust/bindings/python/src/upsert.rs
new file mode 100644
index 0000000000..08b3597056
--- /dev/null
+++ b/fluss-rust/bindings/python/src/upsert.rs
@@ -0,0 +1,188 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::table::{python_pk_to_generic_row, python_to_generic_row};
+use crate::*;
+use pyo3_async_runtimes::tokio::future_into_py;
+use std::sync::Arc;
+use tokio::sync::Mutex;
+
+/// Writer for upserting and deleting data in a Fluss primary key table.
+///
+/// Each upsert/delete operation is sent to the server and waits for acknowledgment.
+/// Multiple concurrent writers share a common WriterClient which batches requests for efficiency.
+///
+/// # Example:
+///     writer = table.new_upsert()
+///     await writer.upsert(row1)
+///     await writer.upsert(row2)
+///     await writer.delete(pk)
+///     await writer.flush()  # Ensures all pending operations are acknowledged
+#[pyclass]
+pub struct UpsertWriter {
+    inner: Arc<UpsertWriterInner>,
+}
+
+/// State behind the `Arc`: each Python call clones the `Arc` into the future it returns.
+struct UpsertWriterInner {
+    table_upsert: fcore::client::TableUpsert,
+    /// Lazily initialized writer - `None` until the first upsert/delete creates it
+    writer: Mutex<Option<fcore::client::UpsertWriter>>,
+    table_info: fcore::metadata::TableInfo,
+}
+
+#[pymethods]
+impl UpsertWriter {
+    /// Insert a row, or overwrite the existing row that has the same primary key.
+    ///
+    /// The row is converted to the internal representation before the awaitable is
+    /// created, so malformed input raises immediately rather than when awaited.
+    ///
+    /// Args:
+    ///     row: A dict, list, or tuple containing the row data.
+    ///          For dict: keys are column names, values are column values.
+    ///          For list/tuple: values must be in schema order.
+    ///
+    /// Returns:
+    ///     None on success
+    pub fn upsert<'py>(
+        &self,
+        py: Python<'py>,
+        row: &Bound<'_, PyAny>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let shared = Arc::clone(&self.inner);
+        let row_data = python_to_generic_row(row, &shared.table_info)?;
+
+        future_into_py(py, async move {
+            let mut slot = shared.get_or_create_writer().await?;
+            // `get_or_create_writer` only returns Ok once the slot holds a writer.
+            let writer = slot.as_mut().unwrap();
+            match writer.upsert(&row_data).await {
+                Ok(_) => Ok(()),
+                Err(e) => Err(FlussError::new_err(e.to_string())),
+            }
+        })
+    }
+
+    /// Remove the row identified by the given primary key.
+    ///
+    /// Args:
+    ///     pk: A dict, list, or tuple containing only the primary key values.
+    ///         For dict: keys are PK column names.
+    ///         For list/tuple: values in PK column order.
+    ///
+    /// Returns:
+    ///     None on success
+    pub fn delete<'py>(
+        &self,
+        py: Python<'py>,
+        pk: &Bound<'_, PyAny>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let shared = Arc::clone(&self.inner);
+        let key_row = python_pk_to_generic_row(pk, &shared.table_info)?;
+
+        future_into_py(py, async move {
+            let mut slot = shared.get_or_create_writer().await?;
+            // `get_or_create_writer` only returns Ok once the slot holds a writer.
+            let writer = slot.as_mut().unwrap();
+            match writer.delete(&key_row).await {
+                Ok(_) => Ok(()),
+                Err(e) => Err(FlussError::new_err(e.to_string())),
+            }
+        })
+    }
+
+    /// Push every buffered upsert/delete to the server and wait for the acknowledgments.
+    ///
+    /// Acknowledgment follows the writer's ack configuration. If no write has been
+    /// issued yet there is no underlying writer, and the call completes immediately.
+    ///
+    /// Returns:
+    ///     None on success
+    pub fn flush<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let shared = Arc::clone(&self.inner);
+
+        future_into_py(py, async move {
+            // The lock guard stays alive until the flush future resolves.
+            let slot = shared.writer.lock().await;
+
+            match slot.as_ref() {
+                // Nothing to flush - no writer was created yet
+                None => Ok(()),
+                Some(writer) => writer
+                    .flush()
+                    .await
+                    .map_err(|e| FlussError::new_err(e.to_string())),
+            }
+        })
+    }
+
+    fn __repr__(&self) -> String {
+        String::from("UpsertWriter()")
+    }
+}
+
+impl UpsertWriter {
+    /// Wrap a core `TableUpsert` in the Python-facing writer.
+    ///
+    /// `columns` wins over `column_indices` for partial updates; neither leaves it unchanged.
+    pub fn new(
+        table_upsert: fcore::client::TableUpsert,
+        table_info: fcore::metadata::TableInfo,
+        columns: Option<Vec<String>>,
+        column_indices: Option<Vec<usize>>,
+    ) -> PyResult<Self> {
+        let configured = match (columns, column_indices) {
+            (Some(names), _) => {
+                let name_refs: Vec<&str> = names.iter().map(String::as_str).collect();
+                table_upsert
+                    .partial_update_with_column_names(&name_refs)
+                    .map_err(|e| FlussError::new_err(e.to_string()))?
+            }
+            (None, Some(positions)) => table_upsert
+                .partial_update(Some(positions))
+                .map_err(|e| FlussError::new_err(e.to_string()))?,
+            (None, None) => table_upsert,
+        };
+
+        let state = UpsertWriterInner {
+            table_upsert: configured,
+            writer: Mutex::new(None),
+            table_info,
+        };
+        Ok(Self {
+            inner: Arc::new(state),
+        })
+    }
+}
+
+impl UpsertWriterInner {
+    /// Lock the writer slot and return the guard, filling the slot first if it is empty.
+    /// Creation failures are surfaced as `FlussError` and leave the slot empty.
+    async fn get_or_create_writer(
+        &self,
+    ) -> PyResult<tokio::sync::MutexGuard<'_, Option<fcore::client::UpsertWriter>>> {
+        let mut slot = self.writer.lock().await;
+        if slot.is_some() {
+            return Ok(slot);
+        }
+        // First use: the writer is built while the lock is still held.
+        let created = self.table_upsert.create_writer();
+        *slot = Some(created.map_err(|e| FlussError::new_err(e.to_string()))?);
+        Ok(slot)
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index 69cb91efa7..5410002e7c 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -16,7 +16,6 @@
 // under the License.
 
 use crate::bucketing::BucketingFunction;
-use crate::client::connection::FlussConnection;
 use crate::client::metadata::Metadata;
 use crate::client::table::partition_getter::PartitionGetter;
 use crate::error::{Error, Result};
@@ -26,6 +25,7 @@ use crate::row::InternalRow;
 use crate::row::compacted::CompactedRow;
 use crate::row::encode::{KeyEncoder, KeyEncoderFactory};
 use crate::rpc::ApiError;
+use crate::rpc::RpcClient;
 use crate::rpc::message::LookupRequest;
 use std::sync::Arc;
 
@@ -34,19 +34,19 @@ use std::sync::Arc;
 /// Contains the rows returned from a lookup. For primary key lookups,
 /// this will contain at most one row. For prefix key lookups (future),
 /// this may contain multiple rows.
-pub struct LookupResult<'a> {
+pub struct LookupResult {
     rows: Vec<Vec<u8>>,
-    row_type: &'a RowType,
+    row_type: Arc<RowType>,
 }
 
-impl<'a> LookupResult<'a> {
+impl LookupResult {
     /// Creates a new LookupResult from a list of row bytes.
-    fn new(rows: Vec<Vec<u8>>, row_type: &'a RowType) -> Self {
+    fn new(rows: Vec<Vec<u8>>, row_type: Arc<RowType>) -> Self {
         Self { rows, row_type }
     }
 
     /// Creates an empty LookupResult.
-    fn empty(row_type: &'a RowType) -> Self {
+    fn empty(row_type: Arc<RowType>) -> Self {
         Self {
             rows: Vec::new(),
             row_type,
@@ -67,7 +67,7 @@ impl<'a> LookupResult<'a> {
         match self.rows.len() {
             0 => Ok(None),
             1 => Ok(Some(CompactedRow::from_bytes(
-                self.row_type,
+                &self.row_type,
                 &self.rows[0][SCHEMA_ID_LENGTH..],
             ))),
             _ => Err(Error::UnexpectedError {
@@ -82,7 +82,7 @@ impl<'a> LookupResult<'a> {
         self.rows
             .iter()
             // TODO Add schema id check and fetch when implementing prefix lookup
-            .map(|bytes| CompactedRow::from_bytes(self.row_type, &bytes[SCHEMA_ID_LENGTH..]))
+            .map(|bytes| CompactedRow::from_bytes(&self.row_type, &bytes[SCHEMA_ID_LENGTH..]))
             .collect()
     }
 }
@@ -104,20 +104,20 @@ impl<'a> LookupResult<'a> {
 /// ```
 // TODO: Add lookup_by(column_names) for prefix key lookups (PrefixKeyLookuper)
 // TODO: Add create_typed_lookuper<T>() for typed lookups with POJO mapping
-pub struct TableLookup<'a> {
-    conn: &'a FlussConnection,
+pub struct TableLookup {
+    rpc_client: Arc<RpcClient>,
     table_info: TableInfo,
     metadata: Arc<Metadata>,
 }
 
-impl<'a> TableLookup<'a> {
+impl TableLookup {
     pub(super) fn new(
-        conn: &'a FlussConnection,
+        rpc_client: Arc<RpcClient>,
         table_info: TableInfo,
         metadata: Arc<Metadata>,
     ) -> Self {
         Self {
-            conn,
+            rpc_client,
             table_info,
             metadata,
         }
@@ -127,7 +127,7 @@ impl<'a> TableLookup<'a> {
     ///
     /// The lookuper will automatically encode the key and compute the bucket
     /// for each lookup using the appropriate bucketing function.
-    pub fn create_lookuper(self) -> Result<Lookuper<'a>> {
+    pub fn create_lookuper(self) -> Result<Lookuper> {
         let num_buckets = self.table_info.get_num_buckets();
 
         // Get data lake format from table config for bucketing function
@@ -162,9 +162,11 @@ impl<'a> TableLookup<'a> {
             None
         };
 
+        let row_type = Arc::new(self.table_info.row_type().clone());
         Ok(Lookuper {
-            conn: self.conn,
+            rpc_client: self.rpc_client,
             table_path: Arc::new(self.table_info.table_path.clone()),
+            row_type,
             table_info: self.table_info,
             metadata: self.metadata,
             bucketing_function,
@@ -187,9 +189,10 @@ impl<'a> TableLookup<'a> {
 /// let row = GenericRow::new(vec![Datum::Int32(42)]); // lookup key
 /// let result = lookuper.lookup(&row).await?;
 /// ```
-pub struct Lookuper<'a> {
-    conn: &'a FlussConnection,
+pub struct Lookuper {
+    rpc_client: Arc<RpcClient>,
     table_info: TableInfo,
+    row_type: Arc<RowType>,
     table_path: Arc<TablePath>,
     metadata: Arc<Metadata>,
     bucketing_function: Box<dyn BucketingFunction>,
@@ -199,7 +202,7 @@ pub struct Lookuper<'a> {
     num_buckets: i32,
 }
 
-impl<'a> Lookuper<'a> {
+impl Lookuper {
     /// Looks up a value by its primary key.
     ///
     /// The key is encoded and the bucket is automatically computed using
@@ -211,7 +214,7 @@ impl<'a> Lookuper<'a> {
     /// # Returns
     /// * `Ok(LookupResult)` - The lookup result (may be empty if key not found)
     /// * `Err(Error)` - If the lookup fails
-    pub async fn lookup(&mut self, row: &dyn InternalRow) -> Result<LookupResult<'_>> {
+    pub async fn lookup(&mut self, row: &dyn InternalRow) -> Result<LookupResult> {
         // todo: support batch lookup
         let pk_bytes = self.primary_key_encoder.encode_key(row)?;
         let pk_bytes_vec = pk_bytes.to_vec();
@@ -231,7 +234,7 @@ impl<'a> Lookuper<'a> {
                 Some(id) => Some(id),
                 None => {
                     // Partition doesn't exist, return empty result (like Java)
-                    return Ok(LookupResult::empty(self.table_info.row_type()));
+                    return Ok(LookupResult::empty(Arc::clone(&self.row_type)));
                 }
             }
         } else {
@@ -266,8 +269,7 @@ impl<'a> Lookuper<'a> {
                     ),
                 })?;
 
-        let connections = self.conn.get_connections();
-        let connection = connections.get_connection(tablet_server).await?;
+        let connection = self.rpc_client.get_connection(tablet_server).await?;
 
         // Send lookup request
         let request = LookupRequest::new(table_id, partition_id, bucket_id, vec![pk_bytes_vec]);
@@ -294,10 +296,10 @@ impl<'a> Lookuper<'a> {
                 .filter_map(|pb_value| pb_value.values)
                 .collect();
 
-            return Ok(LookupResult::new(rows, self.table_info.row_type()));
+            return Ok(LookupResult::new(rows, Arc::clone(&self.row_type)));
         }
 
-        Ok(LookupResult::empty(self.table_info.row_type()))
+        Ok(LookupResult::empty(Arc::clone(&self.row_type)))
     }
 
     /// Returns a reference to the table info.
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 6d54933abc..37e9b45b14 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -112,14 +112,14 @@ impl<'a> FlussTable<'a> {
     ///     println!("Found value: {:?}", value);
     /// }
     /// ```
-    pub fn new_lookup(&self) -> Result<TableLookup<'_>> {
+    pub fn new_lookup(&self) -> Result<TableLookup> {
         if !self.has_primary_key {
             return Err(Error::UnsupportedOperation {
                 message: "Lookup is only supported for primary key tables".to_string(),
             });
         }
         Ok(TableLookup::new(
-            self.conn,
+            self.conn.get_connections(),
             self.table_info.clone(),
             self.metadata.clone(),
         ))
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 422f9d32ab..aa9fca4f8a 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -97,7 +97,7 @@ impl<'a> TableScan<'a> {
     ///                 .column("col1", DataTypes::int())
     ///                 .column("col2", DataTypes::string())
     ///                 .column("col3", DataTypes::string())
-    ///                 .column("col3", DataTypes::string())
+    ///                 .column("col4", DataTypes::string())
     ///             .build()?,
     ///         ).build()?;
     ///     let table_path = TablePath::new("fluss".to_owned(), "rust_test_long".to_owned());
@@ -179,7 +179,6 @@ impl<'a> TableScan<'a> {
     ///     let admin = conn.get_admin().await?;
     ///     admin.create_table(&table_path, &table_descriptor, true)
     ///         .await?;
-    ///     let table_info = admin.get_table(&table_path).await?;
     ///     let table = conn.get_table(&table_path).await?;
     ///
     ///     // Project columns by column names
diff --git a/fluss-rust/crates/fluss/src/row/encode/mod.rs b/fluss-rust/crates/fluss/src/row/encode/mod.rs
index d5cf8ace85..1ce7aef75c 100644
--- a/fluss-rust/crates/fluss/src/row/encode/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/mod.rs
@@ -27,7 +27,7 @@ use bytes::Bytes;
 
 /// An interface for encoding key of row into bytes.
 #[allow(dead_code)]
-pub trait KeyEncoder {
+pub trait KeyEncoder: Send + Sync {
     fn encode_key(&mut self, row: &dyn InternalRow) -> Result<Bytes>;
 }
 
@@ -71,7 +71,7 @@ impl KeyEncoderFactory {
 /// 2. call method [`RowEncoder::encode_field()`] to write the row's field.
 /// 3. call method [`RowEncoder::finishRow()`] to finish the writing and get the written row.
 #[allow(dead_code)]
-pub trait RowEncoder {
+pub trait RowEncoder: Send + Sync {
     /// Start to write a new row.
     ///
     /// # Returns

From a084659ace54ff66c96db03b045b99a71a2f66cf Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Thu, 5 Feb 2026 22:27:58 +0000
Subject: [PATCH 109/287] feat: Support different poll methods (#246)

---
 fluss-rust/bindings/python/example/example.py |  92 ++-
 fluss-rust/bindings/python/fluss/__init__.pyi | 244 ++++++-
 fluss-rust/bindings/python/src/lib.rs         |   4 +
 fluss-rust/bindings/python/src/metadata.rs    |  51 ++
 fluss-rust/bindings/python/src/table.rs       | 620 +++++++++++++++---
 fluss-rust/bindings/python/src/utils.rs       |  17 +-
 6 files changed, 885 insertions(+), 143 deletions(-)

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index c359425e13..9cb8f4334e 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -236,31 +236,32 @@ async def main():
         print(f"Error during writing: {e}")
 
     # Now scan the table to verify data was written
-    print("\n--- Scanning table ---")
+    print("\n--- Scanning table (batch scanner) ---")
     try:
-        log_scanner = await table.new_log_scanner()
-        print(f"Created log scanner: {log_scanner}")
+        # Use new_scan().create_batch_scanner() for batch-based operations
+        batch_scanner = await table.new_scan().create_batch_scanner()
+        print(f"Created batch scanner: {batch_scanner}")
 
         # Subscribe to scan from earliest to latest
         # start_timestamp=None (earliest), end_timestamp=None (latest)
-        log_scanner.subscribe(None, None)
+        batch_scanner.subscribe(None, None)
 
         print("Scanning results using to_arrow():")
 
         # Try to get as PyArrow Table
         try:
-            pa_table_result = log_scanner.to_arrow()
+            pa_table_result = batch_scanner.to_arrow()
             print(f"\nAs PyArrow Table: {pa_table_result}")
         except Exception as e:
             print(f"Could not convert to PyArrow: {e}")
 
         # Let's subscribe from the beginning again.
         # Reset subscription
-        log_scanner.subscribe(None, None)
+        batch_scanner.subscribe(None, None)
 
         # Try to get as Pandas DataFrame
         try:
-            df_result = log_scanner.to_pandas()
+            df_result = batch_scanner.to_pandas()
             print(f"\nAs Pandas DataFrame:\n{df_result}")
         except Exception as e:
             print(f"Could not convert to Pandas: {e}")
@@ -270,15 +271,15 @@ async def main():
 
         # TODO: support to_duckdb()
 
-        # Test the new poll() method for incremental reading
-        print("\n--- Testing poll() method ---")
+        # Test poll_arrow() method for incremental reading as Arrow Table
+        print("\n--- Testing poll_arrow() method ---")
         # Reset subscription to start from the beginning
-        log_scanner.subscribe(None, None)
+        batch_scanner.subscribe(None, None)
 
         # Poll with a timeout of 5000ms (5 seconds)
-        # Note: poll() returns an empty table (not an error) on timeout
+        # Note: poll_arrow() returns an empty table (not an error) on timeout
         try:
-            poll_result = log_scanner.poll(5000)
+            poll_result = batch_scanner.poll_arrow(5000)
             print(f"Number of rows: {poll_result.num_rows}")
 
             if poll_result.num_rows > 0:
@@ -289,11 +290,58 @@ async def main():
                 # Empty table still has schema
                 print(f"Schema: {poll_result.schema}")
 
+        except Exception as e:
+            print(f"Error during poll_arrow: {e}")
+
+        # Test poll_batches() method for batches with metadata
+        print("\n--- Testing poll_batches() method ---")
+        batch_scanner.subscribe(None, None)
+
+        try:
+            batches = batch_scanner.poll_batches(5000)
+            print(f"Number of batches: {len(batches)}")
+
+            for i, batch in enumerate(batches):
+                print(f"  Batch {i}: bucket={batch.bucket}, "
+                      f"offsets={batch.base_offset}-{batch.last_offset}, "
+                      f"rows={batch.batch.num_rows}")
+
+        except Exception as e:
+            print(f"Error during poll_batches: {e}")
+
+    except Exception as e:
+        print(f"Error during batch scanning: {e}")
+
+    # Test record-based scanning with poll()
+    print("\n--- Scanning table (record scanner) ---")
+    try:
+        # Use new_scan().create_log_scanner() for record-based operations
+        record_scanner = await table.new_scan().create_log_scanner()
+        print(f"Created record scanner: {record_scanner}")
+
+        record_scanner.subscribe(None, None)
+
+        # Poll returns List[ScanRecord] with per-record metadata
+        print("\n--- Testing poll() method (record-by-record) ---")
+        try:
+            records = record_scanner.poll(5000)
+            print(f"Number of records: {len(records)}")
+
+            # Show first few records with metadata
+            for i, record in enumerate(records[:5]):
+                print(f"  Record {i}: offset={record.offset}, "
+                      f"timestamp={record.timestamp}, "
+                      f"change_type={record.change_type}, "
+                      f"row={record.row}")
+
+            if len(records) > 5:
+                print(f"  ... and {len(records) - 5} more records")
+
         except Exception as e:
             print(f"Error during poll: {e}")
 
     except Exception as e:
-        print(f"Error during scanning: {e}")
+        print(f"Error during record scanning: {e}")
 
     # =====================================================
     # Demo: Primary Key Table with Lookup and Upsert
@@ -488,12 +536,12 @@ async def main():
         print(f"Error during delete: {e}")
         traceback.print_exc()
 
-    # Demo: Column projection
+    # Demo: Column projection using builder pattern
     print("\n--- Testing Column Projection ---")
     try:
-        # Project specific columns by index
+        # Project specific columns by index (using batch scanner for to_pandas)
         print("\n1. Projection by index [0, 1] (id, name):")
-        scanner_index = await table.new_log_scanner(project=[0, 1])
+        scanner_index = await table.new_scan().project([0, 1]).create_batch_scanner()
         scanner_index.subscribe(None, None)
         df_projected = scanner_index.to_pandas()
         print(df_projected.head())
@@ -503,12 +551,22 @@ async def main():
 
         # Project specific columns by name (Pythonic!)
         print("\n2. Projection by name ['name', 'score'] (Pythonic):")
-        scanner_names = await table.new_log_scanner(columns=["name", "score"])
+        scanner_names = await table.new_scan() \
+            .project_by_name(["name", "score"]) \
+            .create_batch_scanner()
         scanner_names.subscribe(None, None)
         df_named = scanner_names.to_pandas()
         print(df_named.head())
         print(f"   Projected {df_named.shape[1]} columns: {list(df_named.columns)}")
 
+        # Test empty result schema with projection
+        print("\n3. Testing empty result schema with projection:")
+        scanner_proj = await table.new_scan().project([0, 2]).create_batch_scanner()
+        scanner_proj.subscribe(None, None)
+        # Quick poll that may return empty
+        result = scanner_proj.poll_arrow(100)
+        print(f"   Schema columns: {result.schema.names}")
+
     except Exception as e:
         print(f"Error during projection: {e}")
 
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index c911ebedfc..40d18f6c27 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -17,12 +17,79 @@
 
 """Type stubs for Fluss Python bindings."""
 
+from enum import IntEnum
 from types import TracebackType
 from typing import Dict, List, Optional, Tuple
 
 import pandas as pd
 import pyarrow as pa
 
+class ChangeType(IntEnum):
+    """Represents the type of change for a record in a log."""
+
+    AppendOnly = 0
+    """Append-only operation"""
+    Insert = 1
+    """Insert operation"""
+    UpdateBefore = 2
+    """Update operation containing the previous content of the updated row"""
+    UpdateAfter = 3
+    """Update operation containing the new content of the updated row"""
+    Delete = 4
+    """Delete operation"""
+
+    def short_string(self) -> str:
+        """Returns a short string representation (+A, +I, -U, +U, -D)."""
+        ...
+
+class ScanRecord:
+    """Represents a single scan record with metadata."""
+
+    @property
+    def bucket(self) -> TableBucket:
+        """The bucket this record belongs to."""
+        ...
+    @property
+    def offset(self) -> int:
+        """The position of this record in the log."""
+        ...
+    @property
+    def timestamp(self) -> int:
+        """The timestamp of this record."""
+        ...
+    @property
+    def change_type(self) -> ChangeType:
+        """The type of change (insert, update, delete, etc.)."""
+        ...
+    @property
+    def row(self) -> Dict[str, object]:
+        """The row data as a dictionary mapping column names to values."""
+        ...
+    def __str__(self) -> str: ...
+    def __repr__(self) -> str: ...
+
+class RecordBatch:
+    """Represents a batch of records with metadata."""
+
+    @property
+    def batch(self) -> pa.RecordBatch:
+        """The Arrow RecordBatch containing the data."""
+        ...
+    @property
+    def bucket(self) -> TableBucket:
+        """The bucket this batch belongs to."""
+        ...
+    @property
+    def base_offset(self) -> int:
+        """The offset of the first record in this batch."""
+        ...
+    @property
+    def last_offset(self) -> int:
+        """The offset of the last record in this batch."""
+        ...
+    def __str__(self) -> str: ...
+    def __repr__(self) -> str: ...
+
 class Config:
     def __init__(self, properties: Optional[Dict[str, str]] = None) -> None: ...
     @property
@@ -64,13 +131,92 @@ class FlussAdmin:
     async def get_latest_lake_snapshot(self, table_path: TablePath) -> LakeSnapshot: ...
     def __repr__(self) -> str: ...
 
+class TableScan:
+    """Builder for creating log scanners with flexible configuration.
+
+    Use this builder to configure projection before creating a log scanner.
+    Obtain a TableScan instance via `FlussTable.new_scan()`.
+
+    Example:
+        ```python
+        # Record-based scanning with projection
+        scanner = await table.new_scan() \\
+            .project([0, 1, 2]) \\
+            .create_log_scanner()
+
+        # Batch-based scanning with column names
+        scanner = await table.new_scan() \\
+            .project_by_name(["id", "name"]) \\
+            .create_batch_scanner()
+        ```
+    """
+
+    def project(self, indices: List[int]) -> "TableScan":
+        """Project to specific columns by their indices.
+
+        Args:
+            indices: List of column indices (0-based) to include in the scan.
+
+        Returns:
+            Self for method chaining.
+        """
+        ...
+    def project_by_name(self, names: List[str]) -> "TableScan":
+        """Project to specific columns by their names.
+
+        Args:
+            names: List of column names to include in the scan.
+
+        Returns:
+            Self for method chaining.
+        """
+        ...
+    async def create_log_scanner(self) -> LogScanner:
+        """Create a record-based log scanner.
+
+        Use this scanner with `poll()` to get individual records with metadata
+        (offset, timestamp, change_type).
+
+        Returns:
+            LogScanner for record-by-record scanning with `poll()`
+        """
+        ...
+    async def create_batch_scanner(self) -> LogScanner:
+        """Create a batch-based log scanner.
+
+        Use this scanner with `poll_arrow()` to get Arrow Tables, or with
+        `poll_batches()` to get individual batches with metadata.
+
+        Returns:
+            LogScanner for batch-based scanning with `poll_arrow()` or `poll_batches()`
+        """
+        ...
+    def __repr__(self) -> str: ...
+
 class FlussTable:
+    def new_scan(self) -> TableScan:
+        """Create a new table scan builder for configuring and creating log scanners.
+
+        Use this method to create scanners with the builder pattern:
+
+        Example:
+            ```python
+            # Record-based scanning
+            scanner = await table.new_scan() \\
+                .project([0, 1]) \\
+                .create_log_scanner()
+
+            # Batch-based scanning
+            scanner = await table.new_scan() \\
+                .project_by_name(["id", "name"]) \\
+                .create_batch_scanner()
+            ```
+
+        Returns:
+            TableScan builder for configuring the scanner.
+        """
+        ...
     async def new_append_writer(self) -> AppendWriter: ...
-    async def new_log_scanner(
-        self,
-        project: Optional[List[int]] = None,
-        columns: Optional[List[str]] = None,
-    ) -> LogScanner: ...
     def new_upsert(
         self,
         columns: Optional[List[str]] = None,
@@ -159,11 +305,93 @@ class Lookuper:
     def __repr__(self) -> str: ...
 
 class LogScanner:
+    """Scanner for reading log data from a Fluss table.
+
+    This scanner supports two modes:
+    - Record-based scanning via `poll()` - returns individual records with metadata
+    - Batch-based scanning via `poll_arrow()` / `poll_batches()` - returns Arrow batches
+
+    Create scanners using the builder pattern:
+        # Record-based scanning
+        scanner = await table.new_scan().create_log_scanner()
+
+        # Batch-based scanning
+        scanner = await table.new_scan().create_batch_scanner()
+
+        # With projection
+        scanner = await table.new_scan().project([0, 1]).create_log_scanner()
+    """
+
     def subscribe(
         self, start_timestamp: Optional[int], end_timestamp: Optional[int]
-    ) -> None: ...
-    def to_pandas(self) -> pd.DataFrame: ...
-    def to_arrow(self) -> pa.Table: ...
+    ) -> None:
+        """Subscribe to log data with timestamp range.
+
+        Args:
+            start_timestamp: Not yet supported, must be None.
+            end_timestamp: Not yet supported, must be None.
+        """
+        ...
+    def poll(self, timeout_ms: int) -> List[ScanRecord]:
+        """Poll for individual records with metadata.
+
+        Requires a record-based scanner (created with new_scan().create_log_scanner()).
+
+        Args:
+            timeout_ms: Timeout in milliseconds to wait for records.
+
+        Returns:
+            List of ScanRecord objects, each containing bucket, offset, timestamp,
+            change_type, and row data as a dictionary.
+
+        Note:
+            Returns an empty list if no records are available or timeout expires.
+        """
+        ...
+    def poll_batches(self, timeout_ms: int) -> List[RecordBatch]:
+        """Poll for batches with metadata.
+
+        Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+
+        Args:
+            timeout_ms: Timeout in milliseconds to wait for batches.
+
+        Returns:
+            List of RecordBatch objects, each containing the Arrow batch along with
+            bucket, base_offset, and last_offset metadata.
+
+        Note:
+            Returns an empty list if no batches are available or timeout expires.
+        """
+        ...
+    def poll_arrow(self, timeout_ms: int) -> pa.Table:
+        """Poll for records as an Arrow Table.
+
+        Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+
+        Args:
+            timeout_ms: Timeout in milliseconds to wait for records.
+
+        Returns:
+            PyArrow Table containing the polled records (batches merged).
+
+        Note:
+            Returns an empty table (with correct schema) if no records are available
+            or timeout expires.
+        """
+        ...
+    def to_pandas(self) -> pd.DataFrame:
+        """Convert all data to Pandas DataFrame.
+
+        Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+        """
+        ...
+    def to_arrow(self) -> pa.Table:
+        """Convert all data to Arrow Table.
+
+        Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+        """
+        ...
     def __repr__(self) -> str: ...
 
 class Schema:
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 3da0b251f6..ce063aba4a 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -58,6 +58,7 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<TableDescriptor>()?;
     m.add_class::<FlussAdmin>()?;
     m.add_class::<FlussTable>()?;
+    m.add_class::<TableScan>()?;
     m.add_class::<AppendWriter>()?;
     m.add_class::<UpsertWriter>()?;
     m.add_class::<Lookuper>()?;
@@ -65,6 +66,9 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<LogScanner>()?;
     m.add_class::<LakeSnapshot>()?;
     m.add_class::<TableBucket>()?;
+    m.add_class::<ChangeType>()?;
+    m.add_class::<ScanRecord>()?;
+    m.add_class::<RecordBatch>()?;
 
     // Register exception types
     m.add_class::<FlussError>()?;
diff --git a/fluss-rust/bindings/python/src/metadata.rs b/fluss-rust/bindings/python/src/metadata.rs
index f422696157..f39f9d441b 100644
--- a/fluss-rust/bindings/python/src/metadata.rs
+++ b/fluss-rust/bindings/python/src/metadata.rs
@@ -19,6 +19,57 @@ use crate::*;
 use pyo3::types::PyDict;
 use std::collections::HashMap;
 
+/// Represents the type of change for a record in a log
+#[pyclass(eq, eq_int)]
+#[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
+pub enum ChangeType {
+    /// Append-only operation
+    AppendOnly = 0,
+    /// Insert operation
+    Insert = 1,
+    /// Update operation containing the previous content of the updated row
+    UpdateBefore = 2,
+    /// Update operation containing the new content of the updated row
+    UpdateAfter = 3,
+    /// Delete operation
+    Delete = 4,
+}
+
+#[pymethods]
+impl ChangeType {
+    /// Returns a short string representation of this ChangeType
+    pub fn short_string(&self) -> &'static str {
+        match self {
+            ChangeType::AppendOnly => "+A",
+            ChangeType::Insert => "+I",
+            ChangeType::UpdateBefore => "-U",
+            ChangeType::UpdateAfter => "+U",
+            ChangeType::Delete => "-D",
+        }
+    }
+
+    fn __str__(&self) -> &'static str {
+        self.short_string()
+    }
+
+    fn __repr__(&self) -> String {
+        format!("ChangeType.{:?}", self)
+    }
+}
+
+impl ChangeType {
+    /// Convert from core ChangeType
+    pub fn from_core(change_type: fcore::record::ChangeType) -> Self {
+        match change_type {
+            fcore::record::ChangeType::AppendOnly => ChangeType::AppendOnly,
+            fcore::record::ChangeType::Insert => ChangeType::Insert,
+            fcore::record::ChangeType::UpdateBefore => ChangeType::UpdateBefore,
+            fcore::record::ChangeType::UpdateAfter => ChangeType::UpdateAfter,
+            fcore::record::ChangeType::Delete => ChangeType::Delete,
+        }
+    }
+}
+
 /// Represents a table path with database and table name
 #[pyclass]
 #[derive(Clone)]
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 4554ca17e5..30c7ce0bff 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -17,8 +17,9 @@
 
 use crate::TOKIO_RUNTIME;
 use crate::*;
-use arrow::array::RecordBatch;
+use arrow::array::RecordBatch as ArrowRecordBatch;
 use arrow_pyarrow::{FromPyArrow, ToPyArrow};
+use arrow_schema::SchemaRef;
 use fluss::client::EARLIEST_OFFSET;
 use fluss::record::to_arrow_schema;
 use fluss::rpc::message::OffsetSpec;
@@ -38,6 +39,123 @@ const MICROS_PER_DAY: i64 = 86_400_000_000;
 const NANOS_PER_MILLI: i64 = 1_000_000;
 const NANOS_PER_MICRO: i64 = 1_000;
 
+/// Represents a single scan record with metadata
+#[pyclass]
+pub struct ScanRecord {
+    #[pyo3(get)]
+    bucket: TableBucket,
+    #[pyo3(get)]
+    offset: i64,
+    #[pyo3(get)]
+    timestamp: i64,
+    #[pyo3(get)]
+    change_type: ChangeType,
+    /// Store row as a Python dict directly
+    row_dict: Py<pyo3::types::PyDict>,
+}
+
+#[pymethods]
+impl ScanRecord {
+    /// Get the row data as a dictionary
+    #[getter]
+    pub fn row(&self, py: Python) -> Py<pyo3::types::PyDict> {
+        self.row_dict.clone_ref(py)
+    }
+
+    fn __str__(&self) -> String {
+        format!(
+            "ScanRecord(bucket={}, offset={}, timestamp={}, change_type={})",
+            self.bucket.__str__(),
+            self.offset,
+            self.timestamp,
+            self.change_type.short_string()
+        )
+    }
+
+    fn __repr__(&self) -> String {
+        self.__str__()
+    }
+}
+
+impl ScanRecord {
+    /// Create a ScanRecord from core types
+    pub fn from_core(
+        py: Python,
+        bucket: &fcore::metadata::TableBucket,
+        record: &fcore::record::ScanRecord,
+        row_type: &fcore::metadata::RowType,
+    ) -> PyResult<Self> {
+        let fields = row_type.fields();
+        let row = record.row();
+        let dict = pyo3::types::PyDict::new(py);
+
+        for (pos, field) in fields.iter().enumerate() {
+            let value = datum_to_python_value(py, row, pos, field.data_type())?;
+            dict.set_item(field.name(), value)?;
+        }
+
+        Ok(ScanRecord {
+            bucket: TableBucket::from_core(bucket.clone()),
+            offset: record.offset(),
+            timestamp: record.timestamp(),
+            change_type: ChangeType::from_core(*record.change_type()),
+            row_dict: dict.unbind(),
+        })
+    }
+}
+
+/// Represents a batch of records with metadata
+#[pyclass]
+pub struct RecordBatch {
+    batch: Arc<ArrowRecordBatch>,
+    #[pyo3(get)]
+    bucket: TableBucket,
+    #[pyo3(get)]
+    base_offset: i64,
+    #[pyo3(get)]
+    last_offset: i64,
+}
+
+#[pymethods]
+impl RecordBatch {
+    /// Get the Arrow RecordBatch as PyArrow RecordBatch
+    #[getter]
+    pub fn batch(&self, py: Python) -> PyResult<Py<PyAny>> {
+        let pyarrow_batch = self
+            .batch
+            .as_ref()
+            .to_pyarrow(py)
+            .map_err(|e| FlussError::new_err(format!("Failed to convert batch: {e}")))?;
+        Ok(pyarrow_batch.unbind())
+    }
+
+    fn __str__(&self) -> String {
+        format!(
+            "RecordBatch(bucket={}, base_offset={}, last_offset={}, rows={})",
+            self.bucket.__str__(),
+            self.base_offset,
+            self.last_offset,
+            self.batch.num_rows()
+        )
+    }
+
+    fn __repr__(&self) -> String {
+        self.__str__()
+    }
+}
+
+impl RecordBatch {
+    /// Create a RecordBatch from core ScanBatch
+    pub fn from_scan_batch(scan_batch: fcore::record::ScanBatch) -> Self {
+        RecordBatch {
+            bucket: TableBucket::from_core(scan_batch.bucket().clone()),
+            base_offset: scan_batch.base_offset(),
+            last_offset: scan_batch.last_offset(),
+            batch: Arc::new(scan_batch.into_batch()),
+        }
+    }
+}
+
 /// Represents a Fluss table for data operations
 #[pyclass]
 pub struct FlussTable {
@@ -48,14 +166,233 @@ pub struct FlussTable {
     has_primary_key: bool,
 }
 
+/// Builder for creating log scanners with flexible configuration.
+///
+/// Use this builder to configure projection, and in the future, filters
+/// before creating a log scanner.
+#[pyclass]
+pub struct TableScan {
+    connection: Arc<fcore::client::FlussConnection>,
+    metadata: Arc<fcore::client::Metadata>,
+    table_info: fcore::metadata::TableInfo,
+    projection: Option<ProjectionType>,
+}
+
+/// Scanner type for internal use
+enum ScannerType {
+    Record,
+    Batch,
+}
+
+#[pymethods]
+impl TableScan {
+    /// Project to specific columns by their indices.
+    ///
+    /// Args:
+    ///     indices: List of column indices (0-based) to include in the scan.
+    ///
+    /// Returns:
+    ///     Self for method chaining.
+    pub fn project(mut slf: PyRefMut<'_, Self>, indices: Vec<usize>) -> PyRefMut<'_, Self> {
+        slf.projection = Some(ProjectionType::Indices(indices));
+        slf
+    }
+
+    /// Project to specific columns by their names.
+    ///
+    /// Args:
+    ///     names: List of column names to include in the scan.
+    ///
+    /// Returns:
+    ///     Self for method chaining.
+    pub fn project_by_name(mut slf: PyRefMut<'_, Self>, names: Vec<String>) -> PyRefMut<'_, Self> {
+        slf.projection = Some(ProjectionType::Names(names));
+        slf
+    }
+
+    /// Create a record-based log scanner.
+    ///
+    /// Use this scanner with `poll()` to get individual records with metadata
+    /// (offset, timestamp, change_type).
+    ///
+    /// Returns:
+    ///     LogScanner for record-by-record scanning with `poll()`
+    pub fn create_log_scanner<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        self.create_scanner_internal(py, ScannerType::Record)
+    }
+
+    /// Create a batch-based log scanner.
+    ///
+    /// Use this scanner with `poll_arrow()` to get Arrow Tables, or with
+    /// `poll_batches()` to get individual batches with metadata.
+    ///
+    /// Returns:
+    ///     LogScanner for batch-based scanning with `poll_arrow()` or `poll_batches()`
+    pub fn create_batch_scanner<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        self.create_scanner_internal(py, ScannerType::Batch)
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "TableScan(table={}.{})",
+            self.table_info.table_path.database(),
+            self.table_info.table_path.table()
+        )
+    }
+}
+
+impl TableScan {
+    fn create_scanner_internal<'py>(
+        &self,
+        py: Python<'py>,
+        scanner_type: ScannerType,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let conn = self.connection.clone();
+        let metadata = self.metadata.clone();
+        let table_info = self.table_info.clone();
+        let projection = self.projection.clone();
+
+        future_into_py(py, async move {
+            let fluss_table = fcore::client::FlussTable::new(&conn, metadata, table_info.clone());
+
+            let projection_indices = resolve_projection_indices(&projection, &table_info)?;
+            let table_scan = apply_projection(fluss_table.new_scan(), projection)?;
+
+            let admin = conn
+                .get_admin()
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+            let (projected_schema, projected_row_type) =
+                calculate_projected_types(&table_info, projection_indices)?;
+
+            let py_scanner = match scanner_type {
+                ScannerType::Record => {
+                    let rust_scanner = table_scan.create_log_scanner().map_err(|e| {
+                        FlussError::new_err(format!("Failed to create log scanner: {e}"))
+                    })?;
+                    LogScanner::from_log_scanner(
+                        rust_scanner,
+                        admin,
+                        table_info,
+                        projected_schema,
+                        projected_row_type,
+                    )
+                }
+                ScannerType::Batch => {
+                    let rust_scanner =
+                        table_scan.create_record_batch_log_scanner().map_err(|e| {
+                            FlussError::new_err(format!("Failed to create batch scanner: {e}"))
+                        })?;
+                    LogScanner::from_batch_scanner(
+                        rust_scanner,
+                        admin,
+                        table_info,
+                        projected_schema,
+                        projected_row_type,
+                    )
+                }
+            };
+
+            Python::attach(|py| Py::new(py, py_scanner))
+        })
+    }
+}
+
 /// Internal enum to represent different projection types
+#[derive(Clone)]
 enum ProjectionType {
     Indices(Vec<usize>),
     Names(Vec<String>),
 }
 
+/// Resolve projection to column indices
+fn resolve_projection_indices(
+    projection: &Option<ProjectionType>,
+    table_info: &fcore::metadata::TableInfo,
+) -> PyResult<Option<Vec<usize>>> {
+    match projection {
+        Some(ProjectionType::Indices(indices)) => Ok(Some(indices.clone())),
+        Some(ProjectionType::Names(names)) => {
+            let schema = table_info.get_schema();
+            let columns = schema.columns();
+            let mut indices = Vec::with_capacity(names.len());
+            for name in names {
+                let idx = columns
+                    .iter()
+                    .position(|c| c.name() == name)
+                    .ok_or_else(|| FlussError::new_err(format!("Column '{}' not found", name)))?;
+                indices.push(idx);
+            }
+            Ok(Some(indices))
+        }
+        None => Ok(None),
+    }
+}
+
+/// Apply projection to table scan
+fn apply_projection(
+    table_scan: fcore::client::TableScan,
+    projection: Option<ProjectionType>,
+) -> PyResult<fcore::client::TableScan> {
+    match projection {
+        Some(ProjectionType::Indices(indices)) => table_scan
+            .project(&indices)
+            .map_err(|e| FlussError::new_err(format!("Failed to project columns: {e}"))),
+        Some(ProjectionType::Names(names)) => {
+            let column_name_refs: Vec<&str> = names.iter().map(|s| s.as_str()).collect();
+            table_scan
+                .project_by_name(&column_name_refs)
+                .map_err(|e| FlussError::new_err(format!("Failed to project columns: {e}")))
+        }
+        None => Ok(table_scan),
+    }
+}
+
+/// Calculate projected schema and row type from projection indices
+fn calculate_projected_types(
+    table_info: &fcore::metadata::TableInfo,
+    projection_indices: Option<Vec<usize>>,
+) -> PyResult<(SchemaRef, fcore::metadata::RowType)> {
+    let full_schema = to_arrow_schema(table_info.get_row_type())
+        .map_err(|e| FlussError::new_err(format!("Failed to get arrow schema: {e}")))?;
+    let full_row_type = table_info.get_row_type();
+
+    match projection_indices {
+        Some(indices) => {
+            let arrow_fields: Vec<_> = indices
+                .iter()
+                .map(|&i| full_schema.field(i).clone())
+                .collect();
+            let row_fields: Vec<_> = indices
+                .iter()
+                .map(|&i| full_row_type.fields()[i].clone())
+                .collect();
+            Ok((
+                Arc::new(arrow_schema::Schema::new(arrow_fields)),
+                fcore::metadata::RowType::new(row_fields),
+            ))
+        }
+        None => Ok((full_schema, full_row_type.clone())),
+    }
+}
+
 #[pymethods]
 impl FlussTable {
+    /// Create a new table scan builder for configuring and creating log scanners.
+    ///
+    /// Use this method to create scanners with the builder pattern:
+    /// Returns:
+    ///     TableScan builder for configuring the scanner.
+    pub fn new_scan(&self) -> TableScan {
+        TableScan {
+            connection: self.connection.clone(),
+            metadata: self.metadata.clone(),
+            table_info: self.table_info.clone(),
+            projection: None,
+        }
+    }
+
     /// Create a new append writer for the table
     fn new_append_writer<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
         let conn = self.connection.clone();
@@ -79,41 +416,6 @@ impl FlussTable {
         })
     }
 
-    /// Create a new log scanner for the table.
-    ///
-    /// Args:
-    ///     project: Optional list of column indices (0-based) to include in the scan.
-    ///     columns: Optional list of column names to include in the scan.
-    ///
-    /// Returns:
-    ///     LogScanner, optionally with projection applied
-    ///
-    /// Note:
-    ///     Specify only one of 'project' or 'columns'.
-    ///     If neither is specified, all columns are included.
-    ///     Rust side will validate the projection parameters.
-    ///
-    #[pyo3(signature = (project=None, columns=None))]
-    pub fn new_log_scanner<'py>(
-        &self,
-        py: Python<'py>,
-        project: Option<Vec<usize>>,
-        columns: Option<Vec<String>>,
-    ) -> PyResult<Bound<'py, PyAny>> {
-        let projection = match (project, columns) {
-            (Some(_), Some(_)) => {
-                return Err(FlussError::new_err(
-                    "Specify only one of 'project' or 'columns'".to_string(),
-                ));
-            }
-            (Some(indices), None) => Some(ProjectionType::Indices(indices)),
-            (None, Some(names)) => Some(ProjectionType::Names(names)),
-            (None, None) => None,
-        };
-
-        self.create_log_scanner_internal(py, projection)
-    }
-
     /// Get table information
     pub fn get_table_info(&self) -> TableInfo {
         TableInfo::from_core(self.table_info.clone())
@@ -219,55 +521,6 @@ impl FlussTable {
             has_primary_key,
         }
     }
-
-    /// Internal helper to create log scanner with optional projection
-    fn create_log_scanner_internal<'py>(
-        &self,
-        py: Python<'py>,
-        projection: Option<ProjectionType>,
-    ) -> PyResult<Bound<'py, PyAny>> {
-        let conn = self.connection.clone();
-        let metadata = self.metadata.clone();
-        let table_info = self.table_info.clone();
-
-        future_into_py(py, async move {
-            let fluss_table =
-                fcore::client::FlussTable::new(&conn, metadata.clone(), table_info.clone());
-
-            let mut table_scan = fluss_table.new_scan();
-
-            // Apply projection if specified
-            if let Some(proj) = projection {
-                table_scan = match proj {
-                    ProjectionType::Indices(indices) => {
-                        table_scan.project(&indices).map_err(|e| {
-                            FlussError::new_err(format!("Failed to project columns: {e}"))
-                        })?
-                    }
-                    ProjectionType::Names(names) => {
-                        // Convert Vec<String> to Vec<&str> for the API
-                        let column_name_refs: Vec<&str> =
-                            names.iter().map(|s| s.as_str()).collect();
-                        table_scan.project_by_name(&column_name_refs).map_err(|e| {
-                            FlussError::new_err(format!("Failed to project columns: {e}"))
-                        })?
-                    }
-                };
-            }
-
-            let rust_scanner = table_scan
-                .create_record_batch_log_scanner()
-                .map_err(|e| FlussError::new_err(format!("Failed to create log scanner: {e}")))?;
-
-            let admin = conn
-                .get_admin()
-                .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
-
-            let py_scanner = LogScanner::from_core(rust_scanner, admin, table_info.clone());
-            Python::attach(|py| Py::new(py, py_scanner))
-        })
-    }
 }
 
 /// Writer for appending data to a Fluss table
@@ -295,7 +548,7 @@ impl AppendWriter {
     pub fn write_arrow_batch(&self, py: Python, batch: Py<PyAny>) -> PyResult<()> {
         // This shares the underlying Arrow buffers without copying data
         let batch_bound = batch.bind(py);
-        let rust_batch: RecordBatch = FromPyArrow::from_pyarrow_bound(batch_bound)
+        let rust_batch: ArrowRecordBatch = FromPyArrow::from_pyarrow_bound(batch_bound)
             .map_err(|e| FlussError::new_err(format!("Failed to convert RecordBatch: {e}")))?;
 
         let inner = self.inner.clone();
@@ -1303,12 +1556,23 @@ fn get_type_name(value: &Bound<PyAny>) -> String {
         .unwrap_or_else(|_| "unknown".to_string())
 }
 
-/// Scanner for reading log data from a Fluss table
+/// Scanner for reading log data from a Fluss table.
+///
+/// This scanner supports two modes:
+/// - Record-based scanning via `poll()` - returns individual records with metadata
+/// - Batch-based scanning via `poll_arrow()` / `poll_batches()` - returns Arrow batches
 #[pyclass]
 pub struct LogScanner {
-    inner: fcore::client::RecordBatchLogScanner,
+    /// Record-based scanner for poll()
+    inner: Option<fcore::client::LogScanner>,
+    /// Batch-based scanner for poll_arrow/poll_batches
+    inner_batch: Option<fcore::client::RecordBatchLogScanner>,
     admin: fcore::client::FlussAdmin,
     table_info: fcore::metadata::TableInfo,
+    /// The projected Arrow schema to use for empty table creation
+    projected_schema: SchemaRef,
+    /// The projected row type to use for record-based scanning
+    projected_row_type: fcore::metadata::RowType,
     #[allow(dead_code)]
     start_timestamp: Option<i64>,
     #[allow(dead_code)]
@@ -1338,19 +1602,40 @@ impl LogScanner {
         for bucket_id in 0..num_buckets {
             let start_offset = EARLIEST_OFFSET;
 
-            TOKIO_RUNTIME.block_on(async {
-                self.inner
-                    .subscribe(bucket_id, start_offset)
-                    .await
-                    .map_err(|e| FlussError::new_err(e.to_string()))
-            })?;
+            // Subscribe to the appropriate scanner
+            if let Some(ref inner) = self.inner {
+                TOKIO_RUNTIME.block_on(async {
+                    inner
+                        .subscribe(bucket_id, start_offset)
+                        .await
+                        .map_err(|e| FlussError::new_err(e.to_string()))
+                })?;
+            } else if let Some(ref inner_batch) = self.inner_batch {
+                TOKIO_RUNTIME.block_on(async {
+                    inner_batch
+                        .subscribe(bucket_id, start_offset)
+                        .await
+                        .map_err(|e| FlussError::new_err(e.to_string()))
+                })?;
+            } else {
+                return Err(FlussError::new_err("No scanner available"));
+            }
         }
 
         Ok(())
     }
 
     /// Convert all data to Arrow Table
+    ///
+    /// Note: Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
     fn to_arrow(&self, py: Python) -> PyResult<Py<PyAny>> {
+        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
+            FlussError::new_err(
+                "Batch-based scanner not available. Use new_scan().create_batch_scanner() to create a scanner \
+                 that supports to_arrow().",
+            )
+        })?;
+
         let mut all_batches = Vec::new();
 
         let num_buckets = self.table_info.get_num_buckets();
@@ -1378,7 +1663,7 @@ impl LogScanner {
             let scan_batches = py
                 .detach(|| {
                     TOKIO_RUNTIME
-                        .block_on(async { self.inner.poll(Duration::from_millis(500)).await })
+                        .block_on(async { inner_batch.poll(Duration::from_millis(500)).await })
                 })
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
 
@@ -1439,18 +1724,114 @@ impl LogScanner {
         Ok(df)
     }
 
-    /// Poll for new records with the specified timeout
+    /// Poll for individual records with metadata.
     ///
     /// Args:
     ///     timeout_ms: Timeout in milliseconds to wait for records
     ///
     /// Returns:
-    ///     PyArrow Table containing the polled records
+    ///     List of ScanRecord objects, each containing bucket, offset, timestamp,
+    ///     change_type, and row data as a dictionary.
+    ///
+    /// Note:
+    ///     - Requires a record-based scanner (created with new_scan().create_log_scanner())
+    ///     - Returns an empty list if no records are available
+    ///     - When timeout expires, returns an empty list (NOT an error)
+    fn poll(&self, py: Python, timeout_ms: i64) -> PyResult<Vec<ScanRecord>> {
+        let inner = self.inner.as_ref().ok_or_else(|| {
+            FlussError::new_err(
+                "Record-based scanner not available. Use new_scan().create_log_scanner() to create a scanner \
+                 that supports poll().",
+            )
+        })?;
+
+        if timeout_ms < 0 {
+            return Err(FlussError::new_err(format!(
+                "timeout_ms must be non-negative, got: {timeout_ms}"
+            )));
+        }
+
+        let timeout = Duration::from_millis(timeout_ms as u64);
+        let scan_records = py
+            .detach(|| TOKIO_RUNTIME.block_on(async { inner.poll(timeout).await }))
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+        // Convert ScanRecords to Python ScanRecord list
+        // Use projected_row_type to handle column projection correctly
+        let row_type = &self.projected_row_type;
+        let mut result = Vec::new();
+
+        for (bucket, records) in scan_records.into_records_by_buckets() {
+            for record in records {
+                let scan_record = ScanRecord::from_core(py, &bucket, &record, row_type)?;
+                result.push(scan_record);
+            }
+        }
+
+        Ok(result)
+    }
+
+    /// Poll for batches with metadata.
+    ///
+    /// Args:
+    ///     timeout_ms: Timeout in milliseconds to wait for batches
+    ///
+    /// Returns:
+    ///     List of RecordBatch objects, each containing the Arrow batch along with
+    ///     bucket, base_offset, and last_offset metadata.
     ///
     /// Note:
+    ///     - Requires a batch-based scanner (created with new_scan().create_batch_scanner())
+    ///     - Returns an empty list if no batches are available
+    ///     - When timeout expires, returns an empty list (NOT an error)
+    fn poll_batches(&self, py: Python, timeout_ms: i64) -> PyResult<Vec<RecordBatch>> {
+        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
+            FlussError::new_err(
+                "Batch-based scanner not available. Use new_scan().create_batch_scanner() to create a scanner \
+                 that supports poll_batches().",
+            )
+        })?;
+
+        if timeout_ms < 0 {
+            return Err(FlussError::new_err(format!(
+                "timeout_ms must be non-negative, got: {timeout_ms}"
+            )));
+        }
+
+        let timeout = Duration::from_millis(timeout_ms as u64);
+        let scan_batches = py
+            .detach(|| TOKIO_RUNTIME.block_on(async { inner_batch.poll(timeout).await }))
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+        // Convert ScanBatch to RecordBatch with metadata
+        let result = scan_batches
+            .into_iter()
+            .map(RecordBatch::from_scan_batch)
+            .collect();
+
+        Ok(result)
+    }
+
+    /// Poll for new records as an Arrow Table.
+    ///
+    /// Args:
+    ///     timeout_ms: Timeout in milliseconds to wait for records
+    ///
+    /// Returns:
+    ///     PyArrow Table containing the polled records (batches merged)
+    ///
+    /// Note:
+    ///     - Requires a batch-based scanner (created with new_scan().create_batch_scanner())
     ///     - Returns an empty table (with correct schema) if no records are available
     ///     - When timeout expires, returns an empty table (NOT an error)
-    fn poll(&self, py: Python, timeout_ms: i64) -> PyResult<Py<PyAny>> {
+    fn poll_arrow(&self, py: Python, timeout_ms: i64) -> PyResult<Py<PyAny>> {
+        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
+            FlussError::new_err(
+                "Batch-based scanner not available. Use new_scan().create_batch_scanner() to create a scanner \
+                 that supports poll_arrow().",
+            )
+        })?;
+
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
                 "timeout_ms must be non-negative, got: {timeout_ms}"
@@ -1459,7 +1840,7 @@ impl LogScanner {
 
         let timeout = Duration::from_millis(timeout_ms as u64);
         let scan_batches = py
-            .detach(|| TOKIO_RUNTIME.block_on(async { self.inner.poll(timeout).await }))
+            .detach(|| TOKIO_RUNTIME.block_on(async { inner_batch.poll(timeout).await }))
             .map_err(|e| FlussError::new_err(e.to_string()))?;
 
         // Convert ScanBatch to Arrow batches
@@ -1475,11 +1856,11 @@ impl LogScanner {
         Utils::combine_batches_to_table(py, arrow_batches)
     }
 
-    /// Create an empty PyArrow table with the correct schema
+    /// Create an empty PyArrow table with the correct (projected) schema
     fn create_empty_table(&self, py: Python) -> PyResult<Py<PyAny>> {
-        let arrow_schema = to_arrow_schema(self.table_info.get_row_type())
-            .map_err(|e| FlussError::new_err(format!("Failed to get arrow schema: {e}")))?;
-        let py_schema = arrow_schema
+        // Use the projected schema stored in the scanner
+        let py_schema = self
+            .projected_schema
             .as_ref()
             .to_pyarrow(py)
             .map_err(|e| FlussError::new_err(format!("Failed to convert schema: {e}")))?;
@@ -1498,16 +1879,41 @@ impl LogScanner {
 }
 
 impl LogScanner {
-    /// Create LogScanner from core RecordBatchLogScanner
-    pub fn from_core(
-        inner_scanner: fcore::client::RecordBatchLogScanner,
+    /// Create LogScanner for record-based scanning
+    pub fn from_log_scanner(
+        inner_scanner: fcore::client::LogScanner,
+        admin: fcore::client::FlussAdmin,
+        table_info: fcore::metadata::TableInfo,
+        projected_schema: SchemaRef,
+        projected_row_type: fcore::metadata::RowType,
+    ) -> Self {
+        Self {
+            inner: Some(inner_scanner),
+            inner_batch: None,
+            admin,
+            table_info,
+            projected_schema,
+            projected_row_type,
+            start_timestamp: None,
+            end_timestamp: None,
+        }
+    }
+
+    /// Create LogScanner for batch-based scanning
+    pub fn from_batch_scanner(
+        inner_batch_scanner: fcore::client::RecordBatchLogScanner,
         admin: fcore::client::FlussAdmin,
         table_info: fcore::metadata::TableInfo,
+        projected_schema: SchemaRef,
+        projected_row_type: fcore::metadata::RowType,
     ) -> Self {
         Self {
-            inner: inner_scanner,
+            inner: None,
+            inner_batch: Some(inner_batch_scanner),
             admin,
             table_info,
+            projected_schema,
+            projected_row_type,
             start_timestamp: None,
             end_timestamp: None,
         }
diff --git a/fluss-rust/bindings/python/src/utils.rs b/fluss-rust/bindings/python/src/utils.rs
index ee32c9c133..c92f1b9fd9 100644
--- a/fluss-rust/bindings/python/src/utils.rs
+++ b/fluss-rust/bindings/python/src/utils.rs
@@ -203,20 +203,15 @@ impl Utils {
         py: Python,
         batches: Vec<Arc<arrow::record_batch::RecordBatch>>,
     ) -> PyResult<Py<PyAny>> {
-        use arrow_array::RecordBatch as ArrowArrayRecordBatch;
-
         let py_batches: Result<Vec<Py<PyAny>>, _> = batches
             .iter()
             .map(|batch| {
-                ArrowArrayRecordBatch::try_new(batch.schema().clone(), batch.columns().to_vec())
-                    .map_err(|e| FlussError::new_err(format!("Failed to convert RecordBatch: {e}")))
-                    .and_then(|b| {
-                        ToPyArrow::to_pyarrow(&b, py)
-                            .map(|x| x.into())
-                            .map_err(|e| {
-                                FlussError::new_err(format!("Failed to convert to PyObject: {e}"))
-                            })
-                    })
+                // Just dereference the Arc - no need to recreate the batch
+                batch
+                    .as_ref()
+                    .to_pyarrow(py)
+                    .map(|x| x.into())
+                    .map_err(|e| FlussError::new_err(format!("Failed to convert to PyObject: {e}")))
             })
             .collect();
 

From 63683f5d565d434829bff949c69375d9783f4572 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Thu, 5 Feb 2026 22:29:32 +0000
Subject: [PATCH 110/287] chore: Change upsert and delete to use read only self
 reference by using mutex to guard mutable encoders (#247)

---
 .../crates/examples/src/example_kv_table.rs   |  2 +-
 .../src/example_partitioned_kv_table.rs       |  2 +-
 .../crates/fluss/src/client/table/upsert.rs   | 58 +++++++++++++------
 .../fluss/tests/integration/kv_table.rs       | 12 ++--
 4 files changed, 48 insertions(+), 26 deletions(-)

diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 042e38413d..2bbcc74b68 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -54,7 +54,7 @@ pub async fn main() -> Result<()> {
 
     let table = conn.get_table(&table_path).await?;
     let table_upsert = table.new_upsert()?;
-    let mut upsert_writer = table_upsert.create_writer()?;
+    let upsert_writer = table_upsert.create_writer()?;
 
     println!("\n=== Upserting ===");
     for (id, name, age) in [(1, "Verso", 32i64), (2, "Noco", 25), (3, "Esquie", 35)] {
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index d1b6814cbd..884869e168 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -61,7 +61,7 @@ pub async fn main() -> Result<()> {
 
     let table = conn.get_table(&table_path).await?;
     let table_upsert = table.new_upsert()?;
-    let mut upsert_writer = table_upsert.create_writer()?;
+    let upsert_writer = table_upsert.create_writer()?;
 
     println!("\n=== Upserting ===");
     for (id, region, zone, score) in [
diff --git a/fluss-rust/crates/fluss/src/client/table/upsert.rs b/fluss-rust/crates/fluss/src/client/table/upsert.rs
index bb6c651075..92f6a20c85 100644
--- a/fluss-rust/crates/fluss/src/client/table/upsert.rs
+++ b/fluss-rust/crates/fluss/src/client/table/upsert.rs
@@ -16,13 +16,13 @@
 // under the License.
 
 use crate::client::{RowBytes, WriteFormat, WriteRecord, WriterClient};
-use crate::error::Error::IllegalArgument;
+use crate::error::Error::{IllegalArgument, UnexpectedError};
 use crate::error::Result;
 use crate::metadata::{RowType, TableInfo, TablePath};
 use crate::row::InternalRow;
 use crate::row::encode::{KeyEncoder, KeyEncoderFactory, RowEncoder, RowEncoderFactory};
 use crate::row::field_getter::FieldGetter;
-use std::sync::Arc;
+use std::sync::{Arc, Mutex};
 
 use crate::client::table::partition_getter::{PartitionGetter, get_physical_path};
 use bitvec::prelude::bitvec;
@@ -111,12 +111,12 @@ pub struct UpsertWriter {
     table_path: Arc<TablePath>,
     writer_client: Arc<WriterClient>,
     partition_field_getter: Option<PartitionGetter>,
-    primary_key_encoder: Box<dyn KeyEncoder>,
+    primary_key_encoder: Mutex<Box<dyn KeyEncoder>>,
     target_columns: Option<Arc<Vec<usize>>>,
     // Use primary key encoder as bucket key encoder when None
-    bucket_key_encoder: Option<Box<dyn KeyEncoder>>,
+    bucket_key_encoder: Option<Mutex<Box<dyn KeyEncoder>>>,
     write_format: WriteFormat,
-    row_encoder: Box<dyn RowEncoder>,
+    row_encoder: Mutex<Box<dyn RowEncoder>>,
     field_getters: Box<[FieldGetter]>,
     table_info: Arc<TableInfo>,
 }
@@ -173,11 +173,14 @@ impl UpsertWriterFactory {
             table_path,
             partition_field_getter,
             writer_client,
-            primary_key_encoder,
+            primary_key_encoder: Mutex::new(primary_key_encoder),
             target_columns: partial_update_columns,
-            bucket_key_encoder,
+            bucket_key_encoder: bucket_key_encoder.map(Mutex::new),
             write_format,
-            row_encoder: Box::new(RowEncoderFactory::create(kv_format, row_type.clone())?),
+            row_encoder: Mutex::new(Box::new(RowEncoderFactory::create(
+                kv_format,
+                row_type.clone(),
+            )?)),
             field_getters,
             table_info: table_info.clone(),
         })
@@ -294,22 +297,41 @@ impl UpsertWriter {
         Ok(())
     }
 
-    fn get_keys(&mut self, row: &dyn InternalRow) -> Result<(Bytes, Option<Bytes>)> {
-        let key = self.primary_key_encoder.encode_key(row)?;
-        let bucket_key = match &mut self.bucket_key_encoder {
-            Some(bucket_key_encoder) => Some(bucket_key_encoder.encode_key(row)?),
+    fn get_keys(&self, row: &dyn InternalRow) -> Result<(Bytes, Option<Bytes>)> {
+        let key = self
+            .primary_key_encoder
+            .lock()
+            .map_err(|e| UnexpectedError {
+                message: format!("primary_key_encoder lock poisoned: {e}"),
+                source: None,
+            })?
+            .encode_key(row)?;
+        let bucket_key = match &self.bucket_key_encoder {
+            Some(encoder) => Some(
+                encoder
+                    .lock()
+                    .map_err(|e| UnexpectedError {
+                        message: format!("bucket_key_encoder lock poisoned: {e}"),
+                        source: None,
+                    })?
+                    .encode_key(row)?,
+            ),
             None => Some(key.clone()),
         };
         Ok((key, bucket_key))
     }
 
-    fn encode_row<R: InternalRow>(&mut self, row: &R) -> Result<Bytes> {
-        self.row_encoder.start_new_row()?;
+    fn encode_row<R: InternalRow>(&self, row: &R) -> Result<Bytes> {
+        let mut encoder = self.row_encoder.lock().map_err(|e| UnexpectedError {
+            message: format!("row_encoder lock poisoned: {e}"),
+            source: None,
+        })?;
+        encoder.start_new_row()?;
         for (pos, field_getter) in self.field_getters.iter().enumerate() {
             let datum = field_getter.get_field(row);
-            self.row_encoder.encode_field(pos, datum)?;
+            encoder.encode_field(pos, datum)?;
         }
-        self.row_encoder.finish_row()
+        encoder.finish_row()
     }
 
     /// Flush data written that have not yet been sent to the server, forcing the client to send the
@@ -328,7 +350,7 @@ impl UpsertWriter {
     ///
     /// # Returns
     /// Ok(UpsertResult) when completed normally
-    pub async fn upsert<R: InternalRow>(&mut self, row: &R) -> Result<UpsertResult> {
+    pub async fn upsert<R: InternalRow>(&self, row: &R) -> Result<UpsertResult> {
         self.check_field_count(row)?;
 
         let (key, bucket_key) = self.get_keys(row)?;
@@ -367,7 +389,7 @@ impl UpsertWriter {
     ///
     /// # Returns
     /// Ok(DeleteResult) when completed normally
-    pub async fn delete<R: InternalRow>(&mut self, row: &R) -> Result<DeleteResult> {
+    pub async fn delete<R: InternalRow>(&self, row: &R) -> Result<DeleteResult> {
         self.check_field_count(row)?;
 
         let (key, bucket_key) = self.get_keys(row)?;
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index c419ed900b..87d90b0a9c 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -89,7 +89,7 @@ mod kv_table_test {
             .expect("Failed to get table");
 
         let table_upsert = table.new_upsert().expect("Failed to create upsert");
-        let mut upsert_writer = table_upsert
+        let upsert_writer = table_upsert
             .create_writer()
             .expect("Failed to create writer");
 
@@ -246,7 +246,7 @@ mod kv_table_test {
             .expect("Failed to get table");
 
         let table_upsert = table.new_upsert().expect("Failed to create upsert");
-        let mut upsert_writer = table_upsert
+        let upsert_writer = table_upsert
             .create_writer()
             .expect("Failed to create writer");
 
@@ -360,7 +360,7 @@ mod kv_table_test {
 
         // Insert initial record with all columns
         let table_upsert = table.new_upsert().expect("Failed to create upsert");
-        let mut upsert_writer = table_upsert
+        let upsert_writer = table_upsert
             .create_writer()
             .expect("Failed to create writer");
 
@@ -399,7 +399,7 @@ mod kv_table_test {
         let partial_upsert = table_upsert
             .partial_update_with_column_names(&["id", "score"])
             .expect("Failed to create TableUpsert with partial update");
-        let mut partial_writer = partial_upsert
+        let partial_writer = partial_upsert
             .create_writer()
             .expect("Failed to create UpsertWriter with partial write");
 
@@ -478,7 +478,7 @@ mod kv_table_test {
 
         let table_upsert = table.new_upsert().expect("Failed to create upsert");
 
-        let mut upsert_writer = table_upsert
+        let upsert_writer = table_upsert
             .create_writer()
             .expect("Failed to create writer");
 
@@ -659,7 +659,7 @@ mod kv_table_test {
             .expect("Failed to get table");
 
         let table_upsert = table.new_upsert().expect("Failed to create upsert");
-        let mut upsert_writer = table_upsert
+        let upsert_writer = table_upsert
             .create_writer()
             .expect("Failed to create writer");
 

From 60b86d72e1182970ef06ac1c913a64dea71ffca2 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Thu, 5 Feb 2026 23:09:36 +0000
Subject: [PATCH 111/287] chore: refactor to builder pattern to create log
 scanner for CPP (#249)

---
 fluss-rust/bindings/cpp/examples/example.cpp | 18 +++---
 fluss-rust/bindings/cpp/include/fluss.hpp    | 28 +++++++--
 fluss-rust/bindings/cpp/src/table.cpp        | 66 +++++++++-----------
 3 files changed, 61 insertions(+), 51 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 45f7f9ea9c..f35f37eef1 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -104,7 +104,7 @@ int main() {
 
     // 6) Scan
     fluss::LogScanner scanner;
-    check("new_log_scanner", table.NewLogScanner(scanner));
+    check("new_log_scanner", table.NewScan().CreateLogScanner(scanner));
 
     auto info = table.GetTableInfo();
     int buckets = info.num_buckets;
@@ -126,8 +126,8 @@ int main() {
     // 7) Project only id (0) and name (1) columns
     std::vector<size_t> projected_columns = {0, 1};
     fluss::LogScanner projected_scanner;
-    check("new_log_scanner_with_projection", 
-          table.NewLogScannerWithProjection(projected_columns, projected_scanner));
+    check("new_log_scanner_with_projection",
+          table.NewScan().Project(projected_columns).CreateLogScanner(projected_scanner));
     
     for (int b = 0; b < buckets; ++b) {
         check("subscribe_projected", projected_scanner.Subscribe(b, 0));
@@ -226,7 +226,7 @@ int main() {
     // 8.4) Use batch subscribe with offsets from list_offsets
     std::cout << "\n=== Batch Subscribe Example ===" << std::endl;
     fluss::LogScanner batch_scanner;
-    check("new_log_scanner_for_batch", table.NewLogScanner(batch_scanner));
+    check("new_log_scanner_for_batch", table.NewScan().CreateLogScanner(batch_scanner));
     
     std::vector<fluss::BucketSubscription> subscriptions;
     for (const auto& [bucket_id, offset] : earliest_offsets) {
@@ -255,9 +255,9 @@ int main() {
 
     // 9) Test the new Arrow record batch polling functionality
     std::cout << "\n=== Testing Arrow Record Batch Polling ===" << std::endl;
-    
+
     fluss::LogScanner arrow_scanner;
-    check("new_record_batch_log_scanner", table.NewRecordBatchLogScanner(arrow_scanner));
+    check("new_record_batch_log_scanner", table.NewScan().CreateRecordBatchScanner(arrow_scanner));
     
     // Subscribe to all buckets starting from offset 0
     for (int b = 0; b < buckets; ++b) {
@@ -279,10 +279,10 @@ int main() {
     
     // 10) Test the new Arrow record batch polling with projection
     std::cout << "\n=== Testing Arrow Record Batch Polling with Projection ===" << std::endl;
-    
+
     fluss::LogScanner projected_arrow_scanner;
-    check("new_record_batch_log_scanner_with_projection", 
-          table.NewRecordBatchLogScannerWithProjection(projected_columns, projected_arrow_scanner));
+    check("new_record_batch_log_scanner_with_projection",
+          table.NewScan().Project(projected_columns).CreateRecordBatchScanner(projected_arrow_scanner));
     
     // Subscribe to all buckets starting from offset 0
     for (int b = 0; b < buckets; ++b) {
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index d35ece2cf5..901b90cae4 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -407,6 +407,7 @@ class AppendWriter;
 class LogScanner;
 class Admin;
 class Table;
+class TableScan;
 
 class Connection {
 public:
@@ -490,10 +491,7 @@ class Table {
     bool Available() const;
 
     Result NewAppendWriter(AppendWriter& out);
-    Result NewLogScanner(LogScanner& out);
-    Result NewLogScannerWithProjection(const std::vector<size_t>& column_indices, LogScanner& out);
-    Result NewRecordBatchLogScanner(LogScanner& out);
-    Result NewRecordBatchLogScannerWithProjection(const std::vector<size_t>& column_indices, LogScanner& out);
+    TableScan NewScan();
 
     TableInfo GetTableInfo() const;
     TablePath GetTablePath() const;
@@ -501,12 +499,33 @@ class Table {
 
 private:
     friend class Connection;
+    friend class TableScan;
     Table(ffi::Table* table) noexcept;
 
     void Destroy() noexcept;
     ffi::Table* table_{nullptr};
 };
 
+class TableScan {
+public:
+    TableScan(const TableScan&) = delete;
+    TableScan& operator=(const TableScan&) = delete;
+    TableScan(TableScan&&) noexcept = default;
+    TableScan& operator=(TableScan&&) noexcept = default;
+
+    TableScan& Project(std::vector<size_t> column_indices);
+
+    Result CreateLogScanner(LogScanner& out);
+    Result CreateRecordBatchScanner(LogScanner& out);
+
+private:
+    friend class Table;
+    explicit TableScan(ffi::Table* table) noexcept;
+
+    ffi::Table* table_{nullptr};
+    std::vector<size_t> projection_;
+};
+
 class AppendWriter {
 public:
     AppendWriter() noexcept;
@@ -550,6 +569,7 @@ class LogScanner {
 
 private:
     friend class Table;
+    friend class TableScan;
     LogScanner(ffi::LogScanner* scanner) noexcept;
 
     void Destroy() noexcept;
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index b327dbacd8..f9437908e3 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -71,47 +71,33 @@ Result Table::NewAppendWriter(AppendWriter& out) {
     }
 }
 
-Result Table::NewLogScanner(LogScanner& out) {
-    if (!Available()) {
-        return utils::make_error(1, "Table not available");
-    }
-
-    try {
-        out.scanner_ = table_->new_log_scanner();
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
-    } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
-    }
+TableScan Table::NewScan() {
+    return TableScan(table_);
 }
 
-Result Table::NewLogScannerWithProjection(const std::vector<size_t>& column_indices, LogScanner& out) {
-    if (!Available()) {
-        return utils::make_error(1, "Table not available");
-    }
+// TableScan implementation
+TableScan::TableScan(ffi::Table* table) noexcept : table_(table) {}
 
-    try {
-        rust::Vec<size_t> rust_indices;
-        for (size_t idx : column_indices) {
-            rust_indices.push_back(idx);
-        }
-        out.scanner_ = table_->new_log_scanner_with_projection(std::move(rust_indices));
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
-    } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
-    }
+TableScan& TableScan::Project(std::vector<size_t> column_indices) {
+    projection_ = std::move(column_indices);
+    return *this;
 }
 
-Result Table::NewRecordBatchLogScanner(LogScanner& out) {
-    if (!Available()) {
+Result TableScan::CreateLogScanner(LogScanner& out) {
+    if (table_ == nullptr) {
         return utils::make_error(1, "Table not available");
     }
 
     try {
-        out.scanner_ = table_->new_record_batch_log_scanner();
+        if (projection_.empty()) {
+            out.scanner_ = table_->new_log_scanner();
+        } else {
+            rust::Vec<size_t> rust_indices;
+            for (size_t idx : projection_) {
+                rust_indices.push_back(idx);
+            }
+            out.scanner_ = table_->new_log_scanner_with_projection(std::move(rust_indices));
+        }
         return utils::make_ok();
     } catch (const rust::Error& e) {
         return utils::make_error(1, e.what());
@@ -120,17 +106,21 @@ Result Table::NewRecordBatchLogScanner(LogScanner& out) {
     }
 }
 
-Result Table::NewRecordBatchLogScannerWithProjection(const std::vector<size_t>& column_indices, LogScanner& out) {
-    if (!Available()) {
+Result TableScan::CreateRecordBatchScanner(LogScanner& out) {
+    if (table_ == nullptr) {
         return utils::make_error(1, "Table not available");
     }
 
     try {
-        rust::Vec<size_t> rust_indices;
-        for (size_t idx : column_indices) {
-            rust_indices.push_back(idx);
+        if (projection_.empty()) {
+            out.scanner_ = table_->new_record_batch_log_scanner();
+        } else {
+            rust::Vec<size_t> rust_indices;
+            for (size_t idx : projection_) {
+                rust_indices.push_back(idx);
+            }
+            out.scanner_ = table_->new_record_batch_log_scanner_with_projection(std::move(rust_indices));
         }
-        out.scanner_ = table_->new_record_batch_log_scanner_with_projection(std::move(rust_indices));
         return utils::make_ok();
     } catch (const rust::Error& e) {
         return utils::make_error(1, e.what());

From 4ed23ff72c628a70cee3a7dc2291fac37bc69406 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 6 Feb 2026 07:09:59 +0800
Subject: [PATCH 112/287] chore: rename subscribe_batch to subscribe_buckets
 (#255)

---
 fluss-rust/bindings/cpp/examples/example.cpp         |  2 +-
 fluss-rust/bindings/cpp/src/lib.rs                   |  8 ++++----
 fluss-rust/bindings/cpp/src/table.cpp                |  2 +-
 fluss-rust/crates/fluss/src/client/table/scanner.rs  | 12 ++++++------
 .../crates/fluss/tests/integration/log_table.rs      |  2 +-
 5 files changed, 13 insertions(+), 13 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index f35f37eef1..7022cad1e6 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -235,7 +235,7 @@ int main() {
                   << ", offset=" << offset << std::endl;
     }
     
-    check("subscribe_batch", batch_scanner.Subscribe(subscriptions));
+    check("subscribe_buckets", batch_scanner.Subscribe(subscriptions));
     std::cout << "Batch subscribed to " << subscriptions.size() << " buckets" << std::endl;
     
     // 8.5) Poll and verify bucket_id in records
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index ab02c8d072..b8348654dd 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -245,7 +245,7 @@ mod ffi {
         // LogScanner
         unsafe fn delete_log_scanner(scanner: *mut LogScanner);
         fn subscribe(self: &LogScanner, bucket_id: i32, start_offset: i64) -> FfiResult;
-        fn subscribe_batch(
+        fn subscribe_buckets(
             self: &LogScanner,
             subscriptions: Vec<FfiBucketSubscription>,
         ) -> FfiResult;
@@ -789,7 +789,7 @@ impl LogScanner {
         }
     }
 
-    fn subscribe_batch(&self, subscriptions: Vec<ffi::FfiBucketSubscription>) -> ffi::FfiResult {
+    fn subscribe_buckets(&self, subscriptions: Vec<ffi::FfiBucketSubscription>) -> ffi::FfiResult {
         use std::collections::HashMap;
         let mut bucket_offsets = HashMap::new();
         for sub in subscriptions {
@@ -797,7 +797,7 @@ impl LogScanner {
         }
 
         if let Some(ref inner) = self.inner {
-            let result = RUNTIME.block_on(async { inner.subscribe_batch(&bucket_offsets).await });
+            let result = RUNTIME.block_on(async { inner.subscribe_buckets(&bucket_offsets).await });
 
             match result {
                 Ok(_) => ok_result(),
@@ -805,7 +805,7 @@ impl LogScanner {
             }
         } else if let Some(ref inner_batch) = self.inner_batch {
             let result =
-                RUNTIME.block_on(async { inner_batch.subscribe_batch(&bucket_offsets).await });
+                RUNTIME.block_on(async { inner_batch.subscribe_buckets(&bucket_offsets).await });
 
             match result {
                 Ok(_) => ok_result(),
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index f9437908e3..ab26038911 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -251,7 +251,7 @@ Result LogScanner::Subscribe(const std::vector<BucketSubscription>& bucket_offse
         rust_subs.push_back(ffi_sub);
     }
 
-    auto ffi_result = scanner_->subscribe_batch(std::move(rust_subs));
+    auto ffi_result = scanner_->subscribe_buckets(std::move(rust_subs));
     return utils::from_ffi_result(ffi_result);
 }
 
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index aa9fca4f8a..ef68fb4dd6 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -357,11 +357,11 @@ impl LogScannerInner {
         Ok(())
     }
 
-    async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
+    async fn subscribe_buckets(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
         if self.is_partitioned_table {
             return Err(Error::UnsupportedOperation {
                 message:
-                    "The table is a partitioned table, subscribe_batch is not supported currently."
+                    "The table is a partitioned table, subscribe_buckets is not supported currently."
                         .to_string(),
             });
         }
@@ -473,8 +473,8 @@ impl LogScanner {
         self.inner.subscribe(bucket, offset).await
     }
 
-    pub async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
-        self.inner.subscribe_batch(bucket_offsets).await
+    pub async fn subscribe_buckets(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
+        self.inner.subscribe_buckets(bucket_offsets).await
     }
 
     pub async fn subscribe_partition(
@@ -500,8 +500,8 @@ impl RecordBatchLogScanner {
         self.inner.subscribe(bucket, offset).await
     }
 
-    pub async fn subscribe_batch(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
-        self.inner.subscribe_batch(bucket_offsets).await
+    pub async fn subscribe_buckets(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
+        self.inner.subscribe_buckets(bucket_offsets).await
     }
 
     pub async fn subscribe_partition(
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index cbfcbe58b8..3f7dd6e222 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -426,7 +426,7 @@ mod table_test {
         let mut bucket_offsets = HashMap::new();
         bucket_offsets.insert(0, 0);
         log_scanner
-            .subscribe_batch(&bucket_offsets)
+            .subscribe_buckets(&bucket_offsets)
             .await
             .expect("Failed to subscribe");
 

From b4836474b00499f0e08402e3a59df87762a48778 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Thu, 5 Feb 2026 23:27:55 +0000
Subject: [PATCH 113/287] feat: Support drop_table, partitions and offsets
 methods in python bindings (#150)

---
 fluss-rust/bindings/python/example/example.py | 202 +++++++-
 fluss-rust/bindings/python/fluss/__init__.pyi | 127 ++++-
 fluss-rust/bindings/python/src/admin.rs       | 253 +++++++++-
 fluss-rust/bindings/python/src/lib.rs         |  22 +
 fluss-rust/bindings/python/src/table.rs       | 464 +++++++++++++-----
 .../crates/fluss/src/client/table/scanner.rs  |  20 +
 6 files changed, 924 insertions(+), 164 deletions(-)

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 9cb8f4334e..8735038aa5 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -87,6 +87,19 @@ async def main():
     except Exception as e:
         print(f"Failed to get table info: {e}")
 
+    # Demo: List offsets
+    print("\n--- Testing list_offsets() ---")
+    try:
+        # Query latest offsets using OffsetType constant (recommended for type safety)
+        offsets = await admin.list_offsets(
+            table_path,
+            bucket_ids=[0],
+            offset_type=fluss.OffsetType.LATEST
+        )
+        print(f"Latest offsets for table (before writes): {offsets}")
+    except Exception as e:
+        print(f"Failed to list offsets: {e}")
+
     # Get the table instance
     table = await conn.get_table(table_path)
     print(f"Got table: {table}")
@@ -96,7 +109,7 @@ async def main():
     print(f"Created append writer: {append_writer}")
 
     try:
-        # Test 1: Write PyArrow Table
+        # Demo: Write PyArrow Table
         print("\n--- Testing PyArrow Table write ---")
         pa_table = pa.Table.from_arrays(
             [
@@ -139,7 +152,7 @@ async def main():
         append_writer.write_arrow(pa_table)
         print("Successfully wrote PyArrow Table")
 
-        # Test 2: Write PyArrow RecordBatch
+        # Demo: Write PyArrow RecordBatch
         print("\n--- Testing PyArrow RecordBatch write ---")
         pa_record_batch = pa.RecordBatch.from_arrays(
             [
@@ -202,7 +215,7 @@ async def main():
         )
         print("Successfully appended row (list with Date, Time, Timestamp, Decimal)")
 
-        # Test 4: Write Pandas DataFrame
+        # Demo: Write Pandas DataFrame
         print("\n--- Testing Pandas DataFrame write ---")
         df = pd.DataFrame(
             {
@@ -232,6 +245,19 @@ async def main():
         append_writer.flush()
         print("Successfully flushed data")
 
+        # Demo: Check offsets after writes
+        print("\n--- Checking offsets after writes ---")
+        try:
+            # Query with string constant (alternative API - both strings and constants are supported)
+            offsets = await admin.list_offsets(
+                table_path,
+                bucket_ids=[0],
+                offset_type="latest"  # Can also use "earliest" or "timestamp"
+            )
+            print(f"Latest offsets after writing 7 records: {offsets}")
+        except Exception as e:
+            print(f"Failed to list offsets: {e}")
+
     except Exception as e:
         print(f"Error during writing: {e}")
 
@@ -242,10 +268,13 @@ async def main():
         batch_scanner = await table.new_scan().create_batch_scanner()
         print(f"Created batch scanner: {batch_scanner}")
 
-        # Subscribe to scan from earliest to latest
-        # start_timestamp=None (earliest), end_timestamp=None (latest)
-        batch_scanner.subscribe(None, None)
+        # Subscribe to buckets (required before to_arrow/to_pandas)
+        # Use subscribe_buckets to subscribe to all buckets, starting from EARLIEST_OFFSET
+        num_buckets = (await admin.get_table(table_path)).num_buckets
+        batch_scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+        print(f"Subscribed to {num_buckets} buckets from EARLIEST_OFFSET")
 
+        # Read all data using to_arrow()
         print("Scanning results using to_arrow():")
 
         # Try to get as PyArrow Table
@@ -255,13 +284,13 @@ async def main():
         except Exception as e:
             print(f"Could not convert to PyArrow: {e}")
 
-        # Let's subscribe from the beginning again.
-        # Reset subscription
-        batch_scanner.subscribe(None, None)
+        # Create a new batch scanner for to_pandas() test
+        batch_scanner2 = await table.new_scan().create_batch_scanner()
+        batch_scanner2.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
         # Try to get as Pandas DataFrame
         try:
-            df_result = batch_scanner.to_pandas()
+            df_result = batch_scanner2.to_pandas()
             print(f"\nAs Pandas DataFrame:\n{df_result}")
         except Exception as e:
             print(f"Could not convert to Pandas: {e}")
@@ -273,13 +302,14 @@ async def main():
 
         # Test poll_arrow() method for incremental reading as Arrow Table
         print("\n--- Testing poll_arrow() method ---")
-        # Reset subscription to start from the beginning
-        batch_scanner.subscribe(None, None)
+        batch_scanner3 = await table.new_scan().create_batch_scanner()
+        batch_scanner3.subscribe(bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
+        print(f"Subscribed to bucket 0 at EARLIEST_OFFSET ({fluss.EARLIEST_OFFSET})")
 
         # Poll with a timeout of 5000ms (5 seconds)
         # Note: poll_arrow() returns an empty table (not an error) on timeout
         try:
-            poll_result = batch_scanner.poll_arrow(5000)
+            poll_result = batch_scanner3.poll_arrow(5000)
             print(f"Number of rows: {poll_result.num_rows}")
 
             if poll_result.num_rows > 0:
@@ -287,7 +317,7 @@ async def main():
                 print(f"Polled data:\n{poll_df}")
             else:
                 print("Empty result (no records available)")
-                # Empty table still has schema
+                # Empty table still has schema - this is useful!
                 print(f"Schema: {poll_result.schema}")
 
         except Exception as e:
@@ -295,10 +325,11 @@ async def main():
 
         # Test poll_batches() method for batches with metadata
         print("\n--- Testing poll_batches() method ---")
-        batch_scanner.subscribe(None, None)
+        batch_scanner4 = await table.new_scan().create_batch_scanner()
+        batch_scanner4.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
         try:
-            batches = batch_scanner.poll_batches(5000)
+            batches = batch_scanner4.poll_batches(5000)
             print(f"Number of batches: {len(batches)}")
 
             for i, batch in enumerate(batches):
@@ -319,7 +350,7 @@ async def main():
         record_scanner = await table.new_scan().create_log_scanner()
         print(f"Created record scanner: {record_scanner}")
 
-        record_scanner.subscribe(None, None)
+        record_scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
         # Poll returns List[ScanRecord] with per-record metadata
         print("\n--- Testing poll() method (record-by-record) ---")
@@ -539,10 +570,13 @@ async def main():
     # Demo: Column projection using builder pattern
     print("\n--- Testing Column Projection ---")
     try:
+        # Get bucket count for subscriptions
+        num_buckets = (await admin.get_table(table_path)).num_buckets
+
         # Project specific columns by index (using batch scanner for to_pandas)
         print("\n1. Projection by index [0, 1] (id, name):")
         scanner_index = await table.new_scan().project([0, 1]).create_batch_scanner()
-        scanner_index.subscribe(None, None)
+        scanner_index.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
         df_projected = scanner_index.to_pandas()
         print(df_projected.head())
         print(
@@ -554,7 +588,7 @@ async def main():
         scanner_names = await table.new_scan() \
             .project_by_name(["name", "score"]) \
             .create_batch_scanner()
-        scanner_names.subscribe(None, None)
+        scanner_names.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
         df_named = scanner_names.to_pandas()
         print(df_named.head())
         print(f"   Projected {df_named.shape[1]} columns: {list(df_named.columns)}")
@@ -562,7 +596,7 @@ async def main():
         # Test empty result schema with projection
         print("\n3. Testing empty result schema with projection:")
         scanner_proj = await table.new_scan().project([0, 2]).create_batch_scanner()
-        scanner_proj.subscribe(None, None)
+        scanner_proj.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
         # Quick poll that may return empty
         result = scanner_proj.poll_arrow(100)
         print(f"   Schema columns: {result.schema.names}")
@@ -570,6 +604,134 @@ async def main():
     except Exception as e:
         print(f"Error during projection: {e}")
 
+    # Demo: Drop tables
+    print("\n--- Testing drop_table() ---")
+    try:
+        # Drop the log table
+        await admin.drop_table(table_path, ignore_if_not_exists=True)
+        print(f"Successfully dropped table: {table_path}")
+        # Drop the PK table
+        await admin.drop_table(pk_table_path, ignore_if_not_exists=True)
+        print(f"Successfully dropped table: {pk_table_path}")
+    except Exception as e:
+        print(f"Failed to drop table: {e}")
+
+    # =====================================================
+    # Demo: Partitioned Table with list_partition_offsets
+    # =====================================================
+    print("\n" + "=" * 60)
+    print("--- Testing Partitioned Table ---")
+    print("=" * 60)
+
+    # Create a partitioned log table
+    partitioned_fields = [
+        pa.field("id", pa.int32()),
+        pa.field("region", pa.string()),  # partition key
+        pa.field("value", pa.int64()),
+    ]
+    partitioned_schema = pa.schema(partitioned_fields)
+    fluss_partitioned_schema = fluss.Schema(partitioned_schema)
+
+    partitioned_table_descriptor = fluss.TableDescriptor(
+        fluss_partitioned_schema,
+        partition_keys=["region"],  # Partition by region
+        bucket_count=1,
+    )
+
+    partitioned_table_path = fluss.TablePath("fluss", "partitioned_log_table_py")
+
+    try:
+        # Drop if exists first
+        await admin.drop_table(partitioned_table_path, ignore_if_not_exists=True)
+        print(f"Dropped existing table: {partitioned_table_path}")
+
+        # Create the partitioned table
+        await admin.create_table(partitioned_table_path, partitioned_table_descriptor, False)
+        print(f"Created partitioned table: {partitioned_table_path}")
+
+        # Create partitions for US and EU regions
+        print("\n--- Creating partitions ---")
+        await admin.create_partition(partitioned_table_path, {"region": "US"}, ignore_if_exists=True)
+        print("Created partition: region=US")
+        await admin.create_partition(partitioned_table_path, {"region": "EU"}, ignore_if_exists=True)
+        print("Created partition: region=EU")
+
+        # List partitions
+        print("\n--- Listing partitions ---")
+        partition_infos = await admin.list_partition_infos(partitioned_table_path)
+        for p in partition_infos:
+            print(f"  {p}")  # PartitionInfo(partition_id=..., partition_name='region=...')
+
+        # Get the table and write some data
+        partitioned_table = await conn.get_table(partitioned_table_path)
+        partitioned_writer = await partitioned_table.new_append_writer()
+
+        # Append data to US partition
+        await partitioned_writer.append({"id": 1, "region": "US", "value": 100})
+        await partitioned_writer.append({"id": 2, "region": "US", "value": 200})
+        # Append data to EU partition
+        await partitioned_writer.append({"id": 3, "region": "EU", "value": 300})
+        await partitioned_writer.append({"id": 4, "region": "EU", "value": 400})
+        partitioned_writer.flush()
+        print("\nWrote 4 records (2 to US, 2 to EU)")
+
+        # Demo: list_partition_offsets
+        print("\n--- Testing list_partition_offsets ---")
+
+        # Query offsets for US partition
+        # Note: partition_name is just the value (e.g., "US"), not "region=US"
+        us_offsets = await admin.list_partition_offsets(
+            partitioned_table_path,
+            partition_name="US",
+            bucket_ids=[0],
+            offset_type="latest"
+        )
+        print(f"US partition latest offsets: {us_offsets}")
+
+        # Query offsets for EU partition
+        eu_offsets = await admin.list_partition_offsets(
+            partitioned_table_path,
+            partition_name="EU",
+            bucket_ids=[0],
+            offset_type="latest"
+        )
+        print(f"EU partition latest offsets: {eu_offsets}")
+
+        # Demo: subscribe_partition for reading partitioned data
+        print("\n--- Testing subscribe_partition + to_arrow() ---")
+        partitioned_scanner = await partitioned_table.new_scan().create_batch_scanner()
+
+        # Subscribe to each partition using partition_id
+        for p in partition_infos:
+            partitioned_scanner.subscribe_partition(
+                partition_id=p.partition_id,
+                bucket_id=0,
+                start_offset=fluss.EARLIEST_OFFSET
+            )
+            print(f"Subscribed to partition {p.partition_name} (id={p.partition_id})")
+
+        # Use to_arrow() - now works for partitioned tables!
+        partitioned_arrow = partitioned_scanner.to_arrow()
+        print(f"\nto_arrow() returned {partitioned_arrow.num_rows} records from partitioned table:")
+        print(partitioned_arrow.to_pandas())
+
+        # Demo: to_pandas() also works for partitioned tables
+        print("\n--- Testing to_pandas() on partitioned table ---")
+        partitioned_scanner2 = await partitioned_table.new_scan().create_batch_scanner()
+        for p in partition_infos:
+            partitioned_scanner2.subscribe_partition(p.partition_id, 0, fluss.EARLIEST_OFFSET)
+        partitioned_df = partitioned_scanner2.to_pandas()
+        print(f"to_pandas() returned {len(partitioned_df)} records:")
+        print(partitioned_df)
+
+        # Cleanup
+        await admin.drop_table(partitioned_table_path, ignore_if_not_exists=True)
+        print(f"\nDropped partitioned table: {partitioned_table_path}")
+
+    except Exception as e:
+        print(f"Error with partitioned table: {e}")
+        traceback.print_exc()
+
     # Close connection
     conn.close()
     print("\nConnection closed")
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 40d18f6c27..a2bbaac401 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -129,6 +129,78 @@ class FlussAdmin:
     ) -> None: ...
     async def get_table(self, table_path: TablePath) -> TableInfo: ...
     async def get_latest_lake_snapshot(self, table_path: TablePath) -> LakeSnapshot: ...
+    async def drop_table(
+        self,
+        table_path: TablePath,
+        ignore_if_not_exists: bool = False,
+    ) -> None: ...
+    async def list_offsets(
+        self,
+        table_path: TablePath,
+        bucket_ids: List[int],
+        offset_type: str,
+        timestamp: Optional[int] = None,
+    ) -> Dict[int, int]:
+        """List offsets for the specified buckets.
+
+        Args:
+            table_path: Path to the table
+            bucket_ids: List of bucket IDs to query
+            offset_type: "earliest", "latest", or "timestamp" (case-insensitive)
+            timestamp: Required when offset_type is "timestamp"
+
+        Returns:
+            Dict mapping bucket_id -> offset
+        """
+        ...
+    async def list_partition_offsets(
+        self,
+        table_path: TablePath,
+        partition_name: str,
+        bucket_ids: List[int],
+        offset_type: str,
+        timestamp: Optional[int] = None,
+    ) -> Dict[int, int]:
+        """List offsets for buckets in a specific partition.
+
+        Args:
+            table_path: Path to the table
+            partition_name: Partition value (e.g., "US" not "region=US")
+            bucket_ids: List of bucket IDs to query
+            offset_type: "earliest", "latest", or "timestamp" (case-insensitive)
+            timestamp: Required when offset_type is "timestamp"
+
+        Returns:
+            Dict mapping bucket_id -> offset
+        """
+        ...
+    async def create_partition(
+        self,
+        table_path: TablePath,
+        partition_spec: Dict[str, str],
+        ignore_if_exists: bool = False,
+    ) -> None:
+        """Create a partition for a partitioned table.
+
+        Args:
+            table_path: Path to the table
+            partition_spec: Dict mapping partition column name to value (e.g., {"region": "US"})
+            ignore_if_exists: If True, don't raise error if partition already exists
+        """
+        ...
+    async def list_partition_infos(
+        self,
+        table_path: TablePath,
+    ) -> List["PartitionInfo"]:
+        """List all partitions for a partitioned table.
+
+        Args:
+            table_path: Path to the table
+
+        Returns:
+            List of PartitionInfo objects
+        """
+        ...
     def __repr__(self) -> str: ...
 
 class TableScan:
@@ -322,14 +394,30 @@ class LogScanner:
         scanner = await table.new_scan().project([0, 1]).create_log_scanner()
     """
 
-    def subscribe(
-        self, start_timestamp: Optional[int], end_timestamp: Optional[int]
+    def subscribe(self, bucket_id: int, start_offset: int) -> None:
+        """Subscribe to a single bucket at a specific offset (non-partitioned tables).
+
+        Args:
+            bucket_id: The bucket ID to subscribe to
+            start_offset: The offset to start reading from (use EARLIEST_OFFSET for beginning)
+        """
+        ...
+    def subscribe_buckets(self, bucket_offsets: Dict[int, int]) -> None:
+        """Subscribe to multiple buckets at specified offsets (non-partitioned tables).
+
+        Args:
+            bucket_offsets: Dict mapping bucket_id -> start_offset
+        """
+        ...
+    def subscribe_partition(
+        self, partition_id: int, bucket_id: int, start_offset: int
     ) -> None:
-        """Subscribe to log data with timestamp range.
+        """Subscribe to a bucket within a specific partition (partitioned tables only).
 
         Args:
-            start_timestamp: Not yet supported, must be None.
-            end_timestamp: Not yet supported, must be None.
+            partition_id: The partition ID (from PartitionInfo.partition_id)
+            bucket_id: The bucket ID within the partition
+            start_offset: The offset to start reading from (use EARLIEST_OFFSET for beginning)
         """
         ...
     def poll(self, timeout_ms: int) -> List[ScanRecord]:
@@ -384,12 +472,18 @@ class LogScanner:
         """Convert all data to Pandas DataFrame.
 
         Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+        Reads from currently subscribed buckets until reaching their latest offsets.
+
+        You must call subscribe(), subscribe_buckets(), or subscribe_partition() first.
         """
         ...
     def to_arrow(self) -> pa.Table:
         """Convert all data to Arrow Table.
 
         Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+        Reads from currently subscribed buckets until reaching their latest offsets.
+
+        You must call subscribe(), subscribe_buckets(), or subscribe_partition() first.
         """
         ...
     def __repr__(self) -> str: ...
@@ -493,4 +587,27 @@ class TableDistribution:
     def bucket_keys(self) -> List[str]: ...
     def bucket_count(self) -> Optional[int]: ...
 
+class PartitionInfo:
+    """Information about a partition."""
+
+    @property
+    def partition_id(self) -> int:
+        """Get the partition ID (globally unique in the cluster)."""
+        ...
+    @property
+    def partition_name(self) -> str:
+        """Get the partition name."""
+        ...
+    def __repr__(self) -> str: ...
+
+class OffsetType:
+    """Offset type constants for list_offsets() and list_partition_offsets()."""
+
+    EARLIEST: str
+    LATEST: str
+    TIMESTAMP: str
+
+# Constant for earliest offset (-2)
+EARLIEST_OFFSET: int
+
 __version__: str
diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
index fa189eb80d..d28c9c066e 100644
--- a/fluss-rust/bindings/python/src/admin.rs
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 use crate::*;
+use fcore::rpc::message::OffsetSpec;
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::sync::Arc;
 
@@ -25,6 +26,37 @@ pub struct FlussAdmin {
     __admin: Arc<fcore::client::FlussAdmin>,
 }
 
+/// Parse an offset_type string (matched ASCII case-insensitively) into an OffsetSpec.
+fn parse_offset_spec(offset_type: &str, timestamp: Option<i64>) -> PyResult<OffsetSpec> {
+    match offset_type {
+        s if s.eq_ignore_ascii_case("earliest") => Ok(OffsetSpec::Earliest),
+        s if s.eq_ignore_ascii_case("latest") => Ok(OffsetSpec::Latest),
+        s if s.eq_ignore_ascii_case("timestamp") => {
+            let ts = timestamp.ok_or_else(|| {
+                FlussError::new_err("timestamp must be provided when offset_type='timestamp'")
+            })?;
+            Ok(OffsetSpec::Timestamp(ts))
+        }
+        _ => Err(FlussError::new_err(format!(
+            "Invalid offset_type: '{}'. Must be 'earliest', 'latest', or 'timestamp'",
+            offset_type
+        ))),
+    }
+}
+
+/// Validate that every bucket ID is non-negative; the error names the first negative ID found.
+fn validate_bucket_ids(bucket_ids: &[i32]) -> PyResult<()> {
+    for &bucket_id in bucket_ids {
+        if bucket_id < 0 {
+            return Err(FlussError::new_err(format!(
+                "Invalid bucket_id: {}. Bucket IDs must be non-negative",
+                bucket_id
+            )));
+        }
+    }
+    Ok(())
+}
+
 #[pymethods]
 impl FlussAdmin {
     /// Create a table with the given schema
@@ -38,7 +70,7 @@ impl FlussAdmin {
     ) -> PyResult<Bound<'py, PyAny>> {
         let ignore = ignore_if_exists.unwrap_or(false);
 
-        let core_table_path = table_path.to_core().clone();
+        let core_table_path = table_path.to_core();
         let core_descriptor = table_descriptor.to_core().clone();
         let admin = self.__admin.clone();
 
@@ -58,7 +90,7 @@ impl FlussAdmin {
         py: Python<'py>,
         table_path: &TablePath,
     ) -> PyResult<Bound<'py, PyAny>> {
-        let core_table_path = table_path.to_core().clone();
+        let core_table_path = table_path.to_core();
         let admin = self.__admin.clone();
 
         future_into_py(py, async move {
@@ -80,7 +112,7 @@ impl FlussAdmin {
         py: Python<'py>,
         table_path: &TablePath,
     ) -> PyResult<Bound<'py, PyAny>> {
-        let core_table_path = table_path.to_core().clone();
+        let core_table_path = table_path.to_core();
         let admin = self.__admin.clone();
 
         future_into_py(py, async move {
@@ -96,6 +128,183 @@ impl FlussAdmin {
         })
     }
 
+    /// Drop a table; the returned awaitable resolves to None on success
+    #[pyo3(signature = (table_path, ignore_if_not_exists=false))]
+    pub fn drop_table<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+        ignore_if_not_exists: bool,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let client = self.__admin.clone();
+        let target = table_path.to_core();
+
+        future_into_py(py, async move {
+            let outcome = client.drop_table(&target, ignore_if_not_exists).await;
+            if let Err(e) = outcome {
+                return Err(FlussError::new_err(format!("Failed to drop table: {e}")));
+            }
+            // Success carries no payload, so hand Python a plain None.
+            Python::attach(|py| Ok(py.None()))
+        })
+    }
+
+    /// Look up log offsets for buckets of a non-partitioned table.
+    ///
+    /// Args:
+    ///     table_path: Path to the table
+    ///     bucket_ids: Bucket IDs to query; each must be non-negative
+    ///     offset_type: Which offset to return:
+    ///         - "earliest" / OffsetType.EARLIEST: start of the log
+    ///         - "latest" / OffsetType.LATEST: end of the log
+    ///         - "timestamp" / OffsetType.TIMESTAMP: offset at `timestamp`
+    ///     timestamp: Required for "timestamp"; ignored for the other types
+    ///
+    /// Returns:
+    ///     dict[int, int]: Mapping of bucket_id -> offset
+    #[pyo3(signature = (table_path, bucket_ids, offset_type, timestamp=None))]
+    pub fn list_offsets<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+        bucket_ids: Vec<i32>,
+        offset_type: &str,
+        timestamp: Option<i64>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        // Reject bad arguments synchronously, before any future is created.
+        validate_bucket_ids(&bucket_ids)?;
+        let spec = parse_offset_spec(offset_type, timestamp)?;
+
+        let client = self.__admin.clone();
+        let target = table_path.to_core();
+
+        future_into_py(py, async move {
+            let fetched = client.list_offsets(&target, &bucket_ids, spec).await;
+            let by_bucket = fetched
+                .map_err(|e| FlussError::new_err(format!("Failed to list offsets: {e}")))?;
+
+            Python::attach(|py| {
+                let mapping = pyo3::types::PyDict::new(py);
+                by_bucket
+                    .into_iter()
+                    .try_for_each(|(bucket, offset)| mapping.set_item(bucket, offset))?;
+                Ok(mapping.unbind())
+            })
+        })
+    }
+
+    /// Look up log offsets for buckets inside one partition of a partitioned table.
+    ///
+    /// Args:
+    ///     table_path: Path to the table
+    ///     partition_name: Partition value (e.g., "US" not "region=US")
+    ///     bucket_ids: Bucket IDs to query; each must be non-negative
+    ///     offset_type: Which offset to return:
+    ///         - "earliest" / OffsetType.EARLIEST: start of the log
+    ///         - "latest" / OffsetType.LATEST: end of the log
+    ///         - "timestamp" / OffsetType.TIMESTAMP: offset at `timestamp`
+    ///     timestamp: Required for "timestamp"; ignored for the other types
+    ///
+    /// Returns:
+    ///     dict[int, int]: Mapping of bucket_id -> offset
+    #[pyo3(signature = (table_path, partition_name, bucket_ids, offset_type, timestamp=None))]
+    pub fn list_partition_offsets<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+        partition_name: &str,
+        bucket_ids: Vec<i32>,
+        offset_type: &str,
+        timestamp: Option<i64>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        validate_bucket_ids(&bucket_ids)?;
+        let spec = parse_offset_spec(offset_type, timestamp)?;
+
+        let client = self.__admin.clone();
+        let target = table_path.to_core();
+        // The `async move` block cannot hold the borrowed &str, so take an owned copy.
+        let partition = partition_name.to_owned();
+
+        future_into_py(py, async move {
+            let fetched = client
+                .list_partition_offsets(&target, &partition, &bucket_ids, spec)
+                .await;
+            let by_bucket = fetched.map_err(|e| {
+                FlussError::new_err(format!("Failed to list partition offsets: {e}"))
+            })?;
+            Python::attach(|py| {
+                let mapping = pyo3::types::PyDict::new(py);
+                for (bucket, offset) in by_bucket {
+                    mapping.set_item(bucket, offset)?;
+                }
+                Ok(mapping.unbind())
+            })
+        })
+    }
+
+    /// Create a partition for a partitioned table.
+    ///
+    /// Args:
+    ///     table_path: Path to the table
+    ///     partition_spec: Dict of partition column name -> value (e.g., {"region": "US"})
+    ///     ignore_if_exists: If True, don't raise an error when the partition already exists
+    ///
+    /// Returns:
+    ///     None
+    #[pyo3(signature = (table_path, partition_spec, ignore_if_exists=false))]
+    pub fn create_partition<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+        partition_spec: std::collections::HashMap<String, String>,
+        ignore_if_exists: bool,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let client = self.__admin.clone();
+        let target = table_path.to_core();
+        let spec = fcore::metadata::PartitionSpec::new(partition_spec);
+
+        future_into_py(py, async move {
+            let outcome = client.create_partition(&target, &spec, ignore_if_exists).await;
+            if let Err(e) = outcome {
+                return Err(FlussError::new_err(format!("Failed to create partition: {e}")));
+            }
+
+            Python::attach(|py| Ok(py.None()))
+        })
+    }
+
+    /// List all partitions for a partitioned table.
+    ///
+    /// Args:
+    ///     table_path: Path to the table
+    ///
+    /// Returns:
+    ///     List[PartitionInfo]: One entry per partition returned by the admin client
+    pub fn list_partition_infos<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let client = self.__admin.clone();
+        let target = table_path.to_core();
+
+        future_into_py(py, async move {
+            let listed = client.list_partition_infos(&target).await;
+            let infos = listed
+                .map_err(|e| FlussError::new_err(format!("Failed to list partitions: {e}")))?;
+
+            Python::attach(|py| {
+                let result = pyo3::types::PyList::empty(py);
+                // Wrap each core PartitionInfo in its Python-facing class.
+                for core_info in infos {
+                    let wrapped = Py::new(py, PartitionInfo::from_core(core_info))?;
+                    result.append(wrapped)?;
+                }
+                Ok(result.unbind())
+            })
+        })
+    }
+
     fn __repr__(&self) -> String {
         "FlussAdmin()".to_string()
     }
@@ -109,3 +318,41 @@ impl FlussAdmin {
         }
     }
 }
+
+/// Python-facing view of a partition: its ID and its name
+#[pyclass]
+pub struct PartitionInfo {
+    partition_id: i64,
+    partition_name: String,
+}
+
+impl PartitionInfo {
+    pub fn from_core(info: fcore::metadata::PartitionInfo) -> Self {
+        Self {
+            partition_id: info.get_partition_id(),
+            partition_name: info.get_partition_name(),
+        }
+    }
+}
+
+#[pymethods]
+impl PartitionInfo {
+    /// Partition ID (globally unique in the cluster)
+    #[getter]
+    fn partition_id(&self) -> i64 {
+        self.partition_id
+    }
+
+    /// Partition name (e.g., "US" for a table partitioned by region)
+    #[getter]
+    fn partition_name(&self) -> &str {
+        self.partition_name.as_str()
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "PartitionInfo(partition_id={}, partition_name='{}')",
+            self.partition_id, self.partition_name
+        )
+    }
+}
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index ce063aba4a..ae7f6c500a 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -48,6 +48,23 @@ static TOKIO_RUNTIME: LazyLock<Runtime> = LazyLock::new(|| {
         .expect("Failed to create Tokio runtime")
 });
 
+/// String constants naming the `offset_type` values accepted by list_offsets() and list_partition_offsets()
+#[pyclass]
+#[derive(Clone)]
+pub struct OffsetType;
+
+#[pymethods]
+impl OffsetType {
+    #[classattr]
+    const EARLIEST: &'static str = "earliest";
+
+    #[classattr]
+    const LATEST: &'static str = "latest";
+
+    #[classattr]
+    const TIMESTAMP: &'static str = "timestamp";
+}
+
 #[pymodule]
 fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     // Register all classes
@@ -69,6 +86,11 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<ChangeType>()?;
     m.add_class::<ScanRecord>()?;
     m.add_class::<RecordBatch>()?;
+    m.add_class::<PartitionInfo>()?;
+    m.add_class::<OffsetType>()?;
+
+    // Register constants
+    m.add("EARLIEST_OFFSET", fcore::client::EARLIEST_OFFSET)?;
 
     // Register exception types
     m.add_class::<FlussError>()?;
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 30c7ce0bff..c285f25c3a 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -20,7 +20,6 @@ use crate::*;
 use arrow::array::RecordBatch as ArrowRecordBatch;
 use arrow_pyarrow::{FromPyArrow, ToPyArrow};
 use arrow_schema::SchemaRef;
-use fluss::client::EARLIEST_OFFSET;
 use fluss::record::to_arrow_schema;
 use fluss::rpc::message::OffsetSpec;
 use pyo3::types::IntoPyDict;
@@ -1573,155 +1572,95 @@ pub struct LogScanner {
     projected_schema: SchemaRef,
     /// The projected row type to use for record-based scanning
     projected_row_type: fcore::metadata::RowType,
-    #[allow(dead_code)]
-    start_timestamp: Option<i64>,
-    #[allow(dead_code)]
-    end_timestamp: Option<i64>,
+    /// Cache for partition_id -> partition_name mapping (avoids repeated list_partition_infos calls)
+    partition_name_cache: std::sync::RwLock<Option<HashMap<i64, String>>>,
 }
 
 #[pymethods]
 impl LogScanner {
-    /// Subscribe to log data with timestamp range
-    fn subscribe(
-        &mut self,
-        _start_timestamp: Option<i64>,
-        _end_timestamp: Option<i64>,
-    ) -> PyResult<()> {
-        if _start_timestamp.is_some() {
-            return Err(FlussError::new_err(
-                "Specifying start_timestamp is not yet supported. Please use None.".to_string(),
-            ));
-        }
-        if _end_timestamp.is_some() {
-            return Err(FlussError::new_err(
-                "Specifying end_timestamp is not yet supported. Please use None.".to_string(),
-            ));
-        }
-
-        let num_buckets = self.table_info.get_num_buckets();
-        for bucket_id in 0..num_buckets {
-            let start_offset = EARLIEST_OFFSET;
-
-            // Subscribe to the appropriate scanner
-            if let Some(ref inner) = self.inner {
-                TOKIO_RUNTIME.block_on(async {
+    /// Subscribe to a single bucket at a specific offset (non-partitioned tables).
+    ///
+    /// Args:
+    ///     bucket_id: The bucket ID to subscribe to
+    ///     start_offset: The offset to start reading from (use EARLIEST_OFFSET for beginning)
+    fn subscribe(&self, py: Python, bucket_id: i32, start_offset: i64) -> PyResult<()> {
+        py.detach(|| {
+            TOKIO_RUNTIME.block_on(async {
+                if let Some(ref inner) = self.inner {
                     inner
                         .subscribe(bucket_id, start_offset)
                         .await
-                        .map_err(|e| FlussError::new_err(e.to_string()))
-                })?;
-            } else if let Some(ref inner_batch) = self.inner_batch {
-                TOKIO_RUNTIME.block_on(async {
+                        .map_err(|e| FlussError::new_err(format!("Failed to subscribe: {e}")))
+                } else if let Some(ref inner_batch) = self.inner_batch {
                     inner_batch
                         .subscribe(bucket_id, start_offset)
                         .await
-                        .map_err(|e| FlussError::new_err(e.to_string()))
-                })?;
-            } else {
-                return Err(FlussError::new_err("No scanner available"));
-            }
-        }
-
-        Ok(())
+                        .map_err(|e| FlussError::new_err(format!("Failed to subscribe: {e}")))
+                } else {
+                    Err(FlussError::new_err("No scanner available"))
+                }
+            })
+        })
     }
 
-    /// Convert all data to Arrow Table
+    /// Subscribe to multiple buckets at specified offsets (non-partitioned tables).
     ///
-    /// Note: Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
-    fn to_arrow(&self, py: Python) -> PyResult<Py<PyAny>> {
-        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
-            FlussError::new_err(
-                "Batch-based scanner not available. Use new_scan().create_batch_scanner() to create a scanner \
-                 that supports to_arrow().",
-            )
-        })?;
-
-        let mut all_batches = Vec::new();
-
-        let num_buckets = self.table_info.get_num_buckets();
-        let bucket_ids: Vec<i32> = (0..num_buckets).collect();
-
-        // todo: after supporting list_offsets with timestamp, we can use start_timestamp and end_timestamp here
-        let mut stopping_offsets: HashMap<i32, i64> = py
-            .detach(|| {
-                TOKIO_RUNTIME.block_on(async {
-                    self.admin
-                        .list_offsets(
-                            &self.table_info.table_path,
-                            bucket_ids.as_slice(),
-                            OffsetSpec::Latest,
-                        )
+    /// Args:
+    ///     bucket_offsets: A dict mapping bucket_id -> start_offset
+    fn subscribe_buckets(&self, py: Python, bucket_offsets: HashMap<i32, i64>) -> PyResult<()> {
+        py.detach(|| {
+            TOKIO_RUNTIME.block_on(async {
+                if let Some(ref inner) = self.inner {
+                    inner
+                        .subscribe_buckets(&bucket_offsets)
                         .await
-                })
-            })
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
-
-        // Filter out buckets with no records to read (stop_at <= 0)
-        stopping_offsets.retain(|_, &mut v| v > 0);
-
-        while !stopping_offsets.is_empty() {
-            let scan_batches = py
-                .detach(|| {
-                    TOKIO_RUNTIME
-                        .block_on(async { inner_batch.poll(Duration::from_millis(500)).await })
-                })
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
-
-            if scan_batches.is_empty() {
-                continue;
-            }
-
-            for scan_batch in scan_batches {
-                let bucket_id = scan_batch.bucket().bucket_id();
-
-                // Check if this bucket is still being tracked; if not, ignore the batch
-                let Some(&stop_at) = stopping_offsets.get(&bucket_id) else {
-                    continue;
-                };
-
-                let base_offset = scan_batch.base_offset();
-                let last_offset = scan_batch.last_offset();
-
-                // If the batch starts at or after the stop_at offset, the bucket is exhausted
-                if base_offset >= stop_at {
-                    stopping_offsets.remove(&bucket_id);
-                    continue;
-                }
-
-                let batch = if last_offset >= stop_at {
-                    // This batch contains the target offset; slice it to keep only records
-                    // where offset < stop_at.
-                    let num_to_keep = (stop_at - base_offset) as usize;
-                    let b = scan_batch.into_batch();
-
-                    // Safety check: ensure we don't attempt to slice more rows than the batch contains
-                    let limit = num_to_keep.min(b.num_rows());
-                    b.slice(0, limit)
+                        .map_err(|e| FlussError::new_err(format!("Failed to subscribe batch: {e}")))
+                } else if let Some(ref inner_batch) = self.inner_batch {
+                    inner_batch
+                        .subscribe_buckets(&bucket_offsets)
+                        .await
+                        .map_err(|e| FlussError::new_err(format!("Failed to subscribe batch: {e}")))
                 } else {
-                    // The entire batch is within the desired range (all offsets < stop_at)
-                    scan_batch.into_batch()
-                };
-
-                all_batches.push(Arc::new(batch));
-
-                // If the batch's last offset reached or passed the inclusive limit (stop_at - 1),
-                // we are done with this bucket.
-                if last_offset >= stop_at - 1 {
-                    stopping_offsets.remove(&bucket_id);
+                    Err(FlussError::new_err("No scanner available"))
                 }
-            }
-        }
-
-        Utils::combine_batches_to_table(py, all_batches)
+            })
+        })
     }
 
-    /// Convert all data to Pandas DataFrame
-    fn to_pandas(&self, py: Python) -> PyResult<Py<PyAny>> {
-        let arrow_table = self.to_arrow(py)?;
-
-        // Convert Arrow Table to Pandas DataFrame using pyarrow
-        let df = arrow_table.call_method0(py, "to_pandas")?;
-        Ok(df)
+    /// Start reading one bucket of one partition at `start_offset` (partitioned tables only).
+    ///
+    /// Args:
+    ///     partition_id: The partition ID (from PartitionInfo.partition_id)
+    ///     bucket_id: The bucket ID within the partition
+    ///     start_offset: Offset to begin reading at (use EARLIEST_OFFSET for the beginning)
+    fn subscribe_partition(
+        &self,
+        py: Python,
+        partition_id: i64,
+        bucket_id: i32,
+        start_offset: i64,
+    ) -> PyResult<()> {
+        py.detach(|| {
+            TOKIO_RUNTIME.block_on(async {
+                // Exactly one scanner flavour is consulted: the record scanner when
+                // present, otherwise the batch scanner, otherwise it is an error.
+                match (self.inner.as_ref(), self.inner_batch.as_ref()) {
+                    (Some(records), _) => records
+                        .subscribe_partition(partition_id, bucket_id, start_offset)
+                        .await
+                        .map_err(|e| {
+                            FlussError::new_err(format!("Failed to subscribe partition: {e}"))
+                        }),
+                    (None, Some(batches)) => batches
+                        .subscribe_partition(partition_id, bucket_id, start_offset)
+                        .await
+                        .map_err(|e| {
+                            FlussError::new_err(format!("Failed to subscribe partition: {e}"))
+                        }),
+                    (None, None) => Err(FlussError::new_err("No scanner available")),
+                }
+            })
+        })
     }
 
     /// Poll for individual records with metadata.
@@ -1873,6 +1812,54 @@ impl LogScanner {
         Ok(empty_table.into())
     }
 
+    /// Convert all data to Arrow Table.
+    ///
+    /// Reads from currently subscribed buckets (partitioned or not) up to their latest
+    /// offsets. Buckets whose current position is already at or past the latest offset are
+    /// skipped. Call subscribe(), subscribe_buckets(), or subscribe_partition() first.
+    ///
+    /// Returns:
+    ///     PyArrow Table containing all data from subscribed buckets
+    fn to_arrow(&self, py: Python) -> PyResult<Py<PyAny>> {
+        // 1. Get subscribed buckets from scanner (requires batch scanner for get_subscribed_buckets)
+        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
+            FlussError::new_err(
+                "Batch-based scanner not available. Use new_scan().create_batch_scanner() to create a scanner \
+                 that supports to_arrow().",
+            )
+        })?;
+        let subscribed = inner_batch.get_subscribed_buckets();
+        if subscribed.is_empty() {
+            return Err(FlussError::new_err(
+                "No buckets subscribed. Call subscribe(), subscribe_buckets(), or subscribe_partition() first.",
+            ));
+        }
+
+        // 2. Query latest offsets; drop caught-up buckets (no batch would arrive, so polling would never end)
+        let mut stopping_offsets = self.query_latest_offsets(py, &subscribed)?;
+        let positions: HashMap<_, _> = subscribed.into_iter().collect();
+        stopping_offsets.retain(|tb, stop| !positions.get(tb).is_some_and(|pos| *pos >= *stop));
+        // 3. Poll until all remaining buckets reach their stopping offsets
+        self.poll_until_offsets(py, stopping_offsets)
+    }
+
+    /// Convert all data to Pandas DataFrame.
+    ///
+    /// Builds the PyArrow Table via to_arrow() (same requirement: call subscribe(),
+    /// subscribe_buckets(), or subscribe_partition() first), then converts it by
+    /// calling the table's `to_pandas` method.
+    /// Works for both partitioned and non-partitioned tables.
+    ///
+    /// Returns:
+    ///     Pandas DataFrame containing all data from subscribed buckets
+    fn to_pandas(&self, py: Python) -> PyResult<Py<PyAny>> {
+        // Any failure while building the Arrow table is returned unchanged.
+        let table = self.to_arrow(py)?;
+
+        // Delegate the conversion to pyarrow; its result is handed back as-is.
+        table.call_method0(py, "to_pandas")
+    }
+
     fn __repr__(&self) -> String {
         format!("LogScanner(table={})", self.table_info.table_path)
     }
@@ -1894,8 +1881,7 @@ impl LogScanner {
             table_info,
             projected_schema,
             projected_row_type,
-            start_timestamp: None,
-            end_timestamp: None,
+            partition_name_cache: std::sync::RwLock::new(None),
         }
     }
 
@@ -1914,9 +1900,215 @@ impl LogScanner {
             table_info,
             projected_schema,
             projected_row_type,
-            start_timestamp: None,
-            end_timestamp: None,
+            partition_name_cache: std::sync::RwLock::new(None),
+        }
+    }
+
+    /// Return the partition_id -> partition_name map for `table_path`.
+    ///
+    /// The first successful lookup is cached on the scanner and reused by every later
+    /// call; nothing in this function refreshes the cache afterwards.
+    ///
+    /// Panics if the cache lock is poisoned (`unwrap` on the lock result).
+    fn get_partition_name_map(
+        &self,
+        py: Python,
+        table_path: &fcore::metadata::TablePath,
+    ) -> PyResult<HashMap<i64, String>> {
+        // Fast path: an earlier call already filled the cache. The read guard is a
+        // temporary, so the lock is released before anything else happens.
+        let cached = self.partition_name_cache.read().unwrap().clone();
+        if let Some(names) = cached {
+            return Ok(names);
+        }
+
+        // Slow path: list the partitions with the GIL released while blocking.
+        let listed = py.detach(|| {
+            TOKIO_RUNTIME.block_on(async { self.admin.list_partition_infos(table_path).await })
+        });
+        let infos: Vec<fcore::metadata::PartitionInfo> = listed
+            .map_err(|e| FlussError::new_err(format!("Failed to list partition infos: {e}")))?;
+
+        // Index the listing by partition id.
+        let mut names = HashMap::with_capacity(infos.len());
+        for info in infos {
+            names.insert(info.get_partition_id(), info.get_partition_name());
+        }
+
+        // Keep one copy in the cache and hand the other to the caller.
+        *self.partition_name_cache.write().unwrap() = Some(names.clone());
+        Ok(names)
+    }
+
+    /// Look up the latest offset of every subscribed bucket.
+    ///
+    /// Partitioned tables are delegated to `query_partitioned_offsets`; otherwise a single
+    /// `list_offsets` call with `OffsetSpec::Latest` is made for all subscribed bucket IDs.
+    /// Buckets whose latest offset is not positive are omitted from the result.
+    fn query_latest_offsets(
+        &self,
+        py: Python,
+        subscribed: &[(fcore::metadata::TableBucket, i64)],
+    ) -> PyResult<HashMap<fcore::metadata::TableBucket, i64>> {
+        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
+            FlussError::new_err("Batch-based scanner required for this operation")
+        })?;
+
+        // Partitioned tables need one request per partition.
+        if inner_batch.is_partitioned() {
+            return self.query_partitioned_offsets(py, subscribed);
+        }
+
+        let table_path = &self.table_info.table_path;
+        let table_id = self.table_info.table_id;
+        let bucket_ids: Vec<i32> = subscribed.iter().map(|(tb, _)| tb.bucket_id()).collect();
+
+        // Release the GIL while the blocking call runs on the shared runtime.
+        let fetched = py.detach(|| {
+            TOKIO_RUNTIME.block_on(async {
+                self.admin
+                    .list_offsets(table_path, &bucket_ids, OffsetSpec::Latest)
+                    .await
+            })
+        });
+        let offsets: HashMap<i32, i64> =
+            fetched.map_err(|e| FlussError::new_err(format!("Failed to list offsets: {e}")))?;
+
+        // Re-key by TableBucket, keeping only buckets with a positive latest offset.
+        let mut latest = HashMap::new();
+        for (bucket_id, offset) in offsets {
+            if offset > 0 {
+                latest.insert(fcore::metadata::TableBucket::new(table_id, bucket_id), offset);
+            }
+        }
+        Ok(latest)
+    }
+
+    /// Query latest offsets (OffsetSpec::Latest) for partitioned-table subscriptions, one list_partition_offsets call per partition; offsets <= 0 are dropped
+    fn query_partitioned_offsets(
+        &self,
+        py: Python,
+        subscribed: &[(fcore::metadata::TableBucket, i64)],
+    ) -> PyResult<HashMap<fcore::metadata::TableBucket, i64>> {
+        let table_path = &self.table_info.table_path;
+
+        // partition_id -> partition_name (cached). NOTE(review): the cache is never refreshed, so an id missing from it fails below as "Unknown partition_id" - confirm that is intended
+        let partition_id_to_name = self.get_partition_name_map(py, table_path)?;
+
+        // Group subscribed bucket IDs by partition_id; buckets without a partition_id are silently skipped
+        let mut by_partition: HashMap<i64, Vec<i32>> = HashMap::new();
+        for (tb, _) in subscribed {
+            if let Some(partition_id) = tb.partition_id() {
+                by_partition
+                    .entry(partition_id)
+                    .or_default()
+                    .push(tb.bucket_id());
+            }
+        }
+
+        // One blocking lookup per partition (GIL released via py.detach); the first failure aborts the whole query
+        let mut result: HashMap<fcore::metadata::TableBucket, i64> = HashMap::new();
+        let table_id = self.table_info.table_id;
+
+        for (partition_id, bucket_ids) in by_partition {
+            let partition_name = partition_id_to_name.get(&partition_id).ok_or_else(|| {
+                FlussError::new_err(format!("Unknown partition_id: {partition_id}"))
+            })?;
+
+            let offsets: HashMap<i32, i64> = py
+                .detach(|| {
+                    TOKIO_RUNTIME.block_on(async {
+                        self.admin
+                            .list_partition_offsets(
+                                table_path,
+                                partition_name,
+                                &bucket_ids,
+                                OffsetSpec::Latest,
+                            )
+                            .await
+                    })
+                })
+                .map_err(|e| {
+                    FlussError::new_err(format!(
+                        "Failed to list offsets for partition {partition_name}: {e}"
+                    ))
+                })?;
+
+            for (bucket_id, offset) in offsets {
+                if offset > 0 {
+                    let tb = fcore::metadata::TableBucket::new_with_partition(
+                        table_id,
+                        Some(partition_id),
+                        bucket_id,
+                    );
+                    result.insert(tb, offset);
+                }
+            }
         }
+
+        Ok(result)
+    }
+
+    /// Poll the batch scanner until every bucket in `stopping_offsets` has been read up to
+    /// (but excluding) its stop offset, then combine the collected batches into one table.
+    /// Pending Python signals are checked between polls so Ctrl-C can interrupt the wait.
+    fn poll_until_offsets(
+        &self,
+        py: Python,
+        mut stopping_offsets: HashMap<fcore::metadata::TableBucket, i64>,
+    ) -> PyResult<Py<PyAny>> {
+        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
+            FlussError::new_err("Batch-based scanner required for this operation")
+        })?;
+        let mut all_batches = Vec::new();
+
+        while !stopping_offsets.is_empty() {
+            let scan_batches = py
+                .detach(|| {
+                    TOKIO_RUNTIME
+                        .block_on(async { inner_batch.poll(Duration::from_millis(500)).await })
+                })
+                .map_err(|e| FlussError::new_err(format!("Failed to poll: {e}")))?;
+
+            // The GIL is held again here: surface pending signals (e.g. KeyboardInterrupt)
+            // so a wait for data that never arrives can be interrupted from Python.
+            py.check_signals()?;
+
+            for scan_batch in scan_batches {
+                let table_bucket = scan_batch.bucket().clone();
+                // Batches for buckets that are not (or no longer) tracked are ignored
+                let Some(&stop_at) = stopping_offsets.get(&table_bucket) else {
+                    continue;
+                };
+
+                let base_offset = scan_batch.base_offset();
+                let last_offset = scan_batch.last_offset();
+
+                // If the batch starts at or after the stop_at offset, the bucket is exhausted
+                if base_offset >= stop_at {
+                    stopping_offsets.remove(&table_bucket);
+                    continue;
+                }
+
+                let batch = if last_offset >= stop_at {
+                    // Slice batch to keep only records where offset < stop_at
+                    let num_to_keep = (stop_at - base_offset) as usize;
+                    let b = scan_batch.into_batch();
+                    let limit = num_to_keep.min(b.num_rows());
+                    b.slice(0, limit)
+                } else {
+                    scan_batch.into_batch()
+                };
+                all_batches.push(Arc::new(batch));
+
+                // stop_at is exclusive, so reaching stop_at - 1 completes this bucket
+                if last_offset >= stop_at - 1 {
+                    stopping_offsets.remove(&table_bucket);
+                }
+            }
+        }
+
+        Utils::combine_batches_to_table(py, all_batches)
     }
 }
 
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index ef68fb4dd6..d50f19e02c 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -514,6 +514,16 @@ impl RecordBatchLogScanner {
             .subscribe_partition(partition_id, bucket, offset)
             .await
     }
+
+    /// Returns the `is_partitioned_table` flag held by the underlying scanner
+    pub fn is_partitioned(&self) -> bool {
+        self.inner.is_partitioned_table
+    }
+
+    /// Returns every subscribed bucket paired with its current offset, as reported by the scanner's `log_scanner_status`
+    pub fn get_subscribed_buckets(&self) -> Vec<(TableBucket, i64)> {
+        self.inner.log_scanner_status.get_all_subscriptions()
+    }
 }
 
 struct LogFetcher {
@@ -1512,6 +1522,16 @@ impl LogScannerStatus {
         result
     }
 
+    /// Snapshot every subscribed bucket together with its current offset
+    pub fn get_all_subscriptions(&self) -> Vec<(TableBucket, i64)> {
+        let mut subscriptions = Vec::new();
+        // The read guard is a temporary that lives only for this traversal.
+        self.bucket_status_map
+            .read()
+            .for_each(|bucket, status| subscriptions.push((bucket.clone(), status.offset())));
+        subscriptions
+    }
+
     /// Helper to get bucket status
     fn get_status(&self, table_bucket: &TableBucket) -> Option<Arc<BucketScanStatus>> {
         let map = self.bucket_status_map.read();

From 28cd8b0c18906ff97d840145674309e87d000c95 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 6 Feb 2026 09:36:07 +0800
Subject: [PATCH 114/287] feat: support unsubscribe partition (#257)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |  1 +
 fluss-rust/bindings/cpp/src/lib.rs            | 24 ++++++++
 fluss-rust/bindings/cpp/src/table.cpp         |  9 +++
 .../crates/fluss/src/client/table/scanner.rs  | 29 ++++++++++
 .../fluss/tests/integration/log_table.rs      | 58 +++++++++++++++++++
 5 files changed, 121 insertions(+)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 901b90cae4..3ff9a26c82 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -564,6 +564,7 @@ class LogScanner {
     Result Subscribe(int32_t bucket_id, int64_t start_offset);
     Result Subscribe(const std::vector<BucketSubscription>& bucket_offsets);
     Result SubscribePartition(int64_t partition_id, int32_t bucket_id, int64_t start_offset);
+    Result UnsubscribePartition(int64_t partition_id, int32_t bucket_id);
     Result Poll(int64_t timeout_ms, ScanRecords& out);
     Result PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out);
 
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index b8348654dd..d6e3a9a66e 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -255,6 +255,8 @@ mod ffi {
             bucket_id: i32,
             start_offset: i64,
         ) -> FfiResult;
+        fn unsubscribe_partition(self: &LogScanner, partition_id: i64, bucket_id: i32)
+        -> FfiResult;
         fn poll(self: &LogScanner, timeout_ms: i64) -> FfiScanRecordsResult;
         fn poll_record_batch(self: &LogScanner, timeout_ms: i64) -> FfiArrowRecordBatchesResult;
         fn free_arrow_ffi_structures(array_ptr: usize, schema_ptr: usize);
@@ -825,6 +827,28 @@ impl LogScanner {
         self.do_subscribe(Some(partition_id), bucket_id, start_offset)
     }
 
+    fn unsubscribe_partition(&self, partition_id: PartitionId, bucket_id: i32) -> ffi::FfiResult {
+        if let Some(ref inner) = self.inner {
+            match RUNTIME
+                .block_on(async { inner.unsubscribe_partition(partition_id, bucket_id).await })
+            {
+                Ok(_) => ok_result(),
+                Err(e) => err_result(1, e.to_string()),
+            }
+        } else if let Some(ref inner_batch) = self.inner_batch {
+            match RUNTIME.block_on(async {
+                inner_batch
+                    .unsubscribe_partition(partition_id, bucket_id)
+                    .await
+            }) {
+                Ok(_) => ok_result(),
+                Err(e) => err_result(1, e.to_string()),
+            }
+        } else {
+            err_result(1, "LogScanner not initialized".to_string())
+        }
+    }
+
     fn poll(&self, timeout_ms: i64) -> ffi::FfiScanRecordsResult {
         if let Some(ref inner) = self.inner {
             let timeout = Duration::from_millis(timeout_ms as u64);
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index ab26038911..efb762bd66 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -264,6 +264,15 @@ Result LogScanner::SubscribePartition(int64_t partition_id, int32_t bucket_id, i
     return utils::from_ffi_result(ffi_result);
 }
 
+Result LogScanner::UnsubscribePartition(int64_t partition_id, int32_t bucket_id) {
+    if (!Available()) {
+        return utils::make_error(1, "LogScanner not available");
+    }
+
+    auto ffi_result = scanner_->unsubscribe_partition(partition_id, bucket_id);
+    return utils::from_ffi_result(ffi_result);
+}
+
 Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
     if (!Available()) {
         return utils::make_error(1, "LogScanner not available");
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index d50f19e02c..26f54da8fb 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -409,6 +409,19 @@ impl LogScannerInner {
         Ok(())
     }
 
+    async fn unsubscribe_partition(&self, partition_id: PartitionId, bucket: i32) -> Result<()> {
+        if !self.is_partitioned_table {
+            return Err(Error::UnsupportedOperation {
+                message: "Can't unsubscribe a partition for a non-partitioned table.".to_string(),
+            });
+        }
+        let table_bucket =
+            TableBucket::new_with_partition(self.table_id, Some(partition_id), bucket);
+        self.log_scanner_status
+            .unassign_scan_buckets(from_ref(&table_bucket));
+        Ok(())
+    }
+
     async fn poll_for_fetches(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
         let result = self.log_fetcher.collect_fetches()?;
         if !result.is_empty() {
@@ -487,6 +500,14 @@ impl LogScanner {
             .subscribe_partition(partition_id, bucket, offset)
             .await
     }
+
+    pub async fn unsubscribe_partition(
+        &self,
+        partition_id: PartitionId,
+        bucket: i32,
+    ) -> Result<()> {
+        self.inner.unsubscribe_partition(partition_id, bucket).await
+    }
 }
 
 // Implementation for RecordBatchLogScanner (batches mode)
@@ -524,6 +545,14 @@ impl RecordBatchLogScanner {
     pub fn get_subscribed_buckets(&self) -> Vec<(TableBucket, i64)> {
         self.inner.log_scanner_status.get_all_subscriptions()
     }
+
+    pub async fn unsubscribe_partition(
+        &self,
+        partition_id: PartitionId,
+        bucket: i32,
+    ) -> Result<()> {
+        self.inner.unsubscribe_partition(partition_id, bucket).await
+    }
 }
 
 struct LogFetcher {
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 3f7dd6e222..493bb34441 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -1160,6 +1160,64 @@ mod table_test {
             "Data mismatch between sent and received"
         );
 
+        // Test unsubscribe_partition: after unsubscribing from one partition,
+        // data from that partition should no longer be read.
+        let log_scanner_unsub = table
+            .new_scan()
+            .create_log_scanner()
+            .expect("Failed to create log scanner for unsubscribe test");
+        let partition_infos = admin
+            .list_partition_infos(&table_path)
+            .await
+            .expect("Failed to list partition infos");
+        let eu_partition_id = partition_infos
+            .iter()
+            .find(|p| p.get_partition_name() == "EU")
+            .map(|p| p.get_partition_id())
+            .expect("EU partition should exist");
+        for info in &partition_infos {
+            log_scanner_unsub
+                .subscribe_partition(info.get_partition_id(), 0, 0)
+                .await
+                .expect("Failed to subscribe to partition");
+        }
+        log_scanner_unsub
+            .unsubscribe_partition(eu_partition_id, 0)
+            .await
+            .expect("Failed to unsubscribe from EU partition");
+
+        let mut records_after_unsubscribe: Vec<(i32, String, i64)> = Vec::new();
+        let unsub_deadline = std::time::Instant::now() + Duration::from_secs(5);
+        while records_after_unsubscribe.len() < 4 && std::time::Instant::now() < unsub_deadline {
+            let records = log_scanner_unsub
+                .poll(Duration::from_millis(300))
+                .await
+                .expect("Failed to poll after unsubscribe");
+            for rec in records {
+                let row = rec.row();
+                records_after_unsubscribe.push((
+                    row.get_int(0),
+                    row.get_string(1).to_string(),
+                    row.get_long(2),
+                ));
+            }
+        }
+
+        assert!(
+            records_after_unsubscribe.iter().all(|r| r.1 == "US"),
+            "After unsubscribe_partition(EU), only US partition data should be read; got regions: {:?}",
+            records_after_unsubscribe
+                .iter()
+                .map(|r| r.1.as_str())
+                .collect::<Vec<_>>()
+        );
+        assert_eq!(
+            records_after_unsubscribe.len(),
+            4,
+            "Should receive exactly 4 US records (ids 1,2,5,6); got {}",
+            records_after_unsubscribe.len()
+        );
+
         admin
             .drop_table(&table_path, false)
             .await

From 024c1d146c8de338bf1d1dff05db12475eb8d401 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 6 Feb 2026 12:08:20 +0800
Subject: [PATCH 115/287] feat: introduce list partitions in cpp binding (#260)

---
 fluss-rust/bindings/cpp/include/fluss.hpp |  8 +++++
 fluss-rust/bindings/cpp/src/admin.cpp     | 21 +++++++++++
 fluss-rust/bindings/cpp/src/lib.rs        | 44 +++++++++++++++++++++++
 3 files changed, 73 insertions(+)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 3ff9a26c82..9461f68fa6 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -403,6 +403,11 @@ struct LakeSnapshot {
     std::vector<BucketOffset> bucket_offsets;
 };
 
+struct PartitionInfo {
+    int64_t partition_id;
+    std::string partition_name;
+};
+
 class AppendWriter;
 class LogScanner;
 class Admin;
@@ -464,6 +469,9 @@ class Admin {
                               const OffsetQuery& offset_query,
                               std::unordered_map<int32_t, int64_t>& out);
 
+    Result ListPartitionInfos(const TablePath& table_path,
+                             std::vector<PartitionInfo>& out);
+
 private:
     Result DoListOffsets(const TablePath& table_path,
                        const std::vector<int32_t>& bucket_ids,
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index e4106146ee..d19e444cd2 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -162,4 +162,25 @@ Result Admin::ListPartitionOffsets(const TablePath& table_path,
     return DoListOffsets(table_path, bucket_ids, offset_query, out, &partition_name);
 }
 
+Result Admin::ListPartitionInfos(const TablePath& table_path,
+                                 std::vector<PartitionInfo>& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_path = utils::to_ffi_table_path(table_path);
+    auto ffi_result = admin_->list_partition_infos(ffi_path);
+
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out.clear();
+        out.reserve(ffi_result.partition_infos.size());
+        for (const auto& pi : ffi_result.partition_infos) {
+            out.push_back({pi.partition_id, std::string(pi.partition_name)});
+        }
+    }
+
+    return result;
+}
+
 }  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index d6e3a9a66e..afdb7c0c1d 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -175,6 +175,16 @@ mod ffi {
         lake_snapshot: FfiLakeSnapshot,
     }
 
+    struct FfiPartitionInfo {
+        partition_id: i64,
+        partition_name: String,
+    }
+
+    struct FfiListPartitionInfosResult {
+        result: FfiResult,
+        partition_infos: Vec<FfiPartitionInfo>,
+    }
+
     extern "Rust" {
         type Connection;
         type Admin;
@@ -219,6 +229,10 @@ mod ffi {
             bucket_ids: Vec<i32>,
             offset_query: &FfiOffsetQuery,
         ) -> FfiListOffsetsResult;
+        fn list_partition_infos(
+            self: &Admin,
+            table_path: &FfiTablePath,
+        ) -> FfiListPartitionInfosResult;
 
         // Table
         unsafe fn delete_table(table: *mut Table);
@@ -551,6 +565,36 @@ impl Admin {
     ) -> ffi::FfiListOffsetsResult {
         self.do_list_offsets(table_path, Some(&partition_name), bucket_ids, offset_query)
     }
+
+    fn list_partition_infos(
+        &self,
+        table_path: &ffi::FfiTablePath,
+    ) -> ffi::FfiListPartitionInfosResult {
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+        let result = RUNTIME.block_on(async { self.inner.list_partition_infos(&path).await });
+        match result {
+            Ok(infos) => {
+                let partition_infos: Vec<ffi::FfiPartitionInfo> = infos
+                    .into_iter()
+                    .map(|info| ffi::FfiPartitionInfo {
+                        partition_id: info.get_partition_id(),
+                        partition_name: info.get_partition_name(),
+                    })
+                    .collect();
+                ffi::FfiListPartitionInfosResult {
+                    result: ok_result(),
+                    partition_infos,
+                }
+            }
+            Err(e) => ffi::FfiListPartitionInfosResult {
+                result: err_result(1, e.to_string()),
+                partition_infos: vec![],
+            },
+        }
+    }
 }
 
 // Table implementation

From 40f13b1828ffb8ff657b0dd94ade953982740749 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 7 Feb 2026 02:01:49 +0000
Subject: [PATCH 116/287] chore: python binding cleanup and bit of refactor
 (#264)

---
 fluss-rust/bindings/python/src/table.rs | 207 +++++++++---------------
 1 file changed, 78 insertions(+), 129 deletions(-)

diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index c285f25c3a..7184c8d2ad 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -265,34 +265,29 @@ impl TableScan {
             let (projected_schema, projected_row_type) =
                 calculate_projected_types(&table_info, projection_indices)?;
 
-            let py_scanner = match scanner_type {
+            let scanner_kind = match scanner_type {
                 ScannerType::Record => {
-                    let rust_scanner = table_scan.create_log_scanner().map_err(|e| {
+                    let s = table_scan.create_log_scanner().map_err(|e| {
                         FlussError::new_err(format!("Failed to create log scanner: {e}"))
                     })?;
-                    LogScanner::from_log_scanner(
-                        rust_scanner,
-                        admin,
-                        table_info,
-                        projected_schema,
-                        projected_row_type,
-                    )
+                    ScannerKind::Record(s)
                 }
                 ScannerType::Batch => {
-                    let rust_scanner =
-                        table_scan.create_record_batch_log_scanner().map_err(|e| {
-                            FlussError::new_err(format!("Failed to create batch scanner: {e}"))
-                        })?;
-                    LogScanner::from_batch_scanner(
-                        rust_scanner,
-                        admin,
-                        table_info,
-                        projected_schema,
-                        projected_row_type,
-                    )
+                    let s = table_scan.create_record_batch_log_scanner().map_err(|e| {
+                        FlussError::new_err(format!("Failed to create batch scanner: {e}"))
+                    })?;
+                    ScannerKind::Batch(s)
                 }
             };
 
+            let py_scanner = LogScanner::new(
+                scanner_kind,
+                admin,
+                table_info,
+                projected_schema,
+                projected_row_type,
+            );
+
             Python::attach(|py| Py::new(py, py_scanner))
         })
     }
@@ -1555,6 +1550,44 @@ fn get_type_name(value: &Bound<PyAny>) -> String {
         .unwrap_or_else(|_| "unknown".to_string())
 }
 
+/// Wraps the two scanner variants so we never have an impossible state
+/// (both None or both Some).
+enum ScannerKind {
+    Record(fcore::client::LogScanner),
+    Batch(fcore::client::RecordBatchLogScanner),
+}
+
+impl ScannerKind {
+    fn as_record(&self) -> PyResult<&fcore::client::LogScanner> {
+        match self {
+            Self::Record(s) => Ok(s),
+            Self::Batch(_) => Err(FlussError::new_err(
+                "poll() requires a record-based scanner. Use new_scan().create_log_scanner().",
+            )),
+        }
+    }
+
+    fn as_batch(&self) -> PyResult<&fcore::client::RecordBatchLogScanner> {
+        match self {
+            Self::Batch(s) => Ok(s),
+            Self::Record(_) => Err(FlussError::new_err(
+                "This method requires a batch-based scanner. Use new_scan().create_batch_scanner().",
+            )),
+        }
+    }
+}
+
+/// Dispatch a method call to whichever scanner variant is active.
+/// Both `LogScanner` and `RecordBatchLogScanner` share the same subscribe interface.
+macro_rules! with_scanner {
+    ($scanner:expr, $method:ident($($arg:expr),*)) => {
+        match $scanner {
+            ScannerKind::Record(s) => s.$method($($arg),*).await,
+            ScannerKind::Batch(s) => s.$method($($arg),*).await,
+        }
+    };
+}
+
 /// Scanner for reading log data from a Fluss table.
 ///
 /// This scanner supports two modes:
@@ -1562,10 +1595,7 @@ fn get_type_name(value: &Bound<PyAny>) -> String {
 /// - Batch-based scanning via `poll_arrow()` / `poll_batches()` - returns Arrow batches
 #[pyclass]
 pub struct LogScanner {
-    /// Record-based scanner for poll()
-    inner: Option<fcore::client::LogScanner>,
-    /// Batch-based scanner for poll_arrow/poll_batches
-    inner_batch: Option<fcore::client::RecordBatchLogScanner>,
+    scanner: ScannerKind,
     admin: fcore::client::FlussAdmin,
     table_info: fcore::metadata::TableInfo,
     /// The projected Arrow schema to use for empty table creation
@@ -1586,19 +1616,8 @@ impl LogScanner {
     fn subscribe(&self, py: Python, bucket_id: i32, start_offset: i64) -> PyResult<()> {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
-                if let Some(ref inner) = self.inner {
-                    inner
-                        .subscribe(bucket_id, start_offset)
-                        .await
-                        .map_err(|e| FlussError::new_err(format!("Failed to subscribe: {e}")))
-                } else if let Some(ref inner_batch) = self.inner_batch {
-                    inner_batch
-                        .subscribe(bucket_id, start_offset)
-                        .await
-                        .map_err(|e| FlussError::new_err(format!("Failed to subscribe: {e}")))
-                } else {
-                    Err(FlussError::new_err("No scanner available"))
-                }
+                with_scanner!(&self.scanner, subscribe(bucket_id, start_offset))
+                    .map_err(|e| FlussError::new_err(e.to_string()))
             })
         })
     }
@@ -1610,19 +1629,8 @@ impl LogScanner {
     fn subscribe_buckets(&self, py: Python, bucket_offsets: HashMap<i32, i64>) -> PyResult<()> {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
-                if let Some(ref inner) = self.inner {
-                    inner
-                        .subscribe_buckets(&bucket_offsets)
-                        .await
-                        .map_err(|e| FlussError::new_err(format!("Failed to subscribe batch: {e}")))
-                } else if let Some(ref inner_batch) = self.inner_batch {
-                    inner_batch
-                        .subscribe_buckets(&bucket_offsets)
-                        .await
-                        .map_err(|e| FlussError::new_err(format!("Failed to subscribe batch: {e}")))
-                } else {
-                    Err(FlussError::new_err("No scanner available"))
-                }
+                with_scanner!(&self.scanner, subscribe_buckets(&bucket_offsets))
+                    .map_err(|e| FlussError::new_err(e.to_string()))
             })
         })
     }
@@ -1642,23 +1650,11 @@ impl LogScanner {
     ) -> PyResult<()> {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
-                if let Some(ref inner) = self.inner {
-                    inner
-                        .subscribe_partition(partition_id, bucket_id, start_offset)
-                        .await
-                        .map_err(|e| {
-                            FlussError::new_err(format!("Failed to subscribe partition: {e}"))
-                        })
-                } else if let Some(ref inner_batch) = self.inner_batch {
-                    inner_batch
-                        .subscribe_partition(partition_id, bucket_id, start_offset)
-                        .await
-                        .map_err(|e| {
-                            FlussError::new_err(format!("Failed to subscribe partition: {e}"))
-                        })
-                } else {
-                    Err(FlussError::new_err("No scanner available"))
-                }
+                with_scanner!(
+                    &self.scanner,
+                    subscribe_partition(partition_id, bucket_id, start_offset)
+                )
+                .map_err(|e| FlussError::new_err(e.to_string()))
             })
         })
     }
@@ -1677,12 +1673,7 @@ impl LogScanner {
     ///     - Returns an empty list if no records are available
     ///     - When timeout expires, returns an empty list (NOT an error)
     fn poll(&self, py: Python, timeout_ms: i64) -> PyResult<Vec<ScanRecord>> {
-        let inner = self.inner.as_ref().ok_or_else(|| {
-            FlussError::new_err(
-                "Record-based scanner not available. Use new_scan().create_log_scanner() to create a scanner \
-                 that supports poll().",
-            )
-        })?;
+        let scanner = self.scanner.as_record()?;
 
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
@@ -1692,7 +1683,7 @@ impl LogScanner {
 
         let timeout = Duration::from_millis(timeout_ms as u64);
         let scan_records = py
-            .detach(|| TOKIO_RUNTIME.block_on(async { inner.poll(timeout).await }))
+            .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
             .map_err(|e| FlussError::new_err(e.to_string()))?;
 
         // Convert ScanRecords to Python ScanRecord list
@@ -1724,12 +1715,7 @@ impl LogScanner {
     ///     - Returns an empty list if no batches are available
     ///     - When timeout expires, returns an empty list (NOT an error)
     fn poll_batches(&self, py: Python, timeout_ms: i64) -> PyResult<Vec<RecordBatch>> {
-        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
-            FlussError::new_err(
-                "Batch-based scanner not available. Use new_scan().create_batch_scanner() to create a scanner \
-                 that supports poll_batches().",
-            )
-        })?;
+        let scanner = self.scanner.as_batch()?;
 
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
@@ -1739,7 +1725,7 @@ impl LogScanner {
 
         let timeout = Duration::from_millis(timeout_ms as u64);
         let scan_batches = py
-            .detach(|| TOKIO_RUNTIME.block_on(async { inner_batch.poll(timeout).await }))
+            .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
             .map_err(|e| FlussError::new_err(e.to_string()))?;
 
         // Convert ScanBatch to RecordBatch with metadata
@@ -1764,12 +1750,7 @@ impl LogScanner {
     ///     - Returns an empty table (with correct schema) if no records are available
     ///     - When timeout expires, returns an empty table (NOT an error)
     fn poll_arrow(&self, py: Python, timeout_ms: i64) -> PyResult<Py<PyAny>> {
-        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
-            FlussError::new_err(
-                "Batch-based scanner not available. Use new_scan().create_batch_scanner() to create a scanner \
-                 that supports poll_arrow().",
-            )
-        })?;
+        let scanner = self.scanner.as_batch()?;
 
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
@@ -1779,7 +1760,7 @@ impl LogScanner {
 
         let timeout = Duration::from_millis(timeout_ms as u64);
         let scan_batches = py
-            .detach(|| TOKIO_RUNTIME.block_on(async { inner_batch.poll(timeout).await }))
+            .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
             .map_err(|e| FlussError::new_err(e.to_string()))?;
 
         // Convert ScanBatch to Arrow batches
@@ -1822,14 +1803,8 @@ impl LogScanner {
     /// Returns:
     ///     PyArrow Table containing all data from subscribed buckets
     fn to_arrow(&self, py: Python) -> PyResult<Py<PyAny>> {
-        // 1. Get subscribed buckets from scanner (requires batch scanner for get_subscribed_buckets)
-        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
-            FlussError::new_err(
-                "Batch-based scanner not available. Use new_scan().create_batch_scanner() to create a scanner \
-                 that supports to_arrow().",
-            )
-        })?;
-        let subscribed = inner_batch.get_subscribed_buckets();
+        let scanner = self.scanner.as_batch()?;
+        let subscribed = scanner.get_subscribed_buckets();
         if subscribed.is_empty() {
             return Err(FlussError::new_err(
                 "No buckets subscribed. Call subscribe(), subscribe_buckets(), or subscribe_partition() first.",
@@ -1866,36 +1841,15 @@ impl LogScanner {
 }
 
 impl LogScanner {
-    /// Create LogScanner for record-based scanning
-    pub fn from_log_scanner(
-        inner_scanner: fcore::client::LogScanner,
-        admin: fcore::client::FlussAdmin,
-        table_info: fcore::metadata::TableInfo,
-        projected_schema: SchemaRef,
-        projected_row_type: fcore::metadata::RowType,
-    ) -> Self {
-        Self {
-            inner: Some(inner_scanner),
-            inner_batch: None,
-            admin,
-            table_info,
-            projected_schema,
-            projected_row_type,
-            partition_name_cache: std::sync::RwLock::new(None),
-        }
-    }
-
-    /// Create LogScanner for batch-based scanning
-    pub fn from_batch_scanner(
-        inner_batch_scanner: fcore::client::RecordBatchLogScanner,
+    fn new(
+        scanner: ScannerKind,
         admin: fcore::client::FlussAdmin,
         table_info: fcore::metadata::TableInfo,
         projected_schema: SchemaRef,
         projected_row_type: fcore::metadata::RowType,
     ) -> Self {
         Self {
-            inner: None,
-            inner_batch: Some(inner_batch_scanner),
+            scanner,
             admin,
             table_info,
             projected_schema,
@@ -1946,10 +1900,8 @@ impl LogScanner {
         py: Python,
         subscribed: &[(fcore::metadata::TableBucket, i64)],
     ) -> PyResult<HashMap<fcore::metadata::TableBucket, i64>> {
-        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
-            FlussError::new_err("Batch-based scanner required for this operation")
-        })?;
-        let is_partitioned = inner_batch.is_partitioned();
+        let scanner = self.scanner.as_batch()?;
+        let is_partitioned = scanner.is_partitioned();
         let table_path = &self.table_info.table_path;
 
         if !is_partitioned {
@@ -2055,16 +2007,13 @@ impl LogScanner {
         py: Python,
         mut stopping_offsets: HashMap<fcore::metadata::TableBucket, i64>,
     ) -> PyResult<Py<PyAny>> {
-        let inner_batch = self.inner_batch.as_ref().ok_or_else(|| {
-            FlussError::new_err("Batch-based scanner required for this operation")
-        })?;
+        let scanner = self.scanner.as_batch()?;
         let mut all_batches = Vec::new();
 
         while !stopping_offsets.is_empty() {
             let scan_batches = py
                 .detach(|| {
-                    TOKIO_RUNTIME
-                        .block_on(async { inner_batch.poll(Duration::from_millis(500)).await })
+                    TOKIO_RUNTIME.block_on(async { scanner.poll(Duration::from_millis(500)).await })
                 })
                 .map_err(|e| FlussError::new_err(format!("Failed to poll: {e}")))?;
 

From 5a334bcc07beacb4d933ac0d66722bffeb74158d Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 7 Feb 2026 02:17:35 +0000
Subject: [PATCH 117/287] chore: Fire-and-forget behaviour for efficient
 batching (#258)

---
 fluss-rust/bindings/cpp/examples/example.cpp  | 16 +++++-
 fluss-rust/bindings/cpp/include/fluss.hpp     | 27 +++++++++
 fluss-rust/bindings/cpp/src/lib.rs            | 37 +++++++++---
 fluss-rust/bindings/cpp/src/table.cpp         | 57 ++++++++++++++++++-
 fluss-rust/bindings/python/example/example.py | 39 +++++++------
 fluss-rust/bindings/python/src/table.rs       | 54 ++++++++++++++----
 fluss-rust/bindings/python/src/upsert.rs      | 47 +++++++++++----
 .../crates/examples/src/example_kv_table.rs   |  5 +-
 .../src/example_partitioned_kv_table.rs       |  5 +-
 .../crates/examples/src/example_table.rs      |  8 +--
 .../crates/fluss/src/client/table/append.rs   | 30 +++++++---
 .../crates/fluss/src/client/table/upsert.rs   | 30 ++++++----
 .../crates/fluss/src/client/write/mod.rs      | 41 +++++++++++++
 .../fluss/tests/integration/kv_table.rs       | 53 +++++++++++------
 .../fluss/tests/integration/log_table.rs      |  4 ++
 15 files changed, 360 insertions(+), 93 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 7022cad1e6..10266c7522 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -91,6 +91,7 @@ int main() {
         {3, "Charlie", 92.1f, 35},
     };
 
+    // Fire-and-forget: queue rows, flush at end
     for (const auto& r : rows) {
         fluss::GenericRow row;
         row.SetInt32(0, r.id);
@@ -100,7 +101,20 @@ int main() {
         check("append", writer.Append(row));
     }
     check("flush", writer.Flush());
-    std::cout << "Wrote " << rows.size() << " rows" << std::endl;
+    std::cout << "Wrote " << rows.size() << " rows (fire-and-forget + flush)" << std::endl;
+
+    // Per-record acknowledgment
+    {
+        fluss::GenericRow row;
+        row.SetInt32(0, 100);
+        row.SetString(1, "AckTest");
+        row.SetFloat32(2, 99.9f);
+        row.SetInt32(3, 42);
+        fluss::WriteResult wr;
+        check("append", writer.Append(row, wr));
+        check("wait", wr.Wait());
+        std::cout << "Row acknowledged by server" << std::endl;
+    }
 
     // 6) Scan
     fluss::LogScanner scanner;
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 9461f68fa6..6c20717565 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -37,6 +37,7 @@ namespace ffi {
     struct Admin;
     struct Table;
     struct AppendWriter;
+    struct WriteResult;
     struct LogScanner;
 }  // namespace ffi
 
@@ -409,6 +410,7 @@ struct PartitionInfo {
 };
 
 class AppendWriter;
+class WriteResult;
 class LogScanner;
 class Admin;
 class Table;
@@ -534,6 +536,30 @@ class TableScan {
     std::vector<size_t> projection_;
 };
 
+class WriteResult {
+public:
+    WriteResult() noexcept;
+    ~WriteResult() noexcept;
+
+    WriteResult(const WriteResult&) = delete;
+    WriteResult& operator=(const WriteResult&) = delete;
+    WriteResult(WriteResult&& other) noexcept;
+    WriteResult& operator=(WriteResult&& other) noexcept;
+
+    bool Available() const;
+
+    /// Wait for server acknowledgment of the write.
+    /// For fire-and-forget, simply let the WriteResult go out of scope.
+    Result Wait();
+
+private:
+    friend class AppendWriter;
+    WriteResult(ffi::WriteResult* inner) noexcept;
+
+    void Destroy() noexcept;
+    ffi::WriteResult* inner_{nullptr};
+};
+
 class AppendWriter {
 public:
     AppendWriter() noexcept;
@@ -547,6 +573,7 @@ class AppendWriter {
     bool Available() const;
 
     Result Append(const GenericRow& row);
+    Result Append(const GenericRow& row, WriteResult& out);
     Result Flush();
 
 private:
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index afdb7c0c1d..7944c100a2 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -190,6 +190,7 @@ mod ffi {
         type Admin;
         type Table;
         type AppendWriter;
+        type WriteResult;
         type LogScanner;
 
         // Connection
@@ -253,9 +254,12 @@ mod ffi {
 
         // AppendWriter
         unsafe fn delete_append_writer(writer: *mut AppendWriter);
-        fn append(self: &mut AppendWriter, row: &FfiGenericRow) -> FfiResult;
+        fn append(self: &mut AppendWriter, row: &FfiGenericRow) -> Result<Box<WriteResult>>;
         fn flush(self: &mut AppendWriter) -> FfiResult;
 
+        // WriteResult — dropped automatically via rust::Box, or call wait() for ack
+        fn wait(self: &mut WriteResult) -> FfiResult;
+
         // LogScanner
         unsafe fn delete_log_scanner(scanner: *mut LogScanner);
         fn subscribe(self: &LogScanner, bucket_id: i32, start_offset: i64) -> FfiResult;
@@ -299,6 +303,10 @@ pub struct AppendWriter {
     inner: fcore::client::AppendWriter,
 }
 
+pub struct WriteResult {
+    inner: Option<fcore::client::WriteResultFuture>,
+}
+
 pub struct LogScanner {
     inner: Option<fcore::client::LogScanner>,
     inner_batch: Option<fcore::client::RecordBatchLogScanner>,
@@ -750,15 +758,16 @@ unsafe fn delete_append_writer(writer: *mut AppendWriter) {
 }
 
 impl AppendWriter {
-    fn append(&mut self, row: &ffi::FfiGenericRow) -> ffi::FfiResult {
+    fn append(&mut self, row: &ffi::FfiGenericRow) -> Result<Box<WriteResult>, String> {
         let generic_row = types::ffi_row_to_core(row);
 
-        let result = RUNTIME.block_on(async { self.inner.append(&generic_row).await });
+        let result_future = RUNTIME
+            .block_on(async { self.inner.append(&generic_row).await })
+            .map_err(|e| format!("Failed to append: {e}"))?;
 
-        match result {
-            Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
-        }
+        Ok(Box::new(WriteResult {
+            inner: Some(result_future),
+        }))
     }
 
     fn flush(&mut self) -> ffi::FfiResult {
@@ -771,6 +780,20 @@ impl AppendWriter {
     }
 }
 
+impl WriteResult {
+    /// Blocks until the pending write completes and reports its outcome.
+    ///
+    /// The future is taken out of `inner` on the first call, so later calls
+    /// find nothing to wait on and report success.
+    fn wait(&mut self) -> ffi::FfiResult {
+        let outcome = self.inner.take().map(|pending| RUNTIME.block_on(pending));
+        match outcome {
+            None | Some(Ok(_)) => ok_result(),
+            Some(Err(e)) => err_result(1, e.to_string()),
+        }
+    }
+}
+
 // LogScanner implementation
 unsafe fn delete_log_scanner(scanner: *mut LogScanner) {
     if !scanner.is_null() {
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index efb762bd66..24be8d45dd 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -152,6 +152,52 @@ bool Table::HasPrimaryKey() const {
     return table_->has_primary_key();
 }
 
+// WriteResult implementation
+
+// A default-constructed handle is empty (inner_ is nullptr).
+WriteResult::WriteResult() noexcept = default;
+
+// Adopts a raw pointer; the handle becomes responsible for releasing it.
+WriteResult::WriteResult(ffi::WriteResult* inner) noexcept : inner_(inner) {}
+
+WriteResult::~WriteResult() noexcept { Destroy(); }
+
+// Releases the Rust object held by this handle, if any; safe to call repeatedly.
+void WriteResult::Destroy() noexcept {
+    if (inner_) {
+        // Reconstruct the rust::Box to let Rust drop the value
+        rust::Box<ffi::WriteResult>::from_raw(inner_);
+        inner_ = nullptr;
+    }
+}
+
+// Move operations transfer the pointer and leave `other` empty.
+WriteResult::WriteResult(WriteResult&& other) noexcept : inner_(other.inner_) {
+    other.inner_ = nullptr;
+}
+
+WriteResult& WriteResult::operator=(WriteResult&& other) noexcept {
+    if (this != &other) {
+        Destroy();
+        inner_ = other.inner_;
+        other.inner_ = nullptr;
+    }
+    return *this;
+}
+
+bool WriteResult::Available() const { return inner_ != nullptr; }
+
+// Returns success right away for an empty handle; otherwise returns whatever
+// the Rust-side wait() reports.
+Result WriteResult::Wait() {
+    if (!Available()) {
+        return utils::make_ok();
+    }
+
+    auto ffi_result = inner_->wait();
+    return utils::from_ffi_result(ffi_result);
+}
+
 // AppendWriter implementation
 AppendWriter::AppendWriter() noexcept = default;
 
@@ -182,13 +221,31 @@ AppendWriter& AppendWriter::operator=(AppendWriter&& other) noexcept {
 bool AppendWriter::Available() const { return writer_ != nullptr; }
 
 Result AppendWriter::Append(const GenericRow& row) {
+    // Fire-and-forget: the temporary handle is dropped without waiting.
+    WriteResult wr;
+    return Append(row, wr);
+}
+
+// Queues `row` and stores the pending result in `out`. On failure `out` is
+// left untouched and the error is returned.
+Result AppendWriter::Append(const GenericRow& row, WriteResult& out) {
     if (!Available()) {
         return utils::make_error(1, "AppendWriter not available");
     }
 
-    auto ffi_row = utils::to_ffi_generic_row(row);
-    auto ffi_result = writer_->append(ffi_row);
-    return utils::from_ffi_result(ffi_result);
+    try {
+        auto ffi_row = utils::to_ffi_generic_row(row);
+        auto rust_box = writer_->append(ffi_row);
+        // Move-assign instead of overwriting inner_: a handle that `out` already
+        // holds (e.g. when one WriteResult is reused across calls) is released
+        // first rather than leaked.
+        out = WriteResult(rust_box.into_raw());
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
 }
 
 Result AppendWriter::Flush() {
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 8735038aa5..1cabaa5f23 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -417,11 +417,13 @@ async def main():
     print(f"Has primary key: {pk_table.has_primary_key()}")
 
     # --- Test Upsert ---
-    print("\n--- Testing Upsert ---")
+    print("\n--- Testing Upsert (fire-and-forget) ---")
     try:
         upsert_writer = pk_table.new_upsert()
         print(f"Created upsert writer: {upsert_writer}")
 
+        # Fire-and-forget: queue writes without waiting for individual acks.
+        # Records are batched internally for efficiency.
         await upsert_writer.upsert(
             {
                 "user_id": 1,
@@ -437,7 +439,7 @@ async def main():
                 "balance": Decimal("1234.56"),
             }
         )
-        print("Upserted user_id=1 (Alice)")
+        print("Queued user_id=1 (Alice)")
 
         await upsert_writer.upsert(
             {
@@ -452,7 +454,7 @@ async def main():
                 "balance": Decimal("5678.91"),
             }
         )
-        print("Upserted user_id=2 (Bob)")
+        print("Queued user_id=2 (Bob)")
 
         await upsert_writer.upsert(
             {
@@ -467,10 +469,17 @@ async def main():
                 "balance": Decimal("9876.54"),
             }
         )
-        print("Upserted user_id=3 (Charlie)")
+        print("Queued user_id=3 (Charlie)")
 
-        # Update an existing row (same PK, different values)
-        await upsert_writer.upsert(
+        # flush() waits for all queued writes to be acknowledged by the server
+        await upsert_writer.flush()
+        print("Flushed — all 3 rows acknowledged by server")
+
+        # Per-record acknowledgment: await the returned handle to block until
+        # the server confirms this specific write, useful when you need to
+        # read-after-write or verify critical updates.
+        print("\n--- Testing Upsert (per-record acknowledgment) ---")
+        ack = await upsert_writer.upsert(
             {
                 "user_id": 1,
                 "name": "Alice Updated",
@@ -485,11 +494,8 @@ async def main():
                 "balance": Decimal("2345.67"),
             }
         )
-        print("Updated user_id=1 (Alice -> Alice Updated)")
-
-        # Explicit flush to ensure all upserts are acknowledged
-        await upsert_writer.flush()
-        print("Flushed all upserts")
+        await ack  # wait for server acknowledgment before proceeding
+        print("Updated user_id=1 (Alice -> Alice Updated) — server acknowledged")
 
     except Exception as e:
         print(f"Error during upsert: {e}")
@@ -548,13 +554,10 @@ async def main():
     try:
         upsert_writer = pk_table.new_upsert()
 
-        # Delete only needs PK columns - much simpler API!
-        await upsert_writer.delete({"user_id": 3})
-        print("Deleted user_id=3")
-
-        # Explicit flush to ensure delete is acknowledged
-        await upsert_writer.flush()
-        print("Flushed delete")
+        # Per-record ack for delete — await the handle to confirm deletion
+        ack = await upsert_writer.delete({"user_id": 3})
+        await ack
+        print("Deleted user_id=3 — server acknowledged")
 
         lookuper = pk_table.new_lookup()
         result = await lookuper.lookup({"user_id": 3})
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 7184c8d2ad..e987d43d69 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -526,35 +526,73 @@ pub struct AppendWriter {
 
 #[pymethods]
 impl AppendWriter {
-    /// Write Arrow table data
+    /// Write Arrow table data (fire-and-forget, use flush() to ensure delivery)
+    ///
+    /// Every batch is handed to the writer before this method returns; the
+    /// per-batch acknowledgments are dropped.
     pub fn write_arrow(&self, py: Python, table: Py<PyAny>) -> PyResult<()> {
         // Convert Arrow Table to batches and write each batch
         let batches = table.call_method0(py, "to_batches")?;
         let batch_list: Vec<Py<PyAny>> = batches.extract(py)?;
 
         for batch in batch_list {
-            self.write_arrow_batch(py, batch)?;
+            let batch_bound = batch.bind(py);
+            let rust_batch: ArrowRecordBatch = FromPyArrow::from_pyarrow_bound(batch_bound)
+                .map_err(|e| FlussError::new_err(format!("Failed to convert RecordBatch: {e}")))?;
+            let inner = self.inner.clone();
+
+            // Queue the batch here rather than via write_arrow_batch(): that method
+            // now returns an awaitable whose append runs asynchronously, so dropping
+            // it could let a later flush() run before the batch was queued.
+            // The GIL is released while blocking; the ack future is discarded.
+            py.detach(|| {
+                TOKIO_RUNTIME.block_on(async { inner.append_arrow_batch(rust_batch).await })
+            })
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
         }
         Ok(())
     }
 
     /// Write Arrow batch data
-    pub fn write_arrow_batch(&self, py: Python, batch: Py<PyAny>) -> PyResult<()> {
+    ///
+    /// Returns:
+    ///     A coroutine that can be awaited for server acknowledgment,
+    ///     or ignored for fire-and-forget behavior.
+    pub fn write_arrow_batch<'py>(
+        &self,
+        py: Python<'py>,
+        batch: Py<PyAny>,
+    ) -> PyResult<Bound<'py, PyAny>> {
         // This shares the underlying Arrow buffers without copying data
         let batch_bound = batch.bind(py);
         let rust_batch: ArrowRecordBatch = FromPyArrow::from_pyarrow_bound(batch_bound)
             .map_err(|e| FlussError::new_err(format!("Failed to convert RecordBatch: {e}")))?;
 
         let inner = self.inner.clone();
-        // Release the GIL before blocking on async operation
-        let result = py.detach(|| {
-            TOKIO_RUNTIME.block_on(async { inner.append_arrow_batch(rust_batch).await })
-        });
 
-        result.map_err(|e| FlussError::new_err(e.to_string()))
+        future_into_py(py, async move {
+            let result_future = inner
+                .append_arrow_batch(rust_batch)
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+            Python::attach(|py| {
+                future_into_py(py, async move {
+                    result_future
+                        .await
+                        .map_err(|e| FlussError::new_err(e.to_string()))?;
+                    Ok(())
+                })
+                .map(|bound| bound.unbind())
+            })
+        })
     }
 
     /// Append a single row to the table
+    ///
+    /// Returns:
+    ///     A coroutine that can be awaited for server acknowledgment,
+    ///     or ignored for fire-and-forget behavior.
     pub fn append<'py>(
         &self,
         py: Python<'py>,
@@ -564,10 +588,20 @@ impl AppendWriter {
         let inner = self.inner.clone();
 
         future_into_py(py, async move {
-            inner
+            let result_future = inner
                 .append(&generic_row)
                 .await
-                .map_err(|e| FlussError::new_err(e.to_string()))
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+
+            Python::attach(|py| {
+                future_into_py(py, async move {
+                    result_future
+                        .await
+                        .map_err(|e| FlussError::new_err(e.to_string()))?;
+                    Ok(())
+                })
+                .map(|bound| bound.unbind())
+            })
         })
     }
 
diff --git a/fluss-rust/bindings/python/src/upsert.rs b/fluss-rust/bindings/python/src/upsert.rs
index 08b3597056..5c10dedc5a 100644
--- a/fluss-rust/bindings/python/src/upsert.rs
+++ b/fluss-rust/bindings/python/src/upsert.rs
@@ -23,16 +23,21 @@ use tokio::sync::Mutex;
 
 /// Writer for upserting and deleting data in a Fluss primary key table.
 ///
-/// Each upsert/delete operation is sent to the server and waits for acknowledgment.
-/// Multiple concurrent writers share a common WriterClient which batches requests
-/// for efficiency.
+/// Each upsert/delete operation queues the write and returns a coroutine
+/// that can be awaited for per-record acknowledgment, or ignored for
+/// fire-and-forget semantics (call `flush()` to ensure delivery).
 ///
 /// # Example:
 ///     writer = table.new_upsert()
+///
+///     # Fire-and-forget with flush
 ///     await writer.upsert(row1)
 ///     await writer.upsert(row2)
-///     await writer.delete(pk)
-///     await writer.flush()  # Ensures all pending operations are acknowledged
+///     await writer.flush()
+///
+///     # Or await individual acknowledgment
+///     ack = await writer.upsert(row3)
+///     await ack
 #[pyclass]
 pub struct UpsertWriter {
     inner: Arc<UpsertWriterInner>,
@@ -58,7 +63,8 @@ impl UpsertWriter {
     ///          For list/tuple: values must be in schema order.
     ///
     /// Returns:
-    ///     None on success
+    ///     A coroutine that can be awaited for server acknowledgment,
+    ///     or ignored for fire-and-forget behavior.
     pub fn upsert<'py>(
         &self,
         py: Python<'py>,
@@ -70,11 +76,20 @@ impl UpsertWriter {
         future_into_py(py, async move {
             let mut guard = inner.get_or_create_writer().await?;
             let writer = guard.as_mut().unwrap();
-            writer
+            let result_future = writer
                 .upsert(&generic_row)
                 .await
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
-            Ok(())
+
+            Python::attach(|py| {
+                future_into_py(py, async move {
+                    result_future
+                        .await
+                        .map_err(|e| FlussError::new_err(e.to_string()))?;
+                    Ok(())
+                })
+                .map(|bound| bound.unbind())
+            })
         })
     }
 
@@ -86,7 +101,8 @@ impl UpsertWriter {
     ///         For list/tuple: values in PK column order.
     ///
     /// Returns:
-    ///     None on success
+    ///     A coroutine that can be awaited for server acknowledgment,
+    ///     or ignored for fire-and-forget behavior.
     pub fn delete<'py>(
         &self,
         py: Python<'py>,
@@ -98,11 +114,20 @@ impl UpsertWriter {
         future_into_py(py, async move {
             let mut guard = inner.get_or_create_writer().await?;
             let writer = guard.as_mut().unwrap();
-            writer
+            let result_future = writer
                 .delete(&generic_row)
                 .await
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
-            Ok(())
+
+            Python::attach(|py| {
+                future_into_py(py, async move {
+                    result_future
+                        .await
+                        .map_err(|e| FlussError::new_err(e.to_string()))?;
+                    Ok(())
+                })
+                .map(|bound| bound.unbind())
+            })
         })
     }
 
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 2bbcc74b68..2fcb134258 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -65,6 +65,7 @@ pub async fn main() -> Result<()> {
         upsert_writer.upsert(&row).await?;
         println!("Upserted: {row:?}");
     }
+    upsert_writer.flush().await?;
 
     println!("\n=== Looking up ===");
     let mut lookuper = table.new_lookup()?.create_lookuper()?;
@@ -84,7 +85,7 @@ pub async fn main() -> Result<()> {
     row.set_field(0, 1);
     row.set_field(1, "Verso");
     row.set_field(2, 33i64);
-    upsert_writer.upsert(&row).await?;
+    upsert_writer.upsert(&row).await?.await?;
     println!("Updated: {row:?}");
 
     let result = lookuper.lookup(&make_key(1)).await?;
@@ -99,7 +100,7 @@ pub async fn main() -> Result<()> {
     // For delete, only primary key field needs to be set; other fields can remain null
     let mut row = GenericRow::new(3);
     row.set_field(0, 2);
-    upsert_writer.delete(&row).await?;
+    upsert_writer.delete(&row).await?.await?;
     println!("Deleted row with id=2");
 
     let result = lookuper.lookup(&make_key(2)).await?;
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index 884869e168..feb8f05b0d 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -77,6 +77,7 @@ pub async fn main() -> Result<()> {
         upsert_writer.upsert(&row).await?;
         println!("Upserted: {row:?}");
     }
+    upsert_writer.flush().await?;
 
     println!("\n=== Looking up ===");
     let mut lookuper = table.new_lookup()?.create_lookuper()?;
@@ -101,7 +102,7 @@ pub async fn main() -> Result<()> {
     row.set_field(1, "APAC");
     row.set_field(2, 1i64);
     row.set_field(3, 4321i64);
-    upsert_writer.upsert(&row).await?;
+    upsert_writer.upsert(&row).await?.await?;
     println!("Updated: {row:?}");
 
     let result = lookuper.lookup(&make_key(1001, "APAC", 1)).await?;
@@ -117,7 +118,7 @@ pub async fn main() -> Result<()> {
     row.set_field(0, 1002);
     row.set_field(1, "EMEA");
     row.set_field(2, 2i64);
-    upsert_writer.delete(&row).await?;
+    upsert_writer.delete(&row).await?.await?;
     println!("Deleted: {row:?}");
 
     let result = lookuper.lookup(&make_key(1002, "EMEA", 2)).await?;
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index 733b13e447..ee9bc7b349 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -25,7 +25,6 @@ use fluss::error::Result;
 use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
 use fluss::row::{GenericRow, InternalRow};
 use std::time::Duration;
-use tokio::try_join;
 
 #[tokio::main]
 pub async fn main() -> Result<()> {
@@ -64,13 +63,14 @@ pub async fn main() -> Result<()> {
 
     let table = conn.get_table(&table_path).await?;
     let append_writer = table.new_append()?.create_writer()?;
-    let f1 = append_writer.append(&row);
+    // Fire-and-forget: queue writes then flush
+    append_writer.append(&row).await?;
     let mut row = GenericRow::new(3);
     row.set_field(0, 233333);
     row.set_field(1, "tt44");
     row.set_field(2, 987_654_321_987i64);
-    let f2 = append_writer.append(&row);
-    try_join!(f1, f2, append_writer.flush())?;
+    append_writer.append(&row).await?;
+    append_writer.flush().await?;
 
     // scan rows
     let log_scanner = table.new_scan().create_log_scanner()?;
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
index ace91a607c..e26b61adac 100644
--- a/fluss-rust/crates/fluss/src/client/table/append.rs
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -16,7 +16,7 @@
 // under the License.
 
 use crate::client::table::partition_getter::{PartitionGetter, get_physical_path};
-use crate::client::{WriteRecord, WriterClient};
+use crate::client::{WriteRecord, WriteResultFuture, WriterClient};
 use crate::error::Result;
 use crate::metadata::{PhysicalTablePath, TableInfo, TablePath};
 use crate::row::{ColumnarRow, InternalRow};
@@ -69,7 +69,18 @@ pub struct AppendWriter {
 }
 
 impl AppendWriter {
-    pub async fn append<R: InternalRow>(&self, row: &R) -> Result<()> {
+    /// Appends a row to the table.
+    ///
+    /// This method returns a [`WriteResultFuture`] immediately after queueing the write,
+    /// enabling fire-and-forget semantics for efficient batching.
+    ///
+    /// # Arguments
+    /// * row - the row to append.
+    ///
+    /// # Returns
+    /// A [`WriteResultFuture`] that can be awaited to wait for server acknowledgment,
+    /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
+    pub async fn append<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
         let physical_table_path = Arc::new(get_physical_path(
             &self.table_path,
             self.partition_getter.as_ref(),
@@ -82,15 +93,21 @@ impl AppendWriter {
             row,
         );
         let result_handle = self.writer_client.send(&record).await?;
-        let result = result_handle.wait().await?;
-        result_handle.result(result)
+        Ok(WriteResultFuture::new(result_handle))
     }
 
     /// Appends an Arrow RecordBatch to the table.
     ///
+    /// This method returns a [`WriteResultFuture`] immediately after queueing the write,
+    /// enabling fire-and-forget semantics for efficient batching.
+    ///
     /// For partitioned tables, the partition is derived from the **first row** of the batch.
     /// Callers must ensure all rows in the batch belong to the same partition.
-    pub async fn append_arrow_batch(&self, batch: RecordBatch) -> Result<()> {
+    ///
+    /// # Returns
+    /// A [`WriteResultFuture`] that can be awaited to wait for server acknowledgment,
+    /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
+    pub async fn append_arrow_batch(&self, batch: RecordBatch) -> Result<WriteResultFuture> {
         let physical_table_path = if self.partition_getter.is_some() && batch.num_rows() > 0 {
             let first_row = ColumnarRow::new(Arc::new(batch.clone()));
             Arc::new(get_physical_path(
@@ -109,8 +126,7 @@ impl AppendWriter {
             batch,
         );
         let result_handle = self.writer_client.send(&record).await?;
-        let result = result_handle.wait().await?;
-        result_handle.result(result)
+        Ok(WriteResultFuture::new(result_handle))
     }
 
     pub async fn flush(&self) -> Result<()> {
diff --git a/fluss-rust/crates/fluss/src/client/table/upsert.rs b/fluss-rust/crates/fluss/src/client/table/upsert.rs
index 92f6a20c85..a1646cc35c 100644
--- a/fluss-rust/crates/fluss/src/client/table/upsert.rs
+++ b/fluss-rust/crates/fluss/src/client/table/upsert.rs
@@ -15,7 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::client::{RowBytes, WriteFormat, WriteRecord, WriterClient};
+use crate::client::{RowBytes, WriteFormat, WriteRecord, WriteResultFuture, WriterClient};
 use crate::error::Error::{IllegalArgument, UnexpectedError};
 use crate::error::Result;
 use crate::metadata::{RowType, TableInfo, TablePath};
@@ -345,12 +345,16 @@ impl UpsertWriter {
 
     /// Inserts row into Fluss table if they do not already exist, or updates them if they do exist.
     ///
+    /// This method returns a [`WriteResultFuture`] immediately after queueing the write,
+    /// enabling fire-and-forget semantics for efficient batching.
+    ///
     /// # Arguments
     /// * row - the row to upsert.
     ///
     /// # Returns
-    /// Ok(UpsertResult) when completed normally
-    pub async fn upsert<R: InternalRow>(&self, row: &R) -> Result<UpsertResult> {
+    /// A [`WriteResultFuture`] that can be awaited to wait for server acknowledgment,
+    /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
+    pub async fn upsert<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
         self.check_field_count(row)?;
 
         let (key, bucket_key) = self.get_keys(row)?;
@@ -376,20 +380,22 @@ impl UpsertWriter {
         );
 
         let result_handle = self.writer_client.send(&write_record).await?;
-        let result = result_handle.wait().await?;
-
-        result_handle.result(result).map(|_| UpsertResult)
+        Ok(WriteResultFuture::new(result_handle))
     }
 
     /// Delete certain row by the input row in Fluss table, the input row must contain the primary
     /// key.
     ///
+    /// This method returns a [`WriteResultFuture`] immediately after queueing the delete,
+    /// enabling fire-and-forget semantics for efficient batching.
+    ///
     /// # Arguments
-    /// * row - the row to delete.
+    /// * row - the row to delete (must contain the primary key fields).
     ///
     /// # Returns
-    /// Ok(DeleteResult) when completed normally
-    pub async fn delete<R: InternalRow>(&self, row: &R) -> Result<DeleteResult> {
+    /// A [`WriteResultFuture`] that can be awaited to wait for server acknowledgment,
+    /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
+    pub async fn delete<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
         self.check_field_count(row)?;
 
         let (key, bucket_key) = self.get_keys(row)?;
@@ -410,9 +416,7 @@ impl UpsertWriter {
         );
 
         let result_handle = self.writer_client.send(&write_record).await?;
-        let result = result_handle.wait().await?;
-
-        result_handle.result(result).map(|_| DeleteResult)
+        Ok(WriteResultFuture::new(result_handle))
     }
 }
 
@@ -546,9 +550,11 @@ mod tests {
 /// The result of upserting a record
 /// Currently this is an empty struct to allow for compatible evolution in the future
 #[derive(Default)]
+#[allow(dead_code)]
 pub struct UpsertResult;
 
 /// The result of deleting a record
 /// Currently this is an empty struct to allow for compatible evolution in the future
 #[derive(Default)]
+#[allow(dead_code)]
 pub struct DeleteResult;
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index 25a0db61b2..49eff05d2b 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -26,7 +26,10 @@ use crate::row::InternalRow;
 pub use accumulator::*;
 use arrow::array::RecordBatch;
 use bytes::Bytes;
+use std::future::Future;
+use std::pin::Pin;
 use std::sync::Arc;
+use std::task::{Context, Poll};
 
 pub(crate) mod broadcast;
 mod bucket_assigner;
@@ -198,3 +201,41 @@ impl ResultHandle {
         })
     }
 }
+
+/// Handle to a write that has been queued but not necessarily acknowledged.
+///
+/// Because the type is a [`Future`], callers choose between two usages:
+/// 1. Per-record acknowledgment: `writer.upsert(&row).await?.await?`
+/// 2. Fire-and-forget, then flush: `writer.upsert(&row).await?; writer.flush().await?`
+///
+/// Dropping the value skips the per-record wait, which keeps batching efficient
+/// (the same idea as rdkafka's `DeliveryFuture`).
+pub struct WriteResultFuture {
+    inner: Pin<Box<dyn Future<Output = Result<(), Error>> + Send>>,
+}
+
+impl std::fmt::Debug for WriteResultFuture {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        // The boxed future has no useful representation; print the name only.
+        f.debug_struct("WriteResultFuture").finish_non_exhaustive()
+    }
+}
+
+impl WriteResultFuture {
+    /// Wraps `result_handle` in a future that waits on it and converts the outcome.
+    pub fn new(result_handle: ResultHandle) -> Self {
+        let pending = async move {
+            let outcome = result_handle.wait().await?;
+            result_handle.result(outcome)
+        };
+        Self { inner: Box::pin(pending) }
+    }
+}
+
+impl Future for WriteResultFuture {
+    type Output = Result<(), Error>;
+
+    fn poll(self: Pin<&mut Self>, cx: &mut Context<'_>) -> Poll<Self::Output> {
+        self.get_mut().inner.as_mut().poll(cx)
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index 87d90b0a9c..0bfe4a370c 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -95,7 +95,7 @@ mod kv_table_test {
 
         let test_data = [(1, "Verso", 32i64), (2, "Noco", 25), (3, "Esquie", 35)];
 
-        // Upsert rows
+        // Upsert rows (fire-and-forget, then flush)
         for (id, name, age) in &test_data {
             let mut row = GenericRow::new(3);
             row.set_field(0, *id);
@@ -106,6 +106,7 @@ mod kv_table_test {
                 .await
                 .expect("Failed to upsert row");
         }
+        upsert_writer.flush().await.expect("Failed to flush");
 
         // Lookup records
         let mut lookuper = table
@@ -130,7 +131,7 @@ mod kv_table_test {
             assert_eq!(row.get_long(2), *expected_age, "age mismatch");
         }
 
-        // Update the record with new age
+        // Update the record with new age (await acknowledgment)
         let mut updated_row = GenericRow::new(3);
         updated_row.set_field(0, 1);
         updated_row.set_field(1, "Verso");
@@ -138,7 +139,9 @@ mod kv_table_test {
         upsert_writer
             .upsert(&updated_row)
             .await
-            .expect("Failed to upsert updated row");
+            .expect("Failed to upsert updated row")
+            .await
+            .expect("Failed to wait for upsert acknowledgment");
 
         // Verify the update
         let result = lookuper
@@ -160,13 +163,15 @@ mod kv_table_test {
             "Name should remain unchanged"
         );
 
-        // Delete record with id=1
+        // Delete record with id=1 (await acknowledgment)
         let mut delete_row = GenericRow::new(3);
         delete_row.set_field(0, 1);
         upsert_writer
             .delete(&delete_row)
             .await
-            .expect("Failed to delete");
+            .expect("Failed to delete")
+            .await
+            .expect("Failed to wait for delete acknowledgment");
 
         // Verify deletion
         let result = lookuper
@@ -265,6 +270,7 @@ mod kv_table_test {
             row.set_field(2, *score);
             upsert_writer.upsert(&row).await.expect("Failed to upsert");
         }
+        upsert_writer.flush().await.expect("Failed to flush");
 
         // Lookup with composite key
         let mut lookuper = table
@@ -295,7 +301,7 @@ mod kv_table_test {
             .expect("Row should exist");
         assert_eq!(row.get_long(2), 250, "Score for (EU, 2) should be 250");
 
-        // Update (US, 1) score
+        // Update (US, 1) score (await acknowledgment)
         let mut update_row = GenericRow::new(3);
         update_row.set_field(0, "US");
         update_row.set_field(1, 1);
@@ -303,7 +309,9 @@ mod kv_table_test {
         upsert_writer
             .upsert(&update_row)
             .await
-            .expect("Failed to update");
+            .expect("Failed to update")
+            .await
+            .expect("Failed to wait for update acknowledgment");
 
         // Verify update
         let mut key = GenericRow::new(3);
@@ -372,7 +380,9 @@ mod kv_table_test {
         upsert_writer
             .upsert(&row)
             .await
-            .expect("Failed to upsert initial row");
+            .expect("Failed to upsert initial row")
+            .await
+            .expect("Failed to wait for upsert acknowledgment");
 
         // Verify initial record
         let mut lookuper = table
@@ -403,7 +413,7 @@ mod kv_table_test {
             .create_writer()
             .expect("Failed to create UpsertWriter with partial write");
 
-        // Update only the score column
+        // Update only the score column (await acknowledgment)
         let mut partial_row = GenericRow::new(4);
         partial_row.set_field(0, 1);
         partial_row.set_field(1, Datum::Null); // not in partial update column
@@ -412,7 +422,9 @@ mod kv_table_test {
         partial_writer
             .upsert(&partial_row)
             .await
-            .expect("Failed to upsert");
+            .expect("Failed to upsert")
+            .await
+            .expect("Failed to wait for upsert acknowledgment");
 
         // Verify partial update - name and age should remain unchanged
         let result = lookuper
@@ -499,6 +511,7 @@ mod kv_table_test {
             row.set_field(3, *score);
             upsert_writer.upsert(&row).await.expect("Failed to upsert");
         }
+        upsert_writer.flush().await.expect("Failed to flush");
 
         // Create lookuper
         let mut lookuper = table
@@ -525,7 +538,7 @@ mod kv_table_test {
             assert_eq!(row.get_long(3), *expected_score, "score mismatch");
         }
 
-        // Test update within a partition
+        // Test update within a partition (await acknowledgment)
         let mut updated_row = GenericRow::new(4);
         updated_row.set_field(0, "US");
         updated_row.set_field(1, 1);
@@ -534,7 +547,9 @@ mod kv_table_test {
         upsert_writer
             .upsert(&updated_row)
             .await
-            .expect("Failed to upsert updated row");
+            .expect("Failed to upsert updated row")
+            .await
+            .expect("Failed to wait for upsert acknowledgment");
 
         // Verify the update
         let mut key = GenericRow::new(4);
@@ -564,14 +579,16 @@ mod kv_table_test {
             "Lookup in non-existent partition should return None"
         );
 
-        // Delete a record within a partition
+        // Delete a record within a partition (await acknowledgment)
         let mut delete_key = GenericRow::new(4);
         delete_key.set_field(0, "EU");
         delete_key.set_field(1, 1);
         upsert_writer
             .delete(&delete_key)
             .await
-            .expect("Failed to delete");
+            .expect("Failed to delete")
+            .await
+            .expect("Failed to wait for delete acknowledgment");
 
         // Verify deletion
         let mut key = GenericRow::new(4);
@@ -705,7 +722,9 @@ mod kv_table_test {
         upsert_writer
             .upsert(&row)
             .await
-            .expect("Failed to upsert row with all datatypes");
+            .expect("Failed to upsert row with all datatypes")
+            .await
+            .expect("Failed to wait for upsert acknowledgment");
 
         // Lookup the record
         let mut lookuper = table
@@ -808,7 +827,9 @@ mod kv_table_test {
         upsert_writer
             .upsert(&row_with_nulls)
             .await
-            .expect("Failed to upsert row with nulls");
+            .expect("Failed to upsert row with nulls")
+            .await
+            .expect("Failed to wait for upsert acknowledgment");
 
         // Lookup row with nulls
         let mut key2 = GenericRow::new(17);
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 493bb34441..8d7773de63 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -109,6 +109,7 @@ mod table_test {
             .await
             .expect("Failed to append batch");
 
+        // Flush to ensure all writes are acknowledged
         append_writer.flush().await.expect("Failed to flush");
 
         // Create scanner to verify appended records
@@ -232,6 +233,9 @@ mod table_test {
             .await
             .expect("Failed to append batch");
 
+        // Flush to ensure all writes are acknowledged
+        append_writer.flush().await.expect("Failed to flush");
+
         tokio::time::sleep(tokio::time::Duration::from_secs(1)).await;
 
         let after_append_ms = Timestamp::now().as_millisecond();

From 6ca3bd7b7eb89e4bbcc8586083f2fd9422616ca3 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sat, 7 Feb 2026 11:36:27 +0800
Subject: [PATCH 118/287] chore: introduce deny to check licenses (#267)

---
 fluss-rust/.github/workflows/ci.yml   |  8 ++++++
 fluss-rust/DEVELOPMENT.md             |  9 +++++++
 fluss-rust/bindings/cpp/Cargo.toml    |  1 +
 fluss-rust/bindings/python/Cargo.toml |  2 +-
 fluss-rust/crates/fluss/Cargo.toml    |  1 +
 fluss-rust/deny.toml                  | 36 +++++++++++++++++++++++++++
 6 files changed, 56 insertions(+), 1 deletion(-)
 create mode 100644 fluss-rust/deny.toml

diff --git a/fluss-rust/.github/workflows/ci.yml b/fluss-rust/.github/workflows/ci.yml
index cf7a126486..e9048fb0e0 100644
--- a/fluss-rust/.github/workflows/ci.yml
+++ b/fluss-rust/.github/workflows/ci.yml
@@ -38,6 +38,14 @@ jobs:
       - name: Check License Header
         uses: apache/skywalking-eyes/header@v0.6.0
 
+      - name: Install cargo-deny
+        uses: taiki-e/install-action@v2
+        with:
+          tool: cargo-deny@0.14.22
+
+      - name: Check dependency licenses (Apache-compatible)
+        run: cargo deny check licenses
+
       - name: Install protoc
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
 
diff --git a/fluss-rust/DEVELOPMENT.md b/fluss-rust/DEVELOPMENT.md
index a8a6d5380c..a0669a755e 100644
--- a/fluss-rust/DEVELOPMENT.md
+++ b/fluss-rust/DEVELOPMENT.md
@@ -104,6 +104,15 @@ cargo test --features integration_tests --workspace
 ```
 
 
+### License check (cargo-deny)
+
+We use [cargo-deny](https://embarkstudios.github.io/cargo-deny/) to ensure all dependency licenses are Apache-compatible. When present, configuration lives in a `deny.toml` file at the repo root and should enforce an Apache-compatible license policy.
+
+```bash
+cargo install cargo-deny --locked
+cargo deny check licenses
+```
+
 ### Formatting and Clippy
 
 Our CI runs cargo formatting and clippy to help keep the code base styling tidy and readable. Run the following commands and address any errors or warnings to ensure that your PR can complete CI successfully.
diff --git a/fluss-rust/bindings/cpp/Cargo.toml b/fluss-rust/bindings/cpp/Cargo.toml
index 0bbcbf0d95..0b83de9365 100644
--- a/fluss-rust/bindings/cpp/Cargo.toml
+++ b/fluss-rust/bindings/cpp/Cargo.toml
@@ -19,6 +19,7 @@
 name = "fluss-cpp"
 version = "0.1.0"
 edition.workspace = true
+license.workspace = true
 rust-version.workspace = true
 publish = false
 
diff --git a/fluss-rust/bindings/python/Cargo.toml b/fluss-rust/bindings/python/Cargo.toml
index ff4d687d80..0a0daff93d 100644
--- a/fluss-rust/bindings/python/Cargo.toml
+++ b/fluss-rust/bindings/python/Cargo.toml
@@ -19,7 +19,7 @@
 name = "fluss_python"
 edition = "2024"
 version = "0.1.0"
-license = "apache-2.0"
+license.workspace = true
 rust-version = "1.85"
 
 [lib]
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 6b2707bee3..c92359408b 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -17,6 +17,7 @@
 
 [package]
 edition = { workspace = true }
+license.workspace = true
 rust-version = { workspace = true }
 version = { workspace = true }
 name = "fluss"
diff --git a/fluss-rust/deny.toml b/fluss-rust/deny.toml
new file mode 100644
index 0000000000..18ed544033
--- /dev/null
+++ b/fluss-rust/deny.toml
@@ -0,0 +1,36 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[licenses]
+allow = [
+    "Apache-2.0",
+    "Apache-2.0 WITH LLVM-exception",
+    "BSD-2-Clause",
+    "BSD-3-Clause",
+    "CC0-1.0",
+    "ISC",
+    "MIT",
+    "Unicode-3.0",
+    "Zlib",
+]
+
+exceptions = [
+    # open data licenses that SHOULD be OK
+    { crate = "webpki-roots", allow = [
+        "CDLA-Permissive-2.0",
+    ] },
+]
\ No newline at end of file

From 9202964fa6d87090909af70bdcff2c142431e1aa Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 7 Feb 2026 13:39:15 +0000
Subject: [PATCH 119/287] ci: Fix unstable poll_batches (#272)

---
 .../fluss/tests/integration/log_table.rs      | 81 +++++++++----------
 1 file changed, 37 insertions(+), 44 deletions(-)

diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 8d7773de63..ed90fd0521 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -502,21 +502,32 @@ mod table_test {
         writer.flush().await.unwrap();
 
         use arrow::array::Int32Array;
-        let batches = scanner.poll(Duration::from_secs(10)).await.unwrap();
-        let all_ids: Vec<i32> = batches
-            .iter()
-            .flat_map(|b| {
-                let batch = b.batch();
-                (0..batch.num_rows()).map(move |i| {
-                    batch
-                        .column(0)
-                        .as_any()
-                        .downcast_ref::<Int32Array>()
-                        .unwrap()
-                        .value(i)
+
+        fn extract_ids(batches: &[fluss::record::ScanBatch]) -> Vec<i32> {
+            batches
+                .iter()
+                .flat_map(|b| {
+                    let batch = b.batch();
+                    (0..batch.num_rows()).map(move |i| {
+                        batch
+                            .column(0)
+                            .as_any()
+                            .downcast_ref::<Int32Array>()
+                            .unwrap()
+                            .value(i)
+                    })
                 })
-            })
-            .collect();
+                .collect()
+        }
+
+        // poll may return partial results if not all batches are available yet,
+        // so we accumulate across multiple polls until we have the expected count.
+        let mut all_ids = Vec::new();
+        let deadline = tokio::time::Instant::now() + Duration::from_secs(10);
+        while all_ids.len() < 6 && tokio::time::Instant::now() < deadline {
+            let batches = scanner.poll(Duration::from_secs(5)).await.unwrap();
+            all_ids.extend(extract_ids(&batches));
+        }
 
         // Test 2: Order should be preserved across multiple batches
         assert_eq!(all_ids, vec![1, 2, 3, 4, 5, 6]);
@@ -529,21 +540,12 @@ mod table_test {
             .unwrap();
         writer.flush().await.unwrap();
 
-        let more = scanner.poll(Duration::from_secs(10)).await.unwrap();
-        let new_ids: Vec<i32> = more
-            .iter()
-            .flat_map(|b| {
-                let batch = b.batch();
-                (0..batch.num_rows()).map(move |i| {
-                    batch
-                        .column(0)
-                        .as_any()
-                        .downcast_ref::<Int32Array>()
-                        .unwrap()
-                        .value(i)
-                })
-            })
-            .collect();
+        let mut new_ids = Vec::new();
+        let deadline = tokio::time::Instant::now() + Duration::from_secs(10);
+        while new_ids.len() < 2 && tokio::time::Instant::now() < deadline {
+            let more = scanner.poll(Duration::from_secs(5)).await.unwrap();
+            new_ids.extend(extract_ids(&more));
+        }
 
         // Test 3: Subsequent polls should not return duplicate data (offset continuation)
         assert_eq!(new_ids, vec![7, 8]);
@@ -552,21 +554,12 @@ mod table_test {
         // Server returns all records from start of batch, but client truncates to subscription offset
         let trunc_scanner = table.new_scan().create_record_batch_log_scanner().unwrap();
         trunc_scanner.subscribe(0, 3).await.unwrap();
-        let trunc_batches = trunc_scanner.poll(Duration::from_secs(10)).await.unwrap();
-        let trunc_ids: Vec<i32> = trunc_batches
-            .iter()
-            .flat_map(|b| {
-                let batch = b.batch();
-                (0..batch.num_rows()).map(move |i| {
-                    batch
-                        .column(0)
-                        .as_any()
-                        .downcast_ref::<Int32Array>()
-                        .unwrap()
-                        .value(i)
-                })
-            })
-            .collect();
+        let mut trunc_ids = Vec::new();
+        let deadline = tokio::time::Instant::now() + Duration::from_secs(10);
+        while trunc_ids.len() < 5 && tokio::time::Instant::now() < deadline {
+            let trunc_batches = trunc_scanner.poll(Duration::from_secs(5)).await.unwrap();
+            trunc_ids.extend(extract_ids(&trunc_batches));
+        }
 
         // Subscribing from offset 3 should return [4,5,6,7,8], not [1,2,3,4,5,6,7,8]
         assert_eq!(trunc_ids, vec![4, 5, 6, 7, 8]);

From b677a6b4bd926f418994548d3349334e4701c58b Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 7 Feb 2026 14:16:30 +0000
Subject: [PATCH 120/287] chore: remove async from queueing while writing
 (#271)

---
 fluss-rust/README.md                          |   3 +-
 fluss-rust/bindings/cpp/src/lib.rs            |   7 +-
 fluss-rust/bindings/python/example/example.py |  33 +++--
 fluss-rust/bindings/python/src/lib.rs         |   3 +
 fluss-rust/bindings/python/src/table.rs       |  88 ++++---------
 fluss-rust/bindings/python/src/upsert.rs      | 124 +++++++-----------
 .../bindings/python/src/write_handle.rs       |  80 +++++++++++
 .../crates/examples/src/example_kv_table.rs   |   6 +-
 .../src/example_partitioned_kv_table.rs       |   6 +-
 .../crates/examples/src/example_table.rs      |   4 +-
 .../crates/fluss/src/client/table/append.rs   |   8 +-
 .../crates/fluss/src/client/table/upsert.rs   |   8 +-
 .../fluss/src/client/write/accumulator.rs     |  64 ++++-----
 .../crates/fluss/src/client/write/mod.rs      |   4 +-
 .../crates/fluss/src/client/write/sender.rs   |  86 ++++++------
 .../fluss/src/client/write/writer_client.rs   |  12 +-
 .../fluss/tests/integration/kv_table.rs       |  18 +--
 .../fluss/tests/integration/log_table.rs      |  17 +--
 .../tests/integration/table_remote_scan.rs    |   7 +-
 19 files changed, 269 insertions(+), 309 deletions(-)
 create mode 100644 fluss-rust/bindings/python/src/write_handle.rs

diff --git a/fluss-rust/README.md b/fluss-rust/README.md
index ee9478c6a5..5e771d9d28 100644
--- a/fluss-rust/README.md
+++ b/fluss-rust/README.md
@@ -101,7 +101,8 @@ pub async fn main() -> Result<()> {
     let table = conn.get_table(&table_path).await;
     let append_writer = table.new_append().create_writer();
     let batch = record_batch!(("c1", Int32, [1, 2, 3, 4, 5, 6]), ("c2", Utf8, ["a1", "a2", "a3", "a4", "a5", "a6"])).unwrap();
-    append_writer.append(batch).await?;
+    append_writer.append(batch)?;
+    append_writer.flush().await?;
     println!("Start to scan log records......");
     // 4: scan the records
     let log_scanner = table.new_scan().create_log_scanner();
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 7944c100a2..4957c9937a 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -761,8 +761,9 @@ impl AppendWriter {
     fn append(&mut self, row: &ffi::FfiGenericRow) -> Result<Box<WriteResult>, String> {
         let generic_row = types::ffi_row_to_core(row);
 
-        let result_future = RUNTIME
-            .block_on(async { self.inner.append(&generic_row).await })
+        let result_future = self
+            .inner
+            .append(&generic_row)
             .map_err(|e| format!("Failed to append: {e}"))?;
 
         Ok(Box::new(WriteResult {
@@ -789,7 +790,7 @@ impl WriteResult {
                 Err(e) => err_result(1, e.to_string()),
             }
         } else {
-            ok_result()
+            err_result(1, "WriteResult already consumed".to_string())
         }
     }
 }
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 1cabaa5f23..d56879a430 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -184,7 +184,7 @@ async def main():
         # Test 3: Append single rows with Date, Time, Timestamp, Decimal
         print("\n--- Testing single row append with temporal/decimal types ---")
         # Dict input with all types including Date, Time, Timestamp, Decimal
-        await append_writer.append(
+        append_writer.append(
             {
                 "id": 8,
                 "name": "Helen",
@@ -200,7 +200,7 @@ async def main():
         print("Successfully appended row (dict with Date, Time, Timestamp, Decimal)")
 
         # List input with all types
-        await append_writer.append(
+        append_writer.append(
             [
                 9,
                 "Ivan",
@@ -242,7 +242,7 @@ async def main():
 
         # Flush all pending data
         print("\n--- Flushing data ---")
-        append_writer.flush()
+        await append_writer.flush()
         print("Successfully flushed data")
 
         # Demo: Check offsets after writes
@@ -422,9 +422,9 @@ async def main():
         upsert_writer = pk_table.new_upsert()
         print(f"Created upsert writer: {upsert_writer}")
 
-        # Fire-and-forget: queue writes without waiting for individual acks.
+        # Fire-and-forget: queue writes synchronously, flush at end.
         # Records are batched internally for efficiency.
-        await upsert_writer.upsert(
+        upsert_writer.upsert(
             {
                 "user_id": 1,
                 "name": "Alice",
@@ -441,7 +441,7 @@ async def main():
         )
         print("Queued user_id=1 (Alice)")
 
-        await upsert_writer.upsert(
+        upsert_writer.upsert(
             {
                 "user_id": 2,
                 "name": "Bob",
@@ -456,7 +456,7 @@ async def main():
         )
         print("Queued user_id=2 (Bob)")
 
-        await upsert_writer.upsert(
+        upsert_writer.upsert(
             {
                 "user_id": 3,
                 "name": "Charlie",
@@ -479,7 +479,7 @@ async def main():
         # the server confirms this specific write, useful when you need to
         # read-after-write or verify critical updates.
         print("\n--- Testing Upsert (per-record acknowledgment) ---")
-        ack = await upsert_writer.upsert(
+        handle = upsert_writer.upsert(
             {
                 "user_id": 1,
                 "name": "Alice Updated",
@@ -494,7 +494,7 @@ async def main():
                 "balance": Decimal("2345.67"),
             }
         )
-        await ack  # wait for server acknowledgment before proceeding
+        await handle.wait()  # wait for server acknowledgment
         print("Updated user_id=1 (Alice -> Alice Updated) — server acknowledged")
 
     except Exception as e:
@@ -554,9 +554,8 @@ async def main():
     try:
         upsert_writer = pk_table.new_upsert()
 
-        # Per-record ack for delete — await the handle to confirm deletion
-        ack = await upsert_writer.delete({"user_id": 3})
-        await ack
+        handle = upsert_writer.delete({"user_id": 3})
+        await handle.wait()
         print("Deleted user_id=3 — server acknowledged")
 
         lookuper = pk_table.new_lookup()
@@ -670,12 +669,12 @@ async def main():
         partitioned_writer = await partitioned_table.new_append_writer()
 
         # Append data to US partition
-        await partitioned_writer.append({"id": 1, "region": "US", "value": 100})
-        await partitioned_writer.append({"id": 2, "region": "US", "value": 200})
+        partitioned_writer.append({"id": 1, "region": "US", "value": 100})
+        partitioned_writer.append({"id": 2, "region": "US", "value": 200})
         # Append data to EU partition
-        await partitioned_writer.append({"id": 3, "region": "EU", "value": 300})
-        await partitioned_writer.append({"id": 4, "region": "EU", "value": 400})
-        partitioned_writer.flush()
+        partitioned_writer.append({"id": 3, "region": "EU", "value": 300})
+        partitioned_writer.append({"id": 4, "region": "EU", "value": 400})
+        await partitioned_writer.flush()
         print("\nWrote 4 records (2 to US, 2 to EU)")
 
         # Demo: list_partition_offsets
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index ae7f6c500a..f1f4ee6b61 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -30,6 +30,7 @@ mod metadata;
 mod table;
 mod upsert;
 mod utils;
+mod write_handle;
 
 pub use admin::*;
 pub use config::*;
@@ -40,6 +41,7 @@ pub use metadata::*;
 pub use table::*;
 pub use upsert::*;
 pub use utils::*;
+pub use write_handle::*;
 
 static TOKIO_RUNTIME: LazyLock<Runtime> = LazyLock::new(|| {
     tokio::runtime::Builder::new_multi_thread()
@@ -88,6 +90,7 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<RecordBatch>()?;
     m.add_class::<PartitionInfo>()?;
     m.add_class::<OffsetType>()?;
+    m.add_class::<WriteResultHandle>()?;
 
     // Register constants
     m.add("EARLIEST_OFFSET", fcore::client::EARLIEST_OFFSET)?;
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index e987d43d69..8af6b13e69 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -533,76 +533,43 @@ impl AppendWriter {
         let batch_list: Vec<Py<PyAny>> = batches.extract(py)?;
 
         for batch in batch_list {
-            // Drop the ack coroutine — fire-and-forget
-            let _ = self.write_arrow_batch(py, batch)?;
+            // Drop the handle — fire-and-forget for bulk writes
+            drop(self.write_arrow_batch(py, batch)?);
         }
         Ok(())
     }
 
-    /// Write Arrow batch data
+    /// Write Arrow batch data.
     ///
     /// Returns:
-    ///     A coroutine that can be awaited for server acknowledgment,
-    ///     or ignored for fire-and-forget behavior.
-    pub fn write_arrow_batch<'py>(
-        &self,
-        py: Python<'py>,
-        batch: Py<PyAny>,
-    ) -> PyResult<Bound<'py, PyAny>> {
+    ///     WriteResultHandle that can be ignored (fire-and-forget) or
+    ///     awaited via `handle.wait()` for server acknowledgment.
+    pub fn write_arrow_batch(&self, py: Python, batch: Py<PyAny>) -> PyResult<WriteResultHandle> {
         // This shares the underlying Arrow buffers without copying data
         let batch_bound = batch.bind(py);
         let rust_batch: ArrowRecordBatch = FromPyArrow::from_pyarrow_bound(batch_bound)
             .map_err(|e| FlussError::new_err(format!("Failed to convert RecordBatch: {e}")))?;
 
-        let inner = self.inner.clone();
-
-        future_into_py(py, async move {
-            let result_future = inner
-                .append_arrow_batch(rust_batch)
-                .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
-
-            Python::attach(|py| {
-                future_into_py(py, async move {
-                    result_future
-                        .await
-                        .map_err(|e| FlussError::new_err(e.to_string()))?;
-                    Ok(())
-                })
-                .map(|bound| bound.unbind())
-            })
-        })
+        let result_future = self
+            .inner
+            .append_arrow_batch(rust_batch)
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+        Ok(WriteResultHandle::new(result_future))
     }
 
-    /// Append a single row to the table
+    /// Append a single row to the table.
     ///
     /// Returns:
-    ///     A coroutine that can be awaited for server acknowledgment,
-    ///     or ignored for fire-and-forget behavior.
-    pub fn append<'py>(
-        &self,
-        py: Python<'py>,
-        row: &Bound<'py, PyAny>,
-    ) -> PyResult<Bound<'py, PyAny>> {
+    ///     WriteResultHandle that can be ignored (fire-and-forget) or
+    ///     awaited via `handle.wait()` for server acknowledgment.
+    pub fn append(&self, row: &Bound<'_, PyAny>) -> PyResult<WriteResultHandle> {
         let generic_row = python_to_generic_row(row, &self.table_info)?;
-        let inner = self.inner.clone();
-
-        future_into_py(py, async move {
-            let result_future = inner
-                .append(&generic_row)
-                .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
 
-            Python::attach(|py| {
-                future_into_py(py, async move {
-                    result_future
-                        .await
-                        .map_err(|e| FlussError::new_err(e.to_string()))?;
-                    Ok(())
-                })
-                .map(|bound| bound.unbind())
-            })
-        })
+        let result_future = self
+            .inner
+            .append(&generic_row)
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+        Ok(WriteResultHandle::new(result_future))
     }
 
     /// Write Pandas DataFrame data
@@ -636,16 +603,13 @@ impl AppendWriter {
     }
 
     /// Flush any pending data
-    pub fn flush(&self, py: Python) -> PyResult<()> {
+    pub fn flush<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
         let inner = self.inner.clone();
-        // Release the GIL before blocking on I/O
-        py.detach(|| {
-            TOKIO_RUNTIME.block_on(async {
-                inner
-                    .flush()
-                    .await
-                    .map_err(|e| FlussError::new_err(e.to_string()))
-            })
+        future_into_py(py, async move {
+            inner
+                .flush()
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))
         })
     }
 
diff --git a/fluss-rust/bindings/python/src/upsert.rs b/fluss-rust/bindings/python/src/upsert.rs
index 5c10dedc5a..0aa69d747d 100644
--- a/fluss-rust/bindings/python/src/upsert.rs
+++ b/fluss-rust/bindings/python/src/upsert.rs
@@ -18,26 +18,24 @@
 use crate::table::{python_pk_to_generic_row, python_to_generic_row};
 use crate::*;
 use pyo3_async_runtimes::tokio::future_into_py;
-use std::sync::Arc;
-use tokio::sync::Mutex;
+use std::sync::{Arc, Mutex};
 
 /// Writer for upserting and deleting data in a Fluss primary key table.
 ///
-/// Each upsert/delete operation queues the write and returns a coroutine
-/// that can be awaited for per-record acknowledgment, or ignored for
-/// fire-and-forget semantics (call `flush()` to ensure delivery).
+/// Each upsert/delete operation synchronously queues the write. Call `flush()`
+/// to ensure all queued writes are delivered to the server.
 ///
 /// # Example:
 ///     writer = table.new_upsert()
 ///
-///     # Fire-and-forget with flush
-///     await writer.upsert(row1)
-///     await writer.upsert(row2)
+///     # Fire-and-forget — ignore the returned handle
+///     writer.upsert(row1)
+///     writer.upsert(row2)
 ///     await writer.flush()
 ///
-///     # Or await individual acknowledgment
-///     ack = await writer.upsert(row3)
-///     await ack
+///     # Per-record ack — call wait() on the handle
+///     handle = writer.upsert(critical_row)
+///     await handle.wait()
 #[pyclass]
 pub struct UpsertWriter {
     inner: Arc<UpsertWriterInner>,
@@ -46,7 +44,7 @@ pub struct UpsertWriter {
 struct UpsertWriterInner {
     table_upsert: fcore::client::TableUpsert,
     /// Lazily initialized writer - created on first write operation
-    writer: Mutex<Option<fcore::client::UpsertWriter>>,
+    writer: Mutex<Option<Arc<fcore::client::UpsertWriter>>>,
     table_info: fcore::metadata::TableInfo,
 }
 
@@ -57,100 +55,65 @@ impl UpsertWriter {
     /// If a row with the same primary key exists, it will be updated.
     /// Otherwise, a new row will be inserted.
     ///
+    /// The write is queued synchronously. Call `flush()` to ensure delivery.
+    ///
     /// Args:
     ///     row: A dict, list, or tuple containing the row data.
     ///          For dict: keys are column names, values are column values.
     ///          For list/tuple: values must be in schema order.
-    ///
-    /// Returns:
-    ///     A coroutine that can be awaited for server acknowledgment,
-    ///     or ignored for fire-and-forget behavior.
-    pub fn upsert<'py>(
-        &self,
-        py: Python<'py>,
-        row: &Bound<'_, PyAny>,
-    ) -> PyResult<Bound<'py, PyAny>> {
+    pub fn upsert(&self, row: &Bound<'_, PyAny>) -> PyResult<WriteResultHandle> {
         let generic_row = python_to_generic_row(row, &self.inner.table_info)?;
-        let inner = self.inner.clone();
-
-        future_into_py(py, async move {
-            let mut guard = inner.get_or_create_writer().await?;
-            let writer = guard.as_mut().unwrap();
-            let result_future = writer
-                .upsert(&generic_row)
-                .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
 
-            Python::attach(|py| {
-                future_into_py(py, async move {
-                    result_future
-                        .await
-                        .map_err(|e| FlussError::new_err(e.to_string()))?;
-                    Ok(())
-                })
-                .map(|bound| bound.unbind())
-            })
-        })
+        let writer = self.inner.get_or_create_writer()?;
+        let result_future = writer
+            .upsert(&generic_row)
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+        Ok(WriteResultHandle::new(result_future))
     }
 
     /// Delete a row from the table by primary key.
     ///
+    /// The delete is queued synchronously. Call `flush()` to ensure delivery.
+    ///
     /// Args:
     ///     pk: A dict, list, or tuple containing only the primary key values.
     ///         For dict: keys are PK column names.
     ///         For list/tuple: values in PK column order.
-    ///
-    /// Returns:
-    ///     A coroutine that can be awaited for server acknowledgment,
-    ///     or ignored for fire-and-forget behavior.
-    pub fn delete<'py>(
-        &self,
-        py: Python<'py>,
-        pk: &Bound<'_, PyAny>,
-    ) -> PyResult<Bound<'py, PyAny>> {
+    pub fn delete(&self, pk: &Bound<'_, PyAny>) -> PyResult<WriteResultHandle> {
         let generic_row = python_pk_to_generic_row(pk, &self.inner.table_info)?;
-        let inner = self.inner.clone();
-
-        future_into_py(py, async move {
-            let mut guard = inner.get_or_create_writer().await?;
-            let writer = guard.as_mut().unwrap();
-            let result_future = writer
-                .delete(&generic_row)
-                .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
 
-            Python::attach(|py| {
-                future_into_py(py, async move {
-                    result_future
-                        .await
-                        .map_err(|e| FlussError::new_err(e.to_string()))?;
-                    Ok(())
-                })
-                .map(|bound| bound.unbind())
-            })
-        })
+        let writer = self.inner.get_or_create_writer()?;
+        let result_future = writer
+            .delete(&generic_row)
+            .map_err(|e| FlussError::new_err(e.to_string()))?;
+        Ok(WriteResultHandle::new(result_future))
     }
 
     /// Flush all pending upsert/delete operations to the server.
     ///
-    /// This method sends all buffered operations and blocks until they are
+    /// This method sends all buffered operations and waits until they are
     /// acknowledged according to the writer's ack configuration.
     ///
     /// Returns:
     ///     None on success
     pub fn flush<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        let inner = self.inner.clone();
+        // Clone the Arc<UpsertWriter> out of the lock so we don't hold the guard across await
+        let writer = {
+            let guard = self
+                .inner
+                .writer
+                .lock()
+                .map_err(|e| FlussError::new_err(format!("Lock poisoned: {e}")))?;
+            guard.as_ref().cloned()
+        };
 
         future_into_py(py, async move {
-            let writer_guard = inner.writer.lock().await;
-
-            if let Some(writer) = writer_guard.as_ref() {
+            if let Some(writer) = writer {
                 writer
                     .flush()
                     .await
                     .map_err(|e| FlussError::new_err(e.to_string()))
             } else {
-                // Nothing to flush - no writer was created yet
                 Ok(())
             }
         })
@@ -197,17 +160,18 @@ impl UpsertWriter {
 
 impl UpsertWriterInner {
     /// Get the cached writer or create one on first use.
-    async fn get_or_create_writer(
-        &self,
-    ) -> PyResult<tokio::sync::MutexGuard<'_, Option<fcore::client::UpsertWriter>>> {
-        let mut guard = self.writer.lock().await;
+    fn get_or_create_writer(&self) -> PyResult<Arc<fcore::client::UpsertWriter>> {
+        let mut guard = self
+            .writer
+            .lock()
+            .map_err(|e| FlussError::new_err(format!("Lock poisoned: {e}")))?;
         if guard.is_none() {
             let writer = self
                 .table_upsert
                 .create_writer()
                 .map_err(|e| FlussError::new_err(e.to_string()))?;
-            *guard = Some(writer);
+            *guard = Some(Arc::new(writer));
         }
-        Ok(guard)
+        Ok(guard.as_ref().unwrap().clone())
     }
 }
diff --git a/fluss-rust/bindings/python/src/write_handle.rs b/fluss-rust/bindings/python/src/write_handle.rs
new file mode 100644
index 0000000000..4f3ce99739
--- /dev/null
+++ b/fluss-rust/bindings/python/src/write_handle.rs
@@ -0,0 +1,80 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::*;
+use pyo3_async_runtimes::tokio::future_into_py;
+use std::sync::Mutex;
+
+/// Handle for a pending write operation.
+///
+/// Returned by `upsert()`, `delete()`, `append()`, etc.
+/// Can be safely ignored for fire-and-forget semantics,
+/// or awaited once via `wait()` for per-record acknowledgment.
+///
+/// # Example:
+///     # Fire-and-forget — just ignore the handle
+///     writer.upsert(row1)
+///     writer.upsert(row2)
+///     await writer.flush()
+///
+///     # Per-record ack — call wait() once; a second call raises FlussError
+///     handle = writer.upsert(critical_row)
+///     await handle.wait()
+#[pyclass]
+pub struct WriteResultHandle {
+    inner: Mutex<Option<fcore::client::WriteResultFuture>>,
+}
+
+impl WriteResultHandle {
+    pub fn new(future: fcore::client::WriteResultFuture) -> Self {
+        Self {
+            inner: Mutex::new(Some(future)),
+        }
+    }
+}
+
+#[pymethods]
+impl WriteResultHandle {
+    /// Wait for server acknowledgment of this specific write.
+    ///
+    /// Returns:
+    ///     Awaitable resolving to None; raises FlussError on failure or if called twice.
+    pub fn wait<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let future = self
+            .inner
+            .lock()
+            .map_err(|e| FlussError::new_err(format!("Lock poisoned: {e}")))?
+            .take()
+            .ok_or_else(|| FlussError::new_err("WriteResultHandle already consumed"))?;
+
+        future_into_py(py, async move {
+            future
+                .await
+                .map_err(|e| FlussError::new_err(e.to_string()))?;
+            Ok(())
+        })
+    }
+
+    fn __repr__(&self) -> String {
+        let consumed = self.inner.lock().map(|g| g.is_none()).unwrap_or(false);
+        if consumed {
+            "WriteResultHandle(consumed)".to_string()
+        } else {
+            "WriteResultHandle(pending)".to_string()
+        }
+    }
+}
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 2fcb134258..3acf73f2bf 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -62,7 +62,7 @@ pub async fn main() -> Result<()> {
         row.set_field(0, id);
         row.set_field(1, name);
         row.set_field(2, age);
-        upsert_writer.upsert(&row).await?;
+        upsert_writer.upsert(&row)?;
         println!("Upserted: {row:?}");
     }
     upsert_writer.flush().await?;
@@ -85,7 +85,7 @@ pub async fn main() -> Result<()> {
     row.set_field(0, 1);
     row.set_field(1, "Verso");
     row.set_field(2, 33i64);
-    upsert_writer.upsert(&row).await?.await?;
+    upsert_writer.upsert(&row)?.await?;
     println!("Updated: {row:?}");
 
     let result = lookuper.lookup(&make_key(1)).await?;
@@ -100,7 +100,7 @@ pub async fn main() -> Result<()> {
     // For delete, only primary key field needs to be set; other fields can remain null
     let mut row = GenericRow::new(3);
     row.set_field(0, 2);
-    upsert_writer.delete(&row).await?.await?;
+    upsert_writer.delete(&row)?.await?;
     println!("Deleted row with id=2");
 
     let result = lookuper.lookup(&make_key(2)).await?;
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index feb8f05b0d..ee1f541fb7 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -74,7 +74,7 @@ pub async fn main() -> Result<()> {
         row.set_field(1, region);
         row.set_field(2, zone);
         row.set_field(3, score);
-        upsert_writer.upsert(&row).await?;
+        upsert_writer.upsert(&row)?;
         println!("Upserted: {row:?}");
     }
     upsert_writer.flush().await?;
@@ -102,7 +102,7 @@ pub async fn main() -> Result<()> {
     row.set_field(1, "APAC");
     row.set_field(2, 1i64);
     row.set_field(3, 4321i64);
-    upsert_writer.upsert(&row).await?.await?;
+    upsert_writer.upsert(&row)?.await?;
     println!("Updated: {row:?}");
 
     let result = lookuper.lookup(&make_key(1001, "APAC", 1)).await?;
@@ -118,7 +118,7 @@ pub async fn main() -> Result<()> {
     row.set_field(0, 1002);
     row.set_field(1, "EMEA");
     row.set_field(2, 2i64);
-    upsert_writer.delete(&row).await?.await?;
+    upsert_writer.delete(&row)?.await?;
     println!("Deleted: {row:?}");
 
     let result = lookuper.lookup(&make_key(1002, "EMEA", 2)).await?;
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index ee9bc7b349..199fce2347 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -64,12 +64,12 @@ pub async fn main() -> Result<()> {
     let table = conn.get_table(&table_path).await?;
     let append_writer = table.new_append()?.create_writer()?;
     // Fire-and-forget: queue writes then flush
-    append_writer.append(&row).await?;
+    append_writer.append(&row)?;
     let mut row = GenericRow::new(3);
     row.set_field(0, 233333);
     row.set_field(1, "tt44");
     row.set_field(2, 987_654_321_987i64);
-    append_writer.append(&row).await?;
+    append_writer.append(&row)?;
     append_writer.flush().await?;
 
     // scan rows
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
index e26b61adac..942253fa19 100644
--- a/fluss-rust/crates/fluss/src/client/table/append.rs
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -80,7 +80,7 @@ impl AppendWriter {
     /// # Returns
     /// A [`WriteResultFuture`] that can be awaited to wait for server acknowledgment,
     /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
-    pub async fn append<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
+    pub fn append<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
         let physical_table_path = Arc::new(get_physical_path(
             &self.table_path,
             self.partition_getter.as_ref(),
@@ -92,7 +92,7 @@ impl AppendWriter {
             self.table_info.schema_id,
             row,
         );
-        let result_handle = self.writer_client.send(&record).await?;
+        let result_handle = self.writer_client.send(&record)?;
         Ok(WriteResultFuture::new(result_handle))
     }
 
@@ -107,7 +107,7 @@ impl AppendWriter {
     /// # Returns
     /// A [`WriteResultFuture`] that can be awaited to wait for server acknowledgment,
     /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
-    pub async fn append_arrow_batch(&self, batch: RecordBatch) -> Result<WriteResultFuture> {
+    pub fn append_arrow_batch(&self, batch: RecordBatch) -> Result<WriteResultFuture> {
         let physical_table_path = if self.partition_getter.is_some() && batch.num_rows() > 0 {
             let first_row = ColumnarRow::new(Arc::new(batch.clone()));
             Arc::new(get_physical_path(
@@ -125,7 +125,7 @@ impl AppendWriter {
             self.table_info.schema_id,
             batch,
         );
-        let result_handle = self.writer_client.send(&record).await?;
+        let result_handle = self.writer_client.send(&record)?;
         Ok(WriteResultFuture::new(result_handle))
     }
 
diff --git a/fluss-rust/crates/fluss/src/client/table/upsert.rs b/fluss-rust/crates/fluss/src/client/table/upsert.rs
index a1646cc35c..7057b9013d 100644
--- a/fluss-rust/crates/fluss/src/client/table/upsert.rs
+++ b/fluss-rust/crates/fluss/src/client/table/upsert.rs
@@ -354,7 +354,7 @@ impl UpsertWriter {
     /// # Returns
     /// A [`WriteResultFuture`] that can be awaited to wait for server acknowledgment,
     /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
-    pub async fn upsert<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
+    pub fn upsert<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
         self.check_field_count(row)?;
 
         let (key, bucket_key) = self.get_keys(row)?;
@@ -379,7 +379,7 @@ impl UpsertWriter {
             Some(row_bytes),
         );
 
-        let result_handle = self.writer_client.send(&write_record).await?;
+        let result_handle = self.writer_client.send(&write_record)?;
         Ok(WriteResultFuture::new(result_handle))
     }
 
@@ -395,7 +395,7 @@ impl UpsertWriter {
     /// # Returns
     /// A [`WriteResultFuture`] that can be awaited to wait for server acknowledgment,
     /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
-    pub async fn delete<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
+    pub fn delete<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
         self.check_field_count(row)?;
 
         let (key, bucket_key) = self.get_keys(row)?;
@@ -415,7 +415,7 @@ impl UpsertWriter {
             None,
         );
 
-        let result_handle = self.writer_client.send(&write_record).await?;
+        let result_handle = self.writer_client.send(&write_record)?;
         Ok(WriteResultFuture::new(result_handle))
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 5eae868dd7..2c36452470 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -25,11 +25,11 @@ use crate::metadata::{PhysicalTablePath, TableBucket};
 use crate::util::current_time_ms;
 use crate::{BucketId, PartitionId, TableId};
 use dashmap::DashMap;
+use parking_lot::Mutex;
 use parking_lot::RwLock;
 use std::collections::{HashMap, HashSet, VecDeque};
 use std::sync::Arc;
 use std::sync::atomic::{AtomicI32, AtomicI64, Ordering};
-use tokio::sync::Mutex;
 
 // Type alias to simplify complex nested types
 type BucketBatches = Vec<(BucketId, Arc<Mutex<VecDeque<WriteBatch>>>)>;
@@ -144,7 +144,7 @@ impl RecordAccumulator {
         ))
     }
 
-    pub async fn append(
+    pub fn append(
         &self,
         record: &WriteRecord<'_>,
         bucket_id: BucketId,
@@ -180,7 +180,7 @@ impl RecordAccumulator {
                 .clone()
         };
 
-        let mut dq_guard = dq.lock().await;
+        let mut dq_guard = dq.lock();
         if let Some(append_result) = self.try_append(record, &mut dq_guard)? {
             return Ok(append_result);
         }
@@ -193,7 +193,7 @@ impl RecordAccumulator {
         self.append_new_batch(cluster, record, &mut dq_guard)
     }
 
-    pub async fn ready(&self, cluster: &Arc<Cluster>) -> Result<ReadyCheckResult> {
+    pub fn ready(&self, cluster: &Arc<Cluster>) -> Result<ReadyCheckResult> {
         // Snapshot just the Arcs we need, avoiding cloning the entire BucketAndWriteBatches struct
         let entries: Vec<(Arc<PhysicalTablePath>, Option<PartitionId>, BucketBatches)> = self
             .write_batches
@@ -216,18 +216,16 @@ impl RecordAccumulator {
         let mut unknown_leader_tables = HashSet::new();
 
         for (physical_table_path, mut partition_id, bucket_batches) in entries {
-            next_ready_check_delay_ms = self
-                .bucket_ready(
-                    &physical_table_path,
-                    physical_table_path.get_partition_name().is_some(),
-                    &mut partition_id,
-                    bucket_batches,
-                    &mut ready_nodes,
-                    &mut unknown_leader_tables,
-                    cluster,
-                    next_ready_check_delay_ms,
-                )
-                .await?
+            next_ready_check_delay_ms = self.bucket_ready(
+                &physical_table_path,
+                physical_table_path.get_partition_name().is_some(),
+                &mut partition_id,
+                bucket_batches,
+                &mut ready_nodes,
+                &mut unknown_leader_tables,
+                cluster,
+                next_ready_check_delay_ms,
+            )?
         }
 
         Ok(ReadyCheckResult {
@@ -238,7 +236,7 @@ impl RecordAccumulator {
     }
 
     #[allow(clippy::too_many_arguments)]
-    async fn bucket_ready(
+    fn bucket_ready(
         &self,
         physical_table_path: &Arc<PhysicalTablePath>,
         is_partitioned_table: bool,
@@ -274,7 +272,7 @@ impl RecordAccumulator {
         }
 
         for (bucket_id, batch) in bucket_batches {
-            let batch_guard = batch.lock().await;
+            let batch_guard = batch.lock();
             if batch_guard.is_empty() {
                 continue;
             }
@@ -316,7 +314,7 @@ impl RecordAccumulator {
         next_ready_check_delay_ms
     }
 
-    pub async fn drain(
+    pub fn drain(
         &self,
         cluster: Arc<Cluster>,
         nodes: &HashSet<ServerNode>,
@@ -327,9 +325,7 @@ impl RecordAccumulator {
         }
         let mut batches = HashMap::new();
         for node in nodes {
-            let ready = self
-                .drain_batches_for_one_node(&cluster, node, max_size)
-                .await?;
+            let ready = self.drain_batches_for_one_node(&cluster, node, max_size)?;
             if !ready.is_empty() {
                 batches.insert(node.id(), ready);
             }
@@ -338,7 +334,7 @@ impl RecordAccumulator {
         Ok(batches)
     }
 
-    async fn drain_batches_for_one_node(
+    fn drain_batches_for_one_node(
         &self,
         cluster: &Cluster,
         node: &ServerNode,
@@ -352,15 +348,13 @@ impl RecordAccumulator {
             return Ok(ready);
         }
 
-        // Get the start index without holding the lock across awaits
         let start = {
-            let mut nodes_drain_index_guard = self.nodes_drain_index.lock().await;
+            let mut nodes_drain_index_guard = self.nodes_drain_index.lock();
             let drain_index = nodes_drain_index_guard.entry(node.id()).or_insert(0);
             *drain_index % buckets.len()
         };
 
         let mut current_index = start;
-        // Assigned at the start of each loop iteration (line 323), used after loop (line 376)
         let mut last_processed_index;
 
         loop {
@@ -383,7 +377,7 @@ impl RecordAccumulator {
             if let Some(deque) = deque {
                 let mut maybe_batch = None;
                 {
-                    let mut batch_lock = deque.lock().await;
+                    let mut batch_lock = deque.lock();
                     if !batch_lock.is_empty() {
                         let first_batch = batch_lock.front().unwrap();
 
@@ -419,7 +413,7 @@ impl RecordAccumulator {
 
         // Store the last processed index to maintain round-robin fairness
         {
-            let mut nodes_drain_index_guard = self.nodes_drain_index.lock().await;
+            let mut nodes_drain_index_guard = self.nodes_drain_index.lock();
             nodes_drain_index_guard.insert(node.id(), last_processed_index);
         }
 
@@ -430,7 +424,7 @@ impl RecordAccumulator {
         self.incomplete_batches.write().remove(&batch_id);
     }
 
-    pub async fn re_enqueue(&self, ready_write_batch: ReadyWriteBatch) {
+    pub fn re_enqueue(&self, ready_write_batch: ReadyWriteBatch) {
         ready_write_batch.write_batch.re_enqueued();
         let physical_table_path = ready_write_batch.write_batch.physical_table_path();
         let bucket_id = ready_write_batch.table_bucket.bucket_id();
@@ -456,7 +450,7 @@ impl RecordAccumulator {
                 .clone()
         };
 
-        let mut dq_guard = dq.lock().await;
+        let mut dq_guard = dq.lock();
         dq_guard.push_front(ready_write_batch.write_batch);
     }
 
@@ -604,20 +598,18 @@ mod tests {
         };
         let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
 
-        accumulator.append(&record, 0, &cluster, false).await?;
+        accumulator.append(&record, 0, &cluster, false)?;
 
         let server = cluster.get_tablet_server(1).expect("server");
         let nodes = HashSet::from([server.clone()]);
-        let mut batches = accumulator
-            .drain(cluster.clone(), &nodes, 1024 * 1024)
-            .await?;
+        let mut batches = accumulator.drain(cluster.clone(), &nodes, 1024 * 1024)?;
         let mut drained = batches.remove(&1).expect("drained batches");
         let batch = drained.pop().expect("batch");
         assert_eq!(batch.write_batch.attempts(), 0);
 
-        accumulator.re_enqueue(batch).await;
+        accumulator.re_enqueue(batch);
 
-        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024).await?;
+        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024)?;
         let mut drained = batches.remove(&1).expect("drained batches");
         let batch = drained.pop().expect("batch");
         assert_eq!(batch.write_batch.attempts(), 1);
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index 49eff05d2b..2c848d3555 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -205,8 +205,8 @@ impl ResultHandle {
 /// A future that represents a pending write operation.
 ///
 /// This type implements [`Future`], allowing users to either:
-/// 1. Await immediately to block on acknowledgment: `writer.upsert(&row).await?.await?`
-/// 2. Fire-and-forget with later flush: `writer.upsert(&row).await?; writer.flush().await?`
+/// 1. Await immediately to block on acknowledgment: `writer.upsert(&row)?.await?`
+/// 2. Fire-and-forget with later flush: `writer.upsert(&row)?; writer.flush().await?`
 ///
 /// This pattern is similar to rdkafka's `DeliveryFuture` and allows for efficient batching
 /// when users don't need immediate per-record acknowledgment.
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index f336d0cdca..069f2d2ba1 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -78,7 +78,7 @@ impl Sender {
 
     async fn run_once(&self) -> Result<()> {
         let cluster = self.metadata.get_cluster();
-        let ready_check_result = self.accumulator.ready(&cluster).await?;
+        let ready_check_result = self.accumulator.ready(&cluster)?;
 
         // Update metadata if needed
         if !ready_check_result.unknown_leader_tables.is_empty() {
@@ -124,14 +124,11 @@ impl Sender {
             return Ok(());
         }
 
-        let batches = self
-            .accumulator
-            .drain(
-                cluster.clone(),
-                &ready_check_result.ready_nodes,
-                self.max_request_size,
-            )
-            .await?;
+        let batches = self.accumulator.drain(
+            cluster.clone(),
+            &ready_check_result.ready_nodes,
+            self.max_request_size,
+        )?;
 
         if !batches.is_empty() {
             self.add_to_inflight_batches(&batches);
@@ -233,8 +230,7 @@ impl Sender {
                     self.handle_batches_with_local_error(
                         request_batches,
                         format!("Failed to build write request: {e}"),
-                    )
-                    .await?;
+                    )?;
                     continue;
                 }
             };
@@ -377,9 +373,8 @@ impl Sender {
                         .error_message()
                         .cloned()
                         .unwrap_or_else(|| error.message().to_string());
-                    if let Some(physical_table_path) = self
-                        .handle_write_batch_error(ready_batch, error, message)
-                        .await?
+                    if let Some(physical_table_path) =
+                        self.handle_write_batch_error(ready_batch, error, message)?
                     {
                         invalid_metadata_tables
                             .insert(physical_table_path.get_table_path().clone());
@@ -392,14 +387,11 @@ impl Sender {
 
         for bucket in pending_buckets {
             if let Some(ready_batch) = records_by_bucket.remove(&bucket) {
-                if let Some(physical_table_path) = self
-                    .handle_write_batch_error(
-                        ready_batch,
-                        FlussError::UnknownServerError,
-                        format!("Missing response for table bucket {bucket}"),
-                    )
-                    .await?
-                {
+                if let Some(physical_table_path) = self.handle_write_batch_error(
+                    ready_batch,
+                    FlussError::UnknownServerError,
+                    format!("Missing response for table bucket {bucket}"),
+                )? {
                     invalid_metadata_tables.insert(physical_table_path.get_table_path().clone());
                     invalid_physical_table_paths.insert(physical_table_path);
                 }
@@ -438,9 +430,8 @@ impl Sender {
         let mut invalid_physical_table_paths: HashSet<Arc<PhysicalTablePath>> = HashSet::new();
 
         for batch in batches {
-            if let Some(physical_table_path) = self
-                .handle_write_batch_error(batch, error, message.clone())
-                .await?
+            if let Some(physical_table_path) =
+                self.handle_write_batch_error(batch, error, message.clone())?
             {
                 invalid_metadata_tables.insert(physical_table_path.get_table_path().clone());
                 invalid_physical_table_paths.insert(physical_table_path);
@@ -451,7 +442,7 @@ impl Sender {
         Ok(())
     }
 
-    async fn handle_batches_with_local_error(
+    fn handle_batches_with_local_error(
         &self,
         batches: Vec<ReadyWriteBatch>,
         message: String,
@@ -467,7 +458,7 @@ impl Sender {
         Ok(())
     }
 
-    async fn handle_write_batch_error(
+    fn handle_write_batch_error(
         &self,
         ready_write_batch: ReadyWriteBatch,
         error: FlussError,
@@ -480,7 +471,7 @@ impl Sender {
                 physical_table_path.as_ref(),
                 ready_write_batch.table_bucket.bucket_id()
             );
-            self.re_enqueue_batch(ready_write_batch).await;
+            self.re_enqueue_batch(ready_write_batch);
             return Ok(Self::is_invalid_metadata_error(error).then_some(physical_table_path));
         }
 
@@ -504,9 +495,9 @@ impl Sender {
         Ok(Self::is_invalid_metadata_error(error).then_some(physical_table_path))
     }
 
-    async fn re_enqueue_batch(&self, ready_write_batch: ReadyWriteBatch) {
+    fn re_enqueue_batch(&self, ready_write_batch: ReadyWriteBatch) {
         self.remove_from_inflight_batches(&ready_write_batch);
-        self.accumulator.re_enqueue(ready_write_batch).await;
+        self.accumulator.re_enqueue(ready_write_batch);
     }
 
     fn remove_from_inflight_batches(&self, ready_write_batch: &ReadyWriteBatch) {
@@ -656,7 +647,7 @@ mod tests {
     use crate::test_utils::{build_cluster_arc, build_table_info};
     use std::collections::{HashMap, HashSet};
 
-    async fn build_ready_batch(
+    fn build_ready_batch(
         accumulator: &RecordAccumulator,
         cluster: Arc<Cluster>,
         table_path: Arc<TablePath>,
@@ -667,11 +658,11 @@ mod tests {
             values: vec![Datum::Int32(1)],
         };
         let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
-        let result = accumulator.append(&record, 0, &cluster, false).await?;
+        let result = accumulator.append(&record, 0, &cluster, false)?;
         let result_handle = result.result_handle.expect("result handle");
         let server = cluster.get_tablet_server(1).expect("server");
         let nodes = HashSet::from([server.clone()]);
-        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024).await?;
+        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024)?;
         let mut drained = batches.remove(&1).expect("drained batches");
         let batch = drained.pop().expect("batch");
         Ok((batch, result_handle))
@@ -686,19 +677,21 @@ mod tests {
         let sender = Sender::new(metadata, accumulator.clone(), 1024 * 1024, 1000, 1, 1);
 
         let (batch, _handle) =
-            build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path.clone()).await?;
+            build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path.clone())?;
         let mut inflight = HashMap::new();
         inflight.insert(1, vec![batch]);
         sender.add_to_inflight_batches(&inflight);
         let batch = inflight.remove(&1).unwrap().pop().unwrap();
 
-        sender
-            .handle_write_batch_error(batch, FlussError::RequestTimeOut, "timeout".to_string())
-            .await?;
+        sender.handle_write_batch_error(
+            batch,
+            FlussError::RequestTimeOut,
+            "timeout".to_string(),
+        )?;
 
         let server = cluster.get_tablet_server(1).expect("server");
         let nodes = HashSet::from([server.clone()]);
-        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024).await?;
+        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024)?;
         let mut drained = batches.remove(&1).expect("drained batches");
         let batch = drained.pop().expect("batch");
         assert_eq!(batch.write_batch.attempts(), 1);
@@ -713,15 +706,12 @@ mod tests {
         let accumulator = Arc::new(RecordAccumulator::new(Config::default()));
         let sender = Sender::new(metadata, accumulator.clone(), 1024 * 1024, 1000, 1, 0);
 
-        let (batch, handle) =
-            build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path).await?;
-        sender
-            .handle_write_batch_error(
-                batch,
-                FlussError::InvalidTableException,
-                "invalid".to_string(),
-            )
-            .await?;
+        let (batch, handle) = build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path)?;
+        sender.handle_write_batch_error(
+            batch,
+            FlussError::InvalidTableException,
+            "invalid".to_string(),
+        )?;
 
         let batch_result = handle.wait().await?;
         assert!(matches!(
@@ -740,7 +730,7 @@ mod tests {
         let accumulator = Arc::new(RecordAccumulator::new(Config::default()));
         let sender = Sender::new(metadata, accumulator.clone(), 1024 * 1024, 1000, 1, 0);
 
-        let (batch, handle) = build_ready_batch(accumulator.as_ref(), cluster, table_path).await?;
+        let (batch, handle) = build_ready_batch(accumulator.as_ref(), cluster, table_path)?;
         let request_buckets = vec![batch.table_bucket.clone()];
         let mut records_by_bucket = HashMap::new();
         records_by_bucket.insert(batch.table_bucket.clone(), batch);
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index c386adf70e..330affaaaa 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -91,7 +91,7 @@ impl WriterClient {
         }
     }
 
-    pub async fn send(&self, record: &WriteRecord<'_>) -> Result<ResultHandle> {
+    pub fn send(&self, record: &WriteRecord<'_>) -> Result<ResultHandle> {
         let physical_table_path = &record.physical_table_path;
         let cluster = self.metadata.get_cluster();
         let bucket_key = record.bucket_key.as_ref();
@@ -99,19 +99,13 @@ impl WriterClient {
         let (bucket_assigner, bucket_id) =
             self.assign_bucket(&record.table_info, bucket_key, physical_table_path)?;
 
-        let mut result = self
-            .accumulate
-            .append(record, bucket_id, &cluster, true)
-            .await?;
+        let mut result = self.accumulate.append(record, bucket_id, &cluster, true)?;
 
         if result.abort_record_for_new_batch {
             let prev_bucket_id = bucket_id;
             bucket_assigner.on_new_batch(&cluster, prev_bucket_id);
             let bucket_id = bucket_assigner.assign_bucket(bucket_key, &cluster)?;
-            result = self
-                .accumulate
-                .append(record, bucket_id, &cluster, false)
-                .await?;
+            result = self.accumulate.append(record, bucket_id, &cluster, false)?;
         }
 
         if result.batch_is_full || result.new_batch_created {
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index 0bfe4a370c..ab5f5b6f32 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -101,10 +101,7 @@ mod kv_table_test {
             row.set_field(0, *id);
             row.set_field(1, *name);
             row.set_field(2, *age);
-            upsert_writer
-                .upsert(&row)
-                .await
-                .expect("Failed to upsert row");
+            upsert_writer.upsert(&row).expect("Failed to upsert row");
         }
         upsert_writer.flush().await.expect("Failed to flush");
 
@@ -138,7 +135,6 @@ mod kv_table_test {
         updated_row.set_field(2, 33i64);
         upsert_writer
             .upsert(&updated_row)
-            .await
             .expect("Failed to upsert updated row")
             .await
             .expect("Failed to wait for upsert acknowledgment");
@@ -168,7 +164,6 @@ mod kv_table_test {
         delete_row.set_field(0, 1);
         upsert_writer
             .delete(&delete_row)
-            .await
             .expect("Failed to delete")
             .await
             .expect("Failed to wait for delete acknowledgment");
@@ -268,7 +263,7 @@ mod kv_table_test {
             row.set_field(0, *region);
             row.set_field(1, *user_id);
             row.set_field(2, *score);
-            upsert_writer.upsert(&row).await.expect("Failed to upsert");
+            upsert_writer.upsert(&row).expect("Failed to upsert");
         }
         upsert_writer.flush().await.expect("Failed to flush");
 
@@ -308,7 +303,6 @@ mod kv_table_test {
         update_row.set_field(2, 500i64);
         upsert_writer
             .upsert(&update_row)
-            .await
             .expect("Failed to update")
             .await
             .expect("Failed to wait for update acknowledgment");
@@ -379,7 +373,6 @@ mod kv_table_test {
         row.set_field(3, 6942i64);
         upsert_writer
             .upsert(&row)
-            .await
             .expect("Failed to upsert initial row")
             .await
             .expect("Failed to wait for upsert acknowledgment");
@@ -421,7 +414,6 @@ mod kv_table_test {
         partial_row.set_field(3, 420i64);
         partial_writer
             .upsert(&partial_row)
-            .await
             .expect("Failed to upsert")
             .await
             .expect("Failed to wait for upsert acknowledgment");
@@ -509,7 +501,7 @@ mod kv_table_test {
             row.set_field(1, *user_id);
             row.set_field(2, *name);
             row.set_field(3, *score);
-            upsert_writer.upsert(&row).await.expect("Failed to upsert");
+            upsert_writer.upsert(&row).expect("Failed to upsert");
         }
         upsert_writer.flush().await.expect("Failed to flush");
 
@@ -546,7 +538,6 @@ mod kv_table_test {
         updated_row.set_field(3, 999i64);
         upsert_writer
             .upsert(&updated_row)
-            .await
             .expect("Failed to upsert updated row")
             .await
             .expect("Failed to wait for upsert acknowledgment");
@@ -585,7 +576,6 @@ mod kv_table_test {
         delete_key.set_field(1, 1);
         upsert_writer
             .delete(&delete_key)
-            .await
             .expect("Failed to delete")
             .await
             .expect("Failed to wait for delete acknowledgment");
@@ -721,7 +711,6 @@ mod kv_table_test {
 
         upsert_writer
             .upsert(&row)
-            .await
             .expect("Failed to upsert row with all datatypes")
             .await
             .expect("Failed to wait for upsert acknowledgment");
@@ -826,7 +815,6 @@ mod kv_table_test {
 
         upsert_writer
             .upsert(&row_with_nulls)
-            .await
             .expect("Failed to upsert row with nulls")
             .await
             .expect("Failed to wait for upsert acknowledgment");
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index ed90fd0521..82f8135206 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -99,14 +99,12 @@ mod table_test {
             record_batch!(("c1", Int32, [1, 2, 3]), ("c2", Utf8, ["a1", "a2", "a3"])).unwrap();
         append_writer
             .append_arrow_batch(batch1)
-            .await
             .expect("Failed to append batch");
 
         let batch2 =
             record_batch!(("c1", Int32, [4, 5, 6]), ("c2", Utf8, ["a4", "a5", "a6"])).unwrap();
         append_writer
             .append_arrow_batch(batch2)
-            .await
             .expect("Failed to append batch");
 
         // Flush to ensure all writes are acknowledged
@@ -230,7 +228,6 @@ mod table_test {
         .unwrap();
         append_writer
             .append_arrow_batch(batch)
-            .await
             .expect("Failed to append batch");
 
         // Flush to ensure all writes are acknowledged
@@ -332,7 +329,6 @@ mod table_test {
         .unwrap();
         append_writer
             .append_arrow_batch(batch)
-            .await
             .expect("Failed to append batch");
         append_writer.flush().await.expect("Failed to flush");
 
@@ -485,19 +481,16 @@ mod table_test {
             .append_arrow_batch(
                 record_batch!(("id", Int32, [1, 2]), ("name", Utf8, ["a", "b"])).unwrap(),
             )
-            .await
             .unwrap();
         writer
             .append_arrow_batch(
                 record_batch!(("id", Int32, [3, 4]), ("name", Utf8, ["c", "d"])).unwrap(),
             )
-            .await
             .unwrap();
         writer
             .append_arrow_batch(
                 record_batch!(("id", Int32, [5, 6]), ("name", Utf8, ["e", "f"])).unwrap(),
             )
-            .await
             .unwrap();
         writer.flush().await.unwrap();
 
@@ -536,7 +529,6 @@ mod table_test {
             .append_arrow_batch(
                 record_batch!(("id", Int32, [7, 8]), ("name", Utf8, ["g", "h"])).unwrap(),
             )
-            .await
             .unwrap();
         writer.flush().await.unwrap();
 
@@ -752,7 +744,6 @@ mod table_test {
 
         append_writer
             .append(&row)
-            .await
             .expect("Failed to append row with all datatypes");
 
         // Append a row with null values for all columns
@@ -763,7 +754,6 @@ mod table_test {
 
         append_writer
             .append(&row_with_nulls)
-            .await
             .expect("Failed to append row with nulls");
 
         append_writer.flush().await.expect("Failed to flush");
@@ -1026,10 +1016,7 @@ mod table_test {
             row.set_field(0, *id);
             row.set_field(1, *region);
             row.set_field(2, *value);
-            append_writer
-                .append(&row)
-                .await
-                .expect("Failed to append row");
+            append_writer.append(&row).expect("Failed to append row");
         }
 
         append_writer.flush().await.expect("Failed to flush");
@@ -1044,7 +1031,6 @@ mod table_test {
         .unwrap();
         append_writer
             .append_arrow_batch(us_batch)
-            .await
             .expect("Failed to append US batch");
 
         let eu_batch = record_batch!(
@@ -1055,7 +1041,6 @@ mod table_test {
         .unwrap();
         append_writer
             .append_arrow_batch(eu_batch)
-            .await
             .expect("Failed to append EU batch");
 
         append_writer
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index 0efe388247..baac77298a 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -148,12 +148,11 @@ mod table_remote_scan_test {
             row.set_field(0, i as i32);
             let v = format!("v{}", i);
             row.set_field(1, v.as_str());
-            append_writer
-                .append(&row)
-                .await
-                .expect("Failed to append row");
+            append_writer.append(&row).expect("Failed to append row");
         }
 
+        append_writer.flush().await.expect("Failed to flush");
+
         // Create a log scanner and subscribe to all buckets to read appended records
         let num_buckets = table.table_info().get_num_buckets();
         let log_scanner = table

From f0a740e9f3d76fde32308a32cf9de28118d175a5 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 8 Feb 2026 00:35:38 +0000
Subject: [PATCH 121/287] feat: Add unsubscribe_partition to python bindings
 (#277)

---
 fluss-rust/bindings/python/example/example.py | 13 +++++++++++++
 fluss-rust/bindings/python/fluss/__init__.pyi |  8 ++++++++
 fluss-rust/bindings/python/src/table.rs       | 17 +++++++++++++++++
 3 files changed, 38 insertions(+)

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index d56879a430..dd7f1b14a8 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -717,6 +717,19 @@ async def main():
         print(f"\nto_arrow() returned {partitioned_arrow.num_rows} records from partitioned table:")
         print(partitioned_arrow.to_pandas())
 
+        # Demo: unsubscribe_partition - unsubscribe from one partition, read remaining
+        print("\n--- Testing unsubscribe_partition ---")
+        partitioned_scanner3 = await partitioned_table.new_scan().create_batch_scanner()
+        for p in partition_infos:
+            partitioned_scanner3.subscribe_partition(p.partition_id, 0, fluss.EARLIEST_OFFSET)
+        # Unsubscribe from the first partition
+        first_partition = partition_infos[0]
+        partitioned_scanner3.unsubscribe_partition(first_partition.partition_id, 0)
+        print(f"Unsubscribed from partition {first_partition.partition_name} (id={first_partition.partition_id})")
+        remaining_arrow = partitioned_scanner3.to_arrow()
+        print(f"After unsubscribe, to_arrow() returned {remaining_arrow.num_rows} records (from remaining partitions):")
+        print(remaining_arrow.to_pandas())
+
         # Demo: to_pandas() also works for partitioned tables
         print("\n--- Testing to_pandas() on partitioned table ---")
         partitioned_scanner2 = await partitioned_table.new_scan().create_batch_scanner()
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index a2bbaac401..526dad7840 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -420,6 +420,14 @@ class LogScanner:
             start_offset: The offset to start reading from (use EARLIEST_OFFSET for beginning)
         """
         ...
+    def unsubscribe_partition(self, partition_id: int, bucket_id: int) -> None:
+        """Unsubscribe from a specific partition bucket (partitioned tables only).
+
+        Args:
+            partition_id: The partition ID to unsubscribe from
+            bucket_id: The bucket ID within the partition
+        """
+        ...
     def poll(self, timeout_ms: int) -> List[ScanRecord]:
         """Poll for individual records with metadata.
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 8af6b13e69..1a7dbdcecd 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -1657,6 +1657,23 @@ impl LogScanner {
         })
     }
 
+    /// Unsubscribe from a specific partition bucket (partitioned tables only).
+    ///
+    /// Args:
+    ///     partition_id: The partition ID to unsubscribe from
+    ///     bucket_id: The bucket ID within the partition
+    fn unsubscribe_partition(&self, py: Python, partition_id: i64, bucket_id: i32) -> PyResult<()> {
+        py.detach(|| {
+            TOKIO_RUNTIME.block_on(async {
+                with_scanner!(
+                    &self.scanner,
+                    unsubscribe_partition(partition_id, bucket_id)
+                )
+                .map_err(|e| FlussError::new_err(e.to_string()))
+            })
+        })
+    }
+
     /// Poll for individual records with metadata.
     ///
     /// Args:

From b05a497be1148b9c2f0bb4a1016c0187b0e72366 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 8 Feb 2026 09:01:45 +0800
Subject: [PATCH 122/287] build: add how to release doc (#268)

---
 .../actions/verify-tag-version/action.yml     |  37 ++
 fluss-rust/.github/release.yml                |  42 ++
 .../.github/workflows/release_python.yml      | 174 +++++++
 fluss-rust/.github/workflows/release_rust.yml |  60 +++
 fluss-rust/Cargo.toml                         |  12 +-
 fluss-rust/README.md                          |   4 +
 fluss-rust/bindings/cpp/Cargo.toml            |   6 +-
 fluss-rust/bindings/python/Cargo.toml         |   8 +-
 fluss-rust/bindings/python/pyproject.toml     |   7 +-
 fluss-rust/crates/examples/Cargo.toml         |   2 +-
 fluss-rust/crates/fluss/Cargo.toml            |   9 +-
 fluss-rust/docs/assets/release-guide.png      | Bin 0 -> 363329 bytes
 fluss-rust/docs/creating-a-release.md         | 453 ++++++++++++++++++
 fluss-rust/docs/generate-release-note.md      |  28 ++
 fluss-rust/justfile                           |  28 ++
 fluss-rust/scripts/bump-version.sh            |  54 +++
 fluss-rust/scripts/constants.py               |  45 ++
 fluss-rust/scripts/dependencies.py            |  96 ++++
 fluss-rust/scripts/release.sh                 |  66 +++
 19 files changed, 1114 insertions(+), 17 deletions(-)
 create mode 100644 fluss-rust/.github/actions/verify-tag-version/action.yml
 create mode 100644 fluss-rust/.github/release.yml
 create mode 100644 fluss-rust/.github/workflows/release_python.yml
 create mode 100644 fluss-rust/.github/workflows/release_rust.yml
 create mode 100644 fluss-rust/docs/assets/release-guide.png
 create mode 100644 fluss-rust/docs/creating-a-release.md
 create mode 100644 fluss-rust/docs/generate-release-note.md
 create mode 100644 fluss-rust/justfile
 create mode 100755 fluss-rust/scripts/bump-version.sh
 create mode 100644 fluss-rust/scripts/constants.py
 create mode 100644 fluss-rust/scripts/dependencies.py
 create mode 100755 fluss-rust/scripts/release.sh

diff --git a/fluss-rust/.github/actions/verify-tag-version/action.yml b/fluss-rust/.github/actions/verify-tag-version/action.yml
new file mode 100644
index 0000000000..ad16b4f979
--- /dev/null
+++ b/fluss-rust/.github/actions/verify-tag-version/action.yml
@@ -0,0 +1,37 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+# Verify that the pushed tag version matches the workspace package version in Cargo.toml.
+# A tag of v0.2.0 or v0.2.0-rc1 matches Cargo version 0.2.0: the -rc* suffix is stripped from both versions before comparing.
+# Requires a checkout step before this one (Cargo.toml must be in the workspace root). Intended for tag pushes (GITHUB_REF like refs/tags/v0.1.0).
+
+name: 'Verify tag matches crate version'
+description: 'Exits with error if GITHUB_REF tag base version does not match [workspace.package] version in Cargo.toml (strips -rc*).'
+
+runs:
+  using: 'composite'
+  steps:
+    - run: |
+        TAG_VERSION="${GITHUB_REF#refs/tags/v}"
+        CRATE_VERSION=$(sed -n '/^\[workspace.package\]/,/^\[/p' Cargo.toml | grep '^\s*version\s*=' | head -1 | sed -E 's/.*"([^"]+)".*/\1/')
+        base() { echo "$1" | sed -E 's/-rc(\.[0-9]+|[0-9]+)$//'; }
+        if [ "$(base "$TAG_VERSION")" != "$(base "$CRATE_VERSION")" ]; then
+          echo "::error::Tag version ($TAG_VERSION) does not match Cargo.toml version ($CRATE_VERSION). Run scripts/bump-version.sh before tagging, or tag the version that is in Cargo.toml."
+          exit 1
+        fi
+        echo "Tag and crate version match: $TAG_VERSION"
+      shell: bash
diff --git a/fluss-rust/.github/release.yml b/fluss-rust/.github/release.yml
new file mode 100644
index 0000000000..3ca2be6277
--- /dev/null
+++ b/fluss-rust/.github/release.yml
@@ -0,0 +1,42 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to you under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# Configures "Generate release notes" on GitHub Releases.
+# https://docs.github.com/en/repositories/releasing-projects-on-github/automatically-generated-release-notes
+
+changelog:
+  categories:
+    - title: Added
+      labels:
+        - feat
+        - feature
+    - title: Changed
+      labels:
+        - refactor
+    - title: Fixed
+      labels:
+        - fix
+        - bugfix
+    - title: Docs
+      labels:
+        - docs
+        - documentation
+    - title: CI / Build
+      labels:
+        - ci
+        - build
+    - title: Chore
+      labels:
+        - chore
diff --git a/fluss-rust/.github/workflows/release_python.yml b/fluss-rust/.github/workflows/release_python.yml
new file mode 100644
index 0000000000..59c8f8c91e
--- /dev/null
+++ b/fluss-rust/.github/workflows/release_python.yml
@@ -0,0 +1,174 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+# Publish the fluss Python binding to PyPI.
+# Trigger: push tag only (e.g. v0.1.0).
+# Pre-release tags (containing '-') publish to TestPyPI; release tags publish to PyPI.
+#
+# Token auth: set repo variable PYPI_USE_TOKEN_AUTH = 'true' and add secrets PYPI_API_TOKEN / TEST_PYPI_API_TOKEN.
+# Trusted Publishing (OIDC): leave PYPI_USE_TOKEN_AUTH unset; the publish steps then pass no password, so the action authenticates via OIDC.
+
+name: Release Python
+
+on:
+  push:
+    tags:
+      - "v*"  # Only version-like tags (e.g. v0.1.0, v0.1.0-rc1); avoids running on arbitrary tags
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
+  cancel-in-progress: true
+
+permissions:
+  contents: read
+
+jobs:
+  version-check:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - uses: ./.github/actions/verify-tag-version
+
+  sdist:
+    runs-on: ubuntu-latest
+    needs: [version-check]
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install protoc
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - uses: PyO3/maturin-action@v1
+        with:
+          working-directory: bindings/python
+          command: sdist
+          args: -o dist
+
+      - name: Upload sdist
+        uses: actions/upload-artifact@v4
+        with:
+          name: wheels-sdist
+          path: bindings/python/dist
+
+  wheels:
+    runs-on: ${{ matrix.os }}
+    needs: [version-check]
+    strategy:
+      matrix:
+        include:
+          - { os: windows-latest }
+          - { os: macos-15-intel, target: "x86_64-apple-darwin" }
+          - { os: macos-15, target: "aarch64-apple-darwin" }
+          - { os: ubuntu-latest, target: "x86_64" }
+          - { os: ubuntu-latest, target: "aarch64", manylinux: "manylinux_2_28" }
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install protoc (Linux)
+        if: runner.os == 'Linux'
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - name: Install protoc (macOS)
+        if: runner.os == 'macOS'
+        run: brew install protobuf
+
+      - name: Install protoc (Windows)
+        if: runner.os == 'Windows'
+        run: choco install protobuf -y
+        shell: pwsh
+
+      - uses: PyO3/maturin-action@v1
+        with:
+          working-directory: bindings/python
+          target: ${{ matrix.target }}
+          command: build
+          args: --release -o dist -i python3.9
+          manylinux: ${{ matrix.manylinux || 'auto' }}
+      - uses: PyO3/maturin-action@v1
+        with:
+          working-directory: bindings/python
+          target: ${{ matrix.target }}
+          command: build
+          args: --release -o dist -i python3.10
+          manylinux: ${{ matrix.manylinux || 'auto' }}
+      - uses: PyO3/maturin-action@v1
+        with:
+          working-directory: bindings/python
+          target: ${{ matrix.target }}
+          command: build
+          args: --release -o dist -i python3.11
+          manylinux: ${{ matrix.manylinux || 'auto' }}
+      - uses: PyO3/maturin-action@v1
+        with:
+          working-directory: bindings/python
+          target: ${{ matrix.target }}
+          command: build
+          args: --release -o dist -i python3.12
+          manylinux: ${{ matrix.manylinux || 'auto' }}
+
+      - name: Upload wheels
+        uses: actions/upload-artifact@v4
+        with:
+          name: wheels-${{ matrix.os }}-${{ matrix.target || 'native' }}
+          path: bindings/python/dist
+
+  release:
+    name: Publish to PyPI
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+      id-token: write
+    needs: [version-check, sdist, wheels]
+    if: startsWith(github.ref, 'refs/tags/')
+    steps:
+      - uses: actions/download-artifact@v4
+        with:
+          pattern: wheels-*
+          merge-multiple: true
+          path: bindings/python/dist
+
+      - name: Publish to TestPyPI (token)
+        if: contains(github.ref, '-') && vars.PYPI_USE_TOKEN_AUTH == 'true'
+        uses: pypa/gh-action-pypi-publish@release/v1
+        with:
+          repository-url: https://test.pypi.org/legacy/
+          skip-existing: true
+          packages-dir: bindings/python/dist
+          password: ${{ secrets.TEST_PYPI_API_TOKEN }}
+
+      - name: Publish to TestPyPI (Trusted Publishing)
+        if: contains(github.ref, '-') && vars.PYPI_USE_TOKEN_AUTH != 'true'
+        uses: pypa/gh-action-pypi-publish@release/v1
+        with:
+          repository-url: https://test.pypi.org/legacy/
+          skip-existing: true
+          packages-dir: bindings/python/dist
+
+      - name: Publish to PyPI (token)
+        if: ${{ !contains(github.ref, '-') && vars.PYPI_USE_TOKEN_AUTH == 'true' }}
+        uses: pypa/gh-action-pypi-publish@release/v1
+        with:
+          skip-existing: true
+          packages-dir: bindings/python/dist
+          password: ${{ secrets.PYPI_API_TOKEN }}
+
+      - name: Publish to PyPI (Trusted Publishing)
+        if: ${{ !contains(github.ref, '-') && vars.PYPI_USE_TOKEN_AUTH != 'true' }}
+        uses: pypa/gh-action-pypi-publish@release/v1
+        with:
+          skip-existing: true
+          packages-dir: bindings/python/dist
diff --git a/fluss-rust/.github/workflows/release_rust.yml b/fluss-rust/.github/workflows/release_rust.yml
new file mode 100644
index 0000000000..0a567a6a22
--- /dev/null
+++ b/fluss-rust/.github/workflows/release_rust.yml
@@ -0,0 +1,60 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+# Publish the fluss Rust crate to crates.io.
+# Trigger: push tag only (e.g. v0.1.0).
+# Pre-release tags (containing '-') do not publish; release tags publish to crates.io.
+#
+# Token auth: set repo variable CARGO_USE_TOKEN_AUTH = 'true' and add secret CARGO_REGISTRY_TOKEN.
+# Trusted Publishing (OIDC): leave CARGO_USE_TOKEN_AUTH unset; token is obtained via OIDC (no secret).
+
+name: Release Rust
+
+on:
+  push:
+    tags:
+      - "v*"  # Only version-like tags (e.g. v0.1.0, v0.1.0-rc1); avoids running on arbitrary tags
+
+jobs:
+  publish:
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+      id-token: write
+    steps:
+      - uses: actions/checkout@v4
+
+      - uses: ./.github/actions/verify-tag-version
+
+      - name: Install protoc
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - name: Dry run (crates/fluss)
+        run: cargo publish -p fluss-rs --dry-run
+
+      - name: Get crates.io token (OIDC)
+        if: startsWith(github.ref, 'refs/tags/') && !contains(github.ref, '-') && vars.CARGO_USE_TOKEN_AUTH != 'true'
+        uses: rust-lang/crates-io-auth-action@v1
+        id: auth
+        with:
+          token-type: publish
+
+      - name: Publish fluss-rs to crates.io
+        if: startsWith(github.ref, 'refs/tags/') && !contains(github.ref, '-')
+        run: cargo publish -p fluss-rs
+        env:
+          CARGO_REGISTRY_TOKEN: "${{ vars.CARGO_USE_TOKEN_AUTH == 'true' && secrets.CARGO_REGISTRY_TOKEN || steps.auth.outputs.token }}"
diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 4155ea84b9..dfddd8d48a 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -16,24 +16,26 @@
 # under the License.
 
 [workspace.package]
-categories = ["command-line-utilities"]
+authors = ["Apache Fluss <dev@fluss.apache.org>"]
+categories = ["api-bindings", "database"]
 description = "The rust implementation of fluss"
-repository = "https://github.com/apache/fluss-rust"
 edition = "2024"
-version = "0.1.0"
+homepage = "https://fluss.apache.org/"
 license = "Apache-2.0"
+repository = "https://github.com/apache/fluss-rust"
 rust-version = "1.85"
+version = "0.1.0"
+keywords = ["fluss", "streaming-storage", "datalake"]
 
 [workspace]
 resolver = "2"
 members = ["crates/fluss", "crates/examples", "bindings/python", "bindings/cpp"]
 
 [workspace.dependencies]
-fluss = { version = "0.1.0", path = "./crates/fluss" }
+fluss = { package = "fluss-rs", version = "0.1.0", path = "crates/fluss", features = ["storage-all"] }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
 arrow = { version = "57.0.0", features = ["ipc_compression"] }
-chrono = { version = "0.4", features = ["clock", "std", "wasmbind"] }
 
 serde = { version = "1.0", features = ["derive"] }
 serde_json = "1.0"
diff --git a/fluss-rust/README.md b/fluss-rust/README.md
index 5e771d9d28..b1116f1751 100644
--- a/fluss-rust/README.md
+++ b/fluss-rust/README.md
@@ -133,6 +133,10 @@ Then, stop your Fluss cluster. Go to your Fluss home, stop it via the following
 ./bin/local-cluster.sh stop
 ```
 
+## Documentation
+
+- [Development Guide](DEVELOPMENT.md) – Build, test, and contribute to fluss-rust.
+- [Release Guide](docs/creating-a-release.md) – How to build, release, and sign official Fluss client packages (Rust, Python, C++).
 
 ## License
 
diff --git a/fluss-rust/bindings/cpp/Cargo.toml b/fluss-rust/bindings/cpp/Cargo.toml
index 0b83de9365..8606a226e0 100644
--- a/fluss-rust/bindings/cpp/Cargo.toml
+++ b/fluss-rust/bindings/cpp/Cargo.toml
@@ -17,7 +17,7 @@
 
 [package]
 name = "fluss-cpp"
-version = "0.1.0"
+version.workspace = true
 edition.workspace = true
 license.workspace = true
 rust-version.workspace = true
@@ -30,8 +30,8 @@ crate-type = ["staticlib"]
 anyhow = "1.0"
 arrow = { workspace = true, features = ["ffi"] }
 cxx = "1.0"
-fluss = { path = "../../crates/fluss" }
-tokio = { version = "1.27", features = ["rt-multi-thread", "macros"] }
+fluss = { workspace = true, features = ["storage-all"] }
+tokio = { workspace = true, features = ["rt-multi-thread", "macros"] }
 
 [build-dependencies]
 cxx-build = "1.0"
diff --git a/fluss-rust/bindings/python/Cargo.toml b/fluss-rust/bindings/python/Cargo.toml
index 0a0daff93d..804e1bbc0e 100644
--- a/fluss-rust/bindings/python/Cargo.toml
+++ b/fluss-rust/bindings/python/Cargo.toml
@@ -17,10 +17,10 @@
 
 [package]
 name = "fluss_python"
-edition = "2024"
-version = "0.1.0"
+edition.workspace = true
+version.workspace = true
 license.workspace = true
-rust-version = "1.85"
+rust-version.workspace = true
 
 [lib]
 name = "fluss"
@@ -28,7 +28,7 @@ crate-type = ["cdylib"]
 
 [dependencies]
 pyo3 = { version = "0.26.0", features = ["extension-module"] }
-fluss = { path = "../../crates/fluss" }
+fluss = { workspace = true, features = ["storage-all"] }
 tokio = { workspace = true }
 arrow = { workspace = true }
 arrow-pyarrow = "57.0.0"
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index e28b3d2474..0e61b23484 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -20,9 +20,9 @@ requires = ["maturin>=1.0,<2.0"]
 build-backend = "maturin"
 
 [project]
-name = "fluss"
-description = "Python bindings for Fluss on fluss-rust with Pandas integration"
-authors = [{name = "Fluss Team"}]
+name = "pyfluss"
+description = "Apache Fluss (incubating) Python Binding"
+authors = [{name = "Apache Fluss", email = "dev@fluss.apache.org"}]
 license = {text = "Apache-2.0"}
 readme = "README.md"
 requires-python = ">=3.9"
@@ -42,6 +42,7 @@ dependencies = [
 ]
 
 [project.urls]
+Homepage = "https://fluss.apache.org/"
 Repository = "https://github.com/apache/fluss-rust"
 
 [project.optional-dependencies]
diff --git a/fluss-rust/crates/examples/Cargo.toml b/fluss-rust/crates/examples/Cargo.toml
index 16629bed16..cce6faf258 100644
--- a/fluss-rust/crates/examples/Cargo.toml
+++ b/fluss-rust/crates/examples/Cargo.toml
@@ -24,7 +24,7 @@ version = { workspace = true }
 
 
 [dependencies]
-fluss = { workspace = true }
+fluss = { workspace = true, features = ["storage-all"] }
 tokio = { workspace = true }
 clap = { workspace = true }
 [[example]]
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index c92359408b..4d9be026f5 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -20,6 +20,14 @@ edition = { workspace = true }
 license.workspace = true
 rust-version = { workspace = true }
 version = { workspace = true }
+name = "fluss-rs"
+authors = { workspace = true }
+description = { workspace = true }
+homepage = { workspace = true }
+repository = { workspace = true }
+keywords = { workspace = true }
+
+[lib]
 name = "fluss"
 
 [features]
@@ -54,7 +62,6 @@ dashmap = "6.1.0"
 bigdecimal = { version = "0.4", features = ["serde"] }
 ordered-float = { version = "5", features = ["serde"] }
 parse-display = "0.10"
-ref-cast = "1.0"
 jiff = { workspace = true }
 opendal = "0.55.0"
 url = "2.5.7"
diff --git a/fluss-rust/docs/assets/release-guide.png b/fluss-rust/docs/assets/release-guide.png
new file mode 100644
index 0000000000000000000000000000000000000000..bf7602ddeeeee58163ddbeedb0c4c9c92efe6ac4
GIT binary patch
literal 363329
zcmb@ubyQSs_dZTZD3VG@%m7MA4BefAG%6s?Fog7wLnGZFNJxW#3epbU3Iju<)F9m{
zLrMA_o=2be{r&a%t@S>v#ahGRocr8opZnhX+Sk7JL}_cP+`f75CKeXfZPiDLx>#5w
zWLQ`@GKBb;BV6;)k62jPv~~&#+Nuf)Ky9eAwVeY53yVDoY;Lamh>IOzL1Au=7~tf%
z3H8#AjEvPa4{UG$(%u7X2Y$}WNH;c~ry-l~!ouUdch|3}yPdEAwDq#TGo|NNy{>Ld
za_}JlIH<|P{?NkQydSIjHS+OI*=<Ik(R~iOep4(<YHS8VD`)JgF{W)wb0M;0hRQdI
zKpWsWZsI^1p0z;m_TuA+${Vr{?^=Ms_4HS{DIc)VE#dh^MPaN_0YE}ET~0OGTDJf>
zh>o?7a@0!}-nY7UB@bR5x!;K;CLW-nkzF9sxfCO#&xy6PA+sb5BFkjyXrFIO2@YN%
zmG6I>7Hknrf{Xj>Noe{TCftx9Y22<>vECvjh&GreBbJtia3A}=rrPr-JtLhMTM@ZD
zGIYbjQWCoU#r6x<KgC$i(C&$WyMczfIM~^d$HL0l62jx{=z=*L3ro^l9P`l;;%))-
zc64xZ6Ze*4{_6~J%;)RFAZFlSr?}foF&k)T0~MU15TFo`AP+CI^i3cTC<(Q)7S~l&
z{(U*-FDYhQcXt<Y5Xj5Ri^ofV#~Eq^;u8}S1M%{M`1!dpXK=g0oZKzExt-it{vPDd
zIEoNAFx1Y)-Okwwcs;I#rL%{-6f^VnjsE%hd!Fug*8jPaliTmd!aN}8`ad8(9$wHt
zV`DCrygn+f1+{}<?tDGIG@s;OXa0YV{l1SR==$dWHJQJk^sl3sN0q)Q3Hrxu(l^yR
z*$lC;WU*8g<(_zBZ)X!Un<{10v*mkjj5@CieH|`3;ZeF%xog=`{jRhr5LI4U-zekd
z@$_q$$*t&U_o6iI6pBP`1xhBeM&NyS?Vq_euTFSRmi<IdSWi|{C6oQU2EF>S#D=^E
zGrVSDb6(0VIz?8mg7EGGv56kZ;!q_1Zy(JS$!Vkt%DZEd{<m@dYbHR-;oxC9x&L`;
zzlY?-AzGIe#R+@@QvJ7v%)`w;`PUxT9FJl+*ah$Eo$0H8>!rvN$nX6tZ}-}S?S%L9
za2E(KbXxBJ8w=*Iw?Yy+i~GN>ygw@@nEa6}K_~goLLb$CYe<a8ZXx)WHi#?^OJWd7
zD9aC(qgVghkm6)Mr2oR^{o91fK+N;1%qMI<Q2k@m|8?=W0}mPhN5}G?sl>|Sh?B*)
z1HL`}*W4Dd89}GW#r|1XyY`CcldW(1>)GXn#%4SxpZrd8oA7>qT>Ug>Z`w55;Hwf>
zRx{As!f((MUuM=`N=u0226ZM;^yhN>Ns*rIYv&oCfeH;*U|17QUhtL<?CJRRO?ldx
zH>KQ${Tt-RUM;K+f0p22*IDLHd9%!3n;3_^W<0}9`j1@*w&7-#%(;l0!NKqJwIIi}
zj!pu!Y91M=iCM{9t~ZJoJlI72_IPJ##%;T~9QaX~UEpiIoEp81?D4c7lFw-KY%gH>
z7ydOV-;jl$ndkktd(0edC#HN~*#43pcd{j?L99W5$Q*`fg^$uTZnqf)*6^B1SF`dT
zJThmeSl_Anj=BtA6nb8g|2R)(uk?zmROIvO@u`nqNkfa4Gwq>gTk2VYPoWz3mdS(v
zbv696?Av)+dHrmF^xeZB8~-g|XP$TM-iJfE&HgR#&P#~r4y4Ch&(ZzYMjXB#(Y7-c
z^lzDx1`o3*NO0V>IR3Q}ZLdcZv_Pi)Tak?z2jf==up3KK{<RSWuSa}Sx$^iw-r;|9
zgZRPi7a=a1|3AzaoHF|k82eCGu#Gy?`2Tz&8W`TJc{_V|B*HgCIqu%;S?{GdMJJ5^
z@?p)xwHWf7dH8?5H(qVLH%kozd$=B^$k+du0n@=aqCbT6P>rk7ejtWln=4Z^oY4nL
zv!3Ovjc0xW!h&rgCnrsK;S#|*-*EX4#>8hT`p*6pBl<IIH_<+wRfc)CcaId+m^92x
zegw2Wvms3=>8o;ia^wuu^Z))$wQoh#2KI3U>L8NVu8lFlg7%e1S?0gs1J0skMSGM?
zsU&<3*U?*CX=c7VpAI)mD~j7LcbqqlCd{-z%|GOQ_P<ach_}{UHLT@49+LUx=d)3i
zMsZ#f@0MJ%`&!?$7tqInv;_14OH2z@^m#%H5h^98Yq>JqwZrmu9XF`^PdjgcvfSv;
z`*vb@8f~9Ldmm7uri6dt9F&AnKNsb0{keE_m2wwl1M3j*%+vIH!$E(G#n}mCa{L%f
z@DEX%Jy84Kmuwz@C?(!;g<sRL#nqv!id3c5Zmbv*Aw!Rq8*sL<z1-8N0`M1<xUu;2
z<mXaCNdzE3RO)=YW{UPlai-H|4<~JX!T59gkF}jQIjwp+?&=%!eQZ73w0mEa+D8(F
z<gPRJ*)p1Y!$6#7U>Q}rU5#8l5@lKRjtp7!I~bS%uT0Yuhxji`QOzq89SUGJ;yLZR
zFaH8!Fb5Jnahrc|mE5UQDWdsO^s40ojkMeR`hIGkl%PX}5q4k0*Xj8i^l-}IBsihS
zCI`lPxj-8DD49)baOGrW=tF7wo9sQ8>X<XZ19s3R!<>x>C>vd%j!y4Lgh&ToZkZhj
zx%vBRNbJ<=J$D-rqSOpCF)<-h>2eV^wn|b$^NYoYi_&_k>7-3EdL&4WXJP^(CZtT}
z3UWXG7XrZLBdihu-DR$m<+oG<g#6(7++P=K7qIpGh-$a_5K`%MR*g3)teRPm_@s*K
znpe1|ES&Pgs6N<y?;7DAj0<6$>pG3w>o<QS)deFhk)o%{_1S#ybhNks`LdE+rL`!{
zRD3|@*G0pw&QQ8sWtjl7EI~XXdCor2pS$H^6gidu%6^@LuW(_q3Ov?L=bU9DVhoNG
zg0_yTajs0=wulO`D4Dvol$FJ@Nd?nd^T@>WQNW<-S#2nQ$O^|htA_UlegbXznLw+?
zko9&Kk7H)j4(g{aqrlRgrvlTCY-U&AU4AP4Hd8Q@a^5rb6zD*#_&Dl~htpKuY!Srh
zo5~Qsp&rkRfC{9`e<gM12ITB4R@UDPV&b`xsjrRGzkGS&i-`QrQ>&D^4R1MpaGcQG
z&~i4*nNcGy?e6onM!%;v3;FcFAwCTWp7^GJY2O4&jkd{nx9f&AZ6+A`B&BG^<fW_O
zpGkGFY9r;i@Ajf@iWNiBOh0a_UTxSJRowJq`;*Ru6JuLN=)wsjTC8t?S>>|ua{bV~
zp~=8piM?il@17{fjq;}57mTAj5}Hn;wcPddFF)a$WN~KU_Fj9N3)t1^T8)57o&4Dk
zNbn7+N1WyLmds`jRbS8qYoEiYP3x~hyUaw-l9p0v0GlBp%a1`VDGZbuI!P<krrt~~
zKNn+QsdCmjS;@8NKF&4q&Ii`IZzVT7PgN17E<^;qhS_cjQpb<%D_T6C2VNeHVVqlz
zD1l~#s2G2#MJCwdKzcr_&yTh(@a#GdlE!g6Nm9sjP)Dx7Iq5%urmVrk?{|;R)K1Cp
z)sMuf|G{FiA+mbHF9Mvmb0i8CJ}OM>i`l*V*48_@_m73m-%+HiJ}aX?tEMyuJd}Lm
z;p|@@I&Ko8vHVfuQ<+1u25S5h{pQ0zR=gg$pDMVxfBIsU%bmUN$JYjtBc2K+v8J~R
z)qgy_T%J*4%?pULRct=H{^3*Ud(jhQZBY$>|J&RYIPB2W6<pDLEMgkSB6V`%2BT{G
z%L8QaKe*ga2<#_$S(5GfyurQ>V%=h7odKzKW2EcE=9v!6Lc2uz{#=NtIWVaUk?@<s
zxU8`^_T?EiV@5CD7ge*+ueI+d&>kB^=+O^)6)MM-qi;}XzI5o);iX@BhkF#2wepkk
zh-Hm3wlB-)z`|s?ilIk3>*ndaLu4`l<q~v(G`o6rpl{|Y)PhEH!k%@r<#;piVVvtw
z@pV8*g_`GeU?*=C#2Zr|rJH&kKII5p%lfgC(j7;a2A}oW+BTT{_U-jE6OV7(Rz!OB
zLVCt5TP3+$1I-N;a}UTc=#ZFVl_eYt)b(hEf9q^%g$86~y1k%e=2P8syxK4&bML`s
z5*>V`{(xN9*5~0?kLNwIdpgn!BSX?vX7m$jlACv7^qE_Hg%90y15#`-sl#8esC}44
z8~$qr`c=>>2m$tYcI%7PLa4eoDs+&c-mLMg+#h`U5PNY(hYdYx+NX-pFs%NtTsozp
zQ-MH27ca^<(~$ngssCV)uGg}9S9SrQiqe#@z7=S$m|?t|N<0@WKLqi5*&*;U?%@X(
zk{E%*;H0!Q8<T@B&&`}8HwJgdqfbv4A*lkl!~~Z|biJt0lY5|s31TKZ6(5bAIO||n
zt0!=<G24Ie5HCMbN;SBFUZ1Yoa=EItP7I>lppor@*jbU*;n|W0^*1I~HGL~g{9>4J
z!N4yHUR#e)b=dMWHbphb=$s&sg?;?U6(}I>!Ec6(CIGL`v(0!_tzaO*&$B$9{}i|t
zn&h)CVpc(X<@WQFe0a25sKe)~tiZ-y3Wc*tu=1rf;*kUCl&#YwmE~e&PKqF#-)!@}
zwBLK@KsY#2fw{!r(H@-ZyW8-&>?NrNjQ#sb&-tj-$xO0S<3_Rjm%IA4INO_>YM9lr
zt`2c!w0hM82$a;w6#jTLY0%s6y;a`i^xV1S2p#L)f2SVfjUfbLSyL{`idXZJF`!oO
zj}t^D8Yu!ZXmiCuhww_39I&TK0Is#L)%WX|LA&T6YB&1Uee84QC=%2%v$RqUpMH_?
zKw@9QEgq4C3-CW2iEl&ds4%?lj%UamH?+wXwC+!z)=8eC%Z#dK_Gm1zY&vaL#W)Pu
zffwLdf8cTQ9hkAUnW;Om`48PSC0fv-!AZZs&~h3t$PZt*STp;%Z^lxvCT?F<SpsQ~
z<k@85MuXjul83cKPbp)?zO7Z7F|>C(Ea5~nj+1dyeIiC*8ZcfJr!3msZ+GV><86Tu
zc0ZrwheFEC@^TsGkE5GsR{wDd3K6mhl_ZscGiElXU&BPKDva`W?Os;Ef-T@LAZ1lH
zLR3rY=*gg&-~JbR^WaNS>&;rVXFi@U<TVSrE)K`ER4}u!A+tLAra#0_)<?*EH;DyM
z#cjnr4r<!2CdweBC7dD>Bl>dVeBVFnK`H`zr}_?B-<i_kachy^6P^>e<Vo^Bi~Ldp
z>pRIW<dZ&7m9$kFX49BK5A6_vi0~}j2J!~7?^C4}t<S_xpOOSsXrz%ECiwNjCx4w%
z=V*-;Ya)9p<CZuC;58)Q8PIHEkWd~F{);o+xv42?aMs;t229AD_36Y1Nt~ylIV2gc
zE)hvGNsp(xuMowEqADqP{s9>9v&YqMt*f<4W@Vt)`D=<<h@4S|<CbNh+kd=laK36@
z$`KM`)im4ZMIW&pM<1^qA0X0N6B|!$n6<OK9?F+)Nqd?jjor9NBcYPeFHIwJq|%AF
z=?`i&U$%uVqlbxDG9xr;OhD)(%a~_N8%VBf2(*>OrjSy(byc+WL|6#2`O3aw28Eu{
z`V&QiACU3uEW5&65h@lckryG-6owHV2(|uaAzYvNQMs_=jKhAjoZfSD$*YOBOCe_k
zVfj>fVfma*WURE#8k~NL042YTpA@_pGRwD2fB4El#YvvZlCD~NlBzm>k4cZa5(^$C
zK$l;ao$FELDn4hQ@y<ois^t%58!SSUa(1H|JClgv*0Bd)skx_SY1R!;!}6=ua=X`0
zpS}0T>x)CM#+K?Tmwc|0*sTZug=MoxhZ}%KK)O)lVB<>LBBS@HpPFHJw~$+$&xW8?
zptW>}#WxZS+Deh0LnX~v^v{;z-2DYF1+DP7<zy}C3=hk|v$5RKln6$(G*eGQdVan5
zoLg7xHSfH7ai$Jh&v!F7Xpa5YB<3=Nzq^lZFGuMyk>p%>4m`PHt#OMRKwn5-T$2+Q
zfnDUjH}=u-S+{luVq(HUvEwkNF~gqpNQh~lpDj%WTtu>+O*1Q9V&{^mri>HmKDeYn
z@WuxnHRyi&a(Bpw_ceFit?=X03b@a6@1(FXD3Uv^Wr+4p{z!g@tg380ALY?DhtO8v
z5xF^g0r8Q08R}1%Pj|zyAe+?}<FHEP-Od|}&bosSpm7WBKWxW6(GQ^+vd*wWFZa5c
zZYUGw<I$>%*<sRvekcWlt@tQ$0dG+C=EKrrC2Au<5DTY;_DjjI=FhTfTJN7~ejq`h
zb+rf@HU2@!hrzNO1gXe|NLukXtq1@jiitD4hS7)9N+H(BfEvF8kwDX;4j_XS-NS-0
zBU5PFn=yfO<9$i4+R3c1GoZXU(2ILTeey@ksfE9>+wudIROH^JQCH4m1(CWb>&z87
z=4HJ@Z{pefIt7~uSF$bMLklyjCsyAk2gTzR!dDt?iq`DMi^o1qoFt34v+}q7lidb4
zC<Cp&BE<Nh&$&xKeGT<bS{cCxAI8W2TF%W?2etmNOg-Xb1=A`2IGGC!^gL5oZ9Cs>
zGE&Q|d0JG)Sp5P~x-tnf22}e5mc)t7iY6pb0`anW&&-$CB5@M(>Cv8uso0WI%H2J)
z4)kxcUn&5t!Vw%E&#KAKfnGqs!c2t2=Si_((n>bJ?W&#^5(-(DmE2ZsM3k&9wr$1L
z<y<V(OkO~?uyRjK$Z=}gfg83(N`59dwK-i$8&Y1UDPf`G{&WYta%=6<8U?Q`m`I+P
zu5jU2|J(Y!iiE(D&@x^4rH)j$c?LO|ia^#4wpmHO%L^NsgaHpt-&hisLw1KeW2-ln
zC#7CIRL9fy6}21InbyC8g~kn7wiIc+6n}O6WZv;vw~y{><W|090f`8sj#p2ha|@O9
z!WlXft0xAz6*bi0;=ptJyOCQ()HTgfyWI4*y5tU1jhs|P=KS35ptyT_lU*0kCkrC&
z?|%dnFs{QvW{De~({?4by{ws5CGr=_mA(#}pXBGpJ!J-;yyH~9f6YBF4~bv!L{mSn
zvEVTC9^foE&@7QEIGF#Wfr~)i)w0JI^3I3DOhk~;do)wSz|s0qpmIbOwbj>zm3R7O
zF-yH}A=)bg_EG+QM^(-aF_PnH=hbmXRdHz|C@=#uUo_7`78az9oiNLaFLyi__^WmX
zjV$^!@w`b`)A9#ien_Mu`wiPz@duka;}V+_c7YRr)()>d&cN|&7I{WHiF*pWy!dj;
z@}>o2s`1!_9d~vyRD!$S-RyUDM6^Kh6vQLH#0=Z5!hn(8w5>k0q1Ho47}U2x`k1?}
zhJFj_5B6{17H{l`+GAH=#AOjZe89vOrqkQUS&;>KKu@Yu%+<6F{U+PjIW_!NFQbD4
zuHw&<aJ2dl7RSOVYS!baxqX^n$B#!|Ig+2x*+~{oTVPgdedF^~0`^UJ2by+sVoHH%
z-g%d$I1%UvF*Ss0zP$pELcnqte{Oxau4c47i;e%X2EI-ed&pk)ag;v_p4QV705NrP
zmdNo3=OPSyTK6sd9b!BXB}|3k<YfF08zrsA#Z=e#;d24!+vbr>g8W<2oaO1a^QOA_
z(Nf{E>*p?liqvXv_us9R4Fb@f4QBLou!aH1e?_ZSa>6MAXgrCDjgcxMMU+4}PZTF0
zk5ak2XFc2XFye#ln!bt0Q`Ex8t;Fw13<>~xaf?lID0j7)UqN}2N<I@nc%r7If#*05
z+zU2AwXVPubwViT7AV9mx`$l}*B?*24N19an==0ZyDO0;M0O`EF!BrWdu7!a3VZNu
zF&xD;H?+<Dfr9Jmz`D|nIJKbkR?;0iEysuABba@dMQ<c;h21^GH{4_Kqj9So=`%8D
zv(tLx`#r}%4geE@c7pARA;}bQ{B@CH_G8-o8PoCvf8-8V&lz;i0Dwvin;i6#=BnYb
zDog|<QTt{lhVZKQIGOK!DnU^d_!<W^tc>Y88$R5+mz40+UF~aOnb+5fv8(dmL@Tih
zj&rl=Coh4})Wlnh;=^-!B^{o7aFo;I31c^n#vh%xz;4+I?_V-nOqjvfYUg5?3YKhH
z-Dws?!wcv8O3SiR4Sg~kekFVlL=X-v{hW2kHKaaQ85AGu$5U%4HntvGb)J)aGe>Sl
zx~wa$$C&eK_t)5^*t>~u`exZXl9@d}P|WuGO`lH__bYL2$9(<Q6#!~W-EoiUoa!w$
zH#hs_m=ht$&-?fL4o`S`V`m_k{krQcaleAg^jVT#uO{e`=_6w3u+A6naB8|Z);Itz
z0}cPcLo^de3}3k5U=St-0EzY`q%k0M*i!k*7a{$(JnHWg2S(luYHtrBiP~E7X@J*z
zqU$|FiS7Z2yX#kTC~gzP5#Gc~-FH~?BaSzB2u;$-sxu^6i@6i`c)4oU__x=qpd>WB
z5A_Z$8@1|^rtxKA+n3WUkg}=7RUpg4l~5{)s%Fnb1QWZP^Qvc*DR@T0C6*(9YHF_C
z#l3@X82<P}W1ZcnZ~DmaQ3Pj)$JccoSRzMx_7Os5xlDm7j1#6sWaze*?WIZQP$?JR
z_sGWo%iU+{oMrX$smYThOYqOIpNi3qU%dW7X3DI=w!c_F6%@1%&p3#sXsi}P_=vG7
z47!=fG7=%niUm(!fn{gXLcz4+0IQ7jf%v8O0v?J^Okrg-N7lZ6lY>x1l4viJ%AgwQ
z7grXsd@Y4EeEsDy^B$oHNg95R3rhx+1??81fqI?J{30}`qQb5)PFT(U<ELlir~5{Q
zdo1Sojop#feb7U?cL!w@M~iyJ^=1b8JZb0kT>m6jt3o)hzdqSwTbh161sYe1r;lq+
z&`fuA>#iZXry@({-bvFj^l$;M$0q*<Crj-nU`>JXHZ4!8!k~?mxP|-MEH}}j$glAO
zvWPrm0Mgj3lBYsw8*g5+v=)=k6l;il7nHc``E+TGPmlDH9p{7ltLzYu6u?pB-fvG9
z49k#RPhpNwdN08_#aoVy<r%tI$>5^S2i!)<cMnu?-{0dHF{M<bYN7EFA4I8|MvA+d
zTHzmN)f6Udy_d#qxV?s5?&0Zh%Ob|9uB3MLxqY!Ce3tcN!|I#&_HpIg_1e=^&;Z9<
zzRc^wfB7Jqa=b)xc}?3sZUixcE%0IqKv^?j;`-(8MnMeErsw;0@*f_A-*1Sm<e%8p
z3`ragE7V9^ws=fDHUWPSuDdr8BTJy8Tu1rDtWUffJ}H7WaGnjsTWpP#R11f(?IMgV
zGEWgK3Cq2;yUhoK?w3asb@<rUSt1gdgTn$)l0Mty5Sfbw(vlrGiib}+mM5m23=(~Q
zAH%gZBp|zTG1PF^FA@4`{bAwx5eJ$=H2FROuA`~vHMI$nq{l-^ZY_xxq>ug3aWWJJ
zm1&>ZK;(q-_?naj1wXhuYz!A1mgE-;#NY%|^W@C9yYQX$YPuij5Bh#HAoa-8T;9it
zTd^fvR6?Z|nzs+fbfl-525?;S7pGx^N4)02+Oli(A-u()UHh9Xz|H<VB9FXQ9g)qx
zhMy!&!c6xE8!$M?Cgjv(!bC*H?EWHIv$@KtBS(3L<AYqdzsc{6ohAye51zQi3CTeF
zYz&Vav#?qGjLZ5Q5x+2HlWVdoK86<GDoaM4CaNYT81UR??wm}Iw=tuvCff;&=Q8M3
zb$<wEwXwP_&BVsHPC@QqdtRtnL{En7DAtSLHbAO=<DbA{v!Wi4$O>H`uGTf9oCvBC
zthU}TR=s>jDMoC#>L*3JG`7JSJ#@BJk?X>BUsp&C5bMq^Q{GSpHWt~k^j%&F;Q1$@
z*AfjECo?BZkCqR8aO~kA7Q>}wduhzH1SHkOkj!Ue{(*h`q}`pAY?`qJzWqta;X);I
z++{v#CSS#D`De=#=)2vW2s6anOGmO0IS`b(dPMgz_v<)^uHn=J7MXBA+D1_;ZE3`t
zWn)~9O)bXU)ibp31<!!wvgC1`BUcx8gMjpfu%7_{5Wmvp9N{+*LAbU)&Z^HZd48n-
z+$I0Um}Lx4YDNcBY{7eh3DUHm+)G~Z_ADxElgad`GByF|frQ7?5Y_d|;iLjw#S?0h
zq#3Z35={dCdvLFCfCM}ZS=IKNOv98LXgKiX@uMZJrdE$yo*fb7lv=5t;p9`Yw)243
zXgcS-=KKc~Huq?5GfAZJTOdMQO=BmRBc1)t0aW8g&Mou~RJiW$oru-g+z3t4?xB%D
zU22M>DDkKJvmbtaU-8_e0(4KC1%ex|gf?U8<Fm4R25r_u4OMc(vaTq^F;_a`>((?%
z(ztRTK7Qk&9ANE>7|Tk?>&d3j3<HbMW{%I9UzU+F3RtVB<|mbG?A6i^PE1IL+=Xz`
zc`<MM{JniS@CvdMB$vbBTMGEHGEs5HvDhq>OaP&{AIPOD6R<-nJWIG<lG;&XO)*Dy
zFN!4L;819!I}IL&pv<2jJ|%3SU0PWmRUQ&i$TjR$_*&Y$YY^}ADlOMK`@I(jAU|-~
zr_Ydj<T2FIU*jw7X{0!T#3r4`El)ocs;v!r47sb%2<i#IzGU{X2%t7NnufcC6HiTS
zxdi?VaN1?bB9Akw?Epx{Oa#sD$GX`!>8iUnGUtX3Vp}&8Zxs+vKXDhLA5-t=LM+RO
z`tf0tIkJP@YsVZp`eGeZG@>!p22yG408UJO;6UQj<uim=tVH2?C)F!jF4sqwU*5MN
zq*>|dqRw%%O;Qx%iF^4V@_`=h*aUAK;Zv+AVW=}xQ)<-GqwLM6yIbfVOqjabkJFFg
zei}<Rs9-g6vA4{h$>2-;cxRIrLOsghHIp=m*^84!Mw%?WF<f_!Qs}ZR29*k<sz~A^
zT2$R1ZOouwevZtHXAhx4ay6+x_soE}5il0g;R`}bTEqd_^EXz_fZUbyI7dN`od<=;
z&RquFj~iAag@+n3Om@{hK^PBdVr7mTKomTG!|fii_?94WEjKWr;zPIqRvh-W0=D)+
zMG8$t>+uW5cO6Mp+#{6^&HLR^a&P&*wG%2UP0<AQJ{Vos`F?{n9z=JqRb}Z*^=|@z
zcZO)#^nl4@^T~))p(0@+Spg~EI$yxW&-iK*M~B*P9gznv@w_i~KU(nCtmnV$iNqF*
z@}z4ZY>0vkc6nL7{gU>M9%n6621!WcabP#jvMC_qwhUbEqM;8~LMSXds0hpRbk2u*
z{IIBu+UuW*j1@2aY)%O%&%g#Qr$5*HFzLqFXN^_L-QjaEATosefSCPb<Mao+uoZno
zHOGpOp7U<*Dqp~#(z*FA86hnQIykL58*?vzS;d-&t)}f_1tg~ZgqS^ltN{}ae1t*>
zHG>hh2yhY83k0hUU@$7SlR%6-!_AWd$}9jXlvrv;C?cZQQSz)-!_hkyTna5z#^xQN
zV{|^E(q9t<%^<u2W)JkMwP?ma!>8WQnFG4~$+CJE2HBRyCRy0f=LZ%5t6tuh@~pQN
zY?q(mzpR%TzHE86u{a#8na*ng=b;qKnd30%%JhAGP{XtNXn~7G?_fhin*^V`ZqhPF
zl0}3he1`3iWf%lCO&t+{4jrcSiC4~*<rL-gLH|>^rE$P1au`!Bmt(auPTPNW_$r?=
z$K^8A{hXn$&Qx9>;vQ#8LCZt2wn)#^b)?+WTSY@een_0*`03j-WV{o?aXpf#JZ3vS
zYsk~eFI9{bhWG`MDv)*)P?-%ldi}6n<pGGrtP7`s4tB55CmrZqNNLT07KPvROKfwM
zZhz<ejED!(h#2`nn$5e$qC*-mq`6%;{i5`9#MK?Nz)V#Lp_JRfMN32Ao1UL0zhPqv
z(UZcJ*P|O6EE~cMz@52+A*tLPpR@O61YLFjRA<i1tpcykDAK9WJ3cyARDFg1%EId(
z9T%?I9+XWVF{(3++E5gAx0=Kdt0B*m5OZMj0zt?Gx;^gPA;j{_Wnei!Q;|oWO8z9W
zKa@CH`rZ_wln_6$&!h1Z!371F3C$a~0l)ddh7g%^*DLlKNuE?v@%20hqer~6<!aqZ
z6LG}RGrfBg>Ik#9lT<J_nLkVh{!6SKdcbsU_3eTd-{m9~P8dYD5tGP|W!U6o>|7R*
zOfHU`u#Kd;I<Q@K5J>+BmYfaW%`1IDH$n$=t1Ysno*FOHLtT~AG2$&s$4q;kIX3Ji
zqK2Kx)o-C*+Lt%5ngpD#xY`cV)+O{d8py#A5d&BdO!38P8Up|hE>(i~muLCET#mn&
zUTNhab-Y%K?9ACbnuw>q!-0ltN-<~==P-`~vQLRb)F0`ax<aJkrxBVW41K%?Q6vx6
zWZ%#AVr4>=;}~Ci&RF!6xs<p?^AW3gnflT2SyU=ck$=f@JDf0A=8bHInbaI)Q#-tc
zij5x$twDy6nfM`^GMy?kO!<Ves-5k300C_Gl5=81Y}IMl7e%7yIPTp|A<iz~;lDM6
ziCozdzZCCU0w0QB4cNc5;r-NMH@e^SSA~h#0|z28&dQdbu41T3r;eB3wA;uz#CU+3
zyMiB$x_q_)zQiW#D|U=^8!iW94FY9LLYW9_Zg@WJ3!~YV?Pw2Dqwxjlh@FC}f4GC4
z1_equrd|6u($;EcbcG+L+0@O5m{!C#{}TRQPbU^Nhd)ILc3d`GW)VkSm?Bh9WLyFp
z*LHVxV0~^ZD4;L1eJYfqng&WS7@abwj%U(d<+43lMI^>y&8ZmmwR!O84o8UNz|KJR
z<v-<|EJ{KcE7~@Y#W^P!4gi0}IM@7FEIH-4N_lfPyXNP9U7Z-t+A<mis1Q(+crg{~
zL?jBx^T<-&uNKUmWu<RT6dE21ZH{uqSFT#P&=(J6np2dG;tkDbyetA|K5Yr{-=4T&
z+#-1Bd^L^{p17J?o1UV~N+f_#t^6L}{UYiyGqX&dHVRlasXvZ1qMYWcQeC<snm0ax
zY6@N_Q03A#VgpQ=OO@Oe3UG6e^GkGYDCzZ8Lpe1$?#A%W_g;pTJvIxK(>r^RU$gT>
zIZFagaE<`C{1;$R$0_Q6+5c7DVlsp$t?G$;C!V0h<>6Rn)9M~V4Y7u>ESd>1j=V@{
z?(udm39Y%;fpmGMuxrDWLqEm&vL|doVkKh4zXa{mB)xoy@bxv;I)6QZQT4g2YoXrJ
z@jD!%hH+UGSVYDWLb$;zhZVamC$m1QL7I@!z?)LOhHau+Y+bNz>Uhz`NbyPfHgYt7
zo8IBC#jKRO>S8LeoXMU)sb>nIV$)q%rk`RH9Xt$A*PP<zHOz;>bKv$HAG#Zp4CVEe
zGHTcSXaaY7RTKGUZi~$DqNpeiqxaU8y5MBAMBmw9SuE~gM~@9;qd6JOEPkif8G)1J
zHC<7+g*id2rk49YA+7^a9}<eGLA{NS9pkWQBQgpo{F(iZb4`v%*?B7Unv@CUNm9L)
z2p%yyF#05>^`l9pVEf9F9P;Kj;I(Z!6-3b<60UpxU6uODIjW^~YA0d<{y>D?*$tZR
zDDI-#nF%=GNrTTokzBdFp4~r<GXuJXE9honyN?lxNg{haST7yoOqk*C>gED`J#8H|
ze}p-N#Xg%w@%ehBgwTh#-fW1iGO@DRU3%myle%S@c{<F7K_bJy;=-TYUV_LKy&;tX
z;fjaR=pQWRD_~046Lo{05&OQ1c~Q5PA<DGw@~Gm4xJwd=?aJEe&C()|2}2Pt5)Ohe
z$v9Sgjg;@>-rf5HlBUH;X(*J$>xD@X6QKDoHOY6YOEE_fBHWspXA^J_$R%<m=Y<j*
zgTj4j;@CVg*@l<Z_zO26ShE|%IkgY)g*xATETd!yOd+HZ6dJ=&tf?+sGgiqO)m4&l
zlx;R{+V}6#Yj-u(O?;Ki{X-Yw$_06Xrdx}%KA+m+cJW$`zEw30{!wan`Qg(;cJf3!
zcF@qY(I<bdu^i#oL=bHDyPd#LLPeTPa4nfK6R~&yi|&N#=K352(oyPDS5@4SWrL(A
zFb%ai4UZRB{LY;Fw1qvQgPd43F>c+R<(zpb?@lK<RtP|R-jS%`b#NTbaI}A7TS1ut
zwOGv^itjdK8X^NwT|6_}tN5?n<;hzcJ3?Pz{eP$}?_}B9_enKHCC9JlafvDNRTe@7
z?m_`cReXXi7%k5%S2KhtOrjcamhvbo;UKw?RL*o>QtF0pG`JT-!0$O21Xn$txc3w*
z3X;~lCabKNKqUuH)JQZ*;x-Urd%ygYr|$KXkzvsc$h-En$mEu_M+@ZAx?zvFW#SN=
zxYbv94yQl44HHc-IJnid{$4Nl<L-Cr1OG6;b4(TSnLx$NtJ_mH9;}CzGffD%-<uPz
zle?GH%QiU#o5LLBlDLJyGdaKY9&O<>x!naq%W+S?kD#ooB%hQM4HRGbf0gHyu%>vH
zn}oA@#bvsm@Wr$8(keq_PJ6YUYXO2?r)c<ZLs(SE2@8@XKOuRVmfKxvvYAvC+-a}}
z2`7WH%#MYgYnhhCZbdaueqMKY+5jEsN4h<xirGJf`{<TxV(8nXA-@{}6>`Pg48nYG
z*1RAy^iBAOmy=4h50<AAGp87j<l}EET&%jTCy|QI2hs0mPkGmitRpREp0f5uqZe~H
z>Y9GDE$JvsVjSfrvcj@VYpvQr636G<{lrcIgwcv+d{AqOaL}8^8l4>pFF<YHnap{K
z*?9rCPb2e)iX53%nCXNZN3B1|RxwYb5HT7beb_f?&yST>*^$}V7$sc^7zJ0kWZrXk
zXvhH)7ine%QCS#8O4HMBTpSGT(TI{>0?urA6RI`WDUxcYajY;k2S&RH22TV$tUr>{
zlT3qPNLL>rbhOggXYc;EP-fK;r&eo3`8AsO_z+JL0}$n%ws<f~mwR^{>Ch_or`ZqX
zYhxg1>nbvD((%kO%v0Z`e|Kk}TctDX$`;8CLPBA)tYjy)%LC_x;<2}uv?I6uw?5Xb
z0vQH+xziJ0f|I^A3?&}D36RYF`I&8Ww`nhDhkAdX9a5RtHa#fg{7YWpWYYsk-`F;g
z_|9;OPzc~)dWR-;xc<BU$#+<LNOxkqc?L~N-jaSR*W}<njnqE$1uO9!-@Oj|4E)z=
zx1*1E14>wAO1mq|d<_F&#tp{10u*V5!RY~xgd*Q7D5zQ%f^o2z2-yhl-Hlz<=`+8h
zg2zs;f}#kQEz*tfw-w|Cz7W65p9uY`qw=7@lHxSVHz>FqzQn<{$so3+{x=aH9L%cS
zcTYns%1z*Ba8{^;JEmIpwzRzQAzzoe0H4c<;COMI;^5*~Dv9*Z`7-)F412nBzZ;i0
zfGn;NL%Fe+mid;kfKa2*h8dgtJYH$Zvx19}_F+oS-im_C_(F-vofavYM+213niD30
zCU>T|RgS;d<*9$=z!6K?GL&9T2UnNH@)L>C73N`P#<Ix(tKs?s4_6^LOt|LWeSx}K
zJ6EL@&2Ne|GvBO89x{pEETEK|ZQAdqt8udO;Sl)sfDo(t9?=xvv>jBMeUY!aoxG|f
z6!RvSWXu(#Ny7F-Z&b&sM><3?5$BE^JRQkaX`#JcSyBx)`pVH-x8hi>gldF?O(sNe
zE*J;C!g-FP=9th1GNoD4glMj6F0qg|hbp`;R%h?q;&&|7&jA7#_uY4dCI&ws6a&M~
z6Tf=Sf$s>eEO2bBq?zs-PzCo8eh8jHMobwDQx>pwW5dThy3Oz2=#ftHlFXp{Q^!nf
z=ORq0=C4-LYn8>&5oBO~_s;bY6!Bt`{dCruXik8#(X?-F%h;qww>53dm8|GZX38&I
zVU9gt8mo7!;+tW&2liH4S?n4(^wQ=G<LA7dNv<RJo5E^r6=6Mgce={<mwM_f!54HU
z0Rkgz_q9y~_*jERE-<P&O63E@my2V_!@#9?feqh(mo_k&KRYUSH61odH40ba4Z8(u
z<|R;J-|7@)a|DmU6FuR2z_6onBTyWj2v0sp3Erv7YrU_erIsP}X(^wQ2NGml^3Xv3
z!OFL9Tkm6iO316Vs|lr7ijI_9^I~`5VF^#q+9Jk6k^%i^Zinmro!`|jjuE07J({~r
z?)w@g^4pI{r4ENTPTKLeN`#&nv2fR2Km`~8;+;PkFyL_Rw}>lPlmGUm|MpTv%ki}P
zYKD#Vd0XBWQ5t@No!d|{*jU6%)nr2Yw(IIDJf5$-xSw+8?#gj-OWXlQ19_jU+IZRV
zgu;i-Jpr*QGUK8kzLw=yO{$%ukchuc(&zi?yiHxSgJLFl-)Q@;+G+IC^q>*r9(o?r
zz2)*FFofx8NHw;Dbh|^>qx<4V-ov@B-LzApjm?DOZr-CRhAAO@g!oV0H{TE?EOWyr
znZ4FwNk7o}!B%;Nc7!I3bSr6Fix2K#YDp`z<UyPqX!N_{f|40!cQ(8S%sT?S-Tv~0
zt|-U4qJu$+ikVNQ)-Ig8uj}XP^=Y2i7lRX|;PH(?ixIwW4RdWP3(Bl%|D@*qM8URn
zy{PGX^oxKTv`gc8&PMQEo|ePWZDX^X<lqF}yf|oL0`J3iL|(?VZtF7}{U#qt4|`Vp
z^OP~k@VyjFL1~8xpv1T};H#Bq^_)jfUXO?4F~lW?L==BgQR99jeu#<UH_4sau|AV6
z$nI-i=IA+MLjoJc<syCt*mBa8cc|gbqzV^yM>n;VbhvLF7xK@Ndc-=Mk|h3V4q-!c
zKaZerN4ZCiF4h9~tWvn;#!SJb6K5K~!~oBTRRBijW)nhf)uug~%<_x7rGL~eDU7<;
z(Z8m}IhArQbAn;3S79*HV_>gp*3X-Q9WoAWfC)LCIJf~?_3%696P=0DU-Beot%Y7(
z$$Zbvxj0BR1Vr*_YY}DK4Y4_FOL@$IXdp=P6;mm(iG!YCXk7a2*YDCLeI;2^RL$Ne
zYi6KN6BkVrBr6UR{^<HBY{>|xn3hwDw|{iTfZnPAV1fxznpvWJD*LS%Id9Wz3Vtb0
zBzoP=ocOysO-I{~qcc+6f_TL8SPX}Km~H)jla6N!0Frvdod#|?Eh9=%M?&K1h3=ia
z6k#Cl8!aGx)b?uXCctmKL+~`X7Y3KNUS^V25g>ok;C^#iWGTzB10Pep|5dvbFJUcl
z3+L2QaV{l<LBg5h`0vc`kN|tS*p@OAs#<F#Ix3(5I?LD7lJY2SN0Xb2^c4)S<lS8=
zaU_x=Tgnr?9nKiZcQDNTiJ_~}_7-x7iBieb$*sW)Z}B9dS@Hu+D+N`_t%$D-mm{(6
zmwd^$WH6mtsh~tU*sv(F^;YC!I6^ul<cAZ6**cXr^qhj&yvkn6$tz>8*lGS7$pph9
zWNU9j=)wgg!B0eQ=U_x+?;T3kLzb`}wdKM?kK?MAAFVsNR8C`X`GF{v|7GQ`X#d45
zzdDVZ4_9&JfXj}3PP6t7U2C`!gsh43B`}P>%cB&3sgfzebxwdaww!acMCNj1TRpNY
z-sz!kRvm0`(n-4hx(CJhN?~z(KT$WM8hcqn8Q7ntP;!MK&b8EyrVry2)<G!>%sq*3
zxy6|od}8M_3@c0dw+-I&Z=0Wek8IDm#eS9I5%aB8{pIKR<x>$3<^#Q$oB+z$6+Yn2
z5_#)VE36%iATnnIrxOu@E-=O`Dy|y#dwO`0;I~{~i_y^*#feOder)aD6x;MRG@p@>
z`u1^V?)U1Kr3<#znjB9_PV~}tSmGU;Cm;#Au7B29c0bYF%O8%v%}%QwE<zb{+20;p
z14Q4|q0o6j$y5c~6@`}pJa1Z*kvZCJ+emv6{_ss?wrOB94E4RPKn#$)MGVe7R%HEk
zIutmV|D6KOU#+W{Utqj^UmOkT$qJc0$T@k-;5EtT*f`}LA-`LQ&WSuPE@||TXfXR7
zeYz55YrS-iG|^v?6;F2d1%|9cG^fF_Plio^a~{y3&Z>l9#%bNYA`R9amtfMGPZmE$
zId-a%Jnu_OIq90ofJ7nYSvdyX>yZ5~4@*8M`NSt`Ofk7Bn&yC}uQ160&*Qu}Ss36o
za+~f%XW6l*M?43cI5^RRFPe4urjOjq;!qv3_<9;0FEvRp9)rCyeTgaFm@IzrjCDbP
z3cai1t{z_y9X<rnC28cihus&uweoY;7<|zD$LBpVw<2d>2`Rn^;(BT9wkLH`93`UF
zue0Wg&#8Av-RD8CQu*Dwv)&q`tW~3Ps<n9T`|%T{GGrZVgh&LEe{J3^`G6?NV}V==
zJo(hvteWHd`cM$2gwNPb!h$ov*BaFEOn{s>-ZvQC0O+L+ESWQ8wH9P&xcS(G|J;>6
zH)r!%>e_FyA118q5N^FelgmLzPR)%X2MK(6=?RgcT|jUaX6=<o+21O5nGYr?=B}IJ
z*HR23d2LRN(M!9Fu$@<LS38xFX0W57W@&3A!50$xG9C~7zp`zs;xCv+65Xm#8y*6G
zzRH}tD3+F{st2Th5eqPb(u-oCX6xjGHN>)W;5n-1@(XLG!z+&;h)KxJwK&YwcK80C
zS}Z*dlT3;u)(%m8&`&j9PSi$8uBjQXryoK#Hh4tE`Rvg)993@j>yi|ayj)hZD{gnX
zl3Ia!cr)st$~Y%^kCmuj181dWGG%M2wH4!rMlo$A8LbD|d+w$8`2FeI+Hr0@84OL(
z7cUp-v6sQD#u7|W=8R*IfM;r{q&7Tk8XqZC_Tn4@g{WXunH^x6cQ)|^>1rt;tb4Nf
zQtOf5U6yWdppiU7j9(xSzUD~7r9}gAs78cbG3ys#w4E2s&Kytc5FqaA_`Zzt_I(T`
zcWEM0OZekFiP=VMmoycr$P$t-flKE;pWz?z=(fI@zej^ntC<V$igX?}lM0qSNsa@C
zlzsi<Q{c2U%5gND&LO>J63Kqy>g?Kl@<ilwz+WBS!BjXSPL=PcQZ29^qdYJvX%PlF
z4K0%ax|veQcSw{sNHqg0Q5lIP$C#v2^0h<~1>d~{+H}<Phic8EV>RQO5gkrp=MV(>
z{0WQFAoO6?l7Ywuclo{*G&XuYr7){;{^hOWJ>DfyHOUG2N@!Ln*IaCWuT&KI(J{(7
zO?b-6A=+2)Cg<MAk*A*>b{{7HR*u(`M+yt06T99_bPxyC*3c9KbHAVW_>N&pGSiM&
z?<DafSYml}f+qMUV;O8~_<r91`OHWj5Z?Oo_>J5H`gC5W_D9$u)Yjp7Gda3bnix@x
zRNu;^6AuRPlMNXzyS8c$nK-biI6a`?42Ou)qKQX(I(Z}IrkeH|C9(tMyl^kj-e($;
z5{UM!ij)vngU?t^+!iSb<vt;|$18{rCR9s5wm#nt+?P}iibsp~#eL1(iuND)le*Ki
z;;BtFy{}`@mgeZw`tw}?4}HXO0xx&H+8$r$w~Z$3J|@-#_rtb>k`3G>lXvj0rY&Q*
zp}a}u<>j@D(VVO1%mZ%K&W3EQDpOpU;nKm0X)Gn(*#QcNjWd|KoNGN{;pv#Bgk$lo
z+XS(RVH~+Z3<IqjD$?jANffrS5x6@xgCoxk(VV?0I2L8X^p|4bfIc`;>5bzJPor8X
zJmr>!a5{9XWZSRHy{7&A9k~-#T7=m0`b*Jrb-egFiwK75BtA#_jyuDJ{BBxC(c)Ec
zKCfX{i@8i1L30UrU<b1gITLsQCGrlpXn(b0N+8u-0pC3)UN=FqC4Bt)Zl11x(l4E7
zNCvFK0Rnz|7<tvvXX^D$WDtX^^U;$MryFN~_nCx02wuOH=0jusq>CgGOXr&O+}g5?
zrH0{85zu{HRS((o?vbEKen|eaJ-{n&Ak0D$XvL2%CjMOWaywwc#0&B(UQbi3C{u%3
zfU;o7QpV~7w17Q_$UQH1sJ!j!4CX-1)n}xzwu*tV>lakGrpcP5jDyDP1%-tki&1Qz
zrMKb(-D@B1zihW4>x$>!!FU(34-9Iy%nN*XIYJ&_ihU!5HPUdE*_nyGt~A-H`p-{O
zUh0>z^tiASueh?m?V8KFnKmdveoCZ$ct$tIaI+y0xsl7U)w1XBJY57eg<!?|^6i?z
zJpxG#1P(5HpZ~qY`;G7l{O3O);WrgXU)~R`IUfo*KIogj7(lcl#A#rO@|yA%!-6DJ
z7|1X-D6y9n_bh`5_w;7hzAi`ht@oI?O?1kRp6v1aNokv$yvX>%l%ZOr`x{~o^PLbj
z@w2C6xmUF)CmLNZ508~|GQ-Sj7YEzfm<UE6+i6VxU4s+jn`C|)a#PIz$=#z8rC5-c
z$M60cURyjhSd>}{+UUtmn*v^5@A=@~*K)}3c8i~*HfG$0;!GM>L|HA;M;#LE=tlH;
z6%?=c-ODV}__OscUZ~tSOXM>x&6i?0ZbeIk4MAwPph)efPa3dUrr$L=y`x~?TY+Yr
z3Fm%<+qbXNPEnV1mgM+6M7D|E;1~T8n|Cc8MOjR#rga$2-q;Tygwe3D97YU;DllEv
z#tBcee{l%oLy`8Ra`ai5IK(v14E>`_3#SgQjsu<F86l7*RWS!ykK}`NSeJh#5{OcP
zt4FoN{gVVD8{=l=$i&WW9p3E&zSFTbOk)@M+k}zQK>bc<%|$P#^N$;2;p(vpOeeq-
zOSfXyUGCkE;jLF9drI8{MBPo83~<etuUim$<AaQ=LrLT3fWL(>ylA3O^-%{(m(@=A
zkJU`)K>^<Do}=&Pc}6DJJ!y@iR1qDkR(Sn9k<#I`3xtiw<8`e<sNheZ!bYTZY#kDs
zQN5S^WkjKVcdE&$_4-y<zT_8z9B*Zm<-OnQAqmN|SZRrEt)lhb#<a{09Mkm^N*6=D
zx!FFmCmiK)24er!8$qmv<GAP19k*_8hC!(tHMy4#{uYzkd^!|9jNRU@i4ScWq&D9b
zqC>Hb9EHlOH2``N$~v<Cj1Hrxb2RoJv=(3Dg|i3ON4z)HV^mNPdjAG*Ve?`A^!t*W
zHz84#fD<vzmy?s-C%PaHOtp$N%drjv0qK7-?LE09GHk=J=}yv>*O1hpHN@0MvR^U}
z0#;;W09zLOwyhV$jMCa<jeIPZ?7ttswxB4dVfBTd&wlWlw=KjPdEX=Z!ToEr{}R)h
z?^mYlcQVUNb^<Z>Fv1N&6Dh!U^|FjA8aF>ka=X(j#N$MhNS+w9mORY2?^DpL&ez$F
zV8T%6J81-py!f3#Al<Ja;1;%!=<7PfU(g)a*ma7E>4X<cUeV5))`29*oW7ImZmkUc
z$wXW0v)hQdiQDuw1Bxk3$2~;S1=?v6sUDGV3@(vLTVudkk?MGwc4Dm^Nt-}e5X3|o
z!Xjg*DBVL7wZ4{AU-1Ulg9bFBYLiED3JBTY52K%Z7J<3$cO<}74T2}#5p#U5XId~|
z3CAy(XX*)aT>%B2BF8^4<qF}7X$RDN<RWF2=NmyshJMGi6s<I++u`+e<xC@O^$MFC
zuV5GN&cLtQCFOxRONgavRL<6<a{NV1u(sqHjfQ}^1g2}`aLeph<8{t#o@VoD<1=ck
zX3%XAYy7%9F#Bed&ycJuP5ZYn{aY(;Ql)2UJq>@<W9{=4vQ&hIZ&Mcdh<&~Lx;Dm9
zP6Oaqb7$jqjZaeou%I{iu^eS!0`=H(8l)HkOwehjzP96x?(I{3Ga>GpLw<pyyM5w{
zb3n8c+YwSy0l3?XKrKIxy>4mTc!=l@5o^a6kQTyKaMKcC9NbU&a$?=CV1-&rkdami
zR@pUyy?#Bm{xIG6ZK4}$lk7bGuNp@?f|;yZ_29b}&^tDeXw$v-L7J7yaXr+%6ru9g
z*3A+pWHN%@_oK-}mE!?n6qf|?;%8Iw7hhUOu6|_usMj^=JKytL{UW)GtUuQEOz@bb
z;%5zVWWvs`;=UMg4xr3*8{F1e-&2TRyRr<ldi#ig-bJ=mzi!GWvvz#iUL$wLyu16I
z%E4(Q`0r?LzD^P8<vkV7i<%djFis9QDm5z_(~@Z^mlW1p4`1{*+w`lHli9B9s&>5F
zm>Wj*{GBw9Rk~>T>^x>Oi3NKH)W@P}7bONmy)a-=bUw$Wlc=nZh`@N8%{z4+lqitw
z{<gwzg)?f6$p49?iYsGoex9Hgl!0)KWUav`Rg;ubS=)V^kGHtS9n;`Eezf@^mLvTW
z-WLH<rnu)DLPPPyp2Jl(&qSD~UJFnv%egwW>S<=Ifv%EdZ(;A!=`K6o#?B5XAapgO
zu-IRW0cq-+!XVN-SM!Ky1%j2tr4dtMX~n0Ki;*m7^^BP=aY}r#zvPbxB*D7RI3z^K
zxq`71Z}HRvvoVryp*zfgQEMQZtK`m|8UwQTJQN|jJq%vP)7F`e)htxu#SjU~^ViY1
z<6+HrPy-K!mGhdNr%Y#?{Ce{4J<zB1UceL%tn{)IPokU{p%f>U?|*c{euMxn%;Rex
zeI0_ce|6-4?vL}Qq482N2p)Y0R`VT9S4}4u5qVGD*Av4(7w@MfXw}WRN@Q+@TD}RU
zcgK6nP6-j}0ppFS*9PMa6i9up51LmhQ&`ZLFN2?HD<fb!rU+P4j}PX-^0H+mbCY^Z
zvvb7Y;Ph^{{@5_lyA<ZQ1eOI0W*7~jj$&Qbnm9eq(&=*6I%CFuQ^xRvMah0*d2&T(
zOjGrn_aGHo9j}#DR;52AEj|ViXr@))Sc<Iug&;{Y3xJ(rTA2;>1!EV*s0?$Dv!`BV
z*0kkov4~QKgAlZbbbW5x=2QCGn(xS)cyHmX_#?{)&R;YtEa-_53gRDJL$NWAlC05>
zPpn%MkBiDguP|i72Ap&-6jRx@_uMu&W;q6z)Sq}Pu7~%7u1RcVykJ|KH`Tpg-|N-1
z9$kx_NkWQD#?$%0|BtAzj*9a8z9vQ(q(NZl?(S|R1PM_P0qIcbPGLYwkxm^NMG5If
zT3S+(?(Xh*@9_El*1HyexRwgT^PGFmKKtymZ&{Y3R#ix3qTnWX-GiVSescK{GroRY
z)qaze^A7<`gK)XSnTShP50$2{hW-@Pst~cpn;)N;^EAX78FsZv7cnBs1v_Y7fiAK~
zUfyHOEX?i{PQ&*E(R4o5?(v^W7DfS4z$d;o><F=_Y6-YK4FC<>p9B%Or^E$)kaA-A
zSHhU<>)n6=hP@>qR5I=s{P2&AY<ZIAkE&4$Ce*ENH}>aX(Zb07^zPeg7WrAYP0XSb
zX?rrGHM`WsTF!{%?0LVPjiF{#bEAyDa4V`YfN*mA{nM?B^O4HY<$^JAB3NFFYri<_
zKsIsZ!o1~PaFjGP14Z`=S1|2OSJ(*N<gPa5V_}>Ah$up<i$M&7!y7uj0$=Q~=NQK+
z?l!IOu-5Bm&mDY@EA=;ZE#_2mh)+caRMs_A-8ikM#=Te5%2Bne@oqO0TeOY`eCs;a
zgODY~Op9(J@rkAaxyEEO3RE-rOWQM?LPlC=oX+HJs9cozN($8%PcZr)=Sxdvx0UR9
zaFA;MNbT3MICJy0DuZKvwNrj`_c2&O?$MDS04vE-szj^5*gfu6*`7!d|DL1IxSU!Y
z=6R;1y|X)<%9sA7>QMRoKcGPeZzKvo30cgx=jd&AVrIZ1{*5Qy4Audk?ZhSXk3A%l
zlO)+@@<EO2Z26YTcl7I92%VxB1rZmgHHlsS3)0RccdIme^BDf*=4QgVTF|i_e0!ag
zpnUq_uQ#pR0;o$S2fpZe3K;(U`8z^}X8$5hDVOVm8|egu%iL2_?9)*#+&(DfKEzZr
zA&~Y>?ePrRjfjiv{ogdDR)ub2u`F8tHgNwJa(<4~<UW$U7>eGwKYyiC-!H=y#rd)G
zdFK|B?^dY_UX8jFYLJWYa^MrzKK?E=&~UTEV?w$omwKTBVJ%lceVnknEAR~?>YW(0
z<2u40T19Wx@bFsZq%`^qve!0aQ@a)0F>c=%of!;&qZyzWjnr%LjX@MdvT45fy}Kq+
zK1R01G`u!jQcoZ@*pr+SAG_mOJ68|^3&a_!fNnOf`l+DxWWuCW(R-#!q|ngpZLAzE
zv~OdEVGmX&YjJ<-9|%Fuy2L2W80Wy6rfzkcRsegd(!Zfd&&8?p7|_xRJUi$5OKE&(
zjs%ydZ?3OR5RP$9Q4Ji&(2_Y{s?&ss)5$U0qu8shi|&W;`q6KLMrd3w|0p?JB#*0!
zXYd|Yp9N&Wn{AmcUG@U2%V=ya-T!1<m?T}i!*D3;04D^O=cG2{ywAqP$>t>Dk6)6-
zPw!j8L3qjSbG%1t_W1Pp<QUCjxB|a;bl)kzkHW_%!)JKERJPyd^d26aB8_P=A3jWD
z<;2w;$`_t8fQ#l_?E0f@XkK!X57KUsgeq(OuK}zij3*F(#33xwwsf9#!B3`sYt14B
zpyEa<R;mtN9Ij3b-`%6Vf+|hw^l-8H$NFm%AOddA*Z=5h74b%*?mr|m7UB$7)G?BH
zHl!mC>fr$jl<>=V2KjW)(;l_L)hQM%93gnkKXEPZrcUn+@0C=pOM+L<S7-YM;-r(>
zUh~@FaG_;78)4j>Mj)(PW&1OAy4?5a_*%y2DapGDU+I+pBoNJjO19TGq|K<>oDZYz
zw;u+)Qrsl(k&#vQ@3uhZNO#4Z*UC6i7Ero7v;sO@O;1vzN*7WihjXbl+Rl!~B`fN4
znoFgA3DAe})j+&7)nX6*JbaXgQV$)xul73+QAmB1BEx!Q%#3iO(818zj)${{#qqOy
zxCPK);WJTTdpAWIxN5v`4k0NQbWKp9DHH6K{u{r|@_$P*))^@FA{o}c>bGcl9NA{K
zbC|N<v;s%ywq<-4*9_+ZpM4ED3ky)~lWXN#hW*M><k9uk9QBM->9H_MYDN&vH5M$)
zd*HnPkj2y@<nZ%&bc?`cSdG<Pk{Rw6qjNsU8?e{Xow(ig=2#}<YKirYO{+k&QCH<}
zn?e~7OvpWPm<vQfkNvm=_Pg^P#0KH4%#qgL`IMN*l(WmZOJ(h;tuDhhkiXS_gjFBc
zRNVM%uFB<Fjc?ib5?1uBvLN4*&7|}>*qB@y$8xNh52dn$8+0)eB4Pru)9kQIzx)5I
zpLsS(TIR^K<7t(XX@=A@neG6f6mU*stz3Z|pi1I~Mz;CV)M8As&CElz!rL#e_uBBa
z#G;BD4th%KXgGO#e~8wBg>K8VKa_vpJ<fe{l3m;)7+QE-<mk^iK=50p??SCLJvejl
zi$6ouyRl`W=0tlYtHMY#xf`&7N%tJHYS4C1OkK*UkkPyc*urG|^w0v1Aaz7$8oy+O
z0yX}<^w`1|Uy7+1kh!#E%oqOmLhz^6_v$~LW!fGa=b9F_am}X0w!V1Tnn*tx4?Huv
zJ#e7an$CXln(LD8g?oh1b^YwSHkJt60-_@C*HhFUQ}jjR*1sp<BK>)M&vV?6-WSa=
z%miiXU20DsSn+MQA_++c42FUq@8i$i@>;YXBy6LF(sw;ldTc32tvD=@xQ)J<82?Cu
z2cHyP!z&(ePPLaN-^h-yrB*%dV@QJ|wck!`kVbsDz}73ML_Rg}rR71|(J3GjUM0V_
zR!9#6-V<VYl_M|X|L40g0Zp*iHEfcg!q8zNUW1Qku|EFvr-%*1E_{#jfK=R`G_+al
zI3dEe87v?gM&YSVhQ{&=Vhf-<Qkm?`7QGewHK6TZxot>;By;(WpnFpBfM{nYE{{3_
zdu(92&zgd1f?3du7!gU{02Xz9yP9-F(2WS0%cpMFa-x5r4>(a_{KLp#$ExHyEXNHq
z3xj{NK{}rm-ODLJQtf@ckO{ZeBf*rAl+spWO|h&F#iqcUhkZh=7&vQ;S*H>QU5w?<
zd&-pd3Bitu2TIj9ihp@aX9<@2FyrO4PMH@MVA=;#SAa6>?J(>ri(ON6l^P&C^*NU+
z8PL}{dp+S_J?+{YxzZ;oUSULH+Rt=Haw&e0tH56N{d6jI5(MBsy}URlRFE@SGkDC{
zEDVNa@p9`sbg-kbOV{eY0oPJ?7t#}<d5Wo7Q0{$0!m5E*$vqZY=w$2gXp+I_+D^%F
z(njDsq=lqTMsGiUr*g>Ix~MIWMlnb7IB-;Eg54=EOjm)K&B$E>C<oDEyI5E`ZJFjP
z^kdrFeOm9T7F?0BOpoUaVoMa3<jbj<wmfhH;&7Wd>E2bM&(mOIbm^uOa6jcn1Op4m
z%?cYdtE&f1EFG`aG%$|SPa9YX8|W{nhW@ej{+7J7sY31_Pp+-p!1tXJ@tXnabNwTR
zQ_#5o(eY1Wwrdb34>dWBP=j}G)HR_BRV?6Gn=1a+6qUt4C1>aFS2Pm|5`ID!$_G#1
zF^F8MJxwhQ{FZ%Jp*aoALP!p{B>3f28FhUs0*-QMe+#-0$v3#cbmR&Nkw;b4w2L6T
zDie%!0{EnCL{@g+p4Phy5kF|`6ZwE>zgb%DtAKsZ*|So%X2{@EG)&Fb%|<+Z;_MA<
zM`T0<qz@$AxiSbX=_KX=abTD}9`Q{!b}YJI;<BXg`Xxma0sO=2JE)PAZtTWtn*kR3
zorwtCI}W9cJfh*Tbt}rfPFaMz6HMtP<A!4@pOSnvi3`p0V5g19x;4<-2D^N2x2s)i
zPcbGVk3u2*{lK1NlfAs}kn9#@M8-I|2K9x7iJ8ZCi`Pf1vbW-ofdPq1Cr+CAhz>#9
zdZONo?@7h%(Wls<UPljmk7iCAMe*GLmoL(k<7CUT>~iwaQ#a2iaryuE&TeQ!jmg`r
zbuS}ZI-+SaG{u(_re;kYFG$5s%B7!(vxJY(*`H`iZvUZB?XQyfmWoe?w(qAs`{cy(
znpjIJ_HMmsIZ^*BviqCnc?F2mf{Xd$RrjOs>(wge9qc%@9y8vnS5o_1u?t4a<*?5G
zwZ~H+;Fb=iwY2Xca!a_mI?>26qfzR|NQrW}aXh~Z@A}zcR|Dl=s<m0vVM)er09#6^
z1oCZnP_t;IBQoNV!iF?pIdr_tht~*n;eQ2_7T-PDz;b>fzSoRCLTYFiYfrE!cY!ZM
zDc^>aN6Ot2hM#(~Zw@vw^R<#S?uGa<%rvce!wOo&Bb;f2He$SN77^|5&?5Jhp6n7c
z^)d6ULKeiit>}a54hmno4Lw|U&A2r3CqnpPxjYPbrzLj21Jq0FHH%T|$ezZ&o^s&T
z`PILBwS%lcf_#GYZ)&zy;P|n|u7Qk_6iPtDZuELSXYnI2|I`A@;4eRORw13NY&WDV
zrKn(+!?h9Z59)>9DxtTga4@ixOVi{ZNI4^FA)#RY==aTYTzfF0Gu#G{mxAKNNKcK*
z5$@n{vp!YwH^r467i*m|pI{FR9IuaugRr@}USlc>+(QNo5zGi}zn^#Z6z22NbJ{(E
z&Dkc+UC&rP0lnfL(+RH)#gu*M2%RAAf)ELz#+Yb-Y<}q;N29jAZNEr7@<(61{lW24
zM)U}i1|VH3#8O!=uh#5E@ohdY?xL;r<N0&>T4mWBD%kljSyRHvxMzk`FEKh>EZfM<
z!@>Wc)&Z8=Yl|9}ghrgcOt3@0@_FQ$zHuTfoR_$xp+e9~{OGrO4#|ni?JqkzoUY_@
z?4*{`?5RP|{WOv9{|ov<A^3qmdiWC=Jie|**u*}bB8K&760jZmG0gq)LH!@`r~%lF
z4v$srAs(lV+C$a=penP@v#}O>0Su)!;Kgig8;P@qf)`n(zyBwbrGtweS6WRz7J6e%
zBy&3DI-<s!_S7PKK+acl7KJh439E)7Rn$#iv$6@}lgOb%<7+)_e%c=pg~r^QW!E;(
zbZVTMAHbmOi1+q@w=kdBf_d#-tg|>zWX;%oe8!cf2S=7;W1m3ppU!W@KXhvDGR_YW
ze17cZ1VV6AEPcKH1;`5(O$I_Qd(e*Oe{^e$;^6S@<L}G`h?$kp_9vLnPU`%s8mvrO
zjj&%Kf;m7IYO`iQD=^JXO!98TzAvHeE%5vBp=p~tZ>=hEtD8pJ3SG+X0kZr@y;UB`
z66+I0=PJwM9#RMaA7>%h9r3a`yapol$4wW1i#NKH^$e_*d)9sTuijdl!^`k5QwRK5
z_=C5AA=@W&4e_2MYUxSY515ZklfWVPV3Ujvll+o#&_;X1cYSl(G+;INuf1{2xm3CV
ztl}N|u%OVJqT_`?Y?&W6<#Gu+?r9Zc0V`7lv{bF?%k|@5czM)|aCXYCHW~gRlm_$c
z16&fZ;ZUW{cmC^s2}4BAFsY?E#bJ?2hj>0yn22UD<MQdY8};&qi}>58hi@4P28iw@
zeSFB)k}^M6-E?hF%Cwj(r7OfIq~vy{E+4l>tU~ox>Fw8S{)HMsN!Y?Qd3DHnA++z#
z9kqYs)0B)QR(t)=g!piZcCOb-npf2Um(_JUU9v;9wv8hZNnS@oDy!dyVR04WxJj$u
zu-)a+{F(VAcWcMRzeXRww~1(bBpz|xcRwV!lR4QaP7}bJI!lQynBhFMRZzJ0{_`NC
zhZCMn{v-9#-kuZAoz%oF<P0C5i?j1M)vUVCzogs=$7r}=+!lpB`X`vMAuuO8Jcpp0
zh!aVTAa6)nPHp)-3&v^dAf0<xKl)MD!*Ps)OUV}8;*EBj5P^aZykgWR?8<+;WMVSh
zm?KnupML#@y~$Q^cRWn_phv5|wwgVk;w><PC+X75&v_zF)eM*spHnMCJg1P$RV*4Q
zgO97b8rSB%P3UbH@#AyaR#ODboczJU786FZ$e3v`)qd5V`EuUQ_=%ZH?>5!5kvj|6
z9$`GCpFSMrdG@ZKyS4Lsry5UI&Mk+S7Cf=~gwcjrLTNr!9Rp&gTV4^F*8Uws+g={&
zR}|>xY5uksmCQu9Hp$i(4EA0>d*C8haU1*ZUOiu$oXJeE^!DUPRb$Ccu}hDu2S@qH
z#laZ-`A+AdOGbRxqQQHPMGaNjbaJVto8#in4Lh!Ao)j6$^NLp^8#eD(*K%l!(Drvq
zeerrI2Ob}K7h$_*1)0dhTB<Y|7g$e3DF|g3W9q_zy{Cc)`|K)2z7=l+Fm@WO8GbGw
z=@G5oTB7#YNE+C!i#}}0RE2Pf8!z%yyz`f&OjWA7sT>q%@Gx$3B5TVlX)Mn#eN8K~
zcQI9Bx8ZR3ZtyNJ@Zg#-%GeZsuWo$v=6d$lUjopMWsDBvvvb}D2Kj__1Q3a-<kE4F
zYf@yCiFR#fzJNle-r8~rwmCdH6f>2pMr`aQ@D|?4J3;JP8AJSttvW8={`S4JJN0OK
zTZ9Pt=!JIeZE~z@K<}7XMsUF#Byx4}uc^QP-4)LmC6U|3FEW!ppQ*js=U^f;d<wWW
zs=n7DBzj%4^Wlj_KD`aqmz7g{ZU5jU%jU|h`Cf88p;$Rny#)qxdletU<;*NYN_o&}
zm4sTll9ejjk^kR&F4#6=o_nCm_N)gp<`@td*pP+ug%`axI4y*olgJ&M0X=tM9c4+S
zG;RLrH6R^fnqhWE4z<g}$&E)}D*nCnT_(p@&=E1G%++X@MbapMQEce!^%O&&P-2kh
zcj^~kUAkYE7A1Rsx@vqlJiE8B49AWa=-ZATK0NPH6DA^Cp+|GRb?sgj47F1XcxNDu
zW!V~N!E`|(Wy2K3&RBDZAnXIOc#-Y_`b#B~T&@i8G4BeT45a5In_UoT&S)Si48{nr
zJ$}3?Z=)0Rc-Yz%gNj&_9ibT<;F-ifnFbtSnI?9ae2`QodQQNM#_u{)zfQZMyKi)@
z7U+q~ejs8%I!&)Rf-kivm!3s1Ub`;z^Pq>5)%t`b<R(T=Oi74$L~>?7szQBP=%WSw
z^@Iycu2@pTIUY~1)Bg<~<Dl=ROsf1L)4#$`BL(}{tYKQWsKz814Y>kqJhAzw0LoIO
zFhy#N<#A=~4w;yZGr?mu=`4*7z9Q5EXeJ+^?ceO)-Z*|V2Q722ycbq`Z#ikG(UueF
z>1{9{1c{ngs6Amt@Smw5K}{18^!$sT=k2;yKu=Z3?B&d9nL`k<x!(s(QdU+w?AR=t
zfUA9@Waq_>FP=@8)9#tZI4+F8>gyAl%s<yclqKL^jWzuT<Q7+q*2nE4%V5^h$5ukS
z)aHS3U5|d(7+rc44VKei4M?B%wGajyuVHNaLJ03j(``u4Df8}X1TpJZFt%n!x(#(>
z5}XD4uVoBl{se3H2R<F2?v~8Kc#XTLX5qd2yp{LyBS4J9Yc&IHVjq-|4)76&nZ|py
zVzDmSM@ApC$mYA@y!6Tn0R{P1Yr=Qe|H+z{f0baF%=HkwM5_kFVRg-~y)6*+Z<^;!
zDoL5i)dJZjaZZdC<>fv*Nm<6lpS<Cl%iWB;F>YM!1^IFd6ARGY9tYB~E!0|&M<bgE
zX=5ak1FI4o1um_oVK&fT6!)uAXp%oFaYzHUXBf;p(-R#EKdk=X`ux8LTa$!;MJQph
z*?8;UHr<}y5|zuwgdcP?HUv9Uan1h438eB_%X$SkeNC8y^82#H_@MAw$czvo=plQr
z>6{;UbYD4tz%p(&n{Ep5OckDbVvx4IN>0szG0}sTcvoG8+WqO<lh$*_^!l=`hVp<r
zahItoQTVAy;+w{LehGRs-q?8_PzI=|e>6as1TlWc4v3L1JAUsqH@O%F1=z8*ncycG
z2>8!BNhH@>u&2=tQ=NAcW!GT2^Ots;>I>ScC6rY6$@k1j^|Eb}u*iK%e~}hY6OW&O
zIqWidoOu&+6G(;AhDFbsHJ7(nQuxXF%cC^d)Bn~uOmo3Lan)9^6liq4t%b5XfmlXg
zUw`zT;M@K)Y9EUWY9{M*Y4DfC_UnMLuRFG}RhgXFk8K^;jA`B?fS#B6?Z7Bm_weCV
zSaHsOpXo1W^Cxt&Fe5z3^XAE!`RmaIcTFp5!4Y0{-`BXDvZA^{ihB4AA)j_%Ezw#>
zF{7;gYdoo}>w}{7Tq3l-M_>2Z$ixS8*a1(wX|!$S@y5J2kvyuIIrj8|{^o{Wz*g7O
z_vDc;2^u$_p-=8Wz|EofU@K5f<2F)i-~CQ*bc27!=hXLeXs^YtR|DP((!#k#>u66H
zRTUZ>k&BO8Vl{1el7CRCw?B9UZoS6BK?RLZk`LPjPv2Ff2?iFW=~3OhDr`V9zJPG=
zeW0_M;jo`44qTn8>=~f<V*)<?oBh^cTR_+0d}xs%Y1aDAZR301XzY}Bezu<#C4MV%
z(1D8fZ1&50Whz4W-q&cCg{(3Q*)G|VJX%sfq-K@v<CJPBWo{NX$qYR50#eFS4o4M~
zUj)#3;zh5>B{d~zr)uM46mDccjm!ms5NkEMnSp&g`wt=t^f*CEN}?F$tor3&V)<z3
z%Z?nLDbYs`@zc>itnE=F4+Db}M!46@G4}L_N&Mj*+M7TVvHdLfbh~<127m_VSHRmd
zg}qhZfXC|de-XKd<>qs%D>xBYztg~J>^ohFT<Xw5Y9Woy5VuLdn^($Ik-W=rYaq}k
zHT)u+kXP`p0O!0wFPE-EfA5!}`<!gONM-}rytB=w+FxrNU5H@{ths~5Wt*@~pw{xN
zPpBMy!6}LPWE5%ayWw=5h40UH>X@2Ef~n*dADfM5zZ&iTe~U$JaJh<CUmBrp1Q#@B
zVy*6TM$wvL6EfD*5l6+h7scc7SHNzlAMdhM<^pCleuw?RDw0%KA$tbd)>EgaW_qoT
zZ(Zx=SuRbv2F7qM&ADh>sL6BAw`^oTXQ)K}WOy}50=hte-jAZ>lFT^%uC3|h9HPPo
zLha{~Ik5rnCl~yEOmqpi-_cNKK3&7Ws=e>-PfrQtHUu~E?#f_!$ED2D_nE&PKbiO(
ziPnx9Og}4Rh9HyHI&f|7bAmSX;$)f`0-sghuk5;Cm+YlJ_`xJ?xI!LSCA;X)%+VqX
z+#w9Uav4Kcg|rvFm|B%dRx1SUrZ*Z(5Zj#819>7m*{i*y7W}t-O@^^ysvCg<7`LjX
z&k1a0E}!}w1jmm!_Fq4)y8ie<?pDbJ8rCu>{Szs1CXSiYA}P;5yyDcqS9xND+3LZA
z-dHs*W~TbkW<f>vLI<g-KRD;7n9HJjO(`l&NX&S>D0^ceaW)rxXcs(`3dSiDrTC9l
zh(LC%3WYLesKv8b6`vp#0q$8s%5EpGY_*$1<Q@e-&^2uWT<Gu1>O@1bCFI-*70Zor
z(9b4Y8>!nGM*a^sKnpMX>(rQYb&DjReL>vu7Lx9QlXN;xjKa&s&m93X3*Lg%XR824
z25l2ylD!VJ0zSfY=e9gJ!2~C(wK=@Rgn?scU`W^W*S5XiclRykDe_hZ;8wmMt#!UE
znM#L;FMH**LzYv2aT77CrJMJ-r~rP$fiM<}x+WiF9|7p>Wb3Hx7pWl=nkjuwV!3Up
zW7lgdN!_G7mst3`LZ)9v)z1;6DjK;a@@kkmzN}>yq?Yodc4Dp3WEDPnsseV_C{S=a
zN04CEAGxntv6}At6_j7*nYLw^JVG|A2;b#@Zo_=<u#_%I{0ZGO#W>P{QT96J?3wb9
zb2MxM=eh!c&;a_)&nbl0K(^8|2@?$fTy-MuB7bJIr7WXrin{3uw7tB0Xy304&%)b!
zqQiL^aGiZ2f)2sx^e5af`y`3^V!va~_3f|*Y5raj7mkQk-BjV6{~AI)wBM&pF8I4s
zz)Vow7?_5i!_YFzX+w`9J42?4C~wa*ZpEpAVrsmKFLK>rmMhsEV5H1bh=R=h@o>iV
zoGH-ci0^glHy$L`@!4TB!bBF?`nELgBw6<K9Xn<t!+H+JG1zy5T|N-NyAiDET^E_i
zb90`L6)4vlMcJ7Z<C)^Oj?@7yG7&oIh_mJ#L_>gxPBfo<e8%hgcc~5!nj{HY?|i(x
zLUel#n?K`~U~4RaZvs+yu^Ad$`)N1PuO#3#U|UAnR{GIC60=JXD4FHyMwfEqJ<44Z
zb3)HC#SQj~M2)(hD}4nNc8`%<$xO2B%#!eZGN!>|$fp6$5Msjcagw*dP7!IC%a(z^
zs6y2L?lEf;?bRISdLTNUD*yBK!%sTrcW{dnz9LDK^9Uo;StOfLZXvDrlDy4rrgj-c
zh|uvAc-KiW(hEFb?{OoLK(^i&ALXPBhl;aIC06@pBF+ARiFn*VCBTz57K9j&VTi~^
zTuO2&<dn&!{j9<Dn3eNTIr`C+;GKDSb2D-HskjZt>^cmQ8EN&E3(+2M)<)}5fD_8j
z6xB&s5}Db1fz*;w1NadUh}TE@vxlR=5}mZ_;d@ukyn9HLW||971oc1t#y98vB1?d<
zSxEapKUW-Z{YK<(#J9Swu)@B5rGJ*nZK_CS9Z#eNs2^EQ{Cf>&h(2!-|6?-xZycEQ
zh;E|WmXZI*H6Q?D+|^;7@vZC;&NZMBY51&}!ghp7?WRp3>0wtbqcY0>41@Vd6fCC6
z-GVGsoX{iI-yT6c0wnKgH<wMf^)iGm>@J*(VvrFK@_C0<TK*fl>uI}wHWMJ}Z#FB)
z6bp;oi6<;UkS<t6%O>&Ep2Zz~;q_++n?;J=w07A1*)|$f;vCi%GawGj>8~|`uCQ+O
zc@E2?)ZCcb4O||OH(ix7x5s_<S}@C_qUErWR&G49EJRsaZ7JSjO?*lHmKaFjM5AK1
zDw6spietS68LOdus53eA8G~W%ET2){=OUfxn*{ST(>|pYwJFD-JfXc93>yZ%+sUkN
z&1Sz|wcpL&{IG;FUUfVSIQ%^OC+c07wiur1EIv|Da?zzC6DI<0Sn%8b?Gnlxds9@4
z_wKs4+~U<#V6N?2O>An_)$YyC?uG@@*2d217w+Syzc6XM=o}@H^0q(ALLSR=O``4}
z`|n}lu)(XM#9KMgQ#4|!LlcBll`iqn&k3G?p8|x)HrO&p;7;~X4SpzbLKY3h6uHB+
zE>i*JcqFqh0)CI!H&KXoIw;15pF-9nC6R0_LQ}IZiF*0PPsG0~&j&#;66B<sz8qp|
zvLctM(+z$`mV~2YxeO~{b0<jd0r-^RIxT|~hciY?33$%5edCmElOV!dbF`TU)1wA;
zI)-X_x}&FDIUme1;GZ4p*d=jqW^b=)3tV3~wcOLyCz*~tmDznA^pby*>;AZ^Sjb{~
z*>aL03l&bPe1XQ0b;%Dq(VqWIo%x2b_IQ{czHAILh#rC9O(}8NjQ+d58o0G|Pvaw4
zqSnx+j{3D0?&--CM8IIUThfL%4zCwaZ+_bt9Gvvu&OQzce2rGgFnlK&B^|8I2udqg
zt%Z*zle_N#VTsZ5vFLMI>RbHIJn54$MioTVrm0Dsy)gk&Oh6F6nmoKnzH)A1cZC!h
zAt#fY#EvB`7zV77!Pq{SI2&r6H`k@>{<{Gt>Ff+>3f5^(UtH(NMUaO!g$(N*7xAth
z;vQDn2SPihjz01?ZSs_9at->kr;VppnD#-~{DN9cvqkc)Mri2jbW1s2Z^b7;u^0vx
zo+)qLCyIw})32Ip(U9z(h)3S-2tpWHUHZT_zc#(_ESC3|yZ#`O0Bu<^Y8m`1i8LU^
zS_exVz51%!6n5`Z%(#x^A;s5YoicZe_;#M{Q9TljOQCxLcTyR08=PZ6hxC=>x~Q&2
zuT#!95xxa=r$cmjNQKrI)3$3d|L~)SLNGbPoo>si?fBp8uft0wZg|K((hV^AR*I)$
zn4uMf{vR>$bG-lC=TSqh>bbw!8e3_`e4s&;QV+>4A23)<wa!FGJqEb)@m-^KKV&%S
zn>^bV-wnOlkt^60V|{>@`-GsM^NJCP3TYS!cK>?i5q&3p*o?&bTe-ORmzb<8%urH2
zts&37c710*&wyxNZCM5^oPh3!gM|2%tj}HQ)K4H2OB4+0MD#e!FLRxkn4EgRb9sU9
za5Ex%t&4{s(g|Ehjq+5YLZS$8ILcKrw}1B3Q!;aw-`i`v$pF=^&WQ>Ih@Q@U=0b3@
zoIa+7?}U%cA*s;IS{$!r_6dyT^0@bR>W~>Gf?exTq1i+`3n@5?1Tl+-Dw0v}U$i~?
z0K*YjBhd_5j+})swWr36V-7wOu+U|i9YDTpWO`W<f!kgx%mzDm0_T!sz9i|zNI@5O
z+v?|9ld6=!_3Cu_7=R0#D7x#a>Yv;y>Ctr~KZGZT#;m~y$Kisn2>u?2ew7C1LPtOX
zC^!w=c5BgK0S88hTY@vh@(fr6YJ=NFRTCVtyIWg=X|c$Xl@bP3qLp4^oXG(=M3ecn
zLK4qBxLq<)DMmALU3A<s{_3rjaYCLS1UDYC!UL~Di6ZnPo2KdKk8Q0YNTV*(k*Y_M
z3d1d!v<Re2e8Zc<=>L0^reZ{y_~$;$`urx#U5W~;!J6S%FH|8}Ez#yc<kvqrmf>t0
zl)MWj^xhipuDwJ#HsxBG;NHOBpQe>&pRDQZVfq(pv@r&AUky{c8C;~xEk+xY4#<F}
zcvFL4+dhe|{q{?gAn5PQH5nChEJG@+jX^e9N2fiLqoz)=ZJ8<*gC(M0!hVlnWzsLP
zu#Ar#_YRoT6RnA&{kA~_y>be_IgZfs%a*|prWb>bjI-V!1Nkeiy3+lG#P*FHvQ97}
z<PNEOE@M+MbTEv7(aiZqY;bs2XfWX<|0gDD5cJ|c3rJGn-rG@ONoXOmHV3QFrSI$f
z!U>XUgMB2>KxHK%av{QN?Nbe>deC7Cv7)<A5X_RxHXt7x*>=Z;T`1AbWc|Kj*|nPK
zOn&L}N}5iw1xJ-Q^&_f%lzhL!`3qoy;t9NHrChg=#;Z1AQQK+#WI%g}935oZpzYIG
z6@R@#n)<IezXSG{^pgI>-}s1jEsmnai2K1U8wR0xId&)Gj!oCY^kGzSP8^m=&o3ro
zseGYC|I>93LTp{L{c{GKw=4gBjn|Z5r}TB&N%<b>fA%g56TWoDmxFgr5+^Yq*&<5>
z6M!g0aUbJD`mOc0X>ZRu*TGNjcmJi#LWMPit&*92J1~=qGWPV^`6`Sb);o4;1$&yr
zV8|R`h^>&Nt&pp&#u57{snFoP-8l0LwnyDBnBF`xDCZq#xfBr`y*<B4KQtOJ4K<iK
zkY4`jeLB57HSlxSbKtzlexgFhgaSfjPHU@~nuUF)fW{<;_Ex#MM^jQJsDIQTfetK#
z#4)PiRi;|tEFo5NvX!Un-2du~n$KU&#LY=!d10as%!>I`S{;(69=CCM14obPw2H=%
zvosYYrJ4`XkyPSO{KIwpu|GCBiwfMxqcP3pKoG7{?V6eIpMN0bKC*jH!pWi%MWu5~
zUs!E3Kw~Up)(XMB=|+f`zx~Q}H1uJ>0kn{WdkLrkx7XE?Fc}5qD2neYfyMMhWu`PC
z?{@~}v(`oc&BP5B0E&Ms)<%16eA3zuMSZvLS1W~i!?!VzCaKREKOP~4aUC8r@JV>{
z89Z1q3@>q_@{RiQ=PC924QkVDXP8)C%&3>2Jt-9T_Ta?U88ZHsBVQj+I9}}#sz$=O
zST3RO<rUpA#da+R(v4*gMT=p`hc(v;p<68^grFZi{6N~BDIaXvj}Z46g|*Yl_&wKt
zMgR}S#HabQJYDaZjDbt>jW}XDU0@{I@j?2hS%ST*H1oF=Ui;?c{O0c@q!*R=HOo-j
zV7lXva{PTxV?#euJjzlCNeEkQyuu*TdIwPrgb)RySh9Sg7M*t#+bJ@x*F&%4uPVb`
z<bh?*H^2GkiGkZ1K?a{D;ne$63QH*Jw~k&$kV!VJ&VrW;zN$6nd;~}%#5{JU*qd%|
z>REV{Fdk33EcbkAc^9(@WoehOL%|sJ2AoOm%bz|^vJ~!BK72k-8=pS16Tkc4w_tLT
zgzRy-$T;p@1vx<FAKH$Zkv{9@D{dCV1E0s^07UJh?@v@&lAk1-nIL@G?l;B+{v#@}
zcz#(Q9U1w6sRbtLfYA6Pq;^S7L$mWEJ(1-xMfI#k7#_7yOo>tiQC&K9&V;}BwpzIb
z@&^)NqNSJN_8+L~%@i64p1ve-!lliz8!s~^5fk${vi+`;6Iw4oE;4u4_3>jsOrSo|
z-qr7%cs4mc-xE7|Ve3hR%&*&<%VJZU5E17EC2ugLWKvJ!x=3yE{?$xIM2AYtFvpG=
zYl{)_E8u*Y3@(k{ZN*2Ukgc@o`0@P-Sl3UI@;+EgeR6U>c+W;(jgAmnW2xYh!%8Y1
zaMN&AbtFnI<P_s~I_>G>#-#hpE8nywsLXj$**KJm>-T5Te{%|4%`$*)YDZD{$-J=o
z%bU>*MK<8Z53V@6@wea@1-8^iPZR9@l&W2kP*Wc&-~)zY$Maz%+ih_j(Py<hQ`lHc
z7;ts-8^JG?X-$S#GdgP6!Q;;g^j?V)z=B&GY;C_ubTV>^Q9N2_AQnr?5nqnrnZw44
zLBTo`L;aU2o!X;z_0#X%MgHI&a2in<=<87tD`6}lK=%^DncDnUTuegb2KRQ}>E&6J
z#EJ>@ByQd%{jJ$RNY`LDE&$Iu1SNfV7pM(1ahY)N@J73TCZd1Syw7UGhCRfF{s7$s
z1f=R51)5%lr4_ec`1|)y6tQvmoc<`HWZ63@v>+aA=BdWErXADHCbR1*Tk!^A#O@DS
zyH`xUsNF%JPwt*+B7>4Ch7VGRI8FGOqR2Sds+UyR0$Y0s?wWxvUXGXBJR4o4CKt8$
z1>Wahtbc#vIJFmX^|M)SI7~IKo(CTq1^LyU6zK0UzKXTN=%tBEBlX-9HH}Z8Uy<xx
z=4p{(^~Ql_+Dsg{c&!)Q$gw!etV8?2aKk7X(hwGyha(q+4Iuzx#8m;iF}`iKC6qXe
zOtY!i%P0snLOC2-N}(Q<{~|?}4#nHLQyDZSPi9+x7}wVwR}GH0=0P7~*(HwdDa;Qa
zU;o%Jw2iMfAm9AXxQDJJb&qK84O+Sd#RK}lXy@CT>*eC6n_<_m-&DWUOq1c!{1k}U
zdC6cDbDL)#oLX+ojmY06kc`MF%3nL>-rr}wM{8Nqzx<r?O6{AY%sQp*C#%2~srSR}
zk>}mI4nFhjW$NJRsi`)zTM*PAgZ}*WFL^gCSI#vApXZ}AiAu?Fj#2q3(heOshXqUy
zhA&!lxYF_%BkT;0j``Z#c#9_3M`K6Oy6;<ux0quV(5vWi;!X5e>~#CPEE+l9STLdz
z?L9_|!Ls#;i{ijf*|K18M1N0DMqnD=-AH}a%1_)8lmDzBzw}QJq@H#*x8-F#3Km2H
zRm-62?X?ds>;l|6M)DCCrVwh-rDf=iBS1`o85=SxvYPV0XmbQ99V>;BzJ3f$2^j=!
z`v1hsf8l(}p#iQ%k%%3Cl&e}3xb+??q#Ud<C#I&e7XneG3&eU}dmo~i8a@~EMLjv+
z;q^qtD+dLqhH_WEr>7<3qa|oKgIykmwJuggLMiOJET<l4Z4N4V2?Zs4=*U1}!h&yh
z2Z&j<%{7|;x?l9tH2x$ro-bkE0Iq?64mXQYE;>y5obGS~)~bYJMNvUv%RKQm;o5=f
zDj1o4Rq03}TdqC*I()M7fBDCn2V+nv<hQ*Vo4wm6x+UB<a#0nl4q&5SG+__MRGX`@
zym}y4Kg<MGvKhsqvs?7u$x%e=(o+@|L922>I2tEXr(5XGHqwsy5<#D$_4DJ#)m?-A
z`{8OwlT<;QD29mcFlhe~t=}G8qM9L-05{_Ieg?J8x&ks%&Ztn|IF>e9osr&xOHYEt
zV;`4&Xr?%$YSpt?)%aVWpA4X_KF72C-0oJXP6HXtAZixyJ`K?{&mpOzo;ya5t;2~s
zYA_FQCFr~4`)<Krw9NW=dESL4<9?B=Z&OG+F?j#sWN7IJ=Ch6dFIsBVlX>a_nEFDu
zg&b!Zb~bjXCEN(EdXsrGexQq6bz1EYv-8ekp+g-P(Y$Az*wQ4e`(U^<?GDau^YoY&
zzLu5=Ta(rL(I@NQw3bUJqK%))qnkj6KjzVaBKlU7?rXOUM(g%OWjv_M>*H<Ct7rR*
zFH-+VIAkk1T%K%yaa$j*!#hz_49}S5l9DFcQ$$N&WU?ew&>N4UmfRRuAP>Z$jdA3I
zI!;zSPHuyuS@0oL2c=GPu+Nb-`Vb-&Fd2i%m()scd9pR`^EQSUCYTjeFZ}*#!HdUr
z4I>YO4e2DMP8SbNz3x&HfjSz0x9roMv&-G4zg?01iT0{pD5<Z|m1Fuk`qfIoPGv(*
zM+(^XG%T~~wH9^lecrD!tqLFncr!>8p&_@55W!&D9BcHi|9<t;sPWvo&U(6n6(x;{
zqUsojtysS}o#n_IFeP8);AkGio^-W`upQp>yKex#hY`!1TUFpSHdc=5sX}l+8Qvk(
zOJ#wrU>81J2yli&JqR*;9AuC+LC2g6sI?TdN?n#8or6&LTZ(OioyKR0Y5A@wJ&jYJ
z=doPadr6U@5Z%!;GUjw#kYk#_$@8Zav5O&O45h4H$!~wr$Mjdq+z)%?i#qE!C69%6
ztcQVgZ_Y@q2a=3s6?d`>$n$CMz|MaU61^l*7ASap9O$hz5?DPQsA=hA0Dj#D_s_+N
z*iWc-$1xuZu4=u9^MVBRQlVMgWU}6~7%=uK0;bI<+thK>JLBal#FH;lMf}d3ya6Ls
zsY<Np;;_q{*Y1FfZ4}gj+JCeGSM;js68;x%e_5CNQgyE_353EK*lf$Ke-F=D_m!i)
zlKO?xYS@sKhR-HuOdro1Nom`41K+Z(NhQFF{`O4hDYM;JNtSZSg5U|fqx+{hsElXa
zr~_e7+5-p=ru%j)%Fs0_o~fEa;8V?(vlv7t8-LY53BU13>{CtRs>Q0>H+(9^4={o(
z{Tvl5JsZ@j3GAk^OV=xe++T-5ncH+8+Vv)J*HOVkw1XH>(Ld#F{R#1-2d7LDExqYj
zH&3fO=p0+fb)n9E^T==B2zl8A7S+R;ihH;igndngeb8LB1~g>3mTM*oS4)037Xx1H
ztFq90*raTqBgqBtKgfjAz#Z;u*6GQHkkF~<{H@eT72q)8*5*tm7qX4mOGD-)zYl?l
zi))o5J5Cozuc*~|Up74Flq)hQ@9;N=vMAAEqG6R@j}{qD&(e2M4PZl36$4&TcFrb2
zX4ODG3xsf?u9l<9%Y%NV{Ag`RF^S6{8_!f#FKDBBaCfY^C5hXx2i!o#w%n8GDqD@X
zEWKPoB833L5(_=amk%@NK>Q2UP67U^fE7D~QtZ=8cYG(eAh@tG=b1N$Ug5V*?U!f&
z{9DTDQ3IGz#I3BRLG`f&e|-QF-RAchD>Te#YDt!smKF&zm0#8sS&Ctgt}l*@IUdOw
z7iG_bHztfauur(62_vhtpVS+mjM|A|g^7lQhSu4yfPWbO_3`JrZ7I###edCSF350G
zliOta{JPuYO3-me3V7_OR21)Rk5|4)zIZhG{tyVd3;XvUC9q{}Iz_D}CMTvbpk^@6
zB{1*lr1M*ZN*(qI`p~Ev-D@IW`>cH|E+O$^)ix#1jQj;%WFAcJTe8FnFRU=f%q0r-
z{ObI$^4;>v@6XHuH&=C27^nt|D%B3txnL->^GKqmbZ|@Yi7c{eHSc11X`YxJoq?8i
z30$=B*EOsh58+Km`Q*!^<sTiw-UpV*-2vgnlvSB48Vao#@L%$vUOj9uzssX_Mi4eX
z(;p|PF#n$y0A^62HUpIf3nk=TpKZ~LN*9~tlc_K*R8t%9N*z)IR~>J=h8P7dJIB#N
z=wHk<cvt$6mT9ea#kO%P#(c+#_cP?@Bw*RE#!01&1BZ<Zm6I_oieXS1bZ#aR{Xy_C
z5yK($NjiddmN(6(-wq;ct<DdYnYp+$(6P5YG@0{_J3PUu0AI5#1S5y&Hg12Oiaf9P
zDC+wxt0lAM{l%O+A9rCKwI0(g-sx#sBEIQT=U4-1G9>b<Ezhn>nEr!(aP?*x$HHk!
zH38Y1GYfLz*9i*p*4|<k&8ThtS{tK91ySTc5E3ZkTf&gR4)?|1??X=x%)1KIB@2r7
zJ=tOhrAMD{etteElX5Mr==Skyf7%!K&C&eH=0|_9Fn6Te1zAxYnVq`D`ah`Q;Q8|q
zHPDYc1Y_V<)Tj6=-pH?5^&`f)Co>mAZb)Zy<g2pA`IFuv4`bjg@g5Z|{n(1S?pSU-
z`E6!P_1;o<yhL;m4L%mjkhVddUeSv<3HR45n|ch$<F0Cl7Gq)yyQKmRUnnjm%Wl(c
zBTricUN_O6!}Yy+(T__ZBB?>sdZPa!^LBL9yhf;e@E-rW84BEo+S<4zH^NnG#OAH}
z`o%wHC9D751HuH9Rxu-O%Qq^c9zsvs<kY5t;$y?+%~i9~%nYbRL6JLM{U27uoB!P<
z9H<zYSBV(4Z0uiOusMc=4_0su3uuYFu!2+to$u>E-{_&rKeV%gkj-&ma2GKW3P_;!
z%L`H|$Xp-k3Lj+WbWOpnx_Io<l<5AME)_lf9yhrME-Lz$MklER5IP$~YE{GO#SOS_
zate!#PRmYN&kg!Wne9QA5i+d{cf~B`D%C!ff`VkmK(Ln(A-2?XyCeJ;BOn&cm_L+H
z(4l=N+(TXDLulD`ytdp@c^LirZ$8$_Cn&TO_kifPxNPO@{#`n|t7taw^ZLT@K*%Ht
zxUOiV@|gu)=JM}!xZay=F>s!&vftUw%qcXkucG5D@&7SqbDx@WI_1CO3xS~K$&jIL
zn7}&qm?9P1${{{!AZe}(-n%gC(=x?YH1$zc4gaAc9fd3h5Fu1ay-Eu;rr6KIZ;~Wy
zsSp}E{FI9$IOGD*INux~47E7`L@*zgqui{tlsC~H55Pk>SaW<QEif!xxa{TWF4<F}
z^2QK=Tt+h27Jhx$lt{lE{J)oye#iuwYOW@@>9MVf)8Cn@ot6;;dtJE~a|xgy`Uh{K
z@6aE_EQ<xWUrvF@X(LRp@HsuVVMPKirRX;YD5``i5e*?By=u%QkO-*)800SXPDZ@?
zahHq>vZ05oHH$X|HKa;<{+JNs*KGB=zfZ{)8su3q^V9duy){rlF5FusF$g*qPUom%
z7#DZIPn}wBaXvJ4$zWC|UF`CCibpL`7`4Zj%}7~{E9NG>#0Ogqlp^h_y^n=_kajIt
zZ3dWxJ3w0a_b`l}1mhWm#c`}eJ~=B+A5^}|1X0o&OLdp)C}f>yig^G*1lz%!0?y_!
zzXN>ZaZi(>>n-Vn2f5^fTXK{wa>8#$pXTuB9VLXRInzk7fTQL~7-%F{uF2TN^RanJ
zJ{V)&1=3=QfaHY#mih?c0qxSov&7l$lRCn?PP17BD%PpLCXkTq#3uiBLo-dHb^xur
zaF3dz!%&ZAL6A!8uI!}8B05AkO{CFPw@&?7k$H+}F90olfE>ZUa_AMsWmKcxISra$
zeS$%C1~KaX3Dqe$iaR7fM;e$5zrbxU|Mi}ND#*%X)~`PhgA$48&UjI~eEYZysr`ns
zALhrOgI?>;*N|0|{B1g~L5a>B1~X8JguPk1v{|>BPB8}}Ar6Uw)aozNc;bwkMe{5=
zqw3T*KL@`z1}p~=graryPmT&cyJ1z~4@H%8!!HBdpbk4EqjZSqy`>g+Q36_fP@~3p
zm&oj1IHh+sNPsHjUJb5?Ov+>stU649S5MM9XaQJD3qc&RbVXS8CcQE}08DOi8F~b1
zOwB!#+3hK8`A{H&LR<(22kFY3W0Iub1JApfpoU3V)~)3WZ4j>6Lc1DE={EL+^qEYX
z7Qyc5DR~+8Gt4YemmX0^aoQ8m@H7WtiFGQ5Un&$TgZ5Qehve#2rcK!*`vWC;lD~1x
z>Kp{CRW}OZsP9B;;?m<?A*T(1furz$Kb%-Y4_Gk9aDhsL{uopm&BLs$thc@+Qz+z3
z45&mk_t5&ouyOKbuaDv-&oIh5tS>c_dD0{fmVSTMFTYQ($VpL^r`yjRxXJ?Js`_y=
zdlMh&1=s+y>Pz9@Xnt8@Dqr;VJr1>=&Umqj?5l~2?|KaFE$mGWmqbpOOmn9YgbP{#
zuR)no!RP)ASrcH?n{%+VH{TYtAM5TCs*AN^>Ezadz{9m*7P$)!540Fp+tDEiDn)@_
z(eR@}ZSCx=Vco2t5GDbRC&WUgcoBUcZIRp}a@X-m<?Cm-U#t2X^qPKo=a?_tu`Mxy
z!GWvgm?ma^KQE&H3M@{N3z)Y<PbZ*8Vd(-^JqdM4pm_1}hmp89lE?5l-jLv_rWETu
z@F4#m4D-uCS*lMfrxJ6L%OHWy$SW$;0ygc{sP*T$-0OnvW#&T!+lz|uA8o6_$ix-X
zj0=4(9hxZoZBE!}POeBS{5Ky@2oJ=AZ8KcLYtPg@A#4}#ldj%6+8wJPhXxS80XR+t
z4ZtHlsQrEjHrc4RP~1uLY-fLtS!cds^^e@gpY?nnrY6dfh1D~o$}-F)5a(%SkV59^
zYRM>qpk|z{V^}AyXFJU=A)Q`g%{k6AU+)M|f@lb$QEU+3eRsxKIg08#YOqQ)&9l!U
zL=ANO8k?g<!fHG#PJmk`jW%BRf$X8@LIM3N+C?9km+rNIHH{I1Gq-3rTMFRo`X>VX
z0L65JTS~u^;|`S8O(Xf$O!8Ft9FAjoL)#g=%L}KmXg>#Zq8qs+q@-Vc-5dha6rK2y
zXS4=Oj8@}$xco7YyR&qOg@$TSNqTGz_7&-Uho&O$fPcMAUDyT}W-9^dmI(tjuTLSg
z9o(4ST|OXF5Y|CQad4kpyvly^YwstaR}7Ag=U)>zo;{LvMI^xVBRc6&ZyDyORx``i
z`%(pk>Bwy&oQV>mzTL+Uv%Z@Cro;I7=1GH>^S$}0nWnBiJMddx!2?&vpgwF64Mw%U
zAQK-wFw=%B5Gk9&0=F9oOc-p@6QxWEs-j$;@6?)bA-NVLqJpPD$GjT_$EZ5^#Hi@K
zJ7c25x<>5{-F4qAb)M4G)0e#(VL9aig`nWs18w6L5t(Q%tVTe)!~{ALmkive97JMX
zcfU@mdlF`2mBV>jysHBl`qLVT`Ok7EFQ@;Qkxb5c2U=I3+EZ*vgQ8<j;1mT`>5NNE
z;TX%Nk?)xrVq|Th&G7Ukpy(ufIwdd6D`cmYn!|={{$k|7!NMTn)OJ3f_MH8j)8cW@
zuy&-n#IV|7xXenu8%YH$Cb(k#dAO4Vaz`}OtH1kXXPPsf<uTD2cTP(lxdj7+*DzxR
zWGWND+c1i|uKaOFxTupMK{CjI@Ic+9!sn$5#C|#1WLs#e2WZ}w+ZbR%_+_FrI4H=r
zzVY7Z6kx&WZm`6xU{?s=)14w`^Kewf?9jP6Q|`<lCGY8a_vC*P4PO)QU%$Em5d_=e
zT>V(;w*G`#sTi>3?;o%;I4uO_kRqy_Ea=o#ieLUrDPqKkG6EQfz!NP!{u<OM+lRcC
zbiw<K0A#xC&B^03RgnC&9!Teombv&=Um=Q1@4VX24L+~ARx>cQ8Quq1@Wz0}@Hc#d
zESH_pwED|A&s2e-O!bp;>&L&jme?1~1D^g+L(&S_e<AcLThB4$&*t003Ur}ori~aD
zTmssLR!l*T6rv7=f1%f}7zQrk;PJ_V2H*=Ac<8V6r*U3io_bPx(oe>epqAmke<aqO
zMel{4T1fl$%nUcTs%$8#8i7i8Bmcn$OjnSV_&H>&yj{l7$>=GwQLW1ty<cenLU}N|
zuJnCsUjz~SS`hvd@{D8<$RuzdZ#aWOv37{vE0y8<yhHi!JIql+5E5o$-|@%=lvcUd
zq!GHFJ5%3%$lp{0#Yv&m@gH3Z?QnO*<f7nRfou;6)D5MR!&LJ!3AlEjzDK2-#R=ys
zlOPs*i@ecXLhsiYDXtIEUAhg|Lem^S>g8=x1=)5=BtJYHS{=;p*66<RXQ;XLV7d1V
zSqb-X^}e@o4KERt3oX5_9&|v)oB_W-39AE0$P83_3818|&yG4`V%>q}OvC|aN!Pv|
zXnz)hn?pW)y{~`pAb%6yWO}&r+r1hD5+&-DdnT<9=msqZGv!-zXZPjPF2RWlcSP&o
ze_;1He8>x2;dsQiHzfZA!|-DXVCO#BR;ms$Y}AJ*`WX)(3H(1l$X0(l0d55D+{Qt(
zTXTpvUT0OH+)-@O^imWi?NcFSH>S;c{k*xQ@&ls@vK7k+)HQ?J=p^)nl#<{EzZUCU
z1qH4k%bYx)u+{qkc`%|3XSVbX{rM3%^^oFx0vY;^yp_BVP7=Q@9<N=#pyP!~@-b-3
zahX9;az^C-mvQkShy!Q<?~4l60+Heum5)~6fRy_;(~9c#>CW^4;DE5p>J)S$l)eA^
z_c8APPLOs(M;%HztaO~6nda;&?CMg*4OG5|Ul=@^DUbeYv@q3r1Wd*XeEkRf>zd|h
zkzoYBoIXIdY9`nJK>eGMEJkez&PtU$Z(t$9NxRh*I||L#iKZEOL8?|TPHE%-m$vC$
zBAcZTd|$3w_yHqNmx*6Kcx$%YCYq&D3GJoWHwIJ8DtC}ra{Bafkj+y#CYp!c>v*H9
z^VN(`Yre=D;6)ZD=6#TB*_-q@ULcW8N1?n^|C_daG@iF*^~bOsCo=HCP&Jy_qxmo>
zMC?-BwkMuNG!H#EG;1)NZ3TT&575`KgJfBUx2%IQD<$Pl6mEmY;~m6=)%}z=Y-t8u
zyZtu@pmG_hd-op<dUCzP9{{G3?M&E@!jU+(TA_I(oWNu#Pm6YavbvbXwIv1mOUIN_
zj#+^Vu!}{KSwSNmPMn>~BFG06qYa*IxvbtT{qIkrBehf=Pf|w2IrDj*m&gHf{Hw9E
zL$bENde^l;;GTf-YRDDf6Tbk8v&?B;LD;DoRTxBl9SfB<VLSR_&Bw@2MZz9slW3O5
zU6da$L6a6P30HSf<9S)LCeqhx=GGjD`r;L)FE&1YGCC$6v}a{O{+>8;e)#=)X*NwC
z-q_+>ONYA@pikT^)~&e`%S`wTQ{^KCGicy-$I)3^xD3j^>5!ITslhn(e-uhOJNO>I
zJde1`zR`iMc$gteKuIq29qr^jmQ*Bz)APv^vtSxqkgT5+zm!filn7HdTX9;Ey*tRN
zIB27#?NQ&IG%P!Ak<<oIF^}>zvy=5R!wg%pAc@idp?{gBuOYbj1~j_=r~?T{WZbRp
z012|=ks_{fBmC6E`M0^$SL`7}Os+}OTL%@U$R_(`BdLFUEGh*iO^p&ba*nBBL};w+
z55EIGfM4ZCm7ERSUIz^E>(3j*Up}0WVQHBPs(5%8c*+yt=Wo)bPzlg{Y?1hnf81AX
z77tZowp;VF|Al?Fn>l>1Be#lSqbrsX2y8nt`|TG?)u%|n=RqM1q$*wf4A=<87u62j
z->#k&KIb2=cFeHsOVJ5V#ix}il$U}@w!92co^3^`)A7n@iU|jAUxdm7z?>J{G$A?w
z>*cy&c^pmEx^A99MZOX;Du<Ud<R`v~7_+B&53+hERLlxDPOb9IKTYd?1Us{OQUdsM
zU4h$t1u$~P{Qj&UDV_d0*?&u+yq<|56M_)H`@7_Oyuqv(iZg_=jwHvuHs)G_KcP@z
znaAw?Kcc=mD9Z0|TVUy4P>@`@l$P#p5Ku%yq@}wXq`SKXL_k8M8|e~|E(z&wsrRhk
z-!tzFGyb!);O>3Sxjt7N(%}>nG9<KNWGO!thc%(_uzO&rVHy=Wjnsc*tg`U!Ljp7L
zaWoIm)5`_SA4k6F5$FC7{}3W<cA;wv_}m`L!l|coyYD+hk>Bh@q$PuE0Oe<~!i7y0
z9`tWHh_`=06HodIq=c=d*p|oOk`;%#6V#_cFyGkUkB1w||0g(hb0I_~z$~rkZ{fmB
zH8fbKk3ngj%eXIhS1fL}%1HJOmH(sl&r~$}Y&Hy6S+KQWBaCw32QaA(UxQ%DPv_J1
z{sQf%_<W&zkuFvr**IDQ2w2IK%kI%{Bx`cc|I-@b3Jg8~zMr^Y6h=0*F9MCmRYmU#
zTf`iwh({_#0#?hBc%dHc9Vfs!GigTgy2o+2p-qYpn<4=Ih|8_e1LR3;wyHN%7;Av@
zYwR~|Os+kxptzyF=65ki8_$HUBTG0At2aSZ(MEcgoh|G+0A^-d!0$1KsPPMOb89+3
ziz0b3-kk~u&};m4EgLv?k^r~)Q9p7V|D;&4BHowsS);fyFvVIL1A;%-jd3I#q^eq~
z`I&DMyF~CKgCe55Z2Qih0dGKNI^Y}s@)gLY_THV2idqQv3X+_;+4<n&;1p%5|6`Ww
zDG-X^VKaBY)zkC)*ym$6^UQh=H_H#-i2aqb+uf(nLml|xV;!^-!9R533Pb}oKtaqz
z#gk`m)bQSf8nV1bJqIh(A~JZfM`v`~;|^o%5wHwl6FpJU2EK$T3w^WE>|YLz>^6rB
z4H~(cQoqE7&c?3nnwFmb*Z|ubx^z2}>&l}Ti=a>k*<WmZ%!w$Y*}_ex7og0oibP_i
zEbz|)Pu}0&J2;O>gisuSKeDF=>%@m(ix0+1#&Qr78hHgBS|e-rWg7RZWzDvw{sYI&
zDSnCvsU86`N4Wt)%z4yr@UWw)`o5b-)u|a!b12PLo1A+_C;X=`L;d_Tc-~*4VM(p5
z0KMglY+wL>kGAI1Zz|ST)Mn9{<1MnT?tp??RH+A0TJ--z=|XD1O=vo{dB}mmuhLgL
z_1NSHZ-LpPwacDKuhD6zEC?B3y+ly)^9pQ*L*YUH?f$eY!jQ5Fr1fU5W7bj}LlvW}
z^`C3N;`18LNRA?oXf<z=R5Q@xF+wt3%C<_(uU7}z7Dn_+B+yXZcPBCE<;ElI8A*(j
z$$NMH8@<|{(fGVE-&4xAbN*?rOfjOs(hk5FDj8X5)^>FNy6b5n*?YifS%H)k0T2T;
z(of^S3P@Ps94v5g)Px0*3v+U+-(kgVLHj$JoOg>xj#RW$46@du!K=NZ{WOYT?zvg2
zRH>$iOD#RoS<6?<wn@B8ZjuC>`6o=@-*<}TG)?ZYgLx4=(hcww+y@CwFOzensmn?r
zHjuamr($pNv?6jEAfaUuSpvfC1eEe@8!s{A?SJg~7<9^13M~RwTwLCF4K=f>&?5~*
z6-l(ndPd|W02_pLSlTjs<^hfe*PaUHFAHvD=dAwz01!<#0Yb3@o`ST}8I>)&h(z!Q
z&4X%_hCDSdF#f*S<;GFfCQv2vZ-N5=E`&`!bW%3GzZpUgUM$#7-?c~8lJHRQxgq#G
zAI7Bu0s_7XgqItZygT`CN(g+^BWXT`Zw;oP^rSfyoKCffy@`@3f9B6}eSX2lSS3sT
z;iKR4Ym%(FzcEt(@3e8FLbxfb9u+qJqg!JdC2|9-IEBJ8ub3n2eisITUT~M_TmlGm
z^(op7CP{Wde|*L|?0=^m%)cAR1DhqR5#3GT&`qpFeD83vpq(@dLXUCef-Zfa69JYb
z==!?X{VZ1CcXyMD5EOjewP5Qu2dq#!u^0F*EhZ#tCjsvMqRhg~tYAWF^;XX2_rk$k
zivv1*cGVT`(XKWQ(=64LuX<Dbve@=F5D~udA$)N^9)T0g7KkGa<nbQfAhZ)80WqJd
z8ynzwrt{4_F4uvWq*wO8b1v9VgTf0CmTzmhwJLPqdgFb6wDmV`!E>SB{!h~%nTMQA
zAKqq1_-GpNs7KxW=%+vHE$|ckEYx(lHSX2;q>u#N%8AwOVdC;ekPt(`6X0S{N#m4G
z=dmuG#uzEI+mSfJCX9g7Ag0)zf^%R4Jf|xDrwaZvAzW9A_h|9u=f@)xCb9<^52wEh
z^vXrM0#z@7Sm4>owb*zEb;$~WGtUk{gg$`}0AO9#_VQfy-~?6K0a;ePKnDAcV*Y29
z-hX0$7&_m^PcQ;8fH^1celSP0O=ae#HHFGxiNZ{Up5XRe?U(4R%z3(FrlTXUS&1mL
ze@Ohn1Up6~3<h^xq-VzgTBN<>Y<ps`CyLbBz1HHF(vg%P0pFWfEck|bi$q9_g#QtX
zU@7^*4J2X`Uix)5S-^mx>;cRdW{+snomuT((}FTqh8M9%{x_7dgyKvKqvB0$lziSU
zaqvUME8S0nq1k2stvJdCklhu-pmdtaf&^NfAFxJ><@%)b!d2h7xMV|a!~GnedHflA
z>TLM&fT-N=cV|H9d*TQQqCnawa!&XZ6cuYKWk@$q{>@W-=x>%unpHFTe$tkC>9++d
ziPwrZ!<knK@3WUr*$w=nGb#fdbvG6$AHW9+9#Q(0MA=v^IkIRB!=r0)>f>hj(;dOT
zF8~RZ<XBPyK6}H<lwP=@g97oj&x&_nEY*0PBr21K?916&$GSLj_l0Vs-<=<A+9aBy
zE;Erm|G5C`WZMU7*Lq_V!I(UGIrdjY@O%SY*p;#XN`OT^vEbG}k`Qbc22kB==0S4%
zT3nUs?Y9!Zx+n!&;#oPav?E~m_y=kMMe!_P^+|r!-wPkPg>-O&`=BrM;UNYBW%4B}
znSvkDJFl1I&JOE+zcp|_U(xlnfc;}3(oZ?ruY--*Q5$SGrTF;x@eHaI<<KKwFDq5@
zj})&7+{oC^S%z~TVutwbeCXBauT+krhr&w)VoVv10k9(E`;o-<PM=;W6Xv?;PDCyP
z-9<d+qg^or7=SBtE{;a_n};Ky<<6B}+Oq=}qyt!|Uzl<7-wKtoQaQdr%=ihb87m1?
z|2L+<Ib?CbAxmc>o+Z5VI{tXJH>)w)_nKD90oP1TxU@qo23?Z$t<udn8=NWug8`l`
zB(rf*yT(*LOTgJ_`Fnn}@-x&~A)i|}<@Sijne#t%%<5_WfemHEDN3{^@fTTeh(%Ez
znBrZxTr(HF3dB!1ujojDA#9r?(xU9QB6j{<D#>){eHEEcNQ>v?lOdzL`5!Z({VwFN
zYX<OQEigrX1Gg3T0kU%gpz+tF0`dA1*&VoO@=w(CiUCn$<NINN`)hsB9t53M00Gzu
z4q9!OTi^a(+zGb&_1tLyWk_r!mxC$dAJq2C!LRh7Z#E)Be#iy}Cx?|4g#I+HV!>Pw
zFiybDfjMbJC`ym=aDq4DX;qVTUH0cb%`Te_rT!ktG>?MS+g1T+Nja@EBZ76e=ksS9
z&ZOh}V-m5+g|9Q6MP>%$2^!P|<3SV)6!InzLXccV8}Z$kY3(u~d#R}Mk3m}i(o;UW
z+}AIpH!^|cuYV*<@Ei^9+XMofJfQl$P1`*)%<JI@2$!I;8oT&Wu?ew=&;7O8a9QZ+
zi2DjqXyII|$M=zaudB0JXRuPFU@M74FJHdo1VmZ6Rio)JiMR<J1eXG6ci0sr6fwbm
z9d%0{idi$2I3yR6MrHZ`iFUDmIe2ygjI$aiShP}|`KOzsyN-CH-C$?iE(O+3B3ic2
zOLH$3W|aTv)@FiA96Y(oh;V}a`8pzq`x@6ems5L5W#F}9Z!|fb<y2W>|FO^GdN_2v
zqF*5s?Ce37y{a<mwWwvMB?x&IIEvTvrKB|6o*`YMmtfg@^&Y;{1o}-NP&De!bc02x
zRi$#Ok}(c^N-(gmjT6)uF)#BeUc`gtg$K6H$%TefrSnNy!a(I_%P*r{J}=;QoOG9g
zZZYE?M|yuTT7yj~x$yZ~ORe$+n~lJ8ahdohnr4757j>5McS|_Rl!rY+e={4Zk;7x1
z{)8P38#{^n!?>K9TCCV*Q1BHtZRyEJ4oxu#-m1h5EDiWg`@p79Of;afw;xyz6ckR2
zNye-zBjiowY3%=2gucR~lL3K@&J}+vak!v_A^3268Y3_dhdZ94z^)1Ra^5TRZ+;?5
zT%`7wqV=<f-scSrU+m9sfbOzbaNzV1>(&@_Abx&bo_-O1LW9o+#gztwgbv^(am2@g
zwmUw+P?8U}?w8m{{LVXxuRl=&S|-<!*qC}_!TSAX4_q98>5Q@C1~!YyRCNTRe(A&;
z%yXOr?i3Wfx%Lj=f)^vV1-z8Us~_TmDP1mB@TClXR$?GRy;EqQYMqCZxZp99x)eKo
zNFMfs%ic`hApTH*!YVkxe~xC~{QRf=!Dk3M#MedntB}l2xF#&86lP!pvD3*I2Y{0f
zn}j>JVm+DB5o`edg|r46WXxvm9gmYLe&R7k8LRdYwmI*<7C#B+UG~zDkdP=LP#M7N
zF-j1F5>#>`ExrLzf!@Ds8NdLP*~v0(jq~<5(SH_H{zs!WC;DmV1Fzs>r0>$01k02w
z$w%}uVN7&)eA=M@dsRCd`pmLG=`$mrGtjTmn7}wAL4U-wH&GnZq|S6}F#{i#V0dV6
zo`yL}`v-(j`n*vU1g@_DskNi)YoKqh7w7nJhLKR5|Ak4k;liBs*)^Y(0m)CFoiBpA
zi8y}+UpH_l44|T9xb~WxGNKb61|KFxq}sR1Vo=BXUebK(vLvT{*Xou2oJTsG5K2z|
z9EfA%&mx|`{bncF<iLI?NtCWf=kG?l;^g&kce(rt5Sfjxg2#2?5`4Sohs*CeJ3F21
zBK8@1SC1v^w7{E(NwlYF<G)G+#-@_q9}9NCw#K~1&fDF51nBA{5cdgp%#hlq#f2Nf
z&cWQy>f{2p|F@r!Is(n@$ovi20X>R{GzgvwWQQWaMU*lQ#Zm=Upn5-cRt*nev!^xa
zJ+fce3;wdEe>UvWzh$r2(ado!s$ISQ$Mwks@9OKh-dpSHT^pj)zxMAux^~S4yt8b2
z@5B}YAkCqEn_Pr?l0Wn{1L4((--^d%SNOv>HvnCw856c5A!J7Bu|*}H#QgXis_&#c
z`xu-I%d{(ry=c&&a<nApGS->bGw8Uu(-0;A)W!*%=N7zAhi1XF3YPLpqFw|MTk=2>
z3kwP<nz6~dwVo*Fp|D(uO&<Tg$W0|gf4TPSCfSo9z-ls~K*(tDO#s?@u~H9)zY~z3
z{9veHC3$B9TY4^J20gMy9Jz)uM`GWbS2kZBcm`ZkLZ20?=IHOgm1}QT7;g10pY?=>
zVj>7W2~cVEzPaE8>_Sx%YI!!A2=`(0O?073Qo3VNefvfu_)dHz+vhGhaCKWeY7?L9
zydHf%bfsyu6lzacia%#@K62iI9q<knZ!Ux+mxiPjxHopbeeAFWTRR;!wM2mkVAI(E
z>#HH_CJ^c||9s#coFLsvei|2WDj2TyHZkhfSMC8X*#?ZW?*j0ofyKYwBxi}V26S^E
zUVwgmoy++FIAqQWWA#YnpTv?Q&Hey9W>MNlJh?z?bF||-%TX@y5d!$+4OV?TV4qoV
zNcr@tjpen0p#|)CQsgqg;nZWV4qIjya)lm&<AbWiJlw!IqlF^c42>8(-=ARa5#>`H
zV8c^3MRpJ9IZi~?^f|*oOc~;Pa8On*pgfNnd%?J1L~s>qm^Y0{eTH!bj$a5P!Y0>a
z->*RL2*x3220P*_YT}&3<+gWUI>lnbf;s+@(sOxitA9G@%K7{s!l%V!KvXG4Hk05d
zl{3off+KTzHNc4f;0NYaM-%YK*n(%lyM*t`aF=Lf^P_0fmk)13-tdid^<(zu@lBoe
zu=I<>iFM*to=$)h%u?DEf;K0X4%Ddu_|e*)`jvWyIO_hzf4@xxP^`U~{u6Sc=s6Zw
zm{iBC&?rgP&WnwOo)Fb6Js_+f!3=sODjjLu@Qw*xqK(f%ZP9r=;QT&gXI8f(!9)Qm
z03k%!N<G5;p=Hn(Bus$qC`U^)8c!FoH&;8T7k0Etw`Lpl&^+|M!xjl`UlMzk9R-Js
z5lrVlhr;ULpygL>d?#YnWdwfrUlC??KXKuNF|h1|Z_5m1ghJpZiqRf{-uVu1;0gKU
zdbou6g8}tY#H#}w^`SHf#gYFQ5fFm?RXS9nj`3p|fWCDwhH-uvr}eKvBQcR8qjChO
z0O2d$O6Cwv17cz>{3?JKPbXueJV5JP09H+GM!%96@;@^)nh+SF{o9D{s^z$zvFbHy
zvb3V2qFN@=G9p>WB4Pcb-C*;?=>zx$gl9ZIa$Ta?L?j>i`<PMFyqIAV$(9p0-OCwR
zXdC&{xcuV_68cZs+vJg)h~$==3sSn4Q!HIyBkgG220B{jO6Fr>U(c7pYuA`W71zp!
z%N_Kd7Ip)<maZhKimXp1I~p7}zb$7QVH!Ea=E5M<3^Bz8_Pn$!EfC$49us3pwu1b8
z<BkC2aX`Dx*4q~Z6{5%KHaPYJD^BfP7dVg3j8U+NVIZN9Ql?$AV^$n3`M<+M4km->
zg7uN@Jte^WjTNY<FExFK<7h(YCH#lc8slSQ@pgiYX!}2crQHg6)e9;0642@-b{C2#
zhP_Os*%F)}L{i<i4Cr2gly0-pYuaSEzHx<$VEGWN*X$W{Fy8jgx2_BBqgZVHSTc3H
z5{SDa?})QQIh_p`uU4vcI<CpF`&;0C<hyyUjv)}zr2{99$Y!WQ2pjFnJD^9P80EoF
zMwv+BJo_hOKjvW)TWf+&Te%&aF5VCM?Z9dXw#9maN=JFx(f}27>_b2mOu#w;PWysG
z!C|q)C<y5Iu>ct<p@Ba@;Of3(uj$}o4`}C82ZS&4{i@HhBPRSggRO7}t-KF1=m1XC
zmo!VigN#tGOVr@8lNUJiA?di86issfNhEyehv3GJFo8fZgwPJF``c?1@GBe5`1Zl0
ztNieNeqoiW;VFF52i{=81AhC}Ao%={d-V+kzxcfy$WsZ}1Uw6>K_i!GK5?klpp7+v
zWUj%CF}kkMPY|)6ZgWfz0Cjaftq{E5I2e5!faKy#ZWUu1Rrwc~Z1H3fr)F=4jwMe_
z=ZTDWk5A)S`Q%u2Tia~D2|`E&)^>*ql#r&?3(?}S^77(e=(sQ$9&A8=L=2KkAI6rY
zNjkfZcs|J7sD>Zn$)yeP@sJ6AQyehHB$&qfGnakau<?%R6<>@bQ_PW2(4JnrDykQ(
zt2OhvH0FA84SnipeNei=Kw|X)P&O_@!%n1XZ^-8Lnhtfe4Zj+l^-GSoSengJ*sDmW
z)A9CpJXW9=r#H77ZAIJWx-x3G9FaKoxz*X`s-yDnhOJD#Uv-nS;5O>PatDcw^P|2w
zbW{}0D`k*o*kL=u3SQjI3!!ijWVI{HCf14osyy`Q71(Fpkiz1|;C#BO&~XronNc?4
zb))N{{+$hAZ{c#-?(&il#U#%E2qb^MB<m9H3jllu00~j{orAW#FOeysX?%vQ?Uq`O
zJw%)KzF6hziGd>loU53U3CcC3t$xa78kzV^TYaiRZ};LeTyTjb<yA4@I++^4*N;wH
zgb&w%*k~d1`uO&{6%z=yHPZW`4Ze)R3*#=oJv-4bx&)}oMxuQrO094k3}?x}@6>P?
zR=zycOX*wYVmlPF_m_9}dE38%-jB+lSBhA&BRR~J1>dwURy+_r<(W2hs+LCv)_Kz-
z2~Q3jN|9%v4msQlwC)^)kOUy(KV7c3H}akV9G)T@8ulQ<sm?}NyqFlY5|@Inm&Vbm
z&F5|bLzPrhuT|Im+GB3o0#>z)O8YFE8~utO;pRrBHbTVvuX!>%$o-v?SAU_dzXBi6
zq$|k!m=m9$k_Hyb!ezGs=^+{r*8A)zr}XDHU&!?;@ZTrmRI?_tz02-5L%h=e{TUU|
z);|efr2}D5@B?sQ2l)Lo2L7R)Hz)-d)uB{KFE}e-e^&pYiHoW3?(fZR$9{B>6~t$>
zph%pMBSJ!T9<dqQa6_=lNZoMA%wXFx_nJgRTh+m2n2|?~?R~V%u4nC?fRB0IB;z}=
z<U_gV4UR=gG`*v8YNg!q&xfDRR*5Q1SuL_$25q`9u78E#`OI9ua{sc-z~N#zekrOr
zG53mW{zv`WOrp76V&~OdZa2o_+j{0dde5|LUNSE^nl)33{wc6$LU+Rj)@Y&@iP-xf
zbb_<%@KLw>PP7n=-#Xu|I;fqmWG;*>Q)|{d@8aRe7W^o*Gm(N0<-%9GU7ellV|kMC
z&vkg}4v<vx;go&FY%nq4Y~|XQ(fBs<u}gb01zl~XZ}GzhRDnu{Fb%-ZuZg--eqW=G
zQ!0NkIs<P^TnZsZ5MP>FZc=Wyw%&ZR^hJveJK269O3b9^6i%eQLmW$g*KGGPVGvfO
zmBOlLJX!Mc04A}k6AD>R)qp#(A^3*gTIUiEbX{CD2oH1yy*zG*KMO*ffL8~2psD04
ztOHR)a49R06~#I#4%?*MOyU0*J4?vk0`&glSos6cD-jn3p|3hd(a_bk%HPrfv)MVb
z_KsEopC>+hhb=H)q2R9O!6QGHeowRm)jnX3<i4Sd)^!SRtIf#Pf$#n(2z~s0f>Pfu
zcYf)>5BL(X&<>F$eC}@!zZ9I^7Qb6(4EzABz*SFwRSNj^RrCf7r(i@s0e8lIMxyAE
zm#cUbh!%iqIbHD_==l?)Zz!YI3g6KD2?sA0k$bd8+b3u|FZ+Fad!iV#NAjrzS4jdI
zb4~s$AR7CCNjWKOs%jQhHAN46WTA8jeaMmiFdFvP5~i;pxJ627>KKoi3p)bYV}U<Y
zBM?NCJf_OD-y)-T1iFxY+@F<$>7%FKaO&v`WvI)$z47^FE77}siy9*9HRA2gzqG&H
zC{$<ZU6#UYtIuRWI3umR(LwzYbFek)%X;ni=X9>WLrkvImEUgQc6cl;t5NYa(Doiq
zHLo3J)aI^eHYyx99mJCHJ1UImHq>I!JjsU|bbdF6rkB_AOQA49DT=14Y+G;DZ!7XW
zW(X6>(Iav^FW(|w%tjpZWPc)#a0S};>k3__^POJ_fQyg^LhZTW7JuG684$(^c}{jC
z*xK+Q=kv$H7aji@JM4aRVB+MJ6aiPbV=ekVfX=;<Joe+uMHpOUWMw0Pj!&0_!N+>9
z)E@oRJ~~G9z8*#@v`!g60LBglXNj?g6+zl(vR!YIjFhB1h@eOAh*NcVYgC#hGBAz+
zqZJ)<>rFXAkT>~0{-jq%#CO&mzA|`W2H$oqSVFvpK&E$~4ajPx-b3KA@dlJ*0IU;k
zbUT7gnZdVEVZ_wwnJR22X*3F{$EFb6PG3BaD-a6cbQ`;5eeS6Q6n6+@#Ws}VCBQc(
z$E!c!(d2WQ0CFykBBi+kfQCQY@)&=ui_C$}ky8I;MfO{zhMVf(rmh;ZQDAlunzV9(
zCH|B-F9(^TZRGa9|7LtVGzjcacjUN#1DN1b08rXBXp@VhPS<-9&7&5(N-i$N6yG$3
z3*ixxg`z<aukMT<kvx6M1eBrguc>R(0&^jL;_E<rO9)G#FI_|HdG#izBhcT@^@t2C
zdf1^=r792uOu*j^wP%+A<|<KV4DnbsJG)AOaVk>LsX83zLZFEPcyl!WeU082Ns|5*
zu>yEH^Bd_Pc+_Hevz>Tvu0T$`59AF#0p$itLQ*>awg9vD<-N15+wg3vTPo&ebn1bW
z;(ApV$xygO>WFViXxQitD_d{VoleT3V|mPZEP`zcdeCC?HRWuz^Oqpg0cN^`R@wEd
zLkHjOCgby9auO-?oCN)@j-PRun@3dYDj68~eJddf_?s%(4b460NTIBH4#+Yx84woK
zD3NQw--OlyF=J4XgROX7K1!2lCkYku8`ZB}ZJw8k>uD1eYow^YJWw=aM4s5O0Se+N
zU~GK`2A!k=*%*sX+{m9a)YRWjV5Mfli&r1qL3@GmmpGHxIq&Omjg!Hw1@mvGH`wIK
zJ^Hy4QwW}s9YS1EJS)kPKW`hIK9nC|kXI#TWDY_uyt`@`{KcpYoSS340TGo5Of-tB
z<o)>$>9kySk+PlPfUJ0XE^!4t!S|qqI~SJWo9i(taL%MZd)KO)zydqw0ne@xA23cT
zn+EzBHnkpRb9nv>r&ck5*HS$!d0*;@pL6u}=1WJEKF2bmndt^>trLIf*akc04UL^L
zoXDYH$sF}M|D`qF>g`$k5$-n&MEflo`pA%WS;lcEIll2wNaP;~WI>3`V|SIpqY5X;
zeLsRO3{B4aRj#9Dw6NFM$d3N*mfCMjW#%^|a3Ij`N=o`UpX2+La91qzm)>Kh0lmoo
zJU0Gf)GJQWvbkf^?|jQq42i|n8h(kCz<A$_xl~ZfWx7?+uGm8Mj43(-;VcZWuE~*0
z8$1%nqe^@Pf_r0FlWANgMO59(HjlD#0fk<MR!=UY#E!tpz^e0IsZKHgd5CJFSoLc(
z&8t$)IAFn(?v;Pj@!25imw!Eww?Lx1Jrx~8s1He#+IpfW>h)&3&}R^2BhidBKqi*O
zFY)VsWk>J7_WXOT5$j%H6kOO`(w|;3x@aBDX!Ap9T5_Jw+Bt*t7N_1XzQ?*p#tfDp
z+0(AI$k{(cCrGRZSdzBcoI`K&TbHN9mFBm5*5;iwGyK$LoyIcpc)C5Dex2Od9sk2;
zP*!b>g%5vo#N*Q*Dr~ZIj;)mjE0&n=Mfs!MwM|!|R%!0#9b;OR+h54I@-qbm1<3(!
z<b@@}o{*isfWvy|Krx`pOA@+3N#S{eko6q*FY7mpMOyuA%dNC<hom1ae&s2F)6-v$
zv2Vsr6J%HQj1xj8I>EkJ@||jCj*54`emq1aNskUba_G<-oQuV#f#7A`PGEQnW5tEz
zmM4tmJ+CaH<7?_>lc9xJNOQ2?`SXPq&pOSo`ir-J>UPMWkJB(8V@$jMskdKS2OZ@T
z_V~s~-k2?aPO50Y-Wev<zB6H051gq3n>oG}E*vxcFg6aEfV*aphQ^{+DzxkbHxhe6
z{VK>#VOP!E7L#(m6KEt-5_(s-t;ap2<DWGc^m;$*gpZ0`t+uv5zrVkxMz}}=W(ZS=
zl>w|rfk*yvJU<OTe=<1YIiH}%Rk0ddsq^IE!oCr>Xi|8Ai{g#JK!ZV|O#s5@3c{Lm
zoqkWEaBB;j7u~G>d+HsU?M-Ch8rd&CEMz8n6hLt|F^A$g5bjFG4S-{31rYl6sE?f*
zowligkHsDpxAP@LJP3?E34lOS0Ed=yrj%r;t-j?2kcU<-&<%uw9$<opU<AAd&Isq?
zK8&D85=yI%n<LiM<F8+RWS)}shY8Rwi+CRRL*kR$lS%_qZ<HQP8+Q^w?Q*WaR-aIe
z)t3^5aDHfyGJ7FFMO|5i7^n2NMl}8q2D>Z?RJSK4qj8e=i!F)-pRE__<+HN!3<xIL
zd?N!qdZV)(V5_m~yulCL9pZD&d#Iyz))~BVRjWUY*T9{TBcqCo%XC-QKQ11n@as0a
ziTmg~>f;>V%1)Ip=X$Jw&Vasj=Zv9jmA(ecv!~Mt#Pe%C^B&U|YjbqRF6;-PKrwt2
zyzn|F%w8Zf>F@b21Hd!{kc+k1Oi^E-^7Sy+$Z2@Y(D`Zsu+lb|4Z+s4|L9mXGy^5G
zO%Rnn2^)~w3iyo{>`J?2z0}-bFcJt!m`W2-yE+p3hcFXBMTGHt&>UerqU!jqG#bQk
z1<6{}!j1r*A6MpREmWCFpcYL4asSFSay~l|P)AC_ZWU<YK%6xP*mg+2`P*;ic?^cu
zdrRK0_sHQ}7A+P+WK<a|_WjJV*J;%2ir!oNj=<l)D{^-MIXpuyWj?K%N@4#MJg>*%
z?a{Udo57=s;Ple`8qHkrCOCi=UVj1Tno_LF#!pv#-`Nh4E(C`V)(&%yIXEvcba6*m
zyst+LmgQI8BJ!}~$(KH1(=THwR7_FX%#l-jVKP7nuw9H!5B(=BJNFP>PaKh|Zj~ck
za)H8N9H}1#C$Pw#KD>XVd72(^<j*~%F$R_BEL!-Ygix<=Tfk_>MnxaW5)dJ{RH1l1
zaX^((JU0Aca+*90eey&G$pKLh6PT8v@qXl&0GF#Q0oC~nGcL6w9{mIG-lo9m28ITg
zyP!RSOJz8sSyBP8le@1QB={O?lxY0WjHr!K1^`_got1q1U5Z&m?d5dsy!*{{l`nX;
z7C|KjKe5=w;qq4m^pcS{5WZ2asI*-c@&5^VJjbG0lKU7Ha2!61=<5)l8}4k~;lvzh
zs^2b$^RPGwMX-2AA%QDzTQ)kXFZ*V<7#)4}NheEV_%*CAuc`{Ft#_Yjx2_YV)wz8P
z8<A(A>WFjrvxi()wKH}+;gR{(^cJQ%Swc<4l#p@QT&R$p9V(X|tHgN|a=39zcdElZ
zI3}8a*?#NW55WyzA5MNbO2v^g@w$SKP2G@U*?nQ=-uk4-LOm#T>hhwschZdYR28wF
z=y-I8l>#u<%2)oSfp8F%?F1<0Ut#DS9B8Q>Z6LvF{?UH-s(bUh?-HdD3-}&bAnZ@7
zMh^i4r_kiGzaSp?ngQPRHPG&lggk;dHRWT1dm8~4)DaW>h6!V6AEQxQ09Ptt>tyd@
za)|<bN<gm$y`q<cc)UJ$@esC>g^(rm2pcg~c9j?Bj?JeH$ZgBqdm;@E8{;b}z%d{W
z0%o5Wf|hwUqg(B*XBENU5JdBc-@I1<pydff<k$qcgO7!JjC+Wb``|1u3G{09y5?(B
zsvqnSPH49#sPs4o7AXr(<UKr(ys<I0@^EBI!>w?uV}$6B6|j&GJOa$>`J>s6y9*Uw
zq)lzQC)^G6&v9^6nEE3lYw6$ZIvSk2SIyH*gTTwtYs9PPYrOA1tJ7Tr?Dq+9qya19
zv?T#P_i*!gWhMJRx`S}fjiqX|*9>r>kOvSsJOL(&L0~0ZM8U&S!x!QMN$AhO5=qKV
zX%Xh_dF%#%4i(x(3XhIDj42Ri+<IvrCA}yk^9C0aYohz@ExJ(uF5d(<bpwM5mEST?
zkMPxEz5-75X$tVvVp9W&e9~&-%@p7W7em_)S@y1o;49rAGsxF2zXsi+jN@sT1vL%L
z1}G9dG5CS{>%&w3V5j;uZ%M>f*>?VW?eA7;Lg3a952)IlxO)gpLeo-q<;V{KNz*@t
zqkx6DzoGmvi{EoE2ErLs#ETF_om47J8}o{pXjdar$Xg-#o>PaSbWv@jaER)|daP7B
zOoF%^N180z>$9|JbOz0hr&IEgkoF=D(g@PZrQKaHOve(j>HckM+sg8J`b2E7bD0W_
z^PJk}mtQW<c_uby*rrtbOmA#^@v?iXBP-5m-ruab-=>Ppi>wL$N_$tVIC74cnBLB4
zw8NYd*ZvA(*EV;<2}b$x21m0OowYWLZwcsr^S4^h^VHeY0MR&I=rfq8-o7Gh>)pM3
z{Z#-@6nr=U4?z9AzO6-pjITW4oPRMPgstQ0M!7<8aY(r3ti>lyu2!T?Q@}P1P4vU2
zmNEp#?u}AHDsauslS`rLam1%|A(R23+yWF3mF+2yjo5F3udxms^7e3p=`UohvNw5c
zABITrA%U)>LR;#}dQVjs#}OLv;a|=bK0>5D`>2$p9ez9u{FXyz(U(6T8`03dH3vKk
zn65O~gI9$nVgRZOU&d=cB=$H5L(c%9V~hI<j&6hj;`xidCIxo{gMx`awliy`^HuA%
zHEnS_*x9`PVle}=C5%dl!c)!1y^2I^@@jU>{T5av4a(!`hDDW_R!^lP2$P+tdWbF4
zg{Pt}yKRxO{JdFvyZsx(QcGy>IR$+r5Z`S@_e4IWf#;HUHxC<kS??kxR7+4S_mjgG
zHFB_E-vT&6o(*7u{8uPcO7E{Kku)?ZoKSF2LgHrXp2WbXpnb?*AO>eG80OOBNL5~3
zpKeZDi361|4i4=f1AnE;FZqC^wk02%JxX*4Cqi)n-0|=U5Cqc@T<Qd5X59Q^SMokr
z%ux_2U6Fy5b)i97V5w-1!@#gr@{;!J=QBu`-1hjV7w*b#ZhT3fc?0?n<=O|)bnE@f
zCi*vkZ(s*+3S?UL^U8Tbu?)sIeqV}$`XE<3Dy$s#O7qI7lq`ZKf*FW`n?ywL&jId*
zdEO?~WAF5D+l7CPRQspbMB<Czw$i&t<yj0Sms?yly78z7U~W8~ZB>a*Yj@{B2&&+8
z)`~PdBCnsd7pnV-BcQ)`yJ6a>L&g$)!Pol|`bYJQ{Gq-5;vwKYrAbAXI}KYvfO<M}
z7?q6-5nKAokTDahYmf6Vw8(6F*;2{7XKpj{H{Zb499ud@5`9tt<df3pG&K#r5$xUf
z_o0rpn-L~fw6QagJz?|1UQo9+08Ybaa7*z}))mF*9<WGZR_C;V`>Csq`=QvW9rfgG
zNIMeHo6>)q47&28YHaC`ap<eSfH{#%#7ASGA9#sP$^-Yl*}dX%-xB_(82dpg=nb4Z
z<z6FXse$IK#U!*k+hta87EJCP!?R~XpvU-tfBcu{Zw4@h*}@Dqy+Oh(8Qf!_>^nGi
zLp_7+C`m})UXT8`*6EpvfU<W8uP*-uJPeb8CdT?U>jan#so|kP0O%xv{L76-dOEx@
zn4$=j<8^SauE{y4ZKK;BCOR>qOC%C8a4x0%ERbzVQ0|Z=wgz6aQdzS{m8+r08&;D~
zk+|Nr@*4GCS;b6QKeK*Y7oQ%ZnWQORA%V|Z*VJQ%ThI26#;)cX!{?M&r+0c}mgvT^
zS9R=H7tsfhGq-5#_HqJC+Cu@nE5R2t1&r%mM}(mI1}fO`J-AtL0HCy0pIj<WYAl%A
zI@Ku=2zC(L>0c314r5^6P*C2Sje56Nt^6J8V554vw3qH_YIHej*<KTFi+GX!<L)CW
zw3?CH5-*a{jqkVrM~tr}>L~6RzyvQa(|swua<7&3CiVZi0OVj4Aft(bc56LdkrkZ)
ziXMu!p8<~g%WM$5k7kX@k}s^6^=hNS<^n5vP+q6Oa(S)#`81eU<h&54-b2KtWAjQ@
z8!e|<#hp!!i+?NwZ^9UdW`%A8pNhh*VmG+_DidwSOdtRi4C{p;W&*EC>ae{Xqtb96
z)+APj=Qd~a^YO8=`%*nj1O;Y#(D}4fh!M3`FDqt!s|SDG=L$we`EPfAJf%<NkvsUJ
zseD;`e&&uYpQbyK8FG*5Z(QLiva@h)8U5*gyNFHj`#sGAIsf~BjiJWIv07%tZHb!o
z*!<tfLx{aZ(Zav$KH4AmugR|G4C~M}Y)91SNwDjLYnrk;rWE4fIPALbyKLr<_Wi{s
z-RP9wTF=x8*LIP|Shi0wR-jy6I@oz(bC__U%yL4P&^N(gvcGJ(?rLPLSLahe#z#z5
zJSwG-?zA1{^Qkhi?a=4*n`58;9KjHZ$y)2xK?1=Cq*Jb96=K<j=cS6vl|F%c9AWr4
z<Ra8R%|<(PR3s$1<iGFnL;633r*(V(h@_Eg72;pKeC$+M^_kV(GqK?X`a-H-EkQ>m
z3hE(Xz%0f@GezUBx=@DNZ6L*Jw>tH9d8TLGhwb<DHeQ52ig1+KD*kAVrcWC3P3Zn=
z&0@{pQOHV&l-DNFEXO)O=@-Xx-tB3W<$ylWS!u};z7TvD4}uec@HlWj(^d@3mIc)R
z{9T38DX>@Rj_WZ~q(Lea+oN4$jlTdZ7$>NmsI#St@1b&oM=we6BJBxDtm~$K^s~WH
zSmvX38e_WqJVdHeY{MmV_wZ|aCp*Bgy}WS;R%5zP@+xK<c76qG+X-Uv1Y+ZTg#8-k
z0WF~Yr9_#mzsRbi2yU7lNPhmMO`ATw@qR<WhaX+bp6fx-VM~<DPRZvk$>?tn7VrBm
z>D8aPxiA`rsNo4(@~qQEqQ8f;Jhlp7F9j9vGqo8-jaG@a2HD?nj2g}ynE7yM-!C*P
zju$H%IpGr}DPb5Dh<dE2PI?xlB{IG4UeM`jwK;oYC9l~2AtdN4j~5O{FtfQKSFUXU
zIf3*Uuz{w~+CSCuG@*U|C4+)IP)+c?Y!61_L@h2SsZgkTBk&bWc=J!UZI5`HBYWy6
zOM5w!-zb-O_i9ll*od;q7H9DHyzx0+R-JC~t+71VF}bD8@;tLetpB=qNU0sLqNGu0
zqc_|bY#|t1<0h9kJ_6|TuQG8#P1AQ7;J$4LH2slJ2D>ix(Pf%hw!P}@Z^i&xOuL}o
zEA)hy%zK8eFUp#mX1VxWJe#VYWCrV<3Tm=6RA>4E1m{MHz^FjQ^&9I1yyX|f$I;Z_
z7<}D@#>~@pHm(TwV60hDDqQb)r^E_VBhamQ6|K2ObZY>B^OF{nm?3X~k<99+=}>B(
zBel@OekxOIFQNymHMYGR&+mjG`|ZgfN(FE`$bYCA6}==+{<a;cY^VM0I!L^9*Fc<p
z>te?=`5otS#zV0x1v7aQZqwi0!JIi)QhLgkhxmg(Cp%i@X1*z&b=L6?8!Y<gi%GbT
z*V})8j2Eck0A33LCl~C(jma=HCU4tWmM<Q+wSRMj(V=2)KaL#alb@wNr@T0%SsvC~
zwLh~IjlTA3<n}FUg=AdM%$ge+NOd*PO4NWmI?x+4Z@QG8iddE0R@!N2M&FvI*r?a3
zSU0qJJw@jXRzbn<L8sJGfg!qy%pVJ!QOQLHD`lh613zjRO2@%c%Y4=?68a=Oq5M>I
zdni$i=p%?ZL*<+hiK1%c9JurYk!Bw5FGYp#!I`nhlMQyyzFtb)I8X&qVuTJYg~x^g
z0t0Ipn|cT+;&7txWK0tG^AaOyMoCb;vy88tF?K9jc)zL3yTsB4e{T?w(vLQxlD`0`
zc(OGxsOdFoq*w}=`J0*~7r&AsKL7y}=1+_+rXtar-%)%7igsebGuo6e)$R)J;KVrw
zng1u=m_~(tA8BLjA?&i^N3c>oDg=x<z?*Py5eXE6e+R&gfO&)bPt>udy{k?Rt<JP(
zeOFeTrz3WWv>pG%>CSQvuE!x6pN#tUeMf#LmnSsK*A~elC;ILo-1|1aEcG($>?yBs
z4_E79oIvA3i%+Db{d+^G-y&3AEpGC#AVy^Tkpu*%2snUDIC?bTl`K!f<gNJk5)gvW
zY{a>RP_o@(XIDCaZE6tw{ab$#QV}c-yObg`1~w=YlyGGCQbN0WxgWKQWUhML!V>mr
zl+*E?y?zX*jZ0DKm=X(B=4VAPUIh#`Y)w=<ZF7c+xH<=0^RZ?L`-&?hmBSjUO(*-~
zH;AV#p%Z^Et{4NGmyOv~U6d~n39gv>>54zQ#bczQN1pL6p3l0}-0+Lc{(V*m+2X4Y
z5Weq7wPN_&2ZiushPZ2P_5lg~o5e2$PlLl@$QF((h~(N~Lae|E*-f*n^=Bvz8AXX$
z0uL*a0~+AB4I}cbe?5{V<RW!(Aj;SuRq$2B+^7w+H@%-$SuPZK+Nbz-3sYbOvBo*m
z+|LBrk3l#>9Wixst?q4+($nFQ3*c-}03`^uhFpIN(0BqO;aAwc8hLyD`%`h3O`KRe
zzMY8Wzp4z-W5Ox6Ar8TP+XBs$F?c5a<2m=HOQRofJ8VE!OL4}B3S^3%=uZl7Ka4y#
z$u4scFf2wN=Nh2XxIXlnw5j1vGe(p5ydL^0EHQ_bcGfih=^)vtS9NC@C}9KdEbk{*
zS_VlQ5g+zYV=f8l*XZZS=?>#C%~S@Y3o_*5IBTVBmKZ;L2_iK^nzmn*ZM&6qFuJ;Z
zXCL<iA9*8MN!(#%YcoF0<U{<sSm%to3=Y>@!QT0mj)={XzLJi+^-n6o-wvfCg*ceV
z>6keO&em=>Fu)BNnapn_hJ;qOqNB!3<&kEqJ%gMq&g+ebh)uuiBrraOl|K{oacgT{
zuFCQfS~7Wq!9vXXIY1-Tpr^*+V1fV6wIkBiZdd~)<5@`&wK0fKB|bzCXPAf`+WbBI
zROcaA$NE+A``9-b75#FCSHxaa{<JW^V}YKPs}Kbct;S6OnqK|Bw4HvZEk63Vflk0d
zAqb1_Od9*r$d6f50GBL~;xqgP*t!190+tOXM}qA_25E)82i2vYAoA{cEZ_gG&5JO)
z{u6c)B-&B%4Y96)3(<01h4xDyh(HlCYsxuyRki?Y!Yh#alM+_<TOblr2FcfzWl*Y8
zazNA(_+1Pken1G6ig-|e+gRv4?_Rih!qb$bEOghk*DPA({a$bM+~_SEUb6p0)Z97W
zVkp~%tmruDOYF!)yTdmPv!GXiAGqt`trIq+q+XaW-!p&|HoRe#nXt*n0B==0-tQ8x
z9bBAq3Z}f$Q8te!6cnr_Bas7n%IVxc{T@Fn_8}v*Deuq?E4Jx4>WrV8`PD956uhxH
zRLfWI`!zFK;EU0dXM#=!U+-CL_6l~VSrd6|&l9(eQ04zlh9Vt}5~rqK+090w*YB^H
z)?%gA><)Z7U}9oW&EhE9R*YwIl+kYai<{8S^CQZ&+cqJ{PdR|($rE~DMx2895wnOt
z>H2yD`mT~Z6&7h8zMQp5CH0CBh?z%`e9`(k1)X6>q~Q_@(6N%v0t4~(kMm8`bZ^FI
zdhB{TB5MN6^DUt0q3IoPHCjf>eTtIYYf;a?(t{di>KvIn^80tU)eP@n@Y~n*N(!fC
zMhQ^8Di!uxlw|ws=oo;4M={qV-HDOXIC5MwI1-pqD0ZPFB5GHkoxeH|)>P4(G<wU@
ziZ&A_auE{dBPA6ilF8l?BJud~5c_e+@zW0Z*jnB;{o`MP2O<CF$0N^f1A?@G6~cgI
zfWlwAF>F2qfu|BKp;D7sj$ct1y@$FGH9B_fYQpOM!zA@ahheu4^}XzB_3e&u^{L2~
zfg~oD9}$ZmN?q#_6JQ!lT5HH$t`dmo5|7$c`{v>E7!VW~fsb3g7=K7M&iXGXn3)<a
zkqI^3v_T(#dXNa*xKoh58B~<GmjyEYEMJ@RdlZS40gd!Y9Oa4}guZn)MbR$m96`f{
z3}UO)BM%|&g|4a(OiF&lb0<GA&xN0L^QC8WYqLug4kt>x9L%$9>~N=K&em*Q{(0%9
zEGb4l2aNqDfciESVo@)tWI?;^+_+!4A+>O1C7r~{SYA(SX`=gkD=nYGpF+k<Y7!<A
zGhEwn`Tl`@UYg4ExJ}RDOyVuS*KK5&rxH!Wc&7c=!#U21uYB#b$~pV7m_(xku}g;v
zAvS@Zx`jWjcmGD4HALLAnUs*Ik?%iJ8b93s9=|u_6Q*=v=pnGP5XIB9e>i5=SG}bn
z`{`6s*<@V{v(RZ<9cpiov$s^cxWH23sBDHP&Sf@WQ2n#<5B=td^kAE(OA~pg#CTCk
zGk>+Bd9V{_v#%CEiTmpwoE@qU0Tp~v3od32NYHv^L>HAPGhd*+?r^*pm2laBlLF7t
zQTVq6WFv{GfDaU^nI*RR=w@#-^OlDVkr!AU<unmv^<4BP;L6@MA*=42Xi8Dmhr7*E
z7r1Do>}R|w9X2OU5eeT|Zv6m6=uX9NRghyRGLBcK_Gjox2j1d1o5jX{KzA<oxA7O9
z1!9hB9BCuEczpx^v2%C-0wJfisZC`08UW49H_fKcXA_i5qr0-RAicqV$3||xdb&+3
zOy3FMwTiiImV+CWluu3Pq4ux^X<iZ81sXY})CIzJF@ylH`zeAEb+Kd4E(q?<`1=GH
z1ZK+}n~wFbp97`Oi=fis4qR`Q%wg2C^#(1h2v03^3K&b2>wAyK_TxgNUq~{?k<Wkc
zv5{rs1ns@<CWBM^rrwbyy7B_kU+)wTTAK=oGB`C`Ezg3uKkG!@%T&>j;8|+d@TpvM
zBBw0gu7?p+TlcaGKM1O)(bg5c&+Pe=1!4CI&<$>ZqO1MZ3Z>mF!HanP$>H(&jSN*_
zcl@9TzL?wZfI%i7U=mVq@o@h55%nqkU-qkfvI}_PGx{_PSw%1|h>b}jy*T<qD7DDd
z@_Xll%EhXL7n_2uj>0x&j2t*Tpl<QEQSZj+tHHCJ#rrU`w*z0;>XJ%v6Mtb%_;*fb
zKb$YUy#A_R3q9FC(Qt5e6X5q8K{GrpP|0BaRHlDg2Psxs*|K(g_HBg>neJ{@(t&=b
zxe$Apwm7Ow)wuPxuJBR)QUm?QNzKo`NgK|dcTZC1h^B`vt8-9EM=HwB<Y#4lMZT+?
zv5{sS#|9i1_&(hKt?Z;l#4RCtVNw63ZG3BQ)D>xTSPN}t)5+Ml(DYQIjYFn$6FBv^
zKSWXpzYRpc&WPH5<t*%}k$aN+!8N&FR)ze<2ye7SJ8!mEgQ;nS*_<>#p}iQ-?RnEZ
zsdEF1wO}*NzP``P1B_AI<oZ&eYQxp-LmC6$jMT|#5DWlVlHs||cTJOB&~*Om{rX1A
zyVt1eK(R?h!9Q#Y+I#s36mwHTF!Be+07B)S;D$a6`uMSbs+`s29&kd)zfgbf@gRgo
z6z_FG_PCgn<cR}N%z9?N)x0!YpZ-|$>Gvu5kc_tR@<EmiWgxRY(I>HrXVv#(`tC(b
zM)6G6mHh_h@s=>RgY-Wnr>oanB%?d?FD!qUA{frHx7pt{HNOk0Y`AakVBO;>iZS)9
z2^`#Aa_S=8JDvMl$s0M@c4L@{f}7lUsjq$7OWBxjIdu4z#`gX;o|QI=qg#g53?pu`
zDE!^}c0#qwohg%MrQg~9tYjU!{A1c)RhjK&^mD_T+x<-=R#e<28sGZ{8Rv8hd4(s&
ze`4NO5BGIxFhuMBib6!j?EmEWvijy-foCK)LjJto=^*E2a`I<M(b(dhsdx|E#jhy1
zp1At8NIo!sT55wD_tjRZjU(VkkOw*^@-GI1Sjl{DK2OjxewhBq7`X4~I}G_-Qp$~_
zq0U($U<`oyzaj8zu0~hI`xd~DUAkjXfh34SvQBo^ow?Rc!lLz0rXoh4Io@b7#o+_(
z;O<*_ArOT5qgN7!4OEiBTYM8JboNS5X=GSwfqZFT{YMTKC>5JZK>dLyK${&mNVs?{
zgS?i~Wf5|iNJ+60AV29ka;qq(7fZg|DT~#}S3*9#k@yf<e%IYU(IZOucW}^dn20Ef
z#`$dm8H*WDLgiq^UdW!2qXODtkP4^3+^faD2JHGGGzBKA54r-zH(A~`(pmg;Hy4zV
z;;50Bc(e_t>v5VryqxX$I#vjG(JSICvhdy)IF!O77tq8cXdlHp$x}#Twg_Cy<j%Ey
zob3h0uWTC~raz`D_0P{2_`{moC1%SFuOY5f^!~Z8m%IKaEnQ`#Kg>KXMkX>TprIz+
z?5JVzufWwq!v$`d+n-7F+4_67?M2^8bP6G=Yh{G;#U2}fQv&aUaK54((YrmC&v$lo
z=*nxQ=5B&UtU_y9&ns@m_lH>xOGT|OO_sBI<wM(qM}JVzeD96<a5H0L8S^;9m8d2)
z^u16-+<wyK%-*5LE}w=6-$U!t-zpuSjn>*`tDLHq)5Dql7)xzL1G6;vt<@(WLfsD+
z;;V@py}C`|syDoBpaiR<5q((DWr_9zD}IF>kNr3zJUrgDvAIB-fTJ=pI{Jyw3gA|$
zK}HE`9Ew|rn%)vOl8(OYqhZ}g61GPdJ{*NqOsUDBkR%Xg4D6ojX{CXt;m^5>A}4(H
zJg}2_=W64Iwl$hi?_3`I|5CWm34I&QObqqj-e`Yc$frvG@uWeabIvk;%!*Z?J&8(L
z?Kz4E(Gf4s)^V=tmI!V4y*-ATh!4L@Di)cj@&UI$A+cH>mC;#n?e3@LzAE(^b@!zh
zbbAD{n;@Z%J7l9ic)u}02+#=N7Z7MZG5Q6}2K}IFfffWBH_q)U*K*)=^3h(E(Idun
zcwe20on7!~^79OrP29Dy^ku%vxge~tMOk0IZ0{kNbo*)lmYenbxP<I|86&ov$Uq4Z
z$sW9ZVv<soZinsWNa6*>2XC$$qR(0d)$UIk>5Wo0BeO$(n}M}M3tTmmb>=@Mvf}U)
zA+p9wTc9bt?A5zGKk0MRFPX}#Hm66lc(IVO=q=ET5nw?E?~4+g;P%PM;IST82m)=v
zoWJT7SZD-sG2{${KIG8Ddvf<54p~wZdk8nz%YGL05bl|6;%<(}^iybf+g!LV4@@tQ
za&-hgrKSDB!B6fjeyOoOvRdu4zx?MAV|=A5#QABpdE*etUyc#By2kQ}Z_ZzC>c?ki
z4t~#_?{Rq_ey=@oOZW~={2IEqa8#_AW`c5CN~DwxjD~$Q^U8ERsc+qW+s%H6Z*HIc
zv*nAr9$C<6sI<F$zzOj-Y;`k!aM_;t^E^(CfUjjqS4)Y<DIRKEiV<vnlq<*cVXisa
zcqCPPBvXV+u+BEw9W%w8$YFE9CNqS3VUgeMD(L=hzpO#M>F-_qI9b<-`vS``E>zAC
z@wHaKGOH6coD&DP-N-s;joEjmF#+ZReia1Z(5Erh<e&kjzK8N&7(zn-n2y*-JrrXv
zVF^Oa?`BH{N@9`kx<S;YR^iDeA8&Ub8{BFDP-&SyG5V<J%^p{ISzsZd+_R9CLO=qV
zJA{M!n;o|k8J>bSl!+{WqU=uh%j(S%a#z>)K7X}X;b%Y8<G?pS)1U-=$+WfTnbo^J
z9-F!^(c2q9q}aIH@aN^p>&uvpk^G~@W*)hH7kjFz!?;jyhj-@;pEN>V%TRu>-t1q$
z`6@Gby5HF27J3<?l4$dln`>D-!>!zgttaZ%DzByP;mWy{+kJ<h=~a1k=8OAUb8)7?
zjg@F;^@igw<24h5h#~L4jMg|tv@|K%$yc2;-q*5i7+>anjAv66z^1MjRz9xv+=MRE
z02i1>x&&TjQo-DA05WDFxaeVLG%85Hau_}Vf~Gaq*<H_+RN;%4h&F;N4UX^<R$<Jm
zNAoM<niNu;R@`4Cr*XZ)ND&GWFfmkU@=`!<_Oqns7aL)wc)<zf3w!ywH2a-GRna&V
zVU)%|wBd@OnipwgqLo_VghMnD#ZmFk7X{^K4UvCcm~ST6f4?F!;u4gPCfBoZS=4Fh
zanT{uim`U_EZ7w3p?rh1)?Lp%?ZRRETjcxo+#;n>MC3NwOpK%Vs4(>h*2*8<oj#};
z9!fVC3)AN!O*dPnE;NR$q=Z(rBbF{T-n*~tbbTFp`FQN_qI_~^?^kSFg0I$4hAR%&
zi6>m@Jj!kDw*3BLD0Sf3>j-<CjXjdM;(Y(q3x_HvPa|LneVVq&5-+E{S-@{>X^8JP
z5c~(O(AO4Kj)C5$fdhQ;@gT{Eta+4sic%@je%|HeLlDu%rW<=|n(K!l-5X6|ZyPIU
z>(ieqBIVIGA)b6!`?4sKjFF$~)0)^4o`NaoPA(lU2Ik}B{$m>!+@%p3DOb`jDW_&^
z>Ftd*f0o_RI|aXU`UkZxj`<R`70??^zH4Kf_RZdOqUU^HQ|(E?7Ara*CK3=4f=ycV
zbXKh&3qhVepiIBzZNcKp4x}V(=$ilIzUjbC6~t+Pq&&d|QCY7krINSLcc;I^LBpN^
zqNo7pn3w@Zg*3kpwL?Bw9<LuHBk{*l8_(f$`BW{N*D1X*p7vb5&GhlL*B>wUBGyuC
zBZuK#=O(R)`2;Zu{K^E6$P~4Hi1>UT7TD1uCt}F>sR0g50<D8GU)m&0y9*-~O7893
zfCRw$i6xS%kLM1A1~H(_?VmBzit@YyscPI$|5)&e%dp+59MAu;O>&L-3Y}@OtTP@?
ze%07=UFsCECQryc`W5NnfV0D@Vx{B%(R5DHk#^k{{?bv$wr$(CZQDl0ww;b`vtzqs
z+qT`O`XA%m*G=i&Yp*%yGkxCf$J694+!(5sed*sC!$+d!Z=;SW?D1T!H}-oFPL?_C
zH(&C*LzA|7Uzp_odfjvCq2|5^eWHYZ>DiA5llj*^V)MSbMz_xQsh-dzFtimj>T%Y4
zq))wiHTt}-aU^jmfN-HV=n&6vwYGdjoOpP*`d7coA;Nn})T-Xkkb7^MCJA_yUv7JA
z^5gSqVe=`eFo%|=qaO1z&BU-TQF+*ZN${U<=#BWi1t0#&QTg8T=o^zxEE?4X3Ca6<
zta|jlDL$M|%JnMn>~Y`J`$Veeo(86ofWN6|^?hp~jRv1^k@Q6<NZLoEN}cW>F*pw4
zk{uUgXvb|g7kDY#PY;kwy9XZJ(!l%^n<6&1(G(zI))EL5{YRbP&pW{2c>!A05O=}y
zIU2uZ%J&<*U+m@NLDo8fjYK6XHQH=}e0W~Q=OLh<VS8s3)F7YiSD#nF?I<#7OfWoV
z?*dSiwlZMc5plNViIZN0fB)03`>S+;B5ur~mww(K3Si9@#q0U!I#{+*zq#|8+8X)C
zmyN0~2C0E&yX|%}kUFQe(`~~J(++M?L~QmkC(^j3O7&tJT1mh(!_uU>RC+Do%69Q;
zK-dK&EVL`+)5)hZMdPw}9JrJSJ4`lgHxYbZ5`YnU6KSxRO^^Z&w%-EY8X$&d4WYeP
z^6nU|-s$pCC`t`Xf_XvE<&@>+8N4M!_G0yDNW<YEQ9*?v0fnwjLydU09*{3NF5f&J
zH(SPmVv+uaHv}v$=EqZ?z(Y415j$e$DC1<LF%+1aMHyuTc84SYw8uGeuxeIx3QTqv
zhXUTGSG9iPEFFAF`}y@?j+h5`*uI7Y_ZV>Xe;1LZIMLZq2O2|a;htN{+p1H=JSTtF
zsTgABX5amwmU+0F(s@8cLJt}`RGk>NVV-M#riX>Ni=-+Pq(pcudQW{Rp@XP}9j@w0
zZ7${=eJ5Hv92?#4Z-~S&meC|dp@JZh%$(Mg*Rz9*iW>XRPAqgx*a@kXz4fqp0;!f%
z<NEs8x^NJj0IYuPSqGg|A<EBzTw34ib?Njo?0qqb;!?Z66Aw$GzNv{VwQjv;*U1lF
z{g6$gAhw%zWm%aZ5w<3{JNR&Ezx*nttHw>k%uy_EmY_{+DRGjLJX=jwwJ_{<bfN%z
z8dtKQhiRJiNG5d!Y{hd>ZkJP~D>Wzkz`6M>XRVuVFBo)kyqSzO{6ISiK*PY0%v99h
zhz98(ZyGVYXkmV3FT>^a3j&rA9#GA^6LE3|ys7JFqnMhRNfmB5bmDc6jj>!<vEnbl
zDXyQ$<Ir7!R&5pB?wXp`Xg2(a=e>`R8k5nAvMBIGPq83vaqDaICQ}d#D4qo_2Bnkb
zAC~i$ijC!xhY~xu4-*H}jifTIgvVtS#K>E!EN=K;zp~;Td&7B-XZ)aQ;elztoZ$G!
z_Rcbd%N$D=+34u#Ccf@TUN`oMn%SRa`;K<H6g=7)T&_3k;J?Aens>DlDKHq2A2(@W
zJPsb;AI1m&o9XSELm-`e{r3!|B;rE88%1AV{dEP*96C;OokUc*<ktO(OiI?E!E1~I
z!2^W`Jr4-(K4D}UAGoPzEe8|he?KL;3o7x?gEkrUx3jW30>s}<j$r8K;F*%tu;)~=
zig_^AXshT+MZr?R8BeBg-pvYmx<d=6M>ub~f0;$BWl_ooBzHq8J}uO7L%71?5<o1L
zZVwNG*Y&(p1J@#vLqnomgnM7-z}APpF!WsiZ@}8Zxy#+%p4Lo>$*w13{<5Mv`Xw+h
z6A%#@i6o?5!aIiE4J>7JYPc@3tURESnJF^aHRu;)8KPP!0sIDtrb8g<ozr&Br#+u`
zk!$H}AQDUl%+DK>Qjkpu!Qipw7v<Ic<d^q!rOx%a6bgZSZNYKr$h2;Q@^$W7;B+}S
zVHe{57Il6V;hdJ|ijc?!;G7~xxi;okKZDwSk`Nb@;N6$(9n_^6PWgxR$FV`Goo-;H
z8vxL1d#pk1G1=hpf(8`RGh?tpOZMPIbU-QCKsUVDOCB}jw|Ls5lsPagxI%WBc8{+E
z>9RPC-f;*H3Y^;5K+G=A<LtXXOh#N7qJ9{8wb1F}T`7v|qu5+jB1u{(U_q)Ely@nk
z{%jfi!>&;)1$c+S1BJseBcYG8>S~J<5bJz+O4G4N(mw%W8YuODl8}&yc?Mbi!&wxz
zw_^eg)~ML}bExRE8x8v8?KS<jbkkshy>m?YCcCx+0o*7vlanYV7WUqHdfk{QCPzZs
zC!2tioFL@b>xI~q9JvD#hpK<S4hjs=E=X0@eIOdC-sMCd*jvj%{5l*Zb-Cqre>nax
z={qbLI*r2r`>Q}?g(;sgzo#Y7?;Q&0V#nYTX0PqbbzlAOFwg&+YQ)r)zkXo#PM@tO
zK2|BR&Z91OjNFeDr^vdl&-d(lFVxq`d-t+@9QgTWEjanlSJPgG9M5O}xyg8$EWpW$
zKRh``-njm`+3oA(xTDXxmW*5)8EVndAc)aKd>+3T%@FK0(jr#<oo~{I3`z?*xMKqJ
z7%kTs!~?y|1b%*g#5!ZnTQfjLU-l9l0l%)PjW%~%eMqIi8RjgLBQK_+HyV4PBk<i#
za&gi;HEJAZXXF0kYLkXv(d|^%IymuS+NXr4E9tXRX<~KXH2lEM6OptGYcr5|$8K$f
z$K-m)S0b!#bq~PnS7MjAh_keDQO34$w1l>cTBf6!7~TGYlnT>V`Iy_*K{2R@*!ByI
zh=oP_Ek@r<c*3|``-KPOCx|**llKs<-K+>`MvRW^6z0e%^ZfxGH2x773$>UKIOpsA
zVmO)hXSLo5#m}Gt4C-w7c>KukwnQWUZvY4;r{jOqXDbLsLf^v1<xZ=l!EZ2ya{CCE
z5>{p{<MmW{9RpEk@Z3DH#B1;#7!+LLHPj5l$8tCgK)CTGk0YWOS;?Y&-=D$c`Qbu?
z-fvEi+5bF$cg}JTiWjkg(=8!rVO6a5*i~^(aXC^VnYq?l+1MZm{Qd9oY6Afj5>B*j
zdajt)(>AI_7u~Ik5>H(tjVR7kh23s5qL;(AZ{h}nxM-lOfBh?=Ktl=uypIbDD4)XJ
zza&Q-JCgGWyHV3n2~#a)KKWM1FBX(H>)ta8XohNIYv4Mc@mPc^l+0S&oCu1uc4JEl
zqz2Yj%Ic?2N<%kTtkBz*x*S~bxKChzuZ++ob;z{opKg+&>vg(O=mmbCE_7lDSJVNj
zSz=J0wk_35!Zyr%a>B+I{>sk@11A!ct@eM|nOEs**0ByO+t08Zta8_y)>kk`w+U**
z%Kq`|YG63kSqO~5T$<7kC@Xd-`nVJYfd^Qkq^D%8>e@!%7@HJ2QSxsej>SQ4*Wzu=
zRe3o0{Jpz)t@jt;bw|)SHp>fVRciZrHWj-o#_VU;#p?Js5MoBCa@ehlItO|Wj66i8
z@V%>Exttt9ZcQuvY#N%r_LmvBn4{E>uM>j){~XXg`LE?%`iUFm|8b?1j?IlWZ*Lv{
zwURf^-7Hn5_xyg9@DgPZ9SsNr`KEvSpk-hf{fA;@z{ABw#73tcxces_(^JmJ1&5|D
zAOBc@&^NUVjAdwM3lS47U}XS(BTL2R6Jym-Qs?e6=|GGS?&5f%@p*kmU7ed&-MGw)
zRn^dGs3==ty1g+Dz>@bNL`Fm;L`Pk#4=O98&}_&`P1E<e6N4oT!=eFP>^$^tXn37j
zKtjCo90+`~bD)TL3;qR}cWm8GO-v*bCcXp!1zCY1U?m)h54oP@;Uy-Hg)U7Nkv!ni
zWlUB<px}5NhYlqy(TG`rgdq$N0-H<!SKo5e+|ORc7u$ljf&6m4Rq4MWSI55o&#>Uk
zh_Rof<hTP5P5guHi7QgrNXE>>u^*!&(?~1vT{zJfm5e@*qRA_-CY4HA>(xT4zUn&q
zK}&y0N+h6lTJ2Ye|M)p{TvG$~gUNB2#mfee_8D}vHlo-TdFoChXZ*InXX5lJC+UfU
zU7zY7N>WT=8^YjU9`jA|^%!S8eK`F1`-L<36`KdZF?0#Ll7V%lLhuKRnJ752-oVb^
zac0|4+-a(wa&F5s>SmYjIOqq{6px_x#ik43Gw1fkNbt(zwKxqN#{FiSjureNLaRNW
z0P5oNrT4F$7S#JrRfqon4rp$OX-rr~yD<yb%i&*elMO$JaMDafT=d2SnQ@NHOwbVc
z9ut}~Pp;Xad~=vE=Wz;6cJqb>efjb-b)pM_mIOTt3szgl^i*}tNJn7WvT&;KwA{bd
z-NM`|Mh2dC!HrV|#ol2iZGD{wnlsl12eLGnYjI^I5d$}tVmRnk+tPqPAL-Nz03@%H
zBQQ^7MRrGbHiyEMuz~eB81j~9U=LVf0sbT^D#=;@LOs=42#yO(V<db;8u!li*al<>
z`16a$<I^>U@**_tBTr)Azu`XYzHYScwzPn$`q!BVj`lGb^<^&`g@fXLetk(PO{jZ{
zGj!el(6k!o-C{z^r?5u@g{!L2YBblcbZHMraMayKd9~Bv{o%Wnn5aXHh4z)4mr9|E
zK)`}+x!p`$ru^F~64Uh>U=Gf@DerfH()D?|Rrp`~(M&3)%bwy8o9LvTl2zzk?9sae
zKZC<YJ$lo&59mYh*En$-4wk2*5rV5K!E>dCq(0qB?Yr8y>VSs1Zv<1@R!|%sueK`f
z!5zhiiE>C5pBu3`!@HhYTl+O<LYzKR;A*c8in%-h87959CBoqok?T~N_A?@T?=eD%
zZ;pwb_4=Z6;<oqAg~{u4FgBS3kb6I%<N4U{y?0fLb;h^Oy%fL#`mNvj<EHD29R2&Y
z3S5^xYH$CNGDV$jt_J)Kyg249`qK&u@AlaH=HNMzV{m1mW&GWeFg>C=qvQCbj?wlI
z^i<l$(o39KT5>x@#M$~6M3^7KFvY}IIZka@comHgk9(m9B;$AD3DZd|RsE4uv7-W&
z+Si3m)$PWN%<ZvFo#D}Ysl^zq>&|x0{mYlfjwIIS!_=gM(W4y+68@qRs<N4AOBo@^
z(u*woCtNwd;WpC4+nOffjm_#Q)nri9HtvOKxhviN0q_AT4Sax#MJ3+N%P>fFYVAhv
zG(8P9m_oS&!HDEOr?4DwXzud0<z#Z^BA5SF=knlu>)V?m{R-j3_RUaNhqw<I#Ce0A
z$KH-pC=&<<g|s3n6ssU)fl6&|Q%@eA=DUl4dKfx*i5n^jo{_l8FvLozX4_outLH4Q
zGUHbkF9z9ck4v+PyNR5%sg+er>%hnBcn;;__BI+1^er#qYk1=reX6VDK>Ypzrn<3b
zO~#?204}1JwX8H~weT|fEPgxaX-%F*t)rJE<&534&ono$$;uwio$~QAW&INAmO22g
z1Nw{Kjyu=)T5D~wNz5L;`f7S2)ZX4+!k}Khn%c`A50o1s22*i|OefpWCd!sdAdlVR
zH`VX@wzkp53YAbOM^$3w(Nibm01ar+0b!AZ?4&4!9^DY4FYj3)DYP1bSW8lAZJ8Ub
zamTImo!j$jgko6%1&l*fD|MrG0hI9xIn{bTes2?M{B8%@4he|)U&FHh(O-B9AFwGj
zp)RsZ#y)5t?{nk%chefRJQtsGx*auF>blv{`Rg2@`na*pSWt&|2o)htnZ)nqM%EO$
zmZUg{r#r2c-p4DWp4ioXXUiEfRu}cn7R4igN|$GZKK8ty)5Ku2NyCe3M$RrQfYPR9
zCnOLq2R(AVy*gH(%rniR!<GXQGJoTYH{uWkIR1o!64KJby1cwR)By&zknFph+K28q
z#&_!RU177KFn6DFdqMN$K^)5lBhpTPJhU#)gD5Bo2?aC$oNKef%KQlpJ>*Z&75=T?
zU)kH!Pj>QbBo00N&GR_at1x&A0yp;>rfs`cudk@7Q3SvCABKW}629oE7$%Q($dJu|
zP1*wt&0)jS&4oRF?45vLG(xXVbb_Ekv3Ua8Z8Bz@=Gy+W1^TYJvE}+b=U(HhwgJp)
zClPC3xc+S*o(GEo8}{OeWj`y&3nP2dJ>jn0L&dVayanCzv5i!wA_l&3%K6@7UqCB|
zvA$pTt&)13KAkwYACQ5EL~j;sRW14o<hhOu;nD2X2ZYLx=HY);ttgN7tp$Lzs55+7
zRbbL7<1cFwCWFF^d7RD)9dr5Cxv<Cl?2i3+U;5O+L?i<2)7*UmBRkr#_`Dg<^FoJA
zHhI|vO-j(m7)_A)rDUP-Uv1P?=~X7Xup|F1h|`AXiJjB~*99qQ9i5%Qd>r-j6F}n(
z14IKF^rM54(f*+>+cxsu;o!jDp`pY>-iQTv+I+i$p6*tHaHg#t9l!>5bmUZPW?=!R
zq2c*4Y`zmfEVYlFGv^Z4#GCP;_UA@NIC}s49pK%+P|-x%)X*eRqsN}KH3p+7gZ1=c
z!3SaLhc?3ExM9~8nSKmJ;eyW1%@x{C{qzFX3^oAiaZCgG59`zKL`5XKq=tfbG3-gB
zT<YjCv9V~Noj&r@`a;0&bbG4Q1w1*fb5d0WNUMQ>)?e$1Wo9?Ketoqy_3nlTP``c<
z<&8R*lf0+hG%v2#-T%PbXhNvAp_Xd<`%`y|uRa!*rjv(9s^^bQnsHx(k@HTIghxtR
z+Q8ZpsQ1fdkS|L!8V$vSXL;4g2|;&o0|GA<z=S6m1&n*el)E#;bZC-hLQ$!7De;K-
z3NL4G???*2C}&sDj_Qxpz+w2P$-Tti!I3)tzJT0@!dJ`uhb8kfNUt>_!t9B6Jm0Y@
zH-K5Hr@Cu>W#4o=v1j{lLN0rhjz?_Dr!#rGirPwIP~?_@m&5eS#CS77-E6&jn?dKt
zGG-4vS+V$2L)Emyy|prmy(15dJ~~3Me$pZ>6+MxOc;KA9S@ghFUPMCmI`?)1qk`Xm
ztOt4f_EA@mj6w5o=P_^lhfLt0y0#LRV9E;|;roTF!i0AGTA7r(iW=Mkt$0$!eh90~
zgOo(nHeq`_(owvzJGA2C_VmkRulp^!-f|oFF$RvMA3b1%;M<%_l}WegKEJRtR_e5H
zZVTePX+O!hz1>@S5s4ed26qu#Hzg|&!$Nk%=7u4GG)HSZ&$V?`Qc}$<^bty8b&V&X
zpVXqV33QxvqkxkJY3B0<=}o7{ousziGQcxV)kX2({_*6Psm~<ngP4|fN_biE%ycT3
z4+j{+>xsEb4&6{u4@`iPQI|BDy!H8Sz}^kObkK+6|J+yv;rwvQ_p#lGhObT-l8oc^
zcn(K^u}#~C`=0QzR8`jve{hWzPtcPa-${@STbIwcXhB{SW-4I1UqK@gD+dcgHBe^Y
z6Wo^P9m9TT*Tg&h_NIW288nN{5{5yXd#t*iX0zoLL!CUS>`!-OncZ6As@=V&+zwi3
z(hTP;V})gIbEW!*Jy8liuc?8y;>b3J>EOxUYvbp{tT4CE=g)%+wxjDu6Uk*a>1Io2
zf>VS_uZj96?0jHGTT#P{xktr`S3kv5S!X1MI(R`D$?lv4PGYpsc5VbBFKoR1?~)JC
zS)$bIQ=5SpB?n`IuEB!2$#4|fD{%QdltW+k^)dvlAaZ!Fw#?*+3p`LrU`Bz6S|lK<
zWB)2D)8Y5;-<nP4aQ|WlFj2UW_F3jkI?+=kfW2Z$i9!i3(P4KYo1Ho5oq2=>y%k*#
zKKrgc?rfezYh`@i9|(m@QIj^!Ei;O6IvVQ%CIs%oc&OmQGMcQN_xmfJbH{8+$NIVc
zYO~ANt#ttEJZ*-h4hMLZ5~Y<9tEG?S+GD^knX(C$vqkK>?W~izb;~vThu5O5DrU?A
z>xCU%E@=2N0b|uuTe=+S84WdvvJ-C_P!u9;t--C5-E!AIb7o01)ee959{3J`q}_g-
zY;nFk%4t;GuXR*V=$E!lXBc*eZQA8PPx)H1V-+Q(21ZL@Ckd!gDQ=BImhj5XDR7Ji
z9y+&e!w==Z?+I@-G=&H$C?o{ylll^fL=N>!9AIquV&eiAKtOp*x5ioA_0`Gm<4Oiv
z=^OLLre#H_w33h6==gwc(~%+Ky<HGpFMWg0Mthdpu3Owc17yAyqc|Cj<jCcE!HO66
zCQxa!bM}EoOkC<(+97y4D^QygNx~?faXq<`v=jYPQYJ{J2jZ@I=5O06eV&68!Lspd
zoE=7os~@6)v;D)-#tLyi3dHj;cXuzt_S)jCb#usPVpCx!CZ!X7PXF5mTxm5ZW1||z
zKTZXO`9P0fZB@XLoqAZ{K)iN-L5`rf3;?=VV*7H3dOz=F?zmrvF$~7IP-&3v0gFJ!
zVn}WtvsvZr-RBo`jg#`}n}7M0#YV#X2Jm>09SrytzB-BKy>fSd|HFGlNnf@1>sjX?
z39E?1RfNhy`{m+_E0r<7Zlg@u;j_wZj}K!Z3`5T~@uwS*;OJ{yOw7ZhbM6ML)-eIb
ziwehzk8k~32E6uw*Ahcm+E?em%d6F0dT$*dV>@a29KvIxb3w-dEK}|9$U1!Su-Ki7
zlc!ho@Fx~#`cy%)>cKcLJgw$!^sJ*;iFM89U9y8u0&#vZwu>36w~@7v!8NH^_ZnD(
z5NblJrr=j<7+^&r_8^<fi)C9MjW=Ac%<-`Pud?Azo)c)kPtG37oOkcW<A(UQgDrQt
znV697dVaT2##?ULZMp}Al%zU;n3)4cEf+Z69ac0L@)!keD*M~7?|lyp<;0nPfthrG
z{tk5<lM-h;3lkF^m1gGf&@d$>m`#EFB1XDa4Akp<k<>L!Nedf|1SB-U^S{*8jqori
z3=S^ni`Z%?FVfHq1b%%?B@c`bqw(`!GyAV3C>w!bmH(NrWo)&!y9k)p>ooei&4#&J
z#qzz`ig5CBMr%?_W})Ub@{DnKLQM9>Xp6g9PF*6nI?P#b1H<pN=UyRVtIGMTsPpO*
zwvu@)ESrAK+3tWq-g^s=KAjmDZ;(Yl5e&o-5A?V5MNC$6<iN0{=RMi^eY}Ip-an6Q
zYR&Yo)xI?m@`I*%EvoM?VZ|FwR1p;F#OqU1jge<xwf%Q>xo<v%1-K>;?Ft$o#;vvN
z%Z%+t>2Ql5*@l~(t$JX#-N}pDZYYrJQMu|$hh6VzPvEU5xPQ1GZpaWbdhGi;+dqc)
z(7<S)BY=!<GH7z+=3qhch{ue`V?RU^_zl@OMm6H6-K4hr{d|9$@NmbhEGernsi9<Q
zxQx$KY^W`4ayZcs+F<#{4cogftdz^Di1oLRDX)UQ>?8JE$6eO(AeLhvn72p=WWD@b
zCQ{i0dz^KhhSBERsO`L4-%?ZvRYOP#yf(cqY6`#b2?!YMvDTsofy(z#P?z*d?ilBm
zQG;?S*zza2ok@ZsH$g}nyCdiHMjOiYuUAs;x3}G2I@jW!rl?8C@KBU-3Pdy9iT(B&
z51$9^A8}dZFh)P&B-N>H%oF!@S&<qhy>lsB8sR9ZX+??XutSSu^(FL?xZ-Lc?m*Hp
z<T~KpTi1t(09p-Kt7S-R<f`5@G!sg?y2MdsY|X2hD!zD<2RRhVt=vbah7JR8Cr6=`
zN6I>JNTL-411odF2VRY7TrlYAsj1Ow|J4?yr*m|5^MWDR7GwvLnNALWTAEdQih(hH
zb1f#e0Q9GRJ4l!N#I=#Z?Bf>$!!m=|H`Fz|5frcN%}S{r%~gm*v4)Lm|G}5uiNR@z
zf_X3P_tA%Kpld=c_|PU%+Zus1Mp|V^z*vFPO|?9cc8R?@63W0|<L91AN^|t|@RLWw
z-0QJbnruw)H!0t7?lScq1Z`zEdFx&yY@602?*V1EC}557e%Hfvvg;+k7Q(+_wOIgS
z5qrReg9gEwvY1UBD(dzH0PJ*{@Ud@zviw__O@^qGH@Vm`k(<L+|6<!>&mK;wKLerX
zgXX96$wg1V4}lkKtR(wT4$US?;uOJyhyaTt+zdlw#sZiB#V+HOSu<J5UkP7ACdSGi
z6*A)J>O>JA*$<`?WqDsTlBRt^Gcg$=zT2QKrtbO5SC=Z=#+0*vF02j_YgW}I7x1f_
z5Lsltiq~AJRHs(puhSP9-dq-MPo{V!+2%Sn9VB30d&q_Zl0Ivp6=Fp-;7)wmePZVI
zh!EW~hSh{?F8-1!ESRq){Y)I85GQ9`JDEE8%upGU^(cKP)~_A!_(>VSmD!-#v9LbL
ziZJ?6APWLOrlY44Ler9i{s|k{Mgdd6!KT>nMi{lmx@~P!S<!o6GBYtj!}cqVR+yRY
zM9%kE3L4y6*OK#q`8T_lB?7GD--??61kqJQ_#2~4`~9~}zW;RH*UT`voK2g)*6`hC
zjZQH+vzYRG1k`ucav`;d0#3S{n^}e6Xwcy?83lWU{EYY+^8U0hZ20{$&d+4aPKA_-
z$i;Hnuyid7PT^KIJ{i_0BdZL)junUV+#>cf68Azr_J0FP7{>VdG(LP+2|B9eJCHO8
z5Mknd<a9_HdW!@fNeD$QmK54I8R{yE@o@g5>Cw|Q?HTCIlNaXu>#5U3+A&UAnhDXv
zRT1tlFl5`vf9Q07imfG?NyDGOlPbib#*82Jl;o{mcau{0<o|*%uvK)L?|QWw+XEy8
z&#o6M<|~fiF9LP0guE;XNDc5Inn|(cJzM0~$)OQ}mA&*Of61QzxD%vjrjoqBBu4wB
z1_Q7&C~E$b>64C3uzCjW=oOyjfPN$7z|!`1&O6appi}?87H*+TPT+U$&%b-EI>y5O
z^Z#@Y*S>)L^oD}MbbT+W%Bcs82OmwsWInDKOeW#&3-6qT0*NQ?+-1z!m8*r0kM*W|
z-ktl;sXbup{16b{Dayz}N-7F=^ah(#Gpvxuuji@y=k9HziJzMm4-|Mzqbhiw#N}Xe
z*k?<XCdBeI{@63P_#4#Q+k19-Y&$q3u%mC2phtI@x@^4O#6ZG3tHIlai(oh5<NNG|
zjJZ5KG^l(z7EO;MBrSO|pV`uF1%J%^TFp<GokQYi**mQL=K)*S9I}<b7CgBwc5-h2
z^>c%FX}o;}TJh?9mI+mWPU{Cw+8>r$ryvCpK3I16Ti3Z5n!HahJOdq^+cAq<aav_F
zwU0Q2%G?W0#=aefN$RF~LK@n;-`QDNS!3wpqM`wC^!2tzdHlYT;%O;dG5TWhC9r%o
z|1=;uru=8@YMuT@>gwjn+!Id)W*|>LQEgB6-Defm<L@iZ0g*9R&e`>w8wT2q(DuEg
z)ih>Gc2^P38GL#AxpgtjDo6_5_>9I%a$7sK9MP5Iy&o{?PAr9Wr5^tpGDw|%>U<mQ
zWX0NZLIJnS@vx0@)Sp`{+UBqVzo?8lb0X`|33waW(O@xFmvRoF4hdVpV*dS~w5;@T
zAh?Jx-1F#_n5HRg5(@l&P|pe>za3~{kPqFdlgqsLR+D~s2=_do08uzMKF{;f?=o%@
z!u#of<*Hs$xw^=UE2(Wz`aUcpEtl#*E7n&X|MAJOk0Ebn^h=_#em9z74+B;DBp3W=
z;lnj_5;*CSz`gouOl6dEu^DdbSg-d9{Nwc&ib3yRV*8G7>P^>SaN#^HKb9Dlnpy*&
z*EC9mXHu;9EglbOdoH?_(a9Bp9({Y`*P6nv0*678LdmfPbg6NwpeB+QwS6pR=294}
zr>$^)j?Lg^w;kfK6%oe~&!hZt$fRu%C8C@i>#!!R?L;@%DbN=!fK}vYs=AevTL=%D
zrh3vsy~l{eO@~qnq_^u$6wo6p<I9=TolGMf42r1mu5<i_hldh8@53!H%~0A?J1nG(
ze~F12Hui2B(|%9<+5JEW@f4HhRmD_2u~bKA5-<wuZ*iG=Us0Be3@+Sb0m+ODOfV9;
zqD=Z#Hf%FDo5WjHp-(r6@W<h93gYLpv9Wmq>t(=ykOU(LX#x`TF7%zp$?muB2YKTL
zriW-ppn@sjM@S%hTH|Qc>y1PCadf}(<~)rqAbzd#i;HS9A}24H&L-BWX>x@kH-l<+
z`Xy5$R*vgHGkqkEN0Gbc=1+`azZ}Qn+<x3t-EA;T);mcAhc#-UZ~C2dx2L>6eLhT!
zxr#>oY^5=e2Xv%e12)GNW$kLn5n?*sZAXF9V`T5QcKnT><}z!R2%>%W8S^8-Y&<)4
z@NB1rM>{u<GPfP*8m7VdU{wVzk@ygDiUvVo4V=O=wxzs*RM1npo*N!<1XSTX2c0I0
z^9er_Zbgxo{jfFhx_Zqk+@yMSi{y6A3}FnWA4zSmJ?8tfse>pfqZ#V+ocev5SKp7A
z;b1O#7Ukp!qh|`>nn)`5;J9d-xa4`ZM8jX#ZTRT0V9yv9cb1@M8z0#Sz6`jG@hiDa
z$w>?vT9kEeu~xtl0fnDyKTwpS4<|#+ts3Ko2yf@>M7%sAog&bm)x;{)X`?^<tyoCs
zhsh5);-LnBYPH=CVPi%2*S_atziM85ZX1(CFuDGX0PJuW7Q@JnH}n^Xw6AmLpuceS
zGS_9sUyZr~q8FHefZc}TjP$ZM4ns5Y?TFiKJHjYA4PxFLFO9m3vj7k_2WP#ti6LN5
z*&&W;l@KlEKope+P=`93O<}2xv+g+nB>mNfmUYoW`onfwSkTV-Q`3bIsizixjBWuH
z(Z;4FR>#LVOcUDK&@1>@Z(CO_4b>1z%dCoZmA%?qG<b1IwSPeXcSYX`>oOL`c)q{;
z)$fj&R;LxU>hC7)((lV>ira-vjXg=P_byRob-LML=1<4sS_tn5ta|$`?rQztKXw>C
zYSv11xoq2KAu;qkiRP5}b}b!9o=o#&&nO}CN9;G_<X%k%-I<B^h%ca42E)#EwbdhK
z!t_H|#|*~}H1q;{zjed&{I%i?{Pm*nypd&}A|kFLtLl1iF${RYPLdmKDU4Me6WB9m
z-;4wQp9O$zCcS+);=`v<4EIW2h`_$Ev*ViZ`jUnxH~$cQ5w;_X(<p>F+bd8LxV5*^
zFSAN{TtCI~YrWGBblGklL_<TP-~jVTm_$Q$e_*m!ylsrIrkgEQv+17Wv;Gj$=Xs8o
z(pyAE-G0O^J*kaAIE739&!n6@r(iqruj?1J*T;vynHqzxJ2#vCm|kmSn7p2h5ZMa|
z+xWGpqhGa4qbZ8LTtvVt@(d)g?eEy`jQS(19*aRv+ci5N&VlnJ+odmj<=EF#IP^Tz
z4fYh1(N}>dl4%k$5%)Fgz(JV`!G5C$&e!WDv6(mT*GvUBv>R+T6{cZ{mO5eASM6Q<
zUed$*V)gmCbl2y+&1%OTf^7R4yJ>>cbKJK57(Hd`4Jiqk60ICE3&caOeh@|;E(0$Q
zF;Sch?1|^Yl8g8^Pi=n0_Q3>grfPTQ%=l-MA_h<K5pt~jORGFS<&12SYyWr7;re>~
zFaIv?*ZpUkkNwG#joq`8xTx%;<;EOG-1NySLlWFB|5cgKmOqD3!Qi?Wem(!utyv(z
z!v)tYA(2v)<vQZI{>Kd=F9utWOtf&^W#N64s&P1Bp-5}kpZnAM@ig!xm&~R~emdiG
zXI$9ewE44QHQ6f%xTJo=RO~7M7VFJtZd16@FUvjikeP;1^YY^UE7yIO%PX4xY{+j@
z91VyIRDl8QS~1S84-O9YtTz{WGiEOTgFm}!%nRcUhs6wrF|P$ZGuN><qf+(vaXq^S
z({MfFt@r5YD1+Osk~QQAcI}o8W@09j1@a{6GgI2*z4cMG3h>~=?k7`vK35P-M}?@q
zD?lPq<elQrqn-<R_t}PZy>Ns7YWeXC#c5wWaP-GtHXO=sX70&5UIUk1rczJ9y|AC=
zh;s1Y-6+n~#exqPw&{bbZhGkx*EY81u}QmbT6(-dEt$hf4Y<68K0=zAB}h|Epp^*j
zWDon*<Or4=XXB}a-Bd=I+Lsseou&Tvn$L`WQ@g=?vMo4{ieZTmd;8>v2E47V5s)Wp
zJofv}lRN9Kv`ufc@6I@&mqcI2lVAYij<cQ#{HQ$i2%xnV^FsITcj(#R^XMa?1M@qN
zvmQQx?nz^_wq{jkMu`c}DZ(^LRnf*^H0~E|_C(qK8+Ag=E%R7LV{{dU{x4>&Brph9
z;-h}kkg(9f$doJ3FBdYiA=0Rpk_SY(`uQYt#^>F*UdPFH2_*Clyt_^<fTE5FmjPqH
zB+1NtNoeuZBG9bHfG2n#*gD3Q9cMPF0bTynSv^&Jx^i`qx~`#`x4a94|Kr{J_3#f?
zec3a6=FK0(Qu_-jqWSf(F0D};FY<;4Cb_P6ES!MZSwyFp5=%_KJRMyag%e&S{AQPz
zU>X3DtgN(>7HzFjiU1dx+BvOT(P|g*Rr6!CL;CJ78HRx58nbS+X?F+B&;|r~Ayxq2
zW^Z&VBwCI2e>Cc)q-2GRFO1m(od+Wi?+Gq+IHpPc+Xfmn$=ssYcs@+S<4+bxLeHO`
zg!bV2-X8SZKF3JhGe`XUV6++)Tzb%OaN!74rxqpT`;I;CX>}uzGa#E5O3eh$6cSLE
zj7EbyTC5PwUCh?ywD5mF9`$^rCaP%vw%cd~TSy=jf+{&`ra&SghAO3J!|+s&e&hL@
z9MIdvge4zD6{oOfx->2%8xi2kAs#SYM`mhvo~pPKVy%+<(v_SG&>0EF8kJ`KBZ2!A
zJMO<UbrIo6S;SA%I(RDIN((Av3Pz_a{)5KyQed9uFAGLdI`4FQdw^0^NOnnkOsIYm
zRR08sCeHhPAB*(Mq)#(BoB42cc+6gV!!ennrbu%CLS0woxz8Xud$#)!F$4>hz>@sA
z1-8M#sCr$8_YqN0t$k58Qvc@zm_if4sco-MrxIAH3(o5$Vy2!zL_skj?AH>JbW9NA
zEdv~<YK2X03RgsPb){ho1-+J*=Vbk5-DLW#BxmGtzb|VPh7}SLf>7{iBfk@=Be2qJ
zurGp&8))zXq8w-@Y?IP2s=t@7IVrWYE8D#CvJ!1G-cP|)_@^CAZY+NmzlVl^;c&lW
ze$4&+7}g@dvW9ZDpU@vSSs+^6y|k3s)~|u3$H%iAFXeuHVJkkQ>|(oeQFAx5D%fj!
z*=eTCnnWP}6qOj2+z}NM!{&a|UhZ$&ARHVZ@MBuUoU7TT!o{0W>wkUXv7@Eoy<ZyK
zYLUX@>*mes>U3NM6H%*K)_=Gwe~-Cn@jcKU{G)-;I);ObY@Pq7;uGm%yU+g<7Y)lQ
zF^={YhyTqvv7k`<gI_f#zO36q8b9=;vXUB<3K6;|C^#70f71h)Y)&h!bhVJ~d~yd~
zInfyNkMrqt+Q!->!U-YPH*q8-^>fEpgH%;Yc+k#$I#z`CoKNy-z(xz^a^PH1`*fXZ
z5DJS9-zN=t)<e7(HZ^sOJkJAl$Q(q=m;HIeA;7F2m(2z#Fr{e#PaK%4cv0|Wl3ou_
z%3B7EUP%SQI+d_A{_pF=dXgdHG;v<LSiwl7cX!~ddhr?8$p<f(<gqKqZs04^<4cJ6
z_(YE&3l4jGMi7u25bNO!TV5-mVRqhZ*b%T&KV{*(2I~rI(0$+H#I{tqe7*or<l_m>
zj`2o7a*s~2i>o_R!irFEQ&Z8fcl#qNt#)ga^it4(n#g#X2Q|L{&!5|O7X_VxLhe;=
zPOP&A#KLi5SiCQvU&UvuZ@7az1b*gY6Ex_%(4_#W^R4&?bB^)4^{&;`?WE7aFbeXR
zMo9^Dzr(i^Hl3`L0>gCFLrnAD=V~$jFg#>z>+`y?v7f>5>EU9(>`&m>KAVm0vYgDf
z>A${#d+i=7JJBSG|N4RALct=#rhu!UF`)y<k1<vPT)gUB;eRI%I%EDT=HcA}>&o4>
z=$!cHmfcQ|p7X<Jg}(<Kp|ZcPwxM9`4s#($?M=;H>knQ%S(9Fu^l9f_&m)3TCVyJE
zjo*77;|@nS#*VEN7xIr^jJ@O2OQXBO8lnc)k~2%5v99f6`8cOz9tPgh^P{2?W2q0~
z;#RDu%`3;&ONJdynb1`0$GdT{Nh>_G^ShQdbY`6Z$T6OD7YFu3R8>j)8e8hEF%kL+
zIVRYjbEhf<1CS3Bws<*k1*R(z7YzrB9ceQe`sZ{GahTf~?-9k3&<M#iIRig?lOE_a
zTbEN5mYi-z)RO2~nb!qR$do10;lH)FGx~?pS@uWAI??`%^-~qVFZk+1@z|>FhnY9j
zTwBE=9&GOJH|Sh<a2PeC-n`lB>1X_o%Zj;LavZvXgMvfZ&e)G<QpkNX)jNwnc$=AC
z9&rW!acv`hHm9D{cqhxXTQBN<DUJ471%o{0B==Pq0h<h%Tcx-pYJKR3clv-4PD|_f
z_cS?%N1T81K5#-1g)Qfz=Ht^lCdp0C&dGtB!a4r<*PAY_@llkliH6tw@BaM1JsEI-
z*6;`V3z<0{aw|n3<+lIr(O44xt2<OZ)BdlhcNw^$$d3i;JM+M1KB67mo1L-tv`quR
zQ7XiJJ4u3S2Yb*`G9EbSd6&mg5+LY;K8MXq)pXg=Ap*)R?IlWM=&|Cq<d9dJM}&Xb
z;(;1UX8u#G=_Lwg8F4L*&qt(t>R}0odScQHo`If<NmXNoRdgP2vV=;%L`;+hK{sx|
zM5K`<tg=!Xl*$hi+Nyh(t*EPTKoH*qJ82B><j5sXyzUSFQij3H1Myk3<w0)X3tR!x
zFWo`CzrJ(%+Q#rzbe{W#Qwy0pS!zXF_Bz2cPL<u2eH|UzB2G#LL_9Q;f)k%%o144?
zW+hSVdN?O6Vy7HeVIZL<x$yw~W2P|+k17A-4`9ARN{d>r6RjF_p2-p2SkPDEpNrYY
z;4?=oF^1pYrZ~nK-MH8{tNOOnXOALCC9T0?^FFgMrzwkQOo>NiBgaz{`uHhprF_Ky
zxP^L3nrYK95rU#TxeX~7B0S~z5HNQyKn9aucb<UUCbwS=ItWMqd_E<gY~V`x#?OGj
z5zLdLBOVs6*|&HOGe|Pi!@wB7X!9e?NBwOzXGKce`IA(G-{R=e2uYmlo&E&J@71h?
zh=nKoG}Rh3uOKBA9q0LK&B)Vf{UB*sfOWvIY>g?^MSFUuCVDx};M<b)r8FY`-FmS3
z<9c=i+CCv`@!Z;m5K<GF<GDuyR>uGBPrbK7b|5b<wmQ9mb-Q;8xyo1vdUo#P{vq|t
zvOC1z06`JacJd;((bsUes+AhxMv4q82^j_ULjA8brb}`weIjxJ6~Rf1#}m8f0@|sy
z<P;EgkG(hiHC|9!IL3G#=0awmnUJT8Ha$Sna#MS<YZR8JQOkxqJ<X=7X2VHCMbCP<
z^?QlY<z6I-f|GY%@I2eq!E8Y5g?<kC<)f5OIqlrzp4xJ3dYb((>08xLK5g#|>X$7A
z)q|8*t+#9Qvcb-0*SsL~M-o2;#b|<oBB{mDxh|hsFMHSzViUM$pJlsC2L%H=hT(d2
zzuxMCYt_F&UATh;RenscR|Mooq2X4ZBqd^iYinMa58Jsq^rtk)uQEAIMc*8t*M#%w
z;eq9r;6<WLJ}08|4<A)KpBXRWJS4ex1r`<-CcjU+Wj6&mc~Yq(B{U4o9WWr8(DDnu
zkZf|j(aRDC!V}EOYp|wFgA*?PIw~>UZSb%9H8`ET<P31meEa?OlUU(V=Hx4?`Xo=>
zG#|mL8QGS^amio8n&xi&a)s%;;Vdb>=1E;ctuUh+8x`%4P(b3LdN5J_uwr&?IQD%B
zXL?$`yoP#^C7ED^#lSEAYG+F9W_qvYnZp<9NAStqP46e>;0-2&nfuv1n%kjJS!3Z3
zaPZKvnLkKvCoxbuIz02`9^n|jA6;EtNo%}psx|Kg-m>1_AwBQ+y!R|+);GX5HU|<a
zZ{X5h2N5nNXIVzjme|}>d(d<xWxOxq^y=Hxu-}#8q6tFtioZ7Q@@jqiD+zKcaxc%y
zs;j|Rl}IjbjRq>rkp>nzL4ACE#*!026jXAgY0jNao<NbL6j3C-H`goZx+~R$QggBr
zLnsKkU><r5M6LmYv;BV(bsv!9#=LdKy(%BeDx2Z7a&8}=iFg4K8#}(<9J|XnwFAD%
zd4mrs1mSH}CRM&gyUl(}>xMU{wBzqD0^vPR#Hfd+1^LCYj+3vueV+7%oPYZW+kbN=
zhIO$#Uv5X<_Q4}Nd@nH42N0n9#NaseY7_!!msK^8vVWKsmq-(2ov6GN7yl<<K;W!#
z88lzb8Pn+twp{Ix?9js+yot-xCeo=URd$m45j2XbqwE8;oeZN8(HTlgOABjiV&ePU
z3f-YjzN(wtJla<1+u(tgp+hXb3r=(%l8HXdPpPA=C8K#;nLB9Msww@wmap-%(Z$h!
z3t=bu)jzi+S6Cy9?uV_sva$#*H+vhlEL`YccMkEXj2(?{&t6_ZQq?L?e>mrfBkbF?
zD{49xmMXB@Xw=rn#foh-y*&139K!AgIBYze%em09=C6gft({(mK|s1L%^B-^aay%|
z8W96S-tmj*gLPlvY1x0h@Wx1Se9R2lAGM!fH=}6nZmVX^<~HcKfNo3N?CiA%yfGM8
z|GR|2$*#6^8g|=FXaWa?!(u!^OIZ)8g(3-$2Hc4YcL0EF!p0^9|MvC~nL7@wBmuJx
zhNSj4s_dX#E-OB~=*nDfx0X%F`GzEaJqiir%Sf0lAuTbs{2^arFHPxal#Fy@W-h(&
zP^#hkYUC-1gTp{w5sIWG_Q$hBzsSMOkO~29pMimYRPG$nA0H3x4ZPSZvv^H0v0+vJ
zzQL{7E`0mIPMo~~#o!8rok))!-8g>Vk9<Y}14n(GB0w>#nkeJ^?l?Ce5j@Hbb|Bfs
zGl}ZDAswq8|D0<D71hY%`tb5JJf07a^6y&5;uh~40~$u#Q)pRVGk9_VUXWV&OQ#}0
zw$^|11nVInVib2zx!%|PKq`MM5G&G`{ERP)(~vrBG#Iv5Syh|l(DnPKSPuLw()Hhp
zLraQR_QUeKmNO(gd@_6bh7;I@2?tbE?ag!3EdMDCXOV%Wq-kb6tnAR;EL)l*GBHeX
z^rZJf4z{x{yTh-$OH>)RhcG{*;`;huMFSOe(!$416))orLJyl^!QNeuWo5J31HGFu
zB&xh*-Xi5ZruxU^xsQEn%*t!46D^<jSHSr562~&NZ4j~dVGI2%ec0V4L~MDsrNr2N
z`9CQb9L!(XqwO~2bRs%w#Y^w6p(Da+D`~-b^E9Fg-!Q8rD`{D1RZPzru|gz;PMfbQ
z0fo3}R@mF^_?H;>W`AHo9d>0^)!q9=U2qB{@K2y4MIhkEdj;3+v>?YJ^}vSz=p?IX
zfqnn@{Let)sLUj&%f6@JL<9uAr#1r7!^6hB-YZ5kaKJgFp-bbW>puVQzZd5Jv+4>&
zfefE??}gzwp5%D!H_h;)@S{y~d;!}#1}J)7^ySR=2x>C)GvWeS5J5{HdJawh8P)ft
za?R8}zu4kEF4c0or<!1+ugy+&u>P}_KdkBynEUmUC#iLpO6qQGf(kKHnd^eQPZxqJ
zu78r_KPDt1@$HgU0}byN;Uo=N`Ekpn_!z$d2EvF#k}p{`St-r{U_jJlBQ8f$N=`z_
z3F`6^Z};Fp#%CV$v5+O)&-a6vGruUisfx+!$Lv6?^ytYjnb;er<aXHeRkX<Fwyz|K
z)>_x+kHzIi+(I_q?k=HeWW)`wv}uga0vJFG+~W&NPGFULi{c_vmpMOyR6I%$R=gP*
zxGOro!nS{ef~9G|z4tK@PW6@Gk9|j{dX^EZudK9`fS60&y^3<)QN=)Vso%WU7zDll
zi7NS5c4ShJ*1#s_>^7^RnMG_g;pnv4^-tq<M%MlD<P&T}6&wu^Oe%{ceVejBU8y7R
zdO3@YNDy2zVS=@8Zr;Fc_1obGZlu_A<AGhsV!#p&TzPqUPS;b!F_51lad^@Hk}k!E
z#d&)z2or9U7E}<Pafdgt-3UEz$5}z(&(9UdCePZ#LN!9bZ?qW)B4d4)68`>L!on8!
z6}F*7QOeo#!`)$Yl7-?R+zk>588u+>QC3P`2H6Q@T*Xu^mscVLMQ))qzvgHu)r|Cp
zAm%cLHRTZ0V@Ci=Bpg;;Qxb7JYAumoj0<;*Rm;1e>gV&e9nS5Dg#a;eDGMNHgTaP4
z9`A3yA}IxV{>3oK?E%IO5p#K<{66&^m$Zd5)YoDY9}*5)Ad<;7#afGGu`)i}GxX#t
z1<~!?2@I2`;tqs^-+k*--fe^-DLFaNDkm^ngd(1d(G~XCQ0(H=4}Q`=_=ey0HclL(
z@{tswuhQ>WoObvrnR~0qiw`)4>tZ}YqSkprMij^Y@$q~OUbT*t(Pqjg{DX&>Eg0-4
z)uL+30L>5rc!kp#9j$n~z`<ma`ug*Ww$J_G&Z+FZ!N<YAEGG<nv>-CTxa;!RDdT1P
z!Zr7rh;b=C2X8#)=`#9^&zp#u7PD>V1&p|;Fj4SHwWz#Zn#Vt<b5|#Or7mmSrHExb
z{XP%6wpgIQ-=}U+U!2Pm;1&Rs;6BG;-iQ#^MGctI)xYkGx}2J7#mLb{nR8p?t{v%T
zM3II+f4ebE-)yMOmlM>%_q6XO(KOtawPdi`qxNWa;1{sEtHhXa&}F&&XgZ<qb4y1c
z-$LGkDHzbxspE}*XhT6l3Iy8mA^(L1W+i>d$DQ|R)T{f(5=l0oYyX@zD=i!!QZN*7
zuNs<Thu=EN0b&pY|0VN?u(5<>KQ9WdFfD0XF>7f5?(Lq(0{e~hQGe#>0gy?+g`;?t
zRp3v`9d{LR=MhdKei#iNmQ(rTS5ytzu;dN-8)O96@_7|f^1wN<N>%Qj?|};tI5>sM
zq<Jc;%SyWxXJ{(vTgw{9(r<aq690zq?GQE8@S*k+1?N!co7LR)a>7IRxea44aK8?F
zzb9TZtYUsUKfk6DULXY*iHZrOq@ha`NF5Pi1nb$h&$xR9TTC=4u)yyPPl1GLq!uPC
zws8ZeV_zB`o4gk^w`Y<{+sHtdY<bNjOV<$#D51C%+oAV0E4*6gf^Zu8X^C46m7AQ*
zLZzZUU+5E1XorY`7nh#ffnWtW(%0=xSx*73*22E%TxsYMIA;u7d3o9FxyeilVS^Ho
zOPbKjV2|J|dr^wUJy*K6G^~|EejzC+z`+xZ%KvZ}FT~a9A?WIfxb1I-{rjA5xXhvV
zKMsivb2K`&HM?%+T&{#CDx~RhBJlt)v;w|y2QxG%)<hdaM3W%UwmKrqgFtgAtxLbp
za}s5I-1ytoT1Hh=ofxs{gQfm>RK!iO$dpXHYDX{52Sz5038`0o7YW;gUE!%bOP{yz
zD$1J5;S(2qqW!_R3BFG7t0nQg)Kt&u<6y)_{UD%e>MX8p#}DVG`z1H>t#oDsu1K|a
zfyuE8Q;~HRSi>r)9^5xzV`gS1Ou7xs|6wv2hXgG5wjB&RUc61EEia?A5~&-`y{k#s
zbcc}JU@@WN;{C#8-ZkrGj&)AK6|4;>X^g5u#2hIFC!7EVov%iIivU~Nh4)mlBwWP{
zhTeF*$5YccASQ&0h&|)KJ{lby$6MO|v+s{Mvkd<-e~irOCJ`PO*fmt3zp~OZFG94v
zBw=9@F}zoh^d!x$u4KILC@9xz#w`jr5OM(c+DEaq*ry}HdG7w_5Jcr4po>V*hL`vG
z7|Hv1iXFYx`O+5#D^O3!vhdTiUul2rSK_S8=kECu6kibcPdE*6;h7nMFGRb19C$8L
z(63vN|LXMKG9%k7TpVmmJhnRBM{?W0sG;;~5HWFKEhr?cX#8bN-Jsq8T&9-&qOARM
z!+42Ed#jzkWL|nM9P@v*MREK+*2dVrzp>YKWWxnzS3u^F3Y<&S_c{Rt5%-35`g{$(
z8}6~KCGyIwW+MJ<jE|Zi_r}&D&_ZY1H8juHu{Ng~>$i|#;De#-eQp(Gx@Hz;NldY}
zZwEo+)`-Fp<99&x7bPv#=!Iw}PZDwYFOy>D_ZcW7!8s{fTxOePTA+U%v!|y=5nApr
z6cGrfEeI9|j+$H)svWsnKu3BYNUlL9(L^&M%S?uq_%^=~x|vwPuZDWSgE^2zCGmH9
zI*zEIZ5|ht9C^ys1fS*wdnLr4Dl!!f2gQ(k65AIdyJ~oYdra-sek!YB4xSi38F4Za
ztkh1sc1eklV|w-V_wc2i{3<aR8j-D}7h~C+>|-8o7v`jOi6q)^Jt~9lfkUP8`U^G0
zd<6e?mw6^70))6*pouRR{N;`XHDxwD3GjX^WLih1>v(6z84gx3-Fa&K7zsBF6CaBN
zF6_UbXMRY<UrY7d510v#=?f@4ShHLQ&LuRi5I8NS-;+R8>tTJ|8v~GiI07_<nqIU1
z0kHsscohHN>_crFAS;?|Sd9jRr;ttr(dtSq7xfPq;sX0@2sKJiWSc{~=KTK+jsM1<
z-Mpdy7D9P3nh1}8H4#Uj*)wd+EG$UK$iyR*84A@nKfWlu#TYLBkEU~QtMm=mcD8N1
zCfjzcY`e*}Z8tR;lbbx*wr$(?w|?K=`yc2yTJNgodGG7G&r^N?B+s1o_c4$rm`;^!
z3HAD<^)C_f_#I6sWIhvqAvdapdws2Vise^;5HdQEPu=Pf;D5K2FqV75)LxM;H$y?O
zt;1pPE&cBs!aU6`ev~mX4F!7<?_Wg$*cIn4?y~{dJMp>>!R-y7Kye60r-6j|$HQl{
z=lLV{?ekQz#V+Uf94cTkBOL!Parl>?_Xv-pOFZiD>Gd_;INkD_)HI?5P;ls`3{uMG
zfihuf8R?zu*9n_n{xN(+-W7xV!}zx!SuQMxNqn?EVgalSVRATUweE+`9rsUJS|9h<
zlUOM!Sz()e+N}Ac{DOx(v4k#sZ4wc)<LQXxTn97P@z~(}hW9Ib4Q)IwM@B%SuXFk^
zTp@wh-$X>ua#!BGOHY>SV?JPw>FAonW+`$PO_1rhNA~Q)kA*mDp62b;c1Zobc{8x>
z4DR5LRbqGk`Iuy8IV5%GJd5aEnK(5?`Ta8Mt1tPmlG0CFiG&u}V&wOfpZNDKI!>gR
z8T;4WI+3_q8I}C73;A#}5yH(G4$W8y3|=J1wqGDT)B{vhFb6EFh4fVLa!;BNQ<7)a
z8(ph&c3cR(ZM5piD(v_Bi`{ITQ9pt0j&M$jvq@4vId{L*b_CBUZ3g!tX7V3+F;SEH
zM%ok%+@e14+fV8m<K_N+mRg_U#(wtY<{64>#bT6<jL@L|tAS8H2lPXcYTs%Wd1&qy
zPvgD;DT$!ku_4q08DtJg&#7EO2`?05?EP8jE7ZeYUgsGjg%5S4Y@n!^oXFb*j~2xM
z)(0Elo%O@cl)RFGdbFUiMfC4l!Yw|pN{G3TFL}*R`lbezq0E$aCg)`IQ$MDT=cAZH
z{*ez5o4y2%3aGI0BY`oyePT&g+^USXH)=BmQj7>RRSFRu6}ZQC{H_cR^aKG%E^i6w
ztT%(Vxc43<db=Hj4@F3~=|g9u?971YjgPqxdEd`fHVm7PU<QS&6cO>zxBZ<Uw292`
zP8wuZqOw7(&&it(zHp-<IfrDhUEu>=9vJ(|kx~h311R2Mag+7>*A?7nh;W1x`_*MV
zQUL-?a2;aZC~(2_AQee$?tM9?PKdh`dALFY#Ks$CQX+w%%h{Cd4~*!R?SFn*TAt<(
zyuf9E-?tM=rq_rBI3h<OZwJd4wsb)jFe-&6@Ov!!-aipF!Ni85hQ@{zw}=HN@RnuA
zGpI=w27$_h1_`gk>dOl%06v3%F{I60dOV5UsaP?48Eivk2F=-dN53@<U1ebx<kRJ5
zT-lVqlT`qLWNZN1d3PSXp+_lI^v|E<9Z$y&5?-}(2?o+aweWu$(QZrz;f$*uur|uU
zkx)d`GzzVGTw3|N=2Fm=wB@j@t<?FllVrg<<4-ml=yQGc3=qz?p*4{OrHq&v#*KWB
zaMSK|<oGw`l$OH@^pJ@f77rmkz4xjM`B$o4F#h8no4d#oEi+zinf(~iWY{k*u})#L
z$tdbduiB>|&0zo6o&DSj@{b&{O-E-z2VsL!4O4a195Taq8~7te`tI7LN%A^z>Kwac
zB9M7sTS!Ss%Tc-M#ib<3zEG?Q&}wB_<!W6lyR=l^p87RsQy`W~1-T`?x3u(%KJ2^}
zoa_6@A}-fGGFW+%_8{otD|)z10Adoatq-MJ$=)_~B`2j@G=p82=K=kX&2@K1T&WgB
zq6XGY58%@rQ?cjqTagJu;<^44#YHgE(w-2~KB^3SH!DVit2ylHJ`ZPMlzE+Dnxk#=
z_kef@<zBVLecKi~lXyr=tRFg|z^I)pF;Yu|!p!1FH!-hkS*%0alWkATmLw2F01h6l
zXj0&5ewvG^oI!KI4AfKIR*Vm{`QtdVdIv5oxPy)V^qG*ZAtBAn3Gk;?qL0CYsPnoX
z>8%dIrk&;x1NN&5PmuGo8P1%zvumN5I&UI2B3>6$ASL3qOnRmG$O-OSGfrv#c{h68
z>nIaFAY3CfSJ)Ept6AwVg^2Ylsip?0)$dpn1&j6>+m%WF)F~-epsWmLBm|q`m?Jio
z)Qh^Qes?t9o|0Ov#j&Q+u~8i@j<YNU+2D*$#i3=MOp!bHv9(2rzOPS8GnAKgBHasW
z>8Qdv#nl!SWAW0_ke2`M<9|3?1g}x>!AVNm#SuzI4wxuMZ{wO1xEJ!)1-82$Pr`HB
zpV0{7EE-*$sejMHM>XO)Fos5ik<s!<j8!u-^%~p-Z!~xi-+i^9!3VrRCdBQxW&K)(
ziLPt?;8fuJ^4Ge%#MZhyvuR{{rr5`ArvQIs@H%!cxn8Ni&P3XCXy@i4+z+=N3+Z^>
z5(BO<ShAXiSO4^GT~onV`2pX2E38Jrl9{nY?u&hxyh!qPE{27*?Ptu|hLTI%vJW*j
zFZ=m}^bBCv6Zp2p*mgn&<otjGchWHAM1WHn3<>Hd`IjDW<dKY@;M@XH|0N?9I7+^x
zB|gB}4Nr<OB-RBoA|j>;kea!?m+dl@)FkbfU_tVr`(J{h(-RmH(lD^Vs@>D;Y2Fqi
zW?e88GAoVmvep~BGMmi#zOGY&x4)YTf4eTL9wbTQrk7fWMAdUNm}S7ZfwF3f5XV;W
zJnZl0NLGZ05x>ADlvE*}Z$n2n8zucx<#$^~QL{=ylqJrt)>BBLe)+cc6C?d6f4R5m
z`VX{!{UN`Z=%edd_IGU{3&q?>(dII8kACVTxv2tI4hh7!MuuZMU^~5Cffz0S8&WZt
zzkeA`76z2GMX>-el-)xB+laAK5@1+Vh_myFd2h5r_EuSwEYdos!k|?vJcYiJfpl-o
z*m{7rmolGQYdKwX;RBeJJX`$#oz=$PK<gjW`@jB^PA{}~bm&bPYXv1vo2|^p?-Ay4
zBF@uS0OvBmIFJnkJUZQsvKJVk7+<W^6*7-(Rr7QJjpd%_)y<*H(=HuT4ZLE|!CO@+
z(V&l)wkx$F{5o}szCdEo$K%N?xam-A(w%x+iViN}OLs8nBr4cRb^~^FG<y-=Rj$E`
z%v}l5-`}W>M|2i8rMHj34Xn7kWRrq|&XJkpr)u5Z!(C8d7qbM=24CY}j}ugo<mggQ
zN&b*lM(V|R3n%>n=A(kvT-xBl*^!l2ON@Tqg(&n_E26c*5LLv9vSz8pSEA;)m^u+V
zhefN_wv!@?;t!HwO-+GYFlNO{B#?%DcyHrF7b1Xrt1T2m4ZPAO{IXC?>ZWCy>O)5c
zknBG{U6LgHX-U(mUc`0NOzy3svP2=Uk=w$yLAnxi{;mwwEL$sGsflMCK>pJ+)*coX
zM%~zT+k7t5@#}K^UzBYiot!=<<9Lko?NjBn$(fuBMYK6UJGL-6mei$N9aRw*Yh0I`
zuRW3>E~Jw%x*_HE4SxQ>VK<?BH{DpQysHhZpznILrQ-GFY2D%1eFreyAJ}qTF~Xjg
zxBwQL=7FE9GBjZc@F`(}e{9|mg(6;c0nw#%@?FPlu1I63L0^8byozJfsC{mjqaeKN
zxHoSxZ0l;0IJl2h)pQL?L}rJaCFCESdLnIFI6`k&ExcAxMiNx9Z*5IRrq>9|YY4T)
zJ3u(D5eV(M(~jFb*~~6UIeGMk3G8Uzk1tm&iS>fWAF+7If?^?`5}?<u9)iNtWhBW`
z<Pz-3nyTkr!Il!&so7_d%0&`E%%n9$SBma5<rET5Di0AkF%*W~#xXP~tO)3bvpD&v
zwZGcoX`5$XIxT4UvvHu)>ub+mIGEYNG#|nJSG{3^{I5nvW=})|3;`4~ttS&wLnM(?
zw%WN<OX*0?aUzGvF|i_s-p!Xrv>SwWN`1c_F%|@K?#uHLIu47e_gh!tL4KheBnB75
z^@0*Q)>2?Q`0--SigfAZL_t|^h^N2LJ6c32n_go=_Bn@uzvfUJ%Yjv4aZV|_HY4LV
zU!XvWhWEOmX(0+Fuf1qo(WX63tq6~rb{sqPOk0oMzN8JHlbaMK(GXFO?q*~$oo*83
zcXT>V&h&zX#P?d;&!+0c^@KrHm9pTiHer_tx$@=u9m|O)|C)d(iZ$tM1Y2pf%%efU
zi_utpw800$Zrql7J)bw9rAu!7XETk7=C3x}d)XJ_xVBcHr0oDEv_Q3^?`68m53{P*
zx2tRqNJfX~mzfYu7|ZEg#D6%&oS>H)wMb<W2rq6AX)R-TbDkx9e=0Np!IT6l$nyva
zK|;<=pn@&;OdIaoW}!fK)Q7zW(Lp2ortT^^!-`ZYbkTcm!n%|mypRJxEm87w+a{pj
zLrznf*GKteY=jY|Fgy*q-IW>;T8X{4&s5Vp|Gcd@BQF;rfA&#_VMb~C!NE{_nNXii
z0hBq~Y!HhK3r`YWgR1zRZ#?T|ueZ~m?x~yJuQAmz3FcDVf9_i6B@{X<cp*wvBx(x>
z3t|{#-orBDtYl$9>8|FFjPHLK8xsu8*9iH>F{NLV_68HJG}$!Ek02xu2N*fhu+FJi
zq0VB!cqa;bbHEM|V>~yaXf|b*%bc8S!@lyY7W1#va&zeZsLqO&6R7p<rGD{U<-Frx
ziA#lkhKqmoxw}OsJDhZ-z&JL3DP!SIz@XNTd`-+s3x{;*j0BHB6E9$7qgBSDv5>vk
zK#j1^A!oiUsKfF75>`gp8N7Reh-{4Zetp@GpEcdtE=PZ~Bm8Ig0$%yGK|vHqN5^pv
z#YiD<XkZX@{_R3<(k~in-Dm$RgsdIbpF{8G7!b*l>FLeyBUE^+?G0>7d4V2qdXPbe
zRz0W<p#NpU;YH9ia0cZ~#P0ijCVR2<4>oVYkmhxzK}pmk`2n2`i1^r0$c;9+**k!3
zdFd0u@wR8ejZnapr+nAG?dLWR9s=UAfS}h#0*&^zHZm?Q&9&)VQ)nat7?0<pPSzYu
z={fvz)BGG@a~~gCgL}6p`sO442UOjSG?R++(WAH~5ynGyD)Ii@8mn!e5cC!Fmkr~M
zPf3<mp2PK%!iy6<iiG$V>1w1k&&7qf7|L#AK_fQZCIXgb-$U6Z2CDv!Xl{D<>xC)k
z&h{uWEpDq>>yLD+QgSnK(p-!OJPeE`cdN0Gw87SluiAeG?qy6Oea0F@3rpjXBhnO9
z6fhGq06_^X`(SJ3>i*tNzS}A2ys>wvagik&YI=@8SF?BiAF9))pL?x0&er_}kh`JF
zb7XhP&^Ed}`E@Ri;yR*a>_1b=#6@MOsyFG%ICNk@M8pW)uK*IZW#Ck?ZAjRNW8%LY
zv2sl;GKb7|Z7lW#`FUM93B(G^35)rq8!6_QpQea}C0J;;(u^iL(OJq2nOe{{l@%IA
z?5B(wKCj?E>K;kJz(Nu;lNc9w0IWZ#4X?Tl?(m1=@ED1rTN4(aE6&zm#!}-N^g*{w
z4n^uW%rtc&@&ZwSYut&0<tEA#3``zrwk1x~Q1tOeU(gQ5m`Qa4Z63Y$Yp!ep6Ay8P
zl<?NDU7uICC(8}^1gA=;%q&c~ez)o>L=2K*c|Q>fE}dk=Ra;H>PVk++dN3a1VNtaZ
zRFSFUL5ZM$etSP}dc=Sk^Lo{rh2V5do5RQ064E4haim=h$Sslr>sR+IMqNWwIeeNB
z@9l2ql3QBOg+S}xp4-<jaX=%tE&p1F?~$p3LqUAdKhyjUc{WjFfG^4qoEpi(fuZ=;
zP&}ERg{m*DkZ+oEXbFFR6ePcd5?n;u?}JBD^>zry+kR|Ngm}*$h0=+|X!@XW?kWxY
zG9Rg-<^H6T-64|cD1l&AOwWqQQ0m6ImxI`kJ_+6H^R<0B@+b@fS5g^?4#hiec$^r<
zs<fI1mg)MKTuBzHeLOBU#UuxT+iEc|@RBCZbQXRcAf{4C)Oag(%Ah(zYU;}~oC7P*
z)emk(6K_Sp9bGK&4r-I!Qs5}u6T{L}5$FQ|=C&Cfmd4yAhs{aMy3~7?=MNv&>x<rl
zzz*^qj*`tQ&~+6)7=t~Y8-WSE>Irv`#|VTqS%-8T^BlIT)a3tn!L&q$TF9R0YqO0s
z0j^Y^2t(;;N#`Esu7F(sM@{o#O?zSxP1sTczFvfamc)5>YiMiJ=0f4(;QJYSiE5CU
zG4WNU7GBRP!c1N!XTC>+8!mp<f!SNfAAB7uDI0_r7gMw*#5yI?=OH#@s0obGk0mJ{
zPjMU&j!5#wO6i-k9Cdw%(;(NQZ3wbb=$`E%X<AaV;%LMdqD}V4^4L;iBR^2>er#j;
zM@F1feZ{OY^<^S8wG!O7(f5DbQaoLq7uCAr&$Md-c>5LpG`xtV8ibskUV<ZgXijEe
z->TYFR3@g&9v=_w?48BO=kWGTu7Wc0e=?6r=iWb_rWn!t3L0}&6c2maP4F$!sp)CN
zXD^r~VY^-KB%n$9{88>omdm%zPIjROeZQ+$QO$EqUIN=6App?*cy>UbWpK9I$U9qS
zByA0ixFU$34p@u467WXL<3NtkLR!GdhSemrVyrD;t)L%Ia%%xictTQ)jK2(is~6w!
z-aMpv-A-sZUNY{>RKHYqe6V>3QXf|NrImlhUDe;TBhy~rZKZ>c^8w>KfEhA=fY7BX
zIAJvKf`kozmbKdAMDG9jsL5i`=W7RytX!3GZX0;w7{OiZhXX+|n+{s27zmIkN(Z?e
z7;n6_C8DpaM`fImes&?<{a&sF7_vk<&cA%`oykpMqa0cP4k_OX3x|lF+rDoQ!afwy
zcq1=pv3SoNFQiO9xJkZ+j_QF7k09gX5LptXcjh)%ubi9~V_G^BE|-uoOf&a47lR?-
z4U;q;67w)R;xp`tm?Dx(o<HzwO>%#+8CTrkdJ;OQQ!GlOs1GC7rH@;JzqvG$?_CJ@
zn#sM)(L+IF!B}Ynb4RkB5YAz<dAXLIO5tYL-&XgRdda&6ubK`GA;(>*Hc1Fk;~Zsl
zE-RmXz<M$0m6n@5peYK`N9o>PnbvSGs~Oob!*T8vZe<NyXjvM9QOye#ck2x)VjRAx
z@hAVp3!o?^Os7y^WY3_nUF(AOK#enz<JK^(pv*`vSS0>o`BSB^xSsk@7>Qr)^RpvS
zd@SJ^Kp4mD+|kpkx2s~H^})SU7{dfE9i(()5nK6pQH{i7_!8S8@rnHlM=*gyppg*#
zrvWkNg^n_byqp|*TNG)n?*gW#9;tH#o&Gv0SDp&~<>c@uxkF};Wzh3uK=m)E`hRAS
z+NvAf0o}|q58#RD=TKh@36J=$_k~eOqB>q2dR8I2iueGepDr3&`Cjd)Egdk4HcK@}
zKQ$0+E9I1W&yf|fD992VRfyyZ6)vk1x(DpI5Yf$lfJzFfKW`^Q1^n$>)Z75k0FL<X
z#er`F^1x~Wv8Y)-W(mI|w4@#%Mja{PA73mGu9>Pnb0%t!+N$@BrUv}IC*t%;$^e`$
zP?6t!26xFVo~I0Yt_A^h^8HSSe;kZHe;Yb&P8N;g=R?E#fDdAFBy&*<MCp}>n{Ij#
zn_MppJKEP+W%{lQMp>g*{v>94lMk#rUv9S80MyteWl6@sfF86t8Zil;78Ag<+h=?a
zy5LBQo*NJqJ4(cOYFN<uzqo_8`sF}EJAdmKB*wRSkF!EZ?-R=wW}xttL$mnzndzL8
zJJHzJq)u*Udz1<*6G8Br4z^9p7}p~cjIPDQJ*P;eN*MZu-zLaQ2utJCXR?sM6?4%1
zos(RMxbN!g*_uu^3Q(nr44z+0drubYzOU)AJl0p-AB6jNz~wb{4*;GuMu9?maa+z{
zU|<8LJB0gJ{gDOOL74Gj!en}DIJ;#@UB08uT8avnOV#kO$yaP~@W9;Gq_0>hDoLyD
zj!lodmUu(o8U#n|2a6Gr&j)PBYoDv{$0IA+2~|yIaZf&~iBzI`l{U2RRrPcErpt&<
zu;fisnv&{awv1*|FAlpEO0Msn4C+o?WMra*4Nyt1)#c0cb)WZ*(@kF8Jze~CZa2$v
z127V15k;5Iw3#cGF)`-l<69q4GL_ROSc_r)pk8z3O`qL6v&mjdJ?>db<@V|{s;8wt
zB(V_u49qWxPJNjOxx>N{Axibk`k`T~7JNh}!aP1YULO;IeKG1ijfxNLsiU6aOsgub
z6N&IdDTee~Rz}uq7~UJ8b}gjA*uU3ZIos*Ob+OvN^}=q>_Y{~dEQuf)7l6Q)=M9lm
z5G3ls(n#*s)Dp1w>1n-&{_^p@7)c@t=5x8<VJ&leB1;s#?_VT#+w{CAq}e>FLNL!j
zP*rWaBNM7kR^7>!(2D#VOBiJp>;MQpQ%}Q`CK(TR5z3AWlhe?tniW-5$L`-*NXs8E
zzOBd1V0B{eMXxQ%)7Rx1^J|Ggd{R#06nD|$YwMd%>cB%I-WkRW*r7A&Tj3n@+zx$b
ze%@SWu|69=5Md;UijoN)PW}*uSOd@c#VD%SD<`h{HtHiPQ5jT3Z?(S>WtG)&LBP6%
zBJ&^#CNG7}IYm)+rdW;?<H!qcszdFy&B@RHsQ@8`?gtzP=>!mp1kR#Bw&_I*9Z&ZL
zZf%a77gOy_=J<VsKbw9HyWAYG4Uoh}iaVPG&*+h4FRr;!ols_U-}pS_elf=ZN_H?M
z1}V>X#hH6t(WZBMdwXAexA<dm`7}CE>M@m(4E-K4OBAxG-XXVmnkGbflXOnJfM>ln
z&JIsrcQvq9O9)){t${HFP8~f|qF2RaS%`gaK!Lltl5tB|3c2);z>Fq#K$s87u4K>?
zbFVgw!QRE__cXs12H4JNIqi(K6JlCzoyJFTxW~oqZ?Uvl6^?-T>RH@Tvw`T4AA~x!
zRRC}b?_p#-ZW(eRNuxN!N{FGo#eG<Pb^VTxPv*qmZ7i*^o}y-P^~pH-6q2U3vsGEw
zE0__z$IJ?A&deHF417aDu5T!qhqA7JqtI-5_UndFz*1)`H~IcaU$y-d{2)_P(W9Bo
zkCK6HIgUDZ`fgDMGSRwfB!9W!<q9?NEW<UK1qsmm33W@_ArgYnhK}I>*GI~X0yT$C
z59<{AdND27Pf1CUU{0H^K}sYgd1Cznt|#}z^P}867tRw}9%;?!0uj2~eSvH57#J8v
zXA9*jh#FQ;4-cvD5k%h7N5q4CU(ILbKyK83LnGh?DILe?cVd|P>d93qt*Sg+Xw|_$
z(CP5k=X(q_MNW9*K+adO>5dh!mOOE7<39|HiDQ8G&=k}=XO_RrS65CrtY(pcGtU-M
z{Rc9!Tz9bxUaf6JfT$mNS=JlE@tQ%yl0Y8rq1SIQxSUMq7uTt*m78ZOXEl`IzCtoy
zA4IB<`%xO&x!7unlv24PrxJ7a5lW3D<vPNH$3y{A#;+61*iJX@a75ghNFm`c+_-@$
zpKG@w;N!noX_b3%*Tc5qqZXgh=BM`o7BXf0763r111=N2=+G|zU4^D(G$;d(1F!|;
zZM4Leu+v7*G)M{Vqm*fOAwQ<flW;iJVq^4liw-?Rd(DyIQ1#M*g`m@5yTtkX4#WrP
z;JW^ggOXpr)Y*BWcuP(BzPF3EP9|da8oUd)EYzK}0#9z%M<8&=_jD6|-Gezoy|TMH
zBxZ*-H`cKfH*S$dKHU%42Bii7GRw$^(Ql!jdKalt1lqXwwvv`fDLnE2a(5@th!W-9
zhlc+?_n0&l9>uCJ72&Msvz#LMPX~m%4YWnaE>>!eujb;BPm0ZMp8-=yqj=CSgO_y^
z+_V3v^@S@V!Eiv4bM?mAc3R)aXm?4n$xa=FjSYTFvTa5J0GfM7gvLj8h-Z1H=`<na
zgJ_hu>Ii_oL1jagg6Ce#Q#jg`2e`W-@cgupcv}*+_!%wEmsAvjHz%{RFm<&hEln!%
zFK9VNC5yre5oxeaF{-Ia;0*yse6*Y7Pd!w^Oqj&)+|j~Gz8ggup6m{N{8?F*;KKyv
z@R_Lsk-yulK~Lg3;EuJkQ>Bx-bYm&01EUgb8{2vYUQ&%IX=xgoF;w+N)M32N!4_~s
z5T~P2cVk2Ov&kPjSL>*-<)@K^-uS_v9OMm0?6I)nx8eI4|LRF2z`+@D<bzGSdxKI*
z)oG}U{t|Fru7#L5$1nD#L7)R@*t7M`i>*x;gc~#9s@Qr9{uY7+RDHusjlBOuv7!rF
zO?zLPoh5>fg)1~aK#>h&6%;C|rKUy1JP4ZG%6t!puJXEegcJD4>#PiHs91ZmY0JVb
z$tozW>*)de6N?Oq2@h{OU^%Rs7act<KKLYniRl*|M+Q}vpGqPi&n(~XdffbFljnDx
z(=xvUV)^M0bk{tswob)2EgQ^YL5bU^yh9%#98c!~fL$DFFV9*~1b5DRAj>DxcphDm
zyWrDlL4%a@`bz^+ltF2QSwmf2y8}7c3o0DXXsg4kkDm=$*tScH+M%8GBU}4L4+P62
zc9J2tDUfSpL97@8YLtbm<oY9~X?VLJaYbBK4sgUwX_maglwRFIG0#@h3E<M_(XSui
zS`LkBFXhVN|FYF--qpn8HbF2?tM6&_!A;Y+htSoOiQhu`xuv*Wr6u#plsEM1tfTF?
z^5`tW>0@j>$PMK=D<+Xx)9yi{ZgI<oSd6&dRlEysf;tFhZ%@i@zDD^luSw*3H*il&
zLl#A+;vRLxtp~@&OJ}nlV7tKp7iwiVTwrY`@Yy@}oG{@beU>N8XV-xM87dilm;YV{
z+h{zB&rZVFA)`#{_dYj+T6EfC8eaf=Y#`sI?4&j+8{ah2qEK6};{SQd2gc`}j|@L<
zS#f>1b0%SMQIGQ#>A!jd8;6U;zyGe&t)L{$t?x1}P&nb)Tb0FNU~^;lTvDoPV$0q6
z{?YGxe=&Y~B66GVK!@vg7mV0~<szjb1#jBlQ%a(;dG3+HWs9vd$q-n7)EBVX*IG+G
zh+t3~=fAs)Ee~19kE3AI>?>E)G6k~E*}p#<NJ@UXD&bJKoJ)W5>e0nqRc9%!{mwdX
zJ=62m=sZgH_Bdp7GJ!7TUb(3fB=$iDfyfpoTxH<4s9q=xQ{buP3I1PGvabvgDcr^a
z^BTpWUfT~H9GVauDV!A@LjlD8f)-2T#yH6axJL&8Y2)Hc_%LlktAwvvW|GkQf|PG<
zw@gil8hcaN2lkedwsO_&#aq4JzZ5~%AEsQrzhmfdw)==>)BrK&5(8heNmJ9&lK4@y
zT2xopYk0FU?%H=dtYqd%)7sv8Cn8M<|HWA^g<Z1anG;4iNO@6!qoe~tDJdZ(QELoN
zgPhCa$0_i=K#p;8NM)15i(>>8(g6QR%%6<abxXv?Y%xbKm+rzR+DgcitSREu`qBOP
zHOzkdfIhNb+ej1S&R8b2w9j4g!@XfQ5R&Qpmwn5fiE-izRTSWan&=PI#y9fYakpWS
zf7ERwy|&#HDid3`bm8{<5wz>!;I~u(sKK2AMp1X}Kf6taYvWs5PEI5Wu-E!O?Lu6v
zMSIl=)^N+%f!9{>f?p!8uZu1x0vaSA0_Mc~18H!cDF%j`3RixanThK1e=yhX5=*{p
zU97xoOb^V=mG$I{X^<7WcAVSx_U>0{B+(!tU+&w^NYYFBJ6HJ%L52L^|7>{iEaAC&
zlDB$8Dq;H6L2WkN&U;vCsWcAM&2hyqaPfzK-S+t2J>Qnt9DO!K-5ut}%14`s$padi
zx@{QqM8H>!pb?BRBFLfUe0BiS(5lmdx>eMFO$QMs)>*13e7`@R(HWHcZGO|h<KO!s
zW7t?2o9xsM1eSQHsHmI(nUaT(lQ|?K$fW)>$f9LWXO%VS|L*JO&b)oK$cAhelA=IS
zFx)|G;6QA=RVzx&!KzeI7>(QEQoBsSC%f*I-M<MWc{1gzbb2!JDukKPB<j*^bZ0iG
zg^+QCdRkN?=vrzjlw~8==bx1*+3FW~f)Ertux7%W@qUh-3?CXwYpG`zo~~IHCh2@S
zEv^T}A1z37k`Um2fQ6i{oLbKQ_UNM0f@B(16BT%Woq@j@g8nWVx5!rb+RzfP9EINp
z+e(|!j%#{2{1!}{@zyvy55il+B7YuHt(Y7O@L3Ut&Y!CNiu6I|asvVs_B@q|LU+_$
z3K(Zn0}DS0bh=VTs9ED>@1HWH1cEW|ohgh!Ou<aa85!e&ns#K=2X{9&^AG{Pu<(do
zFi)!5IpU>|6>?A^3w#BH3>@xSoE}~TolBtD0W0DBMo+yzn4Vemam6%YcBViqEN@9P
z@uWv%d}4DTFbWhMoC=CJ5LAGxe?A{88CnQO7L(ZTA!#Oox$y7t8<Lr|Bnyk<fGNm6
zq$&LI{wTh3{r|B55~c(6Za_0JvNOT$TW+D|TY`=Dt~+SL*cS4GJ3n@9I|?h>^miYZ
zeqLPcjX?qb&MTUpH<8#foZJ|GpG@RB=JTHrW5^mX#@R}1+|DM)<0;;v`dO3vxCV>j
zkx=m_&uI%2xV9Z-T{5Zo_9h5@hffiBAmk0|c2?5_c|)%?xUg;BO<U3?3ryO+-7}F3
zj00LdRfw12fN{1gfh?OM&}MftJ{E2L9N%p<IBiqBQM)5NHWd*{oSzOSt6iJ5TY2q|
z2HAIo8)=u&z9x8FUs$Yl24w48-)+yv@WsM3=>2qI)=DnKDB9+z?+3r(?bf<8)VX;p
zWl!zo7WG282Yaa{5)3++*COG^FXjn&Lr8yjDOtD-n5$@#l_U{lOh>Hv<0Q!7(#DiB
zmqP}tcge=on)X!nm0BqJ!Ob+mak&dYnK6TlU^HRn{|fY8Nd%#s#%LL1gD{0s=lQa}
zzSZ|5nldpkO~m~7nA}<NhvBl>JMYHmO+b+M5iE~AHr;+@=aJWKWvxt(_|BT*M8-yA
zy-Cc&RGY_M?;b$ll_nv&YpDLz;l;!*=lCN2_6@f0+{J@K?DIC0nrd4`3wvEm!+eTX
zb^41hff^2mpNH~KqXV^M%e>(p4y2~|E&+4<mpR0E3-7!(@ZdVy#njqb2i}Ij!|H7D
z@=KI+Fv&5qAqVQ1Di<El%UW7u`?P~<hXdiQqHR)PKB3ivD<f1G8#Qx(ra2|s7bmrZ
zI}`E~`~=Ab&0MY08=V0`PJnu0n=;xnzL@zsn0$s)^W85vB&HknlDui9&reE|;Ydx>
zK(B4|(q{G1Wx|FO6~CtQGQk)OTTu14$i*m%v)(aw7$Oq<z7nhXct?Ge2}RNi4tbx+
z74Wr~xa{#L3&&Rs-}X4JqqZwimtf8Z$IVp!Z4B}fnuG|=@)rbB^u*Li5rjd%EfrWO
zUpIAm2i<Vuu+gMX@Fvx5b^fCT6TE|sB<u*o2b2i%hGUk3c!T^)4#PD=1|KR8?{+UK
z!s0P12$oi|r-e_5%yhtnOo7ecLILZefO;`~lzl~Zbj#<D>NfycWkpVfmdbX6)py_Z
zy6fs9+M+6Gt)43=;<}-7=(*WH{nW&oiM6pWy7~HC31*^yV7b_bMX7yBsX48OPX$pF
z0CZ(AdVDkmrGLs`Y%@j8xnHJo-Z|mfI6>Ezwt;zH--i|Q!vuLj=NfS!DN!{(1Aa4y
z*>@lLdhexCvS+0AMUT^QBXI`*WZfFj=(oY2Cdc05Ho3u7Pk&qK#(_zO(Ze4i=e!pB
zzNrosrhy@GGxq5In)(CbBeC86lud(dVghB)?ytlMfjN}tg6j8hB>3BXaI#RQ!{%3C
zf|<o}FruBEIjmok8Z3o+D&4p=j!V=9mFM!*<--a5H|n8?)h3rSpRrqy3g<H9Rw}U5
z$l7)mgM8ZbU0sNyfg+6!3A%*kp&r|k)?JMWDH><Uw`k3!_2cMge?nM?K;nx^8JY47
z*KHhUjjn<atB_?+kLOyKT^425iBiB?uR*S$&QmV%gwReEa!=tT2l#>`cMG~c_XB1`
zHAv)Fb*Y05C5FH>4XUa30Nrotik6U~p0uL8aa?jiQZtB0@H-$nSGB)k#+##}qA-AJ
z>0GmdSN}mwO#%@dmaLy9`Nz!pT%kZ?E~Z2Z5V^&Jv)b&C2Qvkvk}AXTB_HSK_PbNN
z^!4>84#_?SQh#}2e{ym6nA9nOJ%;V4v+RGgV+sKUE75^-`sr1~_3=0O+cPw4|JcF`
z0lAVPDSMQEeRWeQZHS;x1LPDte%|?LiHF`9b+f3R>~rOnlFG1fvQ#yDizTIZ<QTjk
zV8bQI6;7zRo%Ei?9Gq4m5fHTjiG9d@I%z2l4Tp}<=El_zch_>wo9~G<C>q?}_4Rr6
z(y7A;;hsy<?{D4Hvwzzi{-A=J6#G|eY?NW$#YSlwy!`FlS8jV<%fuqJXe1UI=$)P%
zHyqP{J|BK~J;R7TIiEJD!ZdBoj)Osvj{b9b-d#x8K2Mw4*-e62R`)jM{N}gHrm`pb
zZ*HDoD6cRT`dq{Z_Z)9exQx(nEen}2T#-PgJD@4I!w+0MC^6%&n>+GBb6N+g#!_}-
zi66+|sx<6vok^$j7ret<oTi~@?%!xAyB~fMPDFn7FUDT#I#x8k&O~)dq_)|Gi3a}H
z<iHW3ANZT<J|e6zd<ZDV{TR=~p%l~1+_nl$M*@@iC4E6#h00x|vH2n)-|4ekmR8VB
z>{2vWe_If!FMKSYCyXc1eQE`qvK<UZSFXLS13i>t34(8BwpX);sM`?#orgLm!bdK-
z+sy8cC!jE<36C%l(D}f96T{eFMh=CirRl91q*PEy<Oq%RdM6wMiwcB_f#K&c3k}V^
zc3Devm&=B9vqf(Us*>p@cjP32&rf`-$vb7Ezf^5qTLxy$VG9P_U=cJVk(r@5%q$O;
ze2ek@ZkOg$CtP=D{F6j~tqdvqvOUFqZfZ6<-a1EH8i@XMuAl0=GlUMVN|{NKtI(NF
z;~1%<&QqMO11o4R6<U_2MZr3_FegWZZ9H8ce3-Swo>ga~0wSmls579f?#g?7_SL%U
zsc)e30wVU%Qd&BHV_lnp^Wk(B6vU6Mj=<&zc@^R{LMj3P=F*dQ3UM$Qh8$}F`mZ6O
z;ca|#fAP)>GN#5qxL6#yO+h-mX0U+nuM&XZYv`1~vtC_1k|3gI!A&GW2nly>iVHmS
z`+HkIF2G`49(WZw(MC8CQ1JH`)OUI0Nalf{Z`vJ-VQiD`lNS`7-rJm*{GTg`Kp1FK
zgc?{LGbbn$9}GRc>K1mc-;;LmpeFzT*tO%>PIy!knDCWHAW+1aah<+996tqm*3$iO
zW7|Ym&vzq;OMu&N<+lSLIOs@%P#DPN>2s{w>9M=<t;<Q>HLMS7nQJ{XSHFa+|4<V9
z%BKMM+Tc6<CnwK5%iY`%4~|ad{I57tlheh%TfSM^ZoW%uK{uH-z#I$cG{WUqo8oc}
zZ<xG2PT@4jVofOf5ad8#!({*7UQ*JZB(*yfzzBvcex^|eL^Z!1UmtD{w;Dv9ux-Z?
z=+R7+Mzd;5e@_nP&84ypClT|lg8)$9L18wo*ZxI)4f-yA`+Y-)ML?)%<f<^!R4dg-
z2vzAQgdJ+C1{$NZ*qp;UE;Tt7smAeI^LKvx2YX71Y+i!i?2TA1#m8|pCL-c8>9z*t
z;CZT&(qn)q1q|FiJS18IIOE}kbGgsA@>;Wwrn38W@{&@UeE85t_(qVqQ?XFQ_Y4D$
z$$vYp!P?ex1x|kumeqH}y4!8bPxF6~blwAh%i5@YFLL!Uy3tKJa45u*<Z7Y0cH#gL
zkEzy-{`Pp}@+z;o7|>5YXk;S!|9oJcKcO5D>-T`H-WX52@Lm1!m%6N!*S`Ortda2a
z>$d-UHOWBcGz953BnUEo{;S-bkpU736v2wAQ4x)a+rPxfVq@3W!Fg-o0MGT|rnjD~
z`E~Pm3U7yfTRrp^|5NM*zcV*INCijZ<RAT$6iGTJb<1p9fo&B#%l&Mwp7mdPhZ(r+
zF$T9kW_3Dm_db8*ha<Z=$<76uxp5p^;13L!SE*^JM=fhuZDE~fDQ+|=a}6oH8x=R3
zf%AAujC02nmL`v?m2SJKX;dIwao(*~Le1a@3NsONQUvj(+Ki%ry7vy>B(IQ+sLY<N
zkQ?PQ)n%Vv7n)Uw^5vFx_TjDWT=<v#0^#Oc3T!RT=rr<qg;ddk38-|xfg((~s~5dZ
zjN`Ah2R}oYj!M<(3m2bgFcXo*X7curK&{ZVZw<@!I>L>Pi~BP&BCS(v1gh_I*;JS}
zd!#qpThB+OFxNZ5i;hSLElQ5rQK#MFSU?fhMAD)Qp$CK|)XzMMlT(V_&(R`8mMO6v
z!6o>CN@@Pd`7z*UM_H}gDcfhWa@ZbDVhC8$vXBF4>e0YyJ<8_`lOht?R?U-dNAYP|
z;`y9;%CuEh#cy~)mhbTtGjrwbiAF8?K0%oue#Lz3YYERtcY5{nMqO`cS=N<ZVG|6E
zg|yT9PVl(C$qbMBKnpfDyA8)!E|zYb#KNLW1UZiXBWzpy=+?Y4{5Iy8WU46<+|r@n
zppu2Qe+(~i4IuiwS*^_OONxFromCgzXSpz8=itb+_u8@6*fZ_56RT6+$C0oCg^W$1
zowt~a^}w2a-*#w%@grBX$)`T_W9WG}8>WwX8&EN@{~djHBKe5fe&~M}s(O$|h!)l4
zm4g(7vInLN1X0Qz>wAXLpm;}O6C4_s71m46{k3@ROZ$}rAgbaHZ0h;<g;o%PUCg$W
zj8p<b6_*<-NI4(}UakFDRP0cu+^6gbV-$u!^9RX@tG6^>U3QfJmHiYuGUDsvqUz1c
z>O$E2_O{*Xi7-KVy9I)7&mVHcA{;@D8hi3P<0_Xgt5EEt6>w%is~kTPb9D`bNuxvd
znPI)0j}x(j0$(!7Xn1y4v!@eAu8cX`@Ns7Pn*IaB9|XIRGBYRU3&SAi)%KXjSK5=b
zKm*xd*vMQ@!Z+i9?dH6!6lzLJaTO5*PII%Pk+z~^z{hYH<m^y3g16aK6UM<l<Cu-s
zw(YXzswF4=XzyUi2L9sP#})l_<XwKfd(o0iQ=L^?ru<fyg!8S7OFjd6_sxmbT3WK~
z@pM;AIHD}G75dhu^X7s(KtjAb)HEwJNbEFyykv&WAz(@ps&8dPn3H2kBc(wKLyF-K
z;b?iGu$7s^Gx8E9VI}LqXHx^?KN{r1Zkw4ba%BSqm?GV4ZRtEfYosq&rV={_3~KYN
z@+G<Zm10qfc92r3se(|O!)%@_AN^+#<H8C`uQj!1^c8;3q#D@P-4uxxK`igZN?Vcv
zP}$a8Yc)2h>2^5B9WY2`6-=UU-TtkVA#Vm`WVO8!BhPo7Gc`BjJ}$Zqc?=_aju<nI
z<yDs#<!6YGZKp8s@U^}wtuoHkhMdNxB>ZBQYv(2e31E&_9;RX!_z<-ks^ZfQy5Sts
zg<-QY0*BoS!nil>&(pO!YPB5cO`Vb=%lKt)DjYDcs>l;2Oy4`^DlQ(X6%?`@2+!1!
z7><BTwyisS>0V#~1-urhB6K`1={^7tB{U=)W0ATJy<3tVn){=Ew<`31=flR)Pz~Bt
zP{QGjf%PhsR=4jp^rM~sQjtwo*#6zf{+3j4q@-`YEl@B}#3KEocVJ4FRz@|JFSVfO
z#Uz!N4~2SBG3LCtUgg#bEUgTaRBxrLAmt`_AkLaGAveY<t0~ku_Vkx82oQK>=xp2}
zg}dWG`pb}nciK$cRp^vbiryNk^tIKv^t+^0C|xb5y{=sK7>zTgdd>SHs#Mxjuwif`
zL$7*QjBtmYQXs~pZ}apFzEmmk8{m4CNgb6a+aPbXS#ikj&X45qS<X#e{d!Im0M&VB
zOT(`HVx=cr6vB%pt*BT!9}oOU)--le*}Ku_OWHZV6|w7kx$aDRvjw2Lx&-1u*u>Dm
z1p+}8it=2hc-VnL`rttT!N%c1nICs(cf(3Qe{6Xs|8FAUmdvpK-hHtU7)%|gF&VgH
zd7yoAZ2viTTFsJ0TM*^)Y-`P!ZDrsvvlyA=YnlkpC*I(^18dhaA;^L>;g%#6-;0`t
zs0dYn4CdYg*yphtOO1+VV-R2L8`|iYnA0fg+{81He<*OFAiDc-@oyW7TN%G{hlSUv
zBi$H$kH+dv=>v3Ts|)FyK%7fmPVtDDS=p6hySnbSRE{nc>{RGF^q`&*{}lVfswKOy
z`*l%;kZCD0umNyes?9_$USOCw6~ECBu`r^+NZHnUG}JBU+|nAIK8ce{smJ?+|4HRN
znVS{`e0=c<JReE9zQ#6WrAB>SUGB?~$MXbzJ-&dwZJ(r!&e8`WZeXJ!RI6*y?>n5U
z&X+aT>tMiym9I4&anZK-BkN%;@iv;zM9$uwTdf&(eX6BG`-zd4n+UPx;<_4qLL(Il
zaoHE+E^kU;D`r`ll~3(!R=<SvOkOCF%%;SxE<57+J35<wxq<(=SDsxK`WCUw<zAC6
z`qKLVw_0$bo~8eOO%!!#&&BGv105WeY^bN<KSH4_HIE62YyayLjwwa0j1ZtZ(zG^~
z$vHaXd%_BJ6IYioC^R*6-Fi%vxqOSDRl6g@d)YWYK*RKwhIH*5WFd+U9>D_jfD?2<
z!tV*T(+F#MoG2A^0oy|$6&w!k9b`(bSy4*2G~8x<b%}v>AlJm;;(+{ob+O1u!W<YJ
zA{N?>jfpAKE5fW-lTZI4DD`v#ABlWJZb|)Txxm@xJ=(um`1?LZM2@eu-Q&%6X;42+
ze|iWvwp_oy`RMPFPti=s&2rjZRg)bZZPeKvAN*9+;<9CpqCM19q6Bn|`>X+4oNtnR
z^4Y`E*#k)VvTzfk>~a6wW%cFF<5T^Js*afMR)K8p7O1TeTmGn=RC;F>)3%hgAcGu9
zlil5#?+FAHbHGU}2;8m`iK}rxmA$=vGCaarPj5=6R|&dARL4)ty=N`G&cte<7J7ru
zBt=bM{|8p^Rr|FdDvX%%3Qpz>B*KYIF}%#VR;8Y6oS)WCi#RMMIsOld%c-@wx60Hy
z%XY+We~Le;_*br@LDV79da(FBdZ-j@cV72DX@7Ny@1nA>yYzv0Tdump!6Fw6XzPJv
zaXQ}vD8^(;CbISL2H-+ZkmITvTl~(cfN7en_EN7{U=3GY3QwEW-YEt`0Y$EsaZV}E
zNs!A#dCDm;p)>o#V!66d;Tbu-WwElB;DMiO^!s@A1J{KYt1tM!sbx+loWzilH6v$!
z22qaIh_tm+p4Sk!44lZvQXB7D%xKRdUm|0REfPJ-mh_g+NxS(x1yiTu;gQ*xi%B9M
zB|a2*@T!~`9K2av4rdmc3Hf1XLtJ1N1P=BNB(u?u@||JdIkc$KeQ==)tZu!xfPkus
zBGH}!&Ui?Utjq<t%j}<}RP5Qc?SN#_ij|`HaKWkxosl~NO@*w9Saj^KB_*O60j=S=
zZ@mC5)SU#651CS@9aFXAvPgX2X}qUdf;=3B^_1l~B8{&=umTh)PcMj&t5TFyugj+8
z6ChdxZIFtF*Ul7>2u$ZY!<>8|ibieQqJk8Sh0%j=#t_D%P!NKab0#L_dEYM@P6yBd
zsUHu&m&zw5M+BmSep(Fl<g_#ST=)E5z!NU02}S;QBLMnh?=5z;w<{L%Mm;lxh;MaP
zwSKbEps1|f`0rn1{l<W}l*-zbzU#eEUP%%3aK9SDvBTqwt=Uk39-rywx}7I)&`t}K
z1F~kTfZYbHEe;4I&y9Eaw$Aqtzp25PcpiTSRC*L|ob*s7$sAH{By;gXr)2080v{kr
zPPY7%*7d2%i=9MJr*O6Co1?*h<z(L)VtAw0PUzK#TUpt>v$&F@YQ<_gv5;XTG$|#9
z9ubdq!2pwC7w^#V8)-cL{qF8X$r5qX<CPMPy0#>vKC7k2y2v<PubNAkTDA1xO6f;X
z17l`^75!fi7jFd5A%2jNwRWkm5dM|6LS-{6D`xYOUvq<808?YPe_#VMde)N7&`@X~
zQiL4xUp9EFJy6@E&vS5YJ#D)+Kh#vT$6w6aq|ocp);nCW!QXWIlz@^-7x5sJXvGuD
zKuWoE81!X>?rZy33vb~67G9`Em7O-X^OLsozvvb#|B-z2{obE0AAm+in4IE$!m~?`
za|e_BN}Q3Ak^G%RBkvbRji)mT@xcLQQ-w@*FQt<>NjR8<lE!LVPm>;8cDE1i(WWHW
z*dq!Pi2DwZQJ%B`TWq>vwBcJ|*PDilGd#VcE%2$KAa?ba;Q$z(a+Q`;>hxHQkpDA>
zz}s~g!D?8cm_7|(CE{9zR{>3}*o<T@p==GAH8}>$XT(gmeU`*CqbKltFjPMq%ib$R
z4i9dQ`KoF-O~-p(m14amfINEuTdG2Fznf7}<k!0TaF4t_d-*KLfGa8GJ=X;$fgWrz
z-_fC{RxYMYn5|F4&7if{SDO`n;U_y{{q#|KI<PM}lm7zqDf?Bq8uH8}<S(@hP)q+w
z&QC|vpf$UZ9{GEv5h8;Nc!L2TSa}mYya72U0Pg9xhj{>PG$KTJXsxE_*0Ip%!#r74
z5ck{0`OQH1D&2qM5+rsg<_IH3S_Xz<;M`gzn*PTR%v@$7DnPDpex=cogGtZ-zU2pk
z>f$-SJ)8nlz^yb5Pj4Vf<rFCXq4L0*U_TxH@3bE@jsq2t)Tq{xuvw}??P88C*q<PH
zQ1SKch$X*|Jv4F+dBSz&U|=U&p$_HOj_hFjV9ch3hJKwdnbghjh*X^j0avcOt>Vuh
z8#=Va9Sg~*`SBTruRNUwe}b>jy!p)FC-^FAzLSm#6BH+zUgPR?-tTdE5hsz;TJbxC
zdXz{f8veBI*VeCmH~cTP8r#3BQ~c_=zf(s^Z#MQuSbb*eWLzaNW<AQ^X-86~qv+38
zG694^>%Y1iBI8EN8zi%Zi#n#n=GhhU)}|593C(WS-j}%V!x8q*F!N?%(KEJB2t*Yx
z220!iZIN*$%{YKuuKY`j&vS+pcpvG!sOnRn8q3MZ)YH|LH)Q-&qEpjIrT(U26O2y-
zP4So&o9-x2g>Gd$kt_QJwX@Vu9ckZwoL4BEk*o{ox|&k!TO)GAgv8*sB003zm$Tur
zEy#d1opf=IYXQHhd9`qIa(V!UYO@_)_gbI@c{GTB4LZa9-%hEM!shP3K+A$N|3n4#
zgMoX;3SS8%nEy5^hA<9<FEJ$XLHOa~sm0#1%-I*Dw*dr^6{J3~!ZIHpd9l+_6~ogz
zlh=62I<1KYtk^WTc{L0%cM04nJqSzDfTcsT^Iz=pYlb{^Y3dq~UY<xR^4ckcB@4M)
zgh`f1o5ir1|DiV4jaQt{`mWZRRl{nQ*q;bLnj3R&Vla(lG76b;&(c)4$VSKS%e;e3
z3L+Tx<{X{)CwOVG@e=}?lc4fJ#P*b8f-v!RdTN5ie5qh@AO}WIl0)7H6oNQM+FG*7
zL^z;mw?6_s8&jByj+0Y^tY_!#KYuCI(xbPL!fGquB02A`lJz=eYk7B+-@ZW34~38?
z*#bIAh82hlDLT9BS8&oYVp)X>k<42yh?7i#I=8roEV6@#+?BaRSfeeQ5Y({C1_rE$
zqiw#xX_)i(X|jj4LO!w0lIgsq%+djr=oKP^Rf=*|28aZu#vkE7^+QwUcWFlOM`LjA
zt?e!m^)ss4_UafeZpx4dc!?xH#{yi4dp`2p+jBv|hYfsf*IK2A?&(8&HUUR9*e~l?
z@W6-!p-Xd6a?e;9S*74RLT%f3WR>7+%qDqX?%O#!`XA1=P*Azg=Ja`@j8%<g1%=|f
zbzLMm2D%Sqx}?XH6K^_FDFHhpVUSnPxLC6dY^+|fcl7C;H70|T+=hh<LR_jc){tQh
zV8$L!<_&*2%cXpfz0nwsz!w+C^R?C@#-i1TC3U2l3g>!2FHVyRI=#>A@rVe;oCpG*
z<I(Pnn=}46#zdLN2~dKv)@#YQ4}i3CF=-%VyDe$o)!HmGq89gpcT6b$W{>(<iBA7A
zSi(5Ui3-Z?1+jvfxc06-%hdbs(sSkO0*ar?A&^ixfXXyoe$Fh{<e`!6Z)A_FLEHCy
zfgX=AWk>*kNxAXK0-jOgbY0x*W&*e2ba42Jl!?>G=z0BLy+wOFaJ&AcNJ{or32r{x
z{oi9<Re)_IDY-f=>(ZhQCd~7-B|QSdO>}*kC(~lRN%2+0zt<fiuhzSgfY0BEcNKxl
zMu>|X(OWXpW0vO}9k#)qHh;EwyCSkw7KHp495wXBx3Wi+To;@ky8i-z)l`MfL)NvM
ziFJ$>uIT7FRti}{Vp&kul^70!^VYRg#B38pQT4`p1APUK!^2}`dwWLsD$6>`XM!iP
zB#CnC)6~qmh^|-ru!9IW=|E)jYbGq`KXFG|d(G}4t_FU6R>Ssxuj?#T_0(F#8+=eK
zPzt=XeJFE_Jg+o(e&Mm}8?0$~zyA5<lw54k=q%B$zp83s@rLA;1&#*=fvi~;j0w~E
z@>HttQy%;OXga6xIJ~!O$F^-djjhJE?Z&okJDI3Snl^T08<V85ZQI}c-v9NTPUc_^
za_zmJXRUQF)RrRAXx|^cG8q3i)IM#1*bRVbkuQH$f^b}MIARIecTkNfb{SoVdCwXb
z8wVSE@C&w|$WR=g#&yW6I3EE-Bd95>RfF&e)NEZ+t=~EhzSrimhw|5xnBke{%*VzQ
z%uX@TNLcc_BxV(qnW8Ns8mT#w6y~GV&jvE2+Ao+3aEiWKCo0Kj{#oNmz1PEqkrm$-
zWkdqa5mc185<*tN0)TO6{;O1!`Z$TwpwC_a|GXx9eSOpJ9qRs4r_yY_i@nt!v18WG
zJ7+gb##Jo>Y}5YBMu}iqXU40xX8`mzqMwqqb*|6B1L$m2JsJ)bP-1E;g);oX7;Dqh
zfl56H4OCBBXYD!6fQySIuZZMdZRAlm^6~X$6Vh4{)N3sa@gu_NCwwR(AD|ZD$rG|X
z`6SX}iZ6PfVzjwl<~Uh+@tReI#H<WC+2edn|9CheofjZAWj$4ZOx00!)pl*<4;gmq
zNaB(=5zfWq{mCBe#yI(h4GQAVv<lgv4~`&eKgYLlEmP`^dkQz1Agjh(8W>+_7|}vg
z;;7(vkR_Cko_<WcbSIx$P;h<y>pqs%QtSVgshE%#=Au_Qpr90;ktd1IKKhL~oR|+@
zM#n*>z6~gS{H^w^?c(UiFdI8i7^coktdO7RHRI4);^pz8bt`k&oV6U8vtM0MbY2Ct
zfc^AD!aAQ&S3>01#WZH+kqx=>*%pHj>ENRi-k&@<`j(V>(5$=tH>OXEM1I>4;uTo~
z1*@g;A%G{*fLXe6GKeGIQ>=al;q>Q1-%5e7_mPOkgrKBH$qYO1jIVI1*ArrKcS!eo
zPz1Z($p~J@s;q>k6@S3U$hdF{xJD)<AFuGy4m-<q<TAYkWp;ZI2i?H%BctlfL&WX&
zw21cnO+|qs7LGDHmrwfN9=$_)|Euihz$U*X&z49({;m!i@Q7!>+ty$=unZ@oLlWPI
zy}~hOio{#DdFq0+JlqBB^HjJa1!2QaJ3i#;4Tm>0Z+?$=!#63~SvS;~(!5K*SaHm~
zUsQaWa~cvwA*LVYJ;z@<Au5Ea9I=^Rhh-qe@5pX)ONESyk+HE#+gZmM1XxVV%F417
zyf+xLQlf#W!sAW1rH&`BHm?WK5p1zmK?rG*zao#>=GDktS17zN_Vk%Bdy@(U)OuPU
zG#<TAjfSOUIS0LQhIUG+xm4%-kf)Yj#E=C;O_8-p#XNnSu`pFx!Rw&0<+p=HX??zY
zUd~DScj`!zC_?L~3{4Fj9i?jS*6c!z(T&~gUK#V&&_zMNfr9f&DA?)!BSH$z{*^zG
zdXK%xqs%NAtH6Q>{%1<WL=PgrFKSD<r=eM?o`DGD`71^X;-u)5{lj9*h?n?WjuVt|
zqUD&>o~S~Np}s!7uk36cIc4S27uHTO%;7{dT4%#G=@QTPgB2I;y24fl>6*hbM!a60
z-u26~GkIV|7zFvTtv885i+v6rH!-NSsr7{V?D$HKxg%Q&Gc1qCshnraU%g7!Bn*|O
z{Xeh5NkCnkcQaLE4!yl2bM0COy-BfMFson5iZx{%65>uU-heCD<%HbCjWqhFJ-q=n
zCZa&+6s2;Ol<ze_;2=PnwN6~a%sfLn#;36wVD?8`$5NN?;)A|`HV+QReSD`%laZJ(
z-LhaixFrKZ6&I;46VY{EkN=t`wRFsX^IlOJpiwX`_atxe=<<v6>}70ZB<@!3aemot
zL@k-rZil^y$gjvaB0Ta&Z5+X&GUEJTG((Ot4?*MPUO{Wrp)atE2~JWD`GCp(^73Fx
zE1)~G5XI?gYid60x30_l9I<yNzx2!9c%h``WRW^>!}52RUeiZ+RaLYaZ*0&{)C}v!
z3CW`3*&KXU%TzWds-g>|d;L9gZ=aWWcG~Z%r@xVI?;cH|#hXp;I+>F51}xc{9xkZ*
z(Ovrvq0A9rm;Y-C-*6s4F4=}+r0w~9{i72`C=%%3id#(yRba&-5CX2KevEuu+&Q~6
zB}E7XoS)mbgZ7Zrct*MN^YbU5mtPskbSc)~E>(A?Hu(kU4KAmp&_P?C7*ITHYq^yS
zs;;awJDf6ll=-!2I~a76FvRIL?6W`6l=b<U>CZ`S0&n9xuTsl2_g(Vd;kAES9hnj4
zQ2bY3am}J{a($37_zUdw{2x|9#oATbH9cpOU{=N*-DcXel~dXxIwuj1y%(^sw}xFh
z8Rs~}Dj0}eq^mG8{d-f<xY5qz*bq2r9=X#cV<Ul%UjtNv+hpJ>8Y)T;*I364gJ4l?
z9)q?Ig7ryVoV9un9L&bu`9_BKFwIJ;H!qSFSTA)dUWy*re&FkjKKhjmKIiw;y=w{M
zIpNuTQgHqO>8cQZIX1bDLEUOVd$!f6XX*&({gXZUEoMUs5kDVJ)ThTA^Vf~lr&Axt
zlYxDkm+~%+DcCxN%HJ~!N<DUf+Lv{17~mIM%TB~K$byCgj!uVRC$$ZtZz_VCe@pM@
zTim{F<>DO^z;Jf`Tw)eH<EyvhBU#q~Rs6C9fO;g&#L%N+R7k>ug@@B%nx;Vdvh+6?
zwi<A@&?1d_{v_o6o%2(v`g#`){kDQnvz!ENoFFMoB|P#;_Ukcwv0A6Z8Y9lVTfP#}
zW8%>$TA1p}BY^wiQ)FF(UNEcR^&(u*WCCge1LOEugb?+Wm1)A>a02bqDa7kdYxDl$
zsrUj{vnyWc?Q^``jdxX$V&TK}k#{I`1Ok;Mkaa<Q!kT#VQ{+$)Si%k|HD`U*t)R{d
zP`nw4R9`7i(3slkl_tJR^sLBKwKouKol@-_y(26JCpfdSHCCl2Br!EdQH6Iu+{Sx7
z%)@@4F4zk}InxD>$d)DwsD7I^5t204E~m_SmNdL;<fv4(fg(hCi>v8=-^Gb|B4vvv
zB4n^#o3`*d8i6^8MFu!fGK%rHLAiPh&%ZzZI>FJ+1qV%*wn(Eyy_`bnKEf~inEW7v
z@z5Q#U@ye9;GF`uOqv8}pm+FNEAms{QEL-4V}^u9fOjeXsj9N4AWITL6ZIqg$GO<|
zJ4-k5e?B(_BzI)UOd*adYVvDnXmPOVH!u|n!OOP2aB1u5i%^WaIY>O<JyZif(e&iQ
z@^YPNSUf(Qf|<RT%x7^F2?n@a(}T*cM`?Ey<8=l43qKxG7`X0*Vg=;|wB7s?8uy~L
zHL>i{0`GR7&l{||>#5N#|0j`Ld|Yak-i5pkUKlRoHDGjPp3%#hfK>Z8i>4s^y*k)y
zIn3W9XVxCk_U&DH_qvUs(OmuF6ghc0n~_YBli9b7s%T|JbW8k5_r5I+euVtd)M;1q
zsdC(P+la~Ye-7@C*L!7B^-9?3EynZ-;9fhkF6jUW$zHbA`>{MMTpSzK{dAxBEsIOV
ztfmwIOZxcHfvAto7MiD{s??D|04%anbovtulg<W#P0eFA=E%)i1zc<a!F_wD<DRj`
zaAa!N%5o!?$(@jg!ClWAUN7E&SJaaZ-bwpjqQE{$Lj(xU30-a2q16dGQG4E~bNRCI
zY+}HLmPlipQb`E6B}872OXqm2__8Msrwi;{9!)!Fng@gNUF+D2da_thw+>AF^I9q)
zfXpaZI3zR+KWr?B;Y&lE-}n2U<b&2_B!?{R$+n{CY4Tl9@ua@5iI{h-=S4Q>k5;OV
zA(db$D?7<CGE|IWMyB?VDy(r3RXsE(F#L&ifB)@*hK|k>!?a2GQdy*f9~1D@s(A0@
zIk-P9g|-TlPs=z?#T<dU3w}PU7gn3ac+e2N?Na)tYk?5bP{R#tdl1)HVpFJ+e|F3B
zE#7#WB+?PQ-X#Xg$x8@Y?Xd54QAqQ|C^sn+b3_o85;52~=pzC2sDAnRA~>I8)uhDd
zMH8hoJY+H#cRg1o&s_O1$m_7m2|oZ)y{Ai&!$Uj*CS_6~rpQs*z#cZ)49G^C#>7R8
z0uz6W92a5HY?kwxEI8tns2%rSlEH31XA!O^{rk7>mB`b{0gUN%|Hw+6uOs?tADOf$
zglo0A#j|vZN_Q%AbctNN4RK-Lxl&EYn_c77!O>_jfuv*w@}6(w>U`+L(c2?OkIY^l
zb%#z=W=qu7YTX^nV8vI-o|6&naz)y4+DOApd3__>djctfM?Vf!CZ*|v|JUzLRl!21
z0}*j|si9=Rs3rc=)*QO1yDx^Bq&}Fh9*jR}fdpKas~w>3kfCPvU=}Hge^k~U!NK)U
zd@Oympo`uU#=yXUjw~L871`g1Ie;n?{q^SRP{vSuHsNOd!_8)JA#Qds2D7aH<>h79
z0}V9}mlemWz4uR|mrc`nm8H{g@TELivgi4-Slw=nFbppi&+C-S2gr>hpIlvb0%ER3
z5Ba4j{Yb3tIl>QM18yZjH_r=bf@fWO=klE>@PqbC$NOnYX3Flv!<}5OOP&FPyH<#a
zmm0<yG~|KyWTIksGE#M`7!AQrTnAYU(EYxIrp8q-lJ-L|<H_BdfQvatGM;fcc{*Ar
zQYRHO(oT0BK@E2lu@qp@SGrjA;@J>4PFZNT(GT_Cc6Lvo+JvAjlNbm)1+89rI*dgZ
zyM*ZXc;7LY{D>BjuV*3Qs-AqT2%1^?MCi@}<X43%!Ee~b+>=aDMgviJCw^2V6&;M4
z8Xn4`dV3X4&cAdjpb|Ftoq3Zdu{>jTh&yM8A<4V7q4&0E$+9V4A9uVTZ&m+N26|{x
zTUuFh6`$lk2M?}f+2&*5=xJ9dR%?$SU2wx(BZHwKgm|Tb^kqOvshAzchWorC#di!4
z%I_@eFDgz`b{0v0aCsJ)hU$nL2g(7ER7@Vs*Dh$jX&Ur@Em;(#a<#v2G0_Jr`0@PQ
zbRWGaVZ+hL&JO&;zI_Z8s6hXh&1obHnRZ1@qM(xZnAl6p(aXF{jJ7-?-`kOHRH<yg
z;Iwx)Y^J*uu{@teSC9TrIrZ^_1Bmr>vg6Zu++DF*giaZ$&f=#sJ-#vGo?W7PtE0=z
zx|X{*PaC{zMqxW)oEH<RT!Q=g0oOH-QxvpMw^Ll~zpd8KS<aYIUw~jt2u~m{#Khwd
zB-a-exitwh476VXu1rZ>AjX+2H1O$Qp0<ba98E>yvyt}ulJ@Gf<k7Zl`;JFw&r)zd
zyIwe;&IR{L{A&0aJjd}Z;W;5aGneA2m)$v-kD2LPW{JeQEl2Cg1kYAcCov-k7{kq<
z`t6(BSWHh?quY_UHZy|_CKx}yWz-OI396A_Zn-g6R%8;MSPs1aU60O<o2kw~+MB93
z9b@3PjhGo|!8SJ3>K4HQ&pNc}{-rO8gouvg$TgC3Pyir3BaQW4PdkZBDNVW3ukj?C
z{KH<3+es0Ls2dM>H@u=ggA)>8Q5dLaldb}2^}JlCAO3dLd8bs|%!%yzY&KvIO3r~q
zRnY#_NmTR`G}Pnlb-=AnNL3%s6tW6J2|g_f87S`!OwRmo85;!&!}$SMyKv3>JjpSm
zqM(3OC_6YN6mO19z$x?S$bY#5bZkTpLWSXE2H&&m>mz?3SeY&MvvQPw>WxMOdv_4h
zYI+izlFo!XJODHA9oM$2CcDmn=rpuZ*85>sD?p^BJJcTuiwDFo=6*#e1XGtrwn+MR
z0q@7rll<ae<C<?cFzoEGkHI{tyZ-~S-vr87C8AV$4Z(h(P0z)J{lfh3ZwPLpyuvJb
zzVmBx0XNoagB#|L_cy6ArYdDH%L97zMt(2(6#m{rgLRC5#f1N=EggyFR+WB6!W>N1
zdmGbC{k4Dy*~=dUe0eso^TnHQ4=}Rj=Oe07R~Rn_DNA5bN^1R!rPXXb@3O@h87uDF
z?JTZQDp=`Q%$iLS`A|TiASIjCGf>H7yfaE`Wju(SoBJl8zbm(}mFXal6NS4Oa{iIH
zMS@qQ6Dw5WbS(sgEmtaFKnQ0GPGAE=ViHv`x?6b25Bg3yY44w81{Q#9JyTy_?>Zen
zDJEZ3ODy-{Fp<d|itEj@<WIr-C`zcX`b)Y)A&SG!VdJ^uRYQ8QKKj_(R$t76_{@tJ
zL-1BB6I-n(TxYe}587exfxl!%1#bPOWLfX*I`$>~*loeG>2~BG)wpa3AALTeic_cW
z6uN?#BNSq=S9s=&c-V%A^0#GKUJl+EGST;u%0}QROeyxewraNI2d25r$ZA;=BUhNX
z)IDzJ^4lXpfu=%u&GRcIebKtJS_G^zkB5@~<Td#@7!vIEsT~8gRLtfWB9b!O=F24S
z`txB6Lh?f7^wh9o-pP9mt@!rb<&#w3^Pv`h^}}zn#IDCyKtGZLG9*D1TM38xFp@7Q
z`Ek$*<|6WDPj49bVo4!^;_rpcU(@w(0VB6;zCcwU%GJv&OEK`r4~D6BGaO`m{_kqX
z!#whi!k$==1^Kp?-=e^{JKDCcN1W8;xb*)*U1NzSC^>5A7l&6+_Gk2RZ*mccZ!yOX
zl=KmEQ0qE$qqQ=sOyxm|CL}<R1K7D3)<BX@^6o!TXDh_5F6bYtCiZN3Md}NKyiO)7
zj-t{q0bxVNMINERG&fCM_KW4sT(XSuo(DVike6Hnx`ldb@6G!se$lj>u)6f3oE)LZ
z!*2IX6b-!Dg5^`8qUM+AR%9s_I+-m(G3n#NVRZuoBBASE$ouUuR5cY9w4veQIen)t
z>QF9FNu@)Y48ORlHFrlIUhm;kNgPWFsChcKrsvZaM~B#yTnn{1p<6GBxH6PS<GKYh
zIFzar_4Vy7uDRN=WI|yx3@;iEwQRDA$ank3`Z&Avb*y!65`WF?+R$)W9l+{G^0;>e
zM_pXhD|*uw>aC(T!2P$mspVyK)rt@d(Lo$d(z);oPZ#yIw7dShtE!wQgM=hyubrZA
zMc3j#f_nnjRqda6ml@3q28kIks%1^CTve!l1w52=R#U3?mLa8$1|RsVN3iM}_T!X=
zWtO%c=u+I+kk4_yV;>x7)CGxH){$vxXkh(q=T#j~-1zsdb2>L+HM>cCW;1ju0>9b7
zxLR~|z91WQ=G)hil;K;qdE&ho^l28kTLhw5Ke-mo_4}_*_b7!-J(+pJ_#n_{DR>BG
zF|gU@DeW|drHIj*Du(vYb1fNAB7{5I|1|3j25$;@^VI9|Z6->0XA|JajR`?97oEZF
z@VdfL9tKh65EOGcWd)-sG4JI?JM5AN`FU}Lyp|e{{NS{}Rc6A&q0py;Kw_`WXfpXB
z_-Nk?krjOxGNgj>Lb|1F_1x3%FF?(1K$4&=2W!5VtV>EhmwLPc!SP4nT?5+Y=pLq4
z-jUEXl;$EQuym$}dKLpSO@~}b7i;l^igempfG~LFR+~IQ;7!f<V<<>np@`Aa{?(|Y
z>~btQ2o4C=FkTG-g<;|bzM$4k2tK4RZ!4^gUVokhc8KX$BxG$}PNSY92KFPf1n1lq
zptU;D)DaejY3Oz)RONjvjcfdeDdg#hi+D7&Hw>U}I@q7l#oVt04fR|k@p8J$YO`xg
zJ1ZaL&#-c2?fg<Qqb<h;ef~SQIN`^{TcV+;`R~WVpcVT^0)RBn<^x{T-?{C+u%CeD
z^AsZ9P-_`lEx>ofv)_!iXDmZA0e)jy?k7z#P4DwxGARe=_3fPs_{*zW{S|>o9ETgy
zF|)PvzxrZQv%0z|Ql{c!LL`VFkGCGsg5BIp@|?PJK<2g~5<1c_rN3u29fO$UOwDE_
zY$F5YpM6uOq;q&c&fem0C=VoXUxfjWIol)<x9!C0<q9cmf}{)%{67Vfb$$NR92Jo6
z(O}rD!&soUE<zDm(1dZ3ihl^NgEHHU2;qn8n-Xw5jp#`Jpt4?f&=8J^^qNG-ljy%<
zM<9BoijwhJenNtm5yt-a`r5e|w1@B>K;{`;7VALCcr2=k5^nMUoXD7hE2SIi$R~+3
zC%+Cwe7mY_QQv}fGnbU4MkYq1{B`=?+B^emkNl(*iKLrc!TL8go4n%4r-Pcz7`tYF
zhI6Faax#-#MMjKnA8c7xLK5HM(~YuvhocYVht1g3FG)AoFQ<&PgltRj?=I-JcCxEQ
zmC-q3v*|(jap7jhH&4<2wP<I1!ivvnBZ}d$(XIX(9`B@08jIpu?l2ko{vO4}X*DRy
zrCeW94)ekHXvyfvYLUpbUsqD5EK2%%oe*(5zjN^c`v_lLr7#pEwVoUMBQ&S!gYcW|
z*jR%#?isBUtH50VE?dzE_w;DJk<iT`CKe$fqZAGfivgXR;O2=(5u#+atOC;V5ZLRM
zJZsPQKSBD6h&W6||LFyS%RriKm7<LM=a&l}>a8SSiA5;qf2z`BJwBkPAr8#_Dgg<;
zgf%IysJwQCigz-rCHD0SsX+E`s}b>F<?iQ9B_T(;!K;hu5offB#-R-X?peeumQvvI
z_wli03H`BwdBw4Z1biU_8)n@R4`{04VwYLX#Mp$26oZ2Yfkyh#iHOInKLZDP19gK(
z6IwtWEi$MRYbWF|FROf7hpo=U&96XM>U+}OXLWPDW#=$ji%4^+Z<jBmM+?`}8?$ca
z`g|&5GAyxmF$v1)75rnms;zI!5>zIiQN}>#M%Ie%b1~IBw*81HXa|TcBO@(w?2HAR
z?#RSY(5#Gja&%T2Hu>df0(K|V4ZV**3j$~(g!cw9%`1QkyogPWk#gw$0;(w`*Rnb<
zWKJCiLxQQma9TJO1cC?<)dmu}P6AZ+_Dw#{l+v?ulvtVd`WvWrH0qS$Da~Jd%NeOT
z(xenR)B7dT%NYJm#W4FpHnr6YZinI{a*%uJNLv8$Mg5iH0*jb~cnX&_e7NyTd8@RL
zJkHg+DTBH9tWi1l7B}BAcYgcB^Eejdhfe^hezP<b114IGJGl~4aB(Q42l$d`V5(E}
zHu(hbLZ4-9Am^-VGAR)SVr&8BwGL*h>m>jp<yZK<zr~v&U9=2{3dFXdib}BOi!nzi
zVBuTLidIAF(mX*Z%x037)nK-qQf6yC|LTGIwn{bMe>qXu)XwqJVLm-_@Iq`IOCp-X
zijRSmkFFN}I?%E_6v9;c^$I;&xN&Tw7wi=aj)Ly@F08UrmVs+b+mA&zzD2CTvx^Vq
zL){wMD(HaEmm`Yc@+EP)Ll{`t34^M&1>~k2S%Huc9C>OS0wZ8RXZ^`oaT*A%Q_<kj
zKMnCp4Yt)NiO<i`!O9Df$+;q+)gn9pt4c#k=WBy_$Mk3Rh=e-7qzzWNArT>ZD<)%S
zeUmu)TvRoeRzo0#O>5#o(W#2{o}u!>()2>Fv}C=httzG#kztY(J6N#OVA0w2)Ym46
zUX5NVrM`Gs-Q<v0;$|rHLHCU*SWUf3A%5&gskC^~K;F#Ga6l@t<QWLo9<Yd|*Z1-O
ze_bxLqF5~`Csxq4Oys<*$lz^>%9a>gK7TQP(;+brZ-ytCI8CyDIf8L^pu)VcJV%}V
z1&aV#mk+l*)c<n*8|E40#5k#HoW@9!^<_@RJscVoMKuMBrv}5)0q@dHQArBPVAP%i
zg+5vO$*vs%nVC|cX`vm?pcr}TNHRRf1Qf0v0h{LyL@$k&bf#O4>Ka^V-5&KogGM>u
znaS%?mX6`cJ3hvfJ1rcHy?~_Wr_i_!HX}oA@*K&9oNp+y6Y>u|E{0~E%XYy$UeLyw
zowF2Kt&Y>*b@sjN?y!0FQ6HOGD;QrP6Ia>AyLDqK`Sj;ioxnjQ&Y4kHZ;BA4c+WB7
zjutH_y@A_9G94Li)Kn0;eR8&NT3ddqp97dfRvYP0%Lz}-o!q})9acW;Nl24QANT{o
zZ)ej60$&br<BC!9jx+W5S>@6aS=?v2+-!T3(eKaImFI$lKgTgDn)6imXl6^lI+KPA
z{h4~K5EE*Czkd!SmCE2~^yMG+McMY$d={K-q$@cw_augsE8h%HApm&RZ_pkH+2Rk4
z*utLj^w$&uKRW$vr@0z!oYnFN;}lH}WFqUL@emMC7|*{?E?lp-{WzGpzkDm4{}pvK
z4v>=3iE%Ij1ycZc!M9|Gg86pLMxEI#o!8=_(7;rTO*jrw;7M7QQK}oV;ye)`n@!)+
ztmw(C*YlkChoC85ir@RqNTrjpk&{nN-<`*jq4dYw6K;5(U(x2;)nsnY{~23*Nnq~R
zh3uEv*vVieZ;p>`Vm{9sXXYkzKwH&9Vb|f(z14{cBp!AkI#Mqg^ET*j<t}@}v(>Ge
z3@|@XH6_Kbqrr`gjBx&@-AxN9Uy8BjSRaN0dLAGy^(pxp$qlVl$@1MFeK>i=Zg4yF
z*!6Qk_2$b*kS&=}iO5EU2i?ulnXT_?()L_N6QXOLRUeknA8#=)P0x*2x!=P}iaK^2
zV9vk-UEimykJef$WDKl@dtkR3kBV)>a)r5At1nvlxxG`qu@L?~Ig!39JNkU1Mke7*
zZn596YC>L@&?ZR78#Wa<sZQ!H9@|S)6;x<4whni*3$#+k)6ghJ8sS<U#RO9>i+CHI
z5Q#1scyr|+4c5bGZ4)bCV3eb$_DGr}edY#(<;EInkN;kFviqR|q1vLTsFCe+L65Y(
zcJe}K1XnBymqW*_|2(fO5(92D$k8|08`3KZ=l5e1l=3g|T(xxv9W?X**~wDS5|hEY
zGO~UyVc~7PgL<XPYJBt8z4sDu_WJl0Kt^y%3`mD5K#?C=&EXEIc-l-)3N{=mMWLuC
zU9)k4)48l-#b6tp?@dY&kPlP2f@2tIqzDZbqUEJTMBJyYzC7Q^??$(;(NBU}vr#Gh
zUM$ni?$>1I^`2Bxa!^%G=Dcz<lDxN5Pm$2CnxHM2_G`eI?FS_yJsoG}<CRj{?~3w^
z;$>%T-}joc<MT$Pvc0GW>+}T<!xA={6MW-d{KbykTXDVTd-K$mZt)#rcESRoO5Z{?
z8X}?2Mua|u;%hkgUOsL*>GbNXc{;6Yi^9|<`m%U`gPcS&kJ!|Ag%s4~zdLrX_A99F
z5BIVqoO($CnM$L!O}pj}lH^kzt}x7c4GB_7#}b<MY*5={w~alup9v(o&&KU<?KuYE
zHA#xTF&0Mc@gXUc(sHYEo(QnIFkqc0;zr#9&MMe&>|mnF18LK=g>;Mzb##TPsp9D9
z=(~Ks1QOWiTL!_(q1R$MERnEF%27*<1D`X8#$sNFyc<OSXtkM{+KMPMSW+&h4Ht-p
zFyU>24KY2s@9i8?<EQ_t=fLgW6S+NzX`u3AeGs_t*L%HH2kF}oiXMhdZ4((z+lqA+
zxSn>uxoTKg!cSZz#2^vxc~vaA`irM(nri=yXB>S;X+q2`N*x+^WYRPvtj+71)7dxC
z)O3B)A_!{PDq79vO!Kl-!A^o!ew6u#bNsidp))*C?kM{bT|+m|>8pbRyypQse@AHt
z+EO%5keNE?(*ImCSHO;+tIn(FQsE!6ftCrG{SDm#?BAC>780Xa^jv*43E^|GUrhw^
zCd^K3kk5tHGg)*FFOPpJuC<41GQ1pChGz{|#x*mjbF4&Pqo97X?dj`N5bf~zDj<^x
zW>51S5uryWB_v>1b%IK-+(E~TYau*VsLY5^zp52?PZS&2Dg;;@|BTR6{(GI6R3RjK
z*@&al#<3mevCGZJ)0RBiA|p@^3~mzgo`44R@Sw;9Og+FZ*a`fXl`;{S4$M-3BE)Lj
zw!Rl#%>}=?yvlKB8Ny<-5$xKVmsRZ?Iq|on+yBo32vH$hmz>^xNaBfO0>j575w-QZ
zJBd5!nawVS2aQjhD@dyowaw1kLt`r$ok$bBEmfa~H-yChJb$*OW-PBlKifiK5YY4J
z)4!O{SBr6EyhT1Y6hnTuL)$sq?L_juZeZjii+5FTRdY-!!7kXy>E4HoY7!c9zaxH{
z{}+QvN6!v`c>frkP@i=k?WpOD?x`1(#@iy=*$7?iwoF4h$d*_=J1VOh2u&#^XAu@l
zCn@xP5z2iCvQ|U(i>(i+-SfC7jgKo5jx9e^5+-K8l1ZpI^41v-07XTQKi{r!VN@+F
zs6v!NGbHCrc2iabQ2aZ@Ai<@QNEAUjcMBZ`i(XUo_7nvZlftGs%1Et*UHZ@Cl{l7;
z{H{Uahkxp+KB}td&`?ll>2U0h+hdptaza;6_Q;d#pfN@X36von;7K-m-E!qyuh&)w
z$`i961iM`B?#l6EIrI-4@qxVqrY9kz<9vq47Q$!>c*2zMMN*iz%7B*}^i57d;Dml^
zFE7upstWc*)O8R6&S=kEyk0-3lzT*dcfx9q`B+-{g1K)VRbg9S>%`|7g~3hl`x-o4
zQDy~+0WK!sbuE(W<tUtInH{!=$X=sj(JVOLQUdEjSa)3!yCwU>Rh*8jhm6h}QY0dY
zMgd1Q?FZ9SO@SXUkDP4<2(j|}U9j^mkT57E=#)~xx?+jZnW#HS{&Hw*BR|@LpdkkX
zo=>B8h<r-NuFkG9DhH-1x)%AM-V8eQZyQ28`6o>bcNR5AzPgC1Y3jdXGq_A2ICwep
z6L-U4&I@6ws2gT^_lok@2t>TGu(5FvIvShhib&zvK3A#T^e1|eIM|(|O+{zMii$yY
zQw5M36_M{G)&~nnW$k`8BNz#7$6MpSBwzgA*bY(?L19!E*fJwL)!9gmx^8p9$4B<c
zge$YJFd@|Kb+?&}F4R?%GFy}tWectK|7}U7iD2p;O;DneapRRmL(tAJpL?%y8eI0I
z_`c@tmeHfg8vBG2!4)Nl+$P!YL4(ma>RZ}hx1%}wihPPrO{~?t6Uum4pb)4}>c2n`
zLLwO=h<Q&!z+n}Ct&6t2W-CznjP5>r&V2Tlj}Xpope;-2pL>C$)0lRXwp5yPP227*
zyK$oNJ)YA<Kc>ykq)p$HmtY>5dPtat3ZYE;U;B+WAJEVgJjeaFi5?!!lgf&AYFtOj
zI<a@ZOARai4%SHo*8maa%#H$2En6i<KbX~zR-C%(f-g<L-}=H}W7s+HYt@2awdmrl
z5Be_due7%+CO(}Y)NW@s1FKVfCL-S%3O{&YWn?w9G-Ot$wzz^|3OQL=YGmueN;&>E
zghigKp>}l6(7;bdk@N)vdUnFW<P4IN=A^u~{H}zGbBdlF=Rg1xM~*ZrykG-dFzZA4
zOs15rczllI|Fm@e(pCnH(;G0~W00JVT}t&@<qx9yiwop*mRga%!TC0o8RynqR+E9B
z(bvZ8O=pj?l9t3u;m)$zY<Jn2n-lv{R$&_^-<Z#oY1;J^)tADo*^uen{W10Fz{L?%
zP-c2fCbk%y$YDG5x?eaxrdut@RmhqONQR-2a;3=62$o_yhF?R_Z#*yaTBo_r)NOHn
z|LJy2s<4$@%tLumUHvmvs>y{lA;*)e+V~YG!9;Ha=e}KAQ%@9;<ZqPG+p)BqMLzW%
zAAf1Qixd_qt|WbjC-C7(ST<%hfX`=SCW~lWA+|WTfCjv1-4=YBPzMz$u3Y}ABgN70
z*#|)}x=c+gc+gr#cBX_)3$op6*n)ff8dj0lr70g>f9@{9HBe32iPbj*C*YYG8dN~t
z>`zlePA)9v7=?7o`bA+K9GL@TMmi3}BqWs2J~D;UB_tT+>j(8%Sza!kNmwH`o=_Jk
zuD(3Cr(QQ*gU+xCio^bKlVDI~f-aL?4lG&0NOcz$F@C7twPTPLf{_1<Vtxkc#l$pQ
z!*>*v^Ox_$8U?(EHt<V+YEH(ip|5M*=L}lm=HPaVF2P6Ky*26L2uP<A0q@li%eN(Q
zxLoi8$sJj+5iVTZ?<rz6f%!a$3XrEdvxvz#S(IOot2J+?y0YX4hqz5>{OM0sMEKKk
z)iw4*umn#9g%fNC4P0Kv)JU2$Pup>1wQ9m`@%ulVK5hcWH=Z~dEh0T_2GTN8SP*hu
zQjD6cy~>;Fo8xdW5RtSj&t#!o9+rRqarl`m90_4ym*f5o>7)3L_tb*iv*gV6;~nyt
zNvrA8Hvs0PVOP}FDCVa#+5z0|5O>0G0tr<dprDFMr<GcSHZ5?k1}g<kdZokb7tF2v
zh}2MaG)mZQgr33016Pc5xFK-M9#w2x5jKiUR#vvjcAn-HBtb^7SC8zVN0K!Dg++t(
zt(lmb!hY>vSjhOVOYo(Sk{k=3ys7f2Z_}HuWJJ=)h@|WNb|REHyzk(?O1F^-s>tyS
z{Ch=?2M1CU&x}McUhrqxn@%HB`=^aQ?`RxL==5*|GhXDNlq`!9%Q6C;Bsvc&9Q{#R
zR1_|BoeP+xq<ejx64m@Lh8Hczg^%yreYjDn-OA9;aC46w{X!%c2}o?(fQd$cr#@#R
zi=Te;TI~!(uC{Vzw+$w}SO-+wfIs$Q9BRwsSG~Qg+#1`A+nQ5VUqFw?B<70|BihFt
z*#yGxoRYwPxa3;LmpmJ)7)v(V9+H;mUJ?@1)1evvIqJ?XuU1Kf7m5Q{q%{T2Hm0F;
z;--M7Yn3-@`$uwKv(T6jNRTf{1gil8?v?D=?b@oQ>rwBe>-F@{t|U=xcywHMjB!$}
z-32F#Wyw2f;B!d#>nUS#(2r$Gkex)}Bvap!{G#v9Wa&@AkGxut62^%Hy2l>WVbXmY
zRD=%2{6*`e8BaaRk>ceGk}6tRkx9N81U}w^6{1d3QOksTzO2Okpe1SoaJ+b+lNwbS
z{F*Fj26O?E^n&7kheexP%9o=WZgkl|`F$Hiy$H3G0!+6BCMtHqj|->Ygr@_}!RH#Q
z5uEb@Y9s1$;n_<s!F0UoN`-8yf!pw<1z<!pE2(8Iuv5HPcN~IvG8T7cX4`NhV8bHA
zaDpc50Z$txqS1ajK`^~(NZ}sjRGXUyuHmI~_T4cdBqPBjZgo^&pn-lK^gZc;DAd+#
zRbNJBJa-LjLb~~3uX@<f8$-IsBmyqE>z_7BB+@xK#sA;KLi8O;bQ`e_)ZvR$r;z++
zIgwev{eIFPHh-4g$;L_p1BxVphR8V6qwQ@IRf_kN40zD=BiRoc2_Jq)iVNYiIBv*o
z`QIUfXw);I35+#uq1%?TnNFrYwww0|NIEl9eNXDvt*{klE&0_->B~bF7a3q<vQ3{I
z%AbtmVURi6daBv-Ypo9Ivc!gTfSGf#Cq{Z{Z2#AAS&Ajs+sX>n9=4!%+gCVl#B<R=
zl4%W{;&da8NkAL7ga3TR^g)sfq9e`r-B2wMn`cWNa{2lll+9t<iDtK9^P^mE$hZuA
zmux@zeG<(AszrYzzW$ATW3@9Phq2T8+^8U-+84+`zgi2?;Zq$7`~wdQ4Vl{t6IOgZ
zj07z{nhYvLp9AI8CZ%3m=3GYDYYW~oKDu30e*eI6#WNFqq6f;cy`N9P5EoAbZ-HU}
zq9EJm<pK#jyD*rFI}|HCm^C6zHXabq#z|<&oXlmEE;s0?+5PBUlJi#(g~LV)lba)m
zO9CAsIrn+a$!~hEdjH(WI*U(RC`#TZ=6a~BIhN?t@*(Ne^(xr)RH+6QC8nzgi^h29
z$4@U!wq(E`X3!>1(E|&O;6Y{kv6OLn@b$XxKRRoEa><7aEM*Ol`PePhm9|RSt|Iee
zjgXX5_q>%O;NuMe_?&p~`%KnjP4W{ctzX98s;$<0V0PWya@@~q{}}|<sF4gVnf>H#
zPqFKo^UC&^<tzij=Zt9C*zW1z&H-?$GBW8akV%8?MNV<izkhD}a}No_736QwW%uN1
z1?RhNx~q~^Svy5BDaoo3RR3WprPvbQS9&|1OiL`6{_ILF2YA3pN{6T9{XrBk_*GOD
zFLd7*WK<R;{5N?Q14GxCF6}9;>Uc{<8k~HmDX&0}SjYpX!1<o7GVRhl6CsypqaQ4u
zA>ZdPrvzmF80@&}mIpbxSR=xrymE~Avjw;iA&S6JgVkadk72_giny^{?Tp&Pz|9@&
zl+dR*)cb?=eCmo@@&N(wVxdaT;`yZ5nU(NFX=%pJco*v#;*iRDVx^HN>GAiGTO&QF
z1wt$-U9CUUdTJXI4OO!xWZ{{z0S)<{jec5SP_;J>`fnli^W<#Yp+>^s?*Hm+QwP^Z
z7z{KttGQjzxId|5J?rK+^xiy3-yYVKE%wlHacOa^?nRh#6*^y8T6#D7e03SNTu+db
zR3Kj8{+urBmteBueCJ|1zQixXGa%$4j0YF`qkr4*mwmO%cOePmcreprdEV)dLmHe^
zsYHLtLB04%;CMjDPQgtasrKBbnxrViS9JhxxX1k(o@V+tluyZ>jkxLsQX$WBtgA~~
z>~h9G8VEtgflrWrj{6DJtiK(K^)bH@F4bgq`Wx1ze{-gQ)plZ-S!dpvO&OPnN@NW=
zEQ5zh6nfP0i4@Ojac}j1afP2p)J=mr3<DiKy<q7-OdM$W_;Sq5%=W=hNZ?KR;7H(u
zzCOH8l8(d3v>u3-Atk*85W9rMR=9<P3ZUQKFtNzN)hm>+Bk@n|Fjh9CJSsSB5&*~U
zG=_>m^$541tcRJgg56zgp`(&6GM+{CE=Y~bXzqqMw_qF^#{?-+k-@`mAz(mzwf8|}
z)|RD0Ub<%E7<3D-1#1DyjLeE`?Yk3o#0c%|CX+B48yvdzqXKetoH{33?fPw}2M3)&
zq@Ltk(P2G%N_vXEB<lMcmxNE9Dpc1ji(w*(-GY4;g(Y#e^R!|o2IT}KBEpDiO1+u_
zGb7>;x@wK4*YO2AD5oN%2mi=dp06FlH{d6ag9s{zlph}O;|H)v%uJU6!5~*DbSDC#
zB{hai?rGrhmSZaq@0bY&2y0r6kKm(X6hT1_riJYy13?LslanLvRK)t5uZPl2#@cS~
zoA9g9I1@8-nKi&iielSn#`G8EX_B>2rrx1hB#6cL&JOf1xVq$Ei)4?uS;GFa-GaCD
zQl#YjSyx@?fcMPNV!py{bmzDBt?DUu(T=2btdYw#u7l=A52%bl%Z$+sr{XPPWJCBl
z%c5iEZfZ`f<nQ!`!mHH`lUGSSWktAH^2-tCms2U$pr&DlD#AZ(k$)4f0qHJSb}0@^
z*bm&GMOR8BxKNN-_6h0Na}-c(dk4uv8KUS+yT*W?j(ub#Wszg@@ev2f#6iE^z4AI7
zgxa;*f!`C<TQoCQp4A_&sDVwF-8Q8Kg{My84U9ZjEO!%#UG6*Q^_}e(2mUuDfe3<$
z;6hQ-l9IEar~!)~Yk_ZHDD-698VIGP2)vpM!i3!D13LylJUX_RkD%ZXAmd0lu&qXN
z9Lc89#Oy%eiJc_er;u={P=IgiB97WYx^46&<UBeLiC*m}i^&j%9zvgw?%dw7>`@-#
zF-$0y-*-h8>q~3L!Z~9c^uZrZ7V&&_WPj?khRi)$0BK2sWRgT4*%bNBi6kQ<RXq5+
zwMh|`>#ci?)bqIlP7P#DP+ik(7rY9A|Ke)Oeg#6>UMbO`{&uc%0WnA=^>ux&$9+&|
z1Kg|$`)?kn{dhSl(FnQkuDNbQeszRqFY~IBbROLtoy>sj4oM<`6`%$;&zmRM>X!iK
zq5BKUoHIU|EXz+)9i-kyCa|Lrf+tXBGA;bX+ULK^*%uG8D5RmGA-tBbFVSjy0p34H
zU0FyoA4{~p8T9cIQ0^D&;he|WB0P<AVQ#J*$j(c7&H;9qjn0{!<;fNt7<wl<+H1)D
zh7;4p)dT2<Twma$?b(_^a0v|Pr>6ksT(<e3BoGOQQ&9HPrz~x?J%7I$ggxjBf95T=
zZhN|U`Nbbb<o^$Bby^AP((oD~0e`xIZe82O)7PY!P(wjFm4MgH`LSrFb)8vp?3Y)C
zun`MRzU9@1L_j~qXyI6f{-J>^Wh5~*Z=5OQCVY%6r^_j)DoK1&oMl7@*0e-UisgOX
z$RX7#AXQPhyCGW&CH_D#C$p&!UtKbm$t(wyFKB!J!N2*`;P!ia8_m~m$DbfOUDWg=
z(Q2g-uKmpzQF00D=nL&mfj~IYC_jj{?0i{H8d*qgp<tqtX+?U_mv43l+<m5cX+Akb
zmh&b5?l@K6YHq)A7!%1<)Q63mB~i_bR^3*Tx^|74srFd3+Yuo|d0ik2qSK(vDaS3v
zzr@kF%3RZDY5{+Eco-vnn?t9*QNX!Kx~$Amrw&+5js}v9jpcZ0$cdsAa=s1S|2FT_
z@N$gLQTV(MkOxQAgisb1tQ4CqY44225%gyjdS4HE7NDv>(<#GFfJZ=Em3A0BG~!AN
z^<TFLHWwFzC#mY?*=<v&21M1~Cid^r{M+8AH)YgfpawOZ%4Nj3KA_GMyh?gV(mNRR
z0J_rXQ7y04BDZKhtGDV>5ab!Cki*-F4Fqkj*~%)<Pm9OJOnqM7;DvXL{BF7ACidYI
z&bE4E;}k>em}{H~k868A)3w9A8xY~(EY9@7&vUGj!xaU0bZ%Y3pa~(96gh04;4dJd
zqNL`2&VHA~r{5pJ^fE6+V69Y<bGY&!74NV5cR0Ew#yqarSThnrbCgk7pGMMUC!C^9
zbzoujOUCoJ6_#T0P6}tXdHEFsRS;@(49jjrS5S}6YWI7<YNrH!f3d-bkp0&~_S6xl
zUC#Bt&AorEE8huu9E*BdE`I9Sa6CfM{cFm>JpD(cVy$Xs0y8l?Qb<>8h|J33J!&CY
z^7C2d_5K06$wj}Rv$oc0g8?(Vb+(mJ{`U9+_egF%HPql`ggQM3+HX91x_zI<>YvSU
z$U(D@xrrzy>+I~T`<g?ms;X)V8lm^cacPp8l2YQJ{e>TaZgvppVH^*>QOm|73Xke8
zMTA*fr}3~G$BKcazmtMCDKQyzT>FDWwI5)}(gurhS`Ues4CXB|U`1NQtT++o!{^El
z3~6p)-Zu$@KVAw7jy<eOhq*~M)?hJp^1sH%PG5pch`zCqC;a6{Q|9e|12lCC)VG10
zx6R|GZ&$S8(F!)4;oJaJ3C2{6{A8#*;9{f<d!_z9AB$>K!bO-~##Gk1%vp1*Qrg0@
z6?hZVdGBI26WoUR+8aY)Cr2&VcU>3lt7cAo;A#lg+&ug`(^M1})<0A~5})k#aE^cu
zu~`I3MI80RDGU?~w9!OYbvJ{+)`_>5X$W(TiH=QiO?}c%!Bya3-?y?-HB&$f_&l6%
z;=t~QUOsPq?7|9zxs&&lBH+MWYW;b#%<#p{jWcHgtW*p3;WNP#{pxQErWVktgA@hw
zg02C<EGmvhXyE2@ip+l+Brbc=8}2iQ3RQT7GEpqp;be|PN=ix-2++dE+4mkodR)Hv
zSY=ox{%6d+3l!|8UX)U$^}YmGd;&_KqGLIM`vM%fFgbvOz39Q<@gabBVz~6;!2hnt
zKMp!~t`2)#Jx(M`kAHpEX=Yl`^EP;5mLMvoC|d8LJAvHq<}8gLE=30g4%`k|TZ;W#
zEk#yOi|q`)11&X+SMyBh^SMFV0eMS<{@m<9eYRls;+IpEYjCovs`#7{q@uE>;Fxlk
z{Rog}0i=!=nTRF{cwg&-7+augux$rMuhB}emWu^8kP9r*sOe?{Q(42>s9gva+Q$mS
z|N9Sb2a4M5;Q^Z{zmbRpcJ3#!O(m^$`nV-!*;?6{iJF52FpG#7W5EyTczb}nNoLpk
zop;litT1ftDr#zGJBB8OcV2TObc7y}@nf*0{$x{N4(WYIF(5irgZI^UB1{x+7`<^j
z;&Xx~L!+w`%=Ngk-*$m7Aq~%$zdnu9Q?zM{6Ht_}2ruPx{4d`YqYCF~ufC#K3i-mM
zl8BVpRa5pahFp_}a{{sbXso^1kftn2sozN2?vbXQrxQ6ItIxD%WA<h!5n_v9LxnVk
z1IgI5*lXS%NWZVOd`ea*7b+^h-+8(oaa{RI7>yW7WKS^EhK6Qfg5yyvZVv-m!Ay79
zIo(H9?FA2QQYu3X6pw;RPqIs;Q<AbYUBt7@KS_C!j(r3{$l{vLTRFb8e`R7Zf9mRh
zb3yKHFHUCLq9$Mg=))eS?%=WBMYCB<x)j4jte_rMzQ#y$$N-poFQ8m5ci0WALz_|(
zNZ{v>*)BjR8bE;pObX_if&HY@ng!^}<{fTqrls3fiZ1;K{*3P?A{g)sa}uUtkfAP&
z{=`Dxr9I=u`iy<DRCWBzNc|{}Au0CnPd@VX8_dIj%eUYXiX9)8g=4SIA8vtRQ79G6
zc|5bp9IWMewE%j>kX^kvy;Ue3r)sZ@ouV<nK1tkp3d*0j+l?xFHO(RsjZ(341X5c8
zuPB;jS3kF(`>=3&H$Us5O!NCVjLY&+AIvMrRj{B$)v4&xGtzxXaqu^@)YRsgc*F9y
zl1+P8ta9B~rra;6=cyDC<6Vds1h-|1RnakEBkjTQo}Lemj$)=|ID1f0RhUh0C&9YW
zU*|$<+Ag`<Z`axFgLha7*!}VT(v8XgW?=r=<%50OWnS8Edk}l&&GH_t_1ThHvbS3%
zWXm*Cb%c*QBT695o7iH%r8v{|f}SAoN=Luf%NTdcO|1Ln91j!R2hDp0*=s81)hnm#
zMVp24b0JPgPmdtram5;H2ty|rN&z6K8{Th$rVC>Z`;DuVvoF~4byxMuVp|K7#Wxig
zmSv5}z|2y@^(V0CkCjrX07+nEs*aEINMgaa-i4<hR9oFCP3DAtV{!N+iw;WP#s{kU
zF)@^%tEQw&mzf!Rho&SxZ{X)S8t6kwuR2a#^?HN~Xr;AG_Tb^-5<g=qkj>qm4q%;t
zaGQh3NAR}K*E^Y8Y~7?>u22V93?a@xp^@-~^*+x=bAU0blyu_0^?n*98oo|r*0&@G
zsdUm=y4oWMW<-2E0kBhk*L)?xc;n`Aj@Z}-8X7v^S>)zZ5=po;Zm}XHEjDGr0Qf`u
z*ubn|<pSEuk5|zyRR>46$8vQualwFxX}9~nimg$<F1oY!UE^+ZL+q~md(5URbLwzj
z0wXJ`v9Cri;$Th9qpz$k*bpe0QSWfY>|GQ1&}}Io0t3T9N${?b$C9qYA59mtKh1j1
zb`Q1H9vX4YT9PV{a&VOKbr|9}@LyM6mv1DjtUmY_b<?t!9Zvwi!z+N_wAb{DRD#HB
zBIcm$e)frl+-7JvRdZ%5so!`$g3#-r8y!<M=T<R~)MVBZ)68cB#k$*+B(D*Z*8_U-
z6y#Mo>g&T<(iv$1<ph>O(xfUEPQ@qSb65WM72#R<q?6qhG)F!Om?r<7qW>*Qx0mzz
z6GHMWzxxmnMamKXb?(<W542PKdJviEi)zqb(}jZOcHCgL<)@C0ONk(GIVuPsC=r)b
z5vx<{oPvDY6ARA9$OFOBhMv*&S)}Gck-hbN4+A!y#}NwPAe_ycnZQpp5@w8c0~U_i
z3bLJ>5z-`(Z{@QNo$BAME94RA1;%XytX05?`0p52Swk<la6>{GSxiC+t!nP6ZwQID
z@GOf3HyOJ8_I(^}%(L0=OiBWg<>kou=I{;HChe3nbiT)$^@YT+!@9T!Xd7Vh?GGo!
z2{g<2%vXJPKmfESwg7g=3m~eFz6V$zO!2UIvl34)o|PQ==JH9K?Xot|5Iu`-r(JvV
zPmsHwSgUF!S}SarT)hf$PPGI5WTqk3RhidqC&FCu9<fJ=p%~72p19EezB>jd@wVI-
zI&fm|L$t?BFXQuox48Ar4Oq^6BD?s9$TDQwYAlVl6N>x<?OfssgQx674)M<A!8^+y
zK%`wzj%n2{^8O-Z3!B>HCo$eZ^w@ra4ix?h$5dvE0i}-#85=uw$;1JRx=?xq;NRNa
z)TtO4#&xFP;o<v0Yk%YqcI)YU9CWIEuRcDyYRb<8)*yB?=Nox^Yu2`Hh`oxt_{`za
zLu>RpI31|dI568b2I&Awl2B*OaogxV2^F}!GRbW?so*9=!x@0k&7ZX(%XAWF<a7lZ
zP?WKTZvACeQ2TXjeVH^aSh7eGos6S%qKihM&qxos>$3eUzQuEz`I*>FaQ~tBS<8cD
zkZT)M@%hhWpqc2h%*`o6?&erW>Wm4Z8?Npnd*FPwz4pZV(_ez;eKW1Qyz=Gm46^d<
z@PEH78q8LjpW$KGOG?^O&plG4)W?%t;q~!o`Mc;EzFlEfmbEu1^kiq9-u&^@^EI?w
zZ!TsketScV5*n^&!~kC&8UflI`*|ZuClFXZs+|+u6#tmWq^U-|wI9GLhkP{MLEXxw
zqxK`VlsJDdBsLsfNlxk*Vwm}fI4$)(yUt<4|2yii7b+?ps6Qw60;5uqQ*K-``kKuj
zI==@B8rp1cm73SOSB2gl?Hh$$y{%tL&PbgwevV<C9Mi^jTjTWzEvb~adp0`BPuDHI
z0>bE@>71DMJ=fU`P}F6KJCV?cxFrgYV^49ejtEo?iQU$jjVvP#tADi(>9{uB3gX<9
zQ$GZVU-<Z<D*Auide8nps@^iF%{J`TE|g-$-QC^Y-5rX%Q(S_(ySsafJH=g!yGwA2
zTX6XDyz}in@BW{eOeV>FUFSO2I@V3MwiT+i5>#_sgQA*A5ImY%!-daPw-ppzg+dl2
z-d7$C@W&njLl}bZ@hzB}d;cv}WdudM=etiu1nv>y;RUxw*(au^hH}B(z^1Tfn;FS>
zlwPw?L^425h?GdVk+NZNFV5AYcCM0E<Rt)%e30meNESwFNKe+f@%PM%Co?<i+?ciM
zbZwx%l@yzyfW@$2%Vw7zf-`Ov#o$S^kl;B|#;@HHg#qKr-zCRPc((mNSev8bSoRym
zu{D|V;IqTR!|>0%YRZ%}dX#<?l&NeLz+sxunf8~E-h>2K#*!eYHq=l!=!MwGREAX0
zN+1d|U`v;&&*Vj}7(NN6zjvW{naG}O*L>eACR~HWThMKB34?{N4KdY9?8T)IwelY<
zXQW!%O;jl@>x@MUEx=}!$Uxn{*(`Y^quNZen+0i=!Cv0fUj+t@@UyTH5iY2s(*8Y(
z{I+v^q=;Y7>KHR-Cdq5kWzD!Z<xeJ1&guX7hM(zmgZtzRB%>$;pp|IkNhFC;&^@MQ
zKjt+#e_wA=<`P@FSf?`e1L=}KjY*J~(2%Sl;*w1?I?b61JRKCUnB6{82^W<LG-uz`
z3xmb44annbu$2fLCaw51>d-i`bADmu;9!^jU0&3Hhnk-*dom!29?2G*6jd;dwg(*^
z@<F?$w>va7GrXWIz;q-cDNmVI(Cw{ms^3sYz~6Sf-|6@f$NWLArnbiim>!ZtB{H9>
zx(YguZFPRKnSk!PIj>9F<Qv&4;tz>a`umc{gJVD$cZeS|Y->aUKLIM~YX4#}{!8S>
zTOrqj^W$Xz{bZ%vEG}<wrNBS%uEG!|gQY1#BmHk^yurD@gv6-HO))X+O}5W$gSZ~n
zg5WrGhvmcQ8kzVL@R2?#7bQ-S-<nf;lC4hXdj?C~j_doOjH1#IWiO93^yt^G9KxyH
z-}tX1q>0&1-D5WrT6misXl$gL2jVH^hXTGRp+Si4BX}?<`{^$^HQ$O~a96|%eQkez
zti-r$foA6(sdD8a6Qo2_A1#Qg2MCQkTP28Tj|DZdjT&sU?G9J?NB9tZmaNen97Nh^
zOpUkwoVK(wcH)^vX=+0jeuN(QCLak)wlOf`zIKwC6_sF=7uU(gw;PXNCuS-Dm-V~0
zxEYpN;D#pO&rXPDOos-)CU(XnX|{v2=kt<Zfd~LSP&S6qe9t}mL-B#+l0q1X!R>j2
zcJf#OXDaM<G*!M<ovjlH)T`^OBk~f3=ET;jcA?njK01=g;|CVp<qx*h>|M`pag#3D
zi_Y@rHSURZ-DL1)x=iKCOq|f9%yAy&z$UUmNe!9J(0R1$;PBp4pid!rZl5gq)}&xK
zcvfKuw7ek^3vD)6WSi+2#fU7B_6fzrzlZAHO^l7P<a`GsxG6j*vpK&nV(ru!2_uV2
z24^{YHis@WWMq?8u0>8-^8H!43VVc+ziyEr{7Ezw`X$E+om1R?W*j%qd8In4{qxt#
zEGau7{YrI8D--^5)k+lai;O~nCzEN3aQ~C56s~+|59da^2d_iEd)UqNzcoUi82P*_
zN*XBO>-Tz3O){l_$3KH#M{4|;b)C3sq;0*S{ol-q$|ocH1|K)WdvpwbH$TduLcW1^
z3QVtQt+FXV*gu1CoI&j#HTx>{_T&!j)(mL-WTA#h!>n|_6Uh~@=ueRPw4?l93B5rP
z#Qp<W;x9Sg-T{wv0#5}qLVZhZ!qHs6n9S=8&c<i{@FW(`goJOs$cA5qa%ee8Fidyv
zvUNROu0%%JF;Z+{g#a8tc;?ZKA;Q8Rc13o{PWzhbsLa`@eg+NJa4&=6y(9deVX(*`
zEPIY(pc<Oh<0>C1(vDy67c*sihig(?2T-#wdc&h)bfAAs79o3F_)hQV`xQ~mpZ`+N
zmE-Z>_4v3rY>v2CV?+>PX}Tq1LMOmDx)nQ_&J@}GX!_ib4{-4=%in^^vg~+gPYz7`
z;)^^xDOYf5ZY-%jJK4Jjm^bB}n#7^$&)H|(%>ao70X|#%$c({9GzSiZK~<JhKa{}R
z?4V_B*{dN283BiNVo^rwvW*ioS1|Z>vougVpUa%U`+K*NJOJo?ZMUBjD9_xjk!r?!
zCN??dV_&I?yTaZGLd@Z^AE>J9v8_h_mum$^#f<27h5xcj=2~S94XkC(qI=ab`iVfG
zId3I4l_+iY*J@uEDxL%CKF4;WmC>Q&l<Msg(97OTes;60=Lmekua(YOwm;9lP6C-G
z%-%X|ci{@4p`*{0E8?5!95>Afu?rAr^vO#?v$C?5doU^zpSInCse74kv<hN&p>CTK
zZPR2<r6l!r?Ko%Ybu7b-%q5L_KtVVJiEDr9Yx~79lcOy1z#nNp5?#M^yiMUJQCt1+
z<yp4J{=gjF5U|T8rt%CN<9E{RU0f4ZNt&-^{FCW?gW^Oj$Sz)udRPs(lDv|3v4wV7
zh86zpl+NUL_pOw2*au_RR`Bd^jks+GoESNrXk(HA>F_qyTS#-;L&Z*SP^Uu&9`1#%
zv)GUQe9SwbKvk(HGYI3NhA4a{L>%R~byxF;*ZEz!bl~6Lr<K>KKB;aPWE%M{`z8Sl
zkW;aNfC33oF+RFiYDEsmZ2{L<Vqu~mhF+A=$VBH2UzU=alhf(Npu#Ilvz4Bmr{dmi
zxS%RS^Bu<7a5v~5H77;|-G1CT$|2jAc-awzeJHK#P1&60&v%5v|Hckeuqoe#!11|B
zds1Wgj>PYmyU4l|I(5FNGh)DcP9gTXc~@DvY89+b>t2YHN~Vlnv#Y8)zz3Y!A!(p8
z@Wc1_dsUQi+*z+~`p0M0GHJoU%$&j&qbEw_*G9j62)nB3QeQVUzTcSKO*Is)3A1;F
zMykhmyS{WplT_a}i>fhWIGW7wuoFLZ6r2uW=aO5M`ABjcQ(?d?7Gdu^;+0{Xg|1lr
z=*}eoD5ETs@~D8f6l2GoH1}86NKDXA+8;|(sO>r>+H~DOwBF%s)taOsky$DEB<Z?-
z^>G@G>*accjS`Wv%`S4>6h$EwD|f>i-Avp@^^Ww@@->AgDqu&ZM({&TvEqSllt92V
z=x|GV(aZ)+I|&4f4<u$ERaePhG^lyz{HSp=Py4uk*<rDH;~jy;VXaCo7+?J0z=R}-
zQQ`qY`93WD$Zw&z)xyNY#Ff1HnZcJ)>zL0-CNdV>0Bk^4Meq2jZ7zk+>rxt_(^wQ%
z=SZ25=9ET;L$kLDyIPO;xZ`Kl{X36#ojz`;$*p+(PXjuT|7@uf+5g1`wYFow4F~Wt
zP9=B+FsDeS)Xzy(*u1$9X+QtXpSWFukHu`@u+5#-zX6aLynQAv4oE<D{wxXT8#4)+
z%THG~N7-tnL^kq&0c`rNd{w*TIoI!n?*yf1{i5yMslLop%vY!W5X0$R`^Aqg=y92J
zBb(_xrT%o?s1u1zAC=?50LbV?TRUqbYw;r}SHcOI3Gm_^N#Or}A@MK3$P4$D>&W<0
zo_V(>p%;q#`^pjQU{|xEZt@vf%BqDtVDCnFJNUk}MnM{fM&Y=8uns$038qFAv#R>z
ztMg#0>-DNUaiQxdN44&RgOR=@E!TlGd6_#2RXzaPu)qm-B%c?L_F|)0tQodO=MP4J
z_Y2Zndj|ooDWr$=2bV<DNMLdIbl)k3+F%`qcsk)^$bLj@Ul=*R$+nez;vA`JGmbqw
zPfeQR%%KY~3dUjZ)9)7Uvde?-<>55yX%&aPzE-aZ@6IqQ1pBxr;T{1SD{6$uy(VR$
zUMmy^Jt8+km6|`;ExA(2;r>r~5n$oSo@#4Nd0I-}nv$>Cp8PQl7BNAzU|YvBDDZ-u
zgarp%G2a0S7I6MuG8BbnIF&f@wkD15PbeH{$%;5>-~J7Ryi(#=M-+)^4|iBbsomy*
zxt;xrw*CI<>xOdrp~!1z(e9cq=Xtr#`b|FLe1N@92=>P-)Pm(38c%uiC@7)z6C9PF
z%;iOIek$KV%Q`q66^--91FcF;F8BOFodu2h(#*<@ItQ*-=X?L7b=7yB;taP5%|W(J
zTD)hRkKh3CFWtMdhrY)sy=kJXV61--_`q^(q1dfAh%1MgzEP^jeK8T?Nkf>Gl@iPO
zxsDoRe$(-^IrnrtiO&M;a-C%*M+CB+?sVHx`|DmaI^?@ha>>RvBhhMinP<sn>}Wsc
z>$vp7Ay0oG@=?VU;-}H#@Ku%1ZJE;vPd71o<%oJ8r?eTejZU694kx0+kT6j}K8vwW
zf38$y-u*p86T-RJkRW3=!oX*NdtM_Zi5a6r^5X=>Cf%pq4C4->qQsiFNe&p#L6tce
zTuL>gzrz8HxW9FGTJ23Hg$Uwh(OJxqJBl+2c|N*Nwtsl2@}x!<7TeQcXBYpjsxj0Q
zC)y-@C9=c|EUL&4LO=KyAm0jiffE(CLHG^F&YZNYg#Ih?rZ=Y0`*}e-D4O<UsiX=v
zP^wrP%VxP+KRzSh3&9cIZ{Gz@vF(IfSyjy-FZOzu7TwbL`o=G|7bKZ40xH%)A(?)&
zEG{W=Ue>V+YDRtaV@v1)7izVGyLP8u8{O2J`W(?~zCn~_R0<}oV`?TQ;>~q`gIjZu
zJ+{-c>>8Pl<M;sIO04C^6kRV;riFLrw9D-vTQvHG8o{IM|2@EGi@~>nWXg4S@L3yV
zRp7VGVz08nm^EOt#H*hAth3%DX%sUxNwzE6_qqXY7RtM+NcXtnG`Z9S>uk@7@MynV
zjnm^?NjuP$1?F<Q&x{4m6C_1YtfxIxdz;5?hc)G!#O!vWz&8LDWGET#f9uQRgGyY@
zWGjPX*Ap$=wGZlnvx9{y2^{t)F(PKDtF89<p3PX__An^kR(d}y;=w*$oT{n8a76KH
zy~1)z(4;#89U~*>q49erGb6Q2T&B;f8y_+|H>lzps*}_w*5q~M^lz~zvhR|{akVbJ
zvrl4NbFiY4UQsvS6P$25{WjR2u`NQjLZ9~vh_hT(EV4>Xm~x&f=onWL8MKw+&4$CC
z+YkTA-}JY2&ML<KU;wv7$JuNl<t!h|Wa;fkSOiD|el*hd-tH}G;xZa^BH^|hds=lp
z*J)Z8po9sqvZ*q}K8};Es?>Y49`)Rj`g7i?4f1QN_Pf|9R3NiHU(k<y<u;0fDe%Xn
zM&LmjcK99+G%Y&rbo`7tyYzwV?L5P4AeB7K+AOK70>@m`NeV9t-d{uE(67Pi4*ak9
z3ORCsU$FT;X?#K)lKEVSF(Tq9g%Dr(E@M*K_T#v>Szx}w{ki0K+7(HdwR4@9d#R~R
zX4s~`BCk=?S$TsE4dvYj(GG?eYo|iZ@<u~QP+3X`UT5){0bJ85RG?-XDMC(22T`;|
z*NugPCBF2S|6npz*CoV=n`|8tO8>euUJ*BZgt+E;JhgIjf8{usyj1niAkRpliy%We
zD-?Awf`sFwZ?mlx%K903&IV_hnXrruMV^m>j*Orn;D$LgbeVLWV&5$m_6m+Q&?IlY
zWRb=W<;?T)slT7hNiF8P2uZS9MDc468pTlPnD@`JabZ3(i~_$K%;0Z!0ZOd<&-c#g
z4WzG7{pX02A5(c!?bAjAMxWroCwzthANcK&B<eYc4VbSHkN*IAs{;E_6gn@J+%CNc
z3}4TTZuaQ!N`=QjP<K76ja&AqlM^ZT_;>JevBRaO+{P!g6~G$qW1v>jK5$)PiwPC5
z2|#Dcc7pKsaL(HODX!&N?{I)b6$<bvvCwzF|J>O52;b@i5N|_<>KbRy9zxR*eplx9
zzPE1LHHH)XD!m^tMDgm6N;WB@%$}Edy6LA@MohW)cutEF<7YQ1vPWp%n`wEm)kN=)
z1_qun=LQ+=xL^h!x~n?P_#_YWq|zK+d0`vH0}Oq>T)kWIdb>>x&12e4N+eCLM2!=o
zsHH}9I{ZNbcv&6vl(%LTU*yDIlT0lvl=`N_GBaTThxv*8kScQfOcKPTrb+OPHU2^E
zHoG$QWxZPgOTJA2<?N}0Lvj>5*O}3+l1NjBwXhBSoLhN)n<#~N8+9rNLTFF3$OPJ<
zF2dsnC6Dt?kuICT-60=WQNs|UTn>B>i86z}N)Q9xqH~d$+YgXQ4+nSA^Mb2g!f089
z8+(p*y{7SBX?cDy*m>!|d7QgcUkyiEWDOLfMP1>~`!Ns0CXTb*mH%1WAoewcf|VvC
z>0n$Ry%OE7HC@n2DWoX*`1k1-KaMV3$I8m2U02pZXi0TJMZ$n}u|Ggk_q|Tg1v`0f
z_-BoeYT*dfzl-s7iqi=r1%=Y6L(T&1sMoy6$Y^j5kr)WcyNJkl2JZ{ncC|$9+hw#+
zxLQVb?0tipF7Rdae!OH9t2a*tP(3yiq^1MK9HwnIeYZ5T71CTSEv3!Ilh0rHv^~x@
z6+>Y%c2jQ_oEut^dzlO6Tt?61S_7DdRL<bP!JdxF3S;Nf;tWGff!;@dqVqD))hdwV
z;^Imft1zM^1MM1F;s^kn&WvO-l{*kw55Fjb<NfGsz8JWSQ(BS+`@e-(^FyOL$uJ^W
zOwY-{@|c(<>rf+%E+FqjSNT7{zC2u*P0q82_)&gaRXd%f!VuV3-TD@FZLD|Tuu5ZQ
zk=VQf-)>&5-)i1~<01r;p)4>X@hf%MJ^omew)EdGRh|Y3>%0fO)~Mxd4k!(b{j5>q
zes&?zg)j%&$r;yBn5~_!y#<Ed9eY+q_yLat`sNnpW2?n-)DnTJC!^Iuqr9|H?v{N1
z@|cIiW5}^s@4P-kFWckop8pVXeboZaGZb?U<^2cHXC_%qHsIoLg3!$CHo}c{JlCYd
z2!-M;tWy^N`r>2^!mlCiLmC30gf`ZL<~!7kdF*dtF|kXI1NB_|quLoCSJYQQ(u%bu
z6O_P4!DdHoeSV2=m#m`19q-;l(XyxIMW?oZw_cV)13~Z2ZX%<vPg*ytjTSLFsm|m4
zP2dTw5|zY$KvK*$sU%#|QB-XHu{lySpzK}8aJmTZU-KuB00?%Kb4N>62GVhJV}l!R
z#I>+ipmIMti)=Qo|JNw14V8@!Q5Mn;?cM(kJM*1ccPug?0p@YAQY8g46f9;lKt^Ce
z7<2-;C%m9%e(T4(;uB#|be%WKHd1XGEe8@%VNPq}q)WT<TprH-QsXtOLt~tFTL*Cb
z*rq~%bsZutygMG=nHkL$?hRVjD5Sr$x~$9YcGIb1WTs7i7-Y)ie0Pxu=ZkhZ+lc3Q
zf2hLRM{X*RcB5|yx8yjJe`)lPv~1}fFiKp0=TRu&o4ZDKvT4o|O48jy?zMYw_4~?o
z3^>cl=x&20K!6nN;8!p*zb7MS+XCB6&ryklGdb)Dz=tf#YL6ekrwXc^m>8tc=bNi*
zBJIafjwAFp`29VCu+k}6;szrtVx_al|Av1#VmE{mO$mC5`OLOW4CkB(Du?J~!gw2}
z1a68x6Cv*A>{$g3Q+xu^PA|O%CabT|Zi?Km>ueX-JeLh9r^H7A!FHD~g30WBq*gU%
zq@(DSSxo=l!=G#9cqimRyWmQ)k=(W(F|C<PO$=lh=m=6FH)i;<>MOrnp%-`b?b%{M
zG-U*{MOA<CeOV(EqLJ?R_sB@aq1EpdQD1<Jk@gGVr^k;Rj^*kp)EIty=U2@PQo*ur
z8W|zYC!gQt4xuoVabC>Aj-fE(WF<GfSA^dy7^EVaHPo{|OalWQ?Ru|A{s~M8)C*5V
ze|h!naRgnRAJdAA0i=Rx42AD!#iiDQ<B_LyadO%v3$dWM?2Dt_Pucn0SYD6lWMsa<
zU{FvvGSooMbHdb=-X{Y0(*-<deA|h(ey72j{CS@Yd$&=8N_{jL%fgN<oYtPfD{?cq
zY(bH}7EpVlJ>l?G#}c#PN@n-jwaXH>^_gYk@iQ-Mo>EDv5vp^<Rq&LJg^aRSXJgs#
z&~pY-s)ur$e@kc5i?%RzcfLDf9H?j=4TVd&;brQ<92;Ee_5rw>M^{U=>zydCq}xs!
zt=Bq}K>@b96HJ%4dT$n`2b+Y7!l5hUE0!5msxP<RSMS>Q0n=}y`?r%%CYM)pkABu~
zktfTZm&~8k56;^q63)HKfH$XOA5dJ~GYjF-peHSE9_!f=zthdZM1$$G3j-=|Dki;_
z>BO>cfAwrAT*iH*j?}1v8+QJ4zDqmXJgVHdsB`>Jr7d5sY-U78MBxhp1VU%LOTS(2
z)gCiyP_!|9jUf#5H*y6A6g4brIw~SLJe#d7;<Mq~1^4rH^tMeeVJgLLG!2)wpKEN@
zXn%^gzJ)a&X`3vMo9&@X^z}B~_4v3+%WX)YXS`(v>$d=`iPj6K!~?IQub9cn2TR8t
zV}0;3D2_L?#4cg>|Dh}hW>Qp*&J8rxyBTzPJXotxxC-Tkvx2XVAFw<-PD|GVLwV!~
z1Bk8=k;>K~6b>BcTPC3})YDyv3BqpFx}#E07BpJrN0m>lrhl&Nx>mY-QHjpCs;JYM
z49U3mhJL=4Bf`QZVBA#`k}%A!k|BBosL-ra$x@T$An}qdYEI{C>q}aEdAYx!#=7z!
z%F37?P-L&jlqDvv63IHkrS%fxc`bOdo~1cYkV_pm{<dt7A@6=$1Qi+jzTUDXqc|ht
zMxn@+feQ_gd%?ckrW^>Fh9>3QD+ORQHFV}7{&}<%4sN|s^*^Kk#&yU+9^sq%hEn#x
z=g;}(a(&dd{%b|n^K;3{`I3@-w#qT!fXOIyi!xp^EV{9Kx0FkAa;&j>(-&B&N{a9g
zf8{tjt=s8fERfClAG2zMkKj@FJMxf33<@wGEv0vS%YfmEjK}M1w-P}R@^N=$6Z0FT
zZf8fad=6W+ex7~sk$Ih@m>OF$nyD&Xb^@2<n(ex%{!fnR7<fXUXn5*vv+W9mO;m&S
z{hgY?!>t|;r_AJNj4<}M>>*iQU%<HOWjYhX0C+dZ$=|zI3@I_(B4z86%zzP&CmN*m
zE2`X&B^Ebw^U8E{c)@8UnAqtvrLNGZw@3SBK`d3RD5W%oejdb{tkhY$OlD619S>~t
zmEj6GL<M1-V@*`rDe^4GUA5UIFjQ;PL83Nlu)J~uNSVmm(?KTirUAYvCu>a=H$@;s
zHsXb(=T$wjZO?V$m_AaG!1v&JYNm_{lx_`=zI|{aY~)}(rHuIWIBU1T$e4gg@h}y-
zcy<g7OR|_uvwIN_kF-pmRXI)mt?Zdi7m%a$j=HO25w33-nexl{ot&GCqRE9V!+9*P
zPGM+LU*R<6<)FWHLZ;Ei`MG+d-g}r$;Nx~@wo{q-C%U4TSFxXz4Lbamba+Iu@iEdl
z1C5xTP9-8Xy}#bjU$;wWtDx9{ki5=^zTb!PikCa@&&ckxYMS41vCu-3Z~b`O7qgx;
znrR%E<HX1E1*LX{)u@`^u%5QkVDlPHwseay^KNo?pbYAS{BG`w!+6db?N~3+M#a)X
zS!V9pFP1(jaw*w#KiiCP`8xTGH9^qgz31qXNTjH&V?THB0^S#zTr#bvl|?wfZ5gp$
z1^yDP2VTCP+fNQbG?XZt1hZlB=#;2#82+WM*yH*?o^NcaU=}PjzzLg^yX$q=-r=EB
z?m<fQr_x5T>hWn#ow*J-J=OKOXpUTMq60CBGp;Bxb}18OAd|Fbq6G%SMojw1GOMU|
z*H1)4uVeJw#m=VGE!2)`H3y%CF4*=6R5mEJ&MWY4aY`U7iwRAVsUpuqHzl5PN)I>Z
zWiDO>Y`81hu@TLM44JS1rcAa7<Ocw~a$P~Z);m4jLH$|eKa3`8kfr{s&4C-4!e$eh
zkHhDlp0!d~*@3Kqvj!`u|LeLyKnCT87;z@8fzoK)4>`CwwATfm&T)jnTe_aOW;_0f
zllRr1jF8)~C*El98h>)ZTj=WG(Er3%Fn}!@;w!Z05y{jaD*g6~*%A$<*Ay^iXj&WM
zmZ`J571onHF?A7ISx|6eqiX#DOnxr3^VVy!{B>5k1gUxFgjMbT2BH@Lm44nAe1O47
z*Cdbf*|r7kx;k$@C;n0X?3`hXES!Q({#ZfcVS%kWY=At#wwEVZ#h)#c$5zh;F9!lF
zm6OHJTi=O(bDQ6lp<xi|pOvYlf=$&U&6<}#)Dsg22=&R!?T}t%b^_T(Q<T)tCjDOF
z1Cn`O{b=Ms`h*a5h-?3l^){(Bp4QjP%QAh(Q>bcI^pCN5v|{{UhZatl<y;KL?SH4*
zI|3biL65yAlTQ;v!ZJ@#cf055*7f2>%D1A)>en#|+kJJP*Nwo5*PGEWOQVz>n!NLC
zGe1L!y?Oo^*02m#z%;Q6?d!R_P6esG4k<h<-TuP$z1acK4YaR}>z7{Y{k<{fD+;|-
zA^hJ`sI<eetwtC^T^O^yRn;e8Eez|;o9i4aIVS3Wm5P>bFryd#&1IMHJ{GE)%+=zz
zvd&f$BZ{nTdQ>dT2oa#L$T2E-y(NK#{~G4x;Rww3d0lveweH=Pe$qVQ>6v|D#NAtg
zMTUwq`fuCK0C})rbH1Xe>kpPF%4vT6`V|iIAHp6Qc^>q`z#S7B5pVGT3+@3Q=r8zq
za{81vYhi9K;~!s`GR-;p^>v{X_L?vhZdw2-Zh!1R8$Y(}q4>yYzK2(eK5pl?BAU_x
zt2GUrQ)*gTk;2pY=~xpg9v+ndL3}Y3WBf=BwsOP)=Al-3$ql}XrB6b%#}OrBRE5c}
zS(0_ZI#uBvc3HgfkvcQnC;hW6z6L_*8yr4;k}7b?_IF_lgTe!BJS^R*#-b5TQq|rp
zFG1s;pD6;tq1y_wirf)D61@%h{KCn}MPFhBA_SCp-J5}oo77T&wS{_==NmO`ct%P@
z+0;UpTQDGPozvNvNlBHA>di*uL#BHqp<wgEp_6_an85$_v1Kk+M~pri`B=n<Fo>-<
z@Rkaf7aG#_{;jKKF*+3A)m5z#y4u*_+6lWG<?}D0&g9<^TqHu(1|A$gga-z$>9hUR
zJTdG0p8wPF0Od(yQWVYH&vwB8e2*xO+kcwzUh3?u+eWdPow?x?uUd^yiyiL4);qsg
z211VYy*ZBrZdmpt=?wWvuWajk&I@0W1TcxaPnKO8{|^h`8Ev}DI9dP+ef<1#wLy^h
znM`$R8t~phaAlou2VdACTMDYy(r$dR+W+i7-r1F4Q|aUvR5q@QNo2|P#bV^G(ZfCS
zCxEbS#TsKrH>oSUluyo|KJbi%ZF!ene_yn_lJNO~-Tb|lL*j6I4-Kwi2ll)7XhO6i
z%IPIhI4w~K^=?q-RbNcPmSu2hg;nH`XBMldK57$;-9DLZW}odg1drXo;gdutk90ye
z&f9HAlvZcs9@)<=sw+!9B9EW$p<jZ_)Yljw3%sUl5Oht#p9O@Nu&N|GeCI588?Zm3
zvr-74{g%&nb@Ks=RfdnaEVG_(_jhvlsG^I6{D2~vYA4m~ZZ!pHt2%=aj|)OXk^4K3
zb3FwgRK%}sg4Z~pNKo<U=M$2eqzs3ecV`}dtJ!faBr4gK1JYHy_mm^O8V3?(G>g54
zIZyg*c5=HT7Lz3M50|(L)%|r>O{nIp<I<>gs>-}TtB&CqY%_3RIy`bVN@-~oG)*?k
z2DaDCHFVFj(dSJZvWfYC18&d>cC~+?GYq|dnLw%!WcVTOTk~_H;y>?CH5V(~(FNM|
zrbq>EjGesXn@QqSmC%dh#g;@-t_$KW9mh?UgHG6X@z^Mu$#p5ANE_o~gNj>N_?k6R
zF{I@5ss%e9)ip;@urL!~3Vda&C3j*rh`s+posz!01<~k@VP}VlJ-Q(%7x~Z;u{;vc
zm+)v&k?Jy#GwbZZBKvn6(?Z{$tQIz~F>ZxvlJU3$4^G={Z?$7{JimE^E+dM!HtJm@
zTj$n{+1x+t8BmjwiodlmnidZr<Z+l!ns;5V`bEaU{z`6JW+!7peH8i#c<ME=GI95U
z>TpL@j4M_sE^S6Q93~5GYegZHND@z_aZ!=Ri-c!95&AF{f?s|Qgfrc0cPucZLFq`}
zG1m?)v3H-FKg4lXb1a!tdBqq}zX-+1pGou&JLs@QFE1xfs5;xaIc%&;z8n6r9T<6{
zoeLOGqv8v@d4%t7Qnc=<5gW93UU15#aoDWiPLa%{DYYht409G+nEUMl)^!)oi1+55
zOAeynjSa%CDJ+<?VIkE1x!JEb_dnh2$L)5s7C834V`+4WFuJ#XI+FF-vndAm5usim
zjYyQ<589ZrrsD&C7&=ovJ-*#Jhz^)bCnnlwM9eFFz!#c~!QP%$6o5OMLag0GbfuQ$
zDte!mcm8LS{Qv9HeMM4%c95kuW5)bC7^<p)iGK@an7cneUbX4r&#YCmOmxlPcU8Wc
z-hl^Q2-s_%(tYmJPO8a2h{&~YM&Q)XRJp#=YbaxJe~v3D9rpY)dfL^$?Wz|-i28N1
z)-RBMs~5Cz8i>2R@GhS&2<}rJ{%-kzveT$8^_+U&eHwl@x*g)F1lIT11^i42-zjXw
z_<RM~spklFH>$L^t?CRXyRTKw%DpwaeV0NI>=zKmsEU5MsMZ0o`|CFjuvj&2yS*8L
zq3DU*WiZh9mnNfzA<^%=xhN_fNoPIgOyysSKzHCnmg=(i)4$nXzTZfmn@H*ELYqMz
z9J}_c7fhDQ5)J?#0r3Pj)}=>i6pPPj&vGa2Le(o^RcU1ALmTRiTxF(P3EH*%>qm<1
z5PGYb8HMQ6viAca32nC-sFib^Fo(O?PmZqV-IGa4z@E_GXQSn0otDsojH6A8;k^q?
z>+}3XFB&#gn=P}?#DR4J9dimjy5*h5t{C10MJW0nBCC%E)Lj$Kr;QnM5{@#vb7Z5C
zU^#iz>4gcu&$0e1ocZUjL>x@Lb*c$lcwr#O@))+WS4{69rL4LOMoTm%C|6HJ*Ef(r
z=JA#9HN0N2jP3#}$XX2W&nI_c1AJeYQ}U|Js9b*3g;v5+1>a(a_L#Of0r__0s4qob
z&NAtIp&#f<5En~ft%YaaMe!<%^vHY>OQhl&&ukQ<n-$NE!Cu4o_qUe^BxWQp(_i{Q
zZh{Hms&-hgu=BNsXQ7eGK>Y?gJv|*ya#2D37$uJ%VEM!Pl{t7mR_WNe#gdeHV5d^Y
zuFG54{NF+EHL<9T%_r$U|6=<XHVh>#GHsekhl8Sh)nQqaN{zsHFS|`T6Wc#?j(?33
zJN~&=?%Vyz^X3os97)g~!^30b)QXq{7MZk%^efz%>k|zXG7;DYFi*c)Y^a%GQQ7Ml
zeZM)fOO2()_;r!+mI*`ORO()T{6gLb5W~hkzW${KjGveL^XJcl@))&w(|43c=f-OS
zSQ}Z<EwDF`)p8QY<U^6oP*>E?VWx##MeCn+>9a}D;HtjQ$%~-71!2NzhI0C&3s;A`
z0(;Waw(XTjZZmGU3BSixOq<X~><^>tkSd3ci4^B>`B2tPw7PYZQ~ru;Q;%sr)XTrz
zz^j0B-pLMAw!Ki=&47<f2-WZ{c7Ik}qk!y4+KPO}Bcr^qQY6#i_;quf=-9}0B*KMz
zHm@|<pO@b7f9*v!{K;=xtvhgibDN?Z874gC{C9&1cmFaIlCG9bv=Mpk_7o4fE5<*#
z-69X9+Bt}ym4bL4izg8Gxdu#!o9%2{rkfj0iM76)_0Pn36fW$tK6!5cG^da@9UfRw
z#EQw_S*H+qwtvCHT<7-@$P*m_3%EG$my+5o?fCwmV<D#gkM@8{6myTi97ndNz;_2v
z1N~-vd@gt;{AUjItM`3n9>D#0*Nw5QL-uZjeWVwa$4Tg?F9-rUPC&Yvkm(oe;glW#
z|I>vSLd@G%FE-XDZb#sO&HI5k^4E{8b6ILe0}jVX4&gk&hOxlHk8vM;#@KpEA9#h#
z7=JIq%Rl>;Zc{Q`17&nwc3|bfn^fc|Ypz7v2Md53rHk<xZA_DuP}2lUfCOv(Ioe3G
z0IMjN0z4b1F5rO4lA<!;g7bTQc!-T7s8|J@WO}f;&$TyC%8oY3r7_hbEECE><wiM#
zX|t8<bzMi$g^hdc{2IxmL(X{$Pq|}OK-Y<}KpNMejEIJ>sMZv)`!jdLMn(nE+wsXt
z0N6uO5C%Y|cW@sjC#xsoN%l)b#G9zCYte@)=}^1<<$JX3`=)LM{OEMxuWVpr;TcM8
z^bKGcQOXU+mVmsB#=qqBzfkAHIh)L`LxB(HnoM%$quyAHYzKiNoQ@e+3KjLIuu9|R
z;biUm#;x|6kc~#iny3RcG&IEc-IQW(e0$HoJ_%l>02Dh?ncVw+J)Jcrn2ZG)W_|*s
z*&KlbU+-{F85P>`nF<0u1~Oge{#5)G-1(aDCG~p~{1)<nz`rvO%uB)DLnvV<qrtQu
z7^MMP^JmvbL(h|Ke%8m3nY`H|RWWef{9aM1V5CP@j{ISr95M@o2BQ&)REK(h|CnfS
ztbbHi-zsQ4#2L{`ukHwJ@ot)Gn5ig3<9l%?&5D`8fTtX6=pwaI%v}QC;(6}>GeklB
zfJbZW2HU))6IH6+t{uUJojhmNO|j{=7o9i>`$~%OGdK?52Tb8Ga$XbrxdC9yB2&Y&
zMr^ICb^8A~ynx|>^BiDYGN)vTSSZWmB})whc*)5JwoC0^i;EodFl6;|n%E{5aM&cP
zIuzffm20DGak#j+Oj=ZF)d-}ora_1dt~N>bg#`Kt(z3ANh=(UYNd(rnSL=r^t#}4U
zzBs$SKeT;k@mM6uN=T8+u1ag+C!A>guKvp3^hp<FRxjj(>2Z$w&0|k(-u$DN4<Fmm
zotjN;9ap$kv$c7_h3Vx;Uf=1t8m}qfI!hQILadfL=i5A<xQ=p6Uy-QDM*Vz5SA_*3
zTcG`B`&<*2hqauQYYVJ~q%jx*zAGvjDIoNE&hDxb_}@x$^cpyrGf7tDkDn{gsNY^M
zCps28^LE;v{&Nc$_T@BoaB!)K;sHVHif<`3{~9~_(P?*FtS*Wk4i@Im;@|dtYDFH$
zeQ$D!%(f?C@cbB{fOAzqB-o^)n@K$o60U=cYSK@`<j%0F5p8VfL=V@k9txx*kQdo@
z?yl>OIr6(89Jy+d*d;0>rFe&eM=QY`d46Vk{H_e)44&rm5|;3U;i3VNIMS;PmYDE-
zL+FguUfi5M{T2%i*Ab34V|R{0%m0>ZwSx!H#!I?zs#Yw?#Y3Tn6`*@QGD@nGlhoPu
zO(#uzW1C7dvho*YL-~CGGeZNCG0vkUGr%tPF_`i0-{}?hl>27eHemGggOTBfeAm+`
zHsU8u&@-5!BvM3M+i=R`Jo(iUf`<mGS(vwSOekp;Yv~t>iJV-tDwPo6QvbRT^7M3}
z0>6y3L&~?_PIesxxLCJ1LO2)%d&>3Y8*434W_x~HxZGvLh)X~Dtfzh)Bt4dQbZ>MY
zi7RN#rM++-Y-%eYyTAQ**Ax{PZKLXX3bk<f`KSBNzT^IPdV$x|a*$gxaq>*345$Ma
zweSlNeEW+3A9G+2T|A;2%tCFpL7++l&8k6QUC)c0<J5C$iW1uZIp3J3m$jp<RNoeT
zo8oCCE_<DnnyKAPxY`uz+w1&`aaAanjH0}xloYf+6Si)f3x&qR{^RJu5B1-FBZ+cm
zvDh8E&@1u;u|6MxFqx143WmLN$UT3k3%pq5u|Q#e>|yhqO)ku}Rg_4EhAP=VH}yB=
zn*So?xMlEdviK@w>K~97^Z8nBt5-$4<2v1|9ob^Edp}n)OC_W`PiCU2PJJ9mgn<!G
z`?wQ!A&Ck59V<vy905A=+Te@F1+A2CbATufqg|jjJf161qx#ZE;HVo!cj>#UT5Wg%
z`};Y4Zs|;7lf|xlmkr5Yci7lSmQ+db)1<VZ9X|=!F9ypOoBm2quY!sZ6sck*E@S*_
zkHc}fR(-}l^L?+X{pUJD*XN~==fTZd<62XPoaatXQ-Cw-NFKkI6JFFo>GEy+GtQKb
zM=}^Zp39h{Mt^fEEIhno^a-;QRX!;xPXJU&uLC#HXt!}0g~Izb<6Rf=*vAy1vSzZ~
zQ6UIFAo#w`NqZh&aNn%GUFC|jd`RuB=hTk=InECer6#=Uy5d_ms~IOOL0$vh^Mfp7
zsR@XEuY(#S<RQfPp$SS54`3@>b)ia8h-<ulkpRH}9|0^l{0WZYi-H|^Mpy4nFb~Lx
zp^Fla*<X2?5FUzP(+myG`C^G3mEH>ex#~Mse}Qj9>IPSTQNd!b?93&Am?7Kdvil6{
zycSlpa+ZjQPXen8kP!_!mT};Zv=dPWdddPDznJjg3R(*E?65%<_`SewqXWx&d)^^_
zSIIjy&hCI4-D6#6a6?SQC4IDHwzR4^^B;9=rf*#$P%YLU07Wx5;y0t%Mt$D{JTRy|
zBUa9IxVOW>3{YZm7$lLzMV(Q6KmT0@WLakTc=Bny1kQ<${lg5yq4xx#C{6yMW*0<<
zvC1Y^_gjis)Q;ws*+@5o#+Q9iPOZ3z1OsF!Xr8j4WG+``V&u7)G2h?U;PsK8ne>-9
zwB>ZyUu{mUs$!)lLQ{)|6xo$Go_^%b*FS36@z3T_!J!#P-3jzPA81#-k3=8WlQClI
z%SsD*0XG!l3voo8kWn?Jg!&YW8@*2uUEjKw#Mn3BMhW1P)H9<YLzM<?`v+F586Y1-
zL|!k^P*ckxp==c^!X*vWtH=l$Jya4C@u~Qj3wwKcKhzpLm8BJ<H15R!x8u|~O`k&B
z0<FUTOKQ}HLgIzwt1C9mSWx0e{CpY}PRz=(`TOvET!4SEkiK@B*h{7NB}Swh<=PM(
z2?=Qgj1RSs&tkVSy*(ILWRj6NgLj*ZiPk;g=`CL98UCMa3|NwpJ72T<(mv4cyXG(?
z4Q2A9fjwjUR7)T9+WU^)rZ0#odxN+Up+_FOx|uX}o*dg^`c2wEqrC~)Z~By+WMi?V
zdek=dNH9WDDhnYV--!U;<AO`xx?w=(j|kMGSqWJ-w`)#^WFZ`i6PzOwA*TB;cQklZ
z(A7>aoLZYKc-e{-^!Da^U5G;bO`zv#@4Kr?;`O>+9cOT;En<+}pHdS%xlx{6qX8dE
zghULD(gluqVM9-k>T8*Wo<*rrD#w)}s&_nGOvVwY;09z;*mU;YGLaTkucw&b_GH=^
ziz7o$bxn|@YDj#HKjNIXUM~>j`@iGC!m=LLkmoC##&_v+keL;$qG|`<MvMGv^GVpY
zOEJXcF^?vVup<6L$nM}bc7Ihh6zpQsKz=VxI&jjyY@Lz1d%pG;nq@x>Ub%01SlBG*
z;Qen`TfNO%uk%J-fynVB!q2r<b$Eiv%vOWgFD4G#T5hhCIZv7~|GLQ4jZ8R>^5gOR
zD)Z)cqDBF7xiSV)@W_xe!vol=TfF>7+xA7?I5wD)@nr+q`OhzsFku5us(6RvN-w@w
z=X${d#m+M&Gvs6)n3wPG1fdjV#df+p%XJg|+w(35Dl#eqBQ0_$J%3qJ)6$LA9gwX1
z6PZ*%4-4!=CnB>#Z}$tPn=gIn?RPKqk|!$GdV5zIJE1MYj1hr7Mz`h<XUuYd&#{%0
zF7VXghnXPsQmLxD?n2qfs{@4>{{=H>*4apajt<_j>n5C+N+B~4Ok*0*ra18D+v=Z}
z`}Peffftc0ErZ`o7TjE}nEhXTZWFAVZf-skFrE@4dJ-bK^XRUpEQfHk-6qp3FNGuG
zBLrZ2t)?Lx46e9)SgN{**$%lf&bGeUkNCDf7D|q=@F6Zl{*2G6<V)grUe(#1Ta3R7
zju0;I>9|#wa#PY~@3aKs@q%}Rkef~=SW`8Pl^S#@TzuKh_Ia71u?QI~f6L)QTG@7D
zzTqfMhW_eivf`tqWez(<OIC9lUp(b;d>bB{GN8u8Zfu}sM(+F$uS&I!{q=A^DlT5K
zGZpEC%zh><DSixA`b!O0xWonQU<ta@MBd|)CPnX|B_A~S$Y|1I-gN#X&*Xcztxlg3
z)fF!dm$`J1ki|79wy0G<RwCm$F&?=67BRXj*I=xjv2g1hQ9@jyWhq987at@pZMuu1
zGue5Ab!WI7g{!{TT<2TR)j=WwOPa%w9>L?RB!6K{wX85hYHWwrct2gky24OFUbsqH
z!cL`p78{jPZaR}smKrIA%ciNGEGQ95N!#2XmZ>6#7@0z+<y_7vw~<Kg<bE2J<)Y7L
zk=-0eP(3w0a@57Bb_|&sg(+?;866!jB_?L~tLZ!LJXi8Y+XKVZ;<C_hb6dwZvR#)y
zlkBGBcD8p@DOc*;1MgDJ$YA#a4g{#+FGn(|A6ZmQMZWi60(Q&EzEoQE>`)tXa1^gl
z%A4<E6#N4?TjS8^6-O9l&FG#d%j$;SMOH?vZ2G|KnGQsRExZ!?t%>IEzC-RlqM_R`
z9eDX=5wG;#2)s08YS*q-O~6lhCHjjg@4IFi#e+OdMxv%l+8oKSJ~Gnca`F}RryT1#
zWL_v9zZUeLQz7`BJQnj%Z3%){y{mR*>(Yl+y7X0RcOC&Uw2So$62+5|RP#BFliIJR
zee3nyIPi)hzY9xdjUNSXVf0z=_{>=80fSO&o4+tb|Gr1YIZ~!)@fWFEme0n<o5Dtb
z;6&6S6a=0&Mz?sEJ&Lu6j-PKTav_LXI(6HceoI;y$j~?Fn<UNQ2>oL~!1uy)=(te2
z>v37Bkq(+wEX`Uql9U=Ik<6T?NljlT{RVUhLoYW}Qz5?nrR%?3Vu7+N#zq(hon}c^
zBN4_AwwJ_1L5-bA0Q;@8)EflVVL@^YGBS@~Mz-mHmASpCia(vt15TQEmf2e(f2%|5
zV%BN~__Y3SH>XoOS>GSL<K@zb|7r)xMaFn>v+O=^GkSM>UN66{q~S;%KS$UZ{QUFZ
z8q3Nr-EQE`@cF{UH6Lri%Ska43oe2Gl4oDJ%k90gXNUX8FCJ`D0nPG(kDz!gkFjdI
zJjp&{$n|Mm>I##8Q@ukMy?&_n>lJ1z>+V#4YZ-Iq%FN)k{2#fir`G~Ydj^cBL6jG3
zz5A|Ks;>Q?J*@qZ^nWM4=}MAxI%%xRo&dveem;LvelZGu@^UVr(~XqS(=ZItwVAdk
z8Fb?H!auURnt|7C5x9^qh$%OK-M*kFuuWyQMvq%v&H#OZB|>M;-kAYXDl#!R^kTh*
z{XQBVE#Gr5s{NvMgT-_Rc4#D8C8IrjUV6Il>(8x@CGC|tKlE}7ukTR<z<oL}v(nh-
z0}B;lV;>cF^8lxp<!<|k&c00VdAB^yPDT5K=G~yXUo}ea?CGi;QR}dF^rPEH;l=~|
zAd@`|ZfQw!D-~xgPEfmdPB!GG_4txyE-fE0pPagRzjD~*kkoxy(|!zKhBUFCEs22j
zPfZ)&Zd3O+bVU}@06ED=dx(z)KYsEOn<){-avM&v%3iLgB?LoK@04{)CaP@K0JajE
zu?sLr2U6+U`Jpia^&3cZn|<2gI`v{HXOpC-3l=<it6V4|OWuCeWJk8b-?$zz;2Ayo
zv^s8Rmoc8)h45Z^WME5D=5J<JO&5@vqC3ryH_d&9_T#XduxVXCz(|d2ugkvV!INu<
zhuiifBqrhv4UOPi07XTEXjVIj*6g&hOsD)$-St^*y0od?Ug)=~_%hixcoZW7L65!>
zT}O|7&OvWS9*Q-mPOY?@$dIK#&BS`})GL*E{jg#LlK@8eMcv+H;Rtxvt4>a!ainU|
zrQ8I^zo)^+4-F0B2)~;BPq>!>Qkof(z=)@%P>qm|wM>0IE!~M%s4~%8T*cZ0LW~h1
zikHv9TSZ=w5Lc&$zZo{M9i(7dmXvhb)$l#pT;jMi2@EEtuhq1>KbmU`s7YIDR1v8b
z)iu~W^q?w-h{S;CauD>+Dp^K2EQ%U@DxY)@b9i&z>;DEL{zWeTLS1bN$ZVlBJub7O
zacIUD&0fd(85HuK)^`J_7o0s^B<g5TUW4Ac0!QNE5Ygqc;tQ?B)jig4gIaOWu@myU
zU$RStY_c8~gD*;iEcnz0X$G&kP$7Zguz5<^7*@(g2b!`y;xBg-&Jx18Q$C1QGu_3R
z^|$+{8@V1T58Fn*=*!(lnssj!#Ohq}vwK|=>SdEchuriAEva*zLOm;*^X~im_~qq3
z;9jQRsVT$+c^dudR&}?xNdV97l_P|3G!a%1_A<BPj!)dN><q1OOQUsH$L+#Bp7*j_
zmNFP96LkrGjFXY$?s@&^-)}!}oDh-ESvRulT)uss$T$V#v@ZCE_WrFjvJm|1SHd36
zOfNrUCOmUQwMKya86vQ{d@>-R!rUa!?Yfv&+xjrlstVx#J3XlV0|6dRe017i5?F@-
zbL;VF_5nFx;GUY|uS_^^unU~QWuS;(mhaUJ0O~Cl9J-81r_-x2$ds3s=X@2nV~%p{
zwnert;NphllS=%R88b`(vv`_0=ySJyFnP_#WW%E<{_ftzJ+o!j3AcZ&yU*I?s5>&_
z%e!O)btK-=->I;@lAZ7P;(bN9Y}6x{VXccqtCDua=G<+Kqpbbs`e2x^{;N}Qw%rUn
zu|kV}kCk%AHjnpV(M(qDNLfK0`yr<C)f?`}>-Ot<YL>;LM|DI(!H5aVj=+5um}+DT
zE)A0?ye8qMAKMiz5@TDr&1AQVZ;+{!D_gDAp<-LcjsmSc-yQ#;MdDV~@JV0(CHKYW
z|NNN$=fb|rA|BX`c#72mCVb4lY_vIYBh-VX`v{$=|DIP^5CO2BGX-w`;IAgOudo)b
z%7qsm?cWRPG4DCdzudw0WA`w!r)KkUG<Afyg(fTI|C|9B0T#_4qb!i~Bdg1hU&UG6
zhO9-PU_-<R<)No<BUnlz_!L6F`|C!Fl8Kx&#i}3*;5JTf`^uUKeLTznrtXTj{vseZ
z+vS8Jo`H66bC@K(<?y|j%nSv&?z(#^cNAKtUSEj09xpjbc5VqkhakrKZsDJ(g?n)G
zaTp|vj$vYl2W7>QVog-%zKi*M_3x)oh0gaywcqgr00M|JEZ!GBprJ=uy_En(eGu7Y
zyu{suQiO@`MA=OD0{6<LW0l;Cp_iSf;A?r+M@t^3eR@B@uSL$=A=h^S>~$zFGx;rG
z_OjQ-deg&=eD-vsXcS^6<gN9&KFt8LqT3?iUCTJ#F9fF5uzNbyv}smpJ%KhH5zXGN
zO$MC@<G78%j19}U%+r+|As6iMXspw*FTY}MwP;)La|aJF2ncND=39KQlGS4n3W`*q
zQN-P!Tt2u|cQ2Ql*AWg8-4_JFSd@Y7ZVc;`Rx+)q-j`b=SY+3~n(D310@B<P4A>dz
z7&%uI3<8jMpYNE(<b#5$o8}$I+pobpX315=9n#V6J!2vbrem`rZW6G!JukYcyFY5U
z2b<m_B!+;~5&2?QA0bYM!|IYjGChFCrCP_%NA9P?)QQBbBki<*>rHiV3oWD0PHBAZ
zmK_+&?{9a2YvAZ{(Z*!dd8~lVH<*abGYB0WqO*X_&w|gTjL52CHTK8cD5=jPYSRMk
zs}gdLSNOK#N&~ePFQn(^lMc{HMCyI_v@3x1_xX+N>nbrxjl>i2l;<8?N!zq{^yz4+
zU)t4rWHge!z%y@m&0y152TXL@fa{3zzzBN8?nRs7r~&sD>GGzHc&7v4f)N0mkHX$>
z-;TfTk*&ks__;;dNZN&}0(7Qh(hPFbT?UI+3C|8|Ql3xo3EPi7E1YwXlPSOxx2{E>
z@D)L)xGEEz?NHYUV0TCMh}#voIE~(5xIMe|_z%^Ikey%mgr*+Bm6i8YslcgETAqK8
z$^ACE;okfVfAwQaXXcRv!bw+ez&`My#JT%szN_nQ*-mPyo{HcV8BnoHI1=jGt8VBc
zydZEo^MLPHZuP<)ws4<GyunClgERmB9}R++2~3n|aul+jB_W3$U^$P#8C^^u^52}!
zi@)X>q>Yo9$on5-FZi$9*AN)U{^j>>`=zuKqU>lvc=4<$WN4~O>He4UmA?qfvtk?9
zapHX_e;nkZp|t$4p78Ta23IFNf97r@YD5tl3BQ~*g&!ZIc(xo?%y8Hrl@TYsEcpqE
zgn93u_!$83VE)QM&K9^{TZ1c0qnoaLOn5N@b^zct?Ay}skB{t%^e~*9sH}?I>CRcU
zSLHvT*0HC2fzq1aCB5mQ@8^GjuqUs;0p}lcZ?fU0m?V>!6B%xc+wv7AQ*kQ^FHOB_
z75-h1J<G?O&pr`%0Q<epCL0<5kNK+P@E^|)^ZbU27NFXMNB1<hvKp=-n|yE3P@4Jg
z(yA~wm`bc|^oFCD|BtJ0jIML-)^1kQ#%j{oHXGYkV>Y&JG-{m2wr$&uZQC}#r~7^P
zIcI#oGBQSzCu^-6*PQdhlm9*3w)=TnHAPB0RtASc3y4+dAo;ju*6XKXt`a#%!Y~rC
z2hg7A5(HExn+3at=R)2C5vQcmv#EVpX2jKJ7lN5t`fr;mAKyu)oQChpEz`4Zmv8Ru
zUxW_@6=(|0RY>>w<ViO*KCgeTk%EY62qwBMxxu_Xj;Yt%z^doD$Hf$Rrq6h*<1w8<
z2{haS;*4ZmA8`?SbJx3cobW%n&uT*2OeVqxq2N2L;TYtYH>pwIc^W^hG*B}?Nv2$f
zoqCm<hp6OasI<&}<2E+cIP%z@bNaE&lwWXYzC``AA%m<vvLo=G>)z#{&(|xQr+xEg
z?cPG~c_&Zzn_=60&C_$bXNLQ_`w#anFZ|$-HtsLQy|&L!PXWJfoj87YJ717;%L9|_
zL@8WF>^h@SOsN!>(Vfd~7`nefHY_6~$rN8@Jb{!Pqa2}S;0xZlu8V0fqq*A2;{Tlx
z06Hg|CQVYPay-M30QY9V6dA)DJHDL32JkECMDp_~54c>OW!?-6gJp7-=kGSJXhZ#*
zIE4h7e3a5M@0Ln1MMXjJiFa@G&X$QAGDW{_Fb?%$1vR5gx82(gMni<Ed?h5MMhwUs
zYqy`&9?%;>yM7NHro#>WrDNPSyUvz-YPsFa?DAT(D<(1Cdl$ZFr1o<-^mjDNswt7I
zlZI*5_Zm!8a$?x&shgMGfm&>m<}nUo%T09Uw3zyR8M>GBG{?V+G+kG=brWe@2kVS+
zGq<w_`a56Y&hQV*aLY*d1Mc@{mL85T55Rj6zDo>^Se$YGlv&To{R}$3boS0pcZVvR
zZ#S0inO}FOnPY`LXKuZBl=i}$PtDUzE>CaUR)L~oO-=_sjOUj7+|y|#Qx3PgK9%Wf
zE@KQ2kSnkLL-QH4w72p44RdOKiScd4acS62I*X!;zX;d(@bE{3D{sK}{PX)40$SXH
zR6FSMmNO1}<<A4n2ShZVr*rhV*&?$Q-l7BbbP1OM$}r!+n=jFTuK=utK6c9NZyqGh
zkH5b7@-*jL_$A*rhF0{B{g85ez-Bi0+K;xa)JT*rqjXQm679&!ADLZ_n)t>~U_+jk
z+#wQ<jFIA>u=XTyG!k3F@gyuHf+>6Mh80GBf%+w)3Qf9eLqTMF;1kTn^>}C%sc{;T
zzzUtAH5rJs&Ha{t-OF=wG0tdeleOoeO$I$stA+gA)^t`=DB@8$YdE*bFR&hw`G*MA
z2R<ZPMI+rjin<XTO|^v+Iyxw9oYNWk03p#-&)^*<?V&%fX3oCJM+R5+RDULZN-TX=
z_!DMHr)Dw-v{WNt$YkQ*^okCd;ww~xPdS}+GgQ@y5#(!C@lS{)Lfvl;e9yR>iOK}4
zUDqS(gj<}~6e~)KrU>ZR<7_AK!NO-IERiIW9fpwe*K^ZH1s^Zl@7wP@(9e97(jR-7
z_;&=aZa$wy4za>d-}u`W3@b=`&2}FJ9Yv_nSXSIfB`>|TU6s;A+%uh<%T{Y2DvGb;
zWahIS73?Q(xlSd7V%lCnXC6KTD!eC8-TU8mk8`%FT<uNWC*6B$c@(#sGT*GZTPU(a
zUA_M%b-NyA9krblM%zs2NDbuo`;56uFp@*7E>2ThO)Ehs+&qvT7(W@<@SpP7mk1dw
z?c9DObNfxe)%B5INn{@!;%gJnZ-)ydy$Jso9)=#TDRD9a0)j5$EZw7+bhv33a4zt#
zF;|4em>G7X6c?{^HxcGnCF}u#k59vqMc;VFKl-===lW{Y)Ddwjfo(FS#r4*VVjkDU
z7;HbpMgnZ{$_$mDx8s~s*1j8w(MM)TFtg7bKy+dFhpc4z_p_FBdO&?Y30vPFj)s7x
zNRRdKOVnqbhWVKMW02X3X?cjN><zOlV}A^r0>1!b_ynQudb=mLWlMQ*djpGb+Kqiq
zUvm$FuOH4eLPzogoxIj|-g{!W%T`U%Mg?s6;3l8qA*+dFOP;19X1=NYU1Z$OiruWm
zk^~M>(dDYG=4NW9poCJEZJofyU%vx-SfIGy&_UF}$_danqc2#l(ho9KfQV7{+y-W&
zmMSR3xz$0mTFpAM#Y&A^AyiU~wPG&)7{=(50nLB-X~H;EGOv(0@(q_ee7gaL%Kxxr
zZ4!wxzroDglS|zIoN2d%@(i!1KNefIuY*&pL64!eeKn9XK0af%4`MW5j*>3`6)6~Q
zZ8neVl>w1hVOY3h8I<*M{pgNJzu4+c!;rJN3)ox<Cdf!y+(Uz`U~}q+^gtN`Z%}Tn
zB8m|wblSD^iGYUd+gPef)#e%2WRsvC&UR$YS*^<^0%?T{68cJWq%xw<#R0g5T9f*V
zyFOn=`kt#a?~wm!^<ko_nwsy_)OV)OLpN)szP8k`agHF$-_yJ0uLf?HAu0+_H~P)K
z{4#1EiQBhZ=SOam?49m5+cH{mW^AtBwCi4GEHnTETAaSg$guo1_h%8v?{_5{c4bY0
z*%}o@uwW4s7NRS7??As^`mhOg<d#W2&-1KlKWvMJ(FeyQR8*D3(iQ;<WTA0V@CI;m
zQ(l_jSH4F;Z@I`F_+1lFifu3eJq;o;HV>CoR464rDN~xf4s=$^AtW*LqNfFq7oyI4
zfniTBGy9dhvUNyJ4a(V!$)!y6Df7yls5Iy$X0~ch0UezvRiV%lW;f~Ed>uU77;oZw
z$*uz?*VOGr7~P*7-Zo#*gc}JJ3%^0oeCY3E|Ec)K#2dx*mE1otAf?CqAvs+PkI+GV
z)fJ<9lo*kg&QDa5Ga`~J)=SbNfqH>-dq+Wr+3V}qXYe1QADG0Rgul8t45@uxkEd-J
ztuO+Q-P85<2G9eRq~(f!?(@|!9bB4FJ3X9=J>}dyp&Tp7LJ&qMDy6*X5vENt2NfzN
zCMFzzbEV0?OCPvM5_vqEA-~L7{*JOY=fJ^ZWMrfc-+`+Jh|+&on<xV)Rn`V}x~Xa`
zf!#ZQcdxN=X`h0bf4cOqJd@E!ewz!2xnRQabg7Ss+xo9Y`9Ibr*maOLf>E$t4nrtX
zVBPcD?x%%iHD#*9M0|TLT0&-jR_4nzjH`*JAz6)LO?Qe*${Bz9*HY$%wm1JeY^lsk
zVM{$Iq0dsPort!c+%x>AqX7>G;xKk{bWo!Bz`9J~!fZGcOZj%!PdI@NZZfO)>@;v>
zt3Op_t*KSJ71%!%M-?tCFb3sPh6=@wmq{wmF^1gA%rM7_hxPxF3Vc4yyNSI=J+=Tb
zdLlk@7#!`7dssP8v9NW`EDmh3i}8Shww9ptJaj#6OgOp5tKGbNoa-9a#YWm?Dp&kq
zz9K`7$_V48<z5SU?h#|Yu4z(M)QAyqIdde!*N>>Z_vzG0<+}O?RFxlp62a#1uro;9
zp9p9s$cS86UtZ0M_)J(QGdf|EFzmWt-X>%u=@`1hj3$MhSt27>mfJuWt$0CAEh(^n
z!%$Xq85dXT;9fgjYL|`;rtR74ldN?4^Sx9nCHyCMK!3N4i5PjdzTWS}CMLJL5rOg2
z^aD!hAoV_x6#v#~+wVLVlDb0b(FB5?E-njTr%TT`;mfdxkPM*R=OO-eJGDr9!#D;G
zp*t&&4t}x-{VtJ#6HARNgH=8Dcp9yUR7du~<<_rXqm4~e!J`$Te{T*6-Jh*aHYt!1
z_YR<sjIz>t%6>qu9V3*J1qW<s^ifV3*^&~PyhJ#zfC!HwV`!E{;Z9zV0q)57_&r``
zQhHSVCVv3r%KqES_4p_QkZc$!EMRDHlOHM8QWd%PRLQtt-XWDt$+3h%mRz*JviKRl
z^Inmxj7B%vT&k4nJh|UZ`CMoFQNX_Puu}8N+T`n$3JRs-8`7xXIyg>75ntK$2ojG&
zx%t~|IqM{EqaBBJS$*T$V<mB2Kv`2R-1Y6~IBWeKvPjWK+pkfFXz1va(47eWM(k<T
z9OwMoIFPy(z+mu9#&2$>Fe)}eAGAJ8Rne*!A*d~);gbUmrv6cpr!BrT@#<rKZZ7)M
z9v~9`fB<;2LD7AJA|k{l@U&JBHdOS|prJdSSeZj%ru(;{?A!AZ?2KsQcl|DUR7#3@
z*i+FDt(%(QlQ&akFoDrus1S}9Fo-p~4oOLAVW=M3tht@A)<A#wAE1kk0a@w2uhUlp
z5PJji=?QQ!wp$#J_ZGQW)BnzeK7iL++D=JXLeH={7Gf_qGKN={*>~LoyaX1AI$4De
zx!&(@M!unjGr{e&GG>~_n_tkm-D;I;Z3?yXN9X_Z1Q581rH{-2nAKT~Ym`0&>q?Vc
z>3DLp%Z$hnobWL`4rufde!)u2TCRj0Ei#se7p2ZHB_HVOd>ce*0is={QrRX^0;EU+
z0^DJ1W=spx_9mnHuGIhIIQZY&YeS6Rrxxun0hik?k?@*_hGtYXA<Ga08u5t{3YWsM
zX15j+8w&D3o$3?)L9#nf*NvlAf_e8!?L6})@DWUvLLs2jcV4d^Cs*n<na|U<eG}+!
zCFsd@MD=~b&z#;pYkShSf!H`!!kVPyz~;Q4pzQLBRbsn7w0>&<T%B-CN_XTNC!FKU
z^ylYVZ(SbyoP8d?Su9FP2EsPsArZ)gO%es-i+Ny&vYja!q!N{IcC`J((YRb&w%)1|
zwd&7ij^HchDxNlk!}bLZRm|-%_K#Kan?~nC9fl%%&OOg3dF$K#KUPCoPN#Bd<5XMh
zip1U9N*xQQkLQ1+`x(B!eh>K(?77<q87|&Kgs>j2%rN$pd<R$B;(+owMY_rSqQAAt
zWn->I4sTYHI}$GtV>(}FWx+m*S|HvmTyA=faS<Rf;em3YIGs*R{99u$69oKkYLrV}
zvy5KN1^J%s&&X`NeP4ec?wf_qNR68qCW!)rqfrjJGSN$Pmnps#x8<^aMuPcYhYRD=
zRjr!5W5dHt_v%iRebcsGcU7O01>fw+*L%A5JS#6fx~wcX6fH8prPkZ-bve|fJ@1Jp
zOKmH9E7!>C4=qMD!a-@+i>LI@<CUk+1X~O8-w4&C(fEG2FLK1*Uc$gRB#J<?T&`z6
zHr?Un)m+k))X}>(;Q=Qf=yX)CCp&L%e6%Y~X1rF~ZB}d@cEtZmjLqppUEcm=28+wJ
z(8DxXKYpI2uC_XTRa~^p`Cnr!wqzu^MVPtY?)cb54l=6~ZVkUa5TG?TvTd9y3PyeL
zUK>BD`**)^15DS7*Y>%vl<hUFog?dUR9_+_u(U$^?2NQD%VJ;{7gh~E%i{?IzHd!Q
z(lIX;ID)CNb~vA}S#FUdW3WQf)C~S!_+pVn^H-kK*+qbeg=J1?cP1s;MF~A{oj&pl
zV2IQWCHef_eth7uMy5Koq;N8D#}?Zb_XdO%)a1SSt<oZ!K)-;+0aX(GNxHI?E7r+u
z>gPi5|6sX)yuJuP5;ZnGGJqtym;W#k=!5zl^OBH|;C7IXtdah`0U?2CD>wv%0ohP5
zMwbhBbD4r`s&!^vs~z6=m+L+J?Rh{qS5gL5qiLoablIfB2zXTp2@59?PLFeh@>xPw
zhRfm8(-wUkOW}a|v3`%DPL?11A&W>Zp~F5h`0bAD$JSm+0U?8ODSG3lz1C@^tnS(2
z1fLabttAniU0Uc~7$ONNLOYexFYE0G3A3X((#!c8E^;7RwF^8=`$zT%k4<>w{1S46
zybIhop7;dLFzOd=)xFM6d?M_xn5ZEiplTjc#u?NiRL0s+WZ%yCZ%$&(+6{4dSCg`9
z4G`AeFV5Y}$B>XV2`%h4IO$@nd4R^?`sn)<HUuam3<A#vT(P!Y9XIgt3Ml>`4!2jj
z{DdA&jeSG9gPwcs^a7T7KXegv^+#`dRRuQgw9wfyN4h_6hBmza+9bPWdT=W^jxdo$
z^~FTe(V(ECV;y%XvjS#YZl=J35FyxDEys+LBO+8lkAj%@p@4iC_3i+}*cOezhB`|@
zz+%yy^Tpv8Fsczn8Sw->q?GJ(18_N(JCuF<*04W8s=9T!YG?P=x!PC;E7oNc@O@3A
zRLzw88)>AT4apLz59=!^Ol8`BQZZLiaE0r0n(k3|-gckP{x>05j$u}uENusgxRey%
zP6ygHtc_hm>%R-#1R6Y9$wv-~Q{v>9_y<Hai{;Wc;YUl%|FTzX{P6)ZPGgB9Zlvs>
zH9UgZ%D!62nGm0PW0@PJD0)DuYw?R0sEamiN15k0s)uQ>>47yM6ky8CgZ5c5v2qUf
zRPf&|MTt1^$T09xooFXX)WoE)2rmht?8Bz~Ww9j*I9Q%DG&D4qG7IELzcdyc4`9;E
z;dXlzz@Xos2?&1wVb1@bwam7Hgdg5>n+X__V(Jo<9|LS0kd#4u-ggQB6ruXY3;H}G
z4gH#3X*$9laF$L~_c0z%w}b}-27qzH!ForB@oGb1;UJ3iyl+#)Ny)FOreUjT-e@F5
zFae}wIK*QQzo1BvkdKYGO`|@mTz^jX>f^zVMAs4BdhgK*#P5Y50oyTE$ILl9x=Y~~
zRG9YHC71JcmA%vej4CZXE<5P@&0<bkk)Zmr-i*sfReuO!TsnIC59^+f3^M3m`N1)>
zH4rS8gMA^p!=v2Z<n)8q1mxt1UkMF<d{-yjz2Fil>Ae#(o&TKC@s4Kj=kj#C#7025
zz)ZkjDyZCD87~&~wErxPv(i(=7sI`+qiZT!575~Pd>3eid<oDU9@;&ir=RrK_dtFB
z03YYFowt}sf2&^Anizt6O7xowx-H)PF|QhlFjh*p-*eZHoW|b2Em1~OfbjcLL*En$
z?^dku>t(;_d-o?}*qC0b;OIX=o25Xd7x-ZS4tRG5Kp;x7#Kc6%vj7jkw|kFmH&(&s
z^>#iKf0I5(j+UHlkX$QE;L|IQ!}$*1x+gWh(Xq)t*g8TBT(KyEkWbq_0!re#q=Q=n
zJi-CIb-A|uhrBH)?qn>5bsQU+RI0P~hfL3)f~Z><B6+w&?)-ZEzxon@$r4vrL`6%>
zlF%-(aO0}AZ}b&^W<<#zwT|cLgAv(dNCfal|1JRikG^wd8Yv-1;9}zgBBz!#k<7r8
zSZTy2^9l;E_`At6Jic%hs@ZP!28&5bUYm?exm;dGbkb~7oc5XnFH)2d<O^mX0tQ4E
zg*j5#h4c<FuXf28Nf`i>Pc~>oIU|0Vi&;>aI+4Mxg9jUQu~~@@(nTnrnrRYJGD!}1
z9VO32=f_5X0mooALv8>`RF)U~B4CX7x7xYo>s(hgdyaSWG4}iCdjY;@<S}dU78`D{
z`(CHBm0)-r4s<YR?^pRY#wy>xuZ9C@qhYY=HeWhLJ@wDT^Ya|DZu#qXil}m^@kEA?
z3i(o9wgWg2>eRPRDAiN#z02#`8sIMknc1SN)la&=&`pv%%t)5{MRkYE+ZKKhbXyTb
z2oIm5y@vS`@)d3}b3+4lonLm^@<rr5F4LMYXTy;`AX;M(iDbh-SuZJFv7WR2(>r`=
zH9Nk}(d}2Jd4R4E*e4n9R=4@VpivVto@CQ;(Oe!F_Ui(wViXv^UBaCPtJlxSPV@C#
zC$TyD`&OzgX6!O2j;PAJZ&+#HW5N)#3h2*Z_O#>);=%5lXrSGoh>i^NJTzX~K_I`X
zc`YmHfub6P3g@@0R6wR5KZ~_&ucCWcttb1)nVV0<MU4(XvczgKViF=6TIl5ltL}(Z
zVe*Bf$W_jI0tym1sH{G8?>!rjr%{10uA)ea2BO5GrX>K-{DVFb!OEYn@H_BbMgL)~
zrMevzHD2~(h1&@S=6peAmdQjdJosNQ{0eEKEmg4XbI<jBP|;SlSryUQACA@K_tPIG
zKW|D4m&thS#sj&<`J9E`woPr9@gZ&DHdnvxcH!yoN)%-R6&Fi=f?V8>Q9fFz%2{;R
zS;gXjul@BQ>x;t*wNgPm%FSB(KleVsFh3CCBYPBerm;Mw2F)Vj+xGu?YIZz^ot!I>
z#iLfQ9aJUS$sfoSkI57ulo+ftjWPLB9rJSJqMkv7<{SM*wB+f2{avo?i~C(Xo7c|O
z#jZgS>XMr(cmxl)1G2~YS{p8yfI9w;2z%OCQDl4aGNu|hJU$=CFBomjovqtsX7jLr
zD)#X1PtZ%aTD3?tEadLnVAz=Mh6mzZ=VItGk36mq_6ChyUye2_Ugq8>2<7TLKSBE0
zkCy%6#O}bmhQnFP#$#%7*Z-lA_j(KF*k^9FOI){Wy(}kfeYJ3@zdXSsR2JgefcDjh
z!wIp9xegMW1Ka_A)cQiMWo1Qknzhib32-q(<uV#g4mdfnP~e(HmCDmtio`y$TYiaz
z1qb=}8&X9|N_BlwS^4#N|AJdp79->{VX6_}E-5X{^LoXb=(edU6!3Wndjtt{=Oa#w
zU5(1tJL(4v!rlZT0S|{PhTuW9_AkG%{k__nF?dZgzYHMZQd0~LoT_A4zqAl5>g^_n
z=f5(JW>%6L<Pz(RF4f6!J%;~+MB7{wDAiUndEsz8@}DhHNinZ?hemKZOb>_~M%`9H
z;E7N%;`N98%~M)fNUuvNY!YSFH<dA(#A{GE!!Yk6vG!YjazR7!*R5Tl#@i|B_{ube
zH)8zjg>|a;qSD|&e86alcYpbpfo8(tj717$bLEQ314ua7E_i78W<x5i!=gd$hBZie
zt5x!Kmtsk9>W0l3U#3c{VNo&35Y}r?Z+k@9?z`^)R988WJNx^7?u2db_x*r3y8mB)
zbbQ;V!-5nhQ}(=lLPEj_`B;m(|DesP;1BzKfD0QNi+p7r&m2-FqOO@4Wo*Yql5sji
z6frTe&h_4?2*EkP_#5#^L`?@oG5>T3eRHtESX2DU{f=-!acF_V$;Vxds9*7SKt5J;
z-|j`;x_orE|M@|%P`+z|Ouu;AJC+|ZEQX<-o4y~Gxejq_HdB*Kp@l_UnwPCwMpf}f
zhK4|&gixuYR$XnM(hjoGw~I5NbN~*KC_d<l0)0Mb9RKCE!d{q-vb*MTfSup=Qrp1k
z_z--mQ&flB@;41AoZrWOcVPh?1qB6jk0`(IlK;~P&Fc)hgXId*C$K5*nZib8bl6Af
zRv;CWZ99yqa}<#yt2hF)S<JL`&wzBsYuiT4TLJbc+wl*qM$G~+r~&Y{92{6Z4X(xW
z+G$C3b+?IroM`{0nw(ta4J*G=x2XrueZ&tMqT@+&aQJ$JLhDwMujTQB`LaMxY~}Ao
zS7{n@T&ze3Y+#lq?X@<3`nO`RaUkN`wQ~T>C?+Umxo=~eA|oR1=tcSm22z?3@l-i_
zJN3Pfg!u08g$93ypnXpF2=Ra8zJuUI<z$Ooif;IXVd>NHdPq^)@oeNEX>D#|DEn+T
zO&yBH0liN66T8G~ghkkYqZ+1Rvst5`h=f7LBbB{r5CQZ1evb40R#^oLAyo+kDxDKG
zLbNhWxLH7NR2m_ds(;G4*N6RdSIj8|1w={*XEjrXYL$v!4f`KmG4|TR>H{(hl}^ls
z8bOBH7dmv}=VkleelX*lSo@K<BiZN)OHFvFue|Q_V5&;L>v*T!1>D30ph<4B@yUfz
zU??f)gpuUrg{n@~5to;==F3}3TguC|=GT=_S_)O=kic_E5x<K;lC(KrWmuo3BqT)n
zD?;kR@2s-iw%8kwjigq4wav_`alJHemLRNkbqjloNLf%%^&Qg{SzBN`<>zfh1Z8xt
zz>M=t=b`U?!FLM=Wo9%4z=R{8R#11XzqwU}Y^$r8DB#xK*+1QeDh&DAmp>AfCvzez
zq8cm?ON3PFu9|VVEa$1lB>O%zqUYx3m)M<;iuG;i_Eb4ekGq_9;BB2@?ftxyL^&_C
zW8nP^=I6uTiJys-Y3y|7XT9321l0-j^>Bb_X>J+bR|i9%gv~AgA6tn6b`FY}R*883
z{J0L{!6c-Mt6R~Nyl<5GixGF3Xor;oI~FJv!F(;~b73KDbSyx84TIHmJIqt9HTlg!
zw*Cz$uVQ0kefp0~QkSBDXX*f{h1lGXGc&56=W1aQ_vgxK%TGZYQRIkbDor;$c}W~v
z4^DAQLX42;;IN?2zC`d~tLMj1<47uC3Oas#R7exZ?zo5iL9LO>*sZs78n%mu2^3WP
z9PDmOwvLvAgNNtBK@6gPoxj6;-blX$;(mN%7RAOxpNrz(FcIKuaD}E57P>+D)J^>C
z%y;hRcIEv|SMSKpfq)MT@zgYCuIeCd8&J;l&#L@@vt*EuM93bRX6md8cSbRgLW(4+
z`(6<-7v>q<(n7}7#?@QmhxX#(c``J3Q_dGGzPj!Jfq2VFgBFQsdbm}_56*{$$Y5uy
z&@EuKW!nv@#lknBS?lv*UprM&?X(TP#o16V4XrQwUoU{?dSYTy5(<KiG>jHGB3&^>
zTv&J*(XbnC`AJWH1oGFdEg%Jb9QQ}Tyg>Y(JSXCWC!eqygVXsRWzacXOcr<(G9h8k
z25t9JGs48>l){(G=loMbA=Qrg3CZsHImIqAdRVeBJeUMp#D%%t!Nmrw0Fqss_<AF<
z!=S^j1H%Idn^~&^TXYQO!OhbP6W`fKng03IZE}e+pY`urmX38SEU2%pt_*N82d%yZ
zfOJyvY}0cG+KAfD@?W$febQy&u{l6w4`94d=UBKK0o<Q<x9SC#6l_3IG5(|Ce<Xb6
zO6sb@*?$KW(e}u$YoupT4oRGTa&oTw&a>N#%vWyQVe%L(mb29WQ^R!8d&)Yb_2Xn%
z3~6nY^yFYG81mgN*BI>m{ts*8#YoJ_;bBbS0lHM;Hw=A|$llarD?yKUFfs8pTFW))
zs)kO=o)}5(eu|j>uJvi*-BT<?f26Ad3SpE7v9oSuv#EV~&ut(X{e$PSS83TQ-Sr1D
z3+;ER_|_KC>zB{^?o-Nr@5qr}AD{FG?hIBQ53U=Z<BvBEk2=o-0tuB-a0epsf|gOW
zedl?A``eS~cm4ELYhr3M%x3g7H!Dx@Ff9i})n?o2P}&_R5&1vwVk`mQn&>tEH*C?(
z{$8QsX&ShJNuq0@7ZE3_Ca`@V%|Bq?8srtrZ&GXy>=1PD2o7+~Rq92G96pzswx^ux
z?qn6h^&AukLvC{My_?)&x(;mMR_jS*(4XP>J=c|~8N3%6M*T;A(LyQ@4%jz2h+u6Q
zlA_?mWug0rho%WIW>nNcLcTT~)cw&8pIofKw}XEY{O4c0!OtA{(6%s~Y)`Z@Iy%~J
z<8hOzYqpdGSt)HR*i~ieX!LX{P9*~_tA<;~CT7kDgl>H?Z|ymGk+YPhNfkzqUjG~*
zD7IPze_GTKtdD2{4_0qqf4;ZGmT_#G-Sln5(~nP9#OGR{j&3+RJDtkDTb9n^h2`Kk
zAKix=18k|)=FedD1a37mxHK)K3H5mr<CtAtT|>*65r6t<rU1QaX)Hw3VV87NItvfE
zYzU!~nsTDwH3UMJ5gcCuwif+u?KHjF4LOn-_FvK`0SBRC-bxxu)*!+~+u5*GUsM)R
zO8KKt%<tP{MxkFDCGhJGeD?GBeBej1a#fgu$7Ywy6}+2%?`@Gmc;5Na7qEDoQ1-Mf
z;KsjZpR=GYtG#GIvn+YNEF=b?hF?B!`OXEF{4W!i(m`<SsA}R=h?C0$YY+!6;#l5Y
zO-$t`jBCA%teYja@t`ar#qJa7&lcCx;w3Wv2fOd0)~|5aZx3QI6f5s1p^f+bC2URS
zy{#!D#Y(L1OXy3*5-EKDoXnY6M4eS(y>INJdko?8wd8m>IN=2uUg~Pm1^i#f0&W%t
z=mTLvqXZL@F3R=P?@?l!Hw7t|)1Kp<bZk;6kP1q%Lzt2>`n$#JHt8-mM3KW6&7OwF
zr@c%SUW8aq@`J-`Ia`g7-~=?bSo9ByVVEpp0Mk*)cIT)eqhnzF*~b?OX(7H=y3RCz
zk&aa0PU!o^&^u291;Si#ko4I54#7Jy;<ODaU2sjsD{=^oUFF5tzyuwSG8bz8;$AQY
z`T{R1ulEDvoJAvs!T_8K(&HmN?N^LL;nw0}^)rq8ncyB*N5{BkC8}fSn=vuH$21|=
zr~uWf7beH?CXrZbSJ5fB;FFSA2(k=sW~&ZU-|x7&6O7x3%}kmm23)wFW>9bUoAkN6
zcRwpym_n%fmR(J8L7(Be(|f~JACEbD)9tGzmS51p)dlz}K5_<ba$8$l4`}SI;7^c(
z4-F5ugzF02rFcHw$cOl;qra8bjC~LBLnf1{ZE!6AXip~;bLQ-N>hgn^RrKFWuL<(N
zE93YI8$nE@zH-0)yhonN?Q~nSf)mk|q#R<BLBY<hnsN#l6vkz(Zbxv+P(U-n1|JI%
zi?)kXMHfQs4g7QIp@X{-gRmh6ktZ)Qaj9xw@WX2r-hbvk=Fk0<<NauD8Rq0)gQ|~3
zyK&UrK*WyR_upTN-~+$$7eP>5`LLOp&mDp7tHdbG0*URzmr4#FT}xt039s#TNF9dW
zC2bX2`=NL*(j_4jO!4Q;dJs(^JMc^tki~j__<f;@8Rc{^q>aUf9<%s(++*9$&JH<2
zes_1b%*ZIQV=ZAPOP=eMV7TvC3P=t}g&cCrUYmi0g;h*vby&P<=zJ8A#brI9p;E`@
zw~&Dr?odUDRZ{PcwDe@{{iR(24Sgj~VCwO@TW};>aNS+<-glCO);T=dv`isj%HK5M
z1$9wK%^!}AZ;vD!B5X<l83u*&_}$!o;c1qcQPhu*2;5*Ym2lER)}7Hw=MR(YMpuD$
zC8)_I$6FI`HoCZ&GA^p>%=`iFJ9^jZs&rpjSy6xgEbj)(oA`<Q`xQ0nNQ&RDjSsh{
zau*A=eIg6a7vJwMe=~fPi%tkIJN)?K2BAM*4(oCU7nK%~&t!958Aglkeo{4L9s_H2
zadFqzzdldE6Xq#8A6?@jMgoWN4Uu!oDLY{Y4|yFyT%)0LmVcwlTynB`rX+7QAud>_
zwf4uBP_(XK>*lYG_7W_QRvK!Jgk&hge-3U~P+Gu;M<nQ9wla#Enx$ih;jj5AR^6%W
z_F-2##$cW^xkUD!(DOqsyqCEOU_h9-{bl7m&+^{n`C;A<y-B!hL{$6`ah7%;-+If%
z!fyDm+phXvOvg1*m*U!JP3m-a9zs9Q)6H4z@_f(_@3-I3Dq70c=nS#YF4<fzLnFsF
zT{qJ+_7w58#*)6WtCb99&%&zH;{JGaO)r?O_|X1X3KB>gyAeODC7_gpjyQ&o2j{80
z6rufZV#P@Nx9||YX_ienJxqG!tE=GS5i6>Yq5tWq{^|LkcZhtXZOfnDhyCaEgRF|d
z@Tx{dhlDG4t}_HprW$Y10ZDgq-2pN$$~dn*UU};ykN<t7sI6UyL`CaRxAiWaIlTf3
zWSZqrvesxu@yO^nQn1e&(Y$56XgQp{1-${{0VK#mvibZ-i~}ba3l|sO+uOSZEe%M>
zz=A=e?FCu}C;cdkYii1EB845F;<Ylc#yN0YVMxpW!IW%Qh!d|o1D_+1xiA;IiO#v5
z?!P!gXa^q)d@FCUOhG?KY6h&!XET(sceq8HkTCa2fUY)-B09n8qCN)LceMZAqu)S^
zUInlO;uUIBItZ>L1MCjw{A|R~{!50mWvlkSKDiJLbEq@^O#i}DtiSNIPg{HXm4i$$
z$Q|r?P-HGP{WJ*LePx0>cBe6O0*IUG3$t8r*ZR5%@W8r9l9=KK__avuUHd0f@Sk|j
zA0Hnnx?DYFz3HBouz{=lFE-CKCd?$eOg*r#n*V*^Xagi-4vvqr;-=vEGVEK5__ThG
zyCRP|8tkZL&vFu)czk?%B4lLz0{EjV2@utyJ^}n>B64!b7&2L92`;zaCB;KmC=(GU
z5sl=}N=o+fN@qbU9`b}|B;5>GviES7MNu_1R30AO241_LtS?QDHa8<)(t=g#?-3ph
zPq|%=Hd`i^m$l}$kNojYNw-4dX<_Vk(;$9<41ysw+&%?n@=>1A?0z#qWJ3qdss9|Q
z$`!BBYQi3nLGd-s@`dt~*HDUBt#)lDa&7TYfRGfwDG~Bv&vZr<_~}>Kkq?WoVvCIH
za;a6S{e%~W!NON&XnsxtAv@}Cf(*K&6)%Ak^zToR^#xt!Zbj=64`ZkD=WIU}xz7?#
zc#{9oz7b3^rMlWm2F>HnmA!o4mf=C39%K6$r`H?09@Y}pg~juZeVw8CllT2lJ%Zz^
z0{2;&*!t%`wFQ_T9~RQYHK9moc(@Yk&MilE!o`_eTcUYyD=9++fghha(!?kUKUZr8
zvBhLVusGzc{Xl!RMC^`%uG~91arrCwvH}w#i(3@)K8iL!F-xV<tVEo&mSaGi7M*e9
zUG<&1OuEO<=7x+AY_6EFD?6v{Q14bMw5-8Vq&Q9^+VPLA+?BFtW9=@VJyr_ANhE&C
z#0P<kI1*p2rC!}e{OWlLvL1kQe*N0DSw)UW=byVmI6OGFzyAJH18qz&GcrZVNK5`}
zu_bRRGQHbfI<-f&NEnAme>Od*Aco(?5l+bIA5Nd&##;|nIf~ut?RmDe&@4^tx>t&i
zZ3s#>zM)cLW_bdAhNyw-p%C3aqb0x}8#RU!aLApvUq&6r`F&ow=KI7})@SrT&5tyC
zTMgn*;DRqi*xB3v21bI`3a8=)M7HFeVqo_)8ujFWr_eYr9t<jVCtwzT;vuumZEx;b
zu(pg}!R+l&c>m7%-5GiQzgHSZ1hDe~ayB+op^5OvJh#>Z7h2MQ91P#mQfk9W!Rz%P
z5X?Yp;mbf>MsKfB956}xQHBCB5Qd?D-+D4gb?7A97V7U0UN=5=Bj)O=hcfVQU3p^y
z&IVt(UU0IJ@WZR9ANo{0p?^u7LrTNv?+$j;lZ8QYyV$}v9{l%i#RcxxKz$G^&(!qv
zB@l3|x6)`!PDj^32eL<&{VnaHoOYegd|#D*_#^1q?OGPkF^V+ui>z?n9kZcDv|RX<
z9@nymWbpSa8ULbWN<W&9X%(~`@XHU$UB^9)3VZq_rROCn^>{F>RMxL6m$<{y@^qlw
zYeo54&l31kq)+DcD^i-9Mhv78hEun4kHe91fnUcc0e=?i5-YU3M)+IZgU^mzaM5x8
zdL9eu3tr`Icj|xX&t^5@SVUUl)Frg6Um;xE^@A*EVOE`%EfcxjSppHP4{W1szwypA
zTC`Tsd^&WfbCl<#4JS%6{};~4L)w&Ue%Dj8JYQ{Ly*pclu`0c;V93~EV>z--)KT3o
z$IQ3ng-2ZMmwCnsGLPVn*bdiER&Ivi+1DxEDzsgeh}$*8R*8I%Fq|`#dkMWzA$Hef
zpZ5rN%e>wU@O)`V{}z`IO}aV5<i3a*zYg8gi!Kv+c)Kfy@Gy<fD=zp(kuK3!wY!NZ
zlcxS>PIOON0|!$_Uvl|QHIIryeOH;4B;Mb&Jfa>S4nDlcJpHFAf-J(z#VbN)-2TFX
zYHnU0#akXfNXvmAH)t-uh)q>dG1tx&SR)L;)XzUKu(-awX6`h~^38<6)(2maDn#Zc
zOhgvuR)}BH+;3*B@(7P3^%BQCwAA7oiC$j1HnJEl;BvQ@=+b(1;+KuR8`8n+#LA^v
z>Qr%AFMzwYu71g(Ttr_OAQ_kUqR=B^32cKeped0Bi9)W2*ZudNU}H^k6)*Hu#K1Cf
z4J9dV<;(7#X)J)oY2$3K@JcnGUqVS0MI_+38>b|}Us;Kd_UVx^<7D?|R*#6zb$%Q=
zrw6{5c832Y5kxWl=;*Ox;9h|iq+-a_k0$a4rTLSfl!o29y!^bjkLC-?_7;?qHFyql
z(JQBv{2D}RugC#gbpuiA?yfB=>wPRTPcJp&@P!8Q!6b>^ogeLU6cA0!Qg^xEOnJ%_
z7#V~A9(oY?nH@D}7iH}60rm{e&dx1p>452{42J9D!*=B9asQ2&*jl=Fw3=5xs{x`3
z97tK?qle$q#tW5IUxPC**n1RDHeX_K_PKKvio*O`I|j0_uN)?NgR5L}2f`0JcjW*I
znh}-zR*-;D5-l9qKt|}M-*bs^GYyl>-I>;dbcDRE*Fp>}G^OUf&9#VQaGfZlp4iWj
z9>)mOU}U{ZXs?k4TV;AQ`FdnM?Oowdzpg&cc|NgMUtbCP(uWBvd$fLSeC=3tr}?P;
zd&`zydM{&VZDmzUj&eW&nXr<T3YnywQNj2!xe&yS(cJ8c-!P%RJvc(Eq>XC6>!oIj
zL0(_;c+5OVMJ*5QpQdznH^0z(Vg-57o+h9T$jU#Lcf7fIJZuIz>FS(0(`vV>er>7K
z_f@ZPc-UJw6SL@vu$=H3+poW~>==NAzjys(-iBLTj`jNOS4jqYzHQV4hlF_qB^^{@
zbi=G9nyPon+`{@3vvR&TA<CWJvTfDbOo63eDZkFw)u$>lofc!sl;GuSQ_6B0?T^%0
z1$i~UpO1diNWXgB>ht7XT?64{xpyVoTU$}l(cj-2Va9GAI&*Wfv-ybZG$HbJ-Z1nA
z1J~j-uGkhD#jL801heUh9|^t(SZbHhjzs>q(RSkkeuGOezgc7=tbc{Qj5&<D<ZFX2
z$&RY7kDS56RN#ayiy>kQx|_jFWxK+=yRmp=h9y_Q-VeBG9Je18y=Y~x?q*d`7O^YL
z7!tSy8})ZC)UbanA|_E7jZvRJnh(_KF{Z=`V!TkFEs@twwyt|%2&}rBr7$;D66mYl
zx~hemS}<KXnl{iW(S+^UH*+2&9auyOd`kCMuIOKqj(#OJRf*)ff=maZp-5VWxUb8J
zN2#i4W8?CwqH=SI<8}emOz-{XflX#tQ_j*pAa7e~+l1~sQz%c_-k-Dv<7#zRhM8kn
z{ts&68yC#1tdvs<*$$rT%K05|H$|X?KZA8dU0RPix%M-~<-c7|8v_D9x>{nHh?`y#
zYHBH0?Hofb!Oy;TgnU`hGO^;LY5|tkOA(hhz3Hb3Vd!L=>b4gEo*KwY&<+98U<z5r
zTxg_EaHe-Zi;0Q-YR)5jTw48h4WOUDT^qpm9uLeCXK-|Ow4DJL2}$=MH~swxK@HB&
z&reBP{UW=BX)eUCHeF0o)$7g6<!o_3b_;+1LwN8@>Yn>eYnE+d&fZde!rtL-_*$D`
zy1}U(vzDjT5|p)scA|tLySp<Lf$(U9a{N~v0KZmeefvVk>qtk6&5Np{%{D4ggLRcu
z3jYp^0j}=%p)J$Ks{XB@BK9g%)&lg?{7Tr>rlpN{^JQps8iHZcGb*hL4ug{dbtS45
zL_|;D57FY3pHrJXgxa7S3&DzC?+u!YiLrSp46U@>S3yU_F^h%7>YjI1DXy4aevrD`
zu-7F+Vsm!BH>u<=ABY~KQoW|YfqIR*dtwp_!`=<8KJh}bILE;b=^afmc-@JzfMZ6`
zLGTu^-qKvwO_|wd<hGS_6{|qIwSknng#`tD0;BmR?ArrGnk;v82x_6fuGVmAitZ&l
z{w=Qi<5aYv)D!Rk(i5)71;3o{#PqZRcaA)J8;?ifu*DVU6jJ8TCoj`$88)w}Ki`wc
z<ct*t^+$(>XmUX7FAq%R?I#{C9MjMEl}whLJZdmP{kNibV+PE4FmP9bW^cGFHk%Iq
zpMGs+(P*u*9L|R9Y#!ydp8Y1fy1f=Pi@#Xvk>NM_W%#HLozsnTLe?5da!_5+3Y{Kp
z)YO<=URLx|RESuv7G|+2K<r@H5qxi^`J2WNlXZrn&y*VJ<WPPj_}Fp{Ok3~4n96y(
zzwXt%x}EK{fb=FU1B`*Zqte$GLgKd7KjaGim<L+r_Cu>nj7c`4pFuki>=}6k?3Qwh
z?u!KDh4-+LVM~eMomjyS(gJgr6;)!#f6oVpg(-&kErpJ$8K(sVz@Sm~@sEXyxxwce
z3MEq^e?=5GG&FRw4%ju^9sR_5|8I2xL73@EG?v4T8})P-&f>nueW8U{PHF13Eq5uQ
z=)cQD8}}*(Kq&UT(Uc&dqXEC<A|ToN<&pNwe8kgz1?yFhyJF=oCOS8!-B@|gRZ^B<
z(1)sdbJDc960d}(1+_ybB@P;WKDEn;ihT#AMd@asjsFSk%sFb1$kY$Um%rX|!AWr|
z>g0>Lt`{ZZQN(wc{)U_p(vW}01HO<Z4TqZOa{^s%j3QZ&el+NKzDj4+gbKOkRbO-S
z&m7gjlEo6Y-QCG(PQ!;?ELdk}XU(>K`=&fZkcCe!X!3E;&<d_5P_fWx)cw_JjBqw=
zqjt?KQ}&26U_KLvXVs&3xu5n0*}`G`9Wj6b!vbF)W&E3)tJ+9YH|#9ExV@z2Y!)NH
zfUQ_-)Y$P4XXT#)+aBN3pwnNyt<BMmhXT7QRzD})KYxYFa3A}QJ<}~qjXd0CC;!W<
z8w$Ddsvz#JJ|iiqD5UT)yPVp(K}tg#=__q$ZwkL@@a|+L&F%@-ECeT04a$$ArFfyW
z<Z3L>9X9K|w!~(0F1>CLxb@YPQB^z5LUQFQ1lS!BHdzf*!*(`Qfp`}PNi!{|R%;8a
zZ?1IlP4G!5OT~+{ewoFHE{zF6@XJ#un!qLfcg<g;Sl$Ego|Ul6SHw^i^g<#tI`e0m
zx385563Dw<Z1RLs(rZ4vtJi3)uj2!o+h-PgCPCR0wG-U4OZ~L~oL`XqZgOp>p=bs*
zu#AU&OE%Xis~_QhcOt)atlb_@Z<-eNF~r3L>^ujz+v$TG)f$CqTk^Bs&h;XmJe$Wn
z?eMldXY@DuzvCMxe7;TB0p>X;;>k1em$RldNq+h=HWz?trE|8@gwA9Xc7&Jcvfae<
zY~IfdAPxjjGJ*^`$Cqi5Ul3bx;*fWaqB6E5cSdNLkq59|4^uFM57(#Y<be!gDRX7=
zqSlv<4Wa5bTfxh9V_O9>>1^8EM8i7LI5dG-jclT;&R@m^8k7-Ojcx8YNWZ~qpG7Ci
znJ>c7F+A{pU5ZXM18-yt1!dK(Zxf5uiy3CCF0&iN6?U?Wm#g5_ey=Dgi;vNUjOS=<
zsdO4e-iO|emeJPjsXj&Hnf(*qs!U*3Or29aTA-JX4xS0#4wMjIQQUB(u)v7${<uHA
zZFZNG%mZ%3ZSe7Q1KT~}uU$h68%+-C-)eWLp||Ro<JIj|u27^>%sVw<=DIHwv0FC-
zv6gmhEBSGD1h8Q9uYPGu&K)m>_ay%ha!-OZDfpI3cU<?4j-gTfsHi$1DCPV>!mEO6
z+G-dr^O5k3%CrgAvx4TZmW6scUxob4@7R%`9BMKX<ts!TkFaEjUxe!+OZHbtS827L
zJjsNgSB)aR6G&x(?&a&!Dx)}wUMl;O^1aROj~wc}$m{qvjYt!(F!wm(t#jt$y44Yj
z+DG3%322$9e@*6cWo&<cb8n$<Q^udsUD5zU9{;zhf(0k%liD(%rlOKeQ*a6Ft?CSe
zfDTc9{ickoh+gl;S+As4%PuFn_Cs{5xEb%~9Wt<6mkNP#9&psy{2@sokMzSVodd`=
zE?U;KuqNhFPq?fijV6<-zk~*u|EDXf25EA9>g($(!H`}zjSD%*d3c#cWwsh;>MZPv
zAet<Fshy@4LF)>^BF>#w&*Nm&l!Q9Hn_bz^(69uVm1lazaCv#z2ncjz2l#1DHV3H~
z;De8a1q0y$XlQXv3>-@VMxKfY5z%;hqUqO@1#bbosm_?ilvLoxFe&|rkS~NNiheJx
z*cPj;VB;&^+$<qiI_n2wCnJaeyWLkz1@+W#Jd>Yq%gp0y*17Sl+I|-!V*yiQ+drjo
zuVv!A>{7qpuiQ*O{Mu~vHjDPS>q<X~6FDRPs%F2>c?z>q9V0)F%W?IlDo(tf6MZ=Q
zDRfDK+VzTHB4Ioe3`}e#osf-5t>j0@2^N+1r)igu-tYIviB3Z(Lc;!`_};H}F2b%D
zZ_Vy#UYb?dHTzmYT6z;~q?Dk;q#IR(wgyFcLTnZfbRMr;(^l^@j70mjqB|Z560az{
z_=McZa6jY*!JjxCoB2b!=2U5Ff%!|4DaWQgqeygG{S3(Yx&Teuti9BBx8^mwcK7J)
zldWcsSdg<+PSbV%&`9O&uGKTz?2@+fJU<>*LRC9#ct-90k}{eWiKm6WU2$u@lcSDe
z{qfl8GyF)-^XjA}Ef+O*McW<b-bj+)#f8nRa#Phk5S~l%QSn=C(PR3V3XB3Fa7KrJ
z*vCfUdI#J+;+UPG%?}^@vWnI8hpzzD3=J*X@znsXd#PucO2xBT1(&)@xTmnVI8-Bx
z4p6WugR@!ZR%gh{;iWn+raipeiB52S6F`BSmeYzy=<o*{{9?VDQg5LE?a#a`tP1$i
z#7PUAW^vrX!wuBqa3b+O3czB`tW$y@93hHhJVX11#wUoKz40)%Q?YohuG9;T_BKP<
zpsMm(!N<J5G^B=jz|VmHIJl@CEtsu~|C!57R-bJTOJ==|haI@l>0{*TJTUU``Z-9g
zwY`1Zd1IGCH5UyR6ZeO)MT96d=v!1X;A8)Jx8Q;<__UhyA}p<?c_OoT^-19RZnZfo
zA|OU)R@_;<9=^Whh_8?T%-kL)5f^cc`(86@JqhsiTs6<!=BU(XKyVuKw3U^mlP{;K
zx$hIHztAa6+W&8Jk)V^kiZp_ZxXhxjs;s1+HEn;B4fl-0k)&fj&a`1yi(RjD{I&`>
zMo6jWvj?ZiNJxq{6ftwJblg!O9KBL2s#~k7s*X@Q;M{2UHGjSUHFzw%Sws*b*sJ!P
zp`o6v46df8<_VXDd+6rYR`C+TJgaA~YEVH?OWQi2?}oP*8fZ3!y|TX}ATpQz2)kf(
zKa3e2)Q~Y4(VJ;%3NbJ<(gZ+(33Ra6@XP1*R#$t!0W?h;U&e#6lv9l9BN9?f;^ihZ
z6c1RqI_ky4*t(X(I~4T--H87J{E1iK)N0)(&d9@Mv&qz=*A6;-t79PH!bH?@C%zUw
z0<=iU9`bCz9e^+j%Dyh$p1>mWw<v!7)Cj4mT2K}$>LzhVZ7qtIm)D)gNbtX<lqPtH
zg|<DL^PF}{-IUUJSzXa0z%kfM7%Z{z(>tCklQ8igvPR&#`0$rNVG??{6DJnY8ol@4
z6gBohJPI+HgR&1_tK<1Cx}{~;kbsiovuzbaS>VP4RE*7?n(<b-MtNW8`zy#(7|N`G
zoZoba3U!n`OSb(5)t;6^qqQ(t^wV-+4E*%N;64ZJdXkrQc+X|C?LvOH!!CCk@A4x5
zFr{Vm3QquMp89Ea^JmlAFgT`(bzqJ<XQ8{JH4)t!u|Cx@VXEqCmp(Nn!4a#mT|8}d
zw1Dx*9A~xd-Yi}IXv==)zQ+uU$%qoH!9r#65N1|`B+n3kwJ}ko`h3RA;3mc!WUx?P
z7T|z@BoP{pm-*HoIy>Kl7TzTr+=8@9rpnTMpe9V8uwKg@&!5{A86r9xLxw-IF4=}q
zfQlLAwcmWsxxhKSdCTcUZWB|`Jj(hgXLaP^*r@%&vg2jHEB9!xy)2NHJREv|`dD~g
zoMhcS7oj0hkY`NIc@1@dQ~IV3y}V?Mc^|*j2;ak#Lo+j#P;jZ|_N2vpZ-t)E)2c(Y
z?qF|vY(vd7o!6j7)y}ctWpPgoD{4aKSUY7Q-BEZcw;S&~rKy&v=2uz2;(q0O9<>HR
zaf6A1l3OgH`}^w3&e02y%@eV()RPJ792p@Vut3JfskK(Hj7%$in$}02-oKaL#D$)Y
zDOa<BD{p*(-nEs(3fAu!WNRLu2Wg*lm|9!{gWB)r-HP}-+&D5MCSI_hGX6{%5$8>{
zepwE20p6cxjord7L71CRlxC&iUJr(FW4xY()z0U=HP#-`{{8rzoC@5qR{;G?dm{v<
zfM{V{FcEQ+0`rnjx^DP&M5VAfS2J6#>tchDd`E0hbVhNO&vu!1O%H$I$!WJfje4xl
zYjG2Kw2du)_<WQVA2NX5edb3H({FHzUi2sezs@ei!O>AAem2|#$EqAh?h_r=r2QZ~
z-@!q#Jhs6)jWV`In@xeg>Ll9hELR-vaZAgh+XVq4$AVPGuYdt>jc6VNWHh|Kw~ov|
z&>0w2h!SKzKLQr##csbv$-?n?wOwtuo8Wuwftvcv=fiTYRSA%79zr&CEbupYro8!x
zG7N`PnL??m^>jDRLF<;|%Y54)>u>TOgIusUZr}^j;>exjKUyO(RMuvSKG{Hp_J>i#
zFx)j(CDQ8>Mqn_5($C7P_Xv;a>R;PsMk~{T4{wL1OT2q`nCMIx<7&#)!tUd_KnPVX
z-&F=2CrSO1Qh;-T4+c^$-)46xj?y33`LDHoMrcEjD96K*CCn$YQzEOd31}p7Ys~3n
z4lS9Mrlut6s5#K0@TP;lnab742#(6aZZ$Vtm6ofsUT!=++n3|%;EBXsSP+f?A5*ZD
zP|L*Z`tnAX-z@q>7Oa$kA0HXv23u9Z7XET^{fp~yS%V%R^}_*LHHz|o&}@+dV4#S(
z_x{Fg7nYV<P)bC$6+C}dp14e%?-kbXF&Dgr{MIQUTa9&TL|IETzUML)RDVqLb^9Z|
z&THfaN0GCUR|F+^ZGn-p8z9LpK3iJ4k^kghbb{o^$H(^p80p5^Sm<W$7Ht4ka~HsY
zgerR}p7%~hMxXSMdw+XXYGa3&&x-Ou?0|xns*2?OK2UJiE=3vqyZHanbXH+;HDMAC
z76=gBg1fsr!QI^kcMtCF?hsspy9Wk$m*DR14ukCcyU$+F)tu=$-CbYRTNU(x1j4W7
z&(6%G8YGEMZATxHsgOHU@S4hKE~o|KvNBD?tzUMMMoNj^qq2wLchG0oR0?e<jo$s(
zKPU!6!3#@OX6gVl^%ju5O(HXmVUL7C@y)=23Dhy?lqKEn>>%42`C~1U5q#|<{B`&1
zPt{9VMUC<_5a_GM6AT$Vpi`7(jH#8-l9tMSr+8pdDGfI9!6QVc?AnN%rM91u+Z1dj
zQLV9bV_Sr~kML`2=mT_FCkb7CG#hJbTSWq+_4ZAV@{6m~PKmc7i?4QeDB$S=WuCJ=
zPaSF%zTLG53SkXI?U^bTm9(pLey*?MV_>G1wd|drL;8<~%dpzQKEAbiE`+^u=-yBg
zTArU(j9*`#eQJ=<M&B(YPD|x}6i|=Kr8nZdef0V>8~<!F6eBtGLX7A{nkFlHByyt%
zcwcGq5QfK~AwPRvgX)2mDG@&(!2h{AvxnhltB0!$r?DGo>4juZ-lQSjz24A&yM-dX
z)mqJoW3)GAq%R#&n92?}IwIodU;Ksm{N!Z2orhh(T<gthD^Xs8jYard=fpgNfH_uL
zwuhinYR=h=@0eIFc<L9)TdKi`x?PspicUs>W2Is-yYn*M`Gw|6O3aYnAUYWFGvB6c
zb4{UzEB)@$_vVGuj@?#065nhfiYM0xYe{H@VDLdX*aa131bY>atl<`0|4~9?I_(rc
zb~kvdN%n%`&*fgvOlKEzH8NZfZ?@vveUyQHb>>!Zc0jUdB^?(vpo2Om{%DrsPke*6
ze@rD+x|hK@oz+LLI0W<93Iij4s^4gEoqF3)Yv#Xi+%G$5##4Op<T59Ng;7CqlcRKP
z1tuuD?ZIInEp3@84)@Pb6N3vi4T;8iU<7=VJT@=~9F|Y9&%lwg%153SyS0*r-$MR^
z)Z`NJ!So1`CU79*4IwthNd7F!+gR{0b!II7wTlNAdNnA3U0(bh_WLl;-ulgK#YF_%
zeedNP+CFw#g~hbbGY6rT580d>dHERx#HG}xWY^NSDNwb8#qGDWYZ5!u`86`54ot$i
zHS5+sPwL!I_ez^82Zm;1MGQ=vomv(94aL7cwc2R&JQJ7;E1X^WtksqE{HW~+)2rYv
z^TVQ~N@t}QMEJAd^-k?J%S{nI$5-j3)`>Ir47-W!*)eflHcnEtL3R^AJP7`=Ae+68
z%gf707TIxi0yCwIQ#Uqf_S$}9Wu+WvRrvm^)n?fraUCZmS>T&4mD}=Oeof0I-CwH0
zZV2D_JG0Kq{Qj(>|39bjL%VcOd$LI5?Mh2YDeWmuSJs!${&!MIZR-;C6v9oJBZNJg
z$b|ADz~{2h-taD2MNb$l1Yld+Y&<*(Qz`tH#fZYBOW8vzxdUBwn}AQ{7YZHKW-L1d
zD0S7nZJr(#Sw)huA_@RN_@l73DFeAC@J0Q6vd8<=SM{Cc=0{`AP~MeJh;lH^w2bKA
z3$COyrC<d<SJ!4l@_4Xh1jEB){n`Id6PV_(8G*v0VHO-UE(5kReGTL!?r{n;`4anF
z1?bd?<?(U|e8nz)oJ#Ld3sgc*F+H{n%`Ju%wl8*s3WpB~Lt=vb-D~MigX?-~o82DR
zFnlE98GdK!zN3R(-;rMH+RR*l2)ThBczSAWYHC^rd3qHKud|99)wSenV<_XsPTb>$
z1HO0;f#nGB-IDac$#Eb8^|8LH2pv>XSKLDxX%!wGZUSbC${2<~KL19wr3EOqmA-tv
zKn-@au29U^`|b%Z`W@90zS5j(J?@z&mrZ)D*^lTn?aQX=>-T8K<ys`_qM9s0!bh~<
zkT}r4C4aVV&Cj!Y6UV{aEA+{Gf;Um*|2ENZR0vv@1kD{vIIf#A?)!OFMVekzT8yOS
zFln!MN&Tj4bOM6v++R~Y&15y$$~fX%4kXs`e#Myl5hga6aHCA($oOI24%xA=x!(Ht
z(qaYV0;=EdnuBUBQhuhrG)|%?UFXR&Yeiuv7*4ddv_qaPeS~3d`9*`%Y4CXrpIy=u
zihMR-|Eq&Tr&8=IL+#(bJf)XzByeG1>TO68E*6o|mWJ?qKfv~(GkZ6G!G6A3+RCCo
z6HlM&9i_^lU!0{f9LfKv$hB>(wyLc{-$DQ#^Z|XJ?Iv;G8muujK40n5{N6m1U%m^O
z<5S84_J(4yNp5FxX1a;=Qbl5$-Q4N~ySi*$mw_K#^q*cl8a}O%vgy9FrhY)4*S2rm
zPIF>riMP+_Lu9P<TA|g7l`CbiA>&fAL-9gy0pQy^)~D}@>o}WK(J_?x&E*7}LO<A2
z$pWA^k_gcOwCZFT6z%H(_xY&IX{58RpJioHH<)@EpR0bX9xD;q(yfO-b^FNDAgd@#
zBH(dT*3@fCO1Ekh7lFPLM02I_M~&C$#&i`jxA{u`rhbjIP6c{rF*2t4x1t?IK$4_>
zaq)C%k8|B5lZok;S<`Cv!dx7=8F%oT>BYsTQs5Df1?>$$?H<n-p)hSRteH4(B}_F+
z>Gjj=K4wa(INIeHuLT7RRHi*VZkKUqb3TZ*jd7e>*B_=6-P{c4ZAUY8_b}OTmesvl
zY}d_lt5<>UIx_e@NrRw{-xpLW=5bEy<Oy7Jo|e>%FMcm*b-mHif1V=vyuVj`?Ujtn
z4EVt|HOO<69cvPXtTKJRd4n6$q(9<qFV}u4owcv~Y@b?16G<f%&Qe;@fZqukFd5P=
zmEHJ*H90}z$~!^I<jtk=@f=M1Bzg6QXXW|bxzq3vKil_lh5Nm!91gkV@ItP&v-rmN
zEyYf^PG)t;y4Nn%Bm33r;gvF3VDJ0~_hp-tA>I!P4RbP);05>XjI<h6ZDm4ETLoyC
zU4en3i`DO0YQGN-%vv-c)kb(|1So!VSAEFyqb!!S=;<DX>@+;?oL$V?u2Gt=c(cMZ
z68-6Z|C;B2|Fy+TXY)a=u!ZPJ@SXVyc*1QpCOy|ROhU=37b_lT=7zYXI`!b4zcT@@
zO{}m!;gktPrA17hU)~hM(?p*9Z!k7P1J@MRdL||Dwn;;LczPPOzi*m45A?k2=`Nuk
z=PC_QAVVa7#KYhuQ^pB^Oai}}E`$T_FlpaCVM2^v#akmGcSNtjxt2>H8V2S*so)p_
z&6!{t&pW5>rsZVjX-GVoH#!b#WbwYsfI=6F=vSRz1oAh*!bybX6=`AWUf+Z$zp_Qi
zqA-kW{V;YU<En)-+O5}(kEV4*5aL<UKDCM|#ha_3r|`D0&{RvkQho{!S}lxQ7Llk(
z>m2Y1mk)IG7wA5rf(QQH^>n(ftAFknm)D(epgB0qZN>^d+|2@kM^KM1<Wt(sw;h{&
zS1-+69OqMTb)TnTP9AGeVd%~@?-{+G|NFz(UjAmswokZ;xWx@XE<6`W+KW-V;8}%5
z$)yQ53oOtKq)h&=rsskM`P-pHIOk%mwbJx~yQfpqF1xhxmhA)wdNumX3t@}q$HT>%
zrswdy-6I&Q(&~*r&x@KfNO$s=XDOXZE+ZcUPWvm`lem>*phU%e>-^?xriYzaK<&>o
ztosh?T58EK9Q66C%GmPq?fvkTqnBr|(bv#!*26PO(538_kMg_k$2)Ge;EC4gzY?+K
zT)B4QxS@QxM{4&~(*ZIQP<ghCe+{E;hO02DT+-J-!q|W`v!marN5kZHWu2XvS76B!
zO9ojcF342x3kb}=Nu_W^vgVcZrZd`gMTFS!Y!$#{tkR8%h@wM8yK?+u%MBN$zOMmq
z(%gxdgI+{|h`ad5`IfC5?8)YYj*5;>-Nrww&J?-O*oc9U)U`RzeTa>2#DG;*QBi{c
zx01Q(fg8ZaM1YL-gyXz6=whYgWL!p4>%_&ZB$#l{1Ek|Uflv$Yxv#3ju@sqar}Zrr
z4I&}mqr}TP`-Y6PawCpc2F8;`V)og*XmKwpHD&qb`Y|}RO5%NV{A;!#;$O2#G6bF6
z@3neC8<E8!-?ipmz3Le^%8N_rzXpcESrSI<jo0XBo)&z3d_}||jt;`u22b*j3E`Be
zL*C$1LB~#Y?uHKhclT`n1&DAx@J;dT>1r_uHZ;{)>F5yt({-|gX!eHVTifq1A%t6*
zVCqXHD*&B(EFL3D>HsdT@w=2&U_#fB3VQ{bJ~izVfmBrOHeZV5nwap>2^C>KLhVPM
zKz=t|)Z^ow1|Bw|>{Uc4X~^pVmFxl$6oA_u!v6E0JPuzFyvQQu@5{CGZ?1ijhh&-a
zOk2K@;g=l<c~x2_iahK<WMHU&aUJKlj=p}VZwK3rze8uq2hMev_|s0w*<q2v7Th<o
z3?-hKT#<hC90Pqj%r31*!4IGZqn|uREyi!LNIJa~uXVlZKN?<Ibl8f4cuO@Z{{F3@
zS!|zP6CJzoa)kadyQ=qE`N>ZFr!SI5Q}%Cn4vHqT@9}Fy-Y*XlmP!HCt$(RE<-3u+
zMD?D|WFDR-lH;YHE#J<XshIEjeq3V)>gALO6i86Ldj9oz@V;9}cYOHX$^qAVwE(_i
zAB^(O+3>Exf986=DSyL@{sg|Wn*$t?_{D-{OP7cfk@SvR?#Ge0D%61bZNeqxNXjgQ
zAwU5b?1^pyi)^1DubB!#=~Z8*76>Z{Dn&lYxafMGN_<9EAsS2zmtujx;-}A#QF%@d
zMm!?#0tfAa?)ppc%I3aL)tW3%zq8am-uHGcqI<pw-HcGeM~bM~($h=~$J3=%3K3kU
z@m&qC^RQye=g+hZM$6uu7q7`_OA|6?d56At?TtpJ)Aux~mgYBbBP;TI5ncM-dxG{7
zW|&vzv6!-N^=JN_w8)>$Z*ApyLZTKa3{*}F#Hmt&32`9PmE}~Ftr!Abiagkxby<hC
zyBlm|mo7kVMfH5t;QZE7m74$4mM<Tn=cD+#-=2Em_F+X|N96Vkgc@@7dt#0EYg{a8
zQ`?N+){W`zd6pw5CftHN<s7r!JHz-XM%U}Hz=Y5fvXrwFvB(hb89^j5&|~Ihi?6m^
zsO@|It%E`TJi3HzPE{X=+zLsexq>U+=tgp2`e!qA>*ov8cac{Z=)URUalyE`Ia|OZ
zp-+o#`KxMR&hAY*l|wIue;b@HnWf{1itXa^{)K%14V9c_LXH2`Pt%gCrmgX@iGX<j
zFPk4nji=KeKNVX3TwuZUIW9PyUdg9-v{WF<Zh6CEPyePmUQjLeD9Rtkpmk=WUsE?f
zM0z{BnywHE^Z7M8-nQG2c?@RLpS+9sN+W${`XTF0dxDu7YM>?VID8%z8r&1+@b0D(
z=>HT8Z*aXUu^aePWALQxJ3mr`(EgJ@v!Ix_0~0N6!*pdsW8<1G`+s8>62q*um^_ap
zJ)w{>Ud;o$HVxpZx|*(y{HHI7q1aBRyzj_7`Y>B5VdCM|4eE|b5Vp6gaK>6zQXqwB
z5)|?f3GL1{*EqhzFvKZSX``$PfSV3{56zU4*nK3xLBp;oYIbZ=S#R>IhTn_99W+T$
zbbWf1Y(Gzgmghz;X!!U!XHwCA+@qL)BTlLwy;~G5=Xb)dOlNPm-t^5(9kg>`P9s4`
zpLN*f6!%m-MSIsfW|T|x7j7m1EAm$LUPl1TG%~A-ev$)`z=t8hLb4M|@(9*IC6{q~
z^nd3v1k<B(4xQ@Cy-xmG*xFWkRdok~+Y7(mFG|CRh=QNfe?hhxHq@CjGd1F3IUebF
zD2%wHzexYsP??)~RZtB1iXrrH1LvZG_0Zc-D=K*x_6$`$ECE(c9v);j9r<^0>c+?H
z0s<S<D4Z~>M(w3b(5uM;Pe?Dr?@LL>HU>#20}pr+r!jUJoSujpZ|$g5aReogIyxpH
zZ2||D?%5@ekE=Nuk(Maj?Wl$Zg-e81O&J6A0ltD}W6i>DiN7qdmD1E?I|^GE(74p3
zs!*m?RaFynI+5$^S?pv-LM}0&p9wLX85Z{q0Jrphiqm0v=^coI4dsJR<o<E;V}5qt
zWgt&X3APhb=G}_}sLwC{&{5byUA`t@rbYNj1hdsZ--v33SfBORZdKa3Ua=~#g`Li&
zkJu}}HS!?GuChdkjAr*l`FL<RS&#V$SB^laK@x$>1w{gVgLsA>vb}Z`{b?O+9By{-
zVul34CLtC5XCK-|A<oB6&%o?lPnexcE5v33RPiGr5ecpXk{028mdTp-$hntq;YE5q
z?FdA?FKi`$Ns3`~wka!X#Hb5>lFJNL)&r`fJ{WV=IjR0|mi2!!fUvL?@<`u9Dezae
zca%K}K$8tY`23)KgGAi}M0bmwX0XH4Zvj$#nK8P2&rJ0Qi>&n3h-xMO@!=*oubU`H
zR0I_ruk!U|CV$g(>l^`@HY)Ya=zRfaUM+1W)FQ7ht~2!d(NUCPE#l2N?TWXx4*JgF
znM~q)42#dYk*_Z0T`)<{<Q2#6VAMd1JTALsf(pDc_9;}$)I_cDwh~GH3k5CG+_j{!
zaUmM+j|^rM_bpd0Fs;BG+wmYnVJ=#;nxP1Q2Zw;59u<-2`<QuJ`y&s*kp1u{1ntIA
zE9XWLZ+7zt1eY>~>VAI8KiRr<rmWhZ^x69K3%Jq3bwRwlZ-cN7#;Y&s<*-obXmtiD
zTJVEjX3EketYSuWi;q(;etP89+cS>O<6cpX)C<6;Q-ss2hbN(7v!fhFAF(4kRN7pn
zq1Sf~%;)K(QpW{(_woiLTz)up;{-AxA!Ha&o)OgAXtfIRS)HQjN?1}6$ie<fu4A*k
zm*GoQ|E-!=0@XM?qiS90_E>2nvL_o_nd<?l==$f`?sDSu%5rK|%6E@MoZgW{R|Wgi
zgf^qSU9c*qJa>bRkeJ($sYP*P09x9b-%9@Ug5m-QATV0X%lB~^H?Y@c*ZZO~3R!S>
zNkhMWmqO{?(ox=JK(Q$dm6DwduguC)kt)Z886B&zeh_?v@{;ZP82cjm+o$91=nW#z
z&l?@!acUF-<1y}T?g_69<N7@7dAa$QpcTLe>)`u}0Qq_^-bVeF62)o?0Caf_jEclk
z$0Z$agtWcBzR;0Tvp?6%-*)UK-CbXNkG^?^awkzcSmH&FM-sQXRcoDHjWSkl1L=j9
zQ`1?YEDra3`D+5aQ2E6a6_?6|^UWE{-o&CJPU2zhbECcUJTXZ+1?u>^MK+iwoB50O
z-`n5^#VKS06DFf)+YUzs>xlWljYMpCO#XF{*WZTo%f6sWFs93Q8K*>W^mLL!Uo2bP
zg1#ZbYlt}BV`);487K<gT0A^$TF^Q6Hi0GII^X3Aj0Yiwxh^p=JP>SbK&fi8&cBE2
zo59zuMZ^6bzis}r0^OP+1Aq^aXn6cjPw7Nf6;<M`aLUL2MGyjtgWu+I`v+e(=L<Km
z>t0sR?Xn!L>IC>BZ{y37H&@LE5?NeUpRN=RyB2@C2C2bffK2gZ%IF~_i!rxB_ZP4;
zwr}z;miwj)hYX#y)94AA8gPRr)zRh+b@`B!_Gb~1J2I22#l$iTHDe0@{@A}Y*zQ{0
z=;yi~a~`S<cSC<nfX^e##OJ?Gw0{J_u!AeB9)!QdZ=&sD!9k)JM=(BzTI5WZ)1i+B
zJ+7Ba=mTCc@5_Up#?nGPhfq613B`Nd9c*kLZzKi*9x{`1VX@>-+PD;H?@fI*!>d*`
zBD!}CDF^=rhuJauPM8gF3;XR8oJNgq9J<8!hF3;il4ZuW9k65sj^IQ>+DfyyU2M`_
z%%e3JG3TaB3GLF{bw|{pD8HFx<C9Z{mwTo#(74VVFiwp2K}9<ZseYEI{7pAp)HITC
z7yvz93d=Wpur&R-pnnf)Z4&odFz!|Yy7Srpy_5kyoh*60hnCJVu@=j3m6&+OrQD^Y
zV5qCrTpd5Mn~tEkDn6M>%IM4S{Fkuwf(ARS;s5Dm`1J<C{Kq5(Tlqk?XdwB=M%XMo
z7Q{&YH88TMxN6YGOeCiZsR;5n5jb#wQpdq`PsEOYBoEgQOV=8ydAqsX%tfT_9lgDG
zP#q)0EX|auxR0H@mFlKz<4Ggv)W@BgC5IQHs8qTb&#;p}BbdQ*he7XY!2=0`E?}qA
z6kw`sTKu~C`HYb5dkTF6XLmy+-)uH1l#Y4c>;LH-A7vni9U!t#1NlDq+fDE~9DO)4
z-1gS*m!@V+An#A3o!RT;=aV01*Xa-Yg}1c(`-e2hQAEIdF4J{yJhay^nK)P2YYAH2
z9n7<0`j9YZvPH%Cr*<u%Bw#K<IG+Z38NjXJ`2O?h#VeN^42t34vZ2lWYk_iX4Go4g
zq-^t;@md}~0`I2!IhOSP9Yh7kp8biv)EI9kJW^Zl-)eOr(h_9LvyNFT=%oCJ9R|jw
z{k;43x;%T|&MUZ-W;-qcYdXk_PxHW?e|;DxoS#M9^O4J{dM{D=LMFhN!IGZ^EG}xp
znfJWDy;bo(4A}ugUWX3S4dUuehAVt|H*GH3QTkibzakS>6{_rL;At(lIgwfROwEu;
z^f*n1Xgdq<efcG_m0`KU)`GbC>-~>lzF;fbE`K7ZCbgk9<IoTz=}r7J&MqPj?@O`$
zaEjFuiSrs&1mbNf=hA)d6~rJj*MG_-85YFl;D4jTiZ?Gow<(^Z`7>ko%V-_#f1)Kn
zr63^C=tSKAl3NS^`oiIYgPM?e@rwD`zm-;V*&ssyaYxp6KbMKa$*gdD?9*HSh@DN=
z@^C=zpcUIK^l6+d9V_r2M0u6<zf-I;)NSaz0eMHeQB}oT-Mpx8Rw&0fkl9Knp>{eu
zJI(*+p<%XJq&M48J^DpW`RIk38RQC1Hx9%LeOMZ3EiOhOQ92fmdy^AHGMqIl0@1*Y
zXR&5mT-05Sm2k~hSD_&x+_o!8A=ap2ocj?0gZ<~&m9tm;_uQP^f~Ny_b%8}Ur8c#F
zgV_23%OlJ$e#bk1vh4gKj<QmT-k`4DjAPkiEB!yREAh5im%awt2M25(=Z7by(rK<%
zKQ#n6Ic4){M^6Yi;VY%G32op)z&EH+2Sbvn5f&eu3={e5(I8p(!+PD-blR!in6ox0
zS%vzbV8U@QXg5H+Z~3;OBF+Xh-DKo3B&CUf2Bk0}MZRwq?x*JJhlQvPMXH2%w=<pB
z#hxxn3VMOWv%ODzLWZe&uy=FhfWp?dSTOk`WrkTnjUG&uRXvwg`Xeh;n~ewYVh9nJ
zu7erAAMA!FnuQ@QQ5ZkRl=CtbYV;*5uP`X;S7rD?Bl^$(^78snl;dberzLhZW*Zun
z4W-&VyzkU=2dJ}UC~77q5Y+*gVkui_VThu0Y4Y4w>r!uZZU~fdgjJkRxJ_0;rDI)0
zOaf2XfA~En>W7Wpe|sz@IEbo7c<{&E-qj;Shol*@{yz(#F?+y5)4W9G*@T<cerV`P
zG9aGLKGQ#wS~V0wP}S~vo{rJlXjMd6B8$z8TLUhO&3GBbcD-q^>j?vU3;A;Qg4z3t
zaX*SRtJQ-%CKg$BOm~z|MSSO<HPohGAkKymmh9(UmCE+(68ckb|G`gTz+~Q)%tqA7
zjc6TUjL-O)ncP8E%sA~2a|B?@c$5)7w-80ltYdW*7b7yfrE|rzP)V~a|N4R;=()@H
zdi5^e*g*K(=Iij@@x?_AMqyJ>F8p#X(OSpI^hWsfmOcqhNFj0Qrf9t86&x6G0L7xp
z{7Wk+RaAF1Cq!MF`|r*nD6dz&Rmj>uFK*B*V>57Z)s2Y(gTXoL^p<qp`;Py=M|PaJ
z%y>b@GW*JiBcuZ4dR^wfz4;Av{cC$|ZfZ)(#1-DUeRvrO@vY%Sw;dBZmqmQ_K*K6M
z7|Avrksc;-6*4J2d|Xg%#3m{t>X2YQ4Rd?z(?fy=83}!lyL@yF6(1|E?ix<I66;T4
zaf{?8-kO`Mdg}YT_~2u(L+wU}z#co|Y7>-6*brA{t3A^wo_{k9vX`-=2zd*oz50u6
z-!Ic{NDmLM$X_8ukI_kIai%wb?ftkAh#L=&SxDPYU&=5<xZbpj%ra%I3ToK***(QT
zj{*737X8q8jH~2g>zjao<l0P{0)=RJsj%U(_@TfmcAC})hBFSRuZ5(HsarBpxAl@;
zjh4NXWOlG6Q(chQL|jULl4+tmt4ZGFk1iDY2RRRf{r=&bRN63P6GI-dkOpk;?AYs8
zQxZ{M$zTY%n_UDRQ_<Z%KEQrwwcl)mK$pl1BIsBo>r$+{e|mV(=!^tH%2stApj8;<
ze+-k<9mprV8x>Gb1K6BtKR~X9a3nE3Q}d>L<}oNV7gM^coc#^>fBw+l0sa6-j_h*<
zaabCJ{63!L@ADGlbMm@Ek5N7;*RcADMvIp`7Hjk?D|&5iU&(RnSpW0N<MY6A$9)6K
zO=Atf!}l_7DTsP7D33arstR+Ma>%MjvPDaO;e}S1$t&x>IHQ?m>rjaNE<~(1b(4AR
z(sv!XF@AP9c9DQE!Lqlb6QZCKY<d)!KF}b@kr*6uwe_Sh`vaHsq9U%G>#<g&QV-Qv
zl#l{MFPh4T?S(R45D=&-M|j!cfccj#;Nx_AVnGKZ!bIc+JE1<!%H~#Rpog*P^C3Ku
z<0+^hV3e|Jfium*aNC=$TSsr;_a-Q)3)>MCaY)v=Ui~sVnoLD~6={bV(b&b@Faa5I
zu{LK02Or%-#F!C-{rM#DW;WeWM=$B|V%!#$6lIIE^B&(luzNO;pGYpU$CEv*<s?2N
ze5!co>hn0-QM(<B+%0VBc=a{Rv?2r>{*(*Xeaoxp*3`1gWCNV6WPxNSZSZQQC@NZ`
zid9h3-e}4ivdlcI5etyPz2_d`IlbKIVDWu*=@=GPR8&lLUGvO&Om9;pe_w|@I5-$v
zhMcx?S%MoxkL;IhH<)`@w@42;ad#yoU|{>}daK=s%P!lFH2IYo`M*sK3w35Qv%L7v
z_a73YxglWdNP$Ga9s$S&?Ym6ke{K#v^upV1Ftx2Tr4#2+=~~7Mv4nJwrZhX~U_6};
zS#9F8<EpD4oOV_BoX`>zLqerF%nt>cUi6pOVDX77mQ-Uf{i^PmbI(_K{J7_vL^<dc
z77ZhH8b|g3y(>DNEwF_$@o15({%-u{0A4OG*wFW_dB1;0xt=Z3@Q4Ut#o$@6eX&UH
zwO7pS&<j+;PJ=Yhp7~_VHT%!OwYp@qstSQ#8Volwu*gI%fu_yS$04e$r?Cmfr0_@}
zbNZBKvsu_G4ir6Ym49r$Z6oN>LQ-eTorP@_Oz^Taq}NhBvsn)~Vx*<Wtay(ar_}nm
zobBvT${_ylpc09sM>u9cP$Vy0GQ^!)9({#)MhBXk^28||Qa8KpYPnuiyc>+BNp;5?
zmJb(YsdvzG^LpYr%rHrTBpH_>ot{Sz71t7agh@3P@wj<t6!UaUo%e0JZBwFvM7XzC
z0RTt{)##DG4)jUW-{4q7LaY==2w^SP@q86EURNdo5UtAJ=5R}UO$9YSOrB$3VV%`U
z0d?tL_o}tJZYAXec5o;hdnsl7YIGAY$f<Ss(<2~vt_wt!Xzjv-C_lOYT2CMeWk<(L
ztU>lrX1J!1FI)%GYKyx#V!I+u;GcQtXTTYU8rD9gRG>#T+53^u=YJ-Wa(>Ahoz{Pg
z2*a!z|HO9qXt(j{;I)5)HRdn4DpF{J9DdjW>GZj^FR$9u3$?LAwt`haY~|JbrBdsi
z`mWb=e_BiJ$Oj}(RQlX)8F2&4*GP1f{iA{*mrlacP?n|YHx(M>A!Ne1+l{sQ&U}$?
zvUAY}wmw3|f6jkKQ4{hcb$d9#xmSv=PRSj(#$%!QiWD+)3yP&AC=3R~j^c1t<ymv(
z%$burH;~9~c}deC$Dt8=1yftsJ?;CVT8MXlI2D$q!~oB|4j4Q`GTJ=mQ?QMfa`now
zQ^2;}XNVEGl{o1m`k${3M1>BP0V&O!I%H=GfwRS~LPouX;fc()<eYDhcmvZRcD@J^
z$vhI)GVr)&!}O?VKVshpcNeP4)I#KKVERoxU?c;r0gVpc7+^_MR4hN<w~Lf2n|u5p
z?~U4Xj0zz>hcV8g!*cPMFrdBGHluW`!?9RJ`Ik(RkjmCF_qmKLra>qQvZE)snHjlA
zB6i?xdNUqjDmTozG_H19u}>)={i>vp8@qK{ND;hu;Uxup$D>eG$08;shYZ}Tk&>3R
z!1`|46Yx=(pB95l<0UQ3>4$ALg<2%Bcej)`j9wV>JY#o<xml$n=^^EZ;4{49-H<>z
zeEhL1PO(y=PO(JN*_p_Qq9<^t76S7+Mi6EZvxq(}8FRuA@6V7}6VHyVUW=LMA8@qw
zidJN1-{^M1``03?|NfUa5Kg7ExR^5&U%>wg?2?i1;Z;7Y?0GD%jv!!`>Z9B(_kV*m
zN#m!44{DOLK5+gSo2`d2t*fj`cVe2K9?kdh@Z6vOEv>App0$-0o$xRIpE*kWNR790
zl;KH9G*GbI-?-L;_q^7vVHV^KTDzVSEvs=Yy8cwm^ZvY=CQhoa56Jx*%A51P@GOW(
z@nQ+x@lAu|H$Y3z#vQKXQ?>Bo3z}m*%t-LdRPx}06m6M9CsAQT8D`F6k}#FIl^@e`
z{;2?x^Gn%>i2rz{rcV$L!c|Yc5m^GzNPrfjX7M)!OUbXA=oBaKUs2S%;B!5?jr1nK
z0|Z+{>&o^)=P%eLIM!H<S@_35dj651^KJ}HI}lbP7Ke80-hAyz9oGHo%l$X7TcXIl
zSTz<rLTYYe|9ehBs2H7cyIqG`R3|<5dH5;VE5J3;-0JekrUoS?y-MDV_4546Nlmwf
zEWkNOcYyR#S&F~#S#I-)&@iNEc2RoStq)%3;1cMwMTfdpJLH=I9123BWcT8EDkHu#
zCX<)k81@u3wP3&=*IO5%DD)kJjo_d@vQVtQ0L|D0>yxRrO9u~eBH4LZjcmCG9=Q2y
zTK(iiol=qi*IZ@8p_P}6Z+zX7Nt6wWB?si2#EZZk6DOyJcEXax=6^1}>v(5u9Vn`1
zcLME(`n%!PU%*SEP0u3&{`dQT)_}#+psawefkSZA6arK+0!9s9D(V&&uE`Fh2b{lw
z&>&CYY>3??=V=ruV*A_gN;ECy9G)dJ2zyjHRddpGmBHyYOex8w>jq?-9hE&=rSiGq
zTb#gXldyZ$9ejVU$S(vZN3}wIo{iX~%(NOmsJ8{+yF8!6$rz+##KaT^o=qfgTa*M0
zEcCgaY(m!zEC?`#_E1us1+bBYvb_#HWddi`(%}=*l#^0YTn5C$x2HlIS$wX)$O&0x
zt6-SA2uwM@2mMh@dD*!a((9F!pOZ(%FG_)>Af;O{#c{qn7XR5wh5P#%eAE01Vc5Ai
z<cTXC&f}%b%5g>epK<5DoLj1v102)r8v^$LrR;7;Qsr7cg{%MorDO-l-;k7jv~+ZS
z>j%z^V7Woh#tkp{s>D@|UQCUueqF0tz$vkdb?y@$&%B<qPCe}5KU+GkLSdY$87nIZ
z$8os5xd{#L$ny0KxKOB-Cd`=I`D^0z^XK6dJ4OTxmlrV=Be|cZnoD8&p`ej)39=A>
z?a2PBC>W0+0Qz!?nj|7hU&`S%wJus=T`?<<Is-%ld5qc2v?bd|J0DFAg2&)L|9t1-
z;!+P59i=;IQ0}@0J5to)L+Gh$Kf$#ibp1g3M#9z(ngM}IEe5%#4Sp!_R50Kjuy?)3
zC5wW39#6Z2jf<zNejZZXUpyub_@#NM;PXDn%Kz|`zJoCXOGu$T7Ety82qdu5hD)n!
z6?j9|<KIKP|5Gm^UF_682{Gv+^}5WBzozYe;^6w@q25SaTOk_R#-saPlb6WXHalrZ
zoCr_I;jB3|{(5MU&Wg2tEc&W=wA8M<{H!ECR@KliN4<N<D(mc#tPWg}g_&uB{6s7*
zD!x@&G=Bge(jL&H#SX4_p+Ky?s@7?i(f(c-CWu#T<$;?i>X9;4+A?%|s!A_nNW<su
zYJFH^%+ulD-Q`$AGgNh_AUS(RWY}xQrgk(L7oX$dPORfXnTmlO`BS2uxAY4}BvjRZ
zM6LV_xH^NQ;#^5ukwo@8VTk>0;)ceY@sV<9u>Bw(6>^`+*u+E~^e-wn8jAt#sx95P
z&BJ8oEgTRdn1V1jq3cg48qR5YzUh4>KtYd&iTS7R_!nozCaU}BYXc))_XjkSe;a&}
zM7#=QOB|-tFE`-~kCE&9I(l6<bhqC6i0~IZGSXZ->S*1>xISONa;n3(LpO~b;6Miq
z%)Gn9N{lKcesp}derRI}zT`Km6JQn^@kv$oTAD(v2O9|{<{_EDKa~Mo6r!TbADjxk
zhJNilkgGZbFeq$;s+gl5)|ZD&)v#FcHk=r?N0e}wu;o(E>(0|V_x}{H&<1;lP^=5I
z;lsovB`b&TC-}|AF#Z@WbNfuUE$(^tuO3qv(mp2ZjAyBMCIsPKbv{H<d)cB=WN<69
z%BuTdzc4vu!G^0U{w{;&eJ~HwAf%hz3ih_=*FX5%ZHep_eVborYb{UCsF0#*3vUyB
z`O)Z+f&QV!PeNq}h%f#8AU*bGWMq`6E>#+765~I@^co!Buw8fiG^jsc=<eMbZ|>)>
zK3sCAtRD7s#_D5YgecDfqo-g}c~v}_OB^y(2xD*sk?xpy!0iUYW%NwFtLj3#2V7gp
ztdT+bE=1=OBPz?67ze!{!C}NaH{Sg3eU%=!n_2sUi5PB@bLWEy%8GiAAO1fuT?+%G
zR<v}}NRK7Wx-by=J}@RapKZm$LP!7U9L(B{hc$b+jduU|9!Q#yrAZF_Ek-{+DmIZ1
zLF)R-!D+h^7ZF)>v3&fL#OMmVxuim+%q8ZEz9oLK5RAsEo#A6+b-K$z-rjYdLdoU9
z0W<_^(-2}kU9N=I3ch@C7rMuIBP~=0@&(sXuclkjeCs5YF)GdBM#_~TiS^+*qy0)w
zJ`Zx}3TaKFG76!lx6kh@oX^P!zmF7g)1VaNLSZ`sgrX0{g{8wi?4OS(aZm3oF^s}R
z#|iITx->@)HrQ)*E5z`TZzrzR_KqeGnVdeOs-zu;BviAuJi2cQ+FZ=(LZ_B<SB!2<
z>KqaZQbX*TDr0a`2t9nbL@W|$`}wiG*(B}r+|2Ei8ER5Qb<}n~$H3=ySd{Xck{O@q
zq5L>6Oo5$lcf^{?;Qi6t2_;rmCX@2-w(fM;;bxUj_CWM0utT<7h19g&YP9?q8^-5)
z*C4Us*&H!4TIpb?5lSkmT(%;PBejr!83C0P?pTcs-k49^S!?sgm1{Esr+(Lf96onE
zy)#%nD|rVEg(NG!gMgFBJ5v2qKO$k5$@AHDz2RDBKoXjBq+?3sGyda>gFg8^%19K}
z<lkX6JaSrWo3c|Pq&g2L!KTx2UO>aTz;YXdIA&f{2*~XMW16d%8s#b)mKwPtL~RD?
z110g5$6dP@!0$6WNIRKiYgNm+UFCievz#I2Z2+4NCx^eK_~T_ZS8LB0WNeX%7vv+5
zn5Ajy0L6f*LPvhJkr@)|E{OC}R<D1k`3fq$HFULtP&v4Yg5mlP?6S?2>q#e`$<F1?
z)TQ@GD5!fw7eq#yNS2GTLcfB<`ltoC0C<10>2W<Frx~|l4CwPiZafa34bB$TQm65f
z=*NIMKej%5bwl7}WM$Np1t@&&#p1JAF{yHhW%A!N_HAg(9kBx8G%>@f(>u4KrZ<P7
zrn|p+H5A|GGq$Evt1e<45^G~DDCRk_C}goJk6na{wA3mNCeK7I?E0~ay>=O&fW&_2
zcMURRaT;dWS}JFHuFj)7ovcuCSnAU5kv)SWwO3(h3ilQ3iuBNpo5jfrywaXYvwO>^
zdh)6+!9U}{on)+-JZ(Q}VX({DJq}Vejn9|s2{iC+;eS@sixlhyLctoZwb)tP1%&Cl
zY|W|hJ5T>d==g1SE@X)_MQ{{^tVuyiJ5Q7e;`X+YGsbTlLKDpN>C<|c+2z3v-+NQ@
zp!-X(;y|72eT}v5F`bM<>YT+8xwgP9MTSn|TWI!Chc%2u5WckK`%RTHM%2;JfrD{z
zQG+g+*ucLFQ4{b)Wt1+eoSqj-yHaw*J;q6d{Ue5<aPoOwlna6BqVm~GpoBLqf~{vr
zP0e;;FU!HNC)7eg+|psZ4o<ZFZ<KLR)IWq|g_grE-DvBbBP0yX(d74qk%?-F{15@q
z{*A}SA1<fO%u-TP`T@oWO@K~}L1=iMz=htogHT~8GG$5$RGKnPI+^H#&d%$#*U1c?
zJvnuDfo|3RkXAErf%EffuHg+T3kzw$xEq}fICAHe6S%s(gH0%KB9!?JoEraw0ZXNj
z?V*JU`|w*bpejo)hZmEn^F9d|8x9hNva+HABi{VENWlRMR$j@Z>ov=a+j%i4ILtvd
z;5noK$A4Wb5gR9V&+Pqpd6sPFgz;>orPFfqUlYY7<2PAzk+cIrj~9own-8k2iQN}2
zp}vRo+{r-}R!;da7OwxMC{SRdx2Rv9^X|jhQsoz*WTBj<Au*2&I6NX6{AG>ssl1%K
z?7NJzlae>Si)(Xrp0m9E>ubqjg}%0m0A)NlZDQ8%$zldi<IrH#|J9_povzoxWR;PT
zaBP_@+n3qn8fAs<#!?-gOp+*=tu!xIRWUb+jWGl2vkYhcTt-tu@62?gpq-vb7z#vY
zvG%mwW`_5gOMS*&y)Cfp_FTGFb=a9jn}Reh@Tp*7rPE95B$TOct*(8byB|@|&#9gl
zys_8yUAlA@jT5o7pKZOjkJZOy?pf!BC3c7e7r@59l)jopq-v8<+Wd8iIsKK6poQ#Z
zq11c|?3>$yT9f*V^X&t?bE>o2dV?F9xsS4)#V9EyHf$8}=FJ+&>F(9B@wK@%LKZb8
zVsXuw>bkpy(irulz*KBf@JT%ML`u9p|5(x}=|LdT&jDa8-KOXfVQ9p1$PlQ)(6{#T
z_b)XXvfu9ty75FH!#Ddb5*)!|p_&}uTzaYZAZG<asw<!~bhry3=U3Cy&_G{b5n-yr
zXfL@j3il}rxXl3>$G~?Xf3s<5_u$~qWoB151p8rOFdVzRqLY&ot#~J@JLsa-WU)${
z6oZa%+*a%`>gHbT=a!I~<gN6CkT4K8!LlGXhzvtT8k_4e`}_%~fu(iXAkv}xRZhK<
zxpmVfqMd}0y-(DeOg1FNeVnLV2WW-E3kT^&IQ09tULPi^G$a4Zc#*tp{f`zM&dpy9
zPX$$lN#Dv~!Wwo($n9yw@{YOh8Ku-U(*4(xqD;OHSA4tKc{TrCi}088Wv_Q=n1g7M
zp9Kyd0R6migJ+!At-)`R=us;M-C;425tx87)%(m-@wIyDzhfC2s^OY()*TiF<Si}+
z4h=1>NE`LF(BsmuBe-O6dCf@kR;E4n-|j;YxIGixx4K*@U5j^jG_46ALofP-=YB4J
zF`xV{a{^bE#DP^apr)aeSo_kIFA)Mpg3HufXnqy+xw2co8&QSBtaZ1dDL)sR_l`Rg
zg41oG+)a_iGVa5PMqae~)fhPH|9%4dEY@B`5?o!^9&35!#kKjuY~T4|Ehee;j!q}9
zsEOdv1`#jhNcHiuI9#SldLCMJkAe7u6-Nm8#N@+s#j3|{mqZ&q)q0WtZMq7B<#F$G
zvo7V9G+R7U`5aD);UEuv*O)ZncWxwA8Zc;F+>@EQ2Mx;%(2P(s*mqVt%y2i|6BVny
z`%VwZH+cPJJUP1!GZ=PYJ5y*YMwTffu3i+REkcVHKYb@oavmH0L8-a9OqJFm{pR-?
zMKPVzSG#pH!`5~YR%v=StSeCYS>BK7Y`zzCLuD+fOaKYoP*$P^rYXti9Jrcfd0g`9
zW5B&2(Kje8zP%N-BVt^|d3#d6%&O{p>EK@a?!v4)k8>3MUQ94H-g8`k{svC|V=#8z
zQc`%Rs#&W3LSrH#3klbKowHf?oMw=U_-2wss}B!xHNG6Cy~GIlR;;krQs#Bnfq*i;
zqDC09MD268(9Lqwru?0s-@tpr_4#^(i}~oc5Ggk;7DuL)HF`7!9d)zEv&F{?e4Nmu
z^o`t{u!9L_!tK+_Au^|lAubG+Iti*d*0dYB#xzo8`@dJBuBXK&^%kfwS<H#eXIp{7
zU06~wv#ha*m*Js^Ck(6PPmc!yu#U{gZzmJiPQIkq_@&YOLlL8nG1T9b{ufNQj(WUI
z+bd#<;aWl$oh%K?DQ<HKK%s`vv3#_Ds?*HlFt2up^oATA3k}ZV;roKoEJ5_mq=hWY
zUJ~67Jt51+oqK@_|Ca_q4)ud;)KJ6o<@_-P7!mKymM(5C8`#TC|E%+p2UO%>K3m`K
zHWXQBEKVa*ii0!gB|E)?{sSyzVLj7Jx}MS-S%ZG34C^o3=#I#d5@xfE^E#kkG3yap
z|AyulxvWE}ifskK<uCPc)9It;7sR%yf{BXNdSWl!ylST%=>EVv;R$~K_Ip(06?F`=
za?4iNf4uylCD6?*S2qbDr4ek7UGSy?RR4+Xey<2ZLUQTXcu<xd%n|=FTmI!-J&nO2
zlC3m1KjjhspPu6+hsW6gMTYyHu`*&SFo$)k@Qr^ULceAo^K&qFy;Ll)F8+5BjO4?x
ziJ~CY(R#d7-x!l1m|&?!y+L9kAd62pD+vs<AKq6j-Am+iz%sM4uhY@07jT~36o33R
zhVZnL8E#&_i*deD9(Rsic7IGh7F>uHi!2DjD$R2Vf_u`&O8*h@-p7^aA98{{B>@QS
zzV`+F5vq&nD!yb?I+^ggw#p_Y)DndPs&&{*K9!KV?GfpR6Zt(0rzZ80uP>9u{$P_J
z_&=|CC%DBvzoVl=|L6JYS<T>qGt)53?oE3UA*^nN=YMuKIZ?)ff`ZfRJGOuBO(DNM
z-I$@N_r)~^{|R9nO#o#*@<BW3#Lj;yG2pzT3xe!ueq{XG;lNoJ(x9jwZic!;1qeSw
zOieQW^?@Knhv{R8{1buZFqX+f5hXc>mCGarR8Ef$OkTmBR+64*Q$i$+a6bhHlC)my
zo0(8BR<Jn=sWX^-f(C=<NmxsWT5LC=KffIzD7uwIReslEXN<1IA!&k~7h0k6goVBz
zYT)_^Gu!eD6Ot1oB&_Lk|0}s&PDPl)lT~`1=L#235X1FxgRSRwK@frMaB;Tu$!O+?
zCJcm3dA^rua>umK;6mW)f#Ui&`6?Dw1>MP2`?`bY^LU|1+b>9BFSTw?qmU$o$LbS8
zjckv?^kv#){rUqf%o%1p<EQVp$xPuM9SdTlEKWNW$GUg0)L6zsJ;s^G!Tkfe9TEbU
zDnC0{13z2PmlumsuM8i;@^5U79;~2N&b`+5>2B0)q1>Sq*fvP{@w(Jadm#DvcQRfz
zu71MPf^2)2R_95Coi&B(Yr#GDQm(rSLs&8xbDo&gr2XFc@JdH}al%$R0QE#aWSPj+
z6f)fL(^3CmzKh6R(dONKd4^<UoJr|yueShoxy`5(ht3kHv)08gM<3iX8}+4=t^0X5
zy5hAx?+BQ2cmH_LCP^1pvUwpH5EaaRDcrA6Ojpw;@*|}%=4=Oirq!dvJv{jEyL~i8
z#9{s^P@>Godp`sC_253wUGw)+47zQ{*sdBsf%*kU{8v?3Re~xq1>XGcr(LiG$LeT$
zC`qz)yM53f6;{DXYBQ16idl5!4ot(tZHbzlY7`4h02xdsT~Cd*C06Z~0srv7fZ>Vc
zY??R5>I=;>U;D?`V1<PPZ>hp;1U~aR&jQ99PIvvGSMbDOGNZg(n^jcVG|jE8|7crz
zTkcibreD<B`doB2+m@!1ar|Squ!qrxj0!ksxX$_Pyz=!FMp0s~etO&X%scuES_iFr
zU;edd(>l38rzz_F3;0m;T`qxV5lPLYam8$B<KxqO=1IYJ3Q5NqLV|-+`Yi5NyUWx_
zm_d2N)vM<ZQvWLMm`rwbnvz+tu3@!8f_X{)wfy)b`RiX_Ga<8Brh?eM_!NsZZ1#p!
zii^G1bQ%|@OzJsw{Lrm~i@nO%{^@CC!b|%_H;xMaR9$s~@AkjM(}YCteUQeusZoox
z*rU!Uf4$+B243HDx7^YXuKLHJLWMo9FuZDR`99^Spd7s^Yy)z=J<yLVqj^a>uvMi^
zlygOr_@Q@(C3c=8A|i^ay9G9!`o4fB<gr3U>PhkODv=-YbTAl9FBKKU?2RJj^crkO
z`E`G%$2IA7CK7U72o~486IQ<qJcNu$QL!AG?UL8zcUrq4W*6fyJNv850bJqwpgf=i
zyzZ4+B}L~m_|LoD5a+`n=D=L*6Y^P8ddSIa9&~WkloBDVJa3#3+Hgxq=Qj|a-*<t5
zU=f`Ps_QTH4qIJ|u{~SLwI%e)YaFP9;$0qVTHWVtsjhxVCx~;9Xot)AH4VZt8|iU$
zwOvTFsJ#&@m{9(BJ69!D)8$#|tB;G?zEj<s4ORjfU5X!PF&eS~jat0%5^uRUaPdDO
zx)bL+Zz61|;A=cPu4fu+x1(D>yw4%Gn^Wxl&4zor;i1x|xdq4w_}?gT!Y094q<`dD
z@BWyA7qNC2U)vOB#@Lau+|HK^LL@9lwgX`a!Cxg7lFo{v@1{7F`%)X}gwu<!7?R}5
zb6J?z{{8hqCbJ&AaSxJFQIc0+0YO92&vrYSu7s3jR${LWKQTTuKia;mVyAj6Az)7%
zM1FgP6Yk@4yNo)&(4oE<1zGg`8=M`RIMm9&)p7!S74-kaRJVT&G<_JatAneqVm){a
zzrHVG8?+(t<X6{2gEg9Ky_oslXy8wT`3L>_5l9h%a^?4JcOyO_vl5eP^Zi~H5fcVI
z%`OWdZoNI|akH9Nhu}Wxr4IBEH*`=b{LPnXk%FH)5V=%p0RX|dZ*of?RE*D|*Ay{7
zc}J6Om2Oq{*Of6o(|HQ%Jhzbvgu7zYP9d${JuKZ})4+&$B`7Vvk-HekkbWd>T?+8!
zYw;^IB|Ixk)r_F_E;dTY4Q>2$2<nz}4%JkzJLq#L9o9bDOZ*gwly0368&7Z>*(9hG
zSs@gWP^fvOh@E(C5EAP|;d8fDy^>uhNUA~=q3YnahO~Q5KuEncl$MS}Ge2@4P*W2;
zDCj%BNoL+3UAq|{ilvSJoxX7s2{u7qEY9;>58n>b>XaI4o-bRyJZ5$D<AHu!`#zj9
ziNR?QiL5>rv^o$|>T?ln=GwQ3(I>PfJ8)@q=`UJ=r3P19>^LH!jM&&#gZQo>p%RWW
z{YkHdrwLB9UkwQJwRQr}g$*in)G#p5W!LDQ(sk6|TW+6%Dn<FMitu6J4P3_!vK;$6
z6^&N+S$2t3iRP9U$7e@>V8`KxXD<0iQ*FILD(~2#P{D^o(+;9FFaXr%MWLAN#4|Z5
zIguQuUm#S6<I57qAOM1XI2=3HKFSHf<0VrG?-nT@^3kd{WjHbBQ>TJ20h!t^Sg$sa
zi#2*kar;QKxeZ~*S2-*?&ELS4EAJADy~7R@5|#<I3YLGrLVqoEegYJt%<8T(EEe?_
zDrIAY{}R@k{HRKsc{Q{)^i`gY<*_YRU$mV7sUhU=M^lMFhR*&mWZ6b%e7oWXzI|Y~
zxsJ72d(M$LoF#B_gU+3=CrqAp>ajP4b(Kli(XkB}01LrC$|rP&IwqjbCv*57_|Gp7
zX%EEjqSO7Zd%tQQnRkOIBqDB!d#gI%6f!m!`ti`I^kZu`yO0rD1`7Vf<IS0FR;2hg
zHhLpSC&mFG1(qrh_xqYEw8lF<9sC|*jB;_Ly-7G6inTbxK6N@|QohroGO&xpP&btE
z^2}70@a+zm?E2iqaK|j#!PtVP<xly2CQ`MUm+^eR#s*m^>Fy6+DQ_Ahu&So~dU<RX
zG91jqV>#^W!c{zvR>e^>ki{!|6J`1V?KPaQOpOc6B7!f;_nFgIR<F4c7nqC%Wu9vW
z(?3WJ%`lE<^m-=lnI&S3p~fD5I~*KudkF0nM8xk=$J&QOZ9`!M#vNvGI~A@*XYxqE
zEHk+wvO_{)XcQTKt{fpHsKpl+H@MX&d?`3+Bp=F1#O{^k^py~<t0`=o-r*ANhjI3Q
zfj>g}0d=*Vd(E&MbWY0Pkw!BXTw`3^=Ie-JEcSf6=ILC$!UJj&6HCBG3lXFiAXlrc
zDp>b^X+a8Ayb~#wnjkXpgJcj}i9eVhOuk0ASM^MCBcZkysUFt8zC#w%7$cl`_lZXm
z^XGr6+B`}?GC6ljt{o<#!`fSz#wxOizg)gwGRJIX7eb(+5NQ-|P4Aqv2fp<=r}5t_
zs;#+=j4p@I-`h6(?`_ujmewqHnXy5F^rHCeGYX$9RI&?3E6fc2pEXT-CQjJd{|72T
z)xPoj@4qWtm_5Mct0s%Uo?Zvc8u712mc8*!h5>pU<lc7s_U+iee?LZ#9<2<y(c|FB
zpg3sTQ1gv+?%Y|u=DEM&6UWELD+NN^`1bn~jRC#rmX?-@QCc~G7CPf-fi#M<i>sVB
zJHtx^vZ=7qytyNOob#UgpTBeshV?&Fcm_0jRGn{ev}HC$I*w5S_x$OCgNj3C@bL>!
z?@X9_uwU#Luw$UX7%+2xf*4QaJ?DM%J$3EcRpn#iG&oaxL^}o=fB`ekD9=ioh+g~%
zQ>RW<ii4-0afTSw)cfe;!53;k6%UJI_QyQSr&q*>AAVTz?Wy?l`s=Ub&O7f^@`m<r
z<}lP9pBG0u)-Yl6+sr~UvHu#f*CP!~p5&mR7XzX|SXki*XCb>vHCsb?C7K?|&LB63
z91c@h^=2w1Mk$+om;9WASo6m!EMBr0KmG7E{@S&-dSuJf#bYK2pK=h+KleOz>D*o!
zCOr~wrq)c3^is2A4vS&RkgAF?-(;*5Lyf=wx)@)*@t&Mi*AA1exgG;AxBz|ooP&0e
zp%z|D-Fzh5Tuga<my);#Yu2p6A8S_QkCne;<(k^h*L$DU7w4aM9?lUDpuKzdLfgnN
z&AX*cjo_JeuM6~i!?Qa%N6JXUvZYI;FMh?h@4t%_eY{<3(qR{m0rzeF`t?Kap55W<
zOj!#Kgd>;7%vdJT&2d*;n1^+LuEDZpOR@0h1z53W6Qdjk7Y@G!g9Z*1BQxirXZNmf
z5&B%ufAyDlSZ4MY$AkehS1e!to63iZ?A(J8tX^oPk4-!k(8x>eoZ?1iQeSja!H9?m
z6_r~0=FpVh76uI(bWDw?uY7xW<1ygr<&FHjT=W}!F)kW(o=7i<@Q4*`XF3i*3OAG^
zBW)j+E&L7}cI=jzu3|x0EVEmLdKl?IasoPvJKmi;mg0wn%W>U=;bP%frl=#$oYpd{
z-xvbU_N^Ibw(pwa-nO+zli!J~E9<AGeN7|i>PiFZA`*_KJvGzR);`8LUj4zmYb*13
zmd7&faP$~378J?!D=5%{er63g`dsZP?HH(z0W&XflT3>rdqjAcaQEGJW74EaC$-|B
znZH`LY>BaB$70^RdDeN32Z$6{adviA?@Zk4tv_|1%(9;^1`2+n{G@vb3QN)zDM03b
zgm{997q1WR&ixTrjT;U}2eH0l+4!=Rh8fb(7MpQ#SbU*9j&*%MEYAkKF!ed!{pc$e
zXtJ}iaOwETI9t37l`AVXHCwES1(IRqa=4MYHxVDb`HooAih)N^8#K>KMPZp7%2+lV
z@v*zmxnq0G|KJ7uCf1iPI=8nqtN~507RBJf`ton;4{P~#-e`ei+u-BfcQtWyqRUfl
zJ<k16vyCkCc(>EG4^NhR((Igx;zU@VhIQz9)_^gzV7@=|-u`RHKvQ6Vj3pX(qT(R`
z`Tc$H!3P*ROgs(-QW2p_d7-iE?y=VIw9`&gS)`<-fY#Iq-+c3p5~iickAKTIL8UNP
z**mRSwOsxc8X9zoY8Q=Wm4_@A2qlSwqj-IScoWu2D~ndH*Piu+scibz;FOl0=PcQQ
zh<5Ff7`t1Ii)PLqa43jVWzV>Ino=G-Bs2vNEI4jR*D*a0G2FZZG2`BclmcP7v!_;+
zl9Xx5$zl+~AHRI^3Su9;3q9M1sWc60P#uvrZ&;&3+WR<TcbYya@o5pFlm}hUx)@U~
zAFIL-@o+^+Yib&Z%yfF12#)NGXTE$F7md3X0V1H9p0i8E-=Cos`JVpdJKR2P5?c9*
z$21D7N@z-g#>3`K+GDIrV7c5idZbbwEH6JKcqN-v(^$k!Sy`E~N*WRzs$w@2B|rm}
z78*C7ia_#GP->Ej{$QzCHWVQo0rJ}jm6Cs%Md0_3HGksFu93>}t_qZkVcygFqLaH1
zZhHKEbl<cazT)|f@0dB23uztP-Rdb!C~(11c}YGNE%;VtRhUP0K@Ab%g4fs>JpKBo
zN_ntCa4HF^(b47*Yvh<KaMSl+;I+BGA}pi@l2Ua2%N@01=E~LUl>(t^rzxOOzY0q#
zMUi;OBM`>~jXLS6$};urB8sgi3@nF!vD>w<@w#>E4=Z})(821PICO{yejHI6I41dy
z^IJrClzQ3RSzB^9arj%5r`xMXvTaE1_aR}CN_lYj<lAwDc+@1YpV-&t+pVbJx9o($
zBQ8M~%)quineg{=!$DP+#w*hmSd@Sjjs@Rp?l@G0<x75IFiPaWiNJ72S5G+QB&p|@
zpLtv<4|2{h<uZWdlyk`7iznjqw^A@sycp7e3HKm}Lql79c*?3boU63qpd?Z9eDC`;
zXw$YmlJ}5zEg)?Qk8Gz598Q`32yVD)oO;dqg9o}CuN-Hrx4Tau?tSP9?AW*hUoPE+
z(BMGqO|7nAsS;b}0DZ4<Qz2t^<MJ=ntMwZWKa?BXzmEzt{bbUrvZXtykk`KRKv5uE
zA_|2vu~YF`<_1U0cqtJhezw4L{MY?m)t@Gg;vMsW@#Kg6c@v9m)=H0u@Y}LQDoI5t
zeGO_{go}5|xVTu{H1k;urShQQm(!Vp9D15eIB!wG{G5R!@YFrm;l5|yLObz{8XK3W
z@+mCVR#X=){T-u3fzV0PN)_}xsA8OY7lZGOqPWd}8fM@-!l+T=eN@(UwWg?b>C|hV
zy~cJ7{F5+X=0<*_5fKrJo-&Gq^oTxX$`o*4ay&f_8ho-Y1X{2@PlQhvEm~xqJ6?L}
zCD0%qjq#c}#-y|V+A+{j445$%*}e<Lo*#vIzwJbuR(|5WSUd$<GNI?{O5x8F`kbk~
zJ#hsy;VPh(i~5%2ecuZ&#hiCv#Dr_73!T*wEt{1o!xY?s6w4XF?%mn&^b(K6KHiEh
ztdM<8*1-(yj?o4km~}JpW)$5v3I%c7v0bFX=KQ!6=l1R>W4~(e%6K&)BD$k`b+EFz
z7~+t<OQNVATGn5d;UTgPK`mN}hwvD*J<DI(q+7+hb6s|J_r()0ekio^6udEa5u!VG
zMy1d_aq$VLC@WUVgPz`g2n_I3Uf7wYxTrw(p4uo33-|I1LU>3kY~Cy;XWI3{@1MVh
zRy3e2aTV=cv(onGe?11woSvGRs(4;h>@slX8E2~X$3A`xM(n@GiUAr(FnnN+xuHXc
z;`ZBb$9W<Q>h9*Qvgdf?ym+$BSu_+(pwgf*y1Qx9rhk;tUDd!-^g?3;#v@Br6CB{A
zJiydPMF^io_%51XNnSt^a+R@Rol}&>pzZJhXJOH*jTm%JPqnUUUPV=Df8U+n>yu6)
z@0UPB2zIbzz>a~V$AH<laGob{P2$-(!K?x5!G5u0pouVG__iLxYbPJq@P#H%o{a0R
zyAJd?cp~^hN822;Ul=f8fKni2K2#vg6pvzm{PBnVyE$6Ko<!-W@J9#`o<>jk-4suw
zxNa7sxD2t-9z3_L1I##K@T#Rh<KdZiVDai5*4V9s+rUFS&G9Uq-$a=xChZgbj_<#k
zqy8E3=Knm58MoYkwxO+*u_>9L>*W_&3uwfRscYq-5`6#l99%MfO10E&Lc`>Y#Z@Un
zk_MwJMWV=-e*E5>>YtIHnEg7gyLu7=eJtnuQrEh`lvgAMq~?75KCZdx&T3I<*t3Pd
zk7XVZSqM4H&B@BZhBYhI|BIH`Gwyo?S6?ME$sJ_xA~>w96wXsEq_E)wFxekVf5P-@
zhvCoosv<+F#4Kk>W>2QtSX?XyqZ6^<`>)hLV_!DqCft3;Z8*JK2TOURrE4ir;xZ2!
z>|p4Ybt^IJ(FgFwkIUpqLtx8b_;|U)NzQCJo=Deb>`%qQ`QNI4#+o?wR@`^j3~67a
zM4|jB+gE#eI#>I(sW4#14825t_~C~tTb{Yo*utfkUTT#uJl6g=Aqs?M)}T;7EjPaT
z=9@B@^dz=q$r9Xn<BiJty=in)A<>@C(PJP;lo+T$*yp?paqoX_Zcs)PmdeX{7^_z-
z!O%-4i1Hvr_{3F&Ps9bUrN7g%wP4A|Uw()2qlRcph7#70flMX@M-AiF7N3(Ii>WKT
zL5*mFNF2vzeAiVME<yy=4z}kQ%B@+RWXiv4P%}<#_^Xzno(J3d*OgaQnYzDf)~TK%
z4huH<)rC_NuG@cXI6bUz`-?_nfc-(DhGS**>eVVe-z6m_sl#x3J0a9HepI0SV#h!u
zFhB)60<9+!s5p4}<(Gp>7-pPtJo4TU+$!QpaABSJeefWM!Xi{4WF1{xT=2;!pJ3Lk
zS;`VN<CwOb1l4YI6<B|6Itb;ZTENlK)d>{^TA<m>H%KWDqRsgjHn_hi4^qI?BBZKP
z)qi0bx*W||JQBVdvX<3eqLd-^l6{e^-@5NqJj=6fnT@GW?Pb;Vw#GtVBU&q=<ETJ5
z{Ni!A=5j4GTqDY1kB7=i@$jRMVabATF!36p{d|JqTDTv@79~O^$Scvzhwpw`j6tG6
zs02Ob{gG=!GO(&&h#y-VnTpg$=b3oN``5Ov{0?i<FSg-zwWTq2tUo{EPUBFGI1#R`
z58p>Bzj}FWU+uZs_6Lzrd#odsR6VS|@6FV!DR5f7<dgTw;NBdD@HsC}@0IL^7Ea!N
z`zO?lhi()YA)P^Qe-s>{5d(txR!=moWXcN-4OK$2Pd@o1$UlmVjKte-zl~dNxdq+3
zcUS9)`F8#ZeNk5%*v4Y9L{CA*06%XlZBti#3S8s~|AvZQ1kTyb#H*RJLn*TJ!|=p&
z|G~uZV-P9KeYL1q6rOZsJ;TTB&`O5R&1BtSfGj?3f?FXmJ{H&9`8Ya9bN@yKG_9D$
zdE0<dh>Gsq6H`a`#XH}uM0lH)NKB?cs3<A9QZe<QD2^m41wxaqvA<eKq#Ro|Y6Y!w
z5$H4!Bm$Z_BJ=w6^^*`J2Pnjes;f;si5cp*5KiyY4{halXG|WvT$%}uQ-K0;+Z-Jc
zfS4^mBYEEeQ6P+z6goloa|SDg5FQxXww=uMR&Byno{9;tqU$v5M~?0C;yf%|q?N5`
z-Oqp(gVemK6)csthE*ayAsK<5!1SpTkbNK(!!H_ywowuA^YJ=tk8|;aDY$roHE|s`
zx{QO8*N>lzqL5>2p&<_{`oPiI9p!m?Obs90Po<}~Hqz*}Xl4H^B|;ZZIncREDG<7P
zQUO>CAr}^Dx_|A)%_u%}Ib5CeLDW%w%c{B+C@L$^^$|WG!HPjsF{$T?0yCyYTyZn{
zUOYt|v{a3eN*pSuf*MB~_a`!<Z0hD9O1?5gaB!a-$o=q{ij$Y6@unUu7t<`;cSpMS
z@^DeXlP(*r6n{Cln{Sr^tU@!3lBJJdATFFT4BI|f0B_&c76rnp+_fPR%QGt?i4Ugl
z$D%jq$;(!9FA8+>j%^NW6D;%4ZanbZTj(xx20a;?Lw1uR>%sc)+ZZ|aN?i2n-T3*h
z81bs-E?)JtlA4KY`TVSpM|Z=~p~pk)F3l_OY%cY+X66W&W_m7}Hf16tNR4NGV5TEk
zzh#+M+<byCW9HMMKq$Bs#c9;4Kxoap>PD1@|1<js+$L_`&A~4N6)#&n`bCH`B0ntR
z#deICe%rPEFT6N+2^<1KaUh*Oc??*_dR2o|0P`^8ko|o)n3tAWPCe>-rem7ItW2z4
z_LWMSCj$5yh_5nrJ9gAig;^?Qa~|OEFu?I;l#7Rqyi_R=Iyh@(V#dj`cuf3Z#h-Xw
zlp%TWt-oYbFO$=$@k^Ys?>M%<`by)B>qD^|@DgYp)(&<I*fH?;W5CRf{AME}BGeic
z8>^LouD$kJWnG>g2hG~WZ`!N@$FufkUF_Yvx3w4=7-HSx;^LG7p*6sMW5+-vF~BiQ
zfp*d@!^d1L3WN{BzeO-Anq^sN4mp!>7h{YuJ280TO=ut4@N+x!O_6XIf6cA%@btmR
z@mH%FhJ;1H%iRSf#U&^dg}b7{VjMh}spu1~nU10`*wV*eJUqC;Mb35dvs18Zho;qj
zSh5NuE;vWgMuv{7*=*9)q&-@Ob->53J%vd(-6uOvATp}0<R?a3B+z)1r{{PfQ{nFH
z#HuPF*<#jiAHm0q;tjgzS+C%RJ04Ww;gXN5C_t1H7oo7Q5Sba`UC1&gIEhiF5INs;
zb9EEizZrIlm*&lxX&5qo8eV_?2}Fu974u!|((G3|25QHE@owTHUdbu^NH89DYENN*
zYsWytF~B*Fuw}~@^*e0XFx-6e&EiGkd}X+RFU`DW;;M)z!G-G!p;fC^xa_ja@WmHj
zsP%*ImM>qfXg2b-_1@Jou`|#PCjkZ=l=1@C$0LI%8ag!>1A49~m9;ie1fva0f&CvR
z25no1MZp7c7~JQ2B&97BBUL^!X1Vva_xX`=YY(+!;MBu_na@cNtq^Zh1o9Q>F?Za!
zacJGTwR&gP2lZgT*fDU77%+TyLn}?0G6m!foq6V&%D6wXKUrxd*3Enm+&}RAeDmhb
zh=_<_5I+0tGv#fX%8};#QUUhMsf7Ux$>Sv6-#nwG>M{9nbn>WbgN0^x5_+mOpu899
z{L1nYy#MM8xc2s$Dq5E=T|@?<5ZT#TNKZ?}zH)ueYVvRuUPnl)Kv698P)3ViefCkj
z`s{P~ZQY+Z@3byfB|;PbsD5jZbB2dfkduLDAG;5az3>juJP=)?gTzryKC<N8IyHH3
zb%PDkeh*JC1o#VY$-^CGMR~Y?#*O&ur(ZGW?N<;T*0N6Cj43Zi&f4w}xq|n;S&G0m
z5eV{jLy^d56tc|h9PHhz4G)_(HW#niErMFge#!%`vL7iF<-^%eJ)-`<S+oL|43cvo
zb#7gq7OwgZD=_z+S1@7Pbd_b-u3bbwN6Hd@S#r`|u?yWy86_rqsLV-Y8!qe*Q4Xeu
z)aG)&{>2BcssFEj{tcH7InPpF4TMU1U8b(b4|CrWd4X$Hne2b^y7F>!#o%z7I1JM=
zpej%<^bQ^zLd8-kPwMlz)R+I?FJ6g}1N&%Wq(Zn`hM!4h|2+;EFym(Z`t_ibzV_|g
zTjzc%5H^+3(i5UU$m3^zcszKaU_2EFIYH4%#KMIO)gcH4{7s{e13v9pHWCBu3j!?$
zt2;Hh9X{FEW=qS}zW#x@Xw-OY_}ve^&m96Mzt(78n1C`7nBmNkCzj5`TRPzPuiq9c
z%@4z;ZAiWSt_d;`ppY?Rt%209)MCwtL=n9xR0(V8NsvuA(F_E$z!*Z!;E)!@39Mst
zIdrgP#4!zVW1B`ruJ2+w0AXG=(;8(;W?{l@<Ct*Udem1O!%h2a(@`+5OthQLn4yq}
zvmDT{ys9#_2PxZh4JnUtOup6g(+i~@rPBX3%d^2vL(8$pYg!DL`JBSZ|NGzns*MK<
zDbqt7MN_NBNYj>Y&+Xrb0V<~w?!EV3Oq@7Tc^ow3tG2o8WW$j8W{j{1>l`K)Mq*-O
z)B#U;c=*Xy<wn;>&*P3NT{B1h%dMzc+nt1tAhc~20B6hLLSxnq)6b^gnOCVW8tJ~9
z9wZ2)Rj6$0B3@T)^Jdy=bcTvu*G1Mh3jbPyZOgMw!L?S?CMG8LZqj0vw(6a2nx?w9
zi2f_)D)UtBlXdw>;Ka>t%hs51^-bcb#tlQqU4zy_t0(N)V?DSzkfANTy|M5&Jap$x
zXf49}vQR5Jrmnne>lfmIv;)D=Mz;7@c&bK6)RlYFz2`T`rqmSdJ|y&}u^h?049AUa
zpEqvoRMl6}Vls*-Kx~^IV=zww-|K&UuU^W<^k>a<CcLiS+WLY*;ifN`j^7Ar)oT55
z40M&jkL~xywwINe{x@`d6&`H+qOP`_>hH~*pP!$P1q&9a<`7q;o36Ox3WS7&sCSL+
z<5L|k_WB=R3~-DQNQXcD^wStJWQbK5)r8r8tH-xChv&{Zu>6rDM}i83JiMV5Edsp|
z@&JVEulars&*7i*hHWGih$pzhe7*J_sdc9ROdO`>`YQ5~qG(l&@Te$J>}jQfxu#Vq
zubBPVA?)6zEe=+Q=Q{(gt|E9TaDLyjp{X>^)h5*TSHE;}^Tt_y`zr-PS2v*%Km|fk
zA=E<;yW`^I>0DL5SzA?v23&{}*1NPI2V4GHr&1JKaU<*2A+30HTCeUZ%+Q)OD{SV~
zfR-V+_^OLA`@^3R7~B$hds){qIJ$`v4>FOMl8VziN2=s3yQNrR<o}Vtd_SZeO2k-3
zjvQzt#O=YCpT3V5-}($~L_sz_aqr<-)WE6gKPOl52&&67G_p!qA=dx$n<2QR7akEy
zk&noE&*^;z;KD%z(6dK(w2y8lYe+Ese0{}YWL3s$j0paS!`i-~wEZbalmbG-J+MDv
zzl!4*7$A5kz<}{LAu>#_OWLC&$5-`cn8ViS4xLm$Ua@%dkb{geIe5wwVPV3&)f@1V
z9E1e>c`DknMiwg0kuQ=$A*Y!rAyV0>I(=k$p?<8ytA08m*YK!z2(PCkGe&suQ(PiK
z)EVM=WydzW^~y8&@sA{gwh6)BWLxF1dNQmnxS2B!<t3<)j_spri=o~b{5yyTJHH?;
zgyAT{TQ$LaGkmYmFTXrgq#AE%q$g4n(}bcGI@+N*94oY9=imY7GP=B#IYZr5zYq@;
z`ttB=g-JI)gP(7>2R>4Vw46QFBU<Ld>MtArq&(wEvbfltDshE)UpLTFgui$1NkpH~
zQ_-b;q<U@o$;2_ghR59fw6ifprkY<i??iBb2U0V2yG=aXUxPn-AMMboi)~P?_ZnZq
z^DZfsgUUjrA4tPr8`fgh-IG=PmdM3^meT_X002M$Nkl<ZG4OI2)Q0H8BGvMumUL#0
z$dtpwZ&s$kJv0(IsR`=C_w;Xx-LZ*4R6lf#*5k{3|8>m^^zaxeMaLwHV!X2h@=Gg`
zdoT;({y^f&uaPGAR3J3v)>6xp{*|fwwr$(+>Z`9R15oUH()QD*Pq$ipHsj%>Z;-u$
zb`1POF~Dz?yjJoBjp87!%1@ax1ymg586$yo6TjEG)`R1P9(o5NaPBZXfj|HJ6K9`&
zwyMwZD%YOxzW@WIsbox_)wiE&?B*@oYBV}kJ&zi8Av|3i75|!i!G-|86}=8N!-&hK
zAhvsNy!ZASc=CnU4@*v3lfp-ZBB;bF<%+P9EzErM8C)}E6556dZ7LBI?J4=!4t%d-
z;EL;Jz{@`vvmU!2>$caRCv6fZr2eL8P@7lkJLfm=;^BkqXFPyD=MTa=Z@rF}-}=Zl
z+F|!J+-HTb?s$9F0~kMc6ujJ=)f{r7=MQUL>^CPp2Kc?0@$uVlzp46i48{q+gliOK
zr|e+IKvQ7AD5Z`bJz5#~r%@9M0Tcc%TBo7yGHVN!1nE_W3WWS_=#}})FTYeqcPTt+
z_F)ap*B<ZqVt_`nL_!^DqVUsL2n&xudTOHZv3X7_>$|M~`;y|&sY_Sv*!CwrnfC+k
zyXi{dYc@7#dwe?v>=-x|Fkt3$%6n1qiOvWN53PUy{z^ce#=Q-X_f%+;y^be81}LLJ
zpwi&gS6{6Z2mfxqP-C!W=p{ctKSk@&Py}fw8l?K^r=MWFHk<FOF?rkLo*WpkkVGh!
zGuBlxQYY6oqWH(NYz<Dd_9_tBHcb86_O-ef`kBguFV4CTcRVs1ox62M&Vjw)8HNFG
z-vG1-@DrUL%?m0lED*lrKBOd9on^Q0*crQbZpZnjcg4z0JJF{{hbHBF7)8f|oCBCK
zbv)jlw+!97cSE8Wl-Rc27`6mjw4%2>59KY9x(fNZS=e_V69xIkaIYh}NE<gS{1WYl
zWFYR>FA>=~;IO(9H{4s473Jc=>DMad!CpPPW1A@9W+WTT0QAo2>FKV{KZQ7zfJ&uU
zn3A$j&h0Gmg#K;Uz9Sq8c4GA4^8`P;1V8N$FH@p3hXr4}uapNnck79q{qfkkRriI5
z7}#nT-5Ny&c}Pyxv~*B#2z;gdtn@Ubq*PTbqHQ!>%F{6BqVuur&#mZpMwi3OGlNI!
z{Q29nart$3BC>sFR2Jt{>wkAoZ?p+&0cVj9BwnakO1^ZeO?i>+L}{%c1{V+Ni*FaN
z!l;4ga6>5#Y8c<pf+_n?BQapcDP^UM(Nga5Y2=L1w{PD@=2&-hEdx|{c$0_p>eWl-
zNeishf+X+|#MVQQdTGD>tr)1<dmCX7IRuc6de!^ds;8C2I6?I4I|xtSa~)<r^A@5a
zLJ^lB3yVxN<sziv>?vXcX-P;=7Y4g15Y`D2UkSI#q)kXq+lQTEfpGiw9Y{<{lnE<M
zgptaH0CGcX5wZ=Bh(zbkozbyFdj$IXlCPj9NLvBuI?Fo70DiOt&GfAlt?&fw*uD)r
zckWhoO_K$SG2Glem1V-Hw(UTT?&x-H;VqLrfy_F?G*&N;a8cz+1C{Vs#UV9ulexTS
zPaM+H4&Y!`wh{)X(4eQ6Hv$3!5g8e&2*t3lP<V*-0pf=O++3o}=Bw@^t1AE|C&goj
z^u^AdyAU6jAd6S32*{O5{l)5mj~~LNj4)AlX&>DI(G*~79VB7;Ac<wvU!JasEl#pB
z(?zIpr|SRs_;~CUfxc1^K5tG-m12R6{ojfG-?0N)2L)Pi!v(7$?W?=x_K;)40Ii%5
zxJfbn&O>j4eUq=yV81j01~?~<88b!+Y8g6%*`Dl&Ahu06-v<vpcnGpfEZ3UD!ez^r
zVfgUjYK>r9O<ddbC;L4&eN_DCud`T4q4i;cgS1Dlpt`^Ku24MT6$zbK;n7^p^K38I
z7b-Q?26_$Ff<2Yxhme>MhizN8Vzc~n!?jNiD+;ANi6LGd-9$;Qm0B;lh&7jPVv(t>
z2-Q=-nHxSX=XK+kH5H>6Ld&G3r72-}uB8UJrqX&cz5hup$w%iIvvZqxtl6Xl#`mZ0
zML>8D+<EIXxH%t#_Z5XTo5D>ctiL+U#Ncn;?b3;eN3}T@g^j@@#$fV@*YMGg>kt~;
zLX1A7OPhd_!hA#t=@z$czF6GJRSJX}XV!wPH!44QGPF^O&~Aoypf$<;2QoBmBnk$>
zA}n1+8?}>-f8%K*Yr#ixW9SX`XJLM>2$Jo__HEl0U6r&q8TsNN!%>t6{R3O5gZvI1
zI|<F%3E`n_tnEAU*r{GAYkBgzATLL(YbGF06g3k>sURaW6S*Q>PoPq#pPxTkwGLMF
zRAgk7SlJ^@rD<c6kBWSRi)~+2mY0b@!XD|19YR;_miu_@6WWnVw#`I&&`*qkgolSA
zA|eveG9R@Qp@pD8KQ(^ToGN9Tadm_u72Pkqd~00~>=R4kqMWjQ`%dwm6pvK#?4&Fv
z2_4V=j}*^5ojP|Bt2ylu=;tHloj5xFi0wE|f$S50lceA0&!4a6d(*E22M$yW-iG$?
zajK#{+kYSicyK_&9^=Q4N1*Hv3F^C+v1rEM-`Q-lPW9~B6B8y(z??aAl;A9lC_M7W
zBkEm;4#Jd{_147wJL`Kq%VzsHPk4z3LO)+GbzieQ6GzcVG^iu-)6-Irm0PIrb4U~i
zb1R$?<a-cTjv0o}ueb?sz4VkQyLd~#lR3^ZNFRuTpD=_IV>OeytVFLtEH6Wt(u5U@
ze?V5^R#E;gs}uLktGSZ{*8i#Ze;Hyt%D^Fu24P}KI?CmxI@2Iobret_9yE9SKo9q=
zk)N+Q^bX=Rk(T)g-+u8i)-Cn7@I&fav4lrZS%z(inJP_YR+ZptMTK5t_odN)1t~vG
zL#ee?8p&_Qc%`9twM=Oznd$rY?L%^MG7cO#AUu*d;REf(FN+qdJb0mZ&Aof2jzl<-
zRTr@Dr3~`1dYyKLiskCzrG8DH%a@DP1Nn%IYAfwHgmtTys(+JZSf`#CHn2ZVJFU0k
zwRUVD4KEMPe>LB{iEDn-_i3SF7ZK<!;{q;_FV-gs1^Z+1zn7jDB~od>JlBR*;)k?S
zc7|4d+n<^O2g!#`rM1QoL2Jt9O~?@sb5tO-4n9>vV=k<l1KeD+(3_^Wb)8i0<gkWN
zE&@v@8i-qh?HDPSeGSJ%s^Hg*ku*^Vi;LZ(#>216S6HjrCZx4e9<1tTYfz(ZT!inK
zm@MPB#aZwd52gw@?rH&zP5B;VuhkexO_8xI;M!a(0x}<OSyy7>r2jh&Ks$@)8a3Wk
z%-Sxx^e)}?IYC*aqxL{wThzwBW7ZbnEx+mt@mje{lr;%uWqL2ldoOoarRsc9|32_>
z6U7k@+B)zhm{R)}55E=|F#LK^Abb-ZJ}pG&xPV#J3mhA2E|HkV!(mBrp$ONd$)0te
z@OD#>qUMuS*@wg<DKQSK)=*VbLy(^r_Gi|wRBqxo=+_2UHRET=SS7S_X^war1{5eQ
z$X37Mu6cOpjaT3yn(CzKIc{qL+sge#aegM8=;$~t5hZ5dEo+pUuP8|$OcrlMa=;r|
zGxe$UZ0INowi5Vk){3!X$141=|4qD8t9AC;+A(nIV}SD!X)#w<SM1)sTQ%s$8*jvv
zDN}@AI!zfa;Y)s}oX<}5w`%543Q5wS(5Ih%s_MczegFOUxaOK`l&2uJ!^CBn9qbrr
zC<crHndok3Aa?gIa;?=^;+T>fMc<Pz*vc48sbyV1Qdu0A%!|}Q+m7Aw#D8DGHP_#Y
zO&d30y;#UzzkVGSF8NK#2MFul0`9nQ=s=t%%DcUL_d+k>1GE)c0)qM$8^C`w<vKXJ
zVAS}@xM0W##b-;Fv*Vn+Jn;l9=K;c>r*|V~5r%8->J4|&djhtU3%_}FRxWY7iJ^$u
zul2@Fx7{h$z1L&idR_lN*Zzs35>4;7>(~`%oN>C;xfgn$ej2*V8AA(^Ng&wQdxZx3
z<p>xsb2-nKo_+RN6;pkSa>q5GMGM(q2-xR)g$DcO7%<RMJY!JMkVc)2Oy1u`>l{rp
z%(p@#4+IKM`iikE@>n)*+^D=S98JFVG{*-6ZXUiO@GSg-(7ssp)vIV7=xsgUKdeM9
z!a_F`i-%(J50@?e2~R%%D&W})Zo;9V5+TDm5AI3a56+4+Z+;3BE**}@R(`V9YQFYi
z`PTA6&94?3rIuh-#>q0@vaV)5s99H4M+?nXGwf)eby=EsTU#D1vq^EI`l0UfScfJr
zQ}V12uT9#<+7M}f*C-5dekXW&d0D+PpK-<+>K%6*dgr1Z?H4-+ju`_q;<R}2V)X0R
z&&tO=m1rd*fO8z@G0K(@sEc8MMi(fXOXGhgo(Z%6{yiArJVwxK@R94lIGW}Gwr|;>
z&Su+%xd~54pVL=5IH96gpW$}v*k0!=SHtUINxc8+qc@fEV0YnPY~8fcddABcHL7it
zl2Oae)@S7^6S+i)+*VO;I?^(86_1q4gJDt8NQ#R=-(k~`u;F`g9_8C8n#|;F{k2q3
zjZNXnprTY19cL=#K^n{5^q0sQ$k--0I=hRJ+twn(w+HDp>{L(|ec#>$6qFp2x>jJ@
zmd$A2sjC=nU5Z=odjfObcotr+S~<?F`GQ)N_2M7D#4Dfuf}Xv4DtS&F&WbrADk@CL
z(Wwg5xP(VUAT>#xX;CFXFdDmiCnBReO01oD?$vkk`D@RJ5!@<SP{Sum+Pw+G$4`ZO
zL`P)AZ^ME7GL^GWU@PQg>_<$FmP_Ev=5l0vK<H#G1tBDM8=fEUQ~i;!CkAaI+DWWj
z-1^WnSU&F^_<1;2`_9=$8s1nw{|lu&*r{6&B=6pWJmG7RM@W5~NRgAJJVU(5N7_P2
zScEd#oSb?<l@~9vlYYTs?5Jgucv$R%4LcLit3$Y*|7DA`<8W{0?X4pBOlN%@>)aEk
zr>En=2OmU)j6*_GoMY53iLJ74+Kc%JS@}yYxdh*S`>hg`WGOrZx%~3WmDMBD_@*u0
zo?BC3K<1TtfQM@`$;d$)l?cx~`#g#NmQ3VYP>G4H6TjS-+X!qh%oZ4r(=7Abm$V1-
zzMP9k@48>?z}F9<UCzXeo2KE?OD;xua1aYsORyP(_2<yI7-phps$JVQ;<JxG#$(US
zZcrxYUwARDo-!FDhYdl1k62+R?&>)hsVc7m8`rGF=bwFw=U#rZLFF;huuI0{($S+Z
za6o@Vgtk`cj`ZEx_C;z!3_kkcUEC*@AR7*jc;Ini>RdL~YR&sd<uPA|a|Cdb%Szve
zZ@&5hFFku7Hpdq=px8(}^3*N3Y}^=hY8$TNSNF2efGq4$jtK+oJ$>j_iC=&HRpnJK
z2axonMljZNkJmS;3b9}Q6&NsMhyw9<-g&3B&73D0))a)2HPhpLV_9UWJV@);vu4dw
zZD8A;fBt!8wVr|`_06BhyPA#7-v~hGq$lC7J7=Jv(hIK6j>xlYLMw7oQ7nSbT=w&_
z_4a3f%tlPV?Pj>U(A%4nYyuN8aP)PUaou<+UegDr9#v~1uw}z)eDL18c;VG|OmKsK
zCtrU%uDkYX^gW}8+9=xQX`6w;eMx>cZoDWI-)*%G)%OD?-G=YPf{T|+Gvs9*z?-kU
zfV&^AzGj9Gyc*MQo_cuV<MF0`;>}trzZnN%AaTuf6oHEV7mQE}gl_H>T2CigCd8Y3
zTh4sWQ;L*2arHjoJJat>60_qkeD=x5c;w0Fb@Y0!eFhE}Ytxf)@$jK&AwseZp^fUv
z@`%Bvze|hqvGAuK@a7w@<HtoSj+n*--h9V>xP0Px^f~>=W5>kj_|>Ey$45Hm|M0CE
zv%f4~Qx)Zicg-;UKQl2xaC6R?XTV)NLz(*5mCTG=_QkF(>+$v*ui^RE-m5G6;qN25
z<M}&p!I(=&HJGkunf#c@lt@n4jX6TA-hKaLhv!|(n}}{_<Mtb;Vyw`rZCVA&+#rJ1
zGWg7VUrUlx@|9`N>eW<&5hjp$I-r6D!5oUK2m8g2fhNF!p@%3Od*+#EsvJ3Y5KNeQ
z_?s{ME?6%L_Fi?>RZ4-7ma$D;=gysrhaP&!y3a7*(cfI{<5E25QBN;V<O;Kx|BZo&
z@KB|YPW)7si}F&o1G@L<iTR(thUs2D`0(W?;MQCVc$$1^v25R-SoK&|P^DOtnQ>5z
z5&7fY*IqVJ8}u9C?}N;PRZ1=uqG(6RO+P5iO<}!@qM<DC4a&<zQfrGm6o_TDKjpWX
z9F&wK>wKxmS18$edkWqB)GU*vLBC!euE@==;xj10QI;b{nG|pV6;Sw;<&6p<q#4$(
zS&c=D7UG*PKf~r2QJSg)+C@hzW_*5@R;Xllq@0cf(sc^X6z>;<<=kh{maXXCr6V?P
z)85l`UCM>Azeg$O1hfc(w~QAT@uov%r1%}1@P_;w=s$Ecre1RuE*d;Y_)Z>*w$f`W
zW9Y)NEdAx+P*poxI&}5$#GlI-s(+JTeZP*P+*e*wU~OlG7@KkqmeY>pbd-p)>ahT8
z#~S<ixT|c;JYZ_=;NYU(XXX{C-($I$F;`a}rfd_gpB-e3kj~4%%HLPumxVv$rT@KU
z#f6D$ew&Hc&UV6=;~35mFOW?EPU3-3wcbAfE*8Z=%aA%Od;Q*E@37!%FLW%OB0o>h
zOQJq#Z5tKwc+527%-&)ZQ<Ovn>MB<SS}sAYwPCsVtRk74MA@uNf7d#=AvxIQX1TXb
zW}!<Dl@`mql&B(<AF4V?SNd%7HYz+qg&mQ9$az)rqgDO39XhM{juvlK>Y<(s$B0>X
z52Pkx*|MehS*!uS|H<4sQw9ir0=+$PNR&}i_a>=$Y+l29t<G$#0&H<r^;X^G<Y>#S
z%`BE|`La~z7$;{}ByQh;hh}c5k>W^?PH<{Q&*$XTNc~00*FokiLXpMV^N~`Y%wc9f
z#)CZaacKB}3imXAM?+VnzX&zwjFY)d_PW_I@K3`4t+B6Lw@x+d`s=S(mgTwcHXc;@
z9ox>)C%XMCn{}XP#KD6HD+NNX7ZDK=Sh8e^I#Z#+JiP`TVd6f~6}Ojn>R>=GzG@9`
z8?6P)>Z<(Fjx&y9j!wNU3a!+>llmVs{&M7tGG9SKp%P|Pw3g7QRO)kg_kfqDHVk6w
zW7bvkT;DItWt~YIdHMRIM{oWgIh7_4tA9({Fo{J#&(Rqjx^!3n6RwzyJgI+)co08y
zNaz=leP}KQd^}{I<m#en8J4E^kyW(bk!xTNwPQfevbJndXrMt+j$^`k=TWZ4d`C2c
zVh1}08jk@pFOC^I=A@x@8sCbl{SyTx$<L-kf+!JkCH(TsFSzv5OVydm(XLxZQzv_x
z+A+W>%&EDn4s7m;j-rs^=UKHz)}Bhg?bf{~246HB{m<)*3op4GzG0Cl-5W24!ML_o
zqBK7Pfg%*2E`sY@w(SxHLK-ROs$YE_uUQ7^34-FmSZI`*am;hIxaQ>v`_;4u+e5iX
zvmVq{ysoQ`TUVSTy;n372_XT^pJJJHr?AGCNX8&V-LY#AQD?kTB+DbUc%<@}gDI1^
zs1F~tmuQ=Zlvz(cO;KK5^{~Hh7zWq}93SMRaegOIKt4{C8n|zdmh%<D(T)d|*nY8N
zpaupw?yeQjgJxWDe&xNM8*4;9i62e<`JK#|F$1$_&sMx?(o8SC^pa|0w{G3k+-l;U
z#LfAKR?RH5RpYB6<4li7AT?nJ9-Dc&!cBgr)}G_|Z6S`9ViOZEV#*A3uy`Oeea!L9
zGUB(d!?<g1N6WUIkSJ%yGRh?%@=qKQ8Qxkc4|YAPKdu-%60JlQpjf;QZv69iy!GK6
zRbE(|U?e4{s=TN?*uGO2QOsL`7vA^)FFZV5JOOge<@|i~UB|Yt-oG#W9uNHYU3Bfy
zLzD;qQbu+uC+I9jD*PR?mGa=w(c^L9fb-xhUI_C=c4GPB1(^5a60vj|B*v5rL>{6*
z>gphM+$tUnyJNwJv+>!G3vm6!5!Q;5E+KA8@-p$k>rbhQ9~8rvYy|5<<-s;BU6u0S
zrI%kL<@H5?ua7c_l_N5)YgR7Dd!KwM!d>2QcF04i5Us3#d`!HY^*Z6(x1UA)ebdn?
zQqFx9ZX{gFBi_IM>;qL^gv%jpw<r(#wP>yMBGBn<%zg3!bnnz&&cD5sQPkX=Z1McK
z1+!<}izVygtV)E;Bsn2g99MP3mY+YynvK(O(Yd{?-#PKdHfE&6V%&%cQr9r#?Tb~)
zgX}Bv<=VE5RL&G2vVf0HyBwjdTPi)C?VHzQ_N#BJdPYTv5@kY?$}3CGGkvKfnYI%%
zpL`MX-hN(;i&iN~ss#2+lVN~k(aaOyeDjSpUvri*a^y($&V1|E2uFEyLKO&EX?J&b
zW$B0tgls6i>-_lRkIM3+{Sf3Rd+{Vq<|{&DgmRfIWqy_kh)=ewhV4DWG;p%k%z9wi
z&);Cc&`V8_c$e#>1Z&E~`wyA*1Wv@Xbl%)atnSN%yK~#0xZ`I2Ps5K(R$}-Cebjri
z=vXsrf*bQ8QZR4sM{i-`HMgo<y;=mLO`t3wVotG4yyQ`Niom)$iEv4CsV_Yk{U!?_
z|2y;@hELyo5vO&D*1}x!ZPbPxGs%}0=HRv2&tS#_dNFhM3KWk(Eo3pMkOP`>DNkFq
zW|{Oz;3%s$Cy}CpTrBu@uKH)#hhO}FE5?lwE8j*4rbelHHB)t2C0+;m4!)Sl;M1y&
zSdI76?Gs@zZsxeauzk&>9A{}G1?%`6w{s_EJ@_B>|JEm8<C-f**Il0EtrleFBlmx;
zSuP8Cf2@gTsX&L0vKUD@hXi-Ts|E^aIV!wzoY5=dBlq2@{y+J80WKdsR53J;C<J85
z$^O$c7%-j%>0yD2PqYYUVCKx3XeAya2^=4Guw$SpFklEL&dF*XQUrKY<b2}tAk);W
zDYSA#!86X^5fKr}8{zu(>p=y=Qx(d^>)E@Xep{{j&77QNEi9FlTLafGuK$&VshBtS
z^J;P1pEIV~Gan4TD#Uxi$M3v~DL37v;)H}ohyb~ptP`auEs?{0S%Vpuz_H>eUJxjh
z<1B~$C1T<5qc>kt|BwCmbxgnMT6l>iVw1N@WWDG)i&yu6NV&$#=Ft!PGIG$mO$3q?
z<KQg9mCm9(Se$bJw@x074}V;Rb{#rG_D-Ul=PaHPH=|2y@#a?RDsL^Q0XMoX4T#wI
zDC`i)-ap7+r8S!nYeqtAD5$Kx4p!V%l;NvS-^19+H>l`teytE8)*)-9jf94yhsg?|
zn^rBEum0PdF$iD1^FN%~y@R4}DrIccUZS;TjlR)Vo0<vZWfva4?+&~(XMxJ2oe0x7
z3GHO)4b3bNc7f11q~qu@Bzu26UVY&y_5b(_GIm7i%~PxwS=)bDZH)4u19om&gPX6u
z5WjAsn6(Hji)U&V8IPnF`ESOnp{pEaE>JY?u3dQX*;(p;<b-K>=E;YI`Ov1$GOK9c
z3Vc83eT<r@6<5O|qQo1ui(<f+i2zKQFyc*I{e3i7w6zeWGXHEAkD1r0|L+(7j*$cV
zs=8Q6#KT)@L&yKRU>*hzAE)CuxQUnWa7E|Vq~l35I>{JN<!xClhCulL3>N+V83y$g
z3$s#~so!A*o`Nq-Tk=I%n%3V4rP2@d%t>#v<{;coC!K<wdy-d~a~Q`T{|)VQvQ^oP
z`@VhqV!(g_Sh{qn+B=XQdiddoF>c&AWsJmpM<-kTo2ovMQIVn?7LQrazmD;v28+T*
zv4z20Rf54mS!s!QZ_30Tv2gdlS+`)5c(V-)3q_K}BOlj~&3|n|uU_5p<r`1ostK23
zc)!!D&8vsXOOPgBpoCIFvCwP=*dJ6P42z6{w}-o0Z}^U7*9HtL5KDF0Ir++JzK&O^
z=q|=@rsy#Xp;21~4R}{trj`9#3(d9PLXt2UX@uPT5>O!4O}u4sjVHauqmaWu>ggcs
zRgQQwEGQ~Q3-Q>-CRJ1%Qo=`!&u|UQS=Mj~=fOj)D9t=}|2_El+r^gf>g%`}!~Dk7
zz2vif$4(X3$JY-z7O#GMQ7c^|6(K!LTEN4%C1!v68@irxzEU3S*ts(fl@yC-$aG}q
zYQ-MXP6sp6k(sUyaX1LgK#$4ZqQK?i>LN;{hp_CYZ`6P1^M>P{7oWvBy+!d!%CW^v
zL5a>!b|ltzvHryc`Ql+M0O4&~X>8givc}Xmj87$}jEoF8cu~PmM{efi0&Q1J6y)j{
zJ2kSZ`;qCT9A8nIB(S}<KzfmovUi{Qtrf>Ar2dQP%lc!oS-M^<Z_V<barZ3~v0|%5
z302-j%eW+8j{R!#CGU*!>7{UYY^*BAR}O}<ElOMJ#Zg?2&_&gAYb0_Q-H`t!7NuL;
z?qquiel2{olCXNJyATuNEY?F$lep`}J0-os7b!obDsdeji6yL&Kjo!|P?WJnrK%7f
zrWGs*bN8+;ylxGzdBgZpc@H<u^EP9yX0)2mR$jNvGe3UyDMns4#TuoV<P|LzR5@cA
z-YUn5S*wfla}bxL6-+&ahR-jmQuMZFa<n(K4jA1#g%*#rLOoQ?7yQme8Pn0l9nnz{
za!6d)n!r3XpP2Jhrpybn+gD?rRV@|stj(QWRIRJ#TlIL#UD!{Y13ngmf(B?QoiKIk
zRAm^U?mePOVgI#bz>b0AfdRATQhCrQ4pOPtcnCG?vYBs>M;#iQr!go*tMR6uD^{!!
zTE3T+hG=Y__V{)TC=AFNPFkF_MqR*f#(Xz*#i{STSr^Tok<Xr9-s-=uwEPwc6skI!
z?@`rT(v#k@Z64p7dZ+>{We^p$1L-fF#-!u<jJHqK`KE0;#!>Mk!)BI!h;6w2-j0Eq
z7~ps@W1QYj2z+O}<5IZS4t5MQ1qL|(kq>+_(mD-opP9ocV?wX)R3Id6M6c5CzyCh&
zx#u2q=)ki>z3*&jzV>*>2LoJ#707Qf4P}Y~A<sJ5k4FObAIIw8Q4{g%lbdk!%x4kZ
zHWD#=;;qTbDm1TeXKXw!9(cCoX$?B;hWU}wF>@{D@iH<qgeQ?H{I*<02XSrpk#Q9e
z5CDJqZ!Y{gf}$gYYjL!Saw?NXT-5ieXdm66(vl*@Q_alG6ypWjFq>0zXV4f5>*??B
zSJf^Hf3ZIN+E$0<5icf9x!@){J6jn_$S)|6{$d|GC?gLZo?h_v@qwqD2blN@w}M>K
zN(}<(3nibY$`t&H3`nN*MMk>x$H6RhF3o%#<!snn%JTR3hrhJd!`;nVrm1s-%Ckf=
zX-vIybFx(bXC6E#1|hW9CO0u+p~@4ydfBwmq-{)j_PEE60W*&$BqZRy_ufNraIiH~
z8s_3UVB%N<>^F7{93uwI9Kr9N_h#KV#%xb`a@O6<T{Nyh1wuL~pb{>DiYMG-I5c$b
zKH)9+7Zhk{Bsm?SG2hAx_qx3_3p%J5K%O9#$F^)-i&^(xfj@QuZ9-ZiIVH`4ux6r@
z;Ei-S)}J<cJUql`uo(xEgW|2o$s^{8tRBHfPTkT<<h|U>jucT5!J-%@^4xEHh$$j7
z;4co343u9t4cFgry~sKaz^a&3go)?7B=LO5v9^21c64qZj+Y;qfl1>=;q=atiheRW
z9wv_l{YqsxxAWU8Ey%(fvma5(@-ir^pz+}7;)y^}9!$*#=6v@HMqb!Y4D9POCB~U1
zjya|-nvaV{O~8R-H!;NNii}*5r;xmNC8WVm;@oiS(-<+hA3_4XG(Sve8HUHl?7$aG
z_aMAo2kejEt>phm3Ppv7U{8D^-uU<{Ts3|aT<HqX2BuD(hH+wef9R!GB0vmZ97v+!
z3sRpYaPpwSdkm6N_bUZLVw*w4T~2xm=Dq%sggYx^vV7NEjPW{V@hrPN*3SD>@EIld
zRnSso>!U^1^o-s;am{5HV*ct<bm`nt=o$IGC1a*1tXa27DG-u|RrH$tvaf&s_6xd+
zK$mDYY};O->cQ}K(d`f$6N`Hu6GtXDT#Z&Oh$#)E*QUuBc<{~}@YUiCGFG$_A?q6-
zvlCrKY4PWeUc~RyCSiz;(xORk|7{u!7`kWAo;`T%vBwl`#QB4I7!xN>M0Zh;C9q$b
z0-Ty6lg8$8&N=6(BovgSb$NpQ5JaKjA9X3WSdAtjqUK5&w9RA#UM_+L1TWFht_k`B
z(3|uxKlmRmyIK_TT7;u>fGhSUC5dv_4xL2uqB5$JZ1Bs(lVMSDmGFd@Zvff^w?g)g
zZ5Sa!&L7PC30IA|NG3-!G1n~h=$?%--=We1yzuyaxM$WYi0aS@PNGc6&CQPVRFyG>
zXx!cOMz>Uiy|^(o5ZEeMCgMPBUAX|KcU^#`Yc`|*ncXx)PZmjAP`HtI6{UrE>i!vc
z<i+>VwR;Z~<>d&GkSw^#P|=%-VuYtyZKM((l_yA8l!yX_0y)G84rwFW>fWMFpNgw4
z8;P6`=Hb?>##jgivIVMuYy#GTE^Ygd7!S0LLMLxW(L&#Y9hBA+{D;T}&dtqT2}7}t
z6kt5CKNWceTCmT>%~J$n+Q6~A2-jVCDe{ZwV8*rMYc0<*P*m8j^XFn9HQ@!icIk}N
z<Rt78WkdsR(*IP%JS2iYg%*!340H4F66T=@(-)@W%1eh~-y5Ic&g-vG%pNnrnmp{k
z#}@-+<`P=AY^jJ8-d}LR1^lrgUe%-hV#mNSV}RfHsk*T@jW@&{H}T$bu)ce@SksG)
zRKfG-&sT~iJRmt0=Q6hKv=Cr(Wi+BZE0w3Mq`g`Q(zKty>X1P^I)riEkTf3NzSz2X
zlWYX5TPtKd_IE{T5uShS9{lHtSCqvYu90zZ@krqw%>vHCB%wzZu5Tr>Mp@TH74Cp=
zB^2+1hwi!&yG7{!)n^`ow^AbHn6h0JnW^nFmq904|3qQl5|2#vL$W5l{P=&A@?fu?
z-LY}gW>pfE3<;$c0|@HjL|v*^yFsNM;>J^e<4xZPBVTY?oInBdUT_yrHwvVm448f?
zFDt~$Pd$V?9)2DXVu{8XWk@7#v}3=DO4`UxXd`Z7OJ$=&E6xT2f`ZYyrO-xe7vroR
z9kF=TMhrZsXRWl6Npm#6hKaIk^BO7VY|u|qw{Bf=Ff&~?%)6~wy2xI|Sq^Ea;94YJ
zkBp#=V{;coisGNAcmaIy4jDV~$#~_Nhv8G}*x|aT=crwq{y?W*eN_J4x^@wP|1`1g
z6l+tSn;ekvP^MBbkyvKAw!#5dQE+J8s--%#`C-o6_+id(*b%=B9V1#D07F5%zP_%q
z-z<Ie*&8q5iW~11I<+$#4;3MHPn=N2v<m8i;MT1aP0jC#v@JKD$$Jw~T%ze!Pj5f5
zW)zIv*loCY(7E{X=ie}P$ayj_gbu7B9HZwZQjQh){GFF@`LsLW&?*9*d|i-`5HGZ<
zrsK#&A|3B2W!6T=hlaGqo^4w(_}nw_`43AlVT8~QQXbh_Rin*{vQzHH%;Cfbg+*vZ
z*UbN;MvW3H=Gx=hslKM2avk$8sW8Wy8E+?JlUX;;&lJ4B{r20H0wE6wIX4k_fcV^V
z&nX(fd`l-|JC3zZJm4XOg+`)X+qMnLuK$367<KVTJaW&ic=hA&g{iMC16o#b9L&-C
z^WRpkRtkiQk*rn&&a7gjM@1x^SydcyOy!WI__(T<M{$>tk)=}Q78h97QF3RF4n*`o
zC8Sva+dL{cwxzy%Y}W9jDWSMRvq_7DW+V_hW)0uAb_KegdA@qzwQE<Q3kr}W%9~ur
z16l@)cRx?;6QcyVI;o1s%h>~lp-USdy!-Lz@DLimAWs_*u&uu}vSp=H>$0?`%jxGK
zDRw(veC|oS@a8AhXjDk!dRtUjgsiNC!V@W0G#i=wSt5)<r9uNOgT;fH2$^hKF&}+S
zn~(1nt&%nU9KDuX%B!#*VpY{j^}o=$1v#16F8{{@7Q>h*6Gft?fFPk4357zg=n<@Q
zEfw!(gdKAD!8;`YEWbxXKhWrf_A*j4HHDGna7P4O^j?8D(=^J$uRp<%F_Yw34rPRo
zRVV^D=?4yo=b+sP2@QjX>}huGuA=)?M7fL}cLiL^4r0!?Kf&AE3%M2rQ4@YtzqTLq
zQDsm)QPs$x7di{=Zu`>mMRMFU1{ht93X8y2wX}`Qt6JI`4-|wd(o+#CYu%4Ew%!eo
zuh%P~k;TBuTeF|Q^>;lA=hoq9=j)FA{5+(k?H8jRJJr6lxkMwaUK6gmdMfts`3t}N
zwicdl&Z0zU>4TaPoABApx7D(gKH*-jyrd92<-qt@ATv{cuO&@1FC0r<jyA2?Q<DGr
z?6V^17#%I&Z>};7GHlo|oO|xMD(jP(_Bz_O+tb-Ga4KMcMlS~q8l;T0o$QK(W}cuy
zAqstc{q@&Y<3gW*{y8R3o@^JKJQW7r$zDg<Go1*bc#dZ?ril{LLbcI|CSFtVzsPTt
zqN{;zJ*ov9;lb34QL5^#<qP=E<Y^m^@9kj6Kz$g{`vM0g)A7tR&s2*}k0Bu;a)2ga
z##pro_6Iu#8i@gpx2Bq38(DOdMK|A!@y^MNjcnnnRjZT&VUrbR{TpuMb+Cs(Dc
zcBIUyXh<c(K|@CYqCi;cpwIIS*QG+j2|1bCP*+`Zq}iX76xg4Vh*c|BV%f4^@y%QB
zB3Wml@-Y|pkZ4?S@lf>Z-yi4pImco=jeKA&e_-Mrk6+s|;zWS`cQF|9>#vLP;iq5L
zT3n}|XJW|UL1J*RKh8PpOti2#a?m{M8pKa6IT+rySenDG?OT;X?wUW>V8ybf*u3*_
z9u%_}I`R^nb=KMFBeK0cdUQijfEY)XqHOD4OHt~TqMs~uXYRoRSn=C({3?bb7yK{>
zJL4_PxmpsBxMZyGQO-mE{{7HX%5)J!V=6E5UF&J4iN|qQDrXQI)~%JZrC+gV;m=t5
z``TJc1BQ$kjX?tkqF=xB(W84;F%r%46i2z<@@mb{{_>bGuzK}sm7ZsVoEHe^pMSpk
zHS2+TuwU#LXhIB}>a-G3Vb(?Ry=Zh{-n@BgUlA4-rVR5=m@onKdft%vy9rTi&&q;<
z;sVRrYTj1dIpa2UwnN#kx|TH>W89ar7fY6{u;S2GdC<c*2<;<-v2o)jOuOePT-5I@
z70-+VLmTW**p2@@`8p63j$|=7%y7=7ZQDg*Pi!one(fXNalJmv<a@o2QnB9|z0dBC
zISV%9g6QsuP0mCMZ#SfiVjg7)O5mo-`~K%8qVP8Ln0QQPZr{FXEk0ei4N=h@L`iLz
zrLGQ$Y!e`7Wnz&1r{x%XkzNltjx{)d`UpcV9*;kldE?Cf!{F@S7EZZ)l)OV}ZW`Kl
z?u4xEE3tg_I$S<tfRZ6Fn2(R!t+Mg+bVWsQ8&xLH?{|od+70(Ug{h+7K-Iyj@^q<m
zl5x=`<M5xU-{9GIz7kK4Z4jSmQF>G<fb9GN6`6f3sFl2dj05|yQtSW+h#YKAO1#2%
zU{DZJlk#!pZC5Jg!AdbcN+m|yd5QfQ6dH{?XU@X>i?0+#K&^|SYoo6p{J0c%+;|nd
zT*MTpg^tZXn2L{HyI(~(xG&k-|KU+>mGa<?_dSJ2@4o}$8$;E_^gj)4bn1Qv=pd?W
z^m+LHk0gY&^hHXVro(d!^%?)%Z|CEJzP-_0=q}Tbwso@K9~%bD_e=+U1j-MZaWQGq
zB&8_clymwCRUkBt<6$Z-$J672@v!j9E3e>+E3QzMUYfFj$JQP8)Q!ggEy>7aCJBu&
zw1^cbF%pV*xww1F#3{n#-7Z9Eh_)E6W=cyzWCU;moj><or99Z7OLt@^$6));A~l&Y
zTAQ$N(eQSXMPd&h;pXix3Tk1<%{+j#%pB#Wc89o)^%XC9oxPf2%GjZ3v3xCtoiA4Q
zWuiPP&39E&)kRHyG6_=5<<(~%Qp$rpdiKQjO`AkSUblhQh{#AZlZ|*>LZV9CLKYog
z4_9GY>_uK-2{P06iDr2!!rQh-)}GxMa8`G0j@gTD?GE=QV{r4`=kF=y!Ct+4W8;Pm
zDqpi<4v&b0g9xM~B<aP8f$rV`f*(H|NKHmgK{58FrXW=m4&D7)qgy9G+%{#bXsgHI
z>~8HeepI`vHvfscHfrU;Hti8sk&Yd^^rqg`(-$rMJdh~b&9y;9cqkG?5rZ4_7!ibN
z?%|K_UE1T0sT0t%TW1UqMM>2kmhzZ~wnF59KbCy2lm|oFb%LWP0&d;5-P->x1&7}5
zu1JcDMXoHI4$a*}J3d-0<BK9?>H%@7oG&hXcfi@x58b<V!reEB*1uQ}x_azIRV#CC
z6}G=?5)AO$;G$I|3N&-)&Q*C*;5R`OM>>iJ$sXcvnqbxg^<cl)G0+4U_$Q1hwt?Re
zm2U63_a5AT|NZJ)iHL~6+i$;(>C>m9vv?jkRSEDC(HAU30rG=OaWG5F#MA}CoJ~JK
zq33dhIJ>G?+!z^P`?cayCEokr(@J@ebIUeyWzX%39t)N5^zm1UXoYzPk+M%K*$1``
zLAZEC;o5sJmsVDQ#P~Rsbx*P8{mCm&qE%2!JpI6JR&NTmjxCFjb-4(a(;x;F_6feu
z;(C70$C&y2hluXf*{VFK0-N+=sDcJ&+Q8@<x1_|x^PEK>)U=IR_y_tUB_$8TC-*~8
zptiou*aST;NgI{pjprX%%7dhhc8UUM3D;{&#0XK?6xC0}#V0Ts{Kc3;n3o6AQuiWP
z=#+!$`;d7+tQkeNLs@(*2KDKM4LcLit3!B`F}BQJV{hyhbQI-5LWk%mY}vBaGJeEB
zrg+<FEnXP2q%Ij^nUX+-!OBCjrU`vhF5WZaEsB5LW&C~o$`c3-48*e!O&0?f`dc<*
zr)s0V54Vo(qw?w)9f>Vlw^_?0UDc*lpm;-!6;D!H$%7HYA|i#=P=R=%C5uH-AwEvi
zza6`F$4>ER`S7!^;KP?^!BrikRN-0CRD$$Bm;I=e2Rn7^iR4{>A+MA@Dc)g3@ZR-M
zmUyU2RL`~-XP=e`4RpZXl>I0ak0(2}XCWXs4ABlr7$?k`ZF^GCIV!kDe^d>!uReTL
zDGzq;)*Wf_yRdzKiM5@fVG(c<$!H@O?JjtZ7J>TgjQvQ@%2RawcA?_~f<qDIUV(`t
z2g3jN4Y;sxFIAp7e6+3asdUfp#BA<=`Q;Z?bwfAtfnL|_V8_6}9Rp_W94Lpkg9i`B
zqD70;VF&q0|NZZOamgi@sBeXHIfV=UiJ;bFX&8l`2@SQ_9N0Pxcl_smr9fEX<fc3$
zmzL{!KhI)xXN6dz%NDIGU-#y+9~V}+tj`W&yg?oXO2vSKX8!YuVLZra+r9(bU8qbi
z3pzPAqU5faJSvV}^Gtk_X*I#c)g2qwuT|b}YYDCy{fN)a98^W6rZS&O%nGTFs*@C4
z>C{}-^JsP0&vnp@C4<i+W~?|-m7p<*Ki6c4lD!^V+BkwEGE?JliA8y^Q~S2qx^=5H
zyRh(ZB#9T<%ryOKz=cE6OK5}kQWttPKI@Fru;!O9l>%XCNU$i>Yr4Xkf$fcIkAA`W
zlLiiL+X?^u-@BMNc^Ve{v;c3-dPXUvS(7=ri=wG0qYJ%|FUpB&V#(RIAJT*e#Q%`+
zws6kcgHeO~U`uQ=y0#6G{uQAZN$J$g80)C20L!NmT|h`ETKkKoU-mx-MIE>mQ4Z;q
z!+V%KI5$^Etd+5+(pxLu_#0C@Dn*7$^2FF|__{eEyGS2eWM=DwnHR-F<h{2|Q#>n8
zqnecUmB|*cB^CJO_2)5n;TnVpJxFiO1bRHA!IDbPVEp&##}On7U{p-wT(o1u3Z*>Q
zI=Ty7iqf%7_*fd6Av`=x6pE58&%lUF#-N)hp+<`lfsUQKpjX$9`1qyAlmcO^pceHi
z5H_?m)&gt0VOOb)8lRhW?zK&7>G}%GoTH1h7E)Uc)H@C-e#>H}Q><Im8SR(@Xz-=E
z-db9Xzu0D4S*_l-A+_Hd12VOTR)5Ryk?mag?Pp4Put%@ckht?NY~QEHm6KRf4GnR(
z?n~hxAvE{7=py?`&LdsKcwF1y06cipM38z6@beZ0LcPDOUQ*LOnR&s|wJLKpFNqM3
zn|}*LiSa&q4>aLw4v_W1L0na;FG<?0=OPXi6H9LSUZxWtUoY8PuC~tAO<VippPQlU
z$^WGCAfZr<ztHeOT3Q<JxZ@5n@aI`$&vg9jWiP>w0Xqgb=W^Z=(^tah`~Lgyl>sY0
zla^(e*^~3#$pUJAmHN@xmQf&d7Gr4K15uE2gPa3iaKQx@-kWaU$x?TFJ?t2$4+9+E
z=DVyf?#UKjRd2T8WUHOMKBp=M{#f;gsygR*v$wkFA~A$5gUp;;oT_cJ*ZbtbK-K(p
z^3<uZH8E}I(xr<s3PEFx6ow~!_~D0&X7UlwWsT$eG`1G@_(zKYase8$bQ(jxErMF%
z3`w&#HV@vyN6alQuU2%Wg*V5SHS;!eXIXJR=6(JVF2CmHYH34d+|c+w#}s+JJlEg5
zHwJIN&i|KH+?U?^2v=Qx8GJlkj_X`(>YAOg5AVPA8t%A%mbI>quAU;KEnX2>S9wdr
zwk6_7VaKLF)jti)IdwP#pFHz8E*&{UgtqHnH;f`diYOAi{_<=*G5ZZ`dAuRsU0rA-
zjodjgGAMXHcwj$%`r%vk&p3YVd*gxIZp8R;mnuGKO&LGNF<|>WuKIO>82TTM)v+cN
zU|-Pav)Pj|FZM@<oW=k6?L76**b}4=r{8)L&g$7&o`lOJoo?oYs@(LQZJC?bt;BOr
z&%!5P{cMdE)H+y<y17`^T;0aptW5m!<2UM`5wE=NcHDXUE$G>~oje`6JZr}Gn`6d+
z;jI;j5x!49{Z!@0F-V6NbWFqfpHNrdt3dn3j)8wU2Kaq&Z6QBt>eQ)9fzTMMCTb|R
z`{08Qs(IITzWkS??SwU7DW=OAX|u{q%$xgpgUj{u4??Q|A6b+4Sv?PW`}!j{`+z79
z9>9(F%)%27Ooy{9-)611&3x0k)#|am7<%7*K+{ydLE>F6HWtBsN8_3+#;I^)$id9B
z93zwq2yNF5FMsh4hFvxl{=pqYfpC|KpO#5y1Hj{-eutZ{xg0I!jFf2_4U)#_Z~Xq-
z5|!MsLOe9`PQpUNBb7Yalo^lW5~VyS`Y3XyWatM*<G82X=o$Tn;-$y#!0ivcP|cHd
zL6MfR_-WBHj2$*WaAgb=K#bXMW)|4A=`Zzbdl@x+h*AYKxH0YH?;$x4c5-wU#la|*
zgpLRd7`nG8uS(X>gcTQRxd0D2OU@Sj60)+g)!FDLi<jcT#A#?B-b&8ubqbcnf5V6B
z-1BTabl=@d7lMX_3F_MynMDWBKykh#XN^=Klr)50+y25LIifa7nS9sW%^PKV_sCs)
z%(!W)QXV`cXMIjmr)vE#ZS-#$jt8H99pCpG0T=HeI8cF5DzpDUCR#}j??3-GX3n?~
z?Lq=A^)#(#Np?6E44Az_e0)6ay6Y}+5+*)G<qR@8IawK2F!F?^&yJ-mllC|s&6^^s
ze$~L0kC&E#=xUk@gxvge=+Hqd?e0>RPKFL0T9v?l_qSodOzm9AWV)5fS*{`gP%p@2
z;Utz>vi2w7&DnRW=vlIu5jaN$1^OW|Hv@NEHe3XdywpoGpv?ymyJZbVOqhy*sE)|m
zy9)=zd^;yZPI6Q@jf;y@`SB7S8ZHWKiHONPsNO}2>(uy!Bv~JtA$xza)FoWGq#fSx
zTI@;rRfHP?YF#+388+}nPtp$JnQtDZ%K}7Uj?JPxNUQg3Xr&0XDVM+Trmik%)7oDY
z+>(`hSU8F|mk?hO%uZ8_TcRirMu=P7+}K^X?fxh6?FTO@4>qP8BY2*jmWYR@+$yyU
z!M;5*(@S}@vQONGhlPrFpLo@R4qbYR5PASI()Z)9&D#V&+M<D<ryH{JwK8U*xWO%G
z(NV?!`iF%$OB4vT7Xo=D8LCCMyaaE(^t6i8(d`g+#%Se17Y`p4=Vv2P{wG~~15WGF
z6#-(=zN}b0KS>)tc>2FexIRqklw`4FP*!jdnFZSI?QC&_d{(dLL`ac~vucJ~*jeU*
zq}}K<Xq1#00;i$_NKDO?x{%<lM1=Hzg7m*dE>DE8B18x)LA2vzR2|#46-x<XshdPb
zX?_;A3;H`owZt{!hNA1%JvgIFl(ig{z<z0R445%Xfl697p(PVzA?W(+uUE<yCQg$V
zZqLw;fqwu7%=bZoc`6VRj2D_k3l}K`LbGn33eA-%ULO$1WUs}nQ;}kfqR3orD{#p6
zaQ-IkQB+i@niso!r}{1BhQ|WL5!b7=%jRR+osXeYw;tFc%7Y>XWTh8EWqsHy>qAVA
zrVspDgvgpxEM=!ac=8G&#JUR=?lnFuv1#K*bQcBp|2}v-&K5!MF+=)FUAQT$pZ-ac
z^_{TvyU+063-M^~?uS@Wz;kx<K!|vZb9QbH7grDLOHL5R_=zCDiFwT|P``pxhYI!T
zh!^5tmR#8|ufzS%y#oY>Vt*<-j5w%-uUO!rYUi*E`@>VX5w?c}23NoT@-1$;?`d=v
z+GwlLM&$~Bq*WY+jtjM+<D3v09E81+|H1vNmZx}2YK^4ieToK266HY}Sb)$-*WLXn
ze);Tm_<OoExKEg4ZJ@@F&>Lk%Ie7d(H>fC`JG8_0U9qZM(xbs`!j$LZ7>l=^&`=pq
zdlRe*gKb6FJ6@P8L@ArMS;k-YZe20^;Td9-p(iGe=&xug6)16J6e$cY`{jEql07-&
zZnh{ZvOXTZEl`v#o)1L`o^bAY{X~JI0=u`aK$3;F3keNHiZa@u$2pY;yL61g7q35w
zJ8!xcXLgNJ-;Vi)NK+LG1L^U*MyfoEvr??egT8^Slwu?UZo2(W$tM~<;_ap|KUbIu
zTk!nLuVJsaWHjEZ_zh&HCLy4cFzQpb;iE6U!_)WPsOd&49Y@;H0o&J!1*j?iXYV@T
ze6Iih^W5Hh?>lGjP>4cGXi1{7iwccj3WWwOr6s9<N?W0%sWecu?9I8ohuizk-T(P|
zf4=Wq4o52L`?|+{KHtyh^PaEwdc9xo*SHJeZ97t7aW@L6TPrw{dPYV@DyF|G5HF!r
z985?`<Ty3xR87ZA*^g48)FLPhb_{pL#kV0YZ9T&L+|LRfuk-&W?s}Z0vfs~{Ge;Fc
z4nvaIw&TZ-SHgkvvN`k4KT&>jo@NaE9T<@QFLSX7-OrpkQz;O-xVTWc+E~*cee6+u
zy!vD1rBIKlzoT4dHIG^X>Ex;Exj^WiQz=jjE(Ahpgy;4V1M%wW?-frVIsK?wgUZMU
zu;KS#HXfqKt70k;8ioKQj*XQa0t4EBmUxuF0ED?sg|cuzOT?y@;<dLw!iC&Rmr`Is
z3w21m(*Y@;rIj`8P26u?x6?^O!rI$9Ac*&53XwRFq^hc-$7&Bh6z7n@Ytt7WuXzi>
z-p&x(@l5lOvf9|n3dHqG=vCg=u6zeac<<1z4fgIosPG^>is0ZNr93!z_|2F!_9k?t
zwPIf%PkIw})MS7pL&F1A>Mm5lNx{@NqzuxevWCijTC5s&@7<68eR2EL>4>JM^4+`k
z;Ez9k$MSbSAPr&gL?mrFSg|L)nUoNR(h9+YytP0|LJV5B>j2Qw^c(N3#%u0b5&!@|
z07*naRC5pCO?pGVQIW^dMcvs->Moa18gqz`jmGWw%)yMwH{lpPf6HOanS#{EnPXYt
zOxs2y)!ow<!$w|;r7JhU&C4HoNd|#mkez}yr0Wju{1V&u9>kS>FCan8jCDm%QFy_-
zl&v5u1<y>Mg?%RofBDUK!<qaw0rAF0!V+)1{H%I*sV>5y<V;o6nwl2e3pgv~!SQ$8
zi&58KL#41*@NjpBgT2wmR3u(1DJ-Kv`oJkbf|#1_6d_Ok`Lxq9MX;yEQ30cG8F^Hg
z6rSUbB%-XWk_O}qWnbg#@mHO9F^#?K;Aa<KXOv~;vR?A#?1MGOgrk3Jo(LX73kpVQ
zP<&iIWM{}O=TvxQ*-VwrW?xfaI;=Auj=ySNcR_YC9vL&90eI+}8eOaOD$0Y_<wfKV
z7h&eS$1!a1AS#xIlQwtZd@QrJ0o4?OtE?z9J^eK}(s>#4lm)HfI;mI3cpf1AO>zwk
z2}g25EQXJ{9gF7v4>lIZl<w!5_D50nc5-x9`JC~*pkn|17d>Bya*}uo6Jt-}eNfK0
zCQX`DYbE`BtJmL;Npp^744i!o$hea+DhKQWG8fA`;WeBOpalVPb8~CG?8rQG$tC0!
zk?zp*&-qXna~aJTFk`@s0W$^+49MKA`1Le6@!osysh6TKkw9Za;o;%vMx)UJX4+Aq
z!F(}eKw&_}gV1r}jq0YGZh|Nfih%_&SiN!MMrB~3fB*hw+UQ@>Uo2_N%~5p4_7}oR
z@sADRXw8SQb})ER!kjR%W>n2J-zAT{ym|Le!{WC;<#Dq=+61|vgi1+AkLD-?`&Ct@
z^vL0`vSMD2PH^||;N5`^4G!Y&$z!o*-4A%<rG<zH^j3ZEZ0{d*S>tHzb>i?Y*g$c=
z;IK$I@VvdKs7RfEq)<3m%T~!4u(GluKh+f;EUP`0;0_-A1Ea1TOvQouSn$vccsSE@
z4#!DTW!3Kw?AU^K-TEkeMMOqXh7w8;IX^ECc~qnm19HOWmi)x?jJ1s|ylK43nddXo
z7KaaS$9>ao<Nso8KkzBKwh3=C&$@j|HCDX-5^kD&ugbGs+qNh!HtLt0n8*ffq4qh_
zj%5^x7T%DpojrVfy*b{U)cN>_Z!UrSzrS`pZo2w1#V-`TRAc^A{XEyazYN1~nWFM+
z-MS5h>B}jcpF;z-S;#ikQ9jC^O7QAM<w-Z5jf>Ia_x|ri^}q7VA8-Se41_<)Vm0V%
zDq-{GtYSd7-%iSth|%4al)uo%6~>Jlr}p$Z%vsIYoR}E{|1u2dJ;cQqUyLC`hTyBO
zzEXyHLuveU-n@BAN8@~URB+BWS5pgA{X$b#Ph=VW{QZ?qh0JRwgYvRc6jB~PnqGW0
zxVXAec`ye<hTnqeQ*XzBe!Y3NZ_vthGyvCf;eFOrVb`|bR8)1YYf8k&-5C@g!|cgp
z=vB~8t^cy_H!csQ09A}0eJ({fe;uM1Kxfh_g%vbnOG~;@VV;QI{srayGN?cpeq4N0
zcBi-*bVqs7QT(>aFuGoBlI`TFE9|X}GK{+ZDrI-Hs!9yGiY#dz?u@+x={v6Lmkptw
z0rfYkw6R<g3^@gc%;|ey{e-9I6(YdXIERvgT|M?LTr&Jtm1b>0nRX=&jfRFts8^D{
z<fg}$+=a88l^laLYnG@m`8me9qIxi0>X%W!*J;SJre#WbHY&z)Gxq<8QDY`y);)Ki
zd$&#q@E79_^vErQk_mi+Bk|}H3-#j(?^>4Rz@D8dj5S?wXp99?HZwk^0JEOD2T?&@
zq~+)Zoc*P7d9@r!hprdm#sO{c(GLfy<Ku+1oFY`vxsxj$C8S5k(V14VQXo8GVay-S
z2m`v^wbLeXVj=o<0^)Q=WTrHYe?}QJ5sBh9{|xl*ZFt{^i;L%?6`%^Sa@9&@JxD4o
zol_&^pDE#gJ691<6R;NRFY<#6Msp!C<{+MWWF|IH=3fiv%VH&+*Tr6?hN}n5CQsye
z3?%?IxZ2d#RF>ei7oJdAxz`lqh*BQpgv{>|5n)Q`eB2%PVbYk9RM4Y!8fz;GI~U@>
z-W_=U$%pXGmV<~0XE^pNnG~~A5)jp<9dZxu#vAXi#^d)-QG)T!t&4=y6RD0PiVaeq
zLJEJ(yL~iYJ0dSN#t6r9ilAMnzZ1)lfZ2~ejq9(uQYjCJHyT;YxBm7s%YQ3{Lqu>o
zfP&MhD!q6r-gTe_@(nAOV(qBm7<=7iwc|i7NX%*buRkjVjMi<OaOj{RtRmk+sRWTg
zMZFpGp2E0M*U@8+mtuU#X1|#D*|qIg%wbt~WtPIr%?a6ghUceDlVyN)KW@Ry=@a2e
z27|PP9)IzN_u`4AE8!m=MURrv9FsH%Zs!bJE(qla!M8uH#(>`4m6s-sAGzOk*K{m?
zW<KUWzYLMmZgGi9c_K9_8LcCO@cHsZI6UhvbZHgByo>`}V-c&tisi4Uq}sQ2z`g@1
zY90`VMR-J{^15^Rbz?AtmgL(+MN)XsmR6UF5p!riUSF~Z@2&Z+RybYekE)Vflvz+f
zh$@FqFMb{GFL{y*_p<nzH~R|7f5Al)reA#Vg-Tuel4f#=7ZCy7ztn^IV#a_O0}U{s
zX&+e+uD<$eWhq-W_5%0KxDTUm8Vw)1GCyC&k*<%67nSv5V<}unfow9KGbuEA)rI|$
zN&!j-+Y$;lSHjW7o8HH=;NNi&zI^{hc)K~$+XuZEbDgl)Ld}dX^Gr#8CKfzkC`Og$
zq|_>M30}lYobn9Uswdu^KNCH=c7}(WE7y}6<dadnbL($->Y;Ji8kda7@G!&(&7kO>
z8YE;ED*9x^J&zz|^BM$jBP45(-Xy7pXyPIse1xGH7ZXS8PEPc`TY!j`QOMxh85bAZ
zAjX%`8KfCx_5L$Zw^?i|6;UD+u;Dr>U}@Prl3%RV9N4uDGp3JI@q(;NkX%l|b3WDB
za6?_1sNN6kdy%@6S~tF#XrtoXbS$`Ug!)#Pl|WyF1h$E|6A26UA{`fx`{zD^k;8}5
zu!307u|Q#dF1G)%1^>Hg0+k1g8qkhnV4*|Dj@bJ7a(wdD2;4eyh>@O&PE{G5=0%U4
z4PSqX*Vk-e`W>*B%6ytu4Wy^*6!FRz+5;axKac&V6I`4e)j>mQQanCc`7Rz`^eO@<
zoS&Hxhbm=YqXvhQa^T6b+%$F$`W+@y&Wjs2)?IKX{im`d4<D~su1cGGG)>*5EOt&F
zD5mlt&=xD#K8If2JHyGrfzM=6@NgrG-ZDR3`92<6un2)vxJ#kJokA%?R4G*ukX|~h
z6bN;%kne(`-P?Y_7u%RJJ=+}EZ-~G<d-y7Ee-XV0W94fv;erlPsw{Pv8cdsZ2OfT4
zI^Owo1HwY77(t~@Ytm0C8MzR)%G3Y%5vJdIv#O)iLAtZx?^szOUV3`2O3JD%&!jwP
z(D9Lx;YxXM(zFLKk#u}GX;*8WQVAWuch^=tIcFSx-kWHm_l+@`og9z0?K|SYzHNBx
z!!>y1o{5T%XLbs&b!9&Pe*N^*PpZ&jXhG9X;$=Yg!DoBJfBs>|Tw*f@WDYZCG!c>&
zi;2sYEu-<6P-T2d3@QlIOy27`{k+4Op0NKkJy2J3!I{jDmNZz<mTM=dKxjup2Eb8e
z3#z)h5+Y_%k&}dS@(JpLt(^^gNk0h_$J$=jAX>s>cw2f|1LA3+*%nR|){*~z3Ur@v
zpwd>W_EaF;m&rBMhU*ADK~w0?hXu>zIwBqf<sjv3fa3j-rYffKrB%xxWs){XPl{8E
ztk8#{Vc`%XPXBx4Sv>N<U2wKH7`QrbiGPfT4I-2xRtcL0roJKdH4OtrW7fsBfRA6G
z`tQ?k0B)r>>;+Fe$u%}w8MXRp;|6@R#@LI)){TmRCCD!p#WaJ*nn1-i=@l=$u!;r<
zCLqY$Q0Q~_HgKkB2o<_6$8suzxw(iUk)cdf_vOrg>GnL`6eOO|SC-^U^&L1=DG=H@
zG%Qz9nSty7dwT`?_qsrNX|Clxo+3lCEs1Yn*VbQ@@}PJq&&teHYqhkehnElWyaU57
z>q})=!$YIc*@^VHylDAn@C>EWCA~>YIR%&D;lbPsB;e(@R^j%sBaYK!lr>+CTaxZo
zk~!he?-NXw)E&t5*woGFZc>6%gM>B8M#VB0p?Wz@kYjAT2lDcZ;LUfxeDNJJb9jj4
z&^*hNNhV_%K91Iisno(;DtR^5Ouy>gOoOD}o0I-D;lYZY?LECB8T1g_SmwE06|JJu
z!290A(Q5BvNxEGy(o`<eru@wF*HY}=P9mF7Sze~@C%S0t?%TN)zwo@Wb=v@XdOx7X
zcMbW+fnJtKAbWT1`pvldGUKeIep+&fC!R0G5~v)K3Ml%!exN_|yQzwr(sT7N6mP`K
zrb44sMvy?r&ntnuyPL9bt6u!cizIud^TMCZ`i!D$dR+v*M~xb#gjnUbpP!#fZ`!nJ
zX1e~2Fl&xv#=zObfUy=EbC%w7pS{%onw0cB7#0?WS+i#0si&TT{0<Kf$C4#WaOa(O
zDrM#Kb`SK|pv|1B83Sevm@#l(U_j5^A|NjYC`3SB&--`ZeYe^8?s?IQ=0g6H80gop
zpUPgmREdWjfsa4_SQ&0H8(2{2IDaofvXeJaT2hJ~`}v!4ZlyVK#!GT&tWCz~!Xrae
z9rb)F4|;E&mz9j$M)t?*4M)(qb0>)0-NA##IjkfeL<6l3R6rCN$ZGOeii`4*l9s8I
z+9VxY2WNEb6oCz&yoJcvbR>SW0>M6RwdqTkKMT67u?MyzvK<Yc5ju5{v)lcsB%fKp
zk_P00cn++E#*bB1BKIhj-*WR&SU{_<1Tmx*7UYYiJd4dKEWxtp=EI2|XBzW9b$)4a
z2WpiEJDLpR8M!e(^87=XpDm3bYY;wE5zp;YGcw2%%}}qMT-<qf8&00+c61vy8L7Xo
zQG(=+^E7xnz&9V$3nY~XTX*P;Qu5XJlMg1~?Cy=$Z9*tRL8k=q3F=))SU4Q*ZFz2;
zfwYV?n6gB8%T}<fK8l;K83eyyc45Fpof;T5R*`jvd|0vU1>AJoeF$&e9v0<d-07eS
zA{Q5TFL-;pu`gLEo>~QYc_}H$^m>@C{v}KVojq8VCt&2z0a(3m6OBywl@7-4W5`=b
z7&Dw*49Hm4d-b(z*Q&(D;BKYKNS&Mw3e+F->V^4Y#()_E$6-MB6*BLO=Rx61ivpn-
zU=V{P0?U^#$1~47V>;(D>th^;z(4zfbj+!thHG59I(O3RaKku~h<MpE&Vb|_n^hmj
zz*gwr{5*&k!pO)7r94>Q*uR9=%VIfY`uEU#u|O#m5e=ZcU}cf|*{us@2nZ*VA+(S~
zQi7LH0InW02rs_79-hIzC`=N%pbD1uUc4VgVrm+?w+ok`rwzKSc{$nmYTYi{-3&s0
zA@RdX+w=S}<wzXU?1Hwf<V=s!hGPAo3D8RC!So2&n+KFzqH}0K*$R0jRitNf5FX?}
z#{fSfJv+xxAT(thVp0-pBFWlUdX1_mFGm?^hof0pIJAEcmMnS<-)=8Ka8MwUl6kn-
z2n-3zhA*95Jk*N}8b7w?*>Y8-^a2ZH&;f>cO5X9)SGbY?0wYF`L!aIkqC@+3<Ozq-
zXt59F2aWxYd^h@uF^)A)!FbJeRXPnlIUYJFL^WkXYR@k%#6h8gi+UP#s3?y%1v*VT
zXD{^Xcezp^baG|+sX!>F!Zq~3C=e?~A^LPteOkRRU;Z=(H2r>H{{hUNJsTnP++9K=
zRB35x=-IO;1`HUW^3ZMcr!zDq&^&44vy~guv5=E?LNGUJ;&oxcf(1$#COkYGZ!Lcd
zcTK+wT`8bpCIS_j{;^9jJD)&I^nU!faTCYC2$&gdr#>{gR8nY3glY~S*o()Wd`5i@
zqxZRZ<$ccBTXpHy9Xq#g#e^9P(EEaRDva*XdUJVj_f|an=4Xg#)du2qNWM#7h-eu}
z&vr3*@X5uPJ7X#Zfa;ZnnzpjByyzmjYrTIuUV7^jXb&b5KRP;=o(F*^9(WjIZ@d<*
zLwvd5%4VcdB~I{IFDDg3FJiyah3=+g8o6&1L<YnmQ(1w?Fn`3vCScizpJCFCS2al0
z%iCMIhrO_84@|nDC%)gEN&$LLB&Qi(0TMHfh5MP;-omg!ed|2!sKQp$JJME_o;^45
z5mcy?MZwA0g_h@c;@*d!!xQv;W8J909v+?u4he%;61cGcFlC)TC(rPjQ&v)_1nu^0
z+)JUdQl&sxpHMlZh0Sd&kY=J$LWBJ1@vjhz-+BRqF7BbqAZ;Z70)lgI{}9ZYHy^ux
zTZhlK#8W{d6h)<UHB5$#4ZSi^+z*Ei$0`LviKCS>gn@C-BQF90;biQ@)V6;}ScFm@
z95Zb;o_}I4%UOS6^h6*%1@*k}LbO>h2Xmf&g^c$ITHudW@#A9-k)R02$FDtw`|g;4
zUY%R9tRno<%nl$0G()p6pck^ZxHvra*kcqXqE||8@Z;m-Ar^wfBAkF8_svSw9LS7;
z{}={je8^am1CY_9N2|j`@!YJvHUIqc&k!Y(^My`Q<DKh+m5n_uwS?EUrn8+^eX^mI
z9Yg5S+T`Bd+S(Bj6k>Nh&TECNH8O`#Fm=PX`0Nj$9XCz;_w85nir^$z){B@U=zY}~
zy!YxNga?QiYaMubc_T8aHTw4Ji`mmB;LSA~>0UkvaS4Ve!u*URGOycmL-ifLT)z>w
z-8htyWqoV3xYi|E`%9Fit!UVwjEtD@&_KkPJi+|$fjQ{XsXbhs9l1d(q178lr8rj`
z@r-_)yi9V4Ca{OffIkH~E5Z7c&Anyx_?VHNMvsBpuxRnCDz4!jFjM_*VdID{9iy;q
z+jczje=8I%rG)BD#FTEA-+%rA-|Q3Gs10eOIyx?r#sgwv;<5DIPcY?{>l$EFXd^iY
z=t<gW%1uM?_3w%FOz2IEMOmt?<I)U|Q}dTB$F+m|!;2nIG|iz3cN!OoCma3B;#|D9
z>?IX5pH?ZQeP!IaQy^cI2P1nA!<QfYA6kd{H%Q%&oA++qn00F39yd;$jxhGqc=k8J
zZCPF_!l|ftbpK|o-}EcS55L^-5-q9odq!F^-unDEM7He+O9~xFMp96pw1|_PC3fx2
z!H>VK#HBquG{{dLyuE$Vu5B9><)q@tS5_b*lwKSYl2o`V)1gvwmN09Ke2lrlpmBEZ
z*sk8!T9#sdejbjXF(W+x*dt1LP#8;sXd|BVa|?t;b-)wPyhsJY&d8&>NuZyPvbI!7
zq2++~t*~d`M$-7HN`X)YrRt4LW8co-@Y?F1(2`>)`k)9#8|k);ic;R9=PrB&58Zn^
zY@49tWy3q`u3PcO>hEfmNF{zW6@3F)sz>jAigf%nh#=kEm>H%jc^+JJ{}W51Z@lq_
zDsfp^8NGEUs^5YGGng@8#(;qV8UHdbizV2*?z&4U5Q>8B;lqcO0PStJ-KO^cVsJt4
zLC!1OoqQQTt}4w9E(Q(6Fpn$OR)H48p8*Cw=|~v)WeF&!S2_)94d*%^5!s%vzECuq
z@r{OHS{VE8-DFhuy`ar;)(C|OE~|i^?`1vF#;A1qjqi2qP2(@kdv<VkNBb^=@x#7#
zN{K0l)(I>4?;aI_%;+OH92-ZEwOy%b!$S-na!7vlL6=qVbSmmj_!M$ZlAfH1b-O9Q
z!ZkQAB~I1a-qjoFO7W=&?z;U}r93Ek3Y{T&2nf%?bk2gD+@nS@$cs2Bs0Oh>QDFhw
zsj@aL6^H2xPsN&h11BB?${H*dp~Z8u{P(?NAST^*JLV_GW77}oaqHB3kzX#}1#QXi
zAwP!U%S#Fn8fcH=l+83Om0PPo=;IfxvM8t^&xV3I6<qW4iVVKsx}P><R?)5Sq$lWO
z9GB9@P2p9>qCTuSX&wLUM-z^E(i@{d$uUdSmPSikDDP-dG&uF?8;kJqRaa8bWT5hT
zF3N5v>z_i)OZltlrTWcRo>OV(WTsG{#Gr@eg`=H8WA(hCv-&PY5fGyn0`9cJnR85b
z4>j-&3{lF1SKKrW<8LyQ2So`?%23xwOk?I)IWovo6{v2c;HzGq>T;^i+(djmGR`2X
z;=xIh<yAskbAFM&Rg?pdRxOcr_z3pWxP@4-Y}`+3i=o<3aCr<{$XgYtsVpPb8o_Zd
zR7hT$Uup>{*|o57qEQW@wZBs1Mp6>U%qdj&#qWKA*>_Ebzo(Nbw{9c#(R7je$otHc
z1T0+k38l6|keO!C<@LkW{WikO^I;w=3e?a*h`O^(VVqOqV`DJu$yZFugJOWo;8!vm
zm6yyTQilq908NblS;Z|Q|Mskb#<AQ@Xf@s7;q3>R8RB!w>G73DeAwRExdjk)<1gO+
z9LZ12CcoWN84YU+U-C}qcIBn>tQGj5Pe}TK%=L0#ym+xHP*6~iqFIDadHnIm(WOh5
z6ZWHjz6RzJm@)9*!9Y`U)45!GDX-q!3>!8~DG+L7yHaj3*eDj`&$oJ=%Q!ce&5Qvv
z2Fw`vJ1`*oL!lpKj$gfcwaQY?&h`HJvdb=0@AQ7-?<kWw4>JbN7Yt~+Cn6#O_uY3N
z7A;zYu&^-29~J`(x8HudGSF@wKj%=33KK?vcg=DzUL1dwb`zeGaIg>V-HCkOTf5uf
z5Lsj-jTxT?H_LdSN$AkJrMheOg~U~JYefl-2H&HU2Rn6ak6pWVEB?3ycAx;dKaHow
z#Kft%^)FF8w@gipLoto$R+biF&+c95(5Va0$=Bh*$6ugg-XkW%^mV+Q`teWax8jX(
z9Vp07!5!BdLfaw`zkBaK@=Sz3Mm}Od5bP|gl(D+TX-7r1q}-+<-<O}AhMoNHO3$?)
zz49cwcj<%~w~Zp#Q&Q2a9hRB-iID$WuNpkg_HCoEXa7NipTYIW+1(dz_Eky-uW^3z
z92OQz8LtHXvOsZRo>Cs{*trYk4!*;hufNBgH(#U9z*R#rl-|dr#_q-75ffk=+8PB(
z2azVsX@WbI5OOn9aWFSaJ?l%N$*`C_hXe;AF)2lrG49A=1k=fZC@4Iz;5mG^@^vZ%
zG;~CwWlXoMU!#-<+jQ)Vj3axITS{YG(tn7Mh)Bwr#>Ai?H(O_^?tVd`u(cq*P5H%A
z>C_`I6fFZ1Fk)~&>^zi+&aHxL>(wB#`QfZ!K+oHU4jod8O~PA~IbUQ8@3`X*$QTvS
z>%dvb)SQSJ1OH+S=&>S37X}X=jCJeQLB>@i=fP*6eHJ4}jzo_hJ=DCW_aXmcbo{+l
zt6P9ik}u`7Xnas;my?05t(|hvBl3HRlv|^XS_N5@<r77-58r&r`2YNS+&FB2TI{&$
z8_TgQe4Iy%sc3j`-44bJq=(~l72l#o4U!U*)$cVQy@Nk~@SrmXIueitvk}PrOhN)J
zYAUfm(V)X}crK)&y4t8idZuBdQ?I%D`^oO6>eL1iFTs*SkcS=86XkG~M)qm6zLM|U
zA}aCL>#x9>Mv&!f`b1?FMYsx{>*l*U&^=%lN-BA<FHluM565!Cm4Kr;M)`IALbpg>
ziVii&Qi$OOF`kf0Wvz57M<&tOKqd_;#E_0iPD;Y}8#bwA<q{m|uapO+ObTDMUzlvY
z-x|HX0l~PTUoci}isKo*Cyk1V%z!~-W~QaWlXQ}grz`TalCXNk+v;B@GxXXUaM6W5
z)R|L9%Eg2R`LiDxgpQ`aB&_5styxa5&k4~~$|O{l8*-!aA&vP6tp9v9;&=a|<oTPz
zsf3X(AUd1B>@*BAWYbZHhDwu&Nou+w_n_LJACK=zI)?e)91Q5ajojZ{{$_0y(Y+7_
zLQyDmb#?tqXj9pX{jDGZM!NHgXB|->l*v&9Z3Nb=S)&vP<((2lGIy`PwS9DE>C|v`
za(2asZ@sMk_50@B9ee`eZA$?IQ66LjnN&O}tSrid5tm+%NAI7il-zVbFeXG<TxziK
z`*kV{OA5~j$e{4$=1r6byAK(Q`|p~fln3hz-AEWo%hf9Y^B!M_4OAf99iI+wE(}=(
z6skB@1}hgTE~OsC#w}aXI%Fuz#oi?zV@`AS(u1|Sq6lBEU8TxcQfN$w@=XNEV`7eA
z`kZGl(WE>mLP(kbkTCKe+Nu*?dgB|k?{O)r?cB)}If^RIs0EqHXiMhD-f!N=j(syR
z@WPI@#9IZe0&M#H1(oN{-Fwx&{$&Eaxrp+h7L?Q9#EOz77rPFfyJJug7lPO$2yk~m
zYA%%+IPM%p@*^*ip8P6|C@h~rS;)F7LiK!93Z%woy|~%XJEiFjZ?X&#Odmzy#lg)F
zBSuZ30^wYGcS<n6^P0)UT3{~~{BFdhN_a{ZWPv|^F&5iaPF6UaY6#XjxcVR|K9;NR
z#aJ-s0i`@B<rbXkg;<y_c24fN@4-i~^VfA)y)hO+e(p$4H;5JbPEhHu`{5_0K&S-X
z_~ta5U!`HboEQU|u=w`dZ&e_1qpSP=jW^zCw!VF0)S17SG0-Fiv_(Z>oM|tFufP5}
zuDId~Wj#pN6Fu&lOyFF3sdfy;=1a;f42g1DX)$L0x&s9HCLnXVSaAUv!Lo)*9d$ir
zPB~Uygf$<%t-_Yj3Z9C?xDFKLPL}l|@)EqW^f@XIdL0*E@{oU@z;G;F{3c@eMPkF@
zWcax|AwAcyxRZ9&*gXE<d#iB$utD%}v{7+XMyI$`akmr^Mg=c=-ktl@OSqM5b8vv~
z3D+B4uTvy@+MkoCkmTX%iRYf2%m34h9z@T2)n)lq;4_4n#p8v8WwBBoyk+_vOul7=
zDM4cu6?{s&h!^Q~Uwopzm6<FV$+yt(NVTb+{J;~q&7?fo6m1kt#f9fz`v6~ey%^;-
zuCTGlLIt}-F%MMQwu!=lO{=kO&x5$4&zTz<k@5)65AWZFcfQ_^(8wqx$BKt#)`cEG
z+-<9rFOs(wKLb%7JVts$DHzCi_E<xazzQQL+=000eH8Y66;Y94h^BI+gvcv2HsJ4n
z{5eJp9cWm6WFHntiH}zIm;;9JuzE0ECeC;qmx%Hpl?p^BQ1=Tdui(ns+8%=j4OI$+
zw)MR1NO=Ur1Bm=G71MMt=SDI?eHUhj0Wy}1IGT==yfhtVgpo3|Kw!&u^j>`f7QDKO
zN`!TAG}~Y@#U!VqPdC!n%vt(~+&6q@(D4?PhETJV--p8UN1~(A|Ar~_Y<Zhf9#nL^
z&~XxrVdUS-KNJg|eF@*LZin~`9$wj5p|Gq<d6RY)0|Zn^-TeCwL|k)OU183%Us6xO
z_iw-bhV|>$tHTdXCq4iC^YHccRk+aa&a>*7i)+TfS;v4{TR3hy(wm+L=ue+MT`8y+
z78a_!9(w2@eDJ{siYBV#Eu8gY{KW~%On7Q&UZ{HMs0D$~IwGh3YOXO>4t!B29&U}b
zNn&W@I<4BaQwg-NvQ~Gw6qppqKKSHIj2U?~Tx_irlireZxCY_zsrgOj^_pYYw|fsg
zOOppd=C!fn80(q{$NBOQJ~Ysn>va6)-i`H&3~M`Qbm&4si}%;jI<yO;8~m8^YU4m)
z-FKUCdGD@dYzt43%X_`DN?zIkLM4ql?Ab%B2WkzIF9rze!~=GCWNUbPNcytQ8hy^e
z+LFp)vTgw$G|-ex&)GNMGZ=o}t_(#QmwXqEa*3zsec?&%+O|br(Zce{6@R!=s5Cx)
zXEDZ4n}dt{^g?k-nTl)g;D{}of5ziW-ob-+j#24L9`Y|BII?4ys5b4@e}^_LanZo5
z;Oxyqq7v~0Zq(nhg)o6i8z_>>!Bg)5T4$t@0xuUk94#zGes(5WMucGRw=1ywz=P=D
zql2NuFZI-YOyz6{i3p9KnVN)n@mx%WUtKQgh~nkiirz8BD1x=6^cg9yDe`IFblwrI
zJ7UJfs|_P$Apx{@D2E>gF5;3hLH#w{a_wdC-Mk%_u}?^LGFJ%bG~~C!A@9baX$=Ky
zUc_5p{6@o6ku*#dBS94ShlJx0tzHfsJr(U+hpTtmFjY=gy@N7Scqd1Dh>3>*m-Yso
z>oITQKx>qm!pOcy5K)wO6hD3T0pD8DXhcIn8dK1d-;8QE3}fmS4PVwh2|kQy&2I=D
zQj{b6_yU__vudq*N@_)A#@zBDY2l#*d&7qHZEAiN`c}qEa`aw2@WfKs21U?_2lsKu
zK~ohwF3>4o)Xj69R9H)s;Toxrco=Qdx)lx{`Vl{q*1X}$zDiNIrit+^<5OV6w_mDz
z8(&+-J9!z6zE(}I;)bBoG0rarv><+r^m_K}s$K~%wejJ-^bxW6nw6G}uXfVjT0|>k
z#2%Jmr5n(c-s#?qa&rbTA{s?8{Wc!N<L01iF2b8@e}#vyD@ro*QAQqkNUJF1QBm%<
z?R%&|c&QAcCY1zL+q3NXM>Eyfu_hn6ZeCzkj91gb3T?UmIM_850y7G7ZeFDh(ym{A
z`K1zG6=P3wfLBmp@DV0Vn4k(S;To?&=Vpz}r7~l{jDd3r1DZw=BfD~bE?%lc;LFL$
z2{UKTRL17SIB!$y>$y}9b6Lz7Fk`@s0W${bFkl#avcLg)U=kj1czC$t`Nzh_V(QeX
zX5+hcs51XDW8gRp2yLY4p6jl=PVK>j=cM8D&p%fRgqnuZ@6GqW8v`b$0^3U)5o*qU
zSlUgv%xMXS@aXK(s?hma!rv2?K@9@vuppY}{uhs!g4U6t>b-7jepbB2^`Cu&r(gdV
zo#=URw@G<WcquOQ)K@@7yO@HbxaP(&=zsBraB*-zKKX9ne7+LvHf^IzJb$=Z9YtPo
zh1$RG-My1%5gqW}OON8J!2>Yz%6_UGI!{%A)4s5via%YA_g?22=m9E2wrh>O`wyu+
ztH}!r3=Ty~Qi4i(;vLg*0gV#d(O_{#Y9ijDmz#rB9+b2Dw1haC;$m{d+m4<4(WYe}
z?w>pwm-Oz59_=FxzAf{Tvttn~k3YB@4=!AWAo95n9x&x6xbg5qK~6df$<Cbizgg(k
zsjc#CQ(j(*%=A=zzVaPx_~QVT8Ut8{RAJvJHdIEo!T<bX-H#Y|!&PvkAvMh-F?ggk
z`1GT9RXxIODsj-HJm^W|y+_k2ci6H!K3w=PI#QX@)x}xWqksnP4j<fu7apI9AGReJ
z0{JOvDvhMLX!7hLvF*#Z@%xT@a5=r)==`LOrH|#N$K&41hckQt3R905%7c88GK<p*
zQ67YKOU#`+9-#p|_ord6eY>{erB~lnd4w@ce0(DN5{<&8B)};mitnQ_@97t@;?-v;
zs!~@+6~TNtYZ%buO89F6BDbJr7jC%W2E`-Q^Z!}P)SQqR1OH+S$e5BbBVGt+%$T7R
z2whxUke6pj`aJjCbIKE;I4{t1>Ax5q=T_A$EUAol45?gGPX~fR!jO}mh>{9Jc}^6~
zg6L_F68{)=)j)Xvx*G$iSD?<2xQ=n@Q|omx4N#KGfla6_%0(%UAZN6tJdSj-x5l$i
z%vbN4dvUb4p}aud*|waw2^8mQDKeo0CHLlo4qZ@S$Y_ekX`x@_eI>o-iL63i>^?mF
z(Cp?X%8*t(bE~M8fgs*YG7qIR@GfAYSk?KC&}X7JRhXBJEkFNE`K@oU>eZ!4tWZIZ
zyZ8nM!<|keD(O%nE2DXBDfETZ%ht&glkR$q3WO8r)F7PR5sPuOh(=XS1np58S&)CJ
zcVG}bXVc+`kdH-qG@WB(C2bpJJGO1xwr$($*tTukPRF*Lj@hwoJ9D0SXMRC_I8}A7
zy6(N#(t5pLR694ouvi(2KM1=BFV-1j51R>%Bv&3rI0<ZQbSk-KGew?~kxez?2Yb}L
z+TRZ$n-wTdwp!U5`3KbD3I0tQbXo|Bia*Wvj{Cqmls^`bm+t?5Mp62>Ri#GbdfcAB
zJz3X%FKscTlI8dQz_n6(+eU*Zz0ygX%i}(})?jis!*fHK9=-48`2G2Ij#y&5(VElk
zK{yo~i}mdXD~W@Kc0820vIX+lt@Vq~HNTw}S%Md-Oc{hnNMRIp^xnm}jNBdn`(+NL
z{b#%K_Q6F-H2ODo#<6gU;;Yry$xQ`ploOl+_5JR(#h(zn-`lR)jnpb+>i;T^Y44Uq
zCmEB}(Lxz{L5P_yTFM<4Q!;NKVZ_vXiK_LCmE$&=k2vgphp%YEC}-x5iXp5#9(r`Y
z&ZO6u0Skk3lvXL|{2M6xyY@G(*wyi@qo{^q(6uusDYaW*w0Em^Lo9>mi~O&_ClKEw
zn92mb6#pW80uyc9)f(XQ<q5H(s99s@;<)gD5k~W&v^nBXM@<PFViqw(1yNyL3Utf*
z;lO>mgo=uKIM5Wl;Zel0gUEC&sDB~yrkzQkOl|nhA|=VJ5X=EA$OeV96kC`<<yat4
z-N>)~G)TU_SVA-uL<N&Bhu>w%79jbBn}lwPV{k{xX>@j}@hyD^?zywse(mwn5Ta4Q
z2KL=T%*~HXC+I^U`qUF6^0*S$SXDXKow(oV@Hlw(CMX5o!=x5}pHma89d!3=Fyi|8
zbK^hQqcU3MSHg{WXA;&F4AkR^QHa&>Oil<byssuvo$;UVrsvO&!V=8G$bajaxS@c*
zk<5Ky2~0FA0j9zB*48jYh$G5#$J5!400;3O#*^ucq^F3VMo+Xk)_%uSj-I)vq&K~N
zsBvDB8x#|G<B6!7U1Z$I$7anZ`CGKpi<u{47<&O0h{V9KdqWc-+1y%6Mo)0@xu!cO
zn|427-ENR}Q(SdRG}F>TwJAlLuYKD~9#$0Ju0(RP_cG%Q>9t2Woknk`iH!`;6U{~N
zB}LvvrV`jr-1n`s9k~mQt@}+vC@F!HQzf&?(Z%W8qIp6=6a?iyCod5h`6vySDA0yO
z@a2&K@D8vM53f6%_J@^*#|-o3h&UEdN*2$AyU8D4*}>R6PG;p8ZteBK`-}n33=f#h
z9$A$YYZ;{TItd-gZDE|2>rIe{o9uv&=(J)pPPEyI2r5NOW$0Iv4?DnT6C6-Qe7SRC
z3?xt6chz+(U6q`A_GwQNgi?beQwFOEKmFypIFr&+Z4QyE)=|IMDI(3j*|6LJppPgO
z8_T_$l$V>A7^~>M+l8PnzHoq0NOwlMC92+9+y0X0y(>Q=uOy4AJr(t6Gc%71+jBjs
z{jRt!e?rmsWMsh}`U-~aQOdMe-#x52&h`Y278fhZJyYOs1r|J!F*!-2u|r_+3hTp%
zFC;;Y5s@T@hk1}PCX>N!jx@Sy?Gat~G1I#L>iBfa+{28D7xln=d$lfhuBW6Qhgd0^
z6M9cdP4=^si?TP^t75H}X|~#)=mm{;gR!3Ga_1A1&yV3pN1`Zcf&xs|{ENE&Xw|ko
z5;{bhDm0NS`T?v&&TJbcJ{XWsQ5m5x9CPQBfWu-I?MZeBLioR%bU_i=7%Ud>e4l$L
zzt1~~*Vk9Ye+4zjWoY(!`-O_LxhK=FZ_(i$W-xS;CX?eXDEQfezPx8e&6Yc2zA|)$
z``qcF)H8c$6HpOF$jfO8JN;F&VI~W3BB=f%7LD(OmD*0%>mMKDF5MP}UkY%3b)UZ<
zuxJpgLJk#!{yx`kF(}6`tA1-7nQucuMM5GtjXfaj6oc}<zg$*S6LL`g`P)DqI`Cw@
zJvKL=jFVFLJ+uM>)dC$dW?`mO0G4`dt--KJtWKxxiG5f;%JzV4MyPdxaPzM=Wz$EP
zM9N&rV$ZbSqp|<r8um7U$pQR>;>2(t)5wR-7PxG_3rmizrDm|TlW(W?N}|c5Aw}~f
zSdZ617XPzm7Z-Z3o$Bu?8ncD8Pdi9&NCFAL&QO|AtFTR0D4jfCklH-Iae6|yQ7?=X
zoTu!czcQzf$HqsY^+57i2KOmXvb-;RE@Q5m&;Qs{?GC2Q4z7nV?D+w?3<RxMki31Z
z_qvqA&=wH8JWjQ}m4$)W24(A$AZqQ3zfCW}Gz&}>3LM>izjK*kji*E^MhnJ7v>fqM
zAq)obSn$<H2jXzKiq?g*RL@U^5Ml=JviZ-@IsaisIda>XwaiPv%I8u+fVk5BIg==k
zDTTimJ3TNs8~LD^oNq2t{A+|A|JEfK|8smy!RtlUgabFG=X{}R<L3j#>noB_Zs7()
z4Kzx^OpHro;0--gdm7KQst16#e({rVq8trG?fcMr`Q%M<_csDNj%KPjM>}Efg{ZTw
z7wA!lDBT$H)5SN^q-2*hE)|0#I34OaBR1`sh&nJ(+3N3%hsChWzwp%CvWUy&3DNBv
zl8%g2@elTwQ!21c#$)-GxWO}}N)exTbQlpgh97>Xo5<{DGptl}q14R(DV|U<s}#<E
zE&8Y}6B9F(JI0q%@0HrB!P}g-?^i4pJl(y70`$}f`N}o7?6V#~y<Bf(>*}tns?ST$
zicY}xoEZE*f&Th_U%lsF_(AA}U4j_g&V79TVtc7)82@xwR?`>=91JIZrR&b}{dnF3
zq>zL9`udn8m~ycGH(>`Zjs#={bNx(xGCS^zwwxsH5dR_vKNf9Qp3#5g_3J##9?Jgj
zT<X7+%x4cKVyEWKKaE=5O6GKPn(IhV@mOp#^aPCzMuWeYoJ`=XTZ^&yt6>NPwI0L9
zE~`UBAPD@ggu@Xn9+XQTEhy!t-}f3uf-p&o#3+-}GD=s%flts(kUOj=Ql?;&7N#``
zVII%dn^A8p_Ja(j;h~^lgo&dvWNEh)K76@nWQgtV_n7xW7cr_*e$46U_;LfuFS4eR
zI;Ip0Ye^0P8Ld5kFk%<6oxBZvUQp;S+>vZ56UvS5uT*ZgG^{H$IRigM46uWz#g#e+
zGNjqCu=09t&0sIR3kP6QJ94^{SOT@pdO>&?p9Vr9t^T2Zybv&YFwj~DNO{(q)zRDy
zEQqNdTNl4xa@TE~McOWV+Z#^yI3r>rhq2yoqxMym#kc|EsnxIUd_ivIW!ZA`sO8{2
z`E4)=RCX1U%?=)6JTw)$2NF{wC}$(!`0K^`VYsOqog0+NW(KvT@yA=ToX~)*LP0?V
zX}4++g_wLjK?smsXiX+5(+?R&Mt+LJcuh+URGGnG4Z>kf*l-5XnF0S1^-O^F^REV6
zaYL-)<(-%}WrdY?IXlm_OddBhzLzWH`D(qOx?B0~*ya*0bI`zVrxp-VOs_KXmW=lK
zItzczeQ5=xd3O!*>^XxzC)U<Dc^`*iGTb&aUp?<`w?Wwsa}{#g(c))&2yUw1fQ$+U
zBFdHcGOdwKiY<TDq49e=BeBQe#1ehcD;~`~B*+i>{5WIIJ+ye>px!j*rQ{|&IPWz?
zCUlQuKxf>2pWNESeeDbd;Ir&k7!D3YX?`C&mBtf+-|~OnibOco&M7xa%p3i9Yrex+
z`5+?;tuWoiX<T^{vHRXJe^#<633X74sXI)hxy@Y>J<2h~Qkt8VsQ7*J@OGS<;S+Wa
zY<K=DO&xuc1N1tCEliO)W4ILhV(j@55qyh8h%Wkoj?}_pG8oMImCyD6xHeTZCxN@@
zD9;#}e#<W*$Tov6{w>`L6`m~O;@PMg7E_m->5)S?Ctt2hkG;DBT^+5UE(M_gqVcQv
z13X(!nQU%kCPLC?)Z&F9_oNluWyLLyY#%6E6R1<BB{U+#6|E|WEg2j~GOOeF3jLzc
z1Fi#)eQ$A3pYs9D1a7^XLg7`Nv)xDVr&<tpl^TcxTV$NX)`eQpc3LpFwijuZzZ-`I
z-#2ePH;<JRHA<NKucXvewVd#IZc>iw2km{9KEIzs;eJsH70VuDp4TJM)6ZH{o#A^5
zl!J34OG_zIP0~9?Sd$cos;bJ((2}4sywVyh6ij$=&oI(^jbk*XrDX1rijok1+%X!X
zzxnd$q@rE%a~)mv+ZdLK;Ct4k?Xcuox95W@chM)^HpJrMB9rwBt(mUkqJnwOJQVTD
zRgyg7Zk-2Rt^zgb3dw)X2UN(bN-iBCIK4nL8ui_VG5kMf6<=s(jOCtAu$ak&EhCnI
z-H+^S4p4J_b68(I2}LJw_uJk{hQk44YLt;uhnQ`Ym+{Pu<Pe2Gc|TJLSz|I~g-E^g
zo!A1=ze|G%e!i|scXjeV%CRSmzV!Y|`7&zl$k5r@$Aa>|NB3X95&8}?KZ#$xBN%<R
ziVBHyM#;E{^h4oGHHt{c0~-YW1%}B+_a+-&ic~fjpSH9aM9(YlM$kbR2+B|)Z7m}8
zM6^1X;9GCDA(*yp&9zf-b@?23awJ^qQMSb@I)Unoif&);izpKRA{Yg(Ji=Q-)=F{?
z1Pca>4TRwGc$+`fh?Ar%n2B{bI5<j71k#=Ebn(<;JHmv)<44H5B-5aK@lI4XF)<nP
zcKZ_jP=Jg4QUIvY0bwuSFDvjC2_gCqT%5JZ6{ys=h3|eq%VSv&bT12dI^br#7=v`U
za1(khd62ROIf$Gfu*9s@?~R?gF+WTvV(+OyC^uVr>GQgoiExk^SV>8#MfmPT(P(gb
zT5kHIGgqF+$QhIc{M!U`&bk<~G!odTl5tZmJBv&vt-yY#7ja!G{Ntstd|q3<E@&R&
zrIJDb0@~C$4x^rIh$mYg(Qp~%%S*3d8>;DDv;gZ1<MBMa71m|fftznLstrvk=VX0p
zaP8O4y1OJ5B6}HEmh@`sw%%}(-WZLz$$h(06u6QwAoK8J=DY(nS8~QVq%5aW%J;-$
zjRV1{lS)|L4`J|q%NO?8rzplf>ZiE_c!5Y&lT1GI4^F|~d5)p_A_=ZjriEjHh|7tj
z!_%oLUU-GGa@%cffrEg<DM5$qmx_zf**06(X|J03a?n!c{sQ7QF79gfhU54P2%Rb#
zP*1|XE8^pdMP)cl&kal#vy{4~3buJ^-58r8^TyjOBDLu+qD-xP#~J#&la|g8!eimW
z?^T;$BaxEMI}@WpT7RsMfH(mCD1d7RwE1B+)IaisPEu??3-lfvX({`B&7Qj-e3KOq
z4lYFLN9ZoUyqgfEuki4Vn*v5lwA0ZaN7QfpwLXINJ3(?z$^`t>Q><)X^?n9MOuuuD
zMU1W4Lu+*}?B31E229LR5n}x2gfth27cmzX*g029`g1$VGK<jhQ7S9tCU=8@dEJy%
zO)3O2W5MDI)lstgM17-sPI0qpY@3QjYyZ@70hf8_r!+bp)L?bYmd2O=8sf6Qkhsw;
zHq(9-9jE_gF*(c_3O-v)TmD-{gTbIzg$OrhQmSs9;_Upm?wZeB31#RwR7R_<^nA>z
zl>G{-i0u51ZhG2~T$^9f6q&HINvJO~KS$MU*Uvx=3L@Sx+}<*|U5maUCQf0M3&Onw
zVS=)Ryl)+@AqgM+UbJTn+Rn6<y%7Bxj=$W9n;?O>SA%ITN88(9a2heGCo~vurG|&F
z^4cq+zlx<)Mx2hQ$RDTjySQ(=Sw~rYydTh(PJ8v{B&G|$@Kob!l!g@w0K(V~xM`~v
z{L$C5Ufp|_`nexUm-d{?cXey5*bNL4QdsBWJm~M;!sNczZ;pgCMg_@NClCE=qFR;0
zPi4J1zX{CAG#oXOe-QcaM+DOnh-*`+8kOD(Ssn|zz;*oX0blXohQ?x)^A?ua7xD5p
z`-(aYAi25%X0CCsDqU5PtZ)ERLhswdcein3zke_*VfYzAWBsz(0(BdHoH;z_eX~AY
z>ae?>lb+bm@Thot8q}<ced%-sf)Gao)PPQ@4hI3(gYFE7$(vEIp`^utF{=P9TgZ_F
z8a;8|zCE|EIUk6ZGGayIit=XlBQPg4M?y^K=?bH*n81m5G}3)KZFVEWNJA+LEB_1~
zXtLtWP8ZC7<z@MHF`v)1s*zg0W2)I%b`)*8aC*O!)N{je7;s=(kL?6H7E9Fow}xf^
zF*?#tp^N`*M!kM}_2Z3Xz48-vo2DemiL9q1Vws!}L3z31k63)|gP3mMl=x2mI)7z0
z<VR0vTT(b@I&Q@WrzMxo*r|S|xGn@*@tEardZRAe;Rai*HD~3vHIN{G5_3blQ`vvI
zC;lU#rg_j630_WoT|iR@yk#^P<P8oqA%BaMof2r6kB-Un3Eli34_KmZ6TX#Q++~rC
zgbj#+{|!>#<AbHN1lLz|y(ZGKaDqFhQy-2wS>1?RS>~snlJ~B^X7b(3fzN~t>|Z5h
z8QDt-Nj9U~J)g(Z+ndD>b@#xhk{npSZJ*8Hv@e6o1cWvkQRudMHbh!I%N=tmE%;Kw
zW^?-2QF;xgpH`jrfDshQ&$`F@?8WMST&6-lMaZB6IS9`5)XQ+;a7DBr@rI0*V~)FQ
zoE|zP210j`!AVg_Ggq4-=V*uIEm_)4vU|;#t@~E|h=M>A`(9v@E=a{*_vbf`3;@VF
zHlt^ursmO;Gu58&@^U{KXRCAfm=h_Dsc@|D=0+c!*A-<^^9+E)Xox-C-z%T!6!E_H
zgCH2*?hc&$>ha`Hu`&NI-!h{Hd&(sW+S}=J76jOoQ8R=nZ}U(J(&j;poaW@E&n$ao
zOqu;}ItRqZE)z}lG5FKQ`9niPses;6Qcz=XxsbQI+%+r~ocplM|8LNp7Z8ht+#)gG
zPbQaBh7P&cnaOf;a$0K2Db607zia>C*@k3jE}1j^q&0#lQ|Q8rb6c@#LV3upvNUB&
z4ZC3f85I#j0k9c7U7nx?L616G?RNro2t05_ARd(pU2tf=X*^MR{64U7CI;;`;&_F;
zP7vc@rgMnqhTtVEK+Z1YbeP)fh*%77Z&jHc9Gpg$NyZM$-8po9-dr7Eq6MkI?y1CM
ziz_1^y)Z(9any~bR<PR77xKV|qP}ir1@mXWU#BssJ6YgFpu9C-r&<9;ox^|Jh*1hV
z-gtm5_;yr^+V?mX@y{?q@{K1Xy*xbTwDW$%IOHVpaMd?G_!Dsu?(O>`f-yB*o@*Sm
z`lscHb9GsHk8hW1-m_b)1wgE{ztPb!v(aidv_a5k3^0MR1ko~kC)IIgwwry{c%(yz
z^pTl9$gb#nPE-=x|4pauJ&dyDZDWgBh8}hGj^N0HYY=oO;ZQb)Js9NQ)|VvSc@5j3
z*aud^FDVX`euhhANqA1_ls347jp*NcnJxm}dpaCIuW(xJ>;74eXI15?4J5WSa)VA2
z5Xc_LNytPU>q^X{6dxYN9eCt|xf{RiO8p3XzhXE!saba)N;13I)BM-s@pG|*By0{B
zNp+Zsaz7D`;bFgAjyZP%JZT-JWLoC;TTigmte15-0DsDu70@_<WQ!QUrJ$gA@Y5g}
z_TezuWo0BZk+C2zOuX*B04$v-JF$u&>EU5&`@X%NbZ~hyJ*CS7*HpmJl1@OaLsHS6
zj0B5H7ND*++(W{pkZx3^;Cs%kbouKA-Vr+R-TVqGq-7K@%9|aHg?Y8Z-geX3ek2s8
zo91ieGPD(3v(BqWR7>8MGAMVZg3!m<?q>yiC#(&%)J7~RRQh<4JHkdOU@Lw?SrN}d
zu*(SOm<#-Yp`)YJE}@eH6<P{dYy%ktwBwA5$*XpZ+dG>>^nse1kO(joPC$qp2)|NX
z4iTeVk<=s&A2CO%q{pJz4DPBk_4yxg7U*KTg38>rH8&1=Jr#=aa;Z02KFM(bb*fn-
z-e8PS`9wULzq1nPc!(AW&J&k^UA}SbZLV-7VZav<UD%GN+flN=*MeWt=|keXP-YLP
z#w@A!tQ0GQRG^alu~F%U!U4Fuud079+&{^J(qT%y%3iMMSt}_=P-B8kEKCr?5(K^>
zu{a#mBIhF`Ba<2bk>;bL8G1F1BmiSIj+(kT&%kk6In6duzRv$=0l3VIVeGA2*Np(2
zsn7uRyBVHjH)2$2!SmHdHb(U^@gr^cVsd(LQ}$k<;_pNhpguLnWCLa8kiWDj&H+Zt
zq-oZWpY)!VNOVW42cs8tRZrjL9|7|0*|nNrz?XDLwv#j415x_+0r(nW#JSl|3%E3@
zjv)U$8dE(Q&zf2r#Jtj&l*q`@2h;d;bJ9}KkBBy5A~s&&QlVf{feU3brZao6S2oAF
z*tql?4@oIi3W2ok8TzN7?i%jucS*MyYvC<ZmRDBb!N^8Yb*%0aD2bqHVk|#Tg6An|
z>5Gv|A*DD#i4H^l5n6YJK|^OmlRFXBARQj#im_v)(9#ooyIuD$&i0f9fq{c7dooH%
zD7oi~>uHfGfp8EJZ4SfCHTDG{tpJmObvTp=7ZcR*`}V%`J=FpC<Dl5#1j5j_2dMjL
z&uc4Cesa}bUB$c-^ZqU&@r+=MX^2dBd2nKGAc~8N4*G1LA-}hV3uUahr2KeX=}8oc
zSG-#mb79jRaa#J*E}e+c+6UQ#wrH$eC*NPT<=9+cDkl~!tv$#PWa5FyBgo7gcU;JZ
zCI6e#8*>gPn$?S-`)Nf-ZSalMikSrt`uA>spg9AJvov6VBEeVyCM{NJI<v{8$><M6
zOhS@s_A$%<0lVM&-u)o#p>3<tMtx?HHGz-eE7_9-R}9Xe;9fFkJ)Xf6PS`IIG6pB4
z^wo2xS4V=+57hoVlgN2HDea{LRRnC*2(7JeR(<n<fL}HX3a#q2rIbgMrRnFgzHJw$
zngcwl?+?doVJKK#_vso1JId`#EG)9<h`;^)2<q#E5F#uP>3#yN9Y0a}gbA05R!Z5@
zd}0Ef=lL$R;tw7M-`x%cBLJ?vpp2}lO5=4he<Ga44t?)NZi@;bqy5d*YZi-JiaXdo
zNyD7-E-fo<a^KQ#s%tbII5f^c9omykRADo0v#mw|pMrk8*S}4mR)Xxcp)NQQkOXWp
zT}4S(@UjVte~1%>AXg@jT|LskyypG-XSN8pa4#eDj%VJKssg~Sb{g-)KR{Lpv51b2
zmUYnuTAigmoab>7)}{5^zUAY8f22w6&Q>A2GntFz7C`GmQio%>UQy+@C=P;}t`vF~
zhd&d^4<KAyJU`r+N~`dHyIyT12}8gNvD@k_f;-7eNFaQDe_db<S%1dKL%}jwnES!5
z)502EgKDO@5;wB4GzZ9Sk<$K}(fL-sW(4?HQv)|#$2t;w%5bxn9I(VI*JmW;Xo1og
zZ6k7!ZQ^=AYy}d07YJJ?DifyMDu+D)xp+qtztYro7e&zqjdkjY$6yw2TY8=QR3vxA
z0B((3%!C%z(L_kKNTkq8m2ztRL=SEZfLZRl1p>cu=ksD^yGiq+&*q&O8Qq5soa~pO
zu>ot2K<Fruf1vj_Qt=o-nqUphFqe+mc1fowXWx1zMvvM}IXb<n9|-Vjj94si1F}B#
zg{fRjpv_<L1`ZdwFBP;R!CwtG{X}N53a_Gg+^&Ow#<j=w^qDHPlbOzfaC6CqC>Bn7
z$6eE05VHn%`}=Nd*NIA?19W#VafM*JM9m*#zJFUBh#gqrjP>pun>-&#UP3sM7t7zM
zlNIE_d>{f}w{X|_T>(-Lh};xd^BrPUvywY!n;pTE_s@65dln)`9BBsCC|(|(6)$h5
z^iT*Qk8m<Djg=0lVMQT&ny;V6ysRdGlc^X7WKIDN9DkdCArdzPvH1w9ic-|T^V5o-
z^D;WBUGS%qE^fHvBzjs=yh_BTc=r~FG;>4PD5r4DmV3s!JcrEp%D%gohZQNgA>V&V
z1T1!HuQVAy<kjrjCVfh>P*Z&@wwQ?oKupFA;05eO0u|3m=bi?8F?mW@w%@EUipB*Z
z$$vyqpZ1MSJP7BJZ+bsTxAnfM(t25O_!v%M-L*An%Uf<=Glo3e|4qFbUcE$=FizI$
zb)m|OG0k&u>QW&Tjj1)S%LU>9=}8@&{jHT9I&D*Lw|xh2p%4G8xpKyZ{}$pz&abur
z<$|T*%?eZIF~2VStiP`*JvU&!TrOwGxwJil;s)7pyR4)WQB{?}7Kl)vWtKOk<?@CY
z=v?#QIO(lqRV6!&G&<9bXS4SY9wTL~H&hWf{B4C?;}X6bu2yF}LB_{qb{Xs7%x<Ac
z<?Z$x+fVlg%?_7G>j*=BWUC!CI8T}3J8UXbR?O@Bbg2iSEUs79Gi=o(op^OTN9j~}
z<N$fo=?hWU@rn|bzzxiEioat2d!I1X#eCLRc3J+p?TuI0*{NO(sU`y-Vobp-3FJqi
z>9FN%1ba0W8?YX-w#kiEeU&4mB9hnI-uzttI354-HlG;?#c&C1D&}));&Qing|DOg
z5e$Wcf+x0Dz7cbc{-aP9O`ks>4r=~Q6nLJk#%DrJe2Rv<8)Sa6C1ygS)b4j`c3z+e
zj8DR#5^~0`^F>s)C6Mk0fbwdl$=uYJ(S9G&kx@Z4mTKQkqMXk2<8H0D?RRelt=L=7
zT?Jh`xE3`KA0z$irNQsA=RKzLg1ORe8~zrNSn|oPzC{bXQSS+C{WN&pSAM+MLfPI-
z*HBBLu}`tq=!wTL@JATfL*lHrrifFzOCg4}FuH-dr~*|BwytA+4P{fETk#$f&}!);
z?Tm5l@kh}XooQHau^#g^Ar7g<Ks>NqSn=|Em4P;vU;6K4^cw|p&N)&O3*8=eKUR+y
z5jy^r5zL(b=hHbt1Mz>=kpEWjIUAT23L;Ts2taqbgyw|60Od$XZm!Xr!D80=|HBag
zI*t#-q8`eJF#cap8WEexn65}54Eu6pm!Y?u&0n?*%}RvP=eRzt#|OVpE_Scw{2Czc
zn-)_~gd$I`k3{%osaqd@W-?(Ie+qw;dKEn!8yPrWX{~0eD~H2w`jkA?l+k4cUoi_G
zdEH6VCIMoHJ!mC-QUSGBS7eEYyAXeBanldjPHcslte}4iJz){`hQp&2l`f|_5(5Z0
zZHAa=kS#<k2euD&N%@ak3qiC#t&<6>G=JG<ib|`Eg!nmK7$IbK460KgM&>d@_j4gn
zrgk~7PVm&*{T?|to2|I`U)>ObKKT-I#52dMm^HaujitlyHd?m;7Tr`;Fj|s2<A=th
z^Oyf+WlQTOFdvwhJK5|t88t=roE_<R4-doG(_2RDckl}CYjHv`r%vG_q^b02HK@TB
zW!Ma=>6h;pgr5v++6BO0=p{n<p#Jdd#gF~oj$}9bM)lIDv)ULM&JsaQeaFvc$@U?+
zzg)9ZMrq+7j;{_)#z<kJbpuyHbF}yYz?(5GmdPQ*EhQBe8jQ83P~s$IWwUwpsSqXs
z8wM5<%XI2aN~e9SpO|p`V&FZ)<FiRjR9RDODyd3H1j5<NBQVsN{4n;y-zT8r(Yd*Q
zj<X{J_5R(wzrQP!6Dv%hPkz#exqv=)`@1=@l^c)t`$K?u^`MC41BjHYzh`nPaRbKJ
zq6?XP_H3uT@n(2eW`uVV$UZ;|Qr{%UDH*1hLNvlO6vEuK%1yUAA1C)TS>3s>v->a;
zStGDe(k-fUmn1BVt_E>g979gp0o;88S~+n?u^FW_U9w7s=n~q3lt1=z-$j_vD=tc3
z?d6}-thl*)9&V}QJvBrkZj+o(z^vk_rBVciy`Y)9;xmf2x_pRexZ|b&3T)5G7OV4>
z1u(Fa<p_N#pd*2av-?T(FF#C*mGNN<7k^D96;JNQL-*J14ZGr|LbB=deS*7`sFYIX
z`L|iF;_I!qjq1$u0bmOwiozyfgJsfx&WF3{*4Q=lIk5Q_-uJ?9R!y$T^LK-n^DnBG
z^iZL%Y->Ef_2Ys*aZML3lLAVVl=P)Zpq%u#fH4&9j=SR1_A}$I8g2_KTOM^`U}z+7
z3Zf~)s)pJ>lN!ZZEMa)^RPvNQSip3=C2T%OWVq6q&nHtZ8WUrt9k4Oy;@04k(sFq{
z8}G4cSd-e?Bqf23HHD6?<pgrY7pCE<P4)?Z&X$y!ARr)I*N7nMYMcFPdJua7BjV&>
zx97mSM3#gcGQ9juGkQum$)`Pib4ls-XYtwiB%LaX2G>^1#yStcIS+?9_OnEGV|biv
zvUD8#P}F(R?99?JLAI3N?Q}MyAJW+7*Mq$Ex}%FY>#BA{Re>h3S2mZHwjop)zb`D(
z)!kvaj6m_FPAEg$ih}Aa^u-(^S6zAbHR}AZ+;{dwWgj=}?4xUA+s+If26MrAH0FYg
zpxR#onDN`Kh$$9Kfzus{666C*zCNCfPvUadTD&;`&APDM54ZtxG(iI!T_mK_I8CkH
z68NA`aYcXn)xHhav$z@9whKd|8s4|XXvM5b09r7|AC*bB0ytQBS2PeCFcly$ruX%x
z{J2K$@ESqWF&f1A`My(5@!gMPEV<B&ulXzno%|K6PjC)KZ72!w4H6D&4R71s$JaYY
z<~w4*VRo_@DqI`hBH}W&w54Q1R}Nf)HOBz)(yi8N5+|cYuRcT+MTJbK(<x*B@;?%G
zbF(&)p9aJa0T0UNCg;64;4_yD#X1T&8l4Ux9PBxz&Z`~dGCFsx;Ln3dKhP*tLDgPO
zM1R<)viL8K(Vo83s>=hq-VzIX)YDOzGOaP>Dh|e|_o!@PWEq~O6vlyTZGEt-9)y~X
zb1^1l*DfRdXIEIts9|QoCF)-N@>f+2hqgrMg|6&N-w(O(V5&N(*c*SibnG<P9X<{I
zb<`BKRx$R`+rq>@G@M?oKi?WY-yq^}7xr^V<XPh`B5qY@bHUc_VTZ#WUMQ_&Jkj~8
zKkr|a*YI)j74~ms-R;7*PB5({h1DU=NTqtA@|=8(#Hbi)gmx^6`>3Kc!j|I5%c%eW
zX8CO+h&U`$h-P+nD_-gaa&l~^46e~{$iv^+rzc*y;_;SPb*Y=15(NAqTO~Vg3u{9F
z&*R<5>P}UAECX?~fgsT9Ww$Zgib8K@I&3K{`ssXEzI0ViR6*Y3nrHLyX>pSOZ|cws
zDU<M!uz`VXc_=Cgf`7pp`s*qT-a4{*>}VQEaTi+`#IGKhQQ*q)qt5blc(ab?h5?-8
zgn0I5A_Myz^O-->U^F@qs%T{k*y%vbE4dz;$*I^f+}nzbwszVl!kl~((Jcl4ff%%4
zsi~-hXwjHMEH@fVB-H+na`ItJ+R+DNft)~tKXPIV`0@6BJ?m8Kb*V#zMwl(UzIy!4
zVw1Vz3F#|2S$8hI^tb0St!WBidoc#jKqu-&CxVf|UK8SnyJWr3Dh(y%*7u;&*LEPd
z&T4`LG`t4j@3BaGsHs=W)&4ysP$ANs%1M96gRK4n<x-_a=uYGHNC<vQtJzTUbl~V=
z*$HZR<fkB9Qtc_dYd4jD5?;g$uEmbj3GWLv%l{0T!P_ue#n;XxzY$!)r|{~3a&8)W
zP~b26#wo|bMGqXTMm0T5qY3MTG;Y3G(xU2>%X~tuZ7&IrDte>$3oOK37Jw%B#*7tI
zpeVs*^N^N;x_bmii7B1sjVUGYi2++2>)+VII-`<$eU4UJ>;9^jF6Zm{jC$b)qNz<b
zMwKbJo*VK|ztI$WyFA7T^G@fDYfvE&hD7^xcDqu7z-3!TlbmQ0qD)OZ=3~tL5e$c+
z7wt+jvT?Uw7$bW%U8b1)6;^U`aTc}ocT@X)AU9kE%17Y*-DvWl5ud@St*l@eB)(e^
zZ19`1!Kt`>K$z6*kmfsC(>6^c`gIMY-DE*i>YdZ#A2YH<9Inz4YEEmtb7*`t+XB}8
zg&4xn*wba4!ZhQ{Ey9?0pKZY74$0keL=>c$i%pP{`LUjwx}?#EuyzbA$;~7@RwUD_
z*@HsM5dtK<+N5&mp}m+y(`T7H`9oZ`0V1#-olyCqX3sSR^aJbF6-Bq1b*jG48PnRL
zA#fXlRXjPgu~4922AeH0KM|b60h>mDAUHa*aq-<i6NBKD)n?G#`V@9}+;Ae%B$IUK
zqesOB$^BJ3(=f(+ZttHs7aw7{?#kHt;kE+<D1aS^Xvg*3_W=Mu53Rw`wM|M?*q7_o
zaGH@+au&zzeR~vn+951OmxqLTR)ns|)EfOgk|`Y$I!1-WUhN*tD*rHm$PBXXauuwR
z=kd#(za25xqrTO9mS62RRokTi@c2P9Z(96GzP^JlJTo|T1#5O@%HLuR?5TpbnJ8uv
z$r_{GPA8hqTuZ=v_m<VV{RcJS(`s!+3Jd+#>6aar9~nOu9}tM>{Ie!lXu-4L-GUjl
z4d#c2oFzH3@_oucEHw2g9t6cd+<z)s>IGTCMt{|>iib}P^r658FRSkQD%;p3uN{1{
zuu+Oc>AHKQRBiw<>kkApl@88~$q^|leaV=3F-1wts>Xx6{w;S_Nf7}^f5xzfpmiw~
zL4`PTo|Z?zX8fOKuNR(n=xfDSa-O|wxARr)8KTlUQkF;x#LHq=poa**%PAte?K-Hx
z|IZI6oKtN}RtGQO3mH)K96bOvtxfb4KQ=?c#bh>x3<?gOewgVi&YW)f53LyJPX*2j
z*WrG%4ZaPLoSe*LF;~#H8THwRT61jmCBanSi9}CNFTHmdhGVDL7;4<il$|FmD)lk|
zL7?h=^+Or;{bofIT8FNB30pANMU+B+wSqeSNjZ8aW_dbS*ePPefuN9A^V|5gh2tRa
z%)P+BZ=2Q7d|xE<@F1j%R=1uQ+kT_luR~hj6dNr+H2?B+Pr-1QEf}pX=G~#?NQuD1
zQizOiPwyUtp1`X{nXtMroKVIuS!IcLk?XK*r<J6w0vBKY@DF9L%;MAh8GG-At6)rw
zZzmaq`~Y2Is*@;~wb4PyzUCfAxXBz@&l1m`ZM21mFM2##&rzgdLrXD)_$F^Abjae~
z={}V9l8WQxWUTWJUe`<E`DkH1@ikcWc$1gogFbc<vVMX?AzW=Yrcbi7jz4y0@;y{v
zb!{%Kh3squ03t=;kv$nK|2=?fQb{e>A&CVhgWSfnRHlL;H`3gFiGc_(HSaJQEnH<d
zuA;hJEJOlyq=x3!Dh&4hG=#9uCj#@F|HNlqq2t4!ua$RbExI)Yqfk+IgWE|w+X1_y
zN|)W~^!-=~?N)xxrTt2|lWR<=-k(VVgvIf6iX`PT#^N$q_8FxZ#F`XovA_g|H-kFk
zr(~8NemGdnFD2rLbUdKU)lde?#?XDUvFYjQ?pd`ArvLIs&akIX=9g;?(&%C_zoU$(
z?;2Yj_Jofr1aSjT9nABRxylCnC(<B$TyAS;1rPPRe&_uP4Fdv_(cS!k4uB5PT|<jC
z#AR?+<CxdXJaYoxa0qQ|a#Zw!s62YyohGY)%mBmX`&5+mWO3<6C0HahMV#$aIPE_H
zHLLp3evhL&`h_N`l~n+99&Z1sQ#=y+7!~m9j))y0p?Qk{t;QTJVxJQ-@?cI?{CclH
zW|^~6nJ30C?7{*XQU{GKq}TiC`DCM$7k)adn#x{EiFj&Vo&qr@-+@ysp&R{dt1}er
zlpY6P)>)-l;Fo+BQ;YRftH3e=kfnIPff*l8A2=?%k}$r^YhLbj#pkuP9gN+q7)`Z?
zg%K2Kw}_i*G2w}m!4Q>6&jrcjwc2h)KG%rcUFKM}M>1pTz3KFiuEP^u1#W#r8JQoA
zbEM!nIs{2b5y_E(?&l(`7Wif`NK*w<+!L7tD?=pK*^<UOkxPA*A3)-p?WjtH6EJhY
zjBg_1<JYEWr_<|I!9q)O^7((FK`vgsYLxg+vObwoqLVgb3<d=JDt-IDY??Jb98Wx*
zFAnz{;3gxV_4_rC&OlEqxHA>D7X{>NSP1`iaYXVEE<1DCtmYz>m6a2+<Nq%L@1sbK
z&;S9$^bob;=BSjc-t|tXi&5ck9yj_HK#^nC!`-9@$Kb`R1a*jkvtmwrT3OG(q*xI+
z1qwWFQ{Q-aoc5LnS;EU~S!U*Bvihst^03T6kd`PP>vXvyYFh!e@D{s4UKN3QO8OLR
zHY}~h_bEs3#(F4UdBqr-5^vhRV$Ln*$oa6htD9R5%6WApDGEpbL)ntee8l_4cr<71
zoIl$S3>4fkv2`y<aDXI8mKb=1Tuf1AvC^HQGvc_1w!n^`$ir>A3)5u_^H58)5Djcl
zRIn)s-4nJ#NZQHRmbu7`e*MX<wYAzG4!Uvi_WOQysSniad-({H$BPtTSir!g*%u}g
z)S^yp^GbmEh-}V?_a|iAg}Xs%*}?uHl>hU`;w%d~4}4ygAs~`TQR;UJ)(k#)bAO>G
zHIh9ckm)ZorC+kVh*4-GMnkYdN_;!{Jvq}<nM}7gV*%v9c;>Pu0GXd9qGC-&)aWQ;
z-afl6?s1~XzYixHm^@GHB}R}YV5nM?%7=$eCZe3;2oBh?pEe$een@kBPcH{Iu791}
zH8`HMs^2XuD49UrRgf2@s#TEHbz^e??ZE2>>EO7#JH`bbsoSR8iIDs-iz+#d6o?1s
z2ZyV19S5T}_{rcnp$tS8Xs#H_udoYWPfI2~yWxXq_iYYOUB{4OTewt8xcEM?#{~?*
z_~E!QW2W~ipi|6b>Akb}!9?W<tHX@bm@I5L63mgxqM{sJaZvVTc4UUJf3YcFq3n$$
zSQ?66_4u}=Xk2iNU<}2EUv}coB`<mRrVBaBK7J%nLbDWP4o|o2ymmP;yD2tO`6cD0
z1=Wp4zHD1+O2(8J7Hm*G`bmm~FU9tEqm8R~&l364(k+IT7m{Tm7&ek)T8Vav%}WAj
z)7`)%e3or0f$E@<7CU%T7GI|;KYUT_S3HBM&8?KXR&@%(CKQcVY@FO34t{q5HL-9_
zmEu;LNS`}Xvz7kgt$cUuCe99DY=Fw9!OmbTVS<ZK;{4B>7)AN@q)J67*%=6QXX1r(
z<H8iLx{yradUm^fMb_XHI{URx$!aR#1m^vs!#DjoxkI-*gh8`j5KY~J6lY&^H%-S*
z>1F-9Fz+wMf8+#<7$7VOW_eK|MGvte!HlG&qS187n>x(~VW>Np9#SK-%Ut_rCFkRp
zQ4g;9rtI{>+nR2QKZ0x}g_A}{h{NTeUbr(yeC_m|v_ZoRi4wDZ2>Z8zz8-I1uBUSi
zD9lO5iK!Z*x#ZNnDjn36q^R(2t*W0?BqDuT-uygX6lFl9UN>@OPDKHbY|VBX_~9Aw
zh(ZV&3N$wj6uB3&*4sZ#?s&Uus5-9-k~cjRC5VKN)C<F5LBx=nh%m(H{qV%p=&GpR
zLYGlsFtghYyg2G9+dNVMf|9~s3cFwC$1~G%WTJ|<S8qvMJzXlZmoqtBYWFztF>p0l
zMJ0qs?Vez}+hYbJQ3&fsP_Ym^?&lG7tbZA5))c^!WNju~#eIZ}qLMVFg9#$-j)a2W
zKpqci;d4aS2<!d(P(J=;hQ-m$`yZM;hWNxz*UQiD3}QIGz>R{T*p&caM<Ju+^8tz}
zD54!fNX`>5$&w)eFw@?%PFW@MbRk_2plGaN!Unjg+j-FBAl_PvxCuXb!a0~f@Y^B7
zL~4<!Rz>orxqw7$ZUDkgRxE<QRxEw4a=q2GS1LX$v8>EaY{)R_QNQu@!bpNY52tsc
zJ4*0oPgi1QF&|1J$EmdbX4KJ?<5Nty!+8Kcb%*+ULg8w6Yg~`Q@ZgL7$ec4hnD7CX
zB{O7po1KQGiskF|5r$+IeafLM*(4^>dMIl>&kn?qkIj_&(^e!)C?WQ?7`TVBU;~u1
zzAu7E%9y>J_xgq>CjH~4!>`;poDebr-(Y<Zh(!-X)br-@`Caj~3D$jA39qWE`OukC
z;K~G2XtvZ(dS>@hlA*vr(uZ(C;q2Cm%_b;oDt~XwfpSdW_g?_;nMCg`J0q)xs1FY>
zuL*P6)(dRX6?lzTiTm|>@#uN{jX?P4>aW;IZZ}aeCGuDZ_x<+mo_fm><ioR7VX`JR
zun~5@%n2I0l!dGQXPoz$oU2)Qufh+S3DL|7F2n8glsu5TZ5n5Xnb(WCN^6eGoqFg{
zROzY}wKFb}ln~hvS*ot68~O9+s}gq-R6Vbe<yAua6R++m$h6*VR$^LuiY(hJ3vp-C
z8mZqi&p0jIA~A`*srJ^JhuOCq@difU8Z=z)C5A0m8%eGryyega9Q;H=^VU|VS`wC#
za}}Pqlz$8F41w+P{Mhlm6NJSh*Yx$OteLOeDpnzPxm_+|8_HY9bbj;zfA#wfMlx03
z`WCbqde>nkC73?9&ot*drtV}6J-!!^Hu^o%ShUX<izt2c`jhky`30}@hksNsDHSLA
z(gX0^&(rxs#6_#3zh>wkcdu^)SQL~zX-LT(Yh8-{U#+~fw@|ByXJn`!e8tFI`tzfE
zMQ>2T<~$H3Ez@J3a5(-14I9P$3FlaEE^I^CZ;P=GMoHb^#gY<x&NNo7-dO>;J=9$f
z`_d8$KHb3g0mq0dy44Br5Xc&UyhwNc#^v{Ek8*18`|?7A^SoMbp&oqg4+KF2_#W2}
zEX2E)*<nC_PB0li@&Wvn?&o!DOb)vo<&u=IgmEL$fA;{)xw7@d4_8(7wGL)IqoL7m
z#c;sfQJ4Um{WkBicn1Z%5SXZteu_u-VRA*v%D`YiC{Qp^(+>C3lFEF!0s*alH)f$x
zq2%tj?`RB`RUi4i%S9J6<_E>hM}s#4-U301)gB)Ea38XMkj35`7-*7)P%msOM5;WI
z=L&ep6R}MQE;zg)BY(U22nmCX#3A5;9$1;K6nrVPnEC`RN}(~_CU^>lFi}O%&yZEK
znmesV3}i+9TP(7HJULQaY2RbBce2*S5Dy;WPY0ZPn+00btye!W`Vw6Lv^Dcc9FxZx
z7G_O!-cgMM?D~(i4B?8$MR|6rD)(wM?oBL<pxI-D`dlZCB*Qo1X>?>d*U88#o&yAQ
z4DIkCO|iDeoTFIa`;Nx0%cf}ZOgkl(m?v1xBODtW+k{|;@TopP{ny}0?QaRvt-KgL
zNT~S1n;qXE=T`=Y>orFg-HmYG8~MY5ma;e_%G}SSvEKo{6~DW3@Lubg!@NGVsPW|M
zG#VisIrWNv&g@|9*ZLF~zVMm-MQqW&3j)Fw7~kQrr9lR#Zy%BIP-@I4vz8xfEG>DP
zs=;BDq^gIA3<XW;?(<*_u2yvH)s)<#FzK9MuD4D{B&A0KXNXWO$yxxvW&sc^W}dRB
zDCmEO8abZFnGw;kDo(Ca^vx+g?)RHT+1P@+h1=Y~)**#D#Fi2y^}&ykJjJ7_YO0kj
z8A(L0eIcFpZuKog8>=v5WIzJ8(}6sAFzL*%@@OEGpe#l+_qj35moWa=)&y|766M{%
zM=n0q+dAhMm{=M!y~Lp4-~%$*0-s06S?+wX@VNNCM<$@7WJG+v*+od9y^;~}1J6sW
zykG0y?f3ihgjm`zqyl8aDfx-w4OCc|ofYcB;RFj9ENM;~ciMj53-xur;q>SJOP(eP
z`R+6%MCH!8y5VI0w4)L*$A%zgTfhwsOlv|XWwgWM5*mdIk=s&GeRF4_OoXU<5fLfh
zuuZQpc#4XC83wYMer(+)nQmkB=h7Yn>D-Oj57b?*ui=b_+wlMfDF&c43BBHCUw28j
zAn7lyddy@(uSmyo7N^RRy%NT++_FBI8ZXRGkL0BbIPFQG4B_YJmtLcl!uS7l48>&<
z=30p09Mt1Gj!I|T+prK^`w3ZOI#{uWU-wh`MMY0Nd_U4>cz!h0U}Fv>{MnN@EhPzn
zS28%sh~A|aZtwiSQp^X`rz$HZ;q`XPjo_O=DzfxU@(`QcpdgBdqBL;Vd6qdZ3wU{X
z4RQ#k^<XDNZl{Y|1G`cjWU0a#ENdZTM1b3>h9Ffasmvcq>xfV-J>1>>?y{9;p*9<W
zP>81l4PW&;mJNkJ0m&QRpu|ztxuVrTC;FE`|8{0gZM&92tLuCA#g!!Ou)H~kQ5b?0
zEJ~ym12LlFBBYQ0d~6YFS4oy(J5_j+b{w!o=5YScq~R9C92U=&XgEI6z=IVT*r&Pt
z_OI-URuhqiIOLhvU$Q#N-;qMalrUE^I}tb(abuqd==;+r_#z)67EfO?+=0?|_h6j+
z&r0kEH^)cOzYGYL{ZlI@f+=e1S_Vs`$Pf0dS*V#Nd5$w(?YO`}>%tPB?xz_31o28m
zygF5ja(ypr7_<~2wBq)t%fo;`gZxGz5hn+9j1eZMrmmDAN9Kja#Yg*=7JY{<dMF2P
z%9BdL!&!6UL3KBqflK}T5{gatv`_Z_U@iRKQt6PL-#;JK<xt8Ib=ok<D^>Pr=VENn
z9)DQH|A)OJxj{Tgk^;0>k91-*xYh)(or)=i&U;UZ{^d@Tx;$3AMin7${6>jZ_zNj{
zAhrn;*l<;w_VXtG)Z+*fCv*^;a#$^yy>Z?#>U&--%a!*~(SoFwM93(yW&KigeLR&3
z^2Lsj&Z1bsip*jZA-IZ~dJE>YVasdS<@Xcx{2W~dc!3=%W#;3%<<MA2Noxx}rB`s?
zJ!p)eMD4V@u99*91wlIu$IeH{rufAxDE37MwL<pW8`$mbz4~Zy&04DyHV<U*AkwEV
zuVqEKrQ+B}OP#F=F`hA3y1p+93G|!MW=SQrmdypIM@O=fC<H;~qokU?mf5VnEQ#RT
z>h5r>hoS@8Oiva?tl)S5$O-%yhKAfwano<Yq*1B`1{Ojzc5eMsPLSW9UqQk)E<SQz
z$z|7CryhNRbhIq9qDnh5n<ju;J9NlC>V0GOULF#Ec<n6Rz)varJ1PoVoM1C7lf_&Z
zbR9Tp6c`2s9Xx9^0Lep=wb;J*P2AHOLwr394o8)g@U6_)*qG615cEkd^QP`h`RA?N
zuF(dRf|xM{9AjXeQt#Cm*tld784?Pm1!93S<}_QDLXb2c)x!&hhZ9cVyAiV-cSkJM
zUWcBNWi`wbpI^x1G?N1f&!5At$3AW{U6>bRZk&$91OW}_aozNoZlDRskrGuZ9Ee{Z
zUsI$QI)orTRp6_9zQUF|za}~|@Y~_ZQDy#3d)``4Y+JuYpN;h{+ntEGmX2R$XOPlo
zbvG2uV336u{0gg-lfs&zv0{@bEC?8`WqC{haZi=m$$2}Tjdh0WVQ|93aRvkurlO{w
zA}-Oi28a0`ShjQ5m-pkjjhg#lW~t`C<Ef))5^x0Ox6&Kq6!ME=nm6VTny3aZYi_#^
ze|masH(dHlCtTot6~tq0ph-c(FIi%N)1x2y!M~Tl!y$7IEDu@Vo)94>*Pj9n?uyWU
zg@G#2B>I)7=DK|_GLjT?1qy<^6x1MeSR&Yx$H&JD9(KuI#|Iewe4dy+ztoM$Vhv_G
z0k#d&UQE*XtCX*9&#}YmH+d29_#p)YFvHz5a}$=xQa9F+l<|qKN<rc{eD((eL9vhH
z*9`-p+SR?77!=8Y#dlZh2783t%})e}BQX*+uUIKpPfdgcFi!+;cuurz^{>D`WBFnB
zX?B99y1<`&dP)iT5=W&yZqQ;mNQc)`mi2IUF+sR!cu)#nt=fG;2e$`x{)4vztoWoA
z{Fo^daJ4(kzwf_dvN^#R76TNEjNHsjd6;sj>6d-zv1khIg@Zww(-rr(bGMnEYxRO{
z&>!xD6y}&F(Z=!_QS~}qC6MqCAT4*L%?JYX{S1O==(*DK*tte8|MWn~E@jRB*#KQY
z%H*h`Y_>Yuk7K4*;`&(73gj!KE=vT#OP$}9>5spWQBHDmA`})4%yJj~YQ`%u<SQy>
z$c;&#_{nq_!i$iz3YVn7KI7)ZM<FBXg?0n53&kiRUptJ!zztkTes8;h;CFseKLLOS
zR#;$}3-*28d=AA9e;Vj9MdS@yS*Rix0DV_S9#1z{q|OHZ49^(=pC^9$1JSdX`(Sb8
z0s!{II6O90a%<HwTQ^WEjKQ^*b`ZveOWGLqT%=@&u=o8W?i_C4CBjB@yGjZYel{4D
z@h}1oQy^bu{u$5NJ;saJ!1utnf5Hxdt6ZLhw1<hcqY;}M|GHYK**N8-gZ4YjpOhfm
zNu{v7UCzk|?ft&vNHMD&xP7P<Y^&8vafX&Uye=F&n??J>bQq#<g+T0C$`|&7mAr=E
zrofNTl;;V-=j|dPKf{ljbiyFsZ;aa(9X6Mj^Wm#w)<{0qL%RcaE;I46Y`uG?+3^aY
zyLKX44VdGVopd-CnI`e6u~C%=Y^Kttt8(F{+lV%^!50VQr2Y>8KtaF0)_NLi=3wR{
z&*7FEuhR1n%Qo#)1sr7uV>~DVyB<AysMg6np+&@a@QN$0P;`fSAb7XWsYh8ytmar4
zurP2;V?Y$W#A%8sSxN-<`1p8Cn>G!npME+zckZm#8OOEfnC`6Acnbp-1}qHxOE6$~
zQa}Ivv(k4;PEIC2zEsWSqehLwi6@?@dTQwBe@VBkZde#Nq8KpyYl%*E#~pVlC)UAq
z5LH6QpaOH}&c#ztJ;i7ku4*4^eP2g(I2tM3nf%d68*hS}<OYFJP&h`eRDzc%gsGH+
zN=o5l>?RK>l8&g}d3CP(f9vCKaKZ3XHJ^kDn8Xgbdo{Ny#>*Y4l_Gl-o3bKuK!G-N
zko3YcPg3Dr_-N`;y@Slt65X$~XdhfeBuU5k#dNYHJe6wlg*++OM)6)cH75Tzu8u-q
zz0w-FA)O**X6#VsRu1y>{5;K@%-X&NkJDkIlXA}M*h7^?9i**-v%MMH)$fd*yBK+h
zmu#!N{}H@gzATNro>FZ<$loHX72dDp6)*;q;vh?8!x<U76+dVf`8r}WxNX~ZY~8d0
z%T}*f>8Wu6e;PdIvdn{l`PL$$<8blNu9&}YC1S&Uu_Lq4HnvX4&dfkSNCd(dh$3s(
zR=oSxYwF*WJ^0KKIR3ca=-IQU;?u>)GLj`__R>kR)#~vl%ZrP!eZwCrdu5rCYXf^T
zHE-{m&)-M-+QllOi)o*!%bW!>uH@tVzFhY?JG+KoYzzZ-WC-V0-cK$4Zg_-L66<gf
z49L4^<Q~sI|GY{qzy1CFl_8VN>sIu^gCNm*Y+>LKFkt4sAw!1Xh8u3c6Hhz=305GE
zszi1rHW?2*@PPU*<@+@051|Sx>ED0>Ps*I)Sx;(4A^f~rY5hHpm&lj}3QKId_FSNh
z<j~tM2wjdljRu5Y!_PmM&Jl7@PKN;T$%)9>ydE33rlNItH#+;QRy3O~srJ##*|qQ1
z|Mgejoj}qCecXY?>H84i<$}D@O5{+!A5FE-MejX}^hfSgPBuj*(-`lw*=@BoKXvm)
zbrtO13VD>z2|XZD4@EcctZ_GD{Ds<hQ0f#pq>yv+eJDAW{9s_CJ#^qJP)(V9U0@0Y
zQm*6?nRH$ro&8GQIv{EMXw2tEnWog?Px~18@6fp$MxQ$d({7o8^=nsS!Rs$$?!31V
zO+A=hJ4FhrL83?sY){*+92JZE0~gv@B)9Fxt6ykCLU|*dBUIDS)WtKI*PF41vhQwf
zV^!NFDtCjxcZ|ZWhMHU}`ClFXT7~_e{V+PDB4@nt!V8s-lSGRZ*`pYEKla$8q>Hpp
zW@GRE;X;|#5I9_=wV)ic01X&0KnYyM2qi8qPKC`CFY;r?j8Wc#tQW2Y$o(r>WFjEg
zJ=Uv<q5ec>st~W^GJ&0V`dN7Oy>HRw_*38!%uQYXW(Kg=6KVE7?fHD(H$URueb*x@
z$VYEjZN+k`HO1M_GVWpwSeTcMjr>0xP(X!j1-3pOtW1rG+Nq49isM~rYfwli82~%^
z@A#yp*BM;+D^+IM+`BNm(z+#!Y{r9u=-44#h0WbU#V~1OLSh>@Rqmpai<tS<z@Srx
zVAzO}=-VY34@^4;pV59W+}{hC`3_zPYLeTp<lEHWoiml?#v*-754`op>$qj+Y!rx2
zi4Bt5w&muXitc3a<YZ@|pvaW#q@o06?9vODI~S-<ofEL^>vxcnyc=n|J|V9qfC^4r
z<XKi@<L}|)kFuhC<vrfi`B%=lWF}Z}crak*<==k$4YOy@R!Z@EX`s4q-#(ml(n&bu
zj5Ab4W}ZJhwOXZE82JCffDnT6t%-o~$tRyw4i|)A6hr@w8#m(h*I&o<>C@F_;@^dt
zMraP+mWT`Wz?NL1>ogl|c`E3UPr#8ZFl)c@+|%qb|L%m1pvg4jfQ@rt6r0Wcx@T7!
z{0E1IW8?*w;%kpqIBnD=h~j&;jm#r?{{(Ui_4@hqAAe%f`19dS!HasP+8`TdL&w!L
zN}daClttPo>#)#9jIL3kX`{M*IM{E~DkEaD@l@>DBub()g+kkG%CGhZExg#3ZRl3b
z5NGHn%(?$I+<f2D=t{-#Tq<@;6lY<~xOw>_Ay&R=t*CCQbPrF$=%FWL?3nXWkiHIM
zue=WNR9-d)5hh*jv+k*(<660S;Swse_wIWFUYqw49-Q;MJ-L&IAKE2G@i(J|P=O(f
z1{WnZMR(y}R92KRT2Gov?-vw?gt#cY{rtn&lV6ID<~;^KD&<R*DWT#Tqm6}*FUZMM
z|MrUi!bQ<B6iM1_`qR_Xamgi@kd}8rCY^7Ha~uIH`ru!95v;8Lw-_*Un|Mcj;e{7)
z<&{_3BLJnOq~P+)FGnc7)k=gQvwj_wdl6Y$InRpIq1CHpIJbc|DfOVVtfJn%rf%pJ
zfQ;^_7?o_z%H<6vzxSpqksMEf{^-;B+}0Rg3Ee4kmnVe_x7_<Ej_WrFGj5uI-`8(Y
z<w&GGZyNdw82rk$9+&-U9W!gx1V%Ev^Oh-yiwJH~sd+#70Rr3BDMYAi`{Da^rRX5P
zYg(zFnzn{BBH-M4@8FanZ{hq)Ct`z*SCK%2B6liQsJu2>#=Hx{(3fb6Mfutg?w&`V
z#dUOc<WGeYGk5D+q;DE067lf<CtriJ>tsCr`X}mfG7V@P9R?VjWRR99*5nhOCPV+q
z@pQaUnhU{PUg~<~N!ygK&Y9m}6b<`6n?Dy}ftpWd`WKbZ9v}aahB=Qs0BNUzHmqBW
z6$PYT^DhQc0rbcyAWAsfwx`k<O?-EQG{8%kIN@RnnP}X|ah5t9!F*o_NCXTxZ3K2~
zU5~j>Jc<XOddZf|mCl;lF`woYnY;$CCFI+rQ-MVc#t_#FU%oyUrw{6*l8MpV5i=5E
zdyP^|a_8Q7|C^0?>$Q29c;l_mA{;PsX1p?N6+DU1NBXaU-Xa<GS;kSm$E~ErB+{b5
z<=5YWsn=bN_KEzS1joE*`l=Gx4rZ)EW0LU2hUK_yba(u)ng+DwbcwRRV;((DtY_;M
zTW)`Ru<#>{9C9M|Y?nO1sulIW+xK302vIb6edw;KaHrc#V?-#<#1y5rWu2`&hf~hx
z8lJAh?fRDoXaJ|(YDi?bx=>Q8=b^gapn6}3N7<WQ#_v5eA{xWTT&A+S`h}u>RB+v*
zi1%vp_BLZ>ZWd0XA>6BT?nR_Gjaz^CQl(wXXq~m-*WXlMYu&T`sH`kgSId?ytM@n~
zw?K_oy$8Hu#w#Q$0k3_s0r%fE9gjTsmP#7WsGc5l?ok&?8O1wo`&Oj$!4ogNP35&y
zu>2=I53F2Xzy6{U-8Lyl@FsQ2*mvxC0v7-H1^Ns+gAx2_suvWAq%eO;W(W0-(n+5f
z6bf`cVHlo&`~mds(Gg1*>4icf;njsZufL2+Sb@0eqO;ZapcWZ^8|qtc<&Nuan~l`;
z-FV}(pXz2+zst)rY;#kp1MXDo_4md0cVVQ@A9kl>-V4v*=DQxSm!tT?YCe&<NZ&T^
zeR)|41+VE;6w_bhn;$O3n6rl{K5#?xkiF2O;6mCb^FucGbrShYAR!?E;tWItdGYb_
z%E^;B@;lo5aulG`YJ!CU3j-~{fLXJ|Xi${8Mvfe*6ul%ugMcW1J@?#mmXdr6aBF3;
zFkoT8!oZQlfY9_ZhZhzW;_kceR#oNY<sl?QEL3##L2;sI(U1xq*1^KSAz{GmHBUL^
z6o`}EciwqNMbGI#r(0r>BJ`3tS&;A0q&=hxti&zHfEatx2yT~6H>|k@#l=&ZJtGap
zj65S_CPsu&vE)HJ@5R^=gAurB35E>pX?Ngd%FWNyG_i|BDYV@bnPw|GrP@LVV|Vet
z`QQQ<=PFd#BJC*$Z#IX;WyQtKFQ!gPBahyft@R|U?fgjECKlwwiw^J?ef6pOuamXW
zpWeRyC}xC20iufz>==<q#Jm}slw(?e5rqUHd?=W4CSOBf$M((m?%V(3tFOMq+wW<f
zmU>X<5X}fx5(%)1<?h^}xQ=yF=${7X@=L}|)-*Rdry4)$W*QJ)h~Vh9lre9>p4?*f
zJxaQ~>^<t=gH8yeqXSi-5%I&cJ8d(*`TS$`FX;rP-Zm5Gj2?wPJvwtu6-Ri6m#sR-
zpd{tk`CskKs=TO1H)J1mQiJHg?S-cv*9A567!=@(eR&1;)KZ^7VNNb1A<_U-kgcn>
zr?D;$4FiHx;j=ATv`FbZ3Ey1ywyCM9Dmt3T`~<AI`_S-erM5887zWJTEc+6Pel9$u
z9XocYeTvA_AA0B^713Fon^<&HV_0nF{pPF>lBOjf>yH9cfIf>Ifj}vpM9PY#;_Wi6
z$Y)&Wbh1m2UX1YcHQecF-bB|e->+$ch2Q*u)B1Izj9JrAb?04?mCAclQCftRtJbh^
zF)uRp>v_78I&MjA=`fd$0p$HTR4{c01cjpSm|<A_+Glja8j8G<EL4<`MruoAH_8%!
zW@Nqgtwr~ob+CU18>T)(9~A7{i?tiK+Igh<xuj;)YdS^fNT=>Tp4xe8PIj((EDnTC
z%e_ha2n;&mcsg<wx<iaBHNMmX9?W-=zb^~lzwj>ac#}?WFrcs{G-V1NWn}j4-iH3I
zQ&5(a0x#!E8h?sh)de0-6<D*W2y3^kLI(zqlD-ID3_fKHf<nU3f6yuDLnjNq?oOEf
z>|1CZ8;vwZ5)?3Liy4SSv@M*aPSWHl9XqM#F7EE?EQi7pE$jW@lP@v)j8ouAqeUTi
z>N=5CWeV{{-N_ZJR-uA~kkD&pn5B)CG+c~LNJb2GKnz~&6<HSt#ejKlB{<WRDN|H>
z!K3Jfi{o^epZoUhXM64IzV!z!{*V(K6$XTY6j7+0JegjLX+Y?~(Db`@=@<R#tFKle
z8N~wLAn%ZSX=V5e7%<aX%|uxD!&egrYmkXg6h}Ju?28-6orT9=`xLEX!jZN!Q%x47
zG~9|0r&au_Zzz1vRR)CWO&9k#{PT44QSIckV{dOrL=>|3WMIU_SK&e`7&ui|(wk2G
z1;L)7kqhaCZ0d?>dEc&ev`S?bqeimWZ`XW==E?;=?!LA%Y8DHLv?s=LS5LnSr}pj6
z4RJXq_L{!f3vAZK0eYc!ruTbYj|(U5isD?{KV!1W-M)=KM6pIGZt+fh>o|I!*9u72
zO}!O;`}Ab^=~zakia-#R$Nc?#P+5?JicD=>C`3SWz${F%2*f6}$Mn1I$3^3>z_O)(
z;`{Hv#hXvPfXz0~_NKhHq9DZ#1^N51JJTr7Q+bVqg?RSw+^q*zulNbizy1#Hn|7sI
zWF)VLt606$I-f5Che|Cxek2qMxbO}bb}lAgG6rr=T-aH5bH`2<C<nIRnSCxUE=7-y
zZPo2VF2i1!bs-p#?_P)%@oIJdefKM*h%iLvYB3<Z<(6CMz2487x2@O3!oXp`fLV9X
zJNG<gKqwx8#2c4*2$FAY=uk$gVAKRrhON7aISkbw6-Ag;tCgz<{Cy)-o1C4s0=xX!
zuUzc`1*MviZ_+o_c#|f-Knof422SU2@g#{%UF(qO5JuCjuSD8Zxqr_y)B2`stD)l5
zQm8i6if)sImW!hjAIKt45IS4lpZ+Hf#_4oO^VNzi2xT<sEJl--)I~NggCGCCju9`4
z;2rF%Hq<&WPYrD(8&U&?Hkx?T?KpivufI+kRXHI%NGsVM@;YuqnX8N5{Abee&6D@4
z`0lt;SW!tjr8=Ptp1bpAI$H3AFg*^r4t8AfNc6xMD*Owm=srZrpNqc2G#U?frt#ov
zDuxTYK)^d76vd1fy>VkcokR@5`J>N5hjz&no<t!mGz@`(fs9h<f<>Qb=7Xn4%_d)$
z(D+f>V(9dguDvk(@ou={>g)06AHOR)?uB`8vfdhj2%NnbWvIQ1UX+uSNnuGL3)k;T
zA(<{K`QNi=4}8C1E<QMC7%mmV6Wjaa<*MoU{SM=A==k%mxEALQJq7#ejftBDRbu0<
zZup73vSnpeNMuArftHL-!zCY?yMh*>lLTIQ<rQ@nCpn^EESrAuge%c<3_Yb1SO*IO
z76uNA0mpf50wWDdl(k3bp;wed<lBmmkH?4+BOo5$`}gm!*0!T^zK}_cAd!==yY~*{
zRk<+wt$j*W>+!yv93-~ZG!G}egW^UKn7#&tMB>%wp1_9mY#RKDVM7f?Al~Fkit<pD
zo1=vaELxtL8f5O$yf+t|e8wm&?9(6Lee*Tmd-ol@{lRBVx5K?PZn|kahS8BszdpU-
z$~|~vd^}U1r;i`*oIVZC-hSjG*j7jO_W&8wt$ahtC(v|-N$=PI(^gkcUz|7YDhxR3
zR4n}BbG$=mWM41(-7#ss>khs8<AQTX<BXw0(4%vTdfr%DO+5jj(Rlp1H*w0)_wn@H
zC-ChrE9#Z2Z?wW4vu5M`b4H_MyF`79Jf!JwzJ%XaZH2#&ml6<|%&my0%)Nyam>1g&
z2xTnwIwEZfj)=qE56!{w(PQxW=bz(0^Pj=G&6`a2CeIyu^u;-&&c?{IN1$8Bb}DUS
z{gj918xy{ZL@k^B_%j$i<|2IZ(MNdx;U^C2*lFaLi!uDHvoK`vsfY*-R4=u>Uq{S%
zQ1wW)oa?TpXMF?1aMcaBV92nM_~D1|@Y$!I;5`aNng=16dh68~G5jogz3xdb)VfUJ
z?KSlons+3jT{nF6<8HjW;7vR>`z9KR(MqfVXx+IFuAg{0MxQ+#aZ&VWP6!H*#j`XN
z+qtil#;@Y>-1gnd_rM5smHc8wImX?mW)I}%;e(mC-$HlUUi^m5cg`z1u7E4OR@%Ow
z2AWXw(KBba<4(o2>1`PO&P#o>l3w-&d3m`uXA}CJtXqy4tSVkG@pIPs<FU0{FD!WL
zP0YCGL2M|{Mu~OvbnkyEuAX!i&N+J+J(+tbUgvq&&qn|3GSa-d-|`;rrxBf#hd*(l
zMHe-5fW8V1Z;dH8PNh;%pxOsZJ<^_X8v8}G?e4%?uE}ZIV#X^lECvtEc^N~7pNILc
zzlPTqd}xx?J6|^G23$%bvVncLQ6fl$(3_@CQ3kuR4;K)e<ukfvSM%NTo~d2l9~si)
z7-e$j_Dy)>wO5pbwhjAstGsm&0|uXk3FF6M_!&bG#66inV!JMwb?0rUY9)~w&3MaP
zLC>?r`KTx=R6;`Gf6G&;+w?UwIuS3t{V6UaFZYKZe#DZc%dnY7is?Huq-YhfGtAcs
zE7yiOe6P0Fvpk_{^?VeIX?M=XnIlHy6Gqsc|I+<fSBEdG3UoM}K72I4so@xM+F&|O
ziBwP29!WmhqZG_MSxiMi5#as!<Bv3;ZVPb?5)>4qS}hUABO)S{LlsA3@}sm%R<kS&
zSQt1)F<|KX(@r}LXP<pGJ|ayfbC2wQ=FOXj(W6PvlJ*w5!K6J#yJ|Jt!hnSV3j_Ze
z4466j!w)~ix8HuNobQ&Em8s~1*IaWA6~X$dzFPD4zh=m-j{J=nQ2YY&%0!<~qUneM
zq3ENCgKGha(%iduZ?$hT`?|ledH=Und3e(yJoyrs!&6QG06+jqL_t)D?~k7rJc)>4
zKc!gQ@H}^b&dv%rW|{bH(YKiO@EqdJ2R<HUD54Bd@?`8trHoZ{x;A0TtS52&hc7cK
zjgBm7I4va=TDDKs=Nh~-uQ(cZ_4Gj!o#(Zx;{>fHp}tb@6CKUv<YZINz=8KiIj5`5
zfRIeKy4jlfo17WNR-xmra+@4hMH#HAyQHuH{*1g69UiRo>uNYX^{bG!ivFQQ$@8M@
zSabAQg|i!t1B6#tR*P3;919<)D#JT(%)^-RSKABq@DD-j$Pmr9we2IMeBmJp6y@$j
z`flB3FLzgzl-D@+wQ-7Am$}l#N`8Tp&KQj+?^}iIXFSNpF(^XE*3=u!SL0n?QKiz9
z(b?3lT{VW8Vo(@GgF;XC!;Lx_+36eb=>0R*|LwD%#MEo9L;(4r@=e>Sp$xy2E*S-a
zQC6)DD&?27V_!}l#7USKLQ0;dK*}rPI206?P|qz?@$O_Dmv#s^9VCBKWn0f`Fd#S;
zzG(r!edAmqD=SOwZACX+=58-9&6hUsVNGu9%EEw!ftF&x$Oc45MR?gFKkr0CDv5X%
z9UZNBO6%6GQ$e2o&ANsy#ouAgS9{q!XwfFQ6KN7H9iqHUErRkyc!0VHCA+khCb#yB
z?FQv_-Fj%}t_NDVsi%@REiD}hF#&jD=8YI}#$cS-yQ88%ltG)V44JQu^MS8Fd;@1)
zILY>;{%Prk^cEWsN(YpTh!OIRA8-;t142*IlYo{h?##@Cti)Gbdp8F4?TzHvP_?Ez
z(n@A+5q!M(*xk74zGvz;Qr+o*-MN3-4G63DYkI^{#%9XhZwt`iAbwLkSE)<Vh{nR=
zU%rF5sc6?OhPrn3Wx%$fQ8mlK)!kD$7~Vpsy^atSMOqBmSifnT-GETOSwmB)I!T9!
z-l7<S4x!vy3<y2FwO*c-Wn}NZ9-cIl6w*$=8!4T%9J7!%gCge^oygrg(~#UI5g)$%
z2tFQpCdQn3qLQo2w{PlHgb?2!F&JF@<3b#N>e*6FgYfllt1JV;1~Jq0O&KFY>pb(!
zGx+-JuNBWoY%N6B>G<Q1R}Ryq6#1S_+NMkWYfrTl{;!qsmvftr_UO?AcinZDA{a#|
zE1u)GZr!SsE=_bD`5fzRM*eaGtOA<AK+UvfCJS>mnapolw3Kld6|;LC*PoO7r<}mV
z04`G{-7gAYUShnr3q>{se_e)5u}%o^w@q+1BLI2k=i|$%l1dV7JL6m`JsmDk6DB8J
zvj8-^T-8)(1lyF?YohJ2tz=G#qxBxW`{QhSLpoewm|H9V_!)10y%z2031Y+g^_(E|
zVk*Xisa)iz-}4Br9CrbYHX{`?q;CDCRAzV5bb(qh>OQagTP;LtVbKPCdckl;bX<b^
zKXdpf+;ZDYdZ<Xp#`Wv4c=2zT^URCb<ghp<CMM9Zal68^UZk9`dfjHkc>(v|{2(S=
zcn%f8wc>@ZFK-emD>+dLp}@NRe0`MxVQ6$4oOkXhwGh{BXG?yYwzMR#l}BU1;P8VF
zKEP+6f2J0*QbsS5#ccfe@hSqLq%`w`g*OWW76w|50ily*Er_5|_<{usRCH$9&<m4I
z;K2tUR7xWf)yjOEEwAke=d2+s4y_`t3u*~=@lc_=C9|tdnN+UJ%C*wwhAnB3?VgJW
z1$b_(Iy;^YRMNBA1}Os7mD=NqT>E;sst61zjLzoCC~E?Zm8BjYr3a$T4(76EUe<Ta
zZxwlkslEJzal$E=(}3_LMu84g287c2>WWeXaYwvw?Rp9e%9xTg9@lCi+k`d`3ervw
z3|%i3`_g-&K)0U#NE;1R*N5Z4YFn_r=>B?9u-K3E(62kGfKB&7rKQzyr57e=8W5K6
z_QCKGqYxSBc{rM>zDLDip@8Q7w_a6c7VXQli?amRVmt`6#m8Shk3s!<(?C|UfJ_7A
zT@|RXMP59Zu){H*dC%pn=}8ym2}-;{opat;+;#VCGKx~MZp~`^_Uq4h`SrK4k?XjD
zg!tBs7?LK)w#_Yc1hOYbJ$~xdw{bS3BZ|;YARs`~@s6@IUmG3Yu0s!u9yvm#I~)ho
zuftK+kt)M@rTXQUUodm#Oyw;|gdyT>T0p$x3LFc4Q4O^Y76y(Y49L1=_Q<#2e!F7M
ze){RBO0j>>o;}Jr)qnv5AW^BhckgabdlYrSzJ_@P&{*mAdk)$(vsO1Fp-$rBj&WCA
zf6(MQL46LJtmQI4$$vm_I7ZPZ>`bnY_wL-ubt4VCcJJo;Sx$p<Is;?0E<gW3#I<gX
z))YcTgooN`CNoYAHAD=31j1qxaQ6cbHI$^*y~c1*(^eoVE(sGRUWfC?UZOl{N?Z3(
zfvB8H4$>D_dY}#p4ncf;JYw0_kU$Ye5M-U?$&rRp_Z<%MO!^}VC?m&=!>L1uWBc~)
zir<mPD9wUJXBSsSx{HHE3y+D^2Jcd@fOr!eId%g79SUvWQj$A*`!n@AGk?#%C#e6c
zub-lvuI;1)s~mbkE-fuXIlV$lU2g6k@b>aXcx0q<Mi3DZiQq%%r)n#|G5dGc$`!pC
ziL!U!fw*?cG&TMrWXj_{M4~85`#e0osN@lY)_ezKkK*N_8Bc;Q8D~v_HPG23a7)@F
z3Nk{wv~JT5<M@Bx*o*N1aV6umgI*a$sVq025$cGqRvfcXD&2%r5kEdYf&Z-$84+f0
zb5rkd-R7II@(+%{<yTL|$n!4Z`>~CC4SG?h7f^Z6+^G-~pOB!O2!sX&s3H`eoSYbu
z+7A<Nm|nNodcURJQkOtrXbkSUcXqurb#FBM{g{z)!TA?oiSz4bs`Fcfjtzm_mp1W_
z25y~k+uaXf{FPT@E1ll#*p<O|Q@%f{g87L9oFpVBB_fbc&IF|IZr*{I#AuHP1Jeid
zeRN|qJo!Hu5VZ}0882~AbIQ;W7<kfP+;-=7Y@r+?i{F*>i7znUjVMLOwI=UXjH0D8
ze1f(#0)6<AJ`I*_zgeqt`L1-IqvMm6gSJa1OvF~cBRh8PQbNE3H1_uK4<L?+Cprrf
zV`BmHEd|oZbjIEH*^6)L!m-<?ubw{s7;@GqoPOpAWw2bvJ)PcTIMHd23tZ{kQH&9N
zeD(MkT$_4KIr3e1pmP%Wzhcrgj98wo_|p4wbLp*LEBm=qU>VN&Cq6!2?caU9_5RAd
z?{&*IbsP<6X`}SDoL*aJ%$R}s^XDr=9Z{wb51<l#P=tEo#7WXx#)C)0s99~WF!1li
zfUJKq*N8IZ%{Sky3<yOIxs!Ccz?o;B3E2aMhli_lGJjcMVZg$Gg#il#{~QJkEh#jk
zM6r&EiNQ9~{83R+s!@|BPf`l>Cfz^RQmbYQ1II1~41Yk3afLpT2o17_mZ;6ESFgsK
zZ@!6Zuf5jJe?4}4dTg{@cpa{;o-|*h5tp+M_s^XW<m=w7#-A~4I0m15A_fg*^rOHy
zxM%G^d6jmIA<mcDw~592ujga)_Pfx#qjtziW{oOab93udL!OPuWW{0Z2I{Z<6(}v*
zqq0|2X(jWPmnA$iZNw)0Bm<f+>4JPl<&*!v0<^_cP+@a$CG`m&_E(hP@mVu))4fk1
zD!vT@=sZ~*!e{Q;O_@qA5)$HRI8cRc+tYLb4#z95oQN$ee#ZBItbr$u2up27gpPf1
zNUpv&>623{cU*VNy+}^!iZe!yrIAXmN){Rw!}o&Dd}#z(#5UxSH(ODu4HL_#JDTBO
zP$*6p6FK%??k<>h>-AW+b~9d^`yfL6>6DLsWY-8Z%v2@2C_bIKl)G$$u<ug0Z8f)A
zbk5G!ff<U*OKcGcr5NeGe*aojsFewCz4aCyoBg0<d6gW0;kAi#1(D|onEBm8m4yKd
z1BVX-=DQj;Y?w0EefZ&r)i)@P^8~~p!+-wsAL{x9SbU|HqWwrL4Yo2}DesSr1=j8;
zq$6U=i|Q@JT3%(EAat2P$L_~rNH^fi6`K$d=*5V@rL-a|M^*_PzY<OwISxO3Fb{){
z>!PFVs=GCZ-@f}o84t#{>qMvg5;adM78$26R<B%!VV6!p`@|TPLCXj=ty5D%bFTEd
z+V_N$RpRUlC%AKsuh{R5()=t$#k5Ao&Ob2WnyGm9(OKx&Ca!*=q+{Nn|DrM;?ApBt
zO6g=%1aTrK_74iil0O#X&c~)8B0!APMW#(B5tO$Jhy{{?;^Go@`Q7)w;F|GcY|;6|
z7*os3&3CkA?Gju&>Qbh4Le8FalfBm243Wv>9}tX_E*ye2Z+?k3331rFuYkEJS8^5o
z%4|G3_c<Kbts`Q?wanPDFeef{?uziK#?s#xt49^I|1cmjJ%MP_S<)LB1vw{h+$NoW
zGM@d<cSwkf!uIqG-UYVp$V3#ye-{ip3GQG0h!Llqp!gH&p~GSA(qC{fjR&2glhDE6
zO-1RJcS~rr(oL&ypzk^8)*)HtF#UAMZe2Ek0YxtpnF|*##BI0TW|uuCQ7$a{3v=hr
zRY4~HPM(o|i<)Tk-}T6JTD-`M#|csNkrzw^vl3nBgcD9s9=Rl)lbE?$aCBmT8#0-Q
z!)e5(fY&lwY8l~1)yYY}at&>?gDB(@sFX5nP)d(%0!vq{LVigl{HdhuX!&kSR`1lf
zpiC>Z=*dg!Ikb1le8gdl?x#TSPSvF-NeHZ8zkw6-V0xpeuC>^xhjk9pj>aZZsY^gB
z=^Vh)KYvrd_fvsiKrHcN;}fZjv<;VDe<x<%HWePW&9Zzajv)A`;%0i!7P;$V-;6t^
zalF>USi5cF5ylamTe%>N${_OJvv(hix$t7lxML<#w{OFW<x8>P^%wE|;<fM%i$c-f
z4BI=vK2;RLJFyM0VGFiV@yr+y`csilU`JuOT8OKO&w?V|*AIVQip-osL^0Y?Ez5Vu
z202_eKK^_c*}2AW?ofnv*#rj6e7$+gW?X#n#Rv%rQFFF<zZH=1=dSe1WYRTJl=aBM
zfQ5l(V!+H>XECD3aC-0m<daX7@UcCkg$c7w?wx=B`A7d8cj!y69Ydl}DKuarjh_UZ
zsRV9dU#|8p_rk*Oao4oTYQ1Q3zSj#K3K&xU+xK2m#S}4et^s#O{uSszhZb%m6%=#-
z&`1VT)G>4xBQeq)&aQ}#*L036jRFK@^DH<}`rxH$O2O6MF&i#JqjjDGRJ0XT$xxTu
znE&hO_@Ej?;Y|8O?l%dfjf|(9y6I|YBi+`z&zt&fhR@624@sx>!mpn#ffu75<&_qo
zq+lPCS_ffk+OJB1H!`q|Qi@mJDVr#?DW!O6t9b|a?oP+sFTT%k+tJA4rcZs(WK4ty
zcwjqU-7kK86GKnvrD`(y9IKV|B~)M);N?L<eP#|crkOt+GrI8miHeC;|9$%p#3kb=
z;GS8t>AYo&icmOr`t8biFp7o%8T9@qAVZy-m4ntK*_M6w8Zt8PM?ivBeh9YF02N|P
zLVdL=lA?x=U$trtiYxZR+f_S=aBN5YYw>c~SSKCn`1(1ImODcK2;H1ZC2H}SD3G0<
ztrSJXfKUvbBx18gCmk&#X0_v3#DMJgWM3!|nV)_3Su9<;R7E3<kB^79w>Ngvz)c)f
ztz5a%uHfI)9`T>Vfmz!cYC}WwcSGqKy4O^>CVf-o%QN{m>yj8gB_+30|0aK9XPMt5
zZ*y_pR9l;Bqp4rF)n;VFdVTx?kkV29JDVg8o=x9mJ#UVxwe&~lp_2p}O?K%f|2-Nk
zTPPvrJ&}0~G}TW@WBOszo3p|r7h!R-B-g>A;p)Hfx=l{o*&%ODYwDzF;Ac&Lb-iIU
zq>}&Mefl<#y5`oQj(<(g!*eC$DIo0-!pYN%UdNN$tAA628H>i=FWm>e7Y^fR@-}tW
zIMX5;Gfur4!IycLYU<E*PE+OUcceC*Wct!jzQ+1jH*Hg85Q&1uCc(VB3U9<&B=-gK
z-xwGpPt*6N>TjwKEzM`zrN>Lt>~0=jXq(be{hQ}?&!&F{9gWt{1jJh1?CQ7FY08O=
ziG%z%28V(tQ$}O>a_p-JNquR2;tTEU#pHE7tNn!I4coOIGd;h_w`Sh+ZasT9kh<oU
z^hNfRI)BamqwPw@M%pM!OyUIO$tRzrxBQOED{~4R`mN`_R-8Hw9z0m@^%~u`9Bn<b
z+GAnB!oabN0W-IYlKh=_-idqexkou85Lt{wWPjm>7jVZNcc}SG)+UqwSnjjcb_)X*
z1}qF5ix`kOSZK*A8k;=&=%cC&A}f!Nk5}`xc$e>x(m~OYM>}17EaKm4^ZyS9gw`>8
zx2vwYN*NI5<m9MtPrkS7uDed@7Iy90)n;r|TgU1D2UCAvPmO_`MC&UT{XQBH9#p4G
z=1j`bP8c#0kKK74rra|JZIcqPY3p`1Ppa0tXosttwx%lsLgBQKi^HQ6mECRfYrYQ#
z)Vo2Mfp26q62!?J>u4D`QO4kbUw{3b^LkDBhgKHzsirzpQC;gZIMV6DQ>o^95gng^
z(7*ug5be+^(5cyfPbxC}{>MIteSmKB`}3by#)I7{C)u!SIWlORDd6cFjL24nbbPi|
z{f=zY5hwLK4xKu7U}TzPbney-(E*;g?!v+9d9c4XcJ9@B7)@bA`lt3I)H4`5@&fG5
z7=Z7;`wm}x{wZF2`+ZwXAyp)0({YRt=%EY>v$FQ0sJKQMzN(@O+o*>o(3K7%zj$LV
z9wtxbf!ikA^#`1(cPbjG`6yu!f|^#zRW-ZWu0u!S#YC-?k`4{r=`in)-+!Z{yc%7U
zLo2~bZ7^Ww>s6~(VbY{Y%HUfZ{TbatG58jlx=Cm9S!W9a76uLv1{~=o(OdcAi!T(f
zTY@^ZYu8RW%9DTv_uY4&#aC)6%GG+`(#(zIvy~~NOf~(JDlqlP*#?fZh1?Pw1CdR8
z2S#A>&ClY?v6B!QlSl)?HEMi|_U%Cc_4xC4Eyam_x?<{#dvL~SCnGjG0?wr4viI)6
zqVK-O&3DXVX<o?Nu?eXqrU5|bPFh!U;-weBOLV_%@{~g+x!4EM36!qHwe5mO?zo0D
z%UpCyX^S=MH>qbCjF=Y_7muGlnU7BVpZ(}l7&PE`goOl=hN@&ly>xv3;X8PE?n?-Z
zZH?8-mnj1}!2?J`CYNtlm*)&0qRt{RCi#W%C~co|fRPe}Zjd(Y*|mdCl4J4Z+jH^s
zz+SlgqH_`8s~vnEp#4Wy=5Bod%@-Im?kZJQ>)1%7?a)Sf>P7<xDP8FaxclJ5!9(#B
z4G7)nc(WisUCCVY=}bZN^?v*84Gcdo53^=WVgHk9JQe_VH#gNb<z#_Q<i7am9ZbFZ
z3EJbtVq2=@*EE-llOCHMT|3%ZpvR;Y>%92#Yn1_^7b8yt8S34rE-yxoYY>86_F>fN
zgK))l(=ht1GZ5c8MmbQ;&CbFfzb?Y$8>g%CqRO+ecAcgH<woZ&ow1!&&bxL3Lj61x
z{c2?LDuZ=s5(C;1Ml0n&;fyoRP<l?{e5yl-4(i@3ue^euJ$u@}t0oIOj1RRn*I_KM
zr9}y&OeU3B8fLx!{`)FSt_WtuvQl93<jMH&fB&mI2bsyIrFB{PjywijxuFse<p4X#
zqQNMI0>uuC3+FTi;Sn)N=GEr368LbFTU2oXyZ7uxVstAkdjAEa&AuI7lBs~gncKNl
z18PrPjSjFdDNY3a>OyAunhQ07wxZ$Np@1sFo<V*&AucXa-KnV7rOS_f1=>5qBOiZ-
zY1dwkFn>=@l)@}_z=6ueF0id?5$9Pv>nI$UiX=I&Wl<L|#_~*z2DhwRt8!PA>3Zac
zE$9ozoHtS#4+>M-MR|;_sZ+iefjk;XtmHW?J`%a9dc&<A)H!Gdw-Yw5`UBtpww&JU
zy)=_X+RX2?k{+r9qvA1a$Y8iS?WYnO3t%I)L7`SCJFf2lTy)8$_-MgvxbTYW5topF
zbZ!C-?6(<`=F+>6fgnaU7;|cSEcovR1P1#cBd1tJA52b)!{)VLW8=1T8ieQtuQA5D
z!K)g7Q?TQi?R2SQ2<iCPx;{7t^!uSbao>O6{VIcaz!f7xi9R@I&Kz{^+*!Rdjg8a6
zYq3&T7_cx<7XxNvFW;Lei--ZCTuY>8VX%!EGe$+(kqFL5HJwzmJk{-DGk&WD2g&U^
zsI)>#NVxS%E^{RXIrNm&2AfuWg~iL(VC3Mwn%UmSoG%L4LXoUqwit`jfi`X1VaukC
zYCThQ2F=|Bx^!r(&P>jw?k_c7m2=b|bVuRJ$TbRN2W^9DZj9XmJ;W*uC1s?u>OgF4
zg1S@60TIKyYL>MxU(+me-v1J}-f$JY8+kX2Hqvw)@vYh;#p-LJja+QTopq`|_)m_X
zyg}~X0qD~8IDiI(5`_a<jO1Bej#eJ=e7X-ySFOcyo!gLRWv%Q#PxZji8zS71cS&9i
zX{sYQ(wo_PGQro3(TKc|nO3FNNO8chosJaxjk+8IkJrWr;v}P$)M?%|7Ru6@^8nIq
zwA+3%Lz)7~A+7%7r*E))eJZ>?J(Tke$s@|b!emJ7*aN5Z@6EYF-gDB<tWTmcMUk;0
z{{v4vh0%m3;FV_|$JDzXf<)ty=s5!Wi7OW`5zFjGfz1<>+z*e4g}4z&PcMN#Elmqb
zE0L3(gE*r2qgNiqj=QFzed}=5cj;q2P-CsJ-54Dw?R3Ozy)ur18|K}Rro8y#i}>xg
z-xTvzqBM&q#fcLqV#pB9q_U6mQP6Iy2^I#9MGP3BqC`CVj)G`$s*swRsv@9?hj)p}
zA&Mf)moG;*3cZh3`shf_1&6C#DM$Wgev^L#j^&&CChei_10BmU<+tQ)>UC^u?Xsm0
zx@6PV+RqPOtIj9uer<fz&Z&*z>+*sQwXRxaatw@vg}QauE!T{P<k#)3$y=+;X8bVu
zg%;8E>P(Jx)~(NsLo<p$qDf3U9PwrPQ@8#0KG^VV^0uUbLaz!q)+@hRbOZ07JTV~O
znz?TN*|9Ip&s96+;V45&G<eg-V!94pcAamp4lUTy`dgaMvG-Dj{MR2ZJz!?mlQgD(
zCVxxo*X0l=WT=|*rA!(BT65GP;Ymtr`UP_AtLcL}*U75V)k;wJho0l~yrAE8Nl^<Q
zGDq67sq$oxQ@5C-?6;v4WG^DlEgyK`0lV>Fr%s))X3ZLi(ziHnGQhXTTv}%f0~Q7>
z3>+~G$UJK1s4K3xLKzSWKUf^6h_aXPiNyi$ph1IFy1I@)k66R3f-MYK7_cy4VW1WU
zWKSV;_QxN8jOU+!UMYcPW@bVRoBH+ZhYK#aK&2N-*`gzBq0ahYVc?K4Ap2^ek0kQo
z>#x6#OD?%YeRJZ#Q9z<ONHiTEA0M^fueD!2<l3wZhk^m4L@Z~+%WN#aQKB7qGG%5o
zAf#4xt)wDn7T7~)feIWLC%#@1wMCqn*6hop;u5ecZ5z(LXcA`MaxGj@Nk#IO&$u$L
zdwc78TJjE=`96ToYz3Tbx{`98kdTONTeslaTV`R>*by|OE9LVBWT%q286c?g^P@nP
z7ouaBnYIz<T|Nb^;@V={nq?@h(s=Un3!zR$HpE=--iMyV>8A{$(s(TVe0`~`u8lIK
zx{AVms!ghD+c?Oz;q|EdwGQm9?V)^|g1gYjSe$p^IE)y5E^eQB57v^evV7Tc{QC1E
zeDmY4wQ{#@+m6Pk#YjuvX=jkhaIajx1|8eQ<DnT><J_}{qF09mmCub)FB7T4v0+mo
zyxeHuK$$dLJP_wqhBS)(Uw-2~bW4t=N<#(tc{T4ytx6B_L;B$2;s!U{u(aeII7k)$
z`p1GpnXikAiqyO;9j>UTP;>XjjT`amtFNj^XlB3ruSba0K??)_5C#n0Bu0ZmH;I9Y
z@RZ~`6u!6c!No>H=qUmDcC9(@9~vxEt!?R&vGWr9uS}7@@uqF971@$N8G|vYE88Q<
z=Hw)IoG|3<3vktW3-J6qKcY*=_E@!cgVKM?V-O(Uz%T^+xZu(I?o|I$mLo*Q#-nuK
zZsZlqI;!dJj-9(O+V?8lF!M1C86?i}<vnRR?ZV7Tr&DOgaaY}d=V?H=hWc%76XURn
zHUd)b&h%8}bf7Xj9k))s*0G89>x9H4?4VNwv5qjLV%JV>uyVypJon}&=$sVIcUl}r
zYNRH%)%vDeiYt{7WGUlC$vdBxz5_8)p_n%LQoQlzTexu45IQ4hh14yZ@aU6I>-t=R
z(Kg->o3?D{fYAPAzYaDf5A}%1g|^es8T443c-mP=!u43Uz8Eo~bj*-d%(gl)!r~6q
zzZHu<!!Z5}oOIgh2xd?OY3`n#+p*}^CF*`ybPO_?Ug3@HZJpE(>o#n}=@(sxo}JsN
zG>+eG-;>Y4y*FKkJ06*b?p-@$`O4KQZ+X!^?Du5Qh1ejxIOk#YuQEFv+(V)fbf5?s
z+4=VIZ`YwSR<Bx(GcUOT=MEdJQwzc^Xch*9))Ah)@P{P8o`4@6y-MH#(IXVwxQi~j
zNZofFM|I-}9}dlu>IgT+bY7zCTz1)Im^W`84YlGR3)qSkD-^R$Hv2L`Sc}yW9*nxh
zAL93}yd<kK?9-zz(N>P*U9)8m42{6hi-utH8($(gIuu2_vbf{tM%hc0_c!4`AANx?
z)2`yjM5T0oRKjqOcSha?9@OSv!qG2$?{&2R#L!~Al2Pnru9C&3s<a4R(J8q1_G$3<
z6mK&uwi*3$Ok(CeVLtSymh>-MvRRf3@=L3cw|AE|URd%uzW(7?Tr}bowyT=VE3F7_
z+A52Z6BW4GIXwUPY<#<96G8%f=!HoyAfgzZm%SU^PacIS6E9K*4pr5R##gA7@T;q|
zQ3G1Jp{k6#UqV2DW?aa(;Ru2op&8`vGFt@0Aa^H-S+4ZUaU4uOg-`z2v3&z3QOUVs
z7=)anK?w48QwyK+3ZM`wL!nFcqEi0YaTD;<w;$uV1>d1{Oc>I3O3gKBH%ucLPY=H!
z^zL`MG9dKgH7j6YRVc02)6}bPzKa39JJRC4mGW36eKm82)G1|%ap2<bKf?o0zKp2o
zDCKEPSIFL0RiMl*2oKDfiO3*}S*Y;Rf`i~%@GeYO+0e@-V$YsEG#E%nuU@_Ei<wE+
zf-0;m76vQ~G=c#`|Hy{^;fEhqk*!2gq@+ZLQ@`u3yC5DZJUr;>!}hH<Qq(bXyY?Ea
zf5kI`$ayEX!#m$?L`--fz1~qE#QtU#(5oTg-p8N8z&_m&;^(QO$klN=AVyQN)|MA$
z<GDExsyyXIIqEFl2;Jy;Z~Nx0K(`_2)IM3?Hw1wCbqpRH5!sC9+v&K52!%TN4Qe83
zcs7`O?QhnlliA?LWxN6f*%^!`-iD3<zQMxpe!}?C6atYB+E0OwtR*$H5!V()!&Kwt
zryjyrzpX_`phO+kw2?R|D9G7^&I8ZFv}-O^v{9XAH0!7IOK7l8-Fm9@ttenHu!oV3
z1tvfCJkCDjR7BF)Q5-YKCaxB}LGP8~tYOFI)wu2Unee6qgaf=MAn0=C`?e!97c*x)
zfF3FFa+{GD%hg#T^YIl^;O?sFn>O*$EKevk%|zEv^-&oVvi@Rvg8K0FN7T)tTun<k
zrgOYj<#W7OEm?$#Q)W3nvR@CqY&r(ffY60wK+N06K^kX<T<G#Euf7%^&3_0#ZOKBQ
zk2`XUq#u$;_t%WQ<OvRo#E5fG!t?Kb5C8BmMh?$HWmyqgMYo{~$Srv9lP_`mwd3d&
zl=hmn=y<`2jz}WUK3(uKUVZ-?M1%&Z=-JX}8MBJwJcK0o!p!M6QW&J^e={zU=4b(#
zdu6Wv>8GDCefo4|&?FH7qN1Wy6Q@p{s@@+<7;?0XnAMJB9Ru>c$@e7mknoJeP;eKc
zrph-byd>G9bf=fvWy_YSv!pfa&#~V3zq|cS;q7Rfj~j2Rta*nAbB)(=c*<|8l!MiM
zWX8kLZuMJsWa_J5PfPFA$5)L)i<DXac}r`mov)#C57+xwyQZV>m(caKKefa6?H#G!
zHZ)!`Vbt!&;jEoyQvz7G{Fc8XbxUfzt<u+8Q0Hf@XHEXl<65sg$#X<;*JPtw^w7}e
z<&641bLPxi#)DnDbb)wDpFMlF@{}$WnDi~G%*te8z`}rqffiuE?0dvf$_F2OfKj7H
zAwE7{?R})Uv17+7$0?$8V9il2K(Lj?!hnSV3j==<17_|O1MhRrIS0Np#E|QRgaoA^
zCQ7*h0Rc+C!7}vzi^#UJTNtom!0bgwj~<Qp-g{3u-W6J@UHf(_x{m0vTyxDe7QT*R
z445$tr^8i&?S++ar?|A-rgv@RsU_uF4?@@%MuzDhL}NKZr8u?aS)`Umrd*I;f`C9j
zP?UIBK-wW~HSKA3q0(5kAt;=>Zv>;bF4tNnPGhR_DjM&JQ(v27UwQZ!K&?k?>+(N;
zQKhu^X@#|P$SjgwXLoM|RA)10AMo98D{#{BU2E6G4jQ?173JQdYbhXdPXmpkRP%@=
zof%h?$KAt=j+{HF{}H3kLt#N4c2kD4e*Iefx%hW{^8QO$El!>Zv5fw+g9`k@SJL%X
zqT+zNdiK+AOYH`P9-efH+xd8^k^T->i4epw2OaQwhD8GfyJ!sQ4sRb{{;RCk;UC7p
z{Q2|o`RAY84ZX!^Y54HrIQQIhRm<wWGyiaNt?Dfd{3|hF_)0w(mG<qo-&W2|I(F=+
zoaQAbCu7{WaZ0X!;)y4!^;C58EodnQYSv9zmlbIBszWGH<KL6c;v?Gk1=jusSK2xt
zUzc4{&c&UOmX^lAMF-%?Xn=}H;z^A9q+VA~f871Zi&*|nTl_)e!LE!Rw`Jpc6qC>@
zq|RA!p(_#+li)^OwL%5}sy^UMgC^?J(?%gJbvr60q%T3b(4}iPtXjDOr;eG38B-=H
z+Dq<J6xbltXr0xjBkCqL?`24I5<d9jM|3`JkTM?Z)S*2i-)&IIGj^uK-O~qclA{=1
zx|$LE3TQIn4qrM7sUVH0BPt8N4lqzcAX3`ID&xT^_dJ2|W6rWwDNZppiX!6M;bA%^
zn0DXONbcMLD_5_x(Rl~3Gb0O$Nl94w%h&4PvArETbwO204mQ$wuz%k^SoQm2)Pzlv
ze(Kc4CA4=S$WPtB0|<&tz)PRKjgy950RO1&43M=AyBOVB)<5ZAD5GZw`FUg4_D%Ty
z>#tOPbBK#i1nn5fU)ZK^v7*@cHt?)YQ@`(>ejU8&?ZEIP<fguM!}Yh`hfV92WBwP*
zA#$#aw5`Zy5Qxgs0&Gn!LhJYhc(}WvxTugijn&GatrZPWcci6acZH?{rK}F@`?@u&
zfaDV~XZ8&ExLc8f^<XsbXvRjIDBN+!9r*qC-<1P}{QP|E*s(*=t#V)VP)*wAm3(+o
zY0cHcQ`TQDMLr5af~%`5Zoc_uWk4vuB~+t$lb<nThVsxQi<R8B7;JwT<;^cZW;K~>
zn+YCndV^cdOdMAGB-vngHSY9;!|<u63>|?vG$8cy4P??RHBoNex*Z8|k+}cniRjs-
z14F0|RFQ3@EW3dO%MixEmeqgajC04yqXyyf=?}n17F0D&H<+Z!oAQndDgwe{FzTx7
z@yp#$A}q2s^0(<pIeqs&wY9(a?D0rm^&R>!f{g*wR^wS{(ZY`~aq6AsalLcD;Z(A=
z-4)c=TXPws*wr(DPqLA<Hy5DNzK$eQQ<M+|E+pzQ(>LOd%WmKUPh{`rhMOS$XbK{u
zTC2z1d-g(UagpAjv;V$c9$2#MM=V{r4uku3Q;ZJjo8G|JDUlPKmo18svsm8Sz-hmZ
zo)f@LyMQuO;Pd{2PUf#C;Y=?<0)p?IsoRj0n1I)xyc@^&>WWDhjjZ|hW%XqmNhijG
znQ5Ca>EyGpT;;BR=zGp28v~~PGwaU5F<`uatzNxaZ5|R563EzDuZ#$Db93?d<Bv0x
za^OF*m>s<JRtgIP{|*e8wPgJG@epR4D6+|SCn2pDELeb3Pd(M{t>WL&<C<P*I`IHJ
zd_ypL>{T=%oC1FuZ|$V9maLPxdv<a&*9OZMzJc3kanpDAboi<@zorbi65~PH5Is8k
zF1+#ipIl?&v2|OjT1y1Kv5}$JQka8#CyZg_TQN8nV*_zs!5#3S5JR=A{bzs4qAy5l
zCV07Nj`{)i`(U7P1Na6<VfckN<C_@|Avipq285|9YZ^D%Le*V%&QP>lwjTYux3?E*
z-e(zGfnUD<6qjFroBes+i$_ntK+#5jbu7B{=%b2GrB@+OhOsQGI-ralThrrX+Omas
z;IXH1{~b4Rqg_M0NCri3khZBP$;YGj-ikNg`Mhou?Z2OV`dRz6A-WXpr4EdmS*~fJ
z<?FVQu~7{VPn&}T8!jZX+3S4v;eYVmCU6s(j7^(1*Oc4PmC!~U?1V&(=U%;gQy7!4
z?uj9uN2_WqocAWy-*&C?wj@TgLWkL!Wh+tta&dKo1ZiYzNoQ$e%T_M#s4Ub*jD9v6
zPv`>|4_};m#@Wh%(A!t&Q=Mizzpcc$DBN+~rRbcJj1i~yQ$~cUBGxT9m3K&B-O`^i
z{DRBXJiTLB<d6FXx?yvh?b>W(vo~(GZQIyvZnkZ^CR>{^VY4;q%=h;{=e(L1@w#R{
z5ANrNn^-u()kRqh><eq9FLKEX^;O2Suey3#VRA8}&(o#atL6><J%GR=AN;>!=iDoP
zOHzC4Lx&3MV3>#bd<LQrdTct4jg9?Ego{NhfD=z+&?@Yvn`ommT*(cfRIXOg0s{hb
z&@k4R+L_X(0*(JUjeSBxg{{(}4M{wH@0Q1Kss~?;qmId+96C>^exr%qedgtlo|gVc
z4Uj^EnffsMTW^HgThEi2T>gWMjO=ft8Dg&YDeb1uRgVns$n{2C;gOE~|0|vA!-irz
zMsScx82~Hi1ea&?^GOf?xeSFN(<z^W&C!<qep&?mk8=PEB}y><F*P}f$ZjzM=C0-D
z=KdX%CbZjV9cfwBugW$c33$6nlRLW3f2&V79$v}i$j9JyzMK)AcsTi@DLQ~^JK*+9
zQ@hsmkBqN1hB?e{$x4nB9~s+kpH<+SUkKc`-_>vCo4Kh9=?ElcNz}M7AG+iV(yREy
zA-?T84?BGAtAPP~OE0@n`K#LCs27-9nTe&tr@oK4vpPaVArz(ImB!gHOD`{~#IIS<
zi8+;SrTAy+R<RvX&XJtuZcrH7qlSpc50?Sny<Eh_+ab?4%g)+<T<vts^aHJVt?Xqu
zMbApPc0)nP@0D_+VrphzZ!6|z2MHajY)<0q`h<`%byf9x{UH)QTWN_{jSqO+Z%R-8
zN}CLRcC(_m==);Kb3kvmxRmu|Bk;XqNpCgekm2K6{`%;#l%8uPsIwF<cU5Wfl0QSz
zh<t2Etm3v6t&4*v{G_X$*FIBTCo_ChgPA>Q^ZwgEP;9fC=vD=fgzLYtP$H|Qn)4ms
z6i)BEk0yju4AWiP&sA}y6^j2|RxrS~ZjX<bWBRggaE^KY0y`!J$6DEcqV&@rSY<sc
zZC-HFZH#`B$K&Ch*T$h#B5v7ugyoGi1Xivq{xpVZDmbSmEpb<4)qP~4tq7Of1Fdcw
zcuGX;yU7~IMw1sR=Sq)q1TmN5p0;d)3L7yx4(*V2{?AalqQ(hHyRmQGx(DZzEqFWQ
z>og+1-$-5J_38C2yD+8%?0y-3$yv~#1r8M8$PIRPppXx*7AdW-cboWgT*~hIGWTua
zP4k8bBm|1MJCfq4>U2nYocckoFuq~|!ykr>@lgQOlp*fcW8*WD{vr^qwxxrFA`8*}
zSt+!;N0&kQyN1vSD>Tzvp{ev5dq+ORqk1utj7p)u!`SX)zwzwG$Xebxks!m3c-HHr
zD@>rW_ti_6Y)MK92a)Z;m9j^vx4w5}Wf9mZt5?9y++q6$r$}4e6LBEvbv+5Ax!ss{
zZ*D%|e%>A{>pG2F@{Qyx<;|J5_U3vXy?CDeMvCcirqj8Ijw4e3)$e~XxfWi%)%C0h
z3IloVB@Vdj!V9D+bisq)DsbTUM~niEQqI?Hy=Mw<4;kgo>R>RO{^l1#&hqrYJO|pw
z`}1(XFX*oJ5Ve;nK8PWv^wqYwyH3l8eR)>BcnuOV1dULx7p4Yhb-|P6^111HIv6Jb
z7i;0)^Vwi^5d}<W9ES<`StR6tJ#Vt!#(Ec-Cz_g?8deng42_702tcY6)ge(c)Hej5
zSjUw`*`t)ZJ>zf^My#p15$EUUSBxJ#;<AT^x3aDEYyrlNuvMvQb?lGh^C>0Mx7l-_
z!vhHygCM;_xO-<2dw6aySh@xi2Q>2XHh%9hc+dMa4HoaeClPT-Wo%8kZ!(tfJ@-!%
z?cV=b)J$L9$7#qYM6k(?7(&CL=l<DIG6{OLEAy{LL*Za92Ab!sDKm*S-Vl4Q(8!fQ
z?D=arm~B$aJevJ}-6g@7*cc_^>78`)eBaV=T91T61;DE@CT)h|IHG+#PR6rZpF=+b
zsK_?mgy`DYH9V~k5e$y`tJly23#d_k)u2B};^1&Y!ys;mV<WN#F8$Ih<(_otejv&2
zx0Llq#+9+vY=M57`h(Cg86OQV4pL|e%~ZZ$+Z|-kWv#)Oj|c7aF>T3&NkAY>H2;8R
z{xnS8yR|9Xoj%SL-pS2L6)7Wwl&g5HqQ6;|y4r8>$|J9IgT&dmK!AnS9WxzUuS^<|
zv;oA8Z?t#_#o(g`qWEtIuFR83Z%`8WY0tBBIQiOsr!wG=QooGfUqF;xEa!l!Wy)-)
zVP+gyPnC7tct{7&yK%G^O21SK;lA9&VG`j534Q1W)27G&=I&wAoFGQ133p{d;sASQ
zbzSnMYJ`%pX+)##iJ=IDLO{VJ&{SwWf2)9`Z}_ibPY(tbBnNjupbs_%e16a=H<2+h
z_q{nE@`BaqVIRm@-db6NCvalS+5DzF#;m{fEfCNy&%)%qDN`P7HdYwFHzr@d4S5(|
z<?8)mdvSKPOc#eKE~6_;+1BTB(2P#c^CFz>yFp7zLQgHj?vW%R9pXh*TU$?_=C#PF
z1&GhH#l>2#NE1~>asc$C<KY~CY*feLQcNz+@)P7k7=4YMHceKNUoS7@A-NpTy>f9c
z3W&$-Zrl|^;`JgO6b)XcQjHlvxN|xAd8`t{^Qqh}PDvWXVc?Y-%SA4Ka-|-pM$p7!
zdktSH0Q;?3?nVa}YGJ5+7?a=gOk6JSop8NPemG2i12Z<M)sFx?nz2}{xSmf>^`}(T
z36Hwl?H(3zzmk9XxzmfMD8P@XIP<AXn>Nu|-ZyE@W=CG{dxF0C@>f<m0yP9=Eof7M
zySw0cv+&){k=!XWxq|?lAF26%==<g|pX!>xD$FbPi>R4MCi?bf4Hl8*=$2rQh&W`a
z#+aYR#JHSGM>ISyEKb(C3K_0#eq3B+9h*`$acKZ;p8s~E-3x}e>yydVK0P0#?@>JY
zQq%puPOsUH89}X}+-Ac!!%Xw#hdU1WN%0*TfF=l%>Z(5(yn3u2t5Nh1!FwIPjax39
zXi2~U>D?Z8KRoweR#~E4eO1N(Y>`Pj89`uwzA;MXvPR*(%`x#JmE31i?i~8Zx#1Rx
zFzIz*AIIZXPT)vJM;h1I6Mlsi`;6eOks|hj-iTzrS)o#5F!N6nsPW9hPVoO9MYMl!
zB(NYp^y3BWW0DG_jTEQRFFQ2wltyRND-4;)mFP!*Bi?4MmudQ+B>#Ve(ouXEq*?Jt
z*Zry6-#Gg91SnCk=1%$U8+L89b@`tuPqQY-W$HfvT|ju8aewinPf(3O)J@473v24?
zR$~e(D=V|utT03XQxYkpw0&|YxRKPy{{!hXaV;^S>iRx9GqXl$J9$zuBy@wulc}qk
zO0x3j42i(U7j+~!MNQ9caJ2BK%d9{+_~1o1y1K8cU^w-MRkPcZb#Q2i@jZVi>Sajh
zFT})DGnMv*vjjHHFJ*Oz`3#I{77BgDZ^%P`7y0&U>Q)Eiqo!WWc+2VNLk+rG|28?{
zVKeK*hO)!5!cL-=c<S>8&-+bG&Zs7u>Xzd&-CF;MP}x(zl+jpT+>+?A;9U6SQ)#Xz
zJ~CY4s>3d`3p@%fM3{)6?UGiA0X%(rVV_yZDFwklHYworF1ndTbk@v_N$-TY@?E&O
zxU{rLX)rfhdN>5QTJEIDe2}Nrh#$=eoEo{QA)8wjmR~-c&P(J-#5dL|6>_OUKc35t
z<jG-;a$T0jbku5UWA%sl20*?(+73lJ(K?>46WG&e@MRX7?8-NP^qNwt+pSf^5PTmj
z81s-9d<hE?8=8;*^aBw}^@!t4d7pBAZ;l&zY$mF-Wp&1+p`*8O{eCK2$?7H|GdgqH
z8=aN5HyJ-@Z1?A7n;MbTeE8(L7_wU{far$qq3R`sFLuAWOZVXE=+KxqskN~YUCHUE
zD?d@;`q>`?HCrP5k-(SUVIGkqGl;#Ol4ivM`&sS7H_69Zwr|sH`*zJ#Xa6^K218_w
zPGx&eGPco_b?*dx_OP8ZGBbydEswNcgR^OcRaG%#r>ZJuiyj(LN^(EDnj0~l-)m^-
z)%6TShfYA(C2Ukx0euZW*wh=<JLoJ9ldMPR>^Ri9rPA-HO;!h2(XdVpz=zUK3^XS@
zu+3h)(|W*m|6h0wlOFXEDOEX!?h{|Jlex7O7cVJOdnRUj34993V^gb;#x4>sm{obg
z_%Bz0SlAN1RIEZ$7=|*H<IZ{;1Ak;*qoItSVpx33J1Lib4UQvB-Jt!ZKWrvxUNP+}
zH+0ImR(bp^S1v!5h~3T32Z=urr+i*1bX~XMSmFZT{WMTKS$N=!j1H4pWF6-d^q;rF
zR>dVvT%Fv=1oD514usrWY&@za6Ok~yeWM7^4vnd)TJA}mOkc~(i2gb|C8?^3Yrf+z
zKmm&&$l3G#qGvaX01YoW@MbAmr^~))Vt=1VxM!IL%TK|6jN7_@BTIoRSQOW^L-{1{
zXK{bd_jtZMN2**eS1y=)a>nmi2`e>-rFH%TXzk%ZkGKA0R#0~I`2)-xo|Ig5d}(+w
zQt*Jo*VmlP%&_iFLbuN_yeA`2>?$ew-#TIiHOR9$QkVlGwrjBUuF-n4l{-+RAsj<s
z@IUX^!X48i^W={!eiApZ6voR7@9WHuEB-Oj|5=uf(8Z9fw%Tntf>}Z)mz!l51Qf~o
zW{uyZzQPc0f39B?v~&iZw-JdT-J0$p#>os8-Q@wsqU$6X#LAAGo2b+;8`oxUuSIm5
ze}FSvX9IR8s_KdowV;cDSi7@%0sR_6AGJ|22#CXBu~`?%+FjprQf_u*J%oZj1XTWn
z>8No!$>`j79sNxU(W^pc#3;Ex4~Mmo1KhvniX1D@YWA4-WUAgZv8A9HVa=vz|A35;
z8;HdL2Z$#K-9DM^WyKqeHco$<T+w~0rtAF(VoXD}HtI?*(HRhJfK$SR#`*<~^#fH%
z;*$!-I6A5@FgPMuIf@jH2C^_%+Cw_rmD#KBCFgZ!W3mxm$6*KWuZPVo_tQ*vhDz6X
zS+G-0mkmV?uQk2EmnJ@d-u1qO&A&y5-u#1dnd<5YzO-9<G0rnimXbK~0AO1BSZ;os
zt?n#jA_Z)(e3>F)0qj-p5Y39j{5a66d5u3y&<(xk9^|uGd}`igdRO}3%LLU65qylc
ziTVB9Lj16DSh?*uuV_uNTZR>0&1wySV3Fe0L#3l$di{B}ZmHQx;MDzUXz5@O29p3o
z0wT=I3v~Z;z0-=~o$rtu-#P_)j5*Xj0~zMhc~M%E3*<2^bGm+qB@<IK_z>hM03+&|
zdiwHah`+dRj!<g~y;&d}ans*Us^2%>4zCcyjd70g=5Z|Wq_RA$X@9mKa5VStCYiUc
z{V$Dnr|<8s&tzqr`dh=vAH+pz(@aM^eC8}j9UlXsFoTc~>(`5AiWZPqX{hS8x<98g
zIg7yCZ+ad@?f&GifAQqM4B>WthTGi1_EEq3{NMjIj1mJKoWVySUGvd6A}vp1R~04n
zj0{LedzHE$^aVJ(gCC2DA^$pct_rS;JDZ0z6Zc*g<nU}(syVk;lPu5cA>PuJyU2W4
zxO9e_jpq$G93pFmb5l(DQ5v&6d|<?vE2&54l16-DvC<k;1q6eSjqpA<Q)#fNkKs+f
z**P+q&P33;5=MDI7sOVs*oa;|T#Cf^Jqs?^sDRVo^e65{MT+?0&bWGCTUFXN*73u~
zXqSKk?tp$#FFr%;oIW{R370fGQiN}1yYD)d59&HzNDt*E{{|$YR~Ev>Mt@Zn5ad_W
z>;x7ebntV!#usp36T6+8)1%h%?29R3L0X+{7s)vb-ymMiMg+Y-Uxhsqy}aMhx@E4^
z>5GK)y@gH6$jRkX)}If#MoAo!8=sVeBQ-1K^&HrvQmFo%y1;RVDQ4mxPXxSorB4t*
z;k_bXNQLRIcl)6P)i}9KmfmlVhMcU^GjrzVLg6Kw$>Pjk&kB{2luj2+G(=*ayCi*>
z2`a)|D+SwJnC7itxri=j-m5;f-XHZhq+}8*R;}3YzIe4MRmaA}l~kC7DeK)m{lics
zsFG=+S)jQeIK@c$zFMbahl$fyLQ?jwK&Dox>4j>RFGL;#xu*}D2I)7QD35DShz1zC
zki?W;KcC(|lsPDsz2+8&f*xWH8-G(}6aZsKXM4;hm2?jmmVmuKD#F3)=y*Yed9>7%
ze+5wY$1xQgZrJsAWJBQvsa30vdP@2=d=D|VyQ1EeiUHQT)N8|Ne8e@3f)H+B-`P*Q
zlx$TY27PQ|-RLyCB?2i&zL>aG{*4_UffcQZBzN3~GwdGVcE1_H=}Ltw;DP%p3Kx04
z(H3ub^A0u%DFdfVU2|9M9C!`Y;?Y1x1(N53YXfoQ7t1fzCg7R~5ZwX-Voi>SRy=<Z
z>vp=*_S`SXRu@B=5tZQaH)gdgL<vWVeR(y)jW;at1jEMF3=!|Jp3eQ9W#ELkZjIkg
z=P8NJ(=@2M`(Nh40!Hxf|1}H;7yAtU(<)$N^tF6KfGG`HumQIT07*@kZeI|5Y=sSC
z((9~8ngm-%&@eH@^-~!1cysoAfX?p0Mf)10_{_5%BE#xXF+IZ(ye<e`(EybqDX8FI
zRt4JU1oSo^ZoGwnR}h<xMo6Pyj=V#B9L{D`wp&)+yBTv0tCOxuMM^3C0DZ+W#Of>y
zPZZmd5)458dGft+pHcQvbzb!P;<iCAS=OY-$|9jd#FXmcn5Or6oH~HzLQ!>X?3QS~
zeYsdb!m7+}q^<W|uz>lsPl60EJ!54;xWmG<=_RYT`0czHc7t;9DdXh(pTBx}r?Mg2
z|3*&oBRr>Q0A&6DDxk-)U2q_8(*j+tXYF(q7M~k-ZYg#at!xQ3_DfdfF8@k_rGiXW
zFQVl{rQy$^JiVHYzMS-^nIlMA=JFJO9Xm?TF#xzW!on;q?Y-bHz`%U%V!sLc-UnY`
z7IS0lGU4lgH?vf|m~chHYjr^DWRBl%R>XRlnIw+UcP?eJ(N>_qtvkZ@b-`T0(0|Uk
z+a_Q(TQ0V)Tf{!kEt|)tmku@ex6C8=Tp9T&L`YWv0VR61!Cv;4iI5tdwo-7Kvolo$
z{gvor$Ek{hFxnV1w5dUb@5?QR<s4~Id&*QNu91;ZbymaN*x{z%(-w#CvtzJ^o7UBV
z#tS7YNrpiYde!{r`%W^zCC^Da@MRM^#wjfk@rNE?DCFB+WogJ-B_?O*J)JkGf||Ct
zo7M1YBAuOE$g#U=dMsN6hP()pY@co6Y3l#;0+0@Xh5oHP+C^MES!X4Z9FQqp6uYo6
zY{gEQB^Mvd#ExLWy(P`4)0_{}QstDLy&W!-$a=qoq4>+|PB6#W3pGrkzkvdlw$dAl
z0{IBR0u2)Ym5U}T^??-wEFJxPLeTR7PIDN&d4lYR9YHR8GCwm;8YHr^PCzTGDw9X6
z$}*5hrxbOrS{@eU1Q^jtHe7{2KW&SYDEdm{K|L~v>Ko3*GwnQe%g@f8Pqnp6t<w)-
zROM6gL*ziq{#S>&6+bIXLy&Ncetq=>t;uzMbHQB<1kxwzocE({I4?@GOq06Z$<;-c
z)p`mo2iRU4<UCA6q0t(DH+@oOlJ4_Qa*=wvt~ZG;6sE(H7l$b2r}4?>LNCM;=xC<d
zYXghp;duQ1y}g0M_#Aq@jXhbsRtLTXU#aZdMfro<>bwNbip8-u??b>!hu03qrGsln
zfk{EiR)>qlHgoVoJ`GCm`^?735PVRDZ37Yjl3~^69rS>U%s5ouGLb@Sf@cnA@N~74
zmzRaJSdB7eQBI}^2WMUuPt@S;)|JRA9~HevajhVuuy?1=?6*6??SU)X$C$;Qvp7nn
z-s0;ggSSK04bxPq)^zu7{^mNPu@4;7D+7ktSdd%}pAc}AJ7l~J=+!9;eyBUksL_v2
z)s>gs&9;BG3{Jq_2{c9ak1pZ2yx_Y1)Ui3c45?)+VLaN}`%zZok#{wIqnw2PY$<3k
z>505|w}&xPTeal#IWw(Z1#%ZSU9LEku`x)8r?XI#mlpu$F0Fb>HA24oJ!crIblD5^
z_BM@1uOtF%Gc!DNCbVy6<@|G%hnPm;`nsHABV(tV2~#v^spi>4-!6}hutc9XnZS{t
z_y%cpIJKHr0I7-14zJkMF&-)H@tb+VSve+O1`=$mkx|K;j%Iq`yylns7-}64!q0>W
z^$Y78UjdJCZ4Ix-Hl}w6E$W(h5dVnNDYvEJ*Ov`H_)LWNB+KpT@~EIo{*tNZ;qUZ(
zh3Gr!d;sb)ZL{_dqm@QComrZA=6h-lxUp9j^C?__24HV^SiD!i-Voy0r2G7UPAIk*
zT+)x@1AWuOzY#UYpz;Sqhmq~)b`kqO8%=6T0)rPuSMQjgd|g=7uX&<#bTo8sYHxUp
zZNJ1IY9G?CxyabQbFIwug!AS$h<m6fE)W;-I0$??TG;#abUymV^A0c!zUaH!W~U})
z4<EB>?EXp7U7j*{%noa3Ls_lV$pdcBT{um8J_}U&(mws${;ZBm-*C}#)hz$1GI0wJ
z*NRSY@nS!48|$u(!|0<9b-Nd~bhukvv*N~i?p#C<)3Kpl<LxF$!edLAZq9}7tXA2r
z(HHX?wOFQ##Ru3mwXCm<bSIh4ZVSFker`{=3+Zap=GIdVTeK*SeVYt3{YgMcuuenM
zpT4-}BB<4Jx^#G^a}@yKJ2=I#>LOGm6tLX#SX3iq7KC|Ve|G@2R7RJ+x^3Ueom%&4
zsOVnE)u^pT#a51a;hISc0`Tzxo^S^)$FC}aYyg>vrYpoAB_@7AWd{DJ6ZOaA6W-w(
zWlrO^*N2h6KE<*>^`XE6JX|B)bJ?QIOrzsBq(Qw|*%#QZ9Swe2>Bf^&SnnRAoZVpE
zk`9p1$eWg~x#$C*dMc`rU^*W`bh^5@7r|AG*@T;@C}bH}iGhQaZi@FV=(0Vh-RBoy
zmE)eVKr$MC-sZjOMKoGxP<M&<z<7A(P=X6uw?$fe;fos&>#f2yUMyaK1;D|L%61oq
zwD`>yuulM^jc+OL<BftH{eZxWn*q4<n-(-l_hkW(9V1q&G<7kwYiVc}>~T*Hk4xPr
z&5#?0@85@$u3UEegDySU0=!H^z>WX^Mg{Oo0yVTS_1LCEXcuF_T5JOMB65q(h7Br(
zsWqPLdv@FKtcnP}7TPap%pgcn;guh|_V|jS{O&>NR+w-vo1Xe@V9m@($=S1-a8CXj
z-G3v3A!-7vx@ksz05LwkHN2ixOaPlgx5i<Tw9+mnghaj}Dk^cT60WKD7~F^sAiCS9
z=LyVfa2XJl!jfZ@aj#`NdVjk(W&$l9k%Z(C=++|a6b;+d*mZqlLCv^%VkiI32KD;6
zVXS9$mZ!BxcH(RpN$ZY>^5j1&oj~^Y)=xPd>n`BfIk|HApy*l;h@Sics?54-RDbK@
zHEHnmyZvi)c83CT?&gzJU}j|<kdcvT?3c2fD@WV;G#s;xqvv-=)55(5xx8)CRNkNg
z1FYS2;@tYj;4O+1I~9nyV}L7_ZsvMquMzhspLOvqeor5AXWnyTl-+-uevDRWw0&Eh
zueB*$E?0u;6><Xbcj*o_3iy#vpSpR#_U2*c%^WMZ-@N(s*#w|S2ZGGrn5g3LC#-<U
zNwd2*pl4XEpYyFT!0wV(+X7!709ok6--{X^JsIV0wOU=TD&G!gbz5KZovQ8Xnil)$
z9?9|MMBlsO2Ym+}d-gTPwx3~jwtcWy-#}?5KLfJ)+{dnq>W<$qjCHT_2Nt+lmJpat
z?h2&j-<J6jzuLH;bnn!tV&wT2R^u-#Pya};+zt|_r)=p=waw-k(c9i$Z<tNf7>`g|
zvAe#ceil8<;m*zIaEM9ZC;8270ey`3J@R-f!s-kws8CF}S7fhb6u-k|PJtZ77SoS$
zjGSD0v#_e>DJ?twg}STV^Qd_G8_}jijc)G}$ZJ8|=5IYSW09OSGCt23KHt6USvU!`
zHX;sl%j0>I6(7O7>q~U-C33ezD|DvbLa#tq^$6mzj?f3o%#s7#D#pXR^IwgX;=D5L
zNsZcuZ^VM9wb=hA&+8K+W}dufYd@>KTs|8CF`yZc^|Rv{*!{Axmp}lJ$?nkG;^V;Q
z2ZR5e+e;R2#{F6V)&XI4bTLkw;6u;m{pMB9=DysahFShq@cmu|(OW4G3D*!A@3w@~
zeG_FRyYE<wfZL%Zj;PHnFp-Nwp*>w~_d_UEKdYG{yr!i}L%UDzeGUI(nZ@RMR|MPC
zA`A)7IQHGYo6}){{H#x}l|TRBWLWm{gw+Nbx=yRfHe>qVKg-FTot+*7Q^FBVKs%%b
zsZ-NTjbYxe0rLR=4n!WXA3i%q%HUk;xHVYtq8m8;qi>;`z6Htr7pX6ZNhgSfl5FOd
zGb)o5&h+Nl^~yzsbhFzW?MW*_Ngt6`Crs#z$;E<9rFQI<(9@#@*RHvt97*m%WZclJ
zySC!yVlI$MqsqwW23bO!A@>Fc*EIBVYJW?Ut|4h!R1hpXiy5)89HCS10kx8UQR^7f
zZt&Nkx{6B4sTI~-ron&y^Y{vS(OK4=2*{vCC1>}#YOU6>Zz;D}ttv%hlXhhoR9bb$
zqRSXDM_=U}XW*++t=zST%_U%FQGW-u2Kr_(#cTgS`J0@1!0czH4pPr6yF6@;#qV4{
z8iaZgo)h3~sZ<mE{<l(<cQ9L{$vOkHRAt6op668&|FHSFb^?rTq)Bm(t+J{zNA6NA
zee0M5jFmuB9exU!B<UIS;Z~(Z>Hv1Ig{3k|{N5O7;7ir30OH@V12|)o95|c$<D%s?
zq&c~etG_o5sIYSe-QmAoh%?D@{eB*N8+(Xs7F*Go6#_U-j#6nYSE;o?zAgOTe4k9=
zJOpgKJ77wg6c)+p5MD_+@>aFVo_u+DGufl-vSSMJrd5pRr6A1`{DlskHW*Q>QufUN
zg@8-0VH!^|wg3(j4)WHI$)Gp8PYN~r*SDlt9tH+fmiYGLB*==Nm+YzXdNinw!JP)h
zY8ATm1sHGDbds!yKsnzbf+jUmaVs_{qRpnQ)Ab``1&ua+0eUXJq}fE2&r~`)HH0c-
zqammOwLv;9K>sM7Q>D11&V!uxF!OS8Y>UyWzI{RpSxqu;6c$`vJ$JVW1-+Jk*cb{@
zts&(|$`L<;RM6b^MHr;fS*E*>F$LY9j;)<JSwVHT^nuu*q2A+D#LI=W>bQlYmnLc#
zousK!-~1B-22)`Iqh45ry!gyvEot9z#o9JIO|zB`o^0SsxtS$}m`UgBa4`yF0F@mk
zu{r(K&+Kck<(qpRN8g426HL!R{Ov(b806l&UETg0hRDvJPS6Xi=Cbm+U}kP4*pEj-
z(4-H4w^pY{n-hsBwKhU)VstesE|L>KuZ%REXgh*8B0^1c0JQlxg3noli(_(@b+edI
zQlSef4O{Yhk9u+EWv!4zyOZPhg_^)0nXpz5E+B)-0Q@xVtP~jvtL<EF5PUg+s&b+O
zt?wYfbJ%gX>bhoc0VX#*+P-x?BA5b4eIE(^pF!+16b;&p^jP=JA^MO4sfLzI*7-o|
zmE8uYGlse3c_sJH0!5jkoMjtrr-8>VF0az*h@{pv%94O|Sa-W7;tOY}^hsA==fXqa
z^JTE;1RhMf(I6ZVN#e|35ib_ypsS3XaPR3FwJdi>G`z`V=jdA+xAjJ|XtmbrnlDxi
z%^f%&s7J|9@^KPc28=pr*D%m5ALDHup7X{&46G)ym0CMu5yFqj-cOfyL;}`zJ-<tD
zVSJlo|Ns8pMoxMUu`c9NYFCb8^NnVk=Sg|n?@5mv`AQC0({9y;1#ZdDWTYmGGdVwM
zI^FEHjm5=7eVD;?!Cc3>NLS{<=ZCx%X>kANCxO5VM<EfkZE?6tvS7VMASc`@5Q9aW
zMRg^7eEV3z_Jo1F)%&;}Lg^-9X#Bk^X0!#nCl9>^E7<md>5C{D<d~;K+P!&?2C9&$
zx68*qE);$qo4hImZ^k_VPwn1p)83B*Iy`#Q)~yTqxJvRY6Aoig0S*By{UDc_os~>Z
zn`$i7v^<{e&a20)7rc~%-MKG-S27_~LTtN{G|5iwmCl+jJO-<-YrVTdVVcIT;g7aW
z+A9*hAL_oUUQ9YM75G<*zIqLpB`f&_1_T8czgN~<Y-%W@akPQGuYk_l3i&JQju<Ke
z<{&~Lrg3$_?%NgEYAC4@7Pd;?b<n>SYF>rPXpL`#GOu5?l?u41iUL5(d`ENDKb+qF
zw3v^eSIxR8I(C9_Ds@fEPB!WVu^<-K5J<9m*4$aVGFCC6-R2hSb(l=?0(QO?u1@Xu
zLhP02pNrK2+_ue+L_CHiB_%gIy**tuhqBmOR}Wr6i{W@LKXC&j^YS<GYkPA9x%F=3
zK&CTwzza6L#-OB9IcdtO#z~&59F+Td|7?yC?Ox*&FIaUQmyhQy(7&8jUZUIh*ha6V
zgya!7qN3tR;O>>JR>bCnCJUVY2L-U|W@-vIm>QPBjGtIwU40_;<IcIg`6Ws?k%Dw*
zzxZdXE{|#0^>kEF4>;*X6O45Ny=6AZ>s(pu0_SMvr2Ee!Y&tw@)zbNe!>@U7Tg&uk
z*qC36Nbb-{oOtDl>1OSu^zedQM*7uii*k6?AUHJicNRD4pv}|Tb|Z?qrhV<(c)LJ_
zxn4C@2cz$Mz7Pi@OmXfVUSF1*&wVE*B~oQfF$==MoD~vc71mn(_*(mL7O*pP{p01d
zE>j217upqs(AxrtKW*FI(Gb6X@k5)_Yt&Ay8s~@xG9#c0G{_BLBZSUwZlyI;=VltK
z!K1WQs#X|7&)U(G&PG5QF~JfaLq3NgHsn|LBe?DDp{a+C|5*3@@iQVAQk(PaiqZzR
zbMYIp#byG;Z95v==YA1)hy8Ox;nX0y`UZOJzM-jjyIQX=?<4sa8+$BzHMS`EhVx}{
z%+G|<lUTj#Wr8*r-Xvy&>v*5a#%-SgeYn+X{b__M-H~0?J^f+R65$Aj@3TEW+BE9~
z-y^zef6}UHMKTEr&g^QfY5r|Ei!%A+<zWKc*BYp+M3a;fxOwVVVb<wFA>7OS+3RcM
zZ>j_iC2!+wV<a1jLR-hT!F(Vs*DVnJ+Ij%x5ULj2--i*NzWp*4TshDdva{E?TLFK8
zgi^P!j(y<?hHko|?F9P$g^&bmd4cf;RPARc2HWQ1rGH{$G)<P9l}n;ZNrKnJEQN&w
zv2bxM8O~Fi3X4qs%3ySpQc|yHL0TT~qV2fo&2f35I5CN=Tj%iEzq9NkdUTKhx==tQ
z>H&p?<no{C9!~*Z*~cWaI)(d5plh7IOr6MZwgWQzY>6y#&{V*UQj3E0kKI=1^0Y7D
znKU{qoY=cu)0=0qQvxK8M&kuH=E3JarAho`%F4WR0``+`pGU7NM@wKOMhLAxJ;KN}
z#GEOrfn%>5rT*(;Jn`GkMU_<iN3r~?heKPgUv-vGZy-4~W`6!TmN_Pj2sQNAuQwz!
z^lAv~E@d|>mPfy6x+nQJ_bx|kkT+&bVR&xP@nI1{bLzzTNa)vS06~CAwyd?~B-{1o
zdMr2x!!WUk3fbxkS)RqQ!UMlrgixIo1|wa%@3<jf097QR2?-v$!AipH@9I@rKTK#H
zsfUuCm=v$l?N$hw?_Ggemi$8dJ#s9~O6?(B2%ODIB`p7S!eaH746lFbmjVXO?w!@I
zKYJIbm6<T%NGv@V)1kh0I4*ILC&dzz#!q3wC59J|zHH(N>BItU*CDKg9Rg<}S!Ft~
zko|r?!Q@s=q}LfrNJ?l$h7~}AsJIr)Z%L=0EBYwtO?@S|+bL!I`V??a08r{w$s&v5
zk}Qm7ixGR01<Z+eanZF0Q3PhwTHOG?#(=KnxfC&fr*jDWcO^>liOS1c%jb*uzI+-C
z+kM6!zp|REKD+}aZa$^~dBvZv!66}k;zHV<go~iV-Gg&OHG~b(aEOi+K7q_l7s_)A
zf<Nx0Kqr3_p;k!K9~5>mY_@YwOFu<MrEozQY1Ba#@}uDyw=tu?=IY`cZo@W6npYec
zd)4nsYNX-_8!o%=6aa8Bf~>7`#Xm7xKmkW*1sYMp1>~eVGz^L+3`3gVV`K`_FFTHj
zZARl<DG%=(ntoMP{{A0I{T~V*B@98adq5P6&pFZ48_9k)ClgjjI=Ef0PcLE#-?38k
zKd5{J9s+Om<KxwVcyaePv<)#U18mhioF?!eUm4Fs_KL)ReUAv@_|JM<-9-<A33JS3
zq%v%ZDr!pZ{r&a|$Oj#A#^LTaj;+LZ->hA+Aj!d<PPb3z<j}Z%#P@M5NVZ(FTH$|e
z(%x~za7HQ35{+9@iHEjgIsfXQ(}OpAX1mRD48y+v)9&h2&Wo+WUVkU}V@NqFb=N_I
z2Ee`YNQGMP>boT#V;#Z8*mp5;o$Ece;4HVGk4OI8=E9{v%vYuT!Hf_pP3<+6@j;QE
ztlU(Kr8duHuCs1-&pCc=Qlg(hG@uCZQ%XRrAhc7HZT4Df!l@Q#)s0Je$ciRm^hH%V
zx<iI*o#^ZhSJ=926FmKFc=+(S(tO%-3-5XZ!*kVR&aG@j2cN})TC}K9Z^N~WHZ`UP
z7dQ?hs^5-W7jO#2X}t8d3RB(AYTC4j9J;1EZ*QYF&BSr>#NvRb$<L-balp(t6fM|A
zTgq|v74EWlojM^u=CTTdS@q`c8rnN-WB?_JPX5vq#!+V_Cv{a#UWGHDvU;`t<mD%J
z4he4&Ka6HTql7R(t<1uF%oV`_{D$Yc)XC-m-C8qF#lQ$Q%`fO|V1*}gs+U+CbMJGZ
z+ii-##{{8De(J&$;#Y`!0T6pv-#(i<j-;N12n##^ZJ3xjIvDV^Dz$UD0GdBCIJk|Q
zbl~m4E>WB@-2cRe8{_FPjbwB|>|~!9`!hJ%F_%xkZGW&N`ok<ytze4@+;@aU^nEo?
zPM0b$piVHSLIdv~FIs~&ogiA~ys!8X&~*!hpB*=-E^$=#Re1$B&*ZyObWsr4JhSWd
zPpl9ZWc2ak{c$#p8TS5ODi;ebe1G}l*ke4;f0mJpVy-nB^RnM*{D4?98x{wi3-}hZ
z@(vtGN@~k$1Qq{APfXo{$djibECeq*a|Ny5IZZO%G>+Z9D$gian;QUff2@hxP8gqH
zf}4=CWqDyAZMh*|T1WDyPS3hmtKDF2CSv+F5qts^h|=x0a{ctW)z)%j=a?6`vp)6A
zdOnQnY!`n_&UpGCzYA3N;nX>D%ig-}IA)JgLD}2sHVvL8A3OWiv<W_gL(DeZDH#6p
zM$Ih}qM}ZHBj&f<GUu|N%QF-m8p4|?fF?Jo8=fYU^{WOyiC+T)T^Rhp;X2Q+p%z5A
zI)TAxy{i(@*iPe(^~{0R2Yj-4%<i`O<8G5Y8h=+~Yd#-|_xUAm=&B&U_bpP#YpGDh
zv}$wPWXtzvu*2i)uMC17U-POdMjLmY6FN@Dwu#hT(nmX{PK6v!V7e~NgVcVBoI20p
zvXonZc$&O-x1~a)oUp{5*vmj;udZ*``e!SpCvurnw^yLC$-+wal|d!Y$S>xV&7FXj
z&YgL(Nj~$mr>`2#jlHi%jj84?p_?2DO&`ju7*Z&jM9h)XY@Zb_>CTP!d?m-h{8Itn
zd_3%%1V0b_s+74r&DB>&^G@t)G;Nr#6Ec?Qdoa;f8n32a{W9I$LheV5%)KUhj`jUU
z*W0H{%Dv9(AD%C!n{25U7_@pK5ffYa&KjL>_|HCxd#N|>mF>+(%k({`wR?;ZkFSQO
z*A#fuZ=HHvKM1RiLp%;EHs`EywDV9%?1=civzuIxsLe1R<|8k_aL2?26g&PlpOHYs
z>yRx1Dds2$htprXm;9F|+!!$$Qem^zVpyNNk#_{OsOLGVHvGeaLu<Xa)T9zL7@!jd
z*E|GRh>VRrFU=U$;67*(WhFxB_iu_==n8nzE%^WY7Me@A2&WY=vkDZ`@{PaBSeM>D
z>@ey_uC~zse%@KMe;cO_4}n55X1Af$8+pSr6>jX4|IlJa(sC~QcIo&(+%W*$;oHF3
zSZ82e^pOMRU?vM8)cU_no7x8VtC{r#+mGeqgTwECqaewUf+1DjzW)9T<4!w^5c=rp
z{WeEjwGkW3Q`cUOaOqoQY^Q(9*(PX8B$&q3NA)l2xQlm@x^r>K5tmkC>kTU8FT6;U
z()Vc2FclyWqgs{X7!${2l0ULhYt7k6eT%P^?DKf%W9jgQMNc2g3_(Z>6HY~!7(z+G
zx&>c19D;({@nPm*vh1#K)c1vT6fs7=RXJ(q04rR*+7{`1S>uh?5+@mJWNfXZT7y?y
zFt=kxt}XpKGJyp_5_Sg!FY#u}awj?ZJJ5o1M8Y|vQ2ZazAZ;???Eu#t^YnD3X4J{)
zY9abu5bcnU?$GAcHvRS0SLgDoSQcA!JAQ}CfAU1dda1#f{K8wd18b1H-7nFo;F7J_
z7WWd1@@EH*4U!_YTEk95A9kI&ZV938*b5m&+x!I}ns=5jY*mHzUhXAKbMe@*_scN~
z3rmi1wuo>8OaJPlBhBG*xg9-<vZ#v9w0Racvzg-_D47y6c=6-?wPvM8$Hm|~e#m&^
zvHP-`hL+D07K!2yEiQ2q8c6+!K$W9Iu-fSOO5^#TasDaTq}BZgPU6)TV!;9x{eKW}
z0wW}wAYUr%p0BVgqp-_=h{s(*`<l6?G>U8ip-P7_(UhqKfDPVmyZd)c8)t15S`;;~
zB1FALTLLV3fCWd;1;&^$C$*1sii}h^mnqJtO=q2e867YtK)7wRKr_QN!>G6@$Ia;%
z%(@gU=!MIi4XfE+u>+tAU$Qurf|U>(3H-~8`QxT9>zj2Nn^(rc3axgRH`Y7*l|$y!
ztgklsyi%jxmG<piKn@}ZLbX8#dbvg;{&clY5l7b%V!1*udXO#!=<IT*V7t?q@s0Q=
zMbooDQSFgQ34)Ot53|)O9-1zWd0T(;sDjV!vyyg$Egs%vUbEpIWTsF6M9q%n?M^@_
zc-vR@lq2M1d8ppWFQ~Ags8s5~{|)oC^VB+L8D-{nVZ(U-b_CIKrCRI$Y14}%V2@np
zhf|b79>09#a-|CRa$jM!Sn4V=1cRxI{qa0yVIRovf6rpK-nhK9JepBcb-sv+Nhp(u
zrpCtKH02?2>20^xo{P<_J#5Dwg3oBskPRMeQ0)FTM=ri(@h6#Jl$+;ht2Rj@S1MIu
zFLMPfSCu5?DblK7CF2zs%=+%IVNSfq4^%YMZ<hwF;xZgB3LQCoyaiaE++w*Jei~gi
z{aTdz_X+br@QWhEDrdcgmX1HBNp6(E1l~Ib3o;ll4xIAH|8TMxJ~bE^^Yo2vo5^aU
z)$WK$Q?BJ~X@!-W9`ylSgCgL@xNTw>e}VY}Ctx>FvZ8BQ@N!wisMG2wAM+JaOl$=G
zh|}b23#v_e15M1ixgekW(wv)4Yz03%2~Xj*uFVn6((>$TxX16DSt6yavIYN59_N37
z86oMJ9s49~m;KYa{P9O0O>;yz)NZE+!r%e0(A%8JeyN;n5$RAYm?w_Cjvf8xx8Bnt
zwc?*nheC`pTklc4Sr!x;a=NhN?el*y7MXXvLT>xGc5JSj6^l&X<B52nPTdz7)e>h3
zZlYb!?8AyJndnx#HM#IO;vdmmqM}oW9}s4=RD2Vqi)`b_PBN+J>ol?IOa_v7M|hbd
zbB=#zKey@=zY+1s1PugX5@X3C<8$zYaM9t|+LC5|kz-#dcXz7I#MgFjDiDdw;Xf?J
zJ3lsc<dp}=l91I^ze2fwo2WnQv>8>`wmgk^f_2lgw9FNF{Wdpl0=}|~ey!B6;#wp?
zp8jE4ji;<E%Fs8I{}nkX6`9!GPh^E~y)XO&WWx0>_=+O7F;m1zz@=h!H@h>pg)G;L
zW8e(0Xa1p_4D6u2)xX?qh<zktX;!3aZn1)tkd##VwZ>-AjCCPt*m-vUQ@hO^8N7oh
zfQd%plSo8u#v^p=EiT-4YrQ$Z-|Cg3kqtMhUG{cjMe1ev<{#WJI_1{N-g?4!NB4T`
zhwE1*W)pf%)|AuSfA%-BE#j(HYk?n6PftblW0sczzRAc0T&A6@)uJ@3QtLA~BL}0A
zC-p`{<+ABaa@36M_kFDO!r&FZIL{vxsoiQ@;i}Af!d?^RK|$IaZ=|n$wcT^l^R!J-
z#BT}c!;)jJ;e17a1M@%y@F>Lund3}QG~@#Q-|hx}Azg*zIeC;fpME}XnnnNTL9sdQ
z8aQ`3b{#MDkq>rmh`5vN%zmtK(SwgI|G!;=oD_%^$J}#|j#t2>e`Xk~GH`B$=Wy2D
z_gjEl4~S_fWw`<_e7l@*W13(i_r4^wuw%axx3iT*v_?vb?~-866RW^=KU7S3%)CBS
z9G5B@4HdZmA$ZeJQvSBVBD6K#E-cFMaM|&DN<>R2V>6qe@k<F8#Lz8^!<Sig|0jct
z#C(;%<^Zd*G`gA>N2DuRHdI^2yVzTLEkkCi3N^dGma9hioNkz@P5m#Gnj{}*8&3`Z
zMM}iuI;@{ekZYsWx7cjCh7Ynhgt1P*PcN873RpFT@M;`!v6#Dvt;?4vO-Na?4ioVW
z{@7^9xl3|xm>K<>O)R5y7$IG0dVt_jqp#4VfZlVvP3nC+-$mPBAH&`%Qu*V$CjH-b
znKwbNxgVe7F6rIwq*}G~C+<uCY;TtI)<zq7*&FGE%M84VKd#8M!}-{9x&1TdXdE%?
zt%eTm#b0=jWwsTpTR$bGc}#qKxk+SZ^t~$9<O-LKqoXOdm#*jjBN>qOWlZGKbJU6|
z9bblWh|GNEvdvfoSG(Bv1H72*LdHIgbzck!{&cdzYTnPeQp&{&pq@a5QHXc5!zbBg
zWy0JqZ9~sDl5a%vC>~a$c5Sb7O9Q)z+c$rV^5&-Xh&e1ERIAL<gP2W_78l1=5->R4
z4}mtOeqyx!J9$77PPUlWM*>3m>xVn)w69!;4D7eWa7EP9`R<IF&H@sbfh2!Otj-F0
zKIb>;1QdIAUZyr5*xxR`Q^>Z*x7u$EG*Y1pQPc*BkYS>sDFl7=hFSCmlY{eUPj<c)
zE<M9}Y$vJ5XHby(Iqna`pDtJ7-0jp~h57M}F_8(^Zs2y%!Z^!hw255NL2kzd`i}mo
z(hul~UlR+6v&Q4SDv?d^G&3aqVap$x#9CSdENbgxS@#EzU_4L|VqXc?chY!AdQlJP
z(PGdD`262^76;nHvKd^nOs7VA_EGsogHVMd=Ww9o3rN!v5`+o3Yz@ufLOJuiKvv!_
zsTyOet8IUSbP4%7>(6#|zvMZrSp;xk6Y;r5U{NUG8#ytczsFp&VoEoRr5G~1lC@{|
zM6j=nt&Q@yh%moc@E1-$V?em_3;CUXCt`~xM}h%Bq6^)zyCESUn2*4XL)nQ7xKz^b
z|M+_A<aayl)O5`^NPye^h(co$I%@Y@T-Rlr;a^TxS|;@4C1g@A+RP;^n_q&YmDD0!
z^Z*96qVucYR4~clE`%9mg{@%*;T;c!C>2gds?WhS8DFM*j6%kT)bR`GMaj@m3xOjG
zAN~A;g#Z-~)8w#&m|d#><-#BAhzypa#&_b8kQ=gl-I`i&cX!0KWQdh}U<Hwj2m@q*
zMx!)|29}txZJDtLG`R$;xW5aq8MW(;$wH+<OX-rLGDUNMa{kK$#CNmVA&PhsLUV{x
zam0sS2pC}k2GF<s=U2yPOu5Gsx-&zU;%nKM;smoyOdfZjjwMPD-aNgc7!S5H9FzBi
zS4ttPqL@ST?ipm5jQLnAE2(kM3b29V9zNbL-zh$deip2d5ZgmZTB%;4j+t9aO9peE
zjub336prZzAeRbUl$S_Y;>of4t-OZ)R51UKs`BdfOf8~CBo(@88vHz#!#oy*vV4e!
zwA&{X7FRXWuh7Md%QQ4i{4<sPc-#wTSG{(avM8BXNw0Y)JUB!onBov&xygp~rblsH
zX&k?uT$w(o6|$uPN#yJThNch%5YafyrQkVnF$5);SDgi@XVk1R`3qVGACk=<FFy1h
zY>cr04v>)pfGVN|>va(EPr+J{GO%W3cn)6Vk&lnWDkLeaqE+fYTETxC2h9xJ*k(N6
z;1?343$p%*FG%~52~S`pi1bi6ibW=|m2;QSY{p6a|3NliAn>m0Vb^PPxbZoyG3lEL
zd7XzD^8*DC;pT82avfO%Wvl*&|MY_oaV9iKD1*Y3o_1DNR^5Hj6l(DTkGMVWj~m^6
zxy!`wyg0S+-~$LLnD^v&4<<D(nx*RjTv0s_8^47n^1=<8yi+^fsRrUmVrNr*BN47~
zXu~R*4I_(dz0{Qh3}p{s@xNvlUnA|zUsD!*;jzB%TH4E{o|#d;T(bSCQyQONK5@8d
zbsh0CcND?z?yw^bCG?Sy>vd@N(`*G)!BkY8aM<L~B$wO4ljc5*+tm_#fHAUA4lh=|
z<)+baZfO1><*kDB;8Q^T;CU$Efj5)<6dqeNYTtLm@Kto!X$JW$jk(xk$2$iUz`CGt
zNnjc?0dV|*st9=+bv6X+K7VA__2RxYSyvXn?H`+|ueqwbak0<!le`!9gKmC`7WnV>
z$nNE5>OalOe{AJb+;Y7%CrjhNX7h_a->PLskNLBnyb^Coh^sbuit@FG)<O!QscUxI
zd(+MyJr|Fz?29bU2dPv43*_d()KXD#4mDbwsU1T5J-;MUNt=PPofb2J3qjXxl4W~u
zBEMUEgU)kEIHRH*_pI+Zgoj(jDx+2l&#X&lL2=Dvtr@ZnH<6g8gvz9FwZT{iSl~^7
zaqU;Ug+WmnaX<t)eTK)>(k$)MNnA0t1?lej9ruoJG8Ww4pD%2i<T^ZH50=jTD0<9A
z_Jl>m|DCgd#LxfgaNiMe%h4%C3-a>6za_Eif2BZb<f8LuoX7t^Dyt`4Aod{1KfqT+
z?8YFpl-z`b{#S`Ek1KPp;trSN#+j^`mfspf*|N8|Uqv}2zJ!`RXW4g-_w=X3pKW>U
zlz<J`vUM)LtGa{@beVivtrn}$Wjtq>jsKeaBG`!Bq31e28aCA^3yiZ+AKLF=+CXS0
z7M13$sx*e6jULlIJjBP%FHhJijo3|IeNzf2+^{+goKB1J>RL3LPl&l;mvkvj|LqIl
z!K*ubpP;>pImup~aduh$<TbpS(wSXE`!WOfuL`VpS^yh_AGK1Ei{5}8kMVqXTmbU3
zBD3JfDxU@|L4vRQez1`P6HX*%kbn&O;IijQAH3xlur^d$(qo(b)^IoRQ@3*55imFi
z{+7`0m6z98=d*n`Su4RSl<dXT^ygS5{rt9Naw2!eX+^3Y&~pxY)U_%)Kh4xY3Z)7S
zLb$^>!z-T3-Zx7N+D*j5KJm)?8G;~~aTw{t+oCohu~|I<VE1sGPi_}Xcb5_DU|c0)
z#@VSm(EBTOk6a%To+KNSF0F|iyr5)lO~)>t?-|Njf!{)Vo;!bw8I+BdaD~GP7K=-D
z?u8NXp!FJP7Kh=Gvv6&+*ho2a--K<5wy^8XlvpDD4|MpyN+JVYU)sNUVG`5Wzq>V8
zAm&Aa;U=S?V7@Lez;abD1v!g>8d0v>(U^6mn&P(F2!8s(-BJVEbh^=O5_=FAHmL5;
zAKY8^u*{G5CxdP3Tn;OAwF+g4-`z7<rt)RrSx`SV@OnEx5E_LKE-^9DHq;^KM%Xj;
zMiTC;Jq^~xpY!EFD<D>oabTctH2EDl+i!AcW;W(>x|PJ;I;$~!h=IGj3>C|Rc$NQ1
zw{jZfU+bF`2u$vJ3-0H{o|H!B8an{0w|Z^9g2;ro$iLItkjZ}7?4O;P@Y`IKT%rhy
zb5;Q?*k;y!eX_2s<`=#OEJ8PZ3hh_TT767R&s5LwIe4kSTKfQFmntP(qGGG3W+f_E
zO-v({_c${+%%SD;x*{fihqbc?CcgLhxX-KE*_WirGjm*o2ay8-EMoO9`MdLJYzpX$
zmX~==R&OXmzw+8%%_6)W&C2Yb7Gmwz=QuUEilPpK+mTd?<aYE@OoS-b>%H;(ZeD~>
zx1Qdc*xk0Q{DF+Fify$^l`qSfgq8&9?+%OFpo2w`0}Ncz64KX`sOa}JG1x~X<ye5L
zM|#$@UKa!Zku$RNbEf;%U(v-<g@T_#@`cP{U6_<;wBd6VHXdC$8U|L|l+BAwyj>2e
z+Z3if7ROwfT!$9;cUvAD#+#wGvWW5(V)3pg;x#%gg;Y386!(AF>ufQ6Uc~OB@5grs
zLQZmhE}iHJB5lbY4?0~>lBxvnoq1Zo_s#}kVSvziMIYGv($-a@*Mb)uu@nNjKN&hB
z)uO<Pp0J_(zfYDabT-FnHm^(h&;N(2_l}42eZGfTi`93dtzh+%5WUycqXcPsgb*Zp
z?_ycKCnQ9VgcK44(R+~SQV^nd!s=aq*UJ0zeLc_r%I<w%*UXu7&dfaFwID)@MyW+8
z2JV%HSB!qN|Mr>ju7%SBy`&rLUKjG%f_D(+k<W-51rLCO$Fr(Ddcv(kcy3=UP5=#^
zn|;C+`#2(og`)I8;r^fZ1*QsL!pv6qI~DGyYuoxVCE6dRed6lYGkE1BTg#QfN;tvb
z=1g6^vDg-q%A+N(>lFX8iS*Dge)v9z-^_19@tU+zZp>}7B1tI|TK_+l!zM7&O^Q{;
z?b^Np5&_5}CRA``UY=pq^4|TwqxQM?-=Qb+#yMx7vk)6G)y?tm@0!TKu0HBQywbVb
zRp$2avFD{5TC%mPd|vu}rgLzjpAJqx$zd7;Vz70OwQk5!Ww++SkkX~AU!N6>_a_yk
zeoifmlX>bfm(Dg%r;ZY9jD73_WW&uNWHZE%NwGm^JnVJU!W(dH7Qq;@-Wy<R_@jHG
zsG2V!j|X(CNqN-#m^27zp%B>T;H;UiEB`V)zK(hYlX-ya&6M6oEr4Y{BUhXE{*0OC
zG4JP_Y=enw<@Y$24sRCax%pLD<vweD-D?DJ1dRq7`U$`@_1%>pHf@@?ViXGHqTpD3
zPwmoF?lS@7#9?Xp$&Yhr02nH9h*+blb{!bQRbl((g3i^_v`Q6oPP8fWKDSF>%|m=h
z;dg*G$31Sa@FNZ0`ogD;os96Mo^LgGsrlT?_2hu~j<i89Tae;Y!tO<qPy@5CpV@jZ
zIodbb#XD}CW-0~^hbz{d6(lfA4;@i4J8U$bc61GBhwwol-8a<LUy8yny2iVxUw0ct
z>$fal)9CxFNU(kLVM^K4y-Lr&tqymG_MFWhguhwrxR$vzmEY#Ig`L()4~}il1I$;V
zwN0T2%bku%>4x`H#<n>P!NUZOEGp&YFRsTG^pa5Y7@JqQ6wunSL21+kj9$EK=LTIl
zA~LDdUQF&4;@zjhN3city7msrBwQvJu4E=$FLL%;!Xai;=8+q{sX~9+bole<FB?`Y
z$8~k_$HG3S5}t*u*IreU{lRWi^FWLG8(1EQ9CnuXamy$&Fr8c6=#PEtu30TFB=xja
zz}Uk+ShJ~mV?|pN8Y&5COxuWm!P{|tx`gZl6}hH?^0q`0Q}m;=$=e-fOO*i8(Lo_%
z)F^qM_%xWcoADCg;Go|WhSa3SaQ_+k3sMOK@FH+fsBN+OokxfBjI~EA?`nR5sRTjo
zXNcCG4DsdiZXug_l>ybyDX1-eV%5;gSRSb<D~>APjR_YT)AE783z@DXo=?S<`XvAB
zkjY92^~5MU|B|R(c<wlk^0vwjod25Ub^PZOE!L&k%SS)VezDN^Uj}sx=`UURQR!&>
z$uJ1?hK+vg1N^#9zrr@9>-fsPMQX#V`*_B)h@HKa4X01CKnh9sE?uB0L<t)F1w24x
z3S)`a<07xOKfgI52uiTZA~|6EXa{97hKRI$Gc{Y@_lAQ5KdXXYGC1E_!u2?aBA8x(
z>&*=weXiwt1_kHpbIc2FgrOe7ZQWTfLoDLCv}>OvJt6Nj^Yj8>-1LSm1FtCi7S1vs
z72v6gP*MPUf9))PTmCBWK_aX<W?hj2=T~Y#NxU*OW%aubHx=^pE%?mnX%6<l))8SK
zV~Jmr%t^Hh@&%M!y(>1D6PX!4Q`LT@{?`L-Jef-iQDts<LQMxd-d$Z>$cW?k<38Il
zn9xDQ+GvlR;s2g-Q=VeGW-9e|#$xPU{lgda7W2+W2o!YsRCrh?relfy7S}Yrh%`r0
z?ZVrfLiV}vrt!;N`7VA%DUV#blO<{{aoJ4BR?_<0gLYPHiQev;$H{!E9knCAp8J{h
z7T0*TkNW1`^YVy4t!G?12CKCOKryl5qsJcTmZY!+YuNp1?t}%t`NuJlRXPa%3_z<;
z@Te}?H4jGf(|kqAH=Y_O9k%n&bY=~w-w{K6Hv;Gnt*wdfxLV;3y1c!%d!?CYxe;sL
z@BsSEcojHyw28St{Mkqj>9$UjCrQN4?Dk`_h+9UDbVMS9WTlC);Y9cf<T|;k*XLMz
z!TLiGRm=9|q4PYppWISp0&d|;n&vUMn@e738D)Z>-b1iH*T&HZY(FXl(Fu-yXsy^T
zOBTRv^vhDCnHCNYAngRRdp|ZGKf4>UELBDDnbG7Hr5MAiP|e(hiHgs@SC$p>6U?;E
zF%CH`A>u6bb4al)VkY6f&VXV0!Qa^=WfKvD83w!43PJEgUCfX?e;nx%>DRDQRFZ2z
zS273G?rPfQ+YV7>S1EYAmIez(<paY>sQ7=H6r_3SNY7JwCX}3?9Q<vhgQWK(*eO3b
z4hu0D)*i3d9a;kaddm=Bd~m2Mw1vbE*@$bUIILNB7o$8sa6E8AernZ>`ELfw^WIb)
z=rw!2Y`L_(wNW*2Upy&1SAG>j8wq}K<3AcB)Hat<!VXXU7UlBZ0GKb(^{qvXST}!f
zx@h=CX_vL9cfLLglcdG}ur$<GczAgDnNY*d4YQ^Y#lYy-MkN<Z?$kZ?mxG5iO@&d6
zcs9@#@1(H1?;%EP_kDe0$A5njGVp);E^B;O*LZ+7f=^p`>$*o%>Zk#lsfOxCZgHZ2
zZ`7*wLBb7T`+yog@6QujmMgLKGL5?0eHppiESq8r*|(3g_EUu3v2SM0UzP8>I_prU
z&~Nfgd}h%tCDY@TepcG@@zBY{TymMxf-jv2femuw;g7fU0yHg#e5vKYw(zHFYzc@X
zMF3B}b;@rPj}49D40UBWUJ!X1d^rE?W`@{(hxTZM6W020YhF)WMQQ=Gr(1DRPQB|s
zNT~QvUV8(B86a#>UYFLZXQ?f3-fLnd`7#|uU_DXqzuv%^e=Sac7gdCYv1ilLTPVCY
z{TNxQLP`RI%1?_@#HZAHua-C0hkkgH%AWu4*bGVcmJ)7{xi*#EHoJZSx=qAfgw$#}
zUY94Qp)p>KIT`{@gJGcq+A?AOF%gQXB-Zo}%R{e%PL5Wmot!UrAVo+*yKc*UQIj)y
zhtK5^k)g0ys|2z_F$i=skwsSZ@9939Yh+)pa;~%<k4ye-eTo~PUtn7my~G1cmT($L
zPACil*Q{6p7EW<5k32_<lm?{-22Ry4LOY5?($jq8J_rr8gIM#w!acMGd5jbhi#hZI
z2g&Q(HR-|E*9-g_m4XgLm{o~-sq;7R72wg{A6<aKv#5z}gw?~(f0>7j&@^`n7UF;7
z#svy-tKe{Ns`z#N=Mphf+7u{q4rpWpB`b~Yka?an5IZp^X!M@HsHM;9&xDR7wtn(a
z+yXg|Dz4vp>ICSJ(~6w&bz&roT8Gc0z#pGugB(be`9Obv>p@;ODYqp%1$_%n4kRR;
z)3T&GSP_Zv4fC*&Z(-O))P1MEWs~n$dftTeEiPIZ4=c>~2+SVJE@rE>#?Q|!$VCZy
z?#f8dyJcC-7p7!=Rl)nbx4)Hk`b;$wqO@AHnm{!>VrU;hPJgS)@Gg@^a~q=hfIo2K
znPfwJYip~+(m;MaZ>t%smdX5+%PTw)BWZkBZIf)X9(AKejb_8Iq!D~z+nCTbS`{OB
zj_LF?isVavU8JHP3xfR_RWL<-)QD%NpIKJ8)@3-vkRVQ<jFQq;la%3bU|hY(>P470
zh2YNW_cv{Nh>Vfgz$m)KXBw-8;LY=p5}Hogym&6_$t%1tjcJ>l%q`99l!?W4t|^0V
zPkqJ%o}$%C9!qeT6c0LtYnM2Ud=Af!H!_4Ep3tvYJe`A)<45QOy?RnVM?7c;8b;7n
zuxJlB^f3oAOp+IpO1l4Ntdk-b#?${?vfEh}=6;^F?Kuc)wSH>gL`F)+?xa5TNsVX*
z16L22eroxV%&Qh>qSaJN)gAaMOqTijSA0uK{vD)HdoK2P={4WAiH1yKdN2{QD>h8z
zs4QUjAp;39YZAe`rBZ0D?49%=Ip4rN`MgSFa3qQm$&%EGI8`J9(PA{M5d&Xk;s@%a
z>TS-Ri@L!tz%!VL2_1+tMAd^?zkW$Doly~q2*rCW)0hG<;cQ)z=hc;l?K^`;fz*%#
z%}r-gV&cKu#&<sVkueBc_Ox!`vLb@5x)`J$3}J^K>j!-GG<zd?8=o;iUkm{a)hy>3
zuR)F;5W{S9M!|c%q`;X)ypV5!_2x|_k9c}H{g=agJQy&6O=T_yAKZ9liXzbo$5j)f
z4)fKbOy0m}2^0{jrX-HM+TjHx=P5%60?{9B`7`$E8&{HoDkx1-#smcR#;3FC1J?(v
z!>?bQwhmA|Ry4xEr^2);Tg7E$(o4*nDW+d&#Q9yP(G-;<q6lWmzxw(~DqsEM^E3o-
zaTdkNo0~;jnwJ=MU^sNO%WpZQ&N-vXhqv!ciC+Y1!4Cyd-EaP=|E=(vX{pOhdyHO%
zY7E?{sOe}$fE)(1;!$fSLcELf?_YH+Df@S~$_Ya&dDFX0a9rHn+;Axs4nIl*Uhw-i
zM3iDKD<c_?g7aiAK_X%Z8t>pl^|R%if2!u!f5L8{C~1PWH#axAEw4_ydky5NK-&Zi
z4MU|>^FMh}^7mMND?cya459T1LcZ+8J%e1OY?rz}Qc{WB6Ro0bZByKPQX9ZUc2V9(
zP|{%_G@>rWG9kooHnYIl2wG1=7$4C}REtkGR&zj(@)JfHC4Z)!PGpsTow3;-?oM0p
zvli}f&SN%bBH$Qbemd_zztWlwXkV!eWQrJW0(JZbm<v2EvK*4kOs;qx8Y>CmG>;Dc
z4M6m^8DdovnSf>IPlYL;9oW3R+obep|DY;j|7J0BVcN~}gF%3BBX9l-eAQm3yTc!e
zAjqAtvWxC|1g6gMMbRGuU5Q6Ho>y`jb^%3;1No*E^$lMzVN^hN@!udLkEkX+rCMu?
zLn!~Yxjff5Gy|Rn`y>J`2eaXDU>#5a77hUcJz?{z`1@pK!yzElmgQeU@;nQE74$)m
z@cz;uIkp+gcoa!+#h&44DGv~17qGQ?68x%`c)H24N!n?|FrtopNn^+fa4F5=@Z=b(
zN>*tXmP(i3&tDW2WK>5jw(PDBd#Z_iX_1Q-!ZA^wUWY0$5Sk9yq=W!dP`Sn#Ueb#(
z30j0BF_qsdDkN$_m%6v;Mwwy>J^o6bpa~#8FcTZV$V_5)xgd1WR@#5&zC3Yy#r8G4
z^p*g`AL)1=CHS}uW19j^kDFDI3QR2mq*8>_DW@Z4HhO$2>Cg&VY**<<s#R*7s2%&2
zutd_F6O_a6bN<H=8Y=)P&yDf-*<R?~0rkQV;P-kX6|GJvA-Yz5)393BobcSBE$z1^
zWt{zkuM%F(-FTH|C;a~O-7Y@SooJ!=u<lrCR#-PM$d5PhQAQyB9PWIyquO9n8=$Z$
zd2hefBrJi?#W+f+tpO}(3n<?iimBF<q&nd*6lA=X3|EF;QAl6ii%=}^Hq!+^NB|Ku
zcZlaj^Dck^kuP1FPM=CSjiAZw9{F}Zz0yM(Mi3OcS$cCA_C<dAl7`_qk?yL7-kTY4
z!L|ST<k~;W9lsW45UE(*)dj=b9Rj_)JNBiDD;n_FmtY6pJ&<0q`|!<=5qKNeBGISm
z*P`6ncwsIMoCim<CTm4`;n3|1DRqOvg^y2s9LDG{kK;n0yvJC;Sw5}(s*HPpiVqy&
z3-c_rYzP<x12eP$z}&j3NRedB-Y#JBOYhdec>CP9x3>j&^*L}cUmgIcJZ@TwVxyyL
zkH272hbCQx-u6(oa?SvkA778%V-~Z8QG9MC9{_y_V1RlSo_^D>xOYhY*0P}XidBJ;
zeLu;K4S-W3Lq%k!9^im!s4$$AW(WwjOAJWNGgf}Ow$>SN+4?5DzOPh7d6yd*gQwER
zOo%vYPA7BaHGHet+_4A-JS~A~m0kxp>kyI%r{6mYu3eHu8hIlep&M+IQfHTeiM+!o
zFO`5$G@g)5GaVXctF5hFKMWN{fu+1QAO4Kc(LJZ2YODDdT+c&`j54(JSqy<nKbKZw
z>9c6CWdm#1m-Qv~WTdXylC<95`tCLu!uA4iwdF-_(}WyXmMelnSo7cD?+X_qd6%rC
z1ur>Uv7#K2Ys6~JggRJpyPiDLk9K7#+}CS6(jS~u1lr=KHQ)i#96jMEX{$*MU@e{s
z{Hpa9*w{sjSf-Lr`x~Z_ZpXgwFowngr1G<@4<MEIcjTYTd0!SFw`pQTk!|+Uut-D`
zqo?m{{Y<MJHa|JK;fU`pCXNd2VhGc}DC5Q+Xs55QUD%r`C7w$eww)|_^5+v%kMOpH
zt2}WOn6Cg!)q|!}m;Z75xYh&aO!plzxou$;dEG5>-4%D2@T~Z%*<CHsK~a~+nxX4F
z+YJMt+TuYFE}{^AkJ&;FIDY#tX4fmVU%a5%>E0eP$k*O!KmWg30J%Y`28z3MX_szx
z*z5}GU?Ciq>Vi8e$*r;Xz?mPtKL_@vX_T_iXu=fM(BD{5KFziyHl`7?x-)#m&Nras
za6(4WwV3*wrlqq7U|aV95sgAK<vl&S5%^~a8>Ov?*4sj(T^Zk6;*r(o-Y$sd{d^DN
z8jW`YvoX!lew+$G9~Geb`Q~O+Q{aH^6Fvjp>Ypw@i<y}3H~V3{EF02?_iG0xe_Sx1
zs;Spqd|cQLF)5{@)r9FVDcVU?Holi^ISMf`K_+2Jl_)mC;kP1Rfc7%DPS3&Xjf?yC
zDQ6CBbSx+S?M4o411fo$c&iamQmr&v?uHyjNRzs=5mF9;+7{QrkxEhazLkVy%PNAD
zzWz#eNUvj`e-O>q^9Jx{ffIJJ$!U5pDi&=AvqBN~QsvMr`~X3D2vmXk9~zG?YZ+*3
zTW^Gmii%b|{Bc<-mD`f^9cX;$Z{y`13Je+$ZJ(_(WCnE}52ReG#Sg}#8lNH}bcw`o
z`i|ptYsB{tca`_5=@AH(pARS%cpUl*_~rAspJhKgyi`{`s@P2ta+qdd`BiYOdSakM
zwd2+vR@6u}<EWKFc<!RrBT^D+YZK}UUfXy%-}Rn;?p}Z6+sE7W9D+E?iX?KDnHQG{
zCKdKVI1WY&uQ7*tLSW4l!B7=Hekv|>)j)s0@FQD_-R#S6g@!#85rn6fvBkq8N~-=B
zw|)d4@4e#7@e8|8Vf?}Dk5qA}`-O6isTA!K&UbFwmrN!P9}hj@sbbB`Wv2}|`u^Z)
zJ|UI&(f~)8y-*i(tEc?W>w$Y~`6@)Dh`kL_BP)d#8O%<WR*VLJT;%-TSf6vfVC>*n
zEV>Xjw-}g~>wn*Dlv0|aPT{7)UZ9A+H5)65E?dA7M*ygD{Ijc_$E2jtjqbCWd(B5c
z<HRW;W){bku9Lv{KOyI&EIUqmy<@JktB(!1r@N`Ds+z>O&A&|(oQu&WhiuBUw)I6)
zF^?2LXY#k<^&Vj}Pgn7r=iEg?HCW(_uvEbjmFlLguL3*cp8Yi?J*qX&6)TNCXnwTo
zyRnL{31O0$F@;SX4;U6B;4kRo6T!})u;s#y#^c0gE`FMDQL(^1r{`k#$y@3epgP=s
zSF&GjRMtZR6z)R%=I_WolUOu25Y`j+y6`gspS;Z<cSQ2mSGHC|ekQ`eHd8+FxclGo
z)Dz;4-qW9Eeh4;n3wBE!x%Wt0Fuuh+aP?=2KNazGN<-kjn2i^(Y|+uvf3{3&1c)vS
zApm<eO+$%rTH#2#AZbZwVL<QHw|Ib}b9yD=`#}Xgsr+I2q4Uxq7rUqMf^|=BrnGBe
zlG0H$9+DqF8|hRC*x_eR!P=(-LTm`QcytX>?MhKF?kSUd3wK%7`u=_%Vxc1x)*_hA
zU%QW%<>lbOkTCVjefjbQI!#)9x3mNEV-9SUemXNd>ra^`VM(1Ur7Qs55>vj<C|zf7
znwC9!dh(U;V|`q=qN{@q$GrqmY6(6_yqfjN_U`U{FbX-<K0;RDVbhs-zwJgeABm7#
z$b`!O@8k-iZ7Eua@RfcyZ5ZiX>J=yrtHcms{q+EYtoUf!H@GOayt~rLKn>mWOm#!F
zTcjcniB+rwC-*v79kK-0YR|b}ua9fN=mJceq0}mO!*4CZa`drDUgI`TnX#@#W;}VG
zxiS|&fAssBg^O<u^C1{5YD>AFx^64bi9;Y@n6|(p1M&+nQ)vp@;~`@;3C1%Mmz@nU
zoXNQxw?h`vGBp`J{8hhM3Bxo$GfO_4+j~!bR1~ngQp}(5wvFJL_-qz&OU<Wt>8)+P
z^OMT!EpVU2Zi(&bYqwakUqgBWO4~i+5?0LwduUh~L+j?!0Qlv>t`x3Oxk$9(z4Wg<
zZ>1|mK@M_z53_P=W0OL+%mFfq6yIT?h-w`oO?_ux;n0E&^zy0@!u8WT0lCZ%4pFTS
zJBaXpU_$lIE;V}iy=gau3mm1{pLzg?6XV=C9w@xdFuQ$Ts(7fQr3k6nl=Om+cBYk0
zg@Fp3X7s_b*I&@2G;}x#Nl|9^-P<N{;2~5aPn~1xWjLA-6B1_Z3k9=_Djv{&Gc0`{
zjRQdWW2Y~_EITge$*8};?IQ)B4H-UwIsYpIba)|sih33BFrC@XB>P!ZHHmY`To)p%
z{L>^@I9ZPVwm<o(|M)q4&&Vu$dXVk>gO#fj*p#f<hZ;Z)R`KI;M2I-9Bd^N(Z*i-b
zG=f*0mE?IP^?t_@-a8G12sLzvRD7J_>qr%HSj)y_(_hMP5AfCtz{=6D6T_m;siNQ8
zp1=D6>OPDUn1+C;pI6xG;#za3)4|^JV=Rv_z8fsboQpMPomiAST=q+*dVO@>fk{oc
z*vLY;I`Qc5sl<aJZmG9q8LBB)uoz)nC%`SmTWYA`ZZm5Q_D7(GrT6%(q@-{GP*2pt
z>r*Le#zdNLHRF*gjCZ^c{~xv(jo_TJm~4@y&7wvpUIdg322|_Hu`w~z?qFPy%MO59
z<&Pyg#EQujgYTGd(!&P*#YR~GTYu$VJ>UV0iOCJj^{oe(ntJmJpGj+6@V(eL@b8%^
zAPJd>2C)$oj5h$;=%+^e3x_0)Fa$n5`G(C7W+y~@Mn`z&``dVgZ^1rwG6BY$=zy_P
zuSP~p7`iAZDPLYO|CH?g>z*c=6a<m=z~eer^ZX^|jc`ucVw<}lQUq2Onn-q4zLwaT
zWDd0vHSrEK|KF)xJT${8fvyme4k8oO@#Nn#EieXs{+b%U5PE<Tm8FpaUo9SUsY{3$
z2t_7w@mO&U9tYet$G0lrYimQ8%%X8Bp=BSix9fn863*TX@u)O2_8uyOaFL)$#cNpU
zqehiGb>8#-jKj5e3F#!xe-9{1NMDUoYcN^od%eG>J{0pFOcnjezSQ*htUJgXsoA1b
zmRKe``&JYjL{KM%+Oy&sto#@QWkx>vgUZgd%Nr1;YZ<pGzhW37hK=GgVPZZ3n!1%w
z!G}s_gsR8DAq61#7Jixx8M~s(rHbov1?1RT0(?=2jgXiM|IshN-4g9_uZfOG^UW$B
z_N-o*@CTFX{NpL9sf{|JJo&SgRIz9!_Rz{SWPe2YR6&xGjz}wKxzwdgm$2Rpt-#UH
z(*c>TfzRq|8`ggzg-KF?N6D`WgwKJQ&vDCuv@HYxdJ8oO)|p)r6MI~0kcb=9VjEQ4
zA8)fX%3h8wJvzMM6?2;%D%Y2IwDZkiR8`Z%L#!nLZZZ4f38L{}hN5;hQGVoMi4!%B
z=--`eCPKI+27~IC>$h7Q)i^nPVRiU}J<mfE-9SK>E`xo+w%xz`Bv2!^CFS^Hfe6yK
zfnsO}-|uq`H!p9wo28$hOv_v4bRNU^EvhK58_PpVcA}4{i634#zq_%7kiIgSSY@EZ
zEtthDw#a#}z@<n5K+)T1*v~P$E=UqwcpFrJw2(eg=tRm?Hqp}+gh(Qqptrw2iMYqM
zpX}*Z7cf2_WdNt~=eL1g{a5URBW4H9^1Qrvk^LnV@A&ZDN4=$J!v`R=+4ECRgaq2J
zjBb-jrAA(rD+<_Ve(8)q=AIhOZzyN!;Piz4h#h>vxBF-8Sp<()y`pi2WH$J6bd1m}
z8#b)T2AHrfMa^TA!&3H1+-J>%;rVdchw7c2pK1txKd5amxogj<@``~XYNJI=5_qg_
zl6sTNR1WY;mlaFj?J79``G+*nY?e*L410s2sBWI@!q`n3tuBT}pqG3v(4vvrnb({B
z;yhf7*MiR2L%kW!+OJZ~IkMZp3PNF^)7wsXBU!N?3~qY^C=;kZ3zXFWNrHc87*+6h
zUGV+N7dJp*Gh=2ekr$fzEhIzJ_>Mol@-uI)yQ!hM7fR64XYM{osbkP)-T9lhb@Tf5
z>uZ)<Z;EnW*ys31@(KQ?6eM)5l2Sq7RG}g@)+bw=n;d#BhFKk)sM#zN&318EIW>z+
za^(!+6VI$2)sc!Xv7yFXq3%S4Hc;&DbBPD7!!NFKF?`0Cy9|uh3BR<jdfNVXsMLV|
zqMCS7GFHxOsaY~AB?GKjK*V2ZmNUa=W6(p!Rrz9xgZ15yTTpT)Onk+_+uQF(Jnn%B
zkJY?+1yc<L7BwC{wh_B4zzt%g6B(5>FkqNi6lf4J?rxR^-W0g<piw&X3anf1W=aS^
z&iMIhMksY+(Ii#vCa2MIuag7!!f$1ag!8R<WO60QE-Nms-rDS6gN*_u;i3#V$9u3p
zWe|v%Z@>^8ybQgMsQ1GCT>bH`^U5vD$5GxD=QS*naB)Nu%r}1ctK!lmqf&Z&@Q6Ui
z1a)zb{5Sr1aP6m9VKPm}`10}vyRBpChrp#Nj>~uR6__W2cYhc!gNc<kXNaNK`7#@R
z$`xs#{#PYfRf)fgoXs02I$8ws)vK2;xq*3?An-+Ju#5wfoELu}mD+LktgUvd+8Cbl
z1mmY}Qg^;7AXK|zsQ%uvL5}VE5Qw--U{<TQyh4j2Kl{UT1}rZR;Wi|OSGtTX{UZR<
z?a-vv&ys1Wp!RzrqTme_*6nR97JETJ;LZ#^Y*Q73qo2<JChcsYx;3$oei6|Uld{%c
zSPc+)DY<Hu4NRh^f=p#FXa54T9-`TgC-Vsaj|-nqfmrrMRT}O<TwpvNmc*u<QxcGO
zNv@Cn8}*NefF=YzDpt^0XuXR{hG8mcL`>{uVES|Q0ujaYkJkx*yZ+D%5QeAfLBR9`
zV#G_3^m8r!risI5*y|%e1sci34K{S#=gC|DUH6e*gLScw!si+&fBm3Yjv^wOrIS$I
zVjLuifa1Qq@A}Kjx8LF>XxHz6=e+|qy4?I|*E>=tzAn4nQu%*8LEcM%SUO)h0}s2c
zYd9FNE;iX(?+=j2#N^KIF5W7>c}k;vl1xmF=OBi43Mj(<X^B%O2sq&fkQvKT?(loX
zxiQ8Isw6|Kfpq!3%Gq4$nM6>&GB^bwdf0$K&0im@!mn5SRgHksCKt&ZHE;rixe}83
zSocQ{f6!rC(akjzSxUijcl_tmESxkA=%jyp(QXihTdKPKpM;DS)d)Sj{z?~d)>3yl
zekBCFH<!@|n|etr20+^LH<KB5r#_D`m^JYHXhnV{?9$t&stC6r!*iS14i67E8<poS
zl#zrha6*!<b!=jm{A`UAmCor*_75<bPNa<8MR6ZW@AdB)A2C4^9fHM&c?OX<a1;kw
zeaEMbycilNLrlU#>VZS~bbg#2x_y`*g?a&uH=<miL0iue%f@$dwd8|i?_ys}f-4x)
ziocPc@t11;)?<cOY_gHisDYiy!kb_}NewZQF%2hVm;L4kAYb8xOuAE|q>v!CARM7}
zINY*^{h-mhjpRLReI~etX(y+r-iW){(^ne!xVR2aE~6?dn+OE+FdSO3Wb58}PY_|d
z)?n7EjE#Nmc-qS{d^R@+DU8uDC|$u{Y<F$+NyZ1m(9mISlZV8LJjeQYGGF(HNDqO4
z9jvS9rHfL)YF+*xykiB(#0a-7TPQ_O1n~W{D*ip$4x;$kn;#Ex4F^yRs^$QLvsZ8T
z$-e=GM^MQ&cU#`SH$5j0c>xEYS2S#B?}>quc3D{&^ggpfIG`q(rMIf7Z20Lf-x{dY
zZQKvD!}l*7CJ-zcLf1Yzja4OB2L6#;nQT&~_%I_UDA?1xeKZp%Jo1sc-cn}YZ>vuK
zc`kUEV3tSUCK1Y0&U;;*VnNt#J5@acUecoE1_;s`Yq=0V&A$(?&=b0XM4*2Pd=6fq
zNlcVwCRBqmUK()dku+?5v5I}7gPCRDs{TDkw=JTnFLaiA`9&CZiPSF9Srnz|Z;$RP
zJ&etjo>{H`-IG32&}@wj!fPeRYB(7-R@UB$^l2}4PR_7-KcVU=$kE&r1DF=}u@diL
zy)EQZ1@><=oI$SQ-sjlwfK%`Zrg#?vT2L=5NRcB-wWAG-^zYap8U>r6)kYf3d3h=T
zpT|-_`pDKn;i7kI5{Qx(im*xaD5>h^$Vfd<yG=b&!$?wum!1uB2X9ZdfLZA^AHeD8
z)bTb8idae}F>LNrU?!S+E8k*r|1;zfpr&p$g#<GoQ@rE~m)_y|w9iz8h_JR1DVK2>
ze9SiQXY5w7!ZwG&;{}>yXF$>D^xTSRR=nNu^UP0F3I6cX89>oQUw%=NFf<=jgGl9n
zWe<?uwDp-rZ*RqP(t}OCg=HWU3)?jdnN>tDUvkn>6)|4ATyg8cyP45RGl6rYbMBb*
zN2rd7<zm*)Kpc7lN)sr@E0Dq#zOh`B*AWRIdABIy;01_`Z-4{^3XZ<QBfF=@eUbyn
z^9aHZsnI~w*;x^vJ=PVPR=j{rmiJnM2QD0e@aUf)9<bvO#)pC#s%vW24hxC(EmkQc
z;4P7{Xcex|2CIBEdq8`lychbiyKR`_Z*%kUeFM3_=3<`iw6@-!O|m{-qxF-9sE%1(
zArE(B{pD+gl2uqj|0L1r%8LL^#9cYptXc3$(Pe`UZLo!N;jY}p<5~;2+j@!hS{R2r
zt`u%X;0aKclPzI+1dY-TI~7VIeIvZE)vwUT%zatAB#P7U1Wbt_n$<$13GVn!M|l1A
z9xfZ|YmJ~Vje+M(<u?(^wgaXt)~-LNSArqlltXcdb7|z}$+5ZPYZ#q9G%HXodHC>T
zyMH;7*(DFOSX_wbLw|y-Dh{YjT?00qXQ2KHo)Cxp!5R+jN7r`{<!@`ytK9Gs6SQmo
z!407!Yk{>O)J37QAg`?L{p1l&6&F?n@DK0E1>sT)pC137Zak8B_?_SKd-wq8j#Lo$
zb5D%<gCRv(xmt^z(Q9N^>fwtRN>IeaecMVmVevF0Is)(;hVp`Y1#QNk{V)R!A)y2v
zqN7<S8%=+g02y0|ABBR?9eNgiu<%W!pR)hXpw?)t();Y?dO|*D{KSJfWr)6}pvPpr
zzqrak6<E4xfuw9my?iHjD6#Omn_KA^*L0e(<rfrLrleyBC9Qf#I{1>(yfrERd5bs=
zIpJM0G&2`_Wc*lyKsK#OfI~wclPlbbh>R3tBcYKSAHtyg4-iI{m{!Fw&qrbZ3(m1%
zsm>IOr*#68=B0eMn{__UW<WxxFhVo25JD_V;Ypho`!~pobtP=T7w_VN=$p|UH^Hd`
z=Tfv}o~5SJeVV>AP-J+qJx4T^EQMNy_!iSS79}Kwv>taLNPJY-IIPw}%YH*`{1|r-
z_3%azHua>ZYo5ISUu=mbCtUQaa2oXh$lQG|=W^J#VRR&cVu!5Xc#BMwcTW5xjoYqQ
z@S*`2b+jl)@l}4H%?}v=YOIsxEr6Eu?N<5l_c~u!RQMD<rOJNhe_&XFGqj9|P)tfD
zN~OLiCm<HcdY!A%12P9hk1ov8#LufV%?#-Z&wJ_rig8VyV*3E5lsuA?KLpM#TUR<h
zgB)%|BIEveG({4YRo=(8#P21o^(}>O{}84%sB}Y2imrrd#Z~?J<w5`OXR$VjH(ata
z3kI|a9tHyDHJ!5S^mf^mg81X20CZV@!C!2FYogC(+&Rr1egjs-d}^fHoeSd=2A@)+
zQEX=j%d$ybtTc1Pm%BNM1Rd-H@|<obp!CD>a>ciyr>L|<e5@Z_B+N_|;Vp=V8*KQO
zG=VDxZ#KcQe|?l!)CdHk05FgGP^q}~=;&x@bGFko1wKm)QFx_V#zY>0GmB>5Nn6(t
zW%<7|Ly1VP(OFOwnY6lo0E92=7N=XXU^H|>=BrnuIy;<50KNr`Dw<BVx<^MyXD-u_
z{3~BH@^B!pE{f<M{&M_Kb48d<F(CDD7FSDcQx9hSvnihLd=vD;Jiq++4enT17x=C)
zUZ8w}@0pbTg>W(acze45(23<%BhzhBhb%VCdzMxs+RJ@jl)HN19gAr-%QgZG75=_@
zhCGqKJVL*%?x8J*C*|&Yd^}cy^i{Ij26QB{c57N0(xzNWb*J37GGQSRLS)UNCja9&
z`iL+$i`biN0t2FQNK#?;z0Wm7YU4J^9)axbQcwr<pqHQ*FlTC>Nu~4UHo@H|mm!we
z&?kE;AE#5_fL%Lyx?NKxp061e-?e}*wZ1n5`abRcl0Lzlw{1qO>Lnz{La1s2D!c-~
z38g6kiP+8u9Ziw1XT@ap$%oZ@c_<<$c+b@5S=_Ol=zk<YIsjO#)qTOByairh2269s
z@1{q}0=sB_)Kl6?zga5OM?o>0?86UFX(>K_0-mwvZG_u}4iK$u<7^rNc4s23IcU0L
z4cjp@9-s$#Ih;l*kN4VhoM*i8<+=64jnFD^)VM)p>H{Xm5m>z6iO#ia^Sy*3>Q>gZ
z77nt{CHybk@fy?^SLaKZ*LMC{i#K^}g2yeDUzL}M=b%2+Z;=}-@$yCvdoVSKsNkTK
zbS57dbmOijiz@f2|6iLXh7(P2oFL*7$sQYSC<M$lk4)U*@v_i0W_Gl@2tR+9a}N=D
zc={@P7IfMfn!Wh%LV_^cg@C)#!e_!bQsp=5pR8g}>2bO0Q*_e!R)UAWYbBM3-LtIE
zUm?FbG%Ki>mQTNQ$ZD}KyN2Y&cP_1Qtn~zbu(~JH>VfLNPt!$0SmeZ^;Eji9z|SPY
z5ESJhM)^4=g&3B1w(;oiO)iSjsW(aZ7;lAWuGQOH`T60lfotO-Z}(AqM~6oX?z=_V
zJ&lEI-<9t%z*`QMH!icRl2=7OufwNAW=P*DXP0z%;sw`D!xan{QJ3;8EaxymdZJ77
zoqA4Z&HA>~8jx-Q5u^xV>Wl)u^8tWhmL~!?=CLERzshV#nV&*(J%B_BJ+qx0J|6n~
z%%aD=R2ll~%h--Uy&1;PQh+0?1%|n8!B4^2%sKisP2kIN0-PZnzYDY~vYT@2#@kdb
znU(9{YLJr<E^<emkDPRg6y%kOziGIDF{Xez^iF~uIZiQc+M$eke<X}S$l+gx!LqSF
z`k7J*c-Gpb92Ofr1#`g%-|xUQJK@$|DSqYsxj4_6JP8~M+;fUx5gCJeB+m$_xXW)p
zDC4CfqBOjW74rgf=fqUE>cl0K@fqL(CSC$j{5%-c9>5JC?EV~l;<}RQsL06LGyxoZ
zhaT#o;`ycU)%$Iv)W4b^d>ROJXxX(5$#H_faO{JAu8#;B6A7)*nLHD?&t>YW+V}K|
z2hHJYm4r_t5MGx5K|DIly@*gxDx!Hem``txVy6EhnD_D$hjWt>A&tn!hxFVwG<le~
zbJ@dGBTevpbm#!1MDlbVJZ;_FM`yAsGN^v5aY*atRBjtiC`av#v?ZfT9rGdq&y_&H
z>>6rVm6{J+3^bGp_+A!FLMcYNR8I$NZEt^*bj9q&+Pw#%I1GK1bLYXtlkl=<U~vDI
zO}v4CQE?tfd`2wo*JMnWf0i(Jqiuq25>1D_L;>YEFAokkBR>=daBw1E^-AFzw}eeH
za%@aYjDqDfYA#^CcJ;k@meR5bu`QmTBml_cl1Q@1{jYRVd*yzc_oRjrDn}+70!>wz
zyx^@sUciGz!OZa0Z%;+*4ZrR^j&*b;e~VsPabAq8uxe2an2E{R=@xFn@y-B+epF5<
zoqa&50hk>Rc*3U?!mg>S9e+>DK!F<oULGHa!?c1#4FFK@0K2}&I+J23F$qbzhc%$V
z4{OAom2PW&#FM$g8qKmfRxM{Bzz-JXhJ5`=n?FLi8rvF89J~XVztT$T=KJ5YUyVaH
zEXnhw%<+el0I(s@{CPmkhMjHvJxkKPU?ZX*c_r1`ijw4Mc-8}oyob+UflI{?$>2<O
zU&Dx|i`sOQ-hRj(y2UOi*m^9UdWD^UFW<gDM<EjL_bJ^|a}&ez<lrCbIe(7{L$iOB
zB_-z;k-(mQ<<WiWR%W%srW}&>z{SrhwCFMxl!=32G``j|%YaM$?$t%d#Aua&?!(WF
zgz={^cpqS-*eKGKz`DI4npwpKLfjj50wSF`k&qW*Ta+nyIs;7z*Z>X=_Q>Eg`St2>
z-6suJqs$%GV4ZDG9*&mZPdgLLQyK)08dufknkISI355V)ig#EauUX4ys<;kx=9YAx
zpPxl)j{(X0ZmV3nf&G_}MqV^{%hw!--@gJJaV7~R60M}9M90Xeh4*K&S&x^4o!#G?
z9zA+E^pb4&XGT@@+Yg`dBbymHrY!m~mVi;a0Ay3l13n}yDxYNOL8yUH-z_VreL(Zv
zk6=g7_q4_3eJjNO1_dGCA4ttSU~R)Ef>y6x{M+W2h$(|QiXqb<2RkA=+t_kAmSpbj
zo%Aj=H5~UR`|T&82{pSw!f*f%EzJ}h840l^Oq8R=V*vPM4<<l0vi#KC1+1*}t|r+3
z5B9q?!esdP;T?FL<{s0bsx0YOEZ`6;fZHsm$7*_avy;u&{~Lz=&0xHA>*hb_EZAp&
z=9{Lmp<r0Wm(<?t;~5`6+<wOps1`954WGc%F6Ne4xI)+yzs3Iy^UboHQ!GhtXTTo2
zSxd#RSvH~!ik`!xBQV0Xg?stn?^-rlv+>Qdze&M&UzFc$J4mWXesSXlLI*ZV#RMAl
z(nZDNMbp{B%cyMbcA`dOhh9Xe=BM&>i1?)O*mNhE9!w7N<&OF5?;i{9Dj4+d`%mN^
zDJ_O<0MguZax$?0FsnZR*Yb2eu9D^Drh_PE_<<@K_MIHUq($F&>_ccUPt|z1kXf}L
zzx?t^kTIHCqarBY71(rEaUlGUin54^1c7=elj-FF+2+Ne{Wo+F@cS@Aj#6%z%p|MU
zt_CXfBYXMRk9~3it|%_&g_1NQvo8nE2X4`_aR$$X?s$;;^_t2${Q^=Q8kR~7LEf|S
zBL_T!&>9FKRS9|rpth)T!YZw^dG?4hjDNW=k`<?rQKQZc#fHL7E<m%Sy-)Y!nZ#RV
z7qe*HEH&*D1(D3Tz@tC8<`2q0#?r+U_mjtY?>!?z;ryzho3OAZj%uDn89)LT{s|`y
zQ~m|YaL=(;bJvC+<rY(2S&8?39-o0Pzz$`g#h7$FB{6EQf@i9-z!aN@+0JlLZmnc|
zCT=)CLGzyORSEE8*yej&@UgYz?_?n{%@lBqHMn`=-y}~KmH(FYVAuHa4uB=D6?~g+
z<8Ny1wG?A-l)+b((1DJ3@P;gcqV++DWpO8a2Xz>4GBm>bSH1tX9<LXeG!_X0WM;hF
zLiR--L&@qlTi)!pik4cnktT?(c3J~$8?}57!vTMbw!QXCUz93~9}rCG{i;RA!@jOh
zzg1(QN-jJrqHEkd^Q(I^`(t1ucar>VL0MGcO$^7fm-a9|w?+LhzWbZ543JTnE4beo
z{=gZYf43<_O6bQC^5x=_T#Z|-(5G{zrjI?}eUtw2<~DRjLjmzs1lgXE{F;^D1)*1N
z(wPDe!Ec1O2B27acHb-h-H*f{8a4q^tB@asqYE<%x^bTRTw2nsYS9Zi&}HS*WdonZ
z;$gSemW<Iu?s#=KA3G}J)u0<TE$01ZHitakZ1<zlazZJ~{@-6;&j_3Qu6MTc<~Kr<
zPu;5BigD4QoIy3-AGk5@jeu_H9{-Dt6kBCt3^~6DPZ9r}Ji}|yAR+fzCw(<xRU_h`
zf1#FGFus)mOzn7(7%uRkzFcF6JDs$hMT0#F_$Z%?N*@pTCk4L{Q$?>vMkqfmHHnU>
zdQJ%`(>wURKSA}((&It(T6y={8QFq*Gi^Dd4>*JO@Z6Cdzd^enztW`7l7T;$;S=}L
z^4c`kcVw!SKlHudo8}J39)GNO&%AGa$)(c<rfCI63u)ol^^l#kuzEnZ*7QJU0ZF1f
z0THI(tkT^yVz8)<`J1E5`gg?(-E`gC@Zpd*(j1wo&;^J;+E$^u^?R6E7-iJ-ikV}{
zeHH)dCnVG?$gVlP1>tB<o+js^q-2*yG3bg1<@@d`fx03yrKelc&{3Y!R^S^IEQJs@
zc5ya=Ts=?N+!@bA3(V_|iZRXwjx~-C_3`)B&>1>Z7SAqfY~dauOFk66eGAN55s7jL
zWA<4ZXn{!YjJ`53aqO*JGn;w$ma675Ii_5#xiiM^5B8ea8Qo&GZ_aNTAMv}re=iHx
zjhEXQ%wpDoZdHhOTL){G$5uX<zbYqsK`m#|NR9O-&>Xi_coPKpfoX6pD4GBtQ9@3`
zjF5{)&YAkaRZ-sGuUpS1NLR^i9=g~4V!*#xI*uvYY~}@#^>OdvJJW!Nt6K5vw1M{{
zXP0Ya_qy+%4Q2Vfeo6KoX8H$o4CM*IqdNt~D1nhh(Hb|^;&X`s7jG;>cjUMGB=@Af
z<0C*hW~`gq-ka}UU*j04MnoU7u%vzQ^B7Pe9lh4Zhe&hkl^m`RyaP2K0Rjpn!w|u)
zx_MZo_6S5BID`s@NtM2*DDz<Gr5g}WqsnYL%?zZ+oW#Yiatv|m53XPBQu!GHjETM@
zcA3sjf;;BAW4ou9K?phzb1z{Ba>_=nWl7$Ok;%}7bfw_hY|Uos#ObNNthwtwvM`#y
ztoEbH`K;$jH!61ToWGtN*nvgMLEnf{z|PVD$f9*jwymBEJ)(;q@z==`Rj0ZE(XO~w
zJ)3C6r_`i?F#G`i*=twmJ*5l&UF|Wny@XNC47iuT!{%+((_+fhNRLYG+Lr%Q@x(iA
zJDaa$qj5C=AC;(}Gwvk6=~RSG8P%YXYWAoxhI?}X?Fg;(a2oF!_rwiOe8fZFhrM*X
zyff=N;a_wgv#0<OsNehL$Y9bk@7;9z$F=Qm7Eal^fJ(Z&aMt}@x#My={(I*&!lMs4
zvY>-0vvjB6=$kXbEbv*>Ttsa+3G~bT?ocX^Eh+1`Xe8`X)OhrM6@MzFVJ{VEj4_=+
z7IKi8jTc{g(G`IdKVWB^k-;htCp|iu#h35L@5@@OOy-hUV2l{s=|nx!oJ*~Y<n%>)
z8TVonJ5hl>NM~#+^26ixAvT42Gf|_@e)Jc<HNXv=$-uveM=R*#`$MLImQ1C5JlZdK
zPhjwZXoq#ZwS{%D%Am^6mft>Oy;YJe^s{dpz(e}32-!T)kWwuV{T;Ac!XTOw{SA;{
zjet~kn+C-KRTPUyw1!-P@5QE-GwC6EEV_mZo<s|Sf#v3J+**hkk;3Y{@2^S!{!aPb
z<UpKS<<oB;^AX^&ZGHRh{lm!KwKllfd3JMHg0<VAf=@lpo=uP1=TurzL94=yOst8Y
zXmccSj?uQTOx5Ip@yO{S6#!4#rO#-32w5d$tFA%+i-j28Bmz&GIZu)?TW0QG8-ReJ
z69TJseVFoJcV1;y$~r=Q{s@#E28q`|V<n98E%LJ5{@*Fht4CM`?fcsRk$<6h7Lohg
z5cT^hbMe`VaT9qbt8Z4x^=i*vn)%b?cl)Y&N^m#X$RtUCitinOtN7TyHB$KVB~lyF
zVP$+R&VXYcW93J^TPf(TjRZ&G8Y9N5r?n7=rPVL(=~?P7BW#@@o%Nw<jGGp~AO~zz
zE`EHzzFi>C2>GGGj^Z1jQ3M7RYXIGR<ZP(K<h!Vr0NLo+J@@0CvGCXj@AQ_u^NeZ*
z&hGklzcLMAJ|vjcYAO3GK<EBKB38(=6_d;@2u<NQ7FU-~{=oMq4xix-8NewPkV_a}
z1g?{QR?;%sxzilwM<FJ@zr8(c2Efr|OH|w&A&()kWxIJ~|BT4`fzuY(a=W^bNLC;_
zr*HlKL}0%E_QEtCqQLBt53{|0n%Y%Ih&3!>`k05$zbOMIwr9n6I-^H~u7ITj3DXd`
zZg#z*5s*z)8-V2fBzPChF3kx}>f{^C$A1YJCP0%wi8O4Q_XR1%0YI$3l*+?`0r_gT
z)aUNU<FM4A)`qIvKp5Q(_CD@2;f?&AH^2t2WTO`Q9W@RDZrWj<XBPJ)yU1yB)qU(3
zsmnFFC>SHTk`K7URq(NkUky4Wn(S~?Os17^kzQYM_xnjAl482)b<?;<_dE&zEt$=B
z+BN`K1O+(61o-Yo#qN8k-y+Auq30-wQh&QAAz=^9LbFQcU>#H-UqVN%!l|78tdEkI
z&eHy7kvo_QzlNCv(@`kO9ppbMo6X8!_!ssP7zuNA$B`6jhm$7@(wJf^<cIP|juCAj
zR&K2=_Xu|-1P80K_Sq|40C$odie_guce{ZSv%Q*gyYplAJ@!a7YQnTGpMbql`zTNX
zGDpv7><WS(Ev<k@d*8s@<Jk!bN&djAB9^|G+SJi<d?5=tUA-FxR*pS)l4d1(_A_{?
z79ZgRq4y>t-NT^#&^=xpBi1s@2?yQv7*mA^P@)t@;#c0#CK&`Vo_~momm!yw)g$dY
z<g>!qS)z>09=yT<{Up6D&z{>>@hX8p7)!Y&cBsm!2!EUg*b!GJjT=GdkifX-zT)(_
za*ktgM@%}w81!1R^~e*-<Q^=6ko;Py+PaM3MA1raO%N-r?Dhw(U<eHt4IPOooP38u
zxPE})B&gGYf{>S__{{KL^VcX?z2Q;lm_Gha=Y8R5Hi6XKOLO=QgwvbNvhdbvl7(lm
z7#PDL9xp$Ao~cd!B4MPf(`O|KA9JlPal*wXpvKi8Jh!p^J<wW3%w7z-(AU4dq{i?A
zpEA5QCKTCdW~H9alq?N_=Od^A9g_SO#TJ5$Za>=2{W~5Ikpdg+=xVM!@#v0vRKH0x
zhVKT60&eTy<@wPDX0gh7LRUaaDB(;_jFF(ujc{KFc0(3k{Va#!F^7T#kHtiKV~fF5
zUYz9su!x|dt0G&mqI9ofX=i!n9B)p3xPi}a?9hvB5T&A*Tj~oGS&BfrXK<;Re|pj}
z=$p)eIqIQpd|K3+VW0Cre`QHA$Z}Jb$649ckQskrz=P*UM9<gQmhzx^Ntof0TV38F
zOU<Qm&OiAW?*_S}rRu+4erKZi#hsD_Ji}`j2^VkQQQ8D*uW9L55E8$;af}Fg!yY1-
zV?da9wg!b;rJno)=4%%Xf7gR&s7r<M5)1&N;E6Jx4|=LV5uFUMS>sPv)c<N!+4=E-
zF;z;uzy9}jk`sw#zKr{QOPHRC6Os}{io*&+srptwG@u$!*Ue|+N?S%j_fK)(qrbX)
z2lweJUVTwithMGaJOgQtzU4E%6NsX*`S)}Y#v*3wHn%XYXJ@JP(SF@z#2ueeo?=jU
z$-*Bi&Ko+Y!6f*hH$tMOMvL?DV^y{XUwnjWH*3N>Rmy9R<;ZhmZ|ckPtkrM#(R-y0
z-89<Z6S_;<y7K#O$#5*+g%{5gn8bO(@Hr*k(m9U#7G2_J$bQ-c#unaGC0yl%wj@7z
zq2cQ6_nl&Xo=%0+JQw9-?GRZ!-(_PHG@H^XGNE$VGWV=%klpoG_67XG1aJR3u&q-+
zI%s2SJ=mP3dV(*OrUAmOT8c%TuDyJsPp*9U#emK&|BI4jtvg340mkd3`Ks;C(jWs5
zr9Bg83<uom5s<b$Fa!uX8gNf64m!<rb#5!(#$Q`0Xi$87M7GS${&Z0;N;V~hlf(W;
zeXdL)-Qxa&fV{71#gfNAQ?KGBFX%2kX*ZdeKmHfCuxNj-sclkU#CBH?2lOh7w2Otz
zYVpUdOl})G1?eLy9Tvqd85rVZ@pVC>m`2vB?1*b^qTs-6dADG<aSHwtf&Z=oO?PcP
zeOkOku>e^}2R#<t<68|ja<#%c*0$sB;qQT5Iw`j0wLHW_Gx1JRn>NVLtNR*?aM3v1
z`19EU$RwZg>YxUk)zXQbxL3$WN60NaV%=F~33obamT6StN|rvnYd`=Fvmp~i^lrGd
zyov~o0uC)7At~8O_Uj`U6|it5bWlV@Ez?Xn^X4jRSLfB^7w1_o06GNJ2wD9uWS3g;
zhlT!JR~w=&`Ns@snV)OGX=Dww@igarj(<N)0;2yW0OaDGoLSKPr&r7`Dib%+Z{KFA
z13jOusK7OAN1aBs3dYqj#<d@J!L3}OC45Hwd4qEU2Z9AFz8_e(L;cZ!X*olyyIbWC
zBZ?gN3V_`RYX<b?|JW+gfB#WOMJ~xD3;#*^p<aq6Q+OzbT3uZObroiFh4a#dUDkXM
z0~#M3XCwndjPlLoQm*Xr;`4fYU<r;R>+g&Q2{i)2rHKXof<x;+ZmvFlklck<8nkW}
z_rqC<uf2S6&ErN0((Z^09MLvS_Jt=Pnd;t*O%`GSHifhVdn9+c-@YJ;eU^J9QzaJ;
zJ5=`VUocFd#_ZhD;uisn5aYUzzTY$$JuPp1E^eQwVY@3zgjxnQ1vO|?`~(){-EXmg
zi$tG8{RAe=t*7lWIyk0s#JxOuz+l#$0+CYIsr(Bs;jBF5`_!!i&?7ZB0B<LJ^`&ae
z#qn#}3A!p@R8muI3?H8`TdK{6jsbtluU1WeoPL$-H$x`Q&pDMuyXv+;vEtddDlT)j
zdiU?I_@t^)J7)8?W7+2dEM#f_LfaIq-IJ*NZrIn9(|Zd&8JJzNT9L5s>$S84{ULke
z6hgzG@~|kR{WR<R4iGPS?i^DJ@3!B`3|jH~0P|JmZz^Bi1sLUmyHdwhI?gy~?Mna`
zksEI}TdfB1sNtdrB>tw-&y-7RU^^-$Ae-OrrdP^TsoC~gTLb}q!1*sYE6jU<=^@96
z+sytV394Ipj*p3<=&zucb5P69UQNWMD_r&7BS7%1&iP0!W_c!#vOP|qi0x$kAEMC=
zMc3}xB=~{InlT<TrncTL6CEz8Z8rWs+GfOx*6I@;gUX}?D=ox!La0*Uui2m{4cog2
z<IjIr01ZnC@Np(_pWP&bxs!E^Q8InXgYWlMfm9?Wuc9;I$<N9R^6xDQLRq*GMd6Ij
za+@A+HnU4LhlS7ReIJPGwHNs%4ST;ZuN(O_^1ukKOFO{f*?KScbW^v*7k|I!6VP&+
z@Umk({0FR%-Fue%<u-!`-_?CtxCNjcS=n;lVgwRj()K;`CMYn4v1mDx7fTwKJbpbW
zV&Vq#Sni{%wM&W1XR9$Y#Ecej5~_=~*VSLASADy+`8}8d(-Db2a(NQL6x9N_2QfzS
zJg}oNnSeqF&K?FIY=^_(w?&<c%BEi)pYs=~s(B74T)L|O#<FQ9py-8U{)V00O6rSD
zPAhw|#s+N+JLs$a_0hh6093F8fGRpsXo^hbljZ(Lph;YX2GtjOmL(Dvp@05D+JNm(
zJxU=&wvL<IFzk|tb|MW@gndof;qO2&APaxhSLWV}m1%4r?xK09_Ad=%oA+VuB=7zL
z`pWr?BkoH3$u>}!#*~oVb@fr~4a#SmNov3=-RP=8!Y&I3|1|+dxTu_+tFA8!W}1A=
ztpV=pKl+2L(}rpUI$<0QK#R$+9(it>&3pxZ!G@GBN%H@SXrP#`1p+O%O>)@6hOIW<
znPcl0DDI{4P8bZDa-ihX#KT!jkP+78XHj!DuY=Fe>{k?K=XXb>8&FT}jKgO|Hx%Sh
zPRX-Yf_Q4F&ApSA5q3m8nCK;Y|F6sv3An?rAsDaX|HssKI8yz8|L0oQzD8VG7g=Q!
z*S>Z`Mnhz;D0{DK?@bi4iKZ>1WN&g68QGi23|B6FpSOB{e!qW!*L{uWIp?tsH^s)z
zeEYs&X?9``t)B~P($1v0aYV8lo5zr{MHHKtsHVeY=IOP`pMT~b12-bHklKx=#Q7Xm
zUdraMym0znVrXP6o0ycKuryu)-wxguHV}2d+pSFchVeQ$?;z2;L~ZSgp5I4Y){E1h
zMag|~2Iu37d^C4~($HpiN(EqCAHe#(zlGp<Dn<SrUlW|kP5t~=yAwE=29>sPqF|5l
z2M+k%>{!}E-{*G=dEP6_N6Nt*A8Lv6|I`F0iMV<T6GZVT5Nh{BgpC7_m%TI{ztxZ-
z4d|($iyGniLm;#eemLzsTX9SyRkuBp7@kWKbp{QoQg4~H;h@KJ=l!87wTEEWNzWFA
zA{ie%URgKI@**VVAm@O-i#xfrJuPRV;?F?wOc<hARw7Sl#g{mNuSE4=*l`aQz1n&%
zNh}RT?Ml>zpI{jVk@Q^sKp0>cm}?frrWm<O`i_(6&%t?+h<fG9{30HVYM14Kx5EN}
zi}PC_wg*o}!Nh+1y%=den)@Y9YhX4wdm1Z%pPgiM9e5O8Z=1GwU!L?%jFS5EcU1Bp
z5utPU-Vri;IyIjj?f^yojJC#Mm@>3xf&6mh*zeu<j;Se8h%6#$SMlSd70xKtVi^Ao
zQ0NF6h-BS2ZF*{m=aE-yq1cgeT}qQLK;~l5TEhDzB#npvdky&hZ&HV3ys%)+mh`<<
zzt$Gl2C^O~DV8eX_1&4BJ<nBlrh&)enIrA_hoo+b{Y`85zS<@V^-DMis52g14eAqk
zVGwNM1U-Xhsj|jT*TN>Ior6v$Q9~vk^8eqn;|)d0ZqbGl<dRR?>-;2gj@az&?v|eM
zX&<ss(!K#KCzYssZ$&sc(%;QUBEi!Zq=md<jqa)-RAW?Yxn0NdKnX`(8#Yc|wD|Ml
zMPNOZ>YfFguE)i`@8y1HBaY$WlYt4#M2@z3bDkXi@IJO~?*P*6ahEP;+i?7x_C24n
zwJ4zU-DqE?U#%}KXmso3xeJ<+em(Z<-Fgx#`RuSAF+`xVVFysN&Sab8dHoIIu4nOt
zZ%S*QsgqjX3J1kMv0^pX{~NZ&`=&=e0^jzDal(@99ju15M^^yhIqS5qIRQD{chIs%
zt6h@^cCg7HuqHSHKgJeL??zAV1>lE4yK(5wjEZnJ_u?E_tkZTNZOjolBQcW5`I4Is
z9>VZ4X<otuEWFQ1>Cs?uw4S{}0;j}(E&%Q)B1q>uHn>5&besPvpH>D8=)d2Shm=lb
z4vkg19=-y;d_(;;pqUj}(7O6TvFxN_lm5>j7mk|d4Bq^FW=lXhT$!HFf_xwk=#P@r
zdO&ULC(f}ZN+2doL@%ivuf)1tqJ7l}Fz^u9pfD<_9?UQ@Pqlyw)JpvShY+C^cdw8$
z54*y-k{KBKLo;ThS!r^-zCC0-k9XooZCC2-A#`D6py(r>+-`|$tDXUt(_>^X6;&(G
ztGLRHeqL>*Qx6G-MdWj_{Ki241AXvaTM|u`_4sl_PRxz2!Xn1Z%wW19t~4ght&-Cg
z(VJHImU<wi0$9C9>ys*9#ph%DzFh|0k18sE?PI4ae6kIH^jU!ZVDzSk^f<jZHPTsa
z&O{tsjb^jM?+f}mI6YPD-LItJS3Ko~tRwOM)bWg1g~CaD=gLmTQFRFNZOxbKGC`f%
z*|n7uGvMuT|KNByEPPS1-yEC<x<W*;SXS*0PM0swuMtf1@YMA3W*I!yT~e+TjJ9e_
zCuMaB{+Ldb5&Fe@+Uq-pjuS!J#uMuNIrWryr&IB>@{R-F{X+VOQWkqL7nb4z5@}7S
zY!pNyQ`!AARf=JD8BnYoheRAO=oW|-1~vV}%uhU|U?tTHeQZGy#>V&?Nvi?`-8SRi
zvjOgeY#;Zj_PzDX!Q*(TKm=dS)@jQR01*%Kcr=C5+L*W)y2#U}%Nj4w&FKlig1q30
zk!w~Z+y%Fwl3L(rTujTwk14=05dc?2*L!9kUEo>Y>lbl`Ad`4K@aTdnwamqez|fzA
zEdO4+myD43%;bF&2YT0CaKb`?EJflhE&#T1r_gZGxXpmFGm{MHuvrg*mV5|6AB&wJ
zB+JPYmt=O?l<7q5Un^IEg|_IZrme$oNNQJo(#}&<h-X)jodWmzIATZymQ70NxI)0N
zSUEfg&=&{eZ9rbxO~3b4JY?G4_AUBb-oboOK?Lm(XItSBUtUl{TKB;0ze*%o^bj96
zMzlh!3aHs+@AQ<V495NCu!hV5Fc;E)5$Y4NyCPIKWf{5c!H_9}yHpi@SKp9_#>WG<
z+Z|<<D8uVe{YlD8X|Tx8h-!uRD=q$gZ=pjZCpz{x0{3ab4nWN>I-j@l_IQM^K8_Rs
z?5>_l5v77$JmZhjW>Lv+1+{G7!v%1}yu<A><6++mCA#%VY+FIuz*Oz(GIc92`EH?D
z%gd3%;NSowl_$U%_^sAQUfpgt@t!^p&UUXb+k`8l6&H2h>bM%T@umz!zz95(kPFd6
zpx+^vrB6K0V5w4z=-<%<@F*%VcpteLy)1Rnj4PS->^76BkA*3RX_R;JKGg5K@|~Bc
z$0;Df#J09wsqfqU4CXr<*{n_Xr;`aSO4}ML#DWBH5iQjL_?iSlm<KO&GT0Q}_y6(E
zJ%pbW4`W*W(tC<LzSt3mKjzHWxs#g~e@0)O)$-xX-q{}zT~!+G75Y8<bbdG}@Pau?
zEZ$Zy_zbj6MjApy=;RsKzhIjk7xcLmzxG$_&Ja>RP%Ws4S;-8wL<6hr^1#^f<M$`$
zKr20sZ{Bts`UZg(X|&X`vo_}s@Rhz8G>wVFv=Dyz!*Q#5V1uiD9N@&N(SaD1*+O1T
z^MzD6faI||60HP|-`S+`^#VUSaucDow29vkJ#1OG2JMlQlz$N(T_kqf(Ym{tL|j*T
z{~b9%cIpLg!C!z6;B+cE{e5v+x7fca_fA4^QqhRkvDxUL^@BF-1=}6KU`RVBJ4|m$
zMt@20l8>W*0yaIe;U_nDk|>&P-zkB+Wha6EUT_4_BNl=c*1Xwh(Nn-r8U#;+J`N+i
z%<Qdi?5h4|H8C6@@o#M|P60)~V^dKTCUeHr@#yXka6;=!5XryM7YstYJOmX%a6Cee
z(u%wN1mgpfqsEg#4{o&kQ!7z)T4{XpEBf|#szM=_ZIdSyaXanvwn`_N)91Q=5Rs|a
zYCjG|uCYjI!pHq!+S=w*@!j)#DCLg~kOZcXpKPnzhKqs~Lh_u=uGXH7tM;Yuo)VAq
z!lc!Po?x+=Y5!#bfPzJ`6!^dA2m>Jk=Go!K`r$=iKwK6a4^IsO0v#uh<x6ap<_wGV
z6@+|Ceo_G>%@*xc(gT=XF_T7p>KLhK{E#zYmy@%y%A0eyXNtSUCsB~A__VR<0<eN;
zg|E{!wA+FdUn%8k`-MM*w}z2s?U(J#vBEG`J0t5Hpsy5YjJqTv8faVjdpPe*vRS+j
z7XCtwhO-c=aewI5i!<JSt=c^GyFa7j6kCN-eaHH;6runymLCY~2@MQ7F;VADJ$j;5
z*f<6RE`BpK8Cr!QDasUKzKp+MrhC>-Eo*dpy^^_Ce+2*Kyq}$etiz#7l7ToZo~p=D
zz6gW)hVP~k%UP9a{#MRJuN6dn3(cuy+&io>`19h8$U)AiyU<kEVcE9>cjL@5ETB0m
zWGd#wlxhaE^@|AVw#G3qR%1>Eck4gmg8yskx}XdR!`8opoBaUO?a;`p`j-AWZKzC3
zSgV<9;AXsvf;i#N?_c}7oZ=1PlU9Ap1{23MoPSOZXox!P&Tb~R*mi$lXbKqZ?4Q1h
zp`5Ya_iBsDa(!0W$R8%iOhO9AFzwm5rLQ)g?@pxX3jAwI6M`}RimMj#dtm;LurF)i
z?MMuVr|L!}^(TTDJSG?3i{dx{q-J^N_}&zsXQg%ofV?^);6(#cN(>$kKscMO?y4lM
z`$*~qRyd0tT`)_44v_A-=jv}uM#q4nWOp5kJ}PanSQRH=B}*Z|VSeM1T2Y8Wu+xSV
zLSbP9Cq>JFZunE{OW+BUYH|xLKhBwbblu>)X#^<fhyc>w_wx3mZ^5z#nsE0)8NO|<
z+K9%niyX>2?H8Z`b1DCLNDijhR{=Vc)j5CLBK+&gfB(f})(4<G&jY#4l}R=28K1=j
zA>H#;0@%{y{nb@6Y9w`@x{F5WcPZzYY!i){CTqRK=)SJRV5R*j+s3ZoZe^#F0SV0b
zuTGl}BdXNlIb;XE&87hdcfDA0-1-D8fMuTyocRf*&g1K2L;mm16}>;ZOxpHd1AB6K
zTZ6qo;ImpH&=R#!5IKUeM~Z+`)JBEtyo|?AE2)u(H^Z4AJlpQJNNf?P!y{}Eb$a>%
zuFp*%J7CKN2;?U^WA+l5<WqvjHSD^HptPrPou@Q`JA@}&j$Ns**!~P8;V61F1RK5U
zdyNJ(2=2N6Km`$^V~Mtz3jgi8cmR5^UWkNweN!t5%hFnmPG7-LB<$sFBHU@h7?0X_
zKQNLB#@>5N#OXpFOOt&Aj6%QLz}R6Qa5B9e$V4r_(=r5@g2wX3_Jve8WX+!$=H*=?
z^k&ItpSL!r*Uc}B(<_2-%=wZmr@r#I)a!t^5a&A|`rZ1or+93U*j@lYH>lKNHpVN9
z$il6{OcRYzxx_E7=Mp3EjOjB$NO70NIc1UH0)(DxZy&zDz0*P#ru>t1ryp*%C?6eG
zK+kMMjhqXv02bBzs9b}*xv>OaZzY{#FmL=h@qTHvtn!$p;>>t2`|ZW>fpcaG7D>(a
zXqppx-kr_<y!cLiK`$O*$MYVOzrq~(Ry2G54YV%<h`t;pZ1<2=gd8u61ZA4RGDY9B
z`55%%nD%^k0V;PA>^+)DWtN4z?rZoT|L0zly7FHTvkWJ8bw>_m2Fd*Huh_eOIV+*S
zb{o`W?l#USRywb73(|hem4jiafadGqcRpewFq`dYq#O(ZQacL3quncWHgx`YAjnJ*
za$euW^X`rNa|#W6uP?Wo5*}6!6m9NHy=!s}|BKW<ibQ=zUZ*4Um?yGFtR>Lf-}~<0
zqLHrbiU!SzgjrIK_l(T&2Ztxeu5XuLEL&ZXTaZDN=TmX&mO!y5sz+9)L^48WH;G=d
z%eYzp>Fnhkp77|aoVELh4<oi&WOZHwPkG1{3aKU}(_Rzm?Y(^L1pr2TX8_O<{+N}@
zRa^sBZK@*8Bq<$F%*%GQp9j)rQOoH@Gx6u95EP^;M6a||;N(c(tY>Ie+9xXJy|nyS
zjyci(ptiSzAoK^JvSs175hQZ({%&%u#Ce>!c}uYTrR2Idz0@9Re;#5iv|g_vDFu25
ztYq2UNpHsS#Ir~bUaAfbKC+PKQI#+>&v6;unyf3gk#>)$PWrHr%F6RZCEp9S<J~`d
z@BS$ODcb-N>-c%W1T{DDMwG7ARg|%cwv=M=L7}J2Zs10Mr{v$e`JJ7B1JiIzzJz}B
zJGgVb67*ez;Uhq}@;m+1WR9xGFJquecx=H3fH{JDS0aP0KUyjVd&dbpwXK|u=x}9o
zq#ytf^a3Gd*TAS_V-W1<N^bD)if5j$6wDX|_RC9CQj7c@^}Pn4GB#RCCz8H6g6X`P
zZW=;8s~z~GaKn%7e|-TMIu!36`w`jtE#0V_a*GRCW9j1S@i%;dFpITm>q#GKf9E(k
z>fteRB(->)6p%d1MiK^Ki%yl6S)m}ahvE4jb}DHUvF7zai@WbNZ$ZWzB^WHbHMa-&
zDS1}Vo-(4LR^nH|c`fA#`XB@mWr&BdHD#xA*4t9;2S(U{TGqpcFfU+6|5TfdXv}h`
zin)iOa<@9;S9*yb?HE}I#@st_wD0Mvj0;5aL@h$!CFD?qJ6e24`hZO9NYF<b@d|!t
z*frk#OALm$EO5>(Ua~#$`Gmc>Qq!BtXQZ#<A)&ovh(zfz%?Q-Gf1mmIVZG&Zf5lcp
z7}Bi?L$T1ndh^M0IO_8UmEXP`Qx9P*Gk{K!Z5A43wZ0bB-Rjg)P3IQ@>~s^4MI1l;
zs69WE?(u2y;O;05#0~M5Bb%uqR)<cJIRG^5wJwO%2@ot+s;GUfF@EIc6He=O6tl`x
zYR2>0eg$~!*nAgY=|i(O?^{^nZR|G@-he?~rE2G=qm6dgb*V>DtM;1V7MK{1)8fN*
z^*;Ej{+lmC$U(=-+m&*=M2ieB?hyL+Y5*HMEM+BWXl7NEVwI#IwFwdh3P7WCo|2Dg
z&rD6!5Z3v;E#g2ObgkEEcf2JSJ$6k~Xc?BfLGYkW<}EuS9_WFurtiJQxBS30>pKqq
zMjH(nX>oq{yO;1p7JjH1f$g~FQg_%}hBxvz_6px{i5f>FzlZO4O;o^#7hUsYNjcCi
zEk4ApqRN#$+HkWl*}*rR`;;f@e?BTVRRp_ET$d!}E4>;{XY@*@Z5znOaj<$j%eOIo
zWz?XZ!L4Z<kn~bB-<ko%mfLlE@g<en$I<(78jV8lYxDl2Ai+qj+On!+#)r7wCa?~$
zsxlaDu5S|R?pn9&^*#PkQg)ww;@4b=Z4wrT<XQF~RiiDz#FmrgDfhnM$$lRE&tDcI
zlT{m<2BnZ2AFJV|xJTfz!mcI!lnQrt)LfU(G+u|5>p97&HLBv4Mc}&<yHIF-<4E@>
z@P;GCy2VITt*yH9(|2Xx3CRPVN(Gq02Wpe8v@Zm){e7}7XFcG_a>DxF8deX~!kW5!
z9Vw2r145&fP2PKu;iYkFAo>Aune)y_*}u{WX5}kHv0eA+SQ|mk{L`s9K>ZDtM<{S9
zyY<$u#857H3X8wQH@(+Gw`(0HxRlbVnn7s$07LqG(p9J=f(XZ4d_&Bv-P?!7S_ycE
z8i|z>a!5elip3#&kF#&n!){;JL7p{%Z4v-dan971J71)L6c^ucLm0ouMuGHk;kdCg
zlQTDSgwCB#pmbG`PUf@3yE%naSo)H6&W^8T9D&V~G86#}Tt4siA5W;IvhAkd7n!(q
z7UFqag~}f}3H_3Cv<q|^H29(tC{mW)0cR&w!Bn+`dynX8MgZfkn76@hZ2)9|<um?a
zfEVLV3`#cAvT?9*2@n`m_yIBS49I*lHLGksCtC2-e3F_pxTsMjE#YM~zICw^0JXQE
zcM^k}qefznnIZWgB4%1#Jk@m~=7^S%Hr#fky8+f#a0EmvPyjo<AscU0+_s!5+rIa&
zx4gj=a%)lP1ayP;+9DuI><%7Z_(VEml*X@?5f{;HJ<4^Xls-|6$bTFl&Vm#_Kr3;d
z^IP^<+@y<dI>+rlf5z@A(EL0|k!L@i2Vwt$*m2;`zxi3pZK;R64kfDWW0&-(AHLRD
zb5Ct+{DlsOd)Ew@+%FL^{#0ZznZ^8fDJuD_upOCC%j)PL&?*hgpVbU&_d63XGeim^
zNxH=OFX48Rf+)c$V`Mj6lED0>dK=V~E4Da52=>LmP--gq<V5J3TiaY;@p}nC(uzn%
z`y2qW((8iHh>OIc<HLe}pUm$60KsuR5Hp`qHtL~TtbW+lzv{TJDhM`dF}FNf&({--
z3q4e{U>CACmOGoc(wi%owg#hklHtgi>6Y9nD>GXxHbJW=Ky;m3_j^EV1-nTvSehZk
zEg{rGvs<=Hy{A|xmqeI{!*(l4O{&m9R~)<1_ttaQqW?bN5fX^v;TL`Rv%sC!shufz
zi2+Vr?B%i^k!4vI2c{Ht*TA>!7Fs|izW6Df(3j!BN>2U4o@cF3Ijg?ohy(<CdE)ox
zv5+72Z$KqS;&Ez!(%fomyB%rm@!)z@q1C;a4(fME3U<H|5XhN8_~*>#)5>ho&3(mD
z!K~19_QUgKo2e-}YFgrIUL0bUYDm!7@4tWE*g1Eu&`F*E-#0%UYy`OA%ESiW!!NEE
z?~sQ?0I;i@J!pGeW2ozc^n-zno#x*s&70y}mR#{18uD5Wt|gaeJ_3RNSiHCVqx5EP
z*U6cu_|^&!crim1A9Pz?BDd@MP9a>67|2zaykNZ>Lda=#MbBwby^mIt)gt94NEb0~
z_3fP$zR&RWZTf2=q6<tA^+w7*s+o^q0vAkH-vI)Rnk?Q+T+Fu&+FSVMFYW<0W1<p2
zeBPqtO97nU<l(VDQ}b{Fg~D_K{$Asm#YHLaCyCSWd9JLsS7;n|x8!2dHv1W+BE?z!
z<A%0Xn)0aBV{m4&gIF!QHfvT&6W1+I{s5;!ww@b*scJAvsUg^znB%_eLXQ=2qKj;L
z_P~PZFp;_-OqY||5>nGS-bWhdAWkpKxq1Z6F>-wOq}0Z6L)KR*_Sc-}KRO?1nC<~W
zAZ`pXkV?<11syYXPhkG!?rc3>K)o;GCg5$nFb)tjEn)RJ42ang$_^Nvm_G<=WOtc5
zI#8cdT#XJ#-PQoesTCXMJx9Aw_8q)b1=gBg+xK(zY)jA2r5lL8+C#Utz(-?968Ti-
zd87A&iTi&;ff(fBV@P%#S(BW@cm+((>w{xK|K$Y-1fD&W@#1zz3C}MzrgS~jR4axV
zWV8?pE_f1l9XJ_X-J#>tIU~@Cpto=^@&WZYOG0Fuy&Dm<y-@p6=wGj-8w6!2jbJWv
zrOT6Yd^W*{pW=L@q$aHCDW-zYSPGps`&*kpZIj>3mbsOJ3qIyt`GDLSvo^vp@kf6r
z55XGV@TDH5CrSzg^lv*JOMyc|baO@l*i!*C1m7eE8|2@Nc&d2&;(PujC5LV)cA32D
zfvO4BE!&q4{Lr3|iUJ(n>`}Yf2$rWa%X_NcwS=<u4U-DI-x3lc)Mh9i4ExO1hTO=o
zN~~m9bx3_T)N6M2CKAk&CE>x%W>fCC#DXCoAc}3L*O8}<q-3UJ2c0e};|%AFMAEsf
z_?g#lN-qGm3ms>EJ?-|4K(x2k_C1i823~I%<XvoV(&8@s47hfliSbTk^#&7`0%Ex&
z?LkUA_9mIqvd5^Q?H?&j4G6;Xwp+-+Uevs5b6c%tR%A;du-ivO6o=A9>92rFjff&u
zBzs}v!vPWMP=SQzn?L_rph{{~?((?V%Jsz8>c5T$UtQ43t1(WeTmIXTh9ZOHIyZeU
zO`(TBS<LWJSl?yso@Z4|kV34`WDi>@CY*xWiji=roZ)?JBIr;;y|hn0c|R&F^eX6o
z-lJN&1x4bzSghlER;Mk765cGH!93#MhG^G>4bWy<Yk?>#a^Rk$1ni3mBDEg?4J;gk
z-A#pocV4~}!M8H_=Jf&@q=_VERS}XY4?L#xU__><Bw*^=8z}F|H4v%S7KvEEv*Ols
zA+g_dHa0%M?A}7L`<T<tZTM_&enP>LYC8wH^i0i=E*<+<OuIIZRJ;-}Zw!d$qLkH2
zq8gpPHL;E0*?(}$4FrkM4haX2I|}2BrXZ7JWn8VjRKm)$>yd|V8j)3oQc#l#eM1<_
ziFmDlg$MQfsk>Hn%Ed}IDG7p_>wjR`RL?Xk=p4v@{~Bw)|A75_vPtYY9;d8OiI{TL
zA?IwLg_r{8*(ToABE=55k|TQp#$SN903DAV6v@GWA?SHF<9AXj`eWju1zrX8yzeBz
z{d}wIseIQF!1|?E8(!7{i`TPLhHEs*CIu&nr?M~UF-p(4QED|vXa|ONwHqTgE0b7G
z`%4RwGAH2*z)m-QKI{c7OYXzLsJfU`AM?vTpx8zL)k8R7lVv4=l}Tx=yxbNU^}N+7
zt(=gvR)YfPc|oxL#+S;%^k@(m|4?k|BXF<ntr+&~hwc?xUgV&7*c)35@)wB31F<)L
z@O9BMio5|$kp>aYWMO8ZH`zN9N(*Y*Tbo}UyB#rPiAQ0w(9f1uSP%d@^koy+wZ6u4
zoU(qm|Kk4NWX4FqF}dh^1p0q+H58}+{_$#Fp0|0NP;G_dpoJ@8UWZh83iQ>m;ZTcC
zY3;X1wRuYFe;Im7IwG9Rs+Xl=%(nI6QjQ-`V6@|x#tCy5zW-n)jHbgeP;(Cr8vcA+
zlqlQBMbX*yc_EdO{jVGtI8LsA;@RXoVN4Vo;Irm$sh8$W6R@r*7DltV(^5w~j8tKL
z7=1tLwygXlP_#JcUAS$iKgFc9VuLpMI}Bb@MX=q7?V|0v6gmNG4Fat1JkaEkRXU^`
z_6CmtR+nWqo1@EI#1n4)>HY7s6H;rivZ+Q)-QA%^(<qzfb9&*~xH7mH&jb|rSnpS;
zqJ<uJ{T)N-2$&D~-m_8=mI0oJC;q~fOWA-@J1))$6PvR!<%5$|S;a2{rt_c+-yP7)
z+SBo^5=ySha$REKhRCnNikoi)<`H!w!lW`4F$zb<vyLI6b9%oI%ALh0cF5;}Z&31B
z?0mGw?+>%5e|<#{j--Z<t~hJ`QxNLfLy_AHRw7hZFs=Lu|E-1>p{{a?T0J~aXdhp#
z(8Y|DNyY__X!fDrZuebHJZ=^p+<aro2&cF^SP|G#>$237G7reeK4+y`p{1M{i2{zZ
z#rAe(Qg(*g*}xNWje|xVzjQa~UvAuP2%7ec#f6^_dV)7D0kIq&%h8=z96D~XcU9zZ
zzqW~1Uk2^?vr?`JvdUIq$tzw@yCj(w5OXY=cugsdYow-mKVI4N>4MmfLffnJXB-^Q
zQ@AxE)6INkNHIC)pdEiA(uCUD4>To}OTcT!Aj(DkX~X8!Hz)9Ky~Tuz>3-tL#W@NF
zUIs=ss8c2ypFU*IkmM0xt{Yu{RIVvm0AX)F{dGX0hHlSKm(^~>qOVgSOaU6jPfCRI
zEh#^nsYp;o&~py3bnSo=O!Xl_mv>LQWlk>;NG0ciYa8J5pl_^kxchvf^Bi<<W9?(F
z#h)=rC4Yu?rxMA&-D|1Juns`D;dsr)+wg3wI}5QX2GJh?#eBae4^M6{G^R;#IzCk1
ziheDqNrcNO*xvPTKLUBPD<oX_P1zsfVfrANY5;q2hQsGI(r5&vdtLZ-w9Nr?>eRR=
zY%nCZc=h!kLz<)$(WNXa7b&3JIJzl%3Tz>nDiK#dia7!m7vuUfFLcf)Uw#Wqt~kla
zm;pI>)0}Q}^0%??uG958QXE35yKV_GT!!d<ycH$?IuV>3A#(dH!)iA0$Pv3aj1eTH
zsPgiLqXE__lTE*;X1!H2j}}EsXlMw}9`)f_58@gNc~#!b2h2Y!`@2<?%JtG;sp|jw
zSTKcF{c%sVRrB=Ez%oJ)aFQ-}>4`5c-)$2QdnVRC8Aj=1Fb_W$svA5kej-RnL-G;t
zE|A%)t~CH`)#a&>PwQ_vo_>`rgoysS<pmwz=MdN6J>h7Uo`NRw!c%VM%1>0Sclgm$
zE><eIHc8eh$bfG6=8MoD*Bp>5jTNP>{nP@U27lP2TqvNrw*#_mabA;cAlsFT#!k(J
z_-CM#QS@f$xog^*9049{AM9r<9J?KF4l0Z4@iix6D4NW`E1^krT>&$mTJOkdSh5hm
zTH5Sgac~qhutsz%9O(u8a^Z>rzla<triI7K7q=hCSQab(0hgZ10yRsRs(kKZzjCB4
zWH-6@2RL}h^U&fVQTBj+hk_IGeSr5_Ot5^<Ys)q<3ja=UoEjFs1R-+eDs)8UEJy8Q
zQ>FlE0^|<%XjOR8_Vf0InKOW*RIWaL7cBRF0SQl)dw(m>7HX(1xL>e^7q(+BfXK6?
z>HO5A&OH0s@+ve8kb=iJ{RT_!!1Y~9-p40EdPpY>;sS9_=+?Hv$WD2^l+2ge)C!wJ
z6-KkuZGf`1rN}_Ou52D3`P%;@`jtZu)OxGDWM^*TW}YD{#Be;-iRncv(w{FD#SqcR
z$F6)i5fV7%+D*)QJ>wj0zDz@#OQwxPaRKNV{uF#7$Y65^noh6S4B*tFAh)OgdXG1h
z+Z`f;7`MUMDs#xG(z=B3$H9}6Tbb3bYYh<U%C2^J)_~5Q4ssSa^a9JK3`3PDhZ`bY
zVWOP8*-pMn$S57w^Ko|1fr>AW*}xH4v5p^}1q#}uANv%u!vDf#&)|?JrNbd0fvKtD
zo$Q2)=$_5T#B*}ISW)Zy16JBdhR3H;JS#jt(p)q1@nMz`SCkUB1&)n71F<rjA<K6%
z3ZHMQ<nMCA_B*CbULCM9$M!Ua%F`}i5bwl$Zu;QoN7H~1&tlMQn0*YvPa4u|$yH%i
z=QOPXyz7n$G4fw*QcN-3CAUuZ{Ql>Sg5oD696Khj2Q3!*8wevGRS83$h?aME$P)VM
zJHW#Rart4?<N#kOBEEEu4R_^UH}ug5Fzz0OHFb$wG^O6mI>0`^mf8mB?pv*{L`9-O
zGrsrmM25E5cd#oD2{s)P@)**gKm8bsomE%T{D-fPh(Hv1yRDQ47luo8D3apQ7jXb6
z@0IH?&{n7u!r}Hss!$v5`-@<W>~m%+XD~arhBY56Hz)SqJ@3$Jp*PV&>%z{rY-qfV
z+Gz)>%y0MGoI7)ra0=IQoLnz-wB#PBHAc?eU-xXh`CqRO48}AaY#lhpS=US5Ww8VA
z)|z@vSyJU3k6D#t2FO{CGVn5;se)wpA@zcz2MM{irZ^HGZe63j)Vz%=NltfIe4}fP
z30A!%dvlWyN*(dB6Uf=EYlE{_!&%eJ2WomHAQqZgvemgBU#{`8bY?zrABvDYt}d}1
zpcUA@MGZEJo;>j*i|N5@)<n_R9Z~C^WZYnMMh`{Yu84|pVIG3P>znO%KpXq%VZ}f=
z-1fZsz2{}7ewtb~s;HJ(!e5WYEwy5ip?IK#@eq&8%-HZs5*Z1u$t11H>Z3P7_TSS-
zOvIeqVGJBH9)BC|G%AQNHer?2hvToz_YVll)a6&$%(-JTV5`S&+tAwMKGzbma#6iz
z8u?f_0sF3lZ#nr<5di|We{H=w2C{_rWs1oER>?rRTGoGm{pQk7_zUI1Rr&a5Vi#Ri
zc3r`0<tRK^u%p<KnQPqA>HEjDh958lAiGlx`*x;D=M0IOR4No4zg2_QQ*0i{I(FLi
zYX`Zozou0EVe-ZfKkb2irKb%Le(9j;Af42p4sNH;bc<WLw7QO*P4ZuN#8;MldDzZw
z>kYq8C&oXutIw=(oG(eNdO^dHouEAIFr6_Y#2g>Zu<=7z+^fS)U5PYGxv=xGMe-Fs
z?N98UQybWNc-?CE{{~wa<cel+!})2BJ;BjGKpx(<@oBu6A4+zwrNtZAi^L2KSj|29
zwG_Qvo@Q2nj6lZc)?n5u&yV}*I~A6KMVs!MZcuXS`a_p6Hlr6Y);MEJzJ-vbo>)Aa
zd#7HMBxd9V)eL7myQ@@4&$usuO7Sk^$rJo^xUzbkH~XL12^9vA&<Gzupo3xnczhAS
zkP-Se-=0(vPdAU>RMY*8H-JDYxHnLP7gGE0EpBvnzY`*QN&-1!clmKgMEP6=*pVbr
zC)5ba`JQmwb_K~?gK(A56lm<*fkE1epnb^5XEIRXBdJW<-#0@N==`Quc>{!ZSh{2=
zrltM(aI$kB7v5q<ywBpi5Gy%HGeIKgE59#0cU`x>Hz0>+BPSj?0@ZZM(SxSzVRwJU
z3})@-_zDOEdzYXm5zhPQi)`BIoqpj|^;LcZB)_c)lPS@iTMSkk80N2lTn52gAMU=<
zZ!jSy^(7gK>B1mRDq}iHDnJnTQyW-7iINEGk?quxZ?Bl1FE@}h?VX+OrAy?ZMajG3
zPVpm{pi^}6CWC*4gsbSa&g=B?OEIybA%q&Olq9Y|FgwIf7(zm*sc&P#t^2h)iYx5p
z9Q((Rx7pfigk1g%TC^BJN4>EaJ41MT5p?R&o6^0S&#c}WmjY>U^8ZeVp$gia2JRI@
zc`nvWC-y+B#o`m3FnU*wEt~9im<Q{d9w)-)8c+*KDX$K%DJnW6la`9jfco(z1rg5h
z#Sg6Skv%P{<2(XH7|?+GUdJJBL1#}C<TdZ>G80Wkm;$PDI7oJi^n6yD%CYAjTbB73
z$o>PW6A`Qk_4Ipu{1g~I%YWBpAXCQuf%#czP#hWed92vrD(mWpWY10lP8_TF#pGg`
zA~iSDAP=(Rg8c*S2!k_TwX7LUYTpx6-meFD@q(6MkTCKk!b5A<sQ?}(qEXoeC&1j`
z-NLtjZ<csA<h#g5BNVB3wu-X3?F_GLvbw6RO}%ortM+8+?+DdmQ{Bi|X!`QB>oNQv
zF@+yq-H0;mGtE-&ogUUTzuOF3dmop58dt{HANjeu+XHZNS=1?W=hS9RZJyj+Xm2q7
zwCXK#`OX(6PThWJ2af0F3$!SK_q;#Z;68ApMgak8nF@`M5@LoKYZ@wA#pvBemj0F$
zo??O8zL;5o2Zuqm)>VXJvuQEsdysRfQ?)QscRr7Wkpr1f8DhgydRbL(UXRJPjNiK(
zdO%+;=KS|rT=G9ek~9;RCzTO=Q29x%y++~Ef!Kjyln$&W+kltNh<61~UpqWnjF%te
z=-kezd-Kl|^^62^_meWwgBB->7v%!COTzKxl-7K%bx7wkBN0u6($()jJH<lREStwm
zZf3Rk5)Jd{GLk*Nb;@v%({v&=9Ax`D+fq?z=5X;+IuU^b6=U{x^Q$_N(c+zwE#Qr^
zAkbYM%w(AfB+cQKqL*j`UHjV2C7VYQ^Q3m%EAtaNmc>At^;Mj&y}SK)hdh;McKNHf
zNh9=6qyZ--xIHVf9Uy<)5l35CoO~rb;tWLRv*ZT;TF0?6aH=V;*mP&Ytd8$+hML!d
zP!L8T=JEr{P+hbM$3WwN$a5;r3OMvRM*o+wZ#YS=Gvgspm6s-ap5x}ob<VXPERL_H
z+mYwM8^Kox{7t)d;&utw8StP5DwA_AE-ORFGUcZALk8~W&Ph2Kprf@iLb$T`x$|F<
zvS4pL&aU}UTHWI&*l~Mr<Cpx3&3&EO2-Hp3%UB(NRGit+7BgA9K4XlQVz_(;V@**Y
zCWfl{yQX;_o&tMo)ypqx6<qMJRI@BwLris1;lGFR6nqhkJ^dMG`(BHb7I39PgBV}w
z@^03sWVzfIcG6eec7It5binsCm44}=v}=L&RG+!>^Qww-`>LwQKYE;$fP=+OXh!(L
zWn63z6|?lp;3-1lSzy19Nm|w06MS$)`O|cxGnf8~sXdC(fWQRF{P=qsv~g|;m0>8b
zgr$$`qm;9rcspXX)9P_u(Z4GL-vZD=qR$=-eq4TPgpbn^a)ItEo#1@@)RiIy$EhBP
z<|@B{mba2-x}X&&y!~u5$CEQ1L9j<{;MHTg-tgPc4?ar4c2<Y_e>SL&ZfNY{r)VEM
zx&Xw`dpE4qqO;Riv!r~^Dyeo4U-}G)b!VvdfaZkBN5oiKg-t1H{|~zjJ`Z41_tD;7
z^d&MRn{ahOHUlxkK*jVnZ1S=L`Mfj#ZC^5X;#S7@9zW>5IehJkAA3_JG$0wDS<z9R
ze+w$82-%gON_xB}&;tc>is>oC#ivHjWc!My$u^m9+AxbR=W8S6XOZ5>`7~t}NH$3d
zp%fVZXnN}vHC6r_<-<|(nw@AS&rD~7=0!M^24rc~xPUML;V+c-KG~DQGF!hvau0c!
z2^}s9MKfTw<FfXNtfZfmrLvEeqQPg%c3Vrfu4MM3>Fvv($lMD!N~RUDooQ!IyJEGk
zXv!fXiDB!T6V(aM%8b{}-C2?qXst6Zy3lX`GIeh)&@^dFL8W}=qgLXzt{c`07p-Ci
z&ZggdcSq;e_Ok$$!PBGdd*l8=nZrz(%3VdI3ZSN*kB??%h<@4=I?MNFB(vgPxhX;W
zrK)!p{2_XGzx!^El~}DGP{_T>QJM26dhO@svIiWtGy`Nq)ilq$Laj0L4g0I`#be~g
zx%kh3Rbm9`02W;#q8i$P0Sa}A(SL{o)S_BTxBu3lFMDlFRZm;CIR&>yJQQTpTGi3U
zxr$$P5$^D{Zt6sQjgff(V%uupN;S=a(c4=7F<0UCS7k(?Q=HFvX=>$y5Ey}Nt7K~I
zW$e_sSn-5g2U)W?-j@A3=h>O~YxPg*F;1V~o!0*&D*&1sgOWe$l+Q9Fw2+N`0_fy!
zYZI_q2#U977rY<arQ?)s`{`q9#oqA>uNyTL66w99@>3z3TqeE8e<u`9`WAp+=fCyp
z^hqr!R?n8N+8E!%TdD+OgUjoXbk0l(1c6djO4c)gNR;TjU<FBO1%X({DtuOhm#^@`
zV(2HVt`m|_R(P^o5o)OSbci*1EoYA<b)Vb)lo<QJt2_t`-XJC`RF`61s(xj4=NtWs
z{fe_Vd7Enf?*}Hd^nRLrK6I2dqNv1m5a{B&_N6#ZM$j_j9k4rfL^&FX&#NOoCq4qL
zY5E<VW6RvjSaXkgk&izg6Mt&}Avu?8v`{9LMAQ7aVGj`v__z;BN?%f+NLOmt$6Dk6
zWNCJ2C{{kTPqarP&T;;>j)G0d6xrHVhkPYi#j+}8xT)hvA$I?$<;Kn}c-4!EtkZAV
z+f}zkCiv(e#jvY+IX@d(Yh4DjWe$xkjgYPj9ireJApcZc8vz1l6G}-N@%!J}0CVab
z^4#@8{IP#?;IA2M!~X^@2F?~7fp2EncI9zfNc_P^xul!VBzx&Lp8q(ORmvrNm@Wf5
z)~Ds<n*_4WPuo_*H>Idp9O^^Xn=%(G96M;jtrfm<=1~m4cMU>54b<6?9@#!)={&vs
z?VgG0Ip6pV@oA~nYP}|a28OisswajT=gpFy5G_d>V@{N_!0NSE3KFhL6N+=egb>5j
z=@^Eb2X_zOEdMepJ}TS3qKcvpzta9@^U;ZU4z<2D??o1t+zr7r7k&?w=qWtj=zz>~
zk7M8hh@I`)MD>f}w$7bUbtTj90u8sqPai6MdH-uh5}a#awxw*M$1xI7V)-m>I(SUP
z?w3rOngPP?iP8&sGibHTcNZ1CdN8#vQM2u~<;vbdBX9k^LpNy%@{(?yh08=AcSrO+
zOygi2&2A5kmx+&<0g*v>30gp2>~bG1L`2lq!ur``>~jX%fTPtfDOdA!4)+IIw-Gqb
z3txfAnJGpiLOc<{sV)CTezLM9`szBK43IBJUTeX0FJV^2`ybG<R0sWUQn^79;u9$N
zn6o9FlcoiEt|?xy5&nAy9Ex!s6Je_L`$_!_x`SzMh{6<LJRo6>p8KIYDC)dm5N!+=
z(z$!lb_N_RnvUJT+p8tLh~&BWw$-(|93RNr3bZ9h9nlj$#F|qcfj6XdK=)T?Fx`0`
zBieU;)>A$27rhhgi>@YwB_20eXUu{#WzT!MsJcY?=Sz;}$r=u`_Q}6Y^<TtF0n$@$
zz@6-x@b)2#Q;h|7VP7QPo8QxO#c{>W$3K1s>`3l$0Uj@-<dpT{7c4=pK#p<`$);*G
z3M;#3eVR<NYWXo(o36-8oS7@DeTdJbJv!;-xzZ+U=#Cc3lyNuxt^a(~e1w_r^7-oh
z`lBZQ_RS;P$%eD2d?xufHJ#Pn)v+eg^o>G^<<?&wj+NyQ_v{>qdAem*_!viN{Tc1^
zKXcDDUX%T8o<Uju6X+fy!Ehc4LOE9rk{gJQ?a*8I_M6GKKmIl~jiQ3=h_8BpxEt|#
zgpSbTYAmi@=AqI!-y=ULwtCq+cW-2q@2Vt0>s-G=&la%!Zoe>ynU~-5|F&;S;opHY
z@c4apnvkR^44vhe^z>1}O_3*T#QmkJftm@`vdX9}lxx=1&)T6V@lpCPZtD*IFn_ja
z;CBtu_kj@c<FjJ8<3zd{npqLI*8VdMCwFMM_A!MA(T#_IcYSv3FRry7I<(p@Z)Sh-
zYiw+_Yd@K{@p$PYVb2~=Ft%#?TC*hJt&7vappow7ChbO(9I5067&e14cxP~jX-#6*
ze_Ns2Bsl%S3CJ^lT_Y1n7^s>}+z|AeZ9e5;^HrMnz^rGaE0Ilnd<uQs1>&`n(z3@&
zrk~ANeS6v@O-;0f8b=0pKbj^Ei=`3VJr~R=)^%6y0k2Unkow#$P~c^v6hiBkbm$Vc
zzr{lr(ndd1E5qGKF_g<$Hj#U~?;4wEG|*$gOD`n{zvRg^f4J2wtzEiXm}{pmDlaCc
zT-!$(1S20RyR7gfS|2|Fn7eHPIi*6}E33<xJf(EguCdRxe{ZLx0@1?pB}T>SAyv+#
zmdpk+?w{jB3}LsJki#VV<g``>xX$p324GBP?7cv$M)Z}PhqtWTtB<czXa79Eq+)EI
z+*aaj!&+TpwO~X09FXqSLJ@F<&Mr>*8_>s=-@vdWR47SucSMA|40U=dAZGH*zkduS
znFy48)YE6xO=l|`qM*~^)%9K`*XXP)xG@#vQ-d51<=CI2J5vyfd5PZ*KG{g_49#1m
zCD1FYZ{t-++TIPox~>v8;(dmw21JWHmGAng@Il!xSD$;VCq4Ypj~zkc%2OT&D_ce2
zGpP<RRTB2yc3DZF%9GLNNS0v~7!}>L%~{zN>62k7LNYUb3~JKew=(TI9s2JIK^N8x
zozv~a>9h#0xIwL6+>v5Aij`qy=Nyzrg4AaU>V<=hqh9?jw|a~ANMcrsoKX{RlSLN0
zC>qDM?tJH@m|znC{Y_9ssf<!&8`WsIn1=1=V0OfvZci>Jox@Nr@k~}~hi=0#40`Ln
zO)0x{@C%uuzoIgxbcgcP6I+$68dpX@%=8e5m!+uhua4f=&^p8I4y-rCrTl$<`42hg
z+*2_EyV=1-jE&UFlX!|4tY4A7bB^@IoAdexoHVs4mL2Ogq!pK8E07gu$W+#0D03tx
z+Xl#JZ9A~{M^@3>G_zMULsS-vzn{(YP|gph9HoXZ%Z-g7I5OqY(iqAgZMLmU#fBM4
zGAkM6F%tSfO~7itos|25mF_S48ICgHOpbxN1jQZaaxoLQ8?tJp`zAENrVUf5<9(@^
zncXDv=szy$PYF<c=;?!=%CxROq);$^GZ4t3>7PxGS3gOm?gWo(i<1s}ml<9>dA%u1
zwG7{*WfeJAXkoQQIRI<HOM2>1A_Zc12uo4e#U6V3Yj+K}=sP0MIoQnx(OfT!V}-K6
zh)&+fA5$BRX6?yQh^wNI<xrKYVM{+$4+=*`0-Z_LniY%&wrd?$7@?d%kf6n@2D3De
zBhy*-IkyOpWP^KlbeO+$U+GY1;3OhuajZ!ZP|vs++e17Ys7090{dwmG9Db%MZ=}6j
zy?nx-iL!W*p{8e^9O(^K1z7;&l<O5Mq>s}=%;RfPp74&aKmffJfO+k~&#=$B1HssR
zC(Iow4!UC0pGYFS6odhy=<Fh&+dr-YBTlO6;X(uQ>-;l|f&s3~_XBch1CMU)sBF9g
zl_tP@!>H9KoL^M1HjaObzS~hduCLI&rrZLd8>_Ro%Kd{!g_MYzUrD!vb0<V32*7s3
zuOIk?&vhQ#<<bv^jK!`4AIU%!<yOY-@{do*ODo-rwr}p_Ez|<!8_YcTi{a#gVQhbv
zk7P#{P>^KwRAfl>-nohrq703Lo>5u^rnp7O$UV{Na5RU8S@4FUml&XXWQY)P;$o`U
zw2ZNM%)yVJP3Y$RP;^oqzH`;R2kMS&=j7(T?dKci=}-AvMEx{!2Tpn}#2wH@eh%_q
zcD5K8|IDm(QvOr&WQ+WISu5XG7)#apoapTLH`0X<73tInqX@Ez#dH@>wR?~44^K{g
zGDp99|E1f(6`QXkTF_KV37i;ES|3EV=jw?r(|=)aOSM8%>LjJkf%o+MP|689Z*P4~
zviH#f$v$YDZ6kO;+gMgCHj=G!=c$rD`+^_w&Rw!6&SrOAx^%uJ_^|Qjx7{<}%-Ygz
zDhh(%KN_EV<Gj?HIWW~M9qlaD`kfX#fS$a+RN^x@t=vx2c5gps9r&K8t;Y}JbzbRZ
z?l%_yVyG*2{Ck;p&!9+=$Ajm0bSoX_qiMMvW@7ceEktFi&hK4bl66l^IiPCa$jEr}
z{>QkGhn?By+6sPm^3`KpXD#NHX_d}M1+7a{&ket<J%B9qz<f<Bgu<DCYISd^H*UO=
zt39eY$}W91#8%Q1zB$$4o@<jFY}vCp|0?^s!giqX|I@pxw5(nexeazPgcPwH+Uyt*
zIiZeDkD7l^W2;8C+c5=Gh#S-qf$=iqlZP@4rg4tngdf{?{^*zlo3O8t20HL&W|`<~
z?3g-?)U*4!ZT@QDbr+2(#Sw0=%7+{Y2sN;u4B(V*-;-5LLpN^k2I8n(&H>NQSG}qv
z*|ke4$DBsiN*om)-KcCr5NTeCmAX8=(sbNW|AnvV_7`s~iw{fREe{ZjN`mHcnNbrV
z$Ao@V5jf^_l#_XIW&${|2=M9N;2aJ=JelhiIytvlm&B==?YY`_x%{W9?*y=pPZbPd
zZ1aWo!n=Co9QgRv@7s_Z@~gwgExA`3=eMQ5v?feTkv%_u@NtlKC*}!7=j4-{vRWRZ
z0@h3(BsRe8Y0;C+8TXTEku8W3-DX`SY^i3v{u!)Xy<M@(+PQ?eX%i5)VQ=)8VhTsm
zLZ0kiV^4@`p}@%RYoTO9=VW<Tq!_!k2W|{FzG`{42xMyS?8F2i^W|uQXjfl>neJ7&
z!K96jNmlx=3Xm(F49_*89HNxU=Lj&L+(YOImF2PQ^bl4i5+p~Y1-(lCoeEK~geWfK
zs)u`MP`;$AVvf{l!-~x3YPzDg|GigQP%L`&hyfGPltlM}JKae1H&++}A0n&dNKm`*
zzKJR?5(il(87pwi%bP!#qaQ{Y1q$;RQqcaQCu0tz%_MPGNQ_WpS2LvBPu^`<_wvhQ
zO<FzjkyE%g8xhP6+pjuq+MGyy^}dmtM0Tfve>7RB2+fToAyL}-uv5-2><SlDSHmow
zwl!d8g}zsvg&f@^tm*hc2{IAlEN2I2#LVs$R9x=UU32_(eAtw+C3eF7*KzcRr4xkg
zkPb|yfnX60<aXo!02xfCbX(-BFJ=0D8`($L$6$Xd5tmQ9RmVm|Mz^*v!eb6jH$SJY
z-v%=3Md%RcXV_=jed6A7rx_D+m!(1FRq_d~+jdZJ1I~U`YWR_WqR1A<$>K)GL5+zL
zbjKfMT9u<Hz3Hw}LXo#g5(w|`Ct=IJV`VwbY&$d$$IvxiL3?Rg!vPlYVjXVaY#F6z
z&47{V7tHF7__QGGr2Hp*1b^Yz!HwY%ND3{Z_ZMA}2<<ildxGL5N8Y#8!kB4Ri#=Kh
zNDWF@RwS@eRSaAbrCO$axV5E5+Sx@%rLwB6Kc8}0hN85qi0Gy?^8%@RyPR{g6?z{e
zD>4E5$%T8>j=5ysqRZZ^(i)70)-U`vE0sQpn|e{;vs7$j;;)GvyWeKsW*i&)uR+1L
zPy=zFqi(q~xw9m?t~HTKhF4$kYXBkhUsw7H=MHuiIHOQ6B8&3)o-H8vedNpC**q3{
zkVEelIdqM}1qm}r{M>(q3DN{`a@00>m$3vTj}_!aiQHV~x$#ZJ<G8H)IgK%gV0N8r
zVEEY(&Clm^rpy)?O%!3M+Pgj<me6=k8jpYn0!?GSOy7hLDDQZgu+c*j!RHDD){!Xr
z-sfQygf#TzBo~0kr%H=|3}B#KJz^Q16SFT{)LMgk<}z-9MqlV8Q8P&6Rp>ke`)Z}G
zoPx;K8;&AOa(a`Q%>nJswV4}A5&`V!=5$;aoTSw!AL$PQQmd}w%CopT@uS1nOKGJN
z1bV+%Bzzf#zW;H#7Tc!}l{w0}zeZd~4xqFYW%R#}VOjr5Z}1SGFvRIjKdYhSm?-J}
z(fI8m!X&W!(x;?8fUCWtei`i?MZDCgQzdznhm$CKG|7*Pi6qVIXpE_pjZ?>7WQrGY
zyHy)j8@J;2-3{1BIAK;7oLNek-xkLUpPl>&YR8GJ+NzL?Qw)kV!B>fVz5}AuI%RF>
zC-wZfK|*a~!axesY;oRD51`a)FTA!W8jauyQ0(CAjDGm<jClsq(vp@!PZ?;e>4g_t
zXouKNGe5Wr3NB+iSmO&se-xt3&up?D)3{aMTJ__=t3=TphPtBhAwg=|k*<Vjgu8rK
zN7>7r{Y#f~oOi{`SoR}#y^J*{m*Y?ov)Ojp6U}MZ={F~nMIKA1bH}_~e6wQc67*4y
zcYF7~Vy!LfA{J~1EJ=U8lXJC5ez9hGJMO4`mMQJo+w@qw7dc*4n+iq_mFi9UDyBUj
z+Md0MUJz?3U$)T;z~_bjC%t2b49<#16}?adVFv@piCUqX`-=}Tr|>SBodbM;E1o^x
z|Mg^-Xi!y`uas0LoO+6lJVq;5!}n;Q`z@7SoYb86bz=4jfR%uF-c56H3-3$Tr6F2y
z!onJw!15WL-`dP$33ZFI-^y4+u$i%SG89@j=KGxE#TrT9&danK!ip4fX|n}ywHYQ~
zF~hxWp|L6op*7a}uvrx+Ls=Es(Q4UFRfUp%b9X6ho$!vK(xMb#-Tw7Lvd|8BQg?kV
zMQ4knPU9%S10be|e>3j&hORauJAJS&y8@W8v)CDAV6t}{C{ivrWP7Agpqsh3-i+-w
zOaiE&>KC-bi+<Pe?k+3PtBQsb*G5o4HXlcuk5^c@-md+$-&y_m8|l+3p^KB=V`U~n
z_3%|r9UaX1pc?4Fw|}u8HnG9`TBiC^G!nmQ8$*IM)>_DL>t_g%7NmzN(=d;cbXB31
z94K{4j|`--9Q0~Rw*So3G%Ve8g4<|ho}H(_B8(PqGyRG7xH5Ks*jngk)|sCYn@CeN
zmGA8FR=|<s?-QlpQj^-EZ>durW?37RO8D#SsI1cb{(eX_&hY$<-t|Kw^GRd*uB#(O
z2#+#AkZy#Uaw|!jY#!&Y*L^C?iy`E`l*XkN$PBPZuFn&OHU4R8B)4ANN(n~}hUO7Z
zCk6iGj_XJym5!5D^m(%XDjwY;{Cbfv;K97fm!1!6ja?NYT}m^D{%-~^s@9xS6kItr
z$974e?&vW7d}yua%tAm-PSc(DSkc@(TufIBsksUC)K5$4!W#4^3fY(M%NqXLX02nc
zEBaRyVGz%lV2r9U_j2l7kqgv1vBT%7j2m!r#=(>35M8XjkSn=aF^{`(R}IyyGptf#
zs^Jt`jOjbqtS^V_Tt7*zr4<oB&A_}k{3x(@4SqWa^SY~9Jzj@69*4TqHtQFzhP@aV
zM5!uD-YU8dg2<8{iA;HP-}*fbf)jf4`77G+ZK#GCduH~mQi9?V#`ZxQWH@WzoTB`-
z(EplNMDBh-mT&z?HpVy!(oV%X6SRH0lO%m+p^*;{wxqnTwqvW-r%~35#=NU1k!PM2
z^D&>{leN;@DXqVmT?95xSdo)RKUHoG7PL9|s!#K#yz;$_ZUK=pH9hIY=t+ThKjhV3
zEpC<v>(DQ;Ty8HBPRxvd8p#xU_lNk|z|;37`%jA#U!3@|ryTFf-?CgA*pCiFh?`sc
z02k6b2L<F>isOq*Tw&B0a~$g)4l6f@3A9Ok2NW7vz0nHxe2xou;vSb)y~B9VhE73-
zaG3{HuLC#g|KTzqKF|dyH~c^nK*&IQ&()NVcQpos>i6eBT4J{gkZDf}45r`l3PcO8
zq{m@};wzvkdthHcrWO{6&B%dOFfpsb(PO^s=%-=}OXX-V&1EjiRWiwLQcVe(zBqRF
zCjKjl+LJG@^Ex1HaH+lY!>KIm-WA@lbpae1cRE!;HyqRz96w9rE9z#EOW;9Blzf?M
zH2UrG)c9bzsy|WQjhNYHqdH<{k0FYklOmdEfk4GK!$(--|CI#;V*rKlEhmYRdoOxW
z4o}x6`-<~gXR&7p<)&V)7MgnhY1HC__GIQ1R7RjSq9=YRllw!c((Cwz!0rRI_5-s<
zwy}o;lVWGPwX^P?|Hs>R2U7XJ?;~46R>+R*9od^gD0>sKM;Y0BMWP~mW*%gdY!V?O
zdmge^<}uDOey`Jbf5!JyfByaxa-Qck?s47seO(@x(JV9hS87)lYC>sT7XaDi!7^}E
z`kcL7U8wKmX(R3N=EILD%XC(U>om?U?@WotY~dreH=A=4{w;F<6cW%sWBkNvB&j~B
zcD}xAHvIXeMmm@GR>=ypq123CZ5^Kl@2KDR5Vz1dz)F7^bM&R>xHe*&e%8b`MeyO?
zKI;h`d6Z<=ymJl*X_tT_`^<L$pjuDWl&mez2oqA^i>N4BxcLmk<l)qPt$FBa<VWze
zIiF|Eo0Cx;&`WncVQ<=~zI>0^<{jp3INf?zPLv-eFEc?L19tVZ8y_w1-yl)UjBb5R
z;2tL-#b|i5TZM?X>^opeM9t?T3&KW8)FmXPYlZyg0w}9I&cBB_<;tr&{AN1}%LGcE
zFx%-tJC%Ew53}7zpizI4kq@iIcaJCXEphZuA|aaN*=@(>nb@!AJE<o|Z?;=MSQ%S6
zYMCIg#2R~!SXK!cgH?bsk0(0a^T6pL2`$%-e$#v3KbKa1%x#~J`;<=koJje3DJ6^3
z59)ROl{Z4))_r~H)Pt>tRz$fqB%Xa2i3v6n?z0%mS0ey4HvJ4w(bR&27#)IZI4cz&
z`KU(%k_LxC^7|D)t6=i@hR_XNz;nRQxCbH6dpxx}O|^Zr_25*#@XXKHDE@{2wBKOU
zvBy0R+z?DT68LFlKc~!X3T=t=RdZq%!e=;El72cQrt%>~l4ABmrI9>&U3$)-E9usG
zEhyNM-A&#HILQ50>=e6>X03bQ3kxzPb+E99O~nd>i*#l!WWO6MiI3e!8WO2AI@2qP
z6XS_{gse_vCf6^iS<qaAf3sg2eEl+p$k_(aoIi%i*BDgW##^Z@h#01vh^0ec4$`@>
zlbSL(#vRU~;`A<k66(^AP01=~iABrBctURBaBaw0yh+DBWA|2M&B8euHTPtv8~a<x
z3mtbyUs~mir0fly{1+K3N8fX|OYc5Qjj`LCo;!_{rNfnq^DE|@lje0^7VYQ3?6YX#
z>JEElOg=%&r<YEjPUT^_SZw%uqin06f=~W(xDrtVS3f(SNt~TnyI6kLH5=O8hpgAX
zuJmnq>a8bFa-(;n1%`br63S_c>xju$1$?>c<k&4vEx}@<TN7ozD_hZ40T*F9T=F~U
zJ9w+K^KM;APr!tRK^gvWJkvLS9Bsl9>d48U6`3*Im?ge>P+6!htG|s&_8GrU(jq1|
z!afwNdD@!JXWcuQ7{>x0ycJ{&PVaC^Gxl`k$2b?O`9}SSR@%K1C0Cu4<PqOQ4w`pp
zz9~VS_ER%OS87A76vF$QB7qKr-{o)l_foX^y12gV)YDO^;z)q*ArrNyRBF?JQygI=
zKF8O<+ia<HK(L3{<txeG22AH(9^8}zGjFVP4yfW+wnt;VXF}2o<6`cdFdhqA6m-3H
zX7B;DIPJsv`ABG;YY&fMEF@vKF8bAB5+c@emzBYTZgU`(pPpF0*7kJJE6Ks^O$j*#
ztC$WERBM<9;nT$FHjPN6;jWe}(Mf?S?@H$$BC3a=-ACl{7kwUY{jGdd><zlMaZNsk
zqtJrn_4((@s6NH9=*pX82he!010uhu6-K5CZeo=zB$1%SMDTM@9?ViTD!<Yyqj@1~
z>+OfK8!^EJ6@EkmF6zx58@5O)@`CU6Ml)W@<4ze=jR(tQN$h7*58CkPGrldHV~k6m
zBTV#oiq)2r+UZ3U$3z)QWw}>d=_1jXm=bhtO<oqw9|c^YmKgNB>~nvP{V|~-;5?{o
zIcKL*tLugog^<26X?0E5c}?mOeHHMI-qd{7|EyLy)p&oV`owVLk-<paYj~5f8(b6W
z28oh(+aNt?22{X!jtcebfEingUH=Zlog<D=>}FmGPteBV@KSepN;~Osgq2#B_`BA*
zuEln_2Ns&twX&lkWJz)k7FnMKaj&B9UEaBt%41reeM6!)Z)#0$eI;RXyR)SDTQ27<
z`nXAxtSzM`x(GA0&e-s)9hmR;sIpc~d1C@F>3bGGzjp91Tz0m1zQn(s0Ik2!J{Nbq
zREhv&6XQWNmei`5EMke)8j%=0hV7-VM~D7Fv+(gzms>n&IKI73<W6#V+-;Th92F-F
zGe!b#J-?MX9gq<CK;l_lW7hzkV?-}ChwWnyIY5kS?7<z!?W5RoB|}r|Am#l`_SW(2
z!b0w0ryFFFtAhYMs+PB3YEvt%*=8@8;c3M@9Rx+6@P3JlUcZ|j%zo?=x!ALq@+8f~
zXOY`fZwV(`0z{cEdv<X}pxzoBntwfKdE)TZDnhW)=v{fvQO2P>00(|oVIr}Q8#Z!j
z@2yxv)t;esoZu|`T}PR}m^&Ny15JP`s$>}&Ra>8$yQ<zd?FS8qVoCY6`7KJI2Y#a*
z$wg906XA=|i(U3%IHjXqwC!We7Laxi=7`v6uPuvFGkPWJs_h<qAXHfV{nhoNNGN3e
z_?2Obi)Z?r#{A8bFRZ);k1eVDDRG5^jC}S>omAe1m*em0#d*YtAL{0+`q*6XJb7f)
z;#)_5W#fvUf1ID(QV#6_J5xFyoRZis2@uW<1?9%_hF0Uec();7aI<*E-oaplghI=k
z>a=gyY0JZV4fb!ngwe#PPia09m1^awh4HMi@^RG!PtYEtA7iaI#|zI96-3zw>@@E1
z#_#UUD%?|A(P~(PvzDR}SfP5Z^j>i~UBJhaQ;@0vT!95U4|bGy=6B5fB;yWfRbp`}
zjUwIq(Ds9fD=Z~;j;?)eA8XH`Z?{N8rPZe3)`pyU__NLey0?vrFXto~RjQ|r1&+YS
zq^{eyD>4=xK{1UJU{p`Mj{%FjAA4_-c;_Zbo=Vb#io2tltNjbmZuWM5of>T_0c-VD
zQ2r4Xp=-9nk8rrud{4!6+2hG}_2Y}jh@YYm$cC&bK#@xBK)!3zTMv?!7OaY)mmL%|
zg%OGDAQY+_@Wl0CSav&Z>b3?9Cgm+!jt1CH5vjPIWDP`OS1Z(xnG&99jT&2a`pl|s
z#7$<57HxX7N@Nb7cTYyfw3@dOv^J|}^DFj+`%z6Wis6f~@U4PTbRG$}mkzEoT}dZ1
zXHWOMS8CZTu_i$swrogM6r&qsqE@KSVx)r85Z!d^N0}7)oOsyB(<&Off>8d?vbv8Z
zI38-^W7DAdGB~vAWOiE2TG2u$`Xvq$-W@Gomkje+YrZ%srCzv=FuJ1f`DBO8XKsW=
zM;Emb)@_zc%HQZVYIK~1(U~AL(H+TNLa43hN&32+-fsT(DUFx9N3$;N`qW6HCA|G6
z)5_-tl^8H2rkf0A`<!jEp<VA9O-~JO6Y{O*UZM>a3ghHpfM%TedF)3Eajy6N<Q=8d
zx=KVAce(rWxWw@g*%tp}x&g(Ae!2S;)!ig=*P7?vhXsWM(&pk!so=7h5@H@#6JDVs
zoD*FnzH+9k|4|$sF2Pe+VX9b;O6H?m{B{6^oLNuDna<UWs2}Zmma<mJt6*=e6q2WK
zDTEv$cc^!Ugs(lXnuXluVD&p@K4GtAUdDz(N%mGg^+4c-3%`@|Zqz`J)~@S10{y&B
zj3J$wsV9>R+>exA0ph{tMb3xEtv+AE?LKbt)m9|t-8&BGj_^#bqwT!4Y!`BJEtWVA
z)flDenF9$Qpjk4k*)bkGzH!X-t}a$hpQ~QwO9)mxtcbbuy@?0CQdxlFT?`^QnZ--n
zApvNNj2`)=%T_NN_{|ADavo5iFEj;^A6*e7JnDCA4Z13UlU_^m9gMU$QiLKYxr8%9
zp5QhOd-flDRjqxz^$j|4gk<LZg)h9hg0@2q8n<<BnY8D(AX;Nu`02QVu|8tAUs7qw
zCyXd!3nB;<k~XgPA=`BZmGU0MH?hcCRJA~kX9Qz%ewxI#b;dmdJ~PY9#~7v9P;AMN
za^5|fichUVPmB)RMPG^c9hGPJJ-KXbo68|vLouEm08j7Cx{|>#asM9tgTT570d61E
zFJU(a%H<<C*Aqozwv+oEdo_~B<F1Ehkls$}j(4lhtC?2>fWoAIEG{-UNSwA^yggNd
zJ7M>TWpPz#e8`E<soh{mG8IGPVIxXu+SOBz(?fuEkiQUKzJ?bW*h@;2u!5>*$C^#>
zB57=QrLFnjULPn3^u2B2rv{82NH$P16|%IO4Klsq`KxmgOAWoy^FyK6zHL!s<fV6^
z4gR^ulpbuy67Uo4M>{WkUS&31>)UUPnA@0Zo!_9F3_JDOdA%B=XQHXFV}<T7&wN?i
zCtptW?$nM?SIA7jtf$DK%NI+2Mm~#<o#WZ??sq!mogNa$_fDKIe4Zxp+}=sE!g{Xf
z-|Et?5scr!wZUDn*qbU`+5Np76YXgN^wUvqHTBbD7=tY!vRR$3t2BGjh_>gEfD`Pi
zwDajS_`SAIW7WH+A7d;4egQ*KsoZ;4g*BCW*ScDr+2kaYcm$7cU&jMlJFm6-n`^u6
z(dJF&l&v#r<}W2mzI@zzDVDmFt*tz^#@SFduLEm>ooS2l5{&M$As&TQ-2@qfo!lXI
z4Elu(&S;!Z*?p9!6`VTqJN%~VxKH0{Mds%^@ZnuGOnCk><-&BoY+eD+qHoUVW95E|
zOdq+YjVO{s4hj7tQA1+%)TjIu9obD!P8xbUsM@Dfp-!JP$X-I<Cdj*0sbLFPAnW?E
z{%HyWLYVhy?@+KP<G*3yA)I6^u#%2!6{AIm#aIrOD-$W)ZIa5rf~RQ0!hkJ>5?~rw
zA#x>5evJOAXp}!${WZ}#x`0=9JJM1C*#RO=TTneZa!%_r{ev+KQjYGEG7tA)h8m;!
zzyNeCl;`#1c~=zVEbt7kKO|D~ufu}l?0WB}*~uJ4+iB&QqP+!EpMB^ox2?0QWa>g%
z(CP0EZl_C7EyJ4QQt>wx{&_noaYn-aP{ZVt+6bP9EhuC0H?HBf-!zls19S=58uqke
zSMNuPKdGwSc4^$dyTd^1cVL!yv2^;%AznmE)8hH3dGEyi`Iz_2v>tdXys6wuCpT7P
zBRw$Q-G$EG?aJIMbz)n2J$LiIYXE5^zH>VrItG@H={+1j%-O!}KnW4|gQ%?wzZ7AX
zM=!#!ArcrE7~R*0Kc}LLX9igUiL)Ee*P@O;9#1&iH*mO7Z;}6F1So0Hde>qTW@T4;
zPQCRX(0URoly+IL@G_sDM)iK?>3RN~m+eUvn1t*&PVMGn>~vTd$GAZCU-b>>44|D)
z-nrcbJ>gN3I0%<$ksT#7%eic_h{+sx?aN+Zt=ttw|9J{}_^0smHoJ<97=Nn_-wKx3
z>=rNLHgB>mSM-qVPwe_SU%Ws)>N<Ns=6jlGzOb?@N}s=Aj@e^knWWNmBH|PUwFfjm
zb-kQT=ieN?=Lo*1K)>#qrJSEgY`=xxJVGgb{`_SHn+#^uAPFs6<I7vV>%)bI2DvNk
z2uA3~)s=utS9lmRk!|JGWBQ`a&wE79Jl|%-CV0yKD!U_NF~E&~OzwexTmc*=r{R;&
zOrNY;@G3JFa<Pqxj95PPzh=INEADkr(6awVq?GH(+rQD(kEN0Ml%#>u%gl9!i}=$Z
zey7YK=}XbmR*hhSEsZw+R-n-mUX9tRVylEM*Z%U#dD;ej_@k1*xAYBkV=jI(X<Nsf
zx0h)bMk>AJ(FG5PE<g0G^MC4>>eUs{x;msbn8w}Jx7CL_f|HkGOnWAHgzh+fDc5`j
zRc5YoK5#H?D4!w7i8<i<73|eMp($5>{xHR-G*f~(D_;fC!yen1{G?z+=DCdW0m3t$
zjLT9PSPN52xAz1W?Ya~O&%RA##)LHB8<&#AS8yI|v{><BX?!zX^<^C~9z3V6-?}zx
zXm@WR=HZmgvhOiYf=Qd??&G>VUlU%Jrk=&5_!&{(AgrLHJCZvR2h{1I2r0D}eb<ez
z3Nv+1=%h)x$scJ`PszYPRkKxcZUXKhOLV7rVXJI@C{W<2l)~lw@-Fj3P3U<FDNF<L
z6D|fWDKIQhiilgQsuVKI)z@IcKK5CTk3vyj>&Vp*JMI>;$9p5A^i*U!xH2J^ta+Lu
zO8;`J-avN44)&Cj<x8@YIm0`yS>4#}P9dipAN6AQvy7U#rU;=EkEDCrk_g6fIml(+
z2RvaW6Lf~YxOLPgNSmQ+<Pq>B7s8@kVo(e4@v>kFoUBbcN`~X?RcA%%cRF%@MlVjP
z8#y4QzQ28DG6R}~l{XG%FEkfh0>@0!=W3fr>Uh`X)0nXfB4eOGq{W7s*vz{=N7=`&
z_337oM}UwF>wMT?E_{^m$feY=EGP>XlaBCcQ|viZ5|O4BB>B;-l8vDqcY==h3Sf|%
z;#IhhUaBqk?RBL3pu|t330Tdk0u!MNstem)$`D5WK&Mt~Oyf`#-0#-dYS^V=y!e;`
zU9~&~6r%3-(b66FFE`=%y_C2w;=k_m`e?*6`B>C#u5gu+w&tbupiWH+AARXZ9!#3S
z=pxp6W%J9eUA!^8c~_vVi3C$S8>h3^)W<@=6ibQ}Gs)#-=T%ovTcENXoe>)T!qcV+
zNG3<WF^Vl_l@FVk#yfkqmg>@n18TMS*HT@!Ro5yP5n2Fk_+jcnsEI-Y&PW{?i2_5H
zsir<XU=qn5w1G#)?JHS~GGb2w-mW%jEb6%ZnLel770#0FX+<CIz6(+qR_Co_-=Ht_
z<Y8lq;otQheu}2jan)}k5a)ZMoPebPht+XS?N~KY_k<YHqzP$bQmyvQH_kjJl8A>w
zw+Cy_l1wFOzf*M%K?(qOGAgwQpIIuwXVs9`XtWk>b4GG6>S!0>vslpl-yQ2x8uBeC
z4BYG~HvvL;KQ@$sIGCFOo3bx-^=ZCZhGS9~d;8T{Y|n&!#U1IYjWJ8AZ}mMQU|iw>
zDh6Bq@>h{ZHKAYlKs%5PkwoZrAHmm~E2yorp2XiNF3-u9%NIP4C4J>UQO75C^^~YW
z!6ItMvJ1V=n5g6QrO8xJHhl6X(l!1F%>_u&V+pvNS9@+)PrOM*BzJR{B8o+UOVoWj
z4q38gn8Wkq7LLX+wTzM?gI?=pL<fqTGgzsbOB3h224ruzsN*VJ-4ihIFz=VkF*3jv
z%ChgD$ni42`8b~Kf2+Zr7)lt;shiC^uKX}UL4}75JsKmrOxXz!jg3KG%I5sYt4o~b
zQ_{qQL_I?ELu!&n#=f|fdwN=uoujX*F>Tye5R=QJ_ztNLZf5U9Z+dC4%t({E96W6D
z=jk4cs_D4UjaD6cA~7>oSp2x+OfJ83+rYnSLsswn+no;%gSE8lF-Hvz4Lc<-;g~Ls
zcd{kt&Zfv<(hQ9OnP)dCzfFDXIk`P3q9TieicTnn61a%w<v22DKJ()6lB=ZOKseQ~
z+E=V@82!~oz3lUsaHS7h@wR}mhN#*0E5hsi$SM9sQvt0*)X}BvA)jE0{%xI4xBVms
zeOJHW)1Ka=o*Cm?zgb9-1hLI5-7s%V%ChZ&3(CO~NG@*<zEv!EU*Pvj;&Qg%t69Uy
z?^9!Aw<jfLbP#VBoWuRWv;2IZtEez4pNQGfs)_^pVS=wQ@X+-O56SybsS<*^)oMoH
z0)>4Ty#>Y<*km%A-v!{;YQ$Nh*|^1YwpuNCfuef)=^H|IP(s7Uzkke)m=<xcel36R
z=+HXVTKL|PWkbn_QiA!_X%@r6eWI;q_!CPC_R9qXOCA{`>|q;jYA~Y_E3JzW6D%zg
zlXx2Omc+iMgL(GSinPt(5je^#38|8GA$V*v0Tg_&1E`9+gJzI0iE5Ke-(PPwAmGo5
ze!fNKId*|bPE#AGms<gydmj$5L?tO-92omSE(T=Sw}-Pfq&rk!ai}rljV;wJakZ_3
zR;Pqf#RnN*n-A`7r+Bxh`})je=<J2MbaeE{klH}qZOkXU{Z-FAYolu9xAq0Sn)_<0
z(pHApL|y>mz@@X5Rk3^f1o4H`>rVOmSx=#PF@WNaQUawkAoILt?fzbJ8GHg>f!|0|
z>{n$h`a;s(#Khbw!%-36Ed%w(vZJDZCEhs?i>cN=sFNJjK7i*pTfIB#9=Z7dMKyze
z*e(<34&s!CL)u(E1j8?R&6IHY)Tn1P4sW!3mE4|@&S2HN7?3n5ka#I!P|$C<j_00o
z%g*?T_lgzXYX|<Om^&9NNhCwRRtLG!1(c|0AzBOF+U(LT7pq6*PJAPHJNgPvv8(tf
zjf8|}QgOzY2V8x1rzNlFl4CNfrEjLZ8!n%{Gl=DUdg%c?SjS;({Nmau73TTd!}Tvw
zkZV^YPn|WS)SXOMW1e0xKlTmilH|w{5<Li{sn(<2xqC|vx;pUWls7{u$`hL|00j+O
zvnk*x#%I%;r6eO~sqsNH{O&r{+NE#nR1VWsgA!+pLxcju;rFyl;NyVKeTxrctARQ<
zdPEf_d`gw!21VS}A44eGmcrd}&$LErg=m~xQ1hH*hr`7W!eV9@2e!ZnN{HWU3DXjx
z;Nh6BDblu2A<_=BOAT?0=&&utSresduKj<`yemfbS@f!diHUDa#i1mLsYbK1FYm=p
z`S%S)TIRuU`vZ8q-$9@S?B+<qu#Z*~I~P|CXjc`QK62MQ((NoBt3FsbQ?8A8F~YT7
zd!pM}GUesl=MSkr8$4TDTG8vL5tr4Hf=Q2XkAy!yZSNLQfZZPnAJHw9UauDSjh&GE
zxaj+R)m^!s`r<<dH@D<Tm)6SpfGhz%ZTFa66#UyO&0zQ#F1Ib!U}PwmAS*Al?a7o5
zZo?|~rJBW*w30~UMf<s=!?b~0qBREE!5rR5AsNuCG_TxvKvN3O{*1X@y12X?ro?aF
zPht0T_OaC}W1)YRpNazwNyOC2MPE6svWPEp<CWquoe?J;TH_;Fa+zb1Q~pu!*&zU5
z)NONVpilKW*N4_`nWf=vmm)lO&)<K74?-yl`=06@Q5*SzDHcJk0?iA3Nnv5(`CF#2
z+%sh%R|CoQr$rfQwmZ$N**!Tf#@RhCRKE^<H&^D0DZa!Zr^iLxc4rK1GQ${eBnB?C
z?y?F~3&lH&vW5xE&Ww`todU|q=TN!a>6i=qtfQC)lcI&arkAt)I{xn<5(c;J$9a0z
z(#^jp%LL$Ff?MIi^m8OM3dSgIY5VsfTnh<@zprMRf1O)c6?0@n9=so?k1jw8hC@hK
zEMa%3`3&tmyg8=Y=Hk*&XQBIwzv;%M1Fv8?|El#G3G7@1{H+00CWjp7AdvM8^_>u_
zfXPq;JS)%6KwpP8^?`gwH|4>-FnDl-{61NYL2w$aA5xmb<E@N;?1t>tc_53g-TS;X
z{40&`GbM-5g1>t`mOeTQmRp0b-tOKo(8ILH`e!}n`k`Ps3J78yC8ajj@rfH*v;AJq
z3f!0MVjnBmerp>BSAX^<>M+emxa6(G8@MuDs$7Dl*pl6RRqp|Y`q>TN09jvJ-&Hx<
zZ##1t&7N6n>ym}gs><!*vc>k{=ytEBcM^srO>s3ElPPy?>+9j;F*l7&OwxZJA3Akv
zv~mK9i=%ddUBtn8R?Namg1gC?_?G#`o06>3{H6?e*lfn|hVA+#+YfI>undR8hg};n
z^F5REJiWH=?GLXE$G}sY-qlbXYCXBGuU7h{5L##P`PJ8CU7LNFehTDC5pChQ`9TlQ
z0cDzm+*^r4ct&z*Q{nfbn8Kz!c$$RC)WC*Ya{iXJQAz&Tw(CX8+5}V2*0h2rB4yCe
z?x3b!uHW~dra$IIbrUx~plqlI^L{e%-z~JT-)_JieCZ52OI=C`O6&&0Ydc?1+X0Cg
z-D6A_;gigL<5}|~2OfoAE^d-36TFLB6gl@5lUT@T5p5odS%vf&22AVVL)NG$7!Z(M
zlJT7gf)lSbd{3~Ssy6#@wC}U&pju0t3p;r0R}Wube~TawEr8}B)>AfanZY{F&RjW*
zj`~J~#-4cH(_K;PvHKA8%!{Cr4^yjt0=S`e?>RmEN|_eTGX+>ZjHa%y8a}+PX7?d)
z&Fvwqn(9_J*IIDR<umm!I#5GjC)mPJqu?})7l$a~lh=&6Nc_~VQyYteHp{(NK3TP2
zhe&x0arbL{d!yk9_F_jQ7cQ}`VOyM;brd?x{nZx+tlngeTZ(Vf;Xcnjlj+Q{+avi8
zs1Ee=(IO!}x_Yw4#_xdgJMV#=t9^8Za+7oM4U~eh+0(PfFz?}&-F`CLbhzyKgbXZW
z_-NF3MjOhKcK)&+uG^_e2JPlE75#mSkoQSl5cm?y{fBG%40Hae@Y|D{uIF9RT(tfM
zP9DctS#5{PO}*ArhYs`jL}!EBwANqou;9Cba-F;WJR9eZ^=s{Nq8Hd>w99aFBPVO?
z&7PvI<a{A{rO^l{{mG*dGN+i*Ma00_szXNqwO?1owpr@nMAA$2y58L}nX{<KgG<8%
zdrh%UCP%PVqV1a}ry<}ngt~v8JG)-p;V&auuxQXp6?c$uDof+l-ab`y0)KXx*7m9U
zIA(GS(Bb>iexPmK+Nb!(Jh(~IH4%{bLt}Uk!q2Ck9@xYSYfBCyo)0!91x3RB5jC%H
zN2Y4R2$&F0W@`_2xi;btwzFk#zk7eEi17GO!o6>+zNeoS^VatsOlU#U`ugaJ6ZF=B
zfwFOPlq3I#i^$m*GzQrY9os_Ze%Wr_eD^+yd;*4@SCgQ(zn^<70rFX08l~}^qC^Qf
zJ0Q9gr?CmB$*X|KO6T>n_cI?j93JT*gGZzv7e|{N8^9`8lQ^+J($1Qj=w|v!t@bbp
zU-!M=3ehTRn+8<m1_14qX@0O>GP=@=805RNs55vT4_}<+KHAz4^Q+EXyfy!dn{v>5
z;{$E;b8aes$A*h_U*~O;4Y75Y>6vvhCMVUbD0kAz(6`!zKHqAl``!(l5~@}P9KpZr
zX%crV#6M@{EK=eKVTCt>wI{tD&u+20on)7O5z^G<Z-N-!v(0EWd54%~ZZs}D>TdMU
z85<iGifoenzAsS1Ae()Df0)Uuo&jNI^y|%jzMe5SS|b}@X8Gjk&hZ0|5#^8aj(P6e
zCsBSNf-WB;W{aIJTHle2_;8v3{%><sffi@a<c1ay*LIJZCv3k=N7e{?iB2ZVIj9P7
zez;QmuPDgfFG4=U=B~hv4R84beA<A!J8(^-jVPvyI|7`x#EzYf%oJ%RLke)y*Afv`
zu4@lAKn#5>=%STA7@pD1w|aY8Cf=+;M7=6`J~zSG77Tcn`5sQ(>^<5-gqK!DCm-$z
z^8PkCk$4`GvS*P12=7G-`t5VGM;uaL-MUMg-uL-4FN_I{l0U+tb|su|l~cc)=h@tA
z)d@XXqf|tg3{DMN+OE4-%?wWMZau3J^%C_H{{HKvN}ZA18I8FkAl}4H<loGUu`osD
z51k@Iu1wSQe^%tjIXOc^$F{o=Uc`pnlY)vRdRcuwA5d-7-m5D-r&GJdeL|M>doQsy
zqg(p?9_;m9J<EYSwkrC4)uoKCvM6VibM$Dxxvys&gVzJ`PNief)7vV1w$)|SndhWJ
zE9zd1lnn;F`$7ga_IkMj`CzJHw8Byu*>CIsTOTn?K@NukdpL%S7dNJAoeK0<MKuPb
zwpe@WcHMs8K&fSH4_aBy4+}4#6Y}I|)3~^}#bsqYV*NKa5QPMpp6lGbKoKR~XYaH6
zm)i$KN)V-R?sr|O?ZvM-@47p>mK83?V=-!FaE~<XZAQ8M6Xxw<=d54kB<rO6+N5dv
zW@_$t*GrE6O2mFxmcU6)sem%~3`zZ%e+3Hv^_5gL&T6|V9OWyR+`lFhQdd_e`1Jd<
z(u_YC?v>>!f4uNX(5f$WyhaUZ4pH5*jl-wlyU}|@Vf(r^ia@ar_t&o2#so;lTmZJ4
za$?ont$;tvNnT#wCKOBD+5<4^O)e#v&|I0U)$vBRX8k8(`L72-LDOOfPiyNtA@b*6
zaZ`{Y^`#WBHbtss<5LQBAsfT+$T$ir7BuABfOyjc(6qDv{EDgk%+PH_OVH=oc?yWH
z7rSkYmao}nU{=5UouBZTv>?cwnojbN@@=D)R%!?^%plXTU{Nwgj>&Rk984ai2sx!2
zdCZ3j`ki|8^z{isjVs)eUi_cO{^vmXlF&)%()NpVKL7LY2%|S-_k+&;O+aE@Z8MY?
ziUI{HJw4^s2Rfg-yDN~iq55DdXn&=jU>>EU5vUtX0s$fi=-KzDvJq0PsI(+>>Ma3~
z5U#eL&Lgn*>UfiH{hF|`iNXMwq8@k;*dV4NN!ecs4z~vbg~JLU5;AdLk=jyCY&Qga
zV%U!9gIkY&1&#mrIftJD3k5sFojd-QUHN_Bet9cGmf(PJY^S;<G7Y8{B=bvKC|*xl
zXa)DW8EVM{&=XXTFT4L%0eOtZKlOo00a3sg=CCu@I$CWvHtt%gbSIHVp$-41fwMJi
zVaIr<SNTaHn$i+9<3+<*v-=UxC@JwN*yIWzp)?9ARboT`{RF>~d!)nIM#J9_Md|$W
z0S9U%cpd@j(&G4#>zX6MhimP?ILUO-&ukB51tUr0!HIc9d{gzZWU>SZ!l(e_GXC}3
z1Nt@gg?BIi+S^!qG#Z-e4{k+g+ZX3f*aXWU_u$54;S?Kx|Jd9PG+N$%1x8beX?kN_
zl=%PnuzUsqxFJcte%91~KHwBgbF^@iCZ9TRV!vqOsMEJ`H=kB0Ocg?cA*%1~C-^kF
z)Z1Sw(%9suK8d7$(nUWCD4gxa%d$LCDio-C`hM<OK|b2x$~>U1{lZnZc(td$zZTF|
z8Q9EAzl3c=p^=f1n``+QHLq1gSj9@G9JTlSKTH08)qhJV{y817>H#QbGGxpQ|Lcc8
zzbD0jdNFr#xHYx)LrDji#5b>Bn|E|{JR>VTw3(Qg7|m5qAhb0sGnKZ#K=Rzq050g!
zCSPxv5MENppT|+%7tQ#-u5|0o44<zD)0=@Un)A{bE7I-A!=FWv{l>dF2mT^Roc@nb
zp^iYO9ByJBdidLU{tS?RpWB}<m=)DG!bA&O%S}E0OhCZqYffJBe#x2RL`4S~x3N7g
z!Sd2lDBCmrRnX1HD0a-r$^6g5(Hy3TxY=S89Ig#b0g+r<%DMTr<53R}9w8wiO;*j0
zHc<JN<j6aZSmyuZ{Q`-aZD3fT6+iiZJk`Gr^pCIZaPT<KweXk&R)W!j`;1c`-0Z$#
z6g`Gu;lmHN?2y=r_c<8*wFgP+yHDC>?7!YO0=M8vd6SP+U@Ktp66l?L|5&5DDOfW9
zXl<x-8E}d#QoF@P1FZ;3LHlb>y_wRNnz)5+dma9~TCZ?+BE9%1^8Se=f7`l$jz)l#
z3~K4&P^0%#QQ#>ZCMqnmKA5zH7Cp|!!q@avM+Lm8-s8X~$atu0MK<i+za{w0=;sEi
zZ(}q(*#*_5N0RWtm>@+Ut>CcK9nZ>+z3y2L{A?DaOgkB=qhLGIO`>o^Om~}`9p#UA
ztD6q^j?20nk^g$K|ML}@#AYc0tk!z4EsR!NEOyoX-W3`e5TX*qV-W~15~jf6ni@<p
z1e6{-<;+u`n|@s-H8jztS)w*SF!K^`<nrYf;L|GA1C09iyWcv>&*k`HfH?_+geG4A
z)tn@maA2@%uKYVR^<P^nH8%x9mu81Hl0PpyA&a~esti7YU{><EUB%Vda4bArTzfFo
z>;Cob%?bW~F=7ZAt5{-uJn3YY<gYCOmuH<_VBBFv@#?1-T3R;j!)>UfCf4D~cg>Qu
z!MEX@MjwXH0dvhH!0%-|%9s&Ug_GT4e|`o&J#golGpHxS{?9u8J_J%>cm<KMVSr3?
z5|DNqGnQycnY9F<YU}D+1IDg*NNSQ%(9Wms8M|W|oqE;%$KI&-W1L1|e%t}xc5+0=
zggU(_Dl+ncHqC);D=y`_GAfXAq5;f&3qg7PMJrX;CH`zGEy;kpeZ;5z-wXWjm;QpV
zImk=0aVH-&2Q>EGLVMdCjGV{;HH~ScTAbYogmk`@QkZy?<i~XkOhXfO-^7+~1=40S
zeYY1bBSSiDbX!LO!)vfTNXW^_NnYkWpvxs|y4Etb+ob49{U0FAe=U{N8rW)Op@%qs
zUS`4w;(_pE(ks>jnSuD?9@dFdfOznIF67YhtwOX4{Ut4$2BaD;;Q6mWo-_CRo@KUM
zzaym2=rvAIM=zRm5U5ZC9UZfB;9<j@{VUwW#8#!-fduwA(8VRLSup!(vB5|E7mM=%
zPe4UHrSA96{?~i__$RPiKq!lyqYS8P594WnGsM8CciSL?Pyq2IBX_{q8m^>BV_W>u
zsGRlJ>)z3j>Tky-0CZ0I?nsunY9zCa@*9r3br@Pqo0HW=UowEbJOXO0>5*-$9f{BW
z*T??+Y&e=GoeDIP>CZul6dgmRtu*D6Ct%>;JO+P00K`FxZwiuAAYw>jEA@$0HGlYP
zBfw!7f>jg-XmNjdk=UAm@M9r|Ns9y%zq-b=!>Q3yljZ?XAeF6%UW-E29MNqD0(Mq_
zusc87nUCWyhEQDri5j4rKmN;JkF#d-1h8S=a+;lfA+lb;bHBFeiMrNXWY`KKw#_7~
z^k-T^djm3B-%}iZr$i4?VOU})w?PQ%4ThUbGBfEy&KjFzJ-(!AXyul@e?Ok?f9{EF
zbi*cqA3iAQ{L7UlWHADFdQE{N@Q(|Pf_4|3<k~<c0m6=@q)lD70PTXsw9Mz^2^e4P
z+ytZ4mr;YQt+UWl9%=o0PnPh2BaEtbz<2r(Nj3l|hxN_O%vQ<eRuqM{eK9fct@_g)
zkR<!0(bWz8QC$6haW{l487Qc2dv)bxf4=qDaoERLrwG`F6_T-~Kw!AaW{9nF0>okC
zhd^1Hz@X8~t-w8wBT?Nl+O+-GfhHv0X@T06Hj%MiI@+2N3c;$Ds#vjx(F$-&f)nW7
zL8>z@ypl>hm3PGbkof)ImS>5qpb@n#&BWU9`z5Q63tS6`d0tIXF}Z5RLWF9}EZ4@N
zUXvGw>$~--6Npo%L8Ff5%%p+*yZB`NTE{fh7kO;xY)>4t<-NxrZIQC{S8JxbK@3=C
z1oP?*-D)LYAL_hTxK#((qp+%S_t5#)lDl(iG}Czu*osibr1d&<oA@x;_TfccHEb1*
z$u#Gv7cZzqClh(i+w_6LxRT3O1$T|@2-^mj=R5=I994MS4Fljn)5?SZtHy%(r2BRm
z<6G(AG2#}qEse7v(mi+b5yW%E;niJ-!tdrWP+GEGhH1qXU{q+*!+}}etPl4Witqt<
zJ4?oykA{GN&AOmF7*wDdjKBcs8{mIN_nYJ^U`fWoXqG49iMA6U2YuoZU!Arp0qQgp
z2df{n9@pm`8jyCj32s1F@NE}_S9o=(`t={xCfTu7_7jx!a0Ehp8Z?(`dfq15Y_az9
zmZ^4NyuZTc*hNOzB^T&QJGI7@@T~Jr3ZG6UUujYIw6@5@k;Z1%NzIv_9J|=>PjDtp
zyf1~+Gu@_SjyIyypysbOvLsb?zdpD&IAu8_(W6ru(5K}qY69ExC_0LS7<d<TRX@<!
z7%ky%8Pp7wl7IIFVofkr+=#YR_olm2)eSFq>XU0i(f32EujjU33z(16?ydxYO^{+X
z(nuP9(@p$H*^+clgr(?Ok4~PHrLjNhgtq)BXK;A<(G`)^%rb3vcXx_WuBmKXQV!#W
zabzkCz^oi2AhliNx&KHe#L~PsHFp8I3rSzULacQl4tdEsGtA&`uS*;rpP3PHx1D)`
zT7rM*x%N9l8>AS|z$!?y3J6o#(82NpKUNJeuy8jd@L~r7E{^BA{d)X}ot`~!o{<WG
z7072+)DX{DRX8xG&=}RSIgSnc6@Akke{_aukaiGT5nHxh(CgV0bh&4Fc#`Fo#H1b{
zlK`1^_axyj5nmF<94&kgPFn~51R7crOYC=Z(U~Q_-D@@)%eb1$ZdyrGN{YoFjuKQ;
zAl^x?_+O2<q!D&b0X(g(JUD-GFt)0hz;tc;06E&x_m3CYY$9Z^aG46e4z>hd+5-9n
zl^{z;W?~8vWlA3>SbpArD4DuPnRGB_jm;1<7+>tM2NYF#kwJhY0l$C9t4UQ5NycAX
zbb@3AGn3Kc)4cXidjG!yMK%*){+3cI<o|4<*W&|pDAoZ%S2T_Iq{R8LIS53J;wd~L
zoWZobplJ(AJs@P+dfJRI8qa9EY_ffaM!%p!q1^1}UtE6{kRA^6DU$AQ1^w8GYs%=F
z_tkxaKpOK!2iE%S+d~BKb&h}vwbYZT-K(wB?9U06`W6TsiqcZ4|MDxf=<Z<{?z*7S
zX)~fd1{-TETR!RuZB7uzq&B2gHUt^yoSvSlpRFP_kBT-&>D)Z%N8FRbe_8*}7}@hJ
zK+AO;&^mk|q~YM;P@$kX;HDaIIRumnTR`Nz3`7tiWm)~oO*+ee%V^}$u?e;1V%+}b
zow4Ic7;)P(&oD!G!8Xgpnyw5VTx=l&Q<J9Y8pj#i+)zUCk38Oon}iHVWo-w*D`I9P
zDjTiIpkk8#%ki@qwOl#{!eZsL=R4t}wN55O`(>E^#xJ0ek~i7KbTu_CkUj{+oS(=T
zrLMi5!~C-!(P97zgOcv=qxQcdADD8B<SDdBhnwoQb0(*LRTn^N5(H(mwco(L&rH4H
z(0hoBCTKrC0BFAP?CQLGs%m)s&q2dXPbDCR9nZKpT^Seo+;+Jf;~$S=gJTbEnnB`M
z{8oKcfI25M^CJ0{ojoY;+#NgGF$HOb%z!g!1UQT`Ic4A|g*9Bnx?bx2ON1MUiwDYn
zJoHq5`5jbp<ltNMbz#0~hY?7;nyRoPDCrfLRyohh)PtC33us$agNU80c&O0)rrl(f
zO*ib81}Q-TrvaHv1Ta9^jetguJ}wg_>)ia;=LGKIv25m-U3AB@oA>W~^<4m3tOsEz
zFtJpS_Jgz)Pn1^DuK^k9h&|UmCo5<E^G;yruuBE-7_q+jcj)rJOi5r48ia0<G~$Q4
zr6Dk}UzdCpQUo3B0n22Su*>o|P|7eRH*&q7=msb!r;rSI02M3)C5G^Upwid&4UZQT
zfO2D+O$s1|3TXr+Rap<dj)`IuGV`1Nf*W&jR!@xLv9u_FTordsM-(}-%253N{cW;Q
zwHkciq!z#}K>ElZ5cDIVi~$q%zZ)BfA}}_v+m+;hF*eas7w2c~<?r;XyRU{~lL`(a
zX`<~0vqKB_GTVXxhcNz7?e;j$Cjf{%!6s!hOiV~1&x=3oUmqzlC&fF0f^n;zb^_Ve
z*7oS!l763GpL7f`Qgl+9;r-Q8KNvewSn^)~KJM|xiQ)chd|Vv&&GA8`WkYmIo|}Q-
z_UZVGn$AB$D&PkrH(S{EN36c2|1X>R^LqtDXf&5K-Lm-mZnsNZoVrW_g+6!TM+8*X
z6k0a`l9q%N5g;KO&ZLvk4ldTElg>giS{Rs_W#I$j42}f^&eLz_gAJtY+PbQ$s)=vQ
z+JFTzpAUcEQ5W^gTHQql)=Khpp1^(Ro>1t@x9sffxOr*+^u8}&knV8m<1=ChFk?Pn
zH?zVt!SwnsrU(d=0ds}QmLm7>nc{zJQ>Fwi3rS{KAmj?5Or8(S1VAk>ZU*!hN^B2A
zEe^q8{P@m%d%KtZSTF{q_ecx!zPkgd$4Q{6R}6feB}!}UeM3WgfWhJ-&ikG=5eG#=
zJgR&Ved}T63Xd=SI^kDwk6qT4xf?BzDKjf!fmAc*7iEECm&Wu`Qh^2_Bh!|Edt7lY
zwte)wn()7Zcc~Gi8SpYc{PRXiH4^Pe1+rb(jPJr;@El4>Lz{dZ0ES^US-;(62PQG2
zF)$WnF>p^=<qCE$5dIhaBsVmjv-~g4Z9=ihIrS~TTUP>I^ES}gYYw=%YKn_FWJ07f
zezjWN;mT}jO!o)10vn+6Pz8#yt=c8}@dCFCI8R&}vGBEwj=w5%<BJaNd!Fw5>^1WL
z?i2W5r;1GjTpml?3eNx7mH*hT^}2xYOPXg+faDeI|FQvy=w#=l%$mSiz@o=MJp%I-
zgoMK)O~zsw;n-RuJ7H9g*wRv30^R-nYV2~iLEwNi)JVP%u7;g9b(lK6OsV6wX31Z*
zD0L{t!S%wG?xmiDDZoKbb(>Pi(H?w;^4+)GL|vahmjl#8ADHbepk!XV{3WHc=`!6?
zckiE%6iOf)F~BP<tL%SQegE%^2f}Y=(q*Ed1G?FAK=dhr!Xi~*D~G#Z$d|=-2@;v9
zL#{$b<0?)-R0A+9$NDWn(d9&QBrar@GO1Gm^PL5He=-p}fLFW<h;Ot3nda*dHX;UB
zvrj+W+a}4*$}((YEPU>)!m_6raNE(VByOIJZXNhs00E)!`U@|h+z#Gs+@+Db{m;*d
ziVi`BQm~Xt#lLJ&RX~t8CDLH?AZM=&6mq2I!IWSL$Omgc^C{ssJiMIU7?}|Ld_cBz
z7%q8AugR?$${0#1#*%2wFQG;+6H0bdCD9Z}+g;d!@*BNeBKC8eA1?yamg-MB_wfdU
zr&A^u@UflgI_LQ|!qKCZBRMI2D#0p%Lr(#Pb(s-p5Gu&`iKTh*|I4BL>z{#?gySWP
z^5<#W-^N<{CYb)>sD{N+OO10N@&E>^0S-kJXlriPHlLLgio6U8(9_ccnt>)yLGg(`
zq97W{apDRsqGg^e>qo{9Us8pK92<7Qd?x6u6`7rt+xYcNfpEGxTB?ElB|yw+2QpZ-
z-VFXTVS$&y{p>7&TcJ(H8|bWUf`TK#ydP)j$=`5#^-5$_bTp&!&v>o+3Ob35x~Y^|
z^Gim>ut+&1r#tY{4Knl6;d_K;_wT=CEz6|8d9yPzDyoNsp#e~uZwBFUVQ+Y+v{Ro0
z<|eS=ndvwliN^6kiqEf^fqG$<R~Z&M@#EtL)JvG-!1!$fO|nW*Hw=~cG`@G^lfa*k
zh^+!RMPJ@m>iqdv)~f=rux7nBIKgc#a$ainDBcoPf?N~qssP*@<H)I@N1)C$p<S#?
z)NI{`fIPqLeQ56uVt_3y$zy5VPgAMR7{BTk>WUa*iGW0QdkVChsr2V>jFr{`d&aOv
z<n1vK90o|4!e)R!1fdcCKF`Ci@kxKf0Y=zB_^4kuLGkC~0#l@;>?(@n33O5!-Z}iu
z1psE`X3J!+2!H(Gy7rJt&>lN0{A*lgWu@#$8wMWPI4GQuvoS#$DM=zte}-C_fG*x;
z?Q5=biDC@Rd@Rfd4wM$-y^f8~o&uh|!+!tsArZHAIgc{UTV#I@0yE(ll$sY@6O4a;
zUhH8k)Kb+PQ{!OF_=`6oHKlXytyr}7uWzbdF$+f)CP}VvIE+_VMwJ-Wef5H^TLOf#
zBEi^;6&(u@a$J2=gTMUq+^MHvh>5*--_jRdNp)$<I#?UJDVFhuEYAs$tNMa)#4Ig8
z!%rjxOY3tPTl%(LC9i|xf0*`vH;i<|=xi4=aFyF^lYe$?C}<S)nJ6+g^dWnK!?h(X
zP~e!ikX8^tm3rH=jhyW4MZ;elr{52P%_U|dqVYW#L~?o)`T&c}MveC)w;6td3IL9S
zr-0{s5~v;)1IL%w-QeYS4`x`9=?7xXO@JC#0TH(^Ph4DNGbPhjX7&3N_WvAc6vQKM
z<C4wW!T*(9{Q4eUp!MzDI1SZu(3Lpw2tZ}P%PQmD(MkX*5hYqU!~%eRv|)r<Xr#X`
z{;)i1=%vO7bASNK35YV(1_hz9v#}|G%xz^FjE{z8&V$(N5g56(27qA0ht&?=ztqd7
zFt7<n5BcvP{_++pXoE_3t<v1y%slR-rk5*FQlfkiN-5w3YBk6}xNH+-57aV5kZidK
zp4c4%<oS}KCf->O;%?Xp0um~oOr+=tJ%9-o&P$i%XJ)-=JXucJ0>YShd|q5&aSb}b
zklUXPfNh%87Cxb$(MB<UWoy!UV&N9shMvm*Z+xdjCB}CAO%NWkI^g{QsM&5I<B9k<
z%*)qIam8-n2_83q^nPQcNJsagto=$QSeP(KNC<Y(@nVO`+ufrgk0TqWrVmqEGYDmj
zmv<fRj`Xc3hReILRK~E84Y=e&2%11nawvJRFA1vTItERrZ_9KD$UX^4_h%*NuQ%Zm
z0HkjeDJWHzSd*|REa)dXU3%$Xpj(@!-qf@2{1bw&@5Q_`Ag#5tZPt3sVPARfJDVw(
z?n2{Iy<2SQo>G^`hd3Sh(0jF@yHi=qv0f}PX*7NB`lSs`!+?#<Z(;VRfhr_-j>^-%
zKS}a<Ud8GH;KmP-UWZ&pZSdgv_eL63K41bsF7vEDzG1*5aD>?Y<=wxW?f@x#91os{
zU>3z4iLnCxY)4$8zT{i%CEZHC@B<uDY%BsAdjMb{8y^@o88qc(Fn=Be+sXh*MJ|wY
z10oXYE4eN!eKij|B6Gr*=39|To%0zeV{JP5BT_)1NsoR+s$lVF+lLa^OEx!h+AASh
zb>&}v|Nnf|O_xa*jCK{&s<UwC0jMhD!2{6Y5~UDiCOJJlt)8?7YQmMEFn|A9+2!+}
zrN-DK&>3J@?_QDy;OMNExI}DXiIAYorkMAjnSoxcApZOyUovzjlkMOtO>eKuy`q0N
zZvScZBFO2au5q{d{`oEt7L1_LFxUerw*o0-D_x4XcMS;VxJwA<LB3Q1EY>05a+v_#
zHjbco<qC+PxUc>EyaESg14E5N3Lv6$JKXExP6>kHk#ni&rRj7|<lH4jCjGY;fd&Sn
zSOS~a9n0BCchUjlKRrnxoCA12i45Ntf37J7im=Vmw*f0V9)d%>35wMK{an@qDfL%e
zA~I4^J!$E{86c%62wE<X<?VthxrnkC#yr=N&_D3hn$iR880#lHAiO4^_r%!H@>Jg^
z#y5^fsvFc;e7@?vUYKvcI*?`N2{q1!CH}cciGr4Nv&`T#71}c>QCCCFSB5{m)Q`wU
z1<jbL5ENCw$4Y`qLN#o2VhFSa7}`3^IAyWO>4MUx(2VPABcO9yPDnrhj4ut7>_<;r
z0X=G|#BoCNX@~0Vd30oI0Z@q?`)DjYEMOv#P#pAhS;&1YHzCaJV0v}FEso0UZ<vV1
zb5IF+E=($b{(sKtzfKTDrbRXcTn+qIoUOM2-T=Dm6>;=3PEq05+W;I!tf~1^G81Py
zQ~!+rli23wTWe>1daj7Awh(5T)IG`d1wEE`Q#R+N2`JBjLUs+Z)dJwN=KEVrMoAQZ
zx!JKVfpg>Es~TYW%X${5pc07pCh{V0Heogh^YiFJ!<imz^~;73h#$nB?SxBSj=IXA
z!u07!)haNVWM}6TfSAb4B#RZ4G%8{w&u`mQo}LV_!)QF_0tIcp-mrr<iO;v@*!~3-
zqua-zwD2Rgq5n&;L#NIgh>1@bveOQtL3`x<DX2z=BDN;0`7uzHsX&hmhomGFNHlPG
zA5K`AN99*K+ME4uRKZ8X{bFTlIRUV{O#pmd@!kZMzk4T>?5m4D5O4pHR;K|f!LXgo
zwg@j8%fH#CN!FI4)9U?(LEFEqB+FaSaz!9<Y>EI15)?rsoCY;jkG>?we_#q_d&6a9
z3+V;|Z8t+<jSn;m*(-k`1S2=*NT1f)&-^INAp@7ay*-t9Y*<6Qt@YQOXSeK!c{ui#
z4V=QdLybT4jCl3_4S?$f)%L`RmGIF&hZ6x(Ot>Da+g*$?RRGNBLjt5=cEUzW8yJ_@
zB__?YNWw;B56Zn1LC)g*GR#Xq_vaR8W?8)sZo@`j{U&H6r~x5O3cr;qHUV={@<ywS
z7AuFbzP<nXe#TY+JywWPV^d?Ygy7-dI=+^GDb@889sOH6uFpJ2k8{f#Fi#(X;gnEQ
zd4R<!i(f54fPOnYfbkY8y=J3m5?T<K3CZm)|FNV2cr32z99=6taaO0*@uxah>4tZ}
z_D>?)WxX8P0fK%@tN@02<+?TKenfT+B0JyO-47bbeP=HdpZpE+uuW@mWOBmX^dZk0
zy_JUf=L8N!!ArygQ;al`?~%|g607``cRg@a->{wm3^S8^OFiusl~(;V4Gm&bpvMZE
zJZ~C>pQvB~Ew>S-JL$6<C->$+Ei}yaP-C*`^r>7ZWm`A49J;F!+%1>R%u@Skf9oC)
z<O9^KwvFCLH6XG<n&=#i`q_gO0rBucrFqc2WmP-lmvXDmQ3cj&RQUdPQQ`lZ45<=i
zpGJ`yZS<d`e3ZaFT#s1UtSA$pp5zW#t-@{ZL0T5GBITwIJ;4xn8I$rGU4Xu9NnV`9
zEG;e)GN_<`suH0mr0t4oE)5<wmz8w08F<Vrsx8^~!M)ed@HxAV)Y!{+q!=*JYx(F)
zico1)Y&zEX%9j)?WX3vAE#g`RI$8zRqzgE0HIS`G00{$FK9BdeXE%$1rHUVYmm_NR
zm-+#=W)ZN^wo8w!{_iXQgV4p^MKdn9nW}L>y19BFtkg}yusKy*3K}1vhXB4!5wLj$
zloOv3nlY!DPQC)o2#Y?~jqXdotq5Cen%%ATtzKeB0B?OShFg48VD|mvw+^!n6Tr-0
zO?ihLQ_(jj9jYppxep)oaY~38k#Kq)Q&~|VL#iGPGD~Y@*B!{mcZNVqiSwQ0G0;h7
zH~qf+mcyh#?~s62(2y%<ez_C>dhBLR?dQ(HB_C0V7kvxvXG8<l^J6U-<c5Ur_Mzv8
zwWFZ#{*|4N;%B$1%;{_AVl`ecTO{(d38MRQ<3_IuV6v5F9w7~1M<l74a45ES9QuOz
zbKUiBj=v>s)e4zrB{r=1^8XnJ{im^H)04`g59KBigoEy48$iI51XKfkwbj*4LqkL9
zcV4oPESeF9Vrgxyf#|XZlzt`w5?lf-jHVN0asT5on_^3;B`rexsol;!sR3D4iT+M~
z#d(R)C{P%8GV$4!$37|1t7H~)B*8WW1%eX&YPRRi@O5^LOdC*Jt*P=T<YYHqPU-G?
z?C0lKfIF6}Og;sWni8AWd86-qMUhCi%z%1p8;H;KL7XewqTa)jS^%ZSWwgEXDBp7r
z@y7cukA^G+)`oVfVTC?gVqyikdfT!)j&M2!bho)}&x(s#t%|U0RL{*zi_gCMunr-l
z8Lk!sg|M7{lNW_3C2bXyBqBG&R{4I9gZ_`@D)0skGR592af~wm<EOt?G>{M1qazoz
z2u)I0rJ5nrvs~gf^>NuOI+MfV%DxJukY2KolWIiS^Ob-Ob^u>Ih??c%OwFNtB@+k|
z;0ge(h3sUop^=f3r_hiim3KG|-w%*n^8ryr&x|g?BJ2B{ZvWjt)@E8s)u-Wpy}RZn
zCY^<y^=L6bRml@u7T!?t9G0jvr<B!(6b>}aVv7a+Ug`6@rE9p<Y|i63HpJ}D!kA_n
zCfBz{WR}Dab3{!QqVYTioPfB~n}h@_Ab5iWenQ+E0gzJzB-202<l)xj^RFiF+F70+
z?;^D}<0<{d+^b)V!ZJ?*CU1qb!Jd6eSZS933Y`A?tAbo)s=oH@?ZjU$vw9r}zBMtb
zk-!-w2p5x6w~UVL{hcaB0`r4kU9|w=u1;}kny9F(#Id-6X0D%$<FVS?Iq6)$oOq+S
z2BZ$^^6IU^p=de)uPVBF43He;<=F%znJPuTkmO~0DFQSv(SyW+7#WRZvc_%HCSZ#~
z=`x_u22U4kp7qDNNx?EcxCaoW%pg7ZeQzycb@Q2{&az2Lf0KQIf;8L8PmseJpOd`@
zDTO@qfR~j_CKOqKFq6e#5p`WP1%C~HUPdc$-}j@F`qpEOFL*ui0ynj;@%m9s_g_Xe
z68cbca4Z7ub}^X2pZEG|uG)@dc01mgpReJj`hMf2vlP#WSWO%j2MXjOWENur8MMtG
z`l)zK1HOO}24qiN{c3hp+e7`EhUUBMk7@rBz1lVc1FG+jD~$4&z^8x%m4JxLpr#kV
zxsM=ZBX4uM$6qliKcs&vhuBjO({cR(`Z2da+--^dJck(bZq>a!dP45ZfEcV`*Dp+X
z2o{$2KwU}QOf7Ico?U11TSt_vlzLVc=+^FZ@=8EJ((}7LX)X`zj+JAEW**!g^sSc9
z`T))qhbHH=B_rwkq1*N4ORoLpNU2hivLOlIanEV(itRLwY1yM;GOhc=<=mjLQl~Jk
z9D>IdvC3@w+HY}gMFufO=dWe2Y48dkuvF9l`E)wXz#cFegK?RZE6%q_yClf};JvTt
zpq<o^4^$%K@iI=Fn5{C`c-qQ35EraQ<`>BFc8a8bliS)?CPP`T=KyAD6a>XP=jiyu
zhWULH|1%ij1FdnRehoi-<_81S*&8=OAF^1jk<V^N-XRNi@mg~K->k12vc@taR(hTE
zFHv%w2FNfVVg<3`m>50)5|(XYpwx~0-qucGJh6s^zF9M~0-Y5!Bd6B>A7gJFSJk?G
z4-3+vC?XOP1}Z2b4bq56qwGzmfOJTQbXtfa-6*x`mM#^M?k=Sy1nK5Cm-n3ey`OuJ
zyzhVD(F1Gk=b16)7-JI5Mm^Owds=5O*or{!o(iI(TJMNXUAwgPxtquQ*PBmLj>%@~
z=<PFfD{OCcQmI*RQrX@VhyM(YkGDdq3@BXu$K$ab0hcS@SiBv<jD?wt{|u+<IciKP
zcP<*^Y5Gb9e~l>M2VQj5=>5*07Pp788uI9Ug7kNT7E`wQm2r31-eCeTOlgLFKzhR5
zVt%p(t+4+t=0qwz?z1kcGkXY|!?-%AR<I~Lz6ok*-^Gk?`uTd$M<TJr_nD2L>qa3E
z2cxlHz^_5*{%hU@>Zg*G$9wt1Iqq21C!n7-03+}y*lz}~CmIX2dZxFBPg!?AzloK2
z!q(4dzw~O=Cm}Z=s!ULKJV6(sjJXEJ+Z2c}b5V#PxH+&I7~jvoI{g3OW13dO-5B&Z
z!H0d+-7vs9Y5W8L!eTJx4#>)QfWovZ6cX<5Zk8k^U2vUE3|N4%ik{T3bSq{>iSX~-
z*r%80FH&R6oH?d6E62!)i;KRmh?NBYxDCwn-jF>=Oaf}gXUwz&WoOkHW9AzSX$-?4
z9igZ*BceBnCKCAZE5S2CEO0Qul4UY&mxuuKK*!>|!Mo+eC!D=Y$8m|*-yIu=mPppC
z1z6_()`{5un7S?4R`J&53&5JhSoO2p>#N!0N$w3-yCaOx3Az-*yi~jQW=Xt#+Yh={
zFYM>+ujtPZt%~kG``MPtkxhqna`s1Fibxv9)Kt-vi=PB^8INGVhyc%!tT=EU7g?_D
zZQFLifc)Xu?&zkNs_Ibpl20cdu50*B9lEn!OTlpaFOyyiE57j;IQ@@TLS*qY)TrgH
zlvzjAB3`Dam)jcv&6cC6MKMZa(fb8R)0}z#K=B?{j!~TRXL*5NAFa>?EEY7)Ipx@N
z=T?7Nl1c-fa43O~+jmA<iC3<N4Ix8<rYE}+NCq9B>J~>d7A<2p7ih7c{NkW^@WA-q
zkPJ61FnLqHMq+GIiM%oI`|^||%|<Zx1bA~*-o8)0O&g1UblJafj}f{t^4MA2ief-V
zZ8KdY+??V%Y#477zbZSyI-=aKRLhEvLS*yeX}kk@ECjPX#BNkY5)Da<um)@F$`ZTK
z_ZJ*uMRkB{k;!*0rGv)JgN5y!;K>e=K~|dY@}V$vXoSVura%yKa<Yuzu^MIFU9r{r
zSKZYMrqzn+iiu*?aa_H&&#_a4cL&-QfX2lU>xgDuTX!5Vo|J!n_J$aNYPACR9h~2V
z`M0<e+qZhTKcDBhGC1>P?*4p2fBrjUSHnf5l;2(YkarP>`v5qO$P8YNq95ff8`>yM
z19>+KHd-@ot=19W?7!7OOHS;4b)i<V8Yc;h)z9-AzLrv1@mW^QbKa>SAahUCrK%o|
zbNy)o6L8n-3@M9qE)P5r5yBY8bb6lNWtI_Y4ti`!BBJTZNnerI%tQb{d_2P@oocGP
z#`|PQC`h}nV@Rl)`=xyh^^=&iMgGrrK}s`sdx+4YHXsjVR83<D$B;7bB{RRFzCwM5
z03{)b%e${>#)nHuas8#$7|gGXh<q_N7_sJ^^WD&?nRTaiutxW}bSx&@(w3Wh-Zmlr
zunMl7`jnd1Uh6<z)nh=-h%_;O%osaPt?lw7SrH3Wf=)+?en;k@4pX5j>QJT<oZWR%
zXBrr9l7}^nRfqda(E-#UH`?ruc&}+1Pyx;NZciHjcWv|^<#@tr+%wbd37(%}O7+`_
zguvsvTK*+N2_7qNZ*9zIN^USl;ab1Ab-n%Efok8YfPinu)rmr`iKLMAH%D?nNHy7j
zGwMN{4EKO>k3!1>TBAfvEQa{=NpXLYyjmapfO(Wx-|u15Y4fhTJvcHa3FmfR&_j|8
zir0x>+Fc@`x??q8RUyrx^uZc}O0mP@AlWfA0czqFIwpqS9`nOdZm%8ScQR%aSx?T*
zSRVAfo~5X*38cV<naLPxBwMnLt`~?-N;Q1^Th0opEgkD0V%2NfUbU`5EoydBcrVv}
zagYmzD_5AZR}>U>KUox=R{{0rA_Dd3Z2+!=aBe$^PVN*}U?!k4u$YPWaPQA5VYyFp
zBob+_fTY~pskEn#NV%vaPw%srCE~@VQh{kZ?7r+n|FMqd$HHBTk3ie`u6Ro}^fLfg
zXDm~d7H`BZ7RXK$%&HUi$w-BK%OGJME&`Zb(OI?!7uk2HWY{#D!0cJ3{Y2~JF`&mV
z`jWnDn%jUu4kdHT6o}a7A~4tcA@jcN!Kri;>J@re?~$|G?`Da5=Bcr(N)x)vy7Aa`
zMK=-KfG7$<;}Pi?()A(r(+!J6)7SuPH{n75-skj)(2s`SF70<jFSwL|@ibZ6eBHZg
z@wT^h%fi+}1?%LC`MjL*RDWPg1U!3N&br+q7}=yVVT<dDj$Ju~g}Tzrfzy6-UKl!z
znHc(N2x%2*7SQBk6!VsWY(p}mHY9JqczKBFC~-}~1`+UJDrbVijzCaExCrkYrvy%V
zF3eookP!~xvqYjKCx<@rG>Fp@Jvl>388Cpko}w5~N8iydzgIS#1Bjoxo04;@kB4b#
z_ESLn0*-~_<HftorE8s#_PT&hUlZ+Xf*>mXr9E|f3s_k^Xv%K;J}{yp<1~j;PH=IX
zy(4dfzLHgtZSwnU{%|%QmawFdvW#8O>DViN9jGjbrfBLIP;%@8#FvL`>Xr`cc-LOk
z0X?l&@w;`3yU*#}ce>&S!F<c$IQ|LF{cKq2IK}#0G1i(gh<)VOu?c8Bs9r$)vp}pM
zLXEoyg0p>)nV@af)cWo3AqqlLYFH}svo4)WglJy$lqOoJ+j)KCeSuZjzXtpN*gATZ
zT?DZIXN*kHkx;Z^jSnT!qv0p3Ee<VQeZDm<aN)a%PHg}U0s#V{V7lc;U>{GWM-i9H
zJZL9%J?GN-4;&2V=+_>6Dgl;FfbI`q@*}#$6MBqR&oIOoOhh*0zOfscsoVaP@Cz!A
z&j=_#KUVFLDIJ3?qJG7F*)u$4_X&N&&8Gc9#__&;g+(2n7=<yIa%5?hbE8U7MWXvc
z4^$VC6$BCw^>I6>4Y&yUa*C7ZnS>O1K^hDoNdzgKKtF0AUqAH?S(0?_f#b57Tpwj$
zM8+lh-PO+^qcZ@7+V3IDSv=XQ-jbQwZ85J^yZV5R_OiNpU^9Q;o*v4S{qy@v7$xW)
zJ*L-4Q}B8dGuJ|xv39%#)gWu3qNX5{|NS0!W#*94_8djKbJudq?&R&IzA2AV<@uF?
ztYLkGss7rYW%Fu3HFi0XwZ+f5+R7E;w=?R@ZTzrAZo5~u<mC@ml`7@#mqov+>RLRl
zbdslT221s!n2IisKHUZCp1q=5@4}BE>`>=@w1EbN+UAhtr?;oEPWoKEiU4gxR_?3O
zWXsIV%tU(Be(tA9i3W|ebF?ePB+7tzJphVED@13pf5QGFGRGv>>#gAw&Y^C=PX)A$
ztn~*pB}O?FE6)&}e0iZFx<()~*`9(L-Oj>)b(q6u@*a};^?@+MxX=ZQ#Xv?K#Cq1!
z)l<gt+t5muAB(=2e_Y5{-a>Y(cm6k$`Vt4@7WS-QP>+N<GH!rW3rj{_nvms=S|>_i
zf|U3yS)rS22e5iKmS)I*;e)V;l$u!w(tv%q*@H!?wTNYl-p#za&qO+Nw+_K-XBaqi
z*@_b#86C=@ue_0lg1D~+j*~es$Fj!SIMBFSIwcxmV?OC&a$Gsri$T3$x1koh`>Z%M
zWrN1zcnOPw=c<}>m^q=>;Dws+RmCya1|tcv(c4bxUoFBLSi1(5;`DW6pAlQ1M-2zx
zU<iJS{X?j@ON*8K)oX6UY>)`3gqCL6eZ;tW{3uK>3zzC+7@0a<SiONqKu${%azwg4
z=7l-COf~`WauM2#0{9#n0KrE{@W9Bc#13V4gG8whta**P^JuruuciA2Sm|xThr`n?
zu|`%^>nZz-RvrZ&`|~<^f@yWSz*f_*WyURlC}jj4=(8JLnI;^!T^9zp4ZZ}EiJ*(v
zwD8rr`L_<ZZm6kVFB2%4kN3<zMJg0j?a!%DTLUVFk4Wjnd`2Fy;W(#nge}iVp<g1I
z5b+za%lfey6ZYx^=2`ljFHzaX)%3trQ;d*PZs>fsL{<6&W>+*h+WrCVE;LYUEn;YE
z8Abzi={`b-2cL;R+_4N@74y?afdx+yu)rqC_{gDI5KKv`fsMV}sNnt(v5=1x^M!VZ
z2Yo|ef33>`_Cxe0Nf3+CQQ5e>ORO|LCzB}ZcL#P`Q)5cqfY_UNmPNJ))Ctxn07b2H
z8m(~7+b;X%L%+v>vKfMtE~l4u;ynKo7PeW&>o*k0WQa%%DV7-$Uy*A`5}nBgRtzGt
zMap}*NcK<KAd%_M2HDSf%)2?4wK0358fJp|`fI5%r|V37@J|+lrh}ZxF5*l7A}SUI
zmev=wKpbuG^lN$gYNoA_Zp|_9JPSi+qz<ioGatQ^k8bDJRiL)m7u=-fJF2!25eY3j
za~7Fw##+}AGOC6}N7IP$(M{hgbdFc~S8eamAwfBiRWeGA@o*l$)ZrqV!S7{|D2jWB
zg8B(?W5hlcdmQeL<=tI_YBa_}*a&m4)b2-T{}VsIGx_`=`4kVWg${b@bbhC|dLO<P
zrSB6>pT~wocXF2Q^bPE+&({}aC}w*5!Z2%`wY;w=n=PyO-Iy~Ck7ePvZ{Paak?z_J
zegKajq3c^;6A01gqEpQTI)wCzyC-N4%0)vTQJmeJ3Bd3hoV=<H9uE$%^z~yaRkaF6
zI%e?*wS+6MetY9=C1n20brE5x#}T-rT9MgbHe+`(ONlGnkC@WG{RKA9Q#@RL&Nh})
z+JL(Jo=?;S1jwJxYAF0lv8;<O>>P(nRlludybQymqQ;Ob4Gx1jI+l&jT#))T2p*&}
zPXOhKI$9W#&TY7};=$5-aX?aRnErw1RjbAOK}j6jeZ*|@*MyMPAx0kIumRqxPC)Js
zOt!o*j7ti(cUc(NZx~=6eQ^5qt$z>k90}svI7hP=Tbt6Jd9tc)YkzyMjJr3-eLuVX
z@!>bh>Re>voVa4#jbVRP3YwXeRXf;EFxXNuY<@$d@CEu+X7hgT5e!?hv{(ccopFBG
za|9}iSR-s9I2A%fD8&3Vg=Y67Xm~|$6|QL`rRvcTlp|B;d-(^sKl7<}zUL>|5y{7>
z`>w_A(AdEvkG=2o`nzZbR1-62TFqNA9}NGGdZ@1#kU1hC?L0WX080NXsOuN^`L#P_
z$oLcX*kIHBR3cB(Qy=Lo5(56;a(@J;$%8b-v>()Gn1Dp$VV=f50g_6G*6Z7j!yg`R
zR4%!-0Z@3;3^KO4OHzZ5`J?ltj7oyjeVJ<dh$H|hx(M+AAIf@jacz7DG}iiv@``}f
zRMPbLUvtWTehVU=!DjzhIQ<>X(h?vlK^;p~$37T?vAQPv?pQ$GrF4IUxdr(Rc0TsM
zf|rn+hOY?v&5AW#flCym_n=y@wQEHgBE;oD3)!BEC~gZ=3|nMutObx^2a>-If?`o$
z(tYV3P2m{BJOmTf&ng@HWasQoeJ+x!$<Zm|+fnUs6V!(EVFYV_;6A0wMkY1tDLSdo
zGs~tC`4ORZk#(E99k1LCpv(VoZ8l|_T0oPgnqDV|`_=b&a)EIbbi<`CNUa0ViI{sp
z@ww2<(MD3f;(+RLA7DKq&~%>wHEhv$fez^-dd@G_SSL->o{a#NCleUKi~?Iw{e=zM
z__eI8u4bjBeSx(9`1X3Yl76B%^S#io;Wl1(7?WWX=qqhXG*|(e6g@XS7M$c`Z!s7X
zMb)nX-~`<QtDbpj1e~l1NL>h|SKa7+@wA>l)*@4cL-YApUvb@UHcz@z>L5asL;ODV
z17bi{K_?lNV6D6M_`T;^+WmLthx?l)2o~1cp?}q#J}<Ip*<YA`?=OEF#y$6VL05-R
zx~I(VL7MhiXnQh*EU;>=Q$}CZ_%K#EnN;`tKcAJ~;8SoOLY>&?Zf85<-5`V=>TSS+
z4G~-`6R4lXk6NfTs@>hv13H1A0bnv=XgTVX6+rWh5z66WT*((u->`pqy@z4v5W>Rs
zqtwm?_AYDjm7JIqQy(JSyY=$m=~DovPeWMvv}DYwT)?I%jw{abS|z_YarZps@|^Fl
zzCGw=>6p{1cIGlRnsg4>Q`+<N0e~tivKT4jLjCC02hA~W^B7dc3((4!Tnys9AW-}y
zd8;8yAty_JKf4sJS(ZY)5TmtPPebCE9+CB&<A|D3tRd8KW&{O&Tzwb^gWW&Bo^CEU
zIrfV$Yy|%NcNi4)VXi8J6)hFQH1Os1MR9aF=yd|f<V;8rK_tQObr={xsJ6d787%JL
zPe8NqXy+AUktcZWt~Uoj^EL#n1_H%yKu7Q22*Y54p0+c_U%}(&rSQ(|JGLCPf=9o@
z{4rzTDHQ?Ro<}0NHUfuduG~|&_glR$y~kc&OT?{uM0{NiWQT{c0AU9Sx}OP)1LlJH
zD20lq-n+X&`EDB{4Fd1yu|{U~`HIE-$AVvK0*CLpqQx&jri=fw>cM19?Tny-T7*yM
zlpwgbT#rEim_g-eq1%6+<}s{7K6^CEmnd=6dwLE`+$3=)gb)3KqcwN$VBf;w{(W`H
z9%u{6xRHS;vSI#r0a%g#QZ%aY#D~*oSJ;%gjVJ2-xM51E=mmNt3B8*{x6(Tk>ZFL6
zB{E14Ca(w+dbI)lpzRFXT5ZXB`nN0FFHV6K&%wE;LI-QSO4jNVBM5kbAXGKoi2VMP
zLZX%+9z{Ov=0Zm}A~qHf;t>KD<9No?r^V;bwvKzO?Mj?QjE}HZkUcd*`)f)__ADw?
zug;iEnZq31wgj4v1Jr2&`>wl~<Xa0zHKgofP!HXW!J|Hk#ceMoGC}Ic%Q+0iU5a&-
zim$YN4Bg%=SQ9{s61ctt+}lAAsERKGgP5gfZrxJ*$%lK1$#6RSq<wgXt;L(gMX66-
zzb5d`I?*4{tD*ip{YBt^5>u2VRjCKH>%Iu4A$Wf|q2Z;!afCH!6H~_Yk?Ls?S*vMr
z<>t*c<erf^AO=3jII+2F4Y8&`W?hh|h`aXkv}x!<=-Q(Nobz9vyH#f=(DCf~El=i(
ziMGps(IR{WktV=l&?MDwX!J9)Id=449&LZ8pZ~z`j(L#)&K)6o#V6$`Ip@f!K>vTG
zZ!HJ4>vv`+g6>Gpuexk3P%%51P@&tq+;At87)$Peki>+JX(hNb?1l#7_n-LfJJ1U$
z2>2a;nuA=D04o`>tZ4sT8&%l0@-@gqq$FcNNpRAi_KSZ)2i{@#bZY3|sn^q|mSwRG
z&F55GLRpvqHWOx11{e~I;o24oU1!`cUwvCLh?XjhkT`trU4sb|KH<J&_2K9e;<t8p
zb}=VAPdMBTWNqq2rWAwLV29j)Ib8E0&>sZiQGHK!|F%f^2k76x6WR(AUP8{lZNdJj
z9h*z>RB?W=3~lLSht(FIAy2I1Vxa;j9WU|Q#HZ@M#7w0>7zK)jIcR><`Vvo`yzI;%
z)zgHC7IweWAD(kJ7yuYZ1mg^?X90+7J_k;DH0L#_9_}50xz9Vc5pkbL+I!E=ALAiQ
z^TYo2O5=PTl*x+-%!b?{P`V2HzI#9+hMQcyw<2RUT2Tu0b;)8-kFqI%#O&Q&KT~%-
zu}0zBKE9;Vb-qH$(+zZV-AnO^2o(`Rc09}H>Jb~joK9jc)CT_x2awHZz|G<idZDJI
zz3^uvBCj$gKz_1g?*|>lTw<4o5h2h`i=W@D>i=1}Im(W{ur`NA>;nNQRWEl~6q~IV
zx1+MpMR!MR9eaa)*Gk@_>u33)5W=;o(*`RCN(|}Oa!`yE>(+X+xq;8GgPxS`ba?<h
zowvZ~$JmK?BVw01;y;5R38O6X>Ne@Yt_&I<8Koc`1}*3T@?z(IWiBUp`ywm_P!ak%
z_i5U`jD=g#TkUb!pMP+hn>!KD%1HxG>LbL@ck{V-GqfC;waRV<W~CGq6a%LuX-~yH
zKl7n?NrjZ?{*eYwBZ$u%PaBJ*-@l1I|9iBkE{!LiMvs8Ck^33UgWp)IlePuheOtG<
zn+SQ;zr6u5&9M^mwY)-)iw`UH&XUA|Rf<ST!s|LdOl~s9n~s)N(8Vt87`NT5A~@Bc
zReOB`?UM!**o7zE>YS(I2d|93k~n#KjsOO;i@-t4kG3pp1U4Y`3F+!x5bs@e+AUsG
zuE^w-RgqBH7ebtlHpwk+Hm6N{>}~cSw+$?1Bb<*_L`A>0c072JG!}^{cbjCPzds?c
zTw|@_ukL^3#fU>DHjeUqN0Dm3h<L#oZw+A7ft#d}!)Gd^exMZSPn<sKaLKgzZ;{jQ
zj=f|Ae7?bvOFn==Fz{jskQD|1(lmjs$pM0^%^Y4*jOWly03n^|X%^sh5|t{dg|+V^
z2pBFVsjfQI$smKx?&a-4_JsiJ<beczG@?>Oc#rN7a)%(W(hjC4z#(y|nBVlO^QS&@
zsr$QD^-0bxeL-qj5)RA{`ol^ty*eBiEv`PS{+?m7DdqUR?V@@DG&NvkBne4kvu?%X
zpecTF>wZIkwC|p~tn?R>KUZ<4MF?o&wqq=CRH@7a42Nvhyt=y}r=oY?N<_rvzh_hy
zL|vDt1@>-PkBda}*`^?#8_3-a7>~hMKAojPllsFcNiPY}K_OxgqDf=L;90nY1U-26
z9+0%D!D~|MjCUmX4OkJFnyT*=bH0R6lU+&Vl?o}{fzl^sTtW)kICev6&=o@ke2BT1
zHbr?;n>K|7g~)U?!dbQI_M@B@TyceQX({NQfH{38bVvxjq&+2SFBRZ85DOZ0*#;lB
z3P9Pk2s0KU3J@wA{AbSjuRP>c#)81faT-A+|Mg$~^ILXB2r5LR;Iww7Fc%pX5quY|
zz0<PcjQDLr`W@K%^?mV;3@hPt_sZ{PLs_+!Pn9#cx++db1_U4t&u@D1oJuuOL&A7F
zETRzqkPGoLkE}UVMcV|ipSz~{W4`x}Q(CV`mm&_kCWFvDu-1S*O$9It9D=HDyM1SP
zSW^Rt{YB;joe1MD;~p3(pB#j8GYbx;Ug_MPR)X6P$95pciK!}7cbysTTFRQE-76K_
z1(AOx(5zYk4x%yh#`Fh)nFN5>)#IsDI^laN58}CsNqGLsG~<T_j`Yjup3TDs;l>vE
zdjxv^6bvDZCp14j5Ya5+bx&qh6lDoizG44d^;6}XNX9;&I)2hY(crV5GIh!I8O+s-
z2EoVlmT<7uc(&u)Hm6-H2_rA@3=dZXy&87?$v3ttIJUGJ<7)iUO6Z>o#oEiDz5kGX
zrQpv9_AxJc23>JqYMk!zXx6NBR5E%C=B#ptRmjM3+DT*o>yz0#H`jf9APIy4E{o2t
zSdr!+CRKysX|$<+M@PpSpm-F6e_D?XSjjZacD$=BSp1S3y!k$p!P8R*XHJ-A<L3wq
z!Y2~|7<r}j_ELmxN^0tJAr6q4T?Q`gv|3_YH@H;DFv&$-x_|$EN-XK-wqZh1?4a!v
z0I_W#A4bpRt25p&aa>FCi2L~QV<2AMViFVbNxwLED@i_7dBm!|ulUB&KfQy${)|i$
z`ZAw+7j~LI-)OSgOJMo10t-)@5Km2PHtOrc5E%+M+KH6Zz06>AyaJ5eub_98sOK)5
zt!m9zJ$`;EPSAA{*ooXdIP11HHu-n%+=-aeQWuq(!8Cz{MWYn-L~_>ct?1nj``rP~
zNn9)(Z?OdTU`3W41R)KB3k=}vBsqtq8(lWgs0Db;jeo*jV@IoVHK#tWjwj!6MuZ=Y
zz)g^-f9Y`j(J^<Ij+r=W69Tr&mnAe?U9~ORcRqX%BG2MQjHG^yRaZOW9276d1yUUG
zsIdPF+ZXFG)j6CaqL-Zn77cF)TQi6}44|3^S@Bu&6f<y66c{dSYixWCk`i$+QhOm!
zej$^dU<X>psp28a5QK9gtKq`~Wk?7x0VAZJm)*}G)drIsCUX-XZ(rT0a+&^DBFhBb
z9+q$4zKt;Y46;dM<`C0a)r_AMl$6h{W>q)aDhyKIlSth<N8R0<8|xNS7!VvJx7$@U
z(;RsbG&{jikT(GxW$@iD(=IsZlmlX^;;=MoA@+7~3pB04F#S_NcFsxNyT{g`A$;D*
zwY9RbHjn&21JQrggV;z{A)<+gcT`uQb-xCWpR+mN>DR+ZDBRyCCrg2@_HAe=m&|EO
z$}7+*h5`2TySc~64k$h>z^8wYSM{AmUFDL3@Ooi05Hwyqg1$aquO3h7<t^wE%n{IV
zYP0&VGE&39;Qhc|>tzNl0r}@5#|XBBc<gy0L4|^4ofaY>yvqYL=Jd2QHm|w<e$|fP
zB32Okyahl@De2w27NJGS_{zmRV;$<RUE{0JuE<S^3YI9#n72u^CC+pjf`4C<2VVbN
zX4&F&v=z7B3e=a8MA>C>@!@5KeVTGc6-RXrsnA~Zr?XP}97UtiCC}9(BlWM?TWPWZ
z_NVmSyZ*+Wt$4ywQMNF6dS6kYSxDW-Gxp>ng3Ix-w%1*#TJ5%;96LO4<l9{+Xz8}A
zQWunI$PA?*CMIriAl-|BDeNebIu3qx8F_zzNZ;vpqh|;GMk5fJCjkXv>ybrY;Na*&
zO?FAAKsm}jQKfUR5}rgsxXza@<0`0BNPoToIE9nYxP^3gqm(E*V&0$EsjI7#wN@Nk
zU0s!HQ+Iw01XLSnTc7%0S?tudE!h9{XCvTa*s&@JZU@qzT5o&Y{kcude7ucOv7tvj
z{qyuh`G{j>(SBEzKJJ>jebIbR&-759Bg#59>&B+EMi42h#3OQJ?BQrH2Z?harQ8zt
zG>R2Ql{>_H*(u<5s+MhNJ+?M#bF;SIFW(s$T0Jn6(Xrqw&d{kp5mSwazi0!Kf-gwT
z&-}>H&@i&4YS-fSZuV~Bj&h0RNOKBw1Yh8W$_7i+Uv$?{cedKbQ-gYu8G#2UY6Ala
zs9=Df{vpj)6@UT4lL+H5<@9f^f1Qs@1t}5N)I`a)gIz<`+T!el{lMyDE$q3@`2rDf
z*NyFjiBecOjRp?T?b2~?Vp&5WQYN$8q^f3$YAh6Uwktrhxz#2wsJ&Uzx7w+E+pbh|
z(G==#L$Rm8;s^muCVF`sWVf<pyReKi95EKBp(~_wuw3LP;}=ihYO75d<SxqL`nuTj
zYKf0#z94V0s$oZeUpKao-Zrr<dvlD&?z35|V>X9&Q4Jl(CQ4U_{w}2|_Q77&R>9Ko
z`y_?GXur_%rYvF)<6H2&$H&3GpO8GZ7*<UDk&iv4hQhdQ7bCc9`czdiKIgLj+${GE
zE@P8&yw3`_b$E*XzDE@L1a^g<{z9C~iA~@^!vN)G)(cv`P8@8m@rNv1J@nxtJWk8H
zP_n!n$YKmzTeEvyKGHcV8n!cIHCJ%HAn3l2fckxF@Nk$WBfWR_%$dNT+dMpd=H-AA
zO+91D4hFa`y3I7HVeTX`gyHtLo=Y5sNl9Yx*$8g8Sh?%RJy$=a$Pz!taf_R~7iYPU
zeFDrxE`gsh=g3^ual(-wwyi<|Rv#wtN?|Z1%cdT0WuXO{${PS5u<6|!>Vrw@4Rxve
zEay#g6)DgAoX2mIVfl3Xh={KWSwY#`@rcABGR{EUf9wUGTH%}C^Nz!e&<X~_gx~cz
zGbw3@ze*u?AKc7487L?SRM>TEJblhySR=g&T&R+y+9&`3MEpsp9)3otsa^Z^>sQKP
zQY%934<nZs5Us1PtJFJ3lV)z*YL1AN=7^00<>TLR^JY<~bA1pnYNhS6gTOgWmEM*J
zbl)h8l3|<Y>Eo$hVp<Ef{ZEW*pOgLsg_jJX(E}B-)un6Kq`>WN)cc)>`NR0{JK43S
zr1*okOfv%LomJ)ew$Dh($gKKf>@&-jGdW3)41E`&c%bpp<2d5YF<7(Vn3EJK|Jw_|
zDY>Fz7{v&t$X>>?hM=9eL3GM=N;GRWRWuB2yCWH%TSc^u+2)7la<=C?E@?Z%{ALn3
z=3J>g7$2CaCy7eZyoiL^3$p&O6S2ek+&VV){k;bc8G$y|*i3Ni3Y4=UP<d*NI(;YY
zz_{PKb?d={2N$TRn*r-=qj%E|q8A=bD4dQoiB}tZC6uA`;DG@U*HYqpD`q3!goMb|
zl;!5O)AECSB@(8QvJq^xIQ14DF7l+*|2mNW+xY%fO|{2B?=$V&f0Rs%z%JL5^!>s>
zK?CY@Cs~~T5@*803=|jVrSh8)uW{B=<YSo;+j2XQ{`8=WsOPFnEgXgi<&S$qpBjR6
zcBtmg(%G#G7cR(tnBMySiihItD@f>FH@qUI?FQgSXHhJ>WrN~I0kOXQ3aGCv4;2+v
z3Uwmh0cU?^6L7a~fKDpR*B3{L5M9DW*;&w52|%@s{Ov`~r2_R=7L9KrBCZ01{taa8
zbPR?)z<72CO0PE%N+V`UEHmk!nM;io9#K4F;h-4K{3UAsuVUiwZ@p?xx6iq$W5FIK
zc{=wkJwBKx$T=xy5Ss?R&l7n*k~$$sO3SMGK{31fz@=mS#YVa)rN<5KJMXX}kQJXX
zI`ux(kD8mBIJ{y&p%Jk>4on{tX0L63eETOaTbgwAQ*_`!SYqvJcFZW**%cb6smDuF
zpKgZo3@U{5%uLQD>Z^#&tQ>(gxR*>jzi)d#9T)9#LaXZVz;!iyzsLY78E5%m(q@AB
zJXZjP)6!dLRYmDs7j7xpxBFMylklH)%?44~QMI#34UwW(yY%u=nUeq~!qcBXi#6PQ
z_``i*)ZS48_b3t??q*a=C)-mzJR0?dDsZLy0und5KtvrJzP!BbkaK5NgTf5jH=8~!
z$3|~lVgsmSn3j_!KD~c`iM*E&R*uN}<shL{Z+_3bCN<GH7cqn}zKJzv6e{Fe_;4J&
zS53-F+N4R>OmY=LPB3-T26(HHGbwIoqt6T7<Sx`wS7!$2xz`{*QsF%J!F}H)UOA50
ze~=q&^YB2#9ybrdvXmC6s0=}L#SUdQ6}Y}^^3qUu&+s9k`_DJ!EJRd`j_;~Rh18lh
zZ0-*aU_uX>n4dHO20Wi});QmGwm%g21v>N_U_3^RkCO5X>qeQfB?~gEZEvh1T?$Op
zEbD?UN(OP(N@PVC*Ymy-SP2A4u6SWmm{o9UVqO9AB9_BFmuy*tg>?{9A?IJ8C=CIG
zdvO20UYvq@mNh_6HlV9%yiqcI0aW|9Cd}Njckp)1bvCw#!T4M0R}m}-Y+WWNCr<|9
zZoccLWruWTSq$)1e)oG|pTy!4!@4n`dMNPd%FQF*gl7#F(DwvHcuyRmM8(44m#*<A
z00j-B`ZXEKEEF1r>P{j{#M>!!nIKmXU<6B&bUtk#<|@&11$h)Vxq06$As+g&vHU%>
zS&6lviG)oHr*Dq}XZvmta6}5mT9YYKlaR#}?b+DeX{n-f`T6Xiz)&%O?Gn?p#YBm2
zmUA-@kQ+fz^JrtpDBeAH9zkkkqd27&@=_94lX?igfBRM;YB~bbXfRyvwRS|I-kM<c
zXFKU?ExS$~`Ou!PMAF*$|Gk&wpGys_tK&AMvWkX~-I78N?9`w@Tbu7|LuHzpf1!TU
zAps#^7O?}UfGOmoXn*`g_ku*fn=UU%TNe8B#F4;3PDcyX-KEQyrA$oH(|eOAYH2Jh
zL=X0tJffEqNEc=`RUsaE`CLnA6DFPiQ6MY+gi_ln5%|4#5Y}N-ZoJUV_0q_wC{rPL
z^of<ZjGQROq3>%xq<S}DoWD>YDw1_NqXFqpY2#yJu7h&>gYl<&u<{lU5?Hxst8J0f
zc6TvkIe`)BZ~qQ`|MS%zg9xsea6;!%HcSldqu5;E_LLS0qn?1bG&>|GB|jKTs!B^s
zM+s^{gJhC}6;=)GCmR@xI3M@r#_7_$!fl<l2;H{<3@TQD5g3R^!^M`?gKukVE5~D1
z@ykEv@n@<>BX}pG=i~R`jEYDS_gfd>ZNc>WGBAnK_Fz=Z(<YM@p^iph223L##<7vW
z*3@)eEb4>>F?l^GQ2n<QC}x~7Mb`o^>K?e;MSg~o)&SO9O<fV@QwA_&DmF@pe4THw
z(<o<CMEQ?z0r@13lQD=m9W$o&{^tYnuWLk0f;Dz*3;@fEpp0$1eDR_<?3Q_-pPxU#
z2)h>|$)5XbjCvfpMS{*Wy{6|46chx@;4Bsf?t9UzCdt_g3+7a}9{L(nWW(MTQ99?z
zQ%b)SX}0K$PK+a;5`hR74MBGz;@DyX4&G7s=Qxy)cOlUPO^7UnQG?2b@SN%KEWGHj
zFeYd@QYx!}_bJH<#uvmzb&0IpY5i|zviLlYa6tq=saP0g7L#8Z`E!hf;CY^LoaO?e
zG@JscgNx#r3Yg>8xwO1wymjmTLw$X@*(o3^hQn09cpy05il9A?1BuK)?qzlW7YC)n
ze8eMTD#|STH5iDL@J93xJ0TSUfgP081@gx`fNFfkO@0vWg7m!Y+PhamZ-D)YGEd+a
z5YR+S>3=7YTn!fLxg<B~z<b7lGq#c~eyd0R&dQ$05<|!TY?1-57yu>e3*F4hWe7tJ
z%DC`|XCCT=Ab19#$Q(Ezocl0@H0Vyd|4qZKspKS08npJoK-W-3?zEJGLOAelp5x&o
zJeDZo!@X5@Q1^0Vf8JSH47Z1C#z2N^o-9Io%yO(se7db#4y=#vlM`tcnTC?k38=1V
zg@bD$$3U5VwE1X-8tlcq4&B(Qyi|NFie}9w_o%anf8X=igy_ea?jr-b7txkK0oSli
z4_YNs+LuK+lP!@#BR$vsklMJzjoLeJq8j3{l$_ki%{#_Eo^WQ_!I=*^R{cbp)EAmt
zTDV3$U~Itdu%KFCc|2gft;q<UDuIKre?|w54ka`N?Y0K86eBKvht|GSlj+|6WQf97
z$dAq4Yv&;OI-dP=ut8oAj@WTMvKL29IpD|HV^hm_<i@e8Xg>BE7CLn3SRMx)xDqSe
z-=(ltob)8H0=qf+etjfQ2G$DBL-TlUfp?)rDLT9(U^Tu3y-ze*qCdU@G!)maU+0_<
zT~zTXG^PCA&<)^nGNiTD!#b!^2;EblSWPt_ENn#4ya)<%U_NQdg(kEgLr&rqPdTUD
z0v)%{f3B!StO=KChR4g|n(_W8u>N1HDGT=WU*{Z8(hHr>u5QI41e@31Z)AEvbO59(
zl589(Y#@y@zl9}|^&xqJij)c&ORY?gjdJ#o7A+xo5ZMH<7g&jP)URH<c8!VmojwC+
zm!G9j$}<s4vUa0PQc1IR7bql|6w_)=NOfl>Cj*uB_eYl8uYmbXI7(SL$|#NWp(ECX
zl)ximTdWAf$8A4Jxhv<ch#%qO01s+>N2H#a+HRoIwFLHP$(+5RehJL@-T+fd%<bhq
z|GncLWzbJ3ft&U<=!@SX5cQikZ<=S~_suKFnTO4>+0`GnZ#YB$*#vSlme;Re+hZ)b
z*af%|4MD8BNPNi7yEZjaWgXZBweqWhKH4->Jrtc$U|O>S)Z!2X_9zrfbYpd#d&=Q-
z#AzcS!eS=F`($Wv`iLvj9*S#zxeioojS$M1LaxL=s`F8&k`cf85{=jGMvYzAlaElG
zkd+>M%JtsVbluDvfRLwjCg7b0Il{Hb+m6|ryjiF($lb*$@DvhX=bLvZH-!C5E3mnw
z5$S=rdZC1lSWc)KgKCx?x@Pj};<hPW2R+N9elb3rG?9M3Z1Q(Uei~5}?bgrncEEe`
zI#Mo!tWx%YlG0^i;p$px-@LrMH&7cmJ3FsHx7GxUG~ns#15WbHP_r8ZE)17;p}Jse
z&ASRD;XrDSc0=`<ZrHR#tM9E?BV;5aBV%~5x6Q<93~xVBk>xZp&(7Da#eVwg6{Ta*
zs^*Ey#^-%Yu$BJIn@Q**AY)kI41ebJXRauG>@AS}5%5^HM?_G}#}m8;Mx}k#o!I~|
zIDPu``-B7$ZSW3=1i=wu6@vG~Kw%}p$)KdH{0L(LLvU9cSf3u@CWq$YBy~dCLvPg@
zytE7qW)cht!(mV>#pzV}@Dovo(JX?<!L!tv8mbNn1xiIwAJHt}<U&_{tcsW9&wiG0
zA$ZBKXf7Zfe&X3heJ}}p0LIv5pq!{CEHp+VyG^tXW;_m3<)><a<1b}sm~1{$hUR2g
zg|poR^yfQ1K4reXz7dYvNF9>RtSj!dqxl3}C=Gym{*Z-ikZc0t>*Ps~EgzV)kX=~7
z@DQ#3nRUW&4AMJZjf5`25vR*j#1(ntzhPfG=l6FcC1s$3{`l#WvyU%~V}oK~IbJ^O
zHh@&YCEmWQ>+D<#8EfFl0Wi1>pu}a`OR5#E^I3FDo;?X2LWZYX>)aOCoh@LP_R?G^
zq#(>Gou)2@#`W@r3*KaUMwRU^{$AYsf06O;ue{`0$p#x6+Ln)?3d2WAO-4XU%B2^I
zz^b4?y|BBn7y@<}&QOb!bT5wsiDT-0h&;O>2^ISt7;w##o^*%#moGj|t|2*m#tGOP
zd>Qj9TK1uYr&x8WG@)uU01Svpb_=#+egSA=k@TeLZ17RlGTH1s2q_Nlxo7@-;NchL
zS4>E``#vRQ&{q?w29ZS7G7x@U?E=U+!(f=%2vpLGNJH~JHMI%IM<1tbq#i%c10gx3
zP4g{S;FEhihcZ>{m{;qyagC?ewcfZk&>cmQ={YzQ!{L7btO_P%;+n3Q#*z7$t`%jw
z7}FPZ|IZSvb}BF)boiX{IpROxFvADjn8O+sF>lvr&8?E2^NT*U%>TX%p29d!e3(Jl
z6b5IukuiYwAv3AzmnrDmZ;6J(sFsS;I`~XB>szSR?=i_nj2|xR8f}l&#~Q{QeDIou
znU4A;s2?i;1fATO&*7mUD7uhHdI~{R0L%~|XXutEJXIVRcK3)g+K#MvvA~(M{&$S`
zVxSloCL!r0ZYms<^IW=DexI&8=tB^GsPI(<x_g@_hL@MG-gLMUd1h1eN~xkKf3ryG
zA+{l{s7vJSu0qZ`Y0pVBjN7LWG)2R*^b?JB<CibNF)_5;F!f^v-%TN2tnh5RHg2xI
zlnwh7npb%j+CSl#2j*fh(w0@*k4hoTR8G_u7IHR%IVySk2~yI<hhnk_p=b6R_MTNm
zO*PhsyIvkI`G*KfQ~8G|^ega{YU0NzJvQ7J9(i%c9gjTTP^jg(o3QA=<|)EJRJaD%
zw1XF~<mWRVuos<mii~t_oSL6qEi#ZjKa!G+cf+EuW{Z%F+p~`8->={w3Jr#S9C$Wi
zYE@^bn~@%RRJRFax(L9z0t3J%up0KTuJftIqkFO1;hN?%ZCIbZVYhKm6z?`xWU;?d
zwW}tXa1qx$&>Flu5#%9q#^TYV6o@%@LDz0L)2fvZi}1)t9m+?(*_86zIK>eE!*2oS
z{`Y+@OMsBc>eLa*{_nH&zg35wAQp}3HteLDguFzl@tBQ;MFxi4Q?P08HA_xKXN|Gy
za}njfa!G9a&o_3PP#V3=iZfq6c+1oXS;5vtR-<^^;wM|R0qh1}$dCdZDaw^E?!o^o
z8H_X@4&j9#J95G<0)w-2_f&lHj%+8~$#Stm;jEL>c3bP3n`eUUhz=|~ngllCTWGZF
zQCA8r_Ss0v7ACPR9Yawdu%Th?S;i<`=74dm@qp_1MpksPL7Pyjx<;B3qf*Q*C$@}O
zBFm1E)9)49=vwiH%0k3B_7cc)+d6^15H(||rWUz2*CTV9oLnOQ69NYa05mC&uDhzV
z9@_4psOiA;=Q*f|2$3)DWZJniN4$1uv&#wk$z-IYo@&DEH>C|mw$Zr>P$~odO3pxH
zFQ!p!Q63W^?|nC+tn72Cj@V?h!f2QVy^}N^>Fg2?VaA}dJC{5!o2G;L(4_`hUZw1+
zhh@IJUNuosWaMY}=98`%Oard#)EZ6iu54Lt>K{UHH+Z|TZqQuM$6_E*M3Qipqh}FE
z6Q7j&5|{z`A=>-Xr%o|Kg~AR7i^u_PF3!j<`%3ckYtDIlL*C#1rvH0>kdI9ZQTO(h
zPd6WBoLv^^iT8l>V^R||n9TG~mc0xfJ^Bjq(*V?2ql-ZL<PfC{Z!#?Y<t?IxrC?Y+
z@@Z&l1orJXhSLkJ)44ReSNi)oGoL=u_B9xdYxc2`<7>^^#5d(Oe!c+%yJ55A?$+kK
zY1limJ-QnpjQbrgb@skdz6lMz3=$BoB?J{Q1aE2tpp2`<UzdJt^XIGVtpQJDt)uhk
z&+cCE*s3+kAb|M_Oa5eaFW<hc0p*^Y=W;=t5P8<!G%U(GAFZvsCKKISdZ$vRAZ}lP
z5v*PB(9PV`P1BOCpZO2BA3S{;WNvq7P(Gs!eLJ;xeMe^ZWtw~2le^<JIASrFh%#ir
zyMiP|*k*PS%EfSGT(}4V-e5SUUxA>Tj%{}5ca`;b2LG>k;I#oBWc{N_Yezi@0gk7q
zKX%cMuBBzRY@C1^(pB~r?S%RhAm&9>und?`Z-Chki_P4h><czm&m%iX__o*z5{p8e
zwc-L;5|xgd8m9H$WjPp3=R)z~6Cd9=^{2b%TkvpBM0w&7EUs>Wl~*|E7rp>X>naG|
zZ|O5%zy1~+>ze?RVLf%~)O4h|cmTddd(2Ts$Xgmd6-6z1rhjiZ{->bf#9Ux<RnbQq
z>>;@j$_#Wo59@rO_bCD(l!6)OgsO-cW?;v|!A<ci+0$nPR=MoD1y^jay>C7KmH*kK
zUy-X>F?^;kig2V{1}60BZs%y?b<0R?OQRO!@CaySvE1m)0u|%y!QeNQkj&ItQP_;D
z4n$6aIAy?gmG@lM)xO&L@}F-C<XDklKze^CPHauj>I3eYn`HHW0)6>QJe3W)h?Ef&
zw*t7q>>w*e08m&VC)3&4ISEY|M-QO|I<r+!<E}?8?phz+uMSqV^0Hhl|9p#?pZhxl
zO8Fz^yK@;<8$%^o25s&`{hlHTgvNpGiw;d-|2SEHQur-=1f#xX2&@b$i4b7beF27g
z^J<ilZGx8I=Rdz|ks0J{mFCdDTgt@VQTdhsPoKuW{%jl{i!{v`w**F$UxAxvP{#}$
zWu}BAtU6@i&{^(iMQ&h{))`Ije<xh@I@xJzraV3LgZ#D|eWP|6By&UJ%*+`vo~HL=
zrG2MWF3P8&>$A#?YkF|BV(r_`J`Q@^SXJqI>GHl}*XP0vt=&dn4uc69$$PS>_bAt0
zg3y)xN_IB;kM4_=G^(Nuo=A?~+y}F?DWoGo)-R#DhszyvsHQARMwmcGS^-74YZZO#
zrtgs@s4?P$S4?Dc6vvT)i~*ZkwnI@@Lc$NwJHgTWCOx90XFvkzvl0@&_Yp@)Oe=A8
zKa;^a0Xuuy_(zX^$-=-@o7xwV?CeEjUJgAqj~V6L+sWAk7QW=!^uH$M{AFqLFi=P@
zBWljnimhYl{pd6QbL*+UlJ8<NEGqIQlv_4CmLHohMq#^D8{3PzRZqT=F#wA{q<xox
zEjtE)qo+Jv03S3)@aerQ($8ge>d~K1E0EN-T5@$%fBb7r<bOq%zrUSz!qOO71nJ}(
zP=v^{7qBPi=Xd(zgAnc}rOuN)s<){t8cMb4LG-tc7Gkiu<YjY;84^BZV45!tQ;*tm
z7f+=I-R+{P;+I?Z3A*wzeJ!PDG-{`VEPTJUd+B3=;QPk!MN26=X=7L7Pbp$mS`|Jp
z7ZdX)w4dkB;{5=Yd{VNqZ(&i16aYCUse0l^;$8_^;1_3}!O-yM8XYnk7DIw4IcZ9!
zMu|Ka1YH1N<bkRpg8Agb_5-EYipN<j9gCEbgRAw~kFlyPlO}S9V63P!yCjbLm+=-I
zG`s5G9BeKA)j}M_mSAh#F^A4~9+D>{Cgw;K9;)^~`#ogm-e9nod>^&?8tR6oQt*{e
z$%dz=QInbUr@LQ&hz%i;lMCrj3*_Jbu~k^Pp@Y89<m|ltt^0Xbi~ZSxF~S+9b@{M^
zeHZ6f>0N;*2{<n#gg#ssy8SKi;w0q0H(<bf4~blK<+d~O+rY%X3LA5(ol}N(^Im87
z|9M9@#4Ju0;Hauyp#Jk!hPUH&W1NPq<Eu{@32mAe^J}QvOF?fn2}LBgS7>|te!XG}
z<4uA>HQhtkCV%Yc`N5KrgUY~)^+6?@?V?TY{+6Ym`ym2OBeE?g`8Pk1ZxR!R#?lZ^
z<$jkp&8-~STFY4a@~N6%?PTZ2cO&LiSE$MM=5(x@`a@EkN_YzMpY*u=SXx-#Kf&D{
zWI@nPnY-Bxb@feT*POHRCb%x(5JGt&$_F+-lR*9ZK8iWnfIz2zm&O16m2uHAk4p25
zM&3XDh2Q^@;5rt~ooxshQ^1}GgU(|BtX(H(W@Kb#UufEONIa@3*3x|$*TK+UA!2Us
zZNmAedE(6+>V&L}OlW=3IsM|x4$n6n5^9B8j??jP+;RT(YBOR{@;ujF@ET=?u~chb
z`kU8$Vx6(wV>xYQqRLi-*BIre<g>=ppW~4gy_u={mSr<$(G`0`(4af;x^0Ym4*Wx=
z!Fbl3!&MF{A<hBXjD}o>c519jqqQm-Y3VnxQz1fpckRbT(2DTPZ;m*|zYPm>$sj9E
zu^K!Q0II^?V`@_IK``_`zLA6wLSx9WSJ7zn3hc&==ulBsmOeaCr<5}Q{&iB~8Bz?H
z4f~~vEg6vz*VZH}7ah7U3L}ZmJ6#q%J(dM#j#7E#FIqw>DxO?p9k3`a9f@0xcW*zI
z$jd0A<<7VMaJ%Ot=Qd=m_hm__l^BsMe^Xm!*6^qg*Hb@jt}MvpL>DJAIi=}upf2pq
zjOm0{yX8sd=esm@P7O?d09c)nkeFw`rQ*PnZ_zhzTGdv*;4?9H7J2SwD-!j2s<&Sn
z7#T&kI|4Po0#sltpht*0v0nc1DAb>THVwl4@zC$QN4*$;e9Utvp~?vs-v6QSCNk2b
z&KG1C?Dlggz8~*Hny*?YUOwjEOy+%0<hw)EK-VWclvcJP`DB-Cc9C#gocoh3`skI)
zSBuV-$E{CvZKNb64Bfc@OK_@pH~v;^&z&pJWHx((uHCFw?8LkBbx}p<f=<p=wh-&v
z4Zi;VUwZAg*;l>Cc(ZoDh9zOQ-D*vp{kd;o_EXwuk*#zB6M1^NS;MEaO5esIpP~IB
zR;A+_oec~QMAGo*INZR(GvyU@d=HS7bX6J~YGdD8O^$-83A&+>nN<GsA%WAwpYDk#
z%~^=n*8Z6#qzXg=m>)j6iwqO)+`an@?;Qc3edlx9@p=c-4JnJqBG*`Ma`YSmVsr&2
zYFRr2Gle;J7~@{8m}3t|NSPRBM^M6AvkSS4;<04<MFk#P6T+d@0xsp5jT+ae)To$Z
z41*lQrTj8d)!eq83d@u#6|!Bw-u&cXUdAIVt5yAxON{xLl3wwTbpJ~YGEY|zKJUJ2
z3U(Jvn=>(RGRg21s$W-&d;Oa6<iUjKHD=~FFfF^?bF;tzs-hLpDc8q{RhwNu0wwXR
z@gi_?Cw5?vv>`dN^{Wx3Xm5XtcN|eQsTCT(2JlG+u*k`&sYp|0NdN(<;<HE`74e%I
zeIC?k<*D>qt;$-Al2(Vj|M}Sdcn0^XL5SP>nKing7eFr?D7Bd%dG+;Xknq<l5vi}!
z_r-nJ%hFcwE6nhP(#^cbzKn9Wua#BX>ob}v@|gLOa3E-y#i6@DntAO@$cr_-l}>%f
zFQwHn*Q?KYyghUMP@1*!fK}=or>t_$SDqdcvlybs^_}bh&(W4X9Q9#$?#z>~-WmD6
zWSZsE7I6G*Zrh5E+;*tuetCu=(5E_673jO-0qkq@U<K~b%C;r#ayo#rf4(yR|3C_N
zEYcWbHpSyUu=Oq`vK=(vmzkNrX6hh;*Q1Es{enpUc8+6BYfb6NjF@iiJF0<utMndL
zU2Kj^_RQyc)zm5Jy2agWpHVM&?Fus`mJGWb#!nSpY><&doqS3#z!X>JeL=&~wbydL
z{_yLqcU@EKer-{w)=08~(Uw|SVOyj7hG^}eFE#OBxvER=X_oa|vpPpT=gMt+?j`|k
zu&2<wb?x&&dO<(}8?a`P*3^timyQStxrj8n2p<H$n+N|0|L|kLp)18dBH)4);i@i+
z@;)%3LqUP8jI^4^V78#+zF9uj2ua`cQF3UnD%o<0h+oKsh0%AZAMZ#6jz-^5TN};H
zc92=puAB-;mbu(ac)v%>J@bmHqwDwhIr>CK;Vbi3E`HvVjnlAB)pYu#+1M-_9?D`X
zM^Sg4=J|WqCvTtZ_Hx(^EIimY{naEtb1L7|{=UVrlDlupC8ZnBzAn+(@*$ZU8F|u1
zFvaao+TX?P1tt*D$Mm3;Bss@cW4F;xPxnSio=>98amlhuN1$)$QS%XNVeAkQwASJ?
z4j^v*F|y3AVHfWtC}+BC8<Gk<O}}%Fj?S_dbYzd}?xW~AX)El4YqHM|8T4VrurLaZ
z()Q%{>vdh}7iOJD-O5aNkS6#4sz%xR)}vxOsbWR1_&v!iOGcjsd+Z|fwGcYOTPug!
zkE>)7@5=}0$zm{E!>Tt-BGu&k*)*~%^}Y7?jPzqRxLO@E+}rbh+{&Z$3L`MSijH4w
zY;0VCy@K~y%NN+6zI+)9eAn%r=$t9Uw;So=aR@ZLrH<l=r6FchC-CY2{May(sG-aS
z;syX;Fd7eI6!#AtT0EO2gt%t#f#AFOQrZKGtv>d1cheFDNe`1rsF?1*p16@M0$b^W
z#|g>&f2!QDJ>*RgOv&5a0UTH>ki5BbNfK2O$G-Ga_$!N~9NAN;w~7OoxLWzvcMIP+
z#b4T7x;eyc_4XOFAm;ArofB^bt_WQ9X=p?ju(rRHPs{zBF5AEJIMT;iG=U0h*Sycv
zrwnFUN*69(Y}u*vBR1@OFEw3YVdSuUWM<_=9-WH8;mDHQi%HkV3%m=fsMJ+eBW7Q*
z!iuG!51On>f^sbCc?{!LSfq>guk0J=>d+SaJ)`+6E)7fc_yX;-aZM;ka;nFZPTOPn
zmailGn!``ka~N(v3oV+-d`&vv7j3`qZX#kP^6>4M+Y&^Shf`QT#yH}ZP?Z_=4I7lX
zZ5wajo+(`{9-2f{2rx_d3W6%6%CP|wZxe_oMJehwQd5uE2j{Jxu!={pdFZC6sB^Vi
zj#cseaeK|IO0t(N^^WCBE@r!_ZVg1UMV(V3hx0gX9kKJFy9KsdH}C$v0P;UmPWxpX
z^Qm;O)@?+TZ_}FE+N>Z<3xzw^gf#8kG<SZSzAD@4fxR*IlE=nBxSdTZF!PO8vSp;l
zCcQy_jrN24YL~N04>@Pcj1<yeNYfj%eseY7_mCS|vo?+K@EiM5{jqP(zo$n%NU^ni
zmVJA-ZaaUgJd{1n!%D5(T_$$mhvRjw5kksGId9E=sxqX$5bnHoZ+0!qEtg?j605QS
z6T6G5CI>jAjF4<@KTWs{Hpkp%5}7TfocFlB$IDiBw}z;2y4Vb3p|rbDs=hL+y^k|k
z`lO-jwe6bV&H4X)R_HYT`j!lZ9m^x~Woc$`<}L}ULFBxOSr1Kgz>>q*dhdq9ZV<)n
zvpx(<YpMPcbL&4YL=nlrHTPTwI`C_7qLu<k{lkc5R~t-(FEKHFrV%l*pP}^>al_i*
z{79{BZ1C7mQs&|2NWNM8mz!<;3jQY-yY4lGSrl)Uq}soGTyvM-Y)8j5fH(0vsnI8<
zjn}U62dK03zmx_hg5IQAhrdO;REZBh-W=V(EbN#}dwUzZbb5s<$zCAiyia?3%C41x
zqWRqfH1O^C!4#(yOrs}(co2#VB=6kuZI0$qc+?!h2<A;WZmqTo#YEwsEhvp!ZuFss
zQZ|Yny<O~4kZB!wJ+pGYt(HG$>7436FBkBVznM_I^zcZ2F4-&&Hg$IAR}{6k3vd8h
z0%1yf2}C!Uug>2tCU5p;#0&9MqLF*P8kwAwG+bepfL`k9-J2EE;t@#GGFi&fP#**-
zoR^J($7{i82WbO?k!o8mf#y|~?w=#%mzdc*Nj$&#WR;&N6tc$B@M8ly5j4{e`JdVS
ztOreE<hoVW_H@ndnR`ct`Ztgn%O?$uI{*1({5~TvRO8f5mI0}e0H}pd)6lRKtM|z9
zj2K`Z{BSRq>r*3}y^7^J_QTc8gY%r(tHZ|?iy97%IA>y415u4#uSRd`<WNeT54-fq
zRiIYVbu^3S*(Je?N~6wtUIOdi%;H+80}Dx=BolmaP6+Q=U-?LFDE18m9MhS|c-Gij
zvzlY0&G!WLiPR%rwwFAzHZMe**Z<F03n0oWy1*WJv;tbsW&doD{23IRTrS!7QPt{u
z7U}rNi`t}(Ad!%apEka_S~a_T{;^ccmp6OpjLqYnraq;mxNn5smuTKz)!eo*sq*bs
zJ{ZoqMMJji<4KASdQwTtDAy1^AE7>=t4=9+?1TWi(Q1BCWETHP*`J9G3<NN+#G8;X
zls@7EAbWyMeWpY4DIN}(h+O0l)oN>L35Bpp#bt_GmW!gYclPQ<@0(Q=xvQ-07U=6I
zHVgfdZQzpLu+-9M=)<#;OKgiGx|S8hv6~a)8oqEni!6NmfXh9IKlT@v7dKJA^*E^P
zWEFNwt;VVzjre~Vaw0nM&&U3ErRl|rthj!zX`J%(-y!7xg2~@s#cI^}OTl`Is|d+4
z@&#U!UF0o&|25cqlsQE9cDsfc`#f`d+&Z@4aVxD?q$R}@8n30dyXqaAPRjSG{Wxw=
zAN0VgsP%*I9jaN>T4A+7&r-(@7w#LbC%#YCd*i1f{XDpi6A?0s^e2{}RD{$P7h_-)
zk)EE84D-nuRNeqjRCU44;?R8dE2{Y@rd-t7-0I_IWfZReIWqp=)*M@m0k&7Z5I=sI
z`?}Nc<Az8Jb;A}*;=o#V0-Qm$go!}it}E%>mvJS8+&1M(e^jMjx@h*nU}ie{nJ;zK
zTv)%-#+jwJMG_L7S&qV8k(Q3^zHefc7)-7SP7SKfd_BC;;#lnWY)ETljd0+($ZY~&
z{>>;>DJdzS-4*f+3W0eGB7rP;c}(v-wa^jpk;rjGFCwCc5CQ)FDE{XwGGlD+b6da!
zh)n!30}XvaTwENTalN4c!Infq(fT1LYTky~-f}EgI$L1sx{<8ZgNnTN7jm2HvpgaW
zOT$b?^3@Lx##nAj{|bBAY1`gDn0K2{Y*Xl3*3U;mIvzuA4=Qq`HM14-5<d?5S1^uK
zVpU4o^MR1NrCew;06a)~iHV4sZy!ls7O{orh$eq1eAIJT2jdF#w2K+QICljI=}{fV
z|Btn|j*7Bv+r9+}0TC2|3y@F*1SFIakTg)Fq@_c0DCrtPN<l!nyJP4Xx)r3mTY5+t
zU}(OB>-paG-uL}H*F4`J-&(qsELn@;JkR4e_ha9;?YDjZ0Xpx+p63t%k_~m5lAvSD
z*%`!!1*7>wN22Kt+{lo=_*pfQ7yG|N%6<rHPnKAfnT?5BXZ6m`q<1rTKnLvOY)6%=
z^;fuzrY5neqMs^kqODpdCExaSN6PDXN?+8i5f6!GBJ%Z7JgK<YmXsy;{{U~q8)xUL
zbsK;PvfPQK!%$+TzPl0$-HC~Ni=js(ZbH$|5WxwM6X91=wX62MJa^{=VDzh#JsOZ!
zK}e^Wb%W)@Ij_748Dn~>F_mHMc3OWtHdWj)eVQEIz0k^JJz|a$8G!l(WOsB<yI0%v
z!femvZ}BjuxQqm^KqG{;(p#U`uS2ZlyfaB;qXj8bm{L4b*ze1652yw}##o1_utl*C
z<C1}<>Pl=C9)4$Mwz%O$IzK<ZI|cVp2fh6fWAA?VHiP)uzp5<$hm8Wvx`6u0*qMNU
zAp0cM<5y=V;nIB`L@McS@Up{_uX!e%{D!3)G1}~)Sr($&`C}+M@a4@&7-Y}mULCte
z3)@&ipIT2mXBcM~n-lydm51+hR6k5nLwO$OW<VU9Z#LNTCX~p{Ci`mi8$e^i>ZBNW
z4nwmG;k969#&_>8a&o42I=900Ie$V*POV2*eY`0k7Zw(w{pWiFDkWg$M%q55!theP
z@fwTfFK}RaGBl*8tdq=glh0<Jp}Yq{(00s|<HMn6=;F|xhE6<gw?1w;XD1yMR7oO9
zE?s9PR$6y@Ila6$evax1>26*qtFIW;gmQ~meko*|WUmxGE4&x|M4cqOfAXUD`KqMg
z4?%OIZHjd=dZUnmYAbckN3BxdB8_%9BTaN%XZAOK)Lt#IqjydI*Fm7}g2>PLW*;Mv
z&3)Bl-{Hrs5pM&^Dt_ixM-0EEIOxUkK2KlB%Fk!}P-@^u6-FGH2!?ip8Bzw<zJ=en
zC%{@29cBUofoUh;3ACAAWP1K|R(=RD<<;G`OG<3kXGPuv0RYqVhp{Y=kbVy_(UbNK
z+ttOOkHhx^ew`2}Fab@R>$CO)8g6xIHKdbSri|F>&7lC*JH!3@4i3Q&4`st@buM&G
z+`jHpg>wQ4;L0-*kJgo~rw<rk6{Ya0G-$=|xC<P_nh)WF>!769&mga^<>M0;mTVpi
z87=&?%DVo~QY|2?d&%(l%}O&bhUI+CJC$O*+$7W;ly}A<*){Ryj$g>W0haYs^08d;
zzlLMP7?{<RXd<V|jLI$MN{58AX&rkA7T{=uR&UU#9Xbf1r7;505ytgTA5YfRLb2Vc
zSB7@l+eRjA&&-s1F0#bV^k%avhU?IwA(02YlPS7x;&^CTUM%s`Btn7#LEm4QN}jB%
za&@{C&?P~~&>VbJ4J3i3?jRvy`#U-@Ro}qEH};x=<*$Jp)&ejwXcC<Q6lV@IGqday
z3s9!7R{|4W-4ws2C>8BLzb(AP6|QEgon4)o7_J3_I*tWy3m~#|U7pWfb^w-99eE$G
zOnQ(d*<(9nI&aqbeAtnIg?j$}*3ekTgy0|19Bf@>^(c3g_SbUrMUO4M3;I(c5|r;D
z9!c-_A9TsjbS<>%+~E#BFa6y-mh%n>K|DeybZ_`Geh)*4sQI@|&KVXV-W~yesh6G6
zI~VLGy|IiY05)T`NYhY8j?1{{`U{Stx5M^j>4?n;i7u;mOPqZn1Ajrx%KXqihKoXs
zg{$s_sM@yeu1PJ6^SBOA4n6RF{%CLS0$prbul{WSgyA1CYi(&cvTI7mXf8V?AZ3^i
z^(FpqFWP^31B=fSY>qGFp(x167_BOEs5ODWW}Z0mHg1v^tk-GZmnX5)M>vstHndq(
z_yciiTblz9{S?m|Q+dASv#w=IlfLPlX+FM@I~2E7gm3m$<^N=gnX@m}65R2|d!a&o
z?c2A&u<^BBJaoV)-hGnOj)xO)y8tEaeu7)(W5geE3JM@Uw$7>&^8+3O^SAi*qLXt%
z5|S8DMA{M3xc2n*IT1plg}g^`JQL$ZF%&`!Z>}_#9ey9F|Lu1bSGd8uOK*txvo7{u
zp$=ON;4qIj6x6kR2S_&FDJq7$tm0yM60Kco2L*;a5tB{o(jDP8G+2DdjL74GNW7Hq
z<a+!({ncD>Tf0UAg?&Cdv%S2<N#^FO)ay8#_2$=oPd>cxp@;5=ZO+zD6;AQfa^I8t
zXQdDjS<3)P152&m&3}hc-7v>Gx90uuuTOJoh?ml7w>u{*>ysS~V!7+S1b+wy0Z~E7
z^4QC(5l1Gomw<y$*-ySNua>vTggpa}e#U!m1i0js#FEFzE>IQLN0%SBJ!M{qxP^=m
z2K08zTzAtt9~Dcky`U3i>~FvZ&K+J_WPL7H3y8g&C^wNmP4=Dr*H7>tB`3ogj--#(
zYndAuy1S$|?qHFr6CU`+j23A_j8(K@-ppZ7q(Z`g<-T0btAl&@w+U8#pJd|cK;4)>
z?v`ur#C9XrIBM8)OdMuaP`mb*$kayVSRXOHQYHRrM<qS@$fA~-v$uCEy@-RahEBlq
zBsc@WH|J1|6HG?}InJx|m#(<~Kbr`yVK;N7O0)o3XxvxxFK=VMeY^QJD2Qj{zueC_
zjpE?(i2DeXVW8_&uA`$vcSdI7|8Gy(zZVhx%vY+(--~*fUQ$h$*cuKB*BNWZ%^|>}
zJbUfyrBoBu-<SOsLL79us9L}rqW%Rd2ggBCIp#LnL+~r!Cr4oHGh;nWCC|PZ@x0E|
zm(;!jW7N739Dj=9yZVsc^LKB6Mdy7TKhWB%Uo{85us5G5SdKwr>x}^QqD2s0`#+Z?
zV2hz;Q26j+otRWQc-0qFQ^r}@*{>xNJ+FLs;5DWM3V@9C^pE2u`o`goG~_pYQ1LwM
z|9sIVukxGR%m*nkRo*~xQaQx|Y&F@d@uc#f6?`84*XTxDiUGKz0C2h6*V3ybJw1Kn
z8n@Cv|18pH4B#f>|7er=j~mT#Cl~f@Fdf1BuNTMrHEu=cJRnSVduUp6KYcprJ_`M>
z9}Au=td`i=SRt|zum8mq8wtjY+4kfAA=v8Y_x_Hc?ftjbd4H7`OqA(tXS*$I{GVky
z|L38!|8&(_Kf}{I`Hx@aU%w<h!ltI!SG{*v{%7;vo-L1!W*GObN%M`rcihPb3d==%
zsu}R}DoJg}D2yb8R0;6Yh|5ZD|Bt%^59;jkwQJ(n-oBJj{(mq2jeFkx{R+U&fWG-F
zg8nWI!_CC^Pw)KwpPqzO1=ETe8s>8El@^a%8J<6wPRYr%#&FkeV1u77VRJhU8^be#
zQz;HkML_1+C8Jny8>y(JrL|gqb?yfjM7*C6U~4)i;gFs)3omYdety%{t{)h7!&E4E
z?;t`M>oJrm*RVavz61t_UvYmfEWrXx+naj3{<q?dfdR)t9XyVb007Ly$=NGh1pM3O
zR#VPS7_DgkUuLk_S`56r%71IFNzIw^kx29M;Q255|7CMD2dl(#g_53rCn?7|w!bzE
z6BkLmNebBdNboQ^cE!aBe4Srsq&5He@e<XH_eK?_!K8fuW^Tbxy{pUDNO)y-*{7$X
zS||Q4_44J>L83h-TYQo(SnR8f{@wra_W8FjKPxl5l>DJedGEP%NnDmH<FL{CV3wke
zj@4*Z8>)@{?;E;H2+R_#GIB3`4v*(*op$DvxOx6bcXzcFI)W48IOjKej9c!JR1*j@
zxO1nQVBgN&z3xgc1dxOxQ*TI5@KbcaqVc|Vrvyt9CS41>;XF^zQC=8NrKVQ`M<t<6
z44(@N2m2+1py0%}OrV7azFMQvO3Nt<h77~M{$9oxclw)BIdO4uSG2_-u{HqQ3BXIM
zGsdczM4|vE0_wv;{1yyDjK2+)uKR2H{wk`f%$zY@h1QdGtfT>*v41a$$+zMKz2<sA
zR+!LPJ_&=#T-joQs27sMGeC@K4PI&J^y<sHF$vi}OE#${1B-Jw;23m)CCS7)jABn#
zIWFkFXPJ;1Tav<()|`MuA{~zh8Z5rI_qE=d-=;xt-blzUHj%wn`-B%qgGHgN_9X~X
zz8n^O1iZokanx=1MGPO=zl+HL>5kLlKKcOz(g|#CHx#g7PaTHeOLYK|m351?P&XhF
zNCUYafSr*tm^C{LmBjg5ObVMSDJg9o1^GT}?)^^jjZr;by|2IDhX>+zkzJhQe}km=
z=<~7=PpA*O-VVwV%y)o6jRl0=>|aoE0}3Y3v#FK&kjQcjBQo*St3%K*dutVjZR#49
zlz8iV>RSZhH4hApRAe-<t{bq*B>*W31KX0`$Tu(I@y$uZD}JjPPH>m2PUuz?+&+83
zfqle&Mkna|cZIJZU$5vHV5g4Zjv>3pOT`CkQ(J_Qez-i+JFyU9??QL@%O<F_o4D5K
zY~irAUikp-(5>Xft`DX56daz_BCMl=6Dk7>5QGVig=2Y>ThYJ9t-_z0iYJA^kAK*E
zHA&o22h<=zJ1|8D1e3nPoXpI7nFBT&7&iPh8PN9-9vU$y{MWbHznpHa-h%y1xEAVc
zjEt?_jWsnIKtKzI9rEBXEaTOWSPvKHh^;s{UO<s7ndHb@Hs9_MpmO*zur~xqVMf0)
zLhdoft+yubrjqH{70H*VF;*l`2^57#-cQ!s@Gy|NkVZgvKR^5_6<?A~+^{{ieT{z{
z#dW?%M&*Qz#B+PLSXRB)Y3TIEH^QW1i^k&DYaDF#CJ$@XLiGjOW#mXfk1KFJJJGOX
z`1D@lhF6`_2z^Y9A_h`DY{cX+5J+SJG@7wJKyy3=<D_deX7jgL9zSonY4sy_K(Wp+
zA-Vu^pa(I}H`>T1F592t>gl70xK*vJ)P6kdrh00xr>oQnrn^w5YcrLu&+$>$hz0WW
zWYNuoEQRWao3QV`boEB9H6u@-K55%QISEDyI#9X%x?cuqzeW4?M;nWDZ=g~5UzC=I
zK+SJLUeY`k7)W>w+($jU_6eN81k(UagK-WtPkHJ8f7qA$aV(x?f`{zNc=!u2w7AyS
z*NtO!J&v;y0eBS{Wpc|#KNFd>3M?-#mwh^S%_AVTY<{22OpQ0Z8KM(fQu5~Qm(Zwf
zf<Jf2saUu3pSsM4By{(=rMNS(obA6M_(YvRsvp$XFGv&rOvxx%d0k8;N^u$Iu|w&o
zN0N$VY`#qKsy}hBV1bdiFUvD^?b^QL)f_vVvqyT@ujs(hR|?qPxDX-aqpx4S%vbA5
z`H^6_%l+TQyF3{u`v?BUJpJ=Z-UUs<QQkM{Dpx97>t2)A4_9LhU}qfJF}#5wGp&#}
zv>F*1;kfuzD`GigRcU&y)Oq#RhjLf=($dnKi+p%^bQlwXTnbBwu=MQt5{=SKN!xnk
zyT?%@=_-RD6e+6(biFhp{E`jKR>~W7yW#tSIXZ?EIG-iN*?W-TVPUK%X9LTmImm3z
z!#-@3H)hTO7BK7mujVOmADQxjrO-JbIxI}T1wzfaK2^yTm0R}|ru!+7D86dKOTvdq
z=xH5)WQOJjC-us(d8pB;w9!HQgB>}TTx?7P$2mSplof<<DKaIAK@ej15UOX*lB&*_
zmUfC>7Ky#8ZBmoH@bq3l*fY(uK4^E_F@tGmPIh+u-;U4!u~fa<bi7xt+KntfJTUA)
z;y_sbl!vFsl#qz%C*B(XyC<R&uu3H3yr1cq8Y2xE`Pu%mvjz^)nEqKZ%sWw6q;MFi
zVn)Ti*f>i-l5G-9+M&bQSAUj0?Xo2^u$g)|$5br0m07!ars*y)K<e#^4cCoN5_amm
zq8B@wN6B6x4>_)&G#k&+#Md#6D*AoFJC@mI922zp22P+C@z;keEM0&Q^0@Cg>KmAl
z^E@Yx(E=d*@bBNn$y-!)OGpVmu@N512ZlLlN`D-fyI__2nEmF1%d6`u*I#7TSrp$D
zyx&YRr~Q~H*;V2puf*>Rv~)*9=Ok&G($|vIHz&0(w`;aNm%~vxZ=~nw6c<5RC^*mN
zE64GaMJ7|_k;uC@*9{@=zg?$8+xe$^r*-A7!5Jk(h=be3R?$hpJFcyGjs@_t9mm>+
zshu<skTN#A5iAH_ns(egoS`?gHg#{nOa3H;R_<DdlI-klAPf8fDr^tn6V<M`YWXQ_
z-F<E6-Gz|UepS}ZJ-urfN_Fv!tGzZ$A0I>Q!a({AoBH8E$s2G=2SA(-oEv=4(p7FW
zUYtO#`px&;HcNr($E_pLM(NF)Tp)N9l!|`SwtG7~da|)Y=a!hkw?vP&%U@JEDa`Gc
zztt3fBiWza)-<yAo5DHItb6&JXUOQh)0#=Rvi~ZelA-WZQ5MU+;r_4g*A4g?GVed0
z+j2OC<i^nVrL~WUAkq$#y$s+49DYJuG*&}M7(Z&QPHjwC_`dX3ZP=e@tA~k=VdpSW
zmyKH`-p^=$nRj+85fnK{$n`xT4t={L0V&!leE-5QS4?h>Zes_s<~(-+1rV^BtvR0A
zXzd(CB7g%Dj`AN)UICJg136jN>Oe_b?lHa)fV)u<hv_VSBmqth^a|^kQm#mMbDDsF
zMFuVGw9Tu6f6xj*AEwy8{Pw^5Q22&(a>1fJFmN74>8PlTd^9TV@8^zlM&5NfhznRM
z3|jrww9nho(SsUP9`TJoNL0bK?W|&~Ti}l1whuQ*>rrMLPL1Z|??ymYZ%x1<F_F>R
zQRBXJ;ZM0ICJHPM<xfVQVezht?+A7tM*VF`8_Mos_EOeaP=06MMtYm>e(9%Ag9T33
z>sx0(+JDB+$0w`3&^??!Ic}mbad&j?b;~6SA2I@(W}XlcMV<Hh&p=xtQ`5c9-maHk
zBOx7fa4e#A;J;p5s?RRc<p0~g;p99o&#|kQR`_ErN=ZxcxAI9L|H$m`-(;Cm1|(N*
zhF$JHtxX5>4s?;A{8WskT8&9%<g?W=^H`yi++5SIPHm)=G+R_TWWVf{4;15n#!r++
zg5m8Q2hL*N=Ed>xXKy#d9&wr^*Nh*oydcuCaGUa6PrftJ01W_%jM|4$QB>{y3NbI+
ze@H7TlB`Y)Yv1|3SceXyD{h}$)U@g3oO-!~>oC~>ttALz_q76rM3NT34O|(iEK2?t
z8Xyl?Hwjn<0vOlLBW(W1=?h`+IICYK19Ah4!d+{Bkh6PfveU3w@ObAkw6Pp*fQwD_
zko3(pTr@VhK<<}kCrSkdDv1>%Lbo-8+*CgG)xe`hy<tRm+tspey?lMcw?q>AJ^{gf
zxAUS6q3Rc3yu7~Q=%8EedZF8&f>#|@&srC^OwxrZ=;<4Kno|#-HXd@{>Kpg3s$&?-
zZW|fzXYf?Iy_vfx&!2OdyGgDRc#F8d28rk70<9-@dRyH^v}B;ed~*r6q;vG{+LlvJ
zJ}dW+<qZq&UxzA6+Ic!q{B_?95^I7%qx1bFAaY5+lz~d|cxug0)-Cy;9t_Wnoow?-
z#iI<j6UPFGDLE6xq*6Q&<FaK>-&`J{-L}tGX8maeBw3Q2KZj6>YMpNJ^!s&d&3E}D
z`JINi?p5lGPx;SmUewVyjtuAR#FuR3#2-#vTH2$Zuq5SYgg#f4qJ>7@8n-Tylo7XX
z)#9(QAJRqGeb=FPoO#z>(|vYA0~Io?nLR~!b!s5CO`yk4??zr3zDBNPgp4i((55fx
zh)nb82#eJ=7s6zZ_=ZQ;7SWdle9KXUPy2!?NqNj(jj+C9NwN>G`SH4D%C3ABDYkPi
zb(IB^?ePqn!7MLiRN+r=mnbLbl6jKFG@%@K-Ul~HNt;9xLQi|tjC*p{hvc)@%Zoit
zs~b%wuLV=Pq=$$t;P71N2i_u?FgLXJkR^tnEKJ44Uv%W0Y?jL(%!L|PRLnV=tnHH7
zSLFo?*^hJ6+U|NI?=B{!z@Dz-zM7hCbxQF<yI+w{0QCepRas0_I#~{Q1ZAInd@5bH
zxG^5wZjkQX#P9+DP0N=}{)rafS-80s7+;6jV6~*CGEj0}>9s);cOGEP!hO244M~Rj
zeBqlEQ+YvcA)?Bjo*RZ3WXbtBtV#D7h~EF8k}^h~hrv6vTD*xKHzY)IQL{9K$q
zMp!o{*rdquVoB0mb3cWz@}5k;)8Jem;!+ZvK#^Or^;?>wBz3YNdk32lp~xD|9rNnP
zylirB31+mo`~4#}jZ;`OVI_r`3Mrmvy6Cd@;=1j=lSP%q$mrqLB<smuQvDAOFajaJ
zHx5y*zZdZBe>zl7u0Rv=lqtz*jXr;r)u=_t49y8NOQOoAtlQ7ulUdiuK_lF%R%bM<
zO+@?0#*Al0xZ)J1J!d_X#uDw4DMqcTo~4;^`2_@2muN<OsLk(`UWRp#l*>Q=t#jBJ
zkmB)vHN`I4fKgI_YOQS0aZ~mH?s_pgbg*LKHr7}9iak))OCf%5FhU6Rxl2=9FVP@A
zNxEzQVz_d8qekqFHT1|&PWa*mA78)+wH4!aF0!Jra%+nlL3n<?texLrMTpnzlzl^s
z5nCHrw8ATrA{X=8$b?~N#G)0SS2W6xJ!UP<ZD&|JBE?dWmV!3N*D6VtuZzK{TT~NK
zta9vf@;icLW@B48Qz9TG^(~ooe@8n#>>66w_(i#}p^B#esJ>HS8nF+5tOFFSJva9f
zmN)uAMP+%#zFz|0VZ8du{{<iX_Zo3r1Z;Uup~CeTTi}h-^QqUN_wQ&Xv9We2Kj2A#
zDLa7_kQ$`24sL<&2!X(5x|gRyYKzRXJ}VC_nv3<GVL!We>Wz&A^d@dYQ)FYc6+H_6
z*pU9!$w=NTj$g}zjDtn=T%Mgp1yN%CrM#|liBlsM;d_`W<=x!o3L^ooYikX>jV}6C
zSwzMgEl+$7CfxJnT|IG6_{;(6N&_6QDU6FPq3^mp#Pz<{9K2DGQI4#=C_S}`fI?4t
zLWPj?Q0*`M592k8F0*L4{)!&YieT#sly%;vm~loAA!DA1^B1bAYUB?(EOUN0S-nF|
zkv(1|7x?Xq!W)}Z9S@}S%7Hu-HIyUdtS}c%y1;c%%dsj_j68rGG|`edbj^guO)*Br
z#jSnT$YNq@bI+othHjWn9SWqi=dS(b5E#VM++qXMtyOMp+{dmzxL|R0+^d(~7=bZa
zpvy~R;X8b5yk>{W#Ir0)BX9?1W$MR``PK1iwwWzH=LZ*JDW4XamC5cBtJaUg*zFcN
z^E(OAH~swm*n9VBX=rldTdJv{Eebucf@)H9yy8Kt(1I8EbeVkFi$I1+HAM(xXIJ^)
z;@8<VR$F3fFOx{+R+w&>&bOt@_2_))mBw!C-Gg_t?qB-tH1>xsd0ppx`1&eR1ocvp
zkb)jN6|3X|1CCx+6>&W;A{_ovfxpUMgN|H*CYsJzww0XvPP*VFI!#Xa&x;x7v5&HK
zhthud$F-~D1xLp`#q~#C=&7WLhz#HZc?mQcoC@md>bW#lRcXuU+0bh%I%kpG7_3<c
zS-sXq1FI>h7ABqH4TcgL919~h8g4*<?@w}?PD@~svGKkFYSaTbc?}X-@UhiT=Z2BM
z%}>S1K~>KJn8r>*If0x@0_8Wt8&B?+^81Z$PTq|pLfHl0rBTlv%y(tVIdG_Kdo5)?
zTNp?E>5xf!Eg^3&DyZUPeeq)*dlTK*p4lBsgc;Wo{6V{K$5T8=wIDx3dE-it?!5Mj
z=nKi#k$Sf}7oE>qZ%TWW`Pj9zQv>s<$tji+Vs`dK*QwalW3w_ys0#ZUQ*zQyjS%~#
z?|l-E6^%X{ITFFxN3T20WS_E}w)jkZ;P+U`DJfAvx$}3bs+4PLYbU9yz<^_&qi4Ty
zeBbkz==#YMx41)D`N`}HP3p<+5MU*~49OphS<5bHN2XEEj-)~l-|K8k_N1hY*sA4l
z{s{~UwpF3AeAO`+{(wBr{OdCFxQW1J6Djdu6`{s;2k9ptSIs*1J=wC{a(Y7Gy}sKr
zpA~=l9cz^4tKSbxQYmkEe;)7?*_wAb_=-}OjVUv)POmhdJUjIoRYrU?X@&z^Zoaa_
zg)~!E_PbX^4jbp8>v6&!#hRRA(|-6ogG0O~z0Vzjc8tkj*+TmDNSWL|t5G-YIIfrR
zRxOD{<rnge^(V&Aqmzihpc@wx*8XTM^2c$-63oxl4JUtXj;WzmdmOeV;4*KwEG2UW
z*-&SN#f7SgPc{ZwU-L0HRXw-PB1|a$wm$eG@9UqM)9gQi-@Xm_7W6vxr9#7}&Rlrs
zO3@z9jkK2lm`N*XV`D?q2BKVlx1`QaRwU}-|Mv~?|N1t@KR1nD7E4z4-^lsrPR7-@
zJ0^KiGSED+&D<FFu;#{MsjWZm6VN98MMPcWQ@3S<WlcN^;}}r0_OP1VDYPZyM)8X&
z!FsK3mzFYn8Ke1qFE#}z<DZiMI6HH{)Kb&gCdxAEJCUxOIRx4p>;h@!;d^v9pQub@
z%SKfq5-1<$Kjs+bYZPw2y1Yu-&izCWCfpQ<P9BwHD|SV54y5}L!Tal?A8VVp_{bus
zSYS*)jCMMnEY$b%ry3*lPg63o3Z%8>dk+uZB_tV*oG9W3yh0A4FZ5e{LRklte`z5s
z@&<=aS(zr(7K$5K#lb0EC7vJ^e(U?hg{3n$hscnFL+_Dhg(Eb0V~*!C>xspB9i&xN
z$s&I!!)XrL;&Zyq^Ty8O<Sm5V;$<(+bsx!|@sr$4Q+Qrc%wnM}1()MOGZ-?mbu0Ik
zYewW{KeO(Y@4Q!0%<EZm@$8S4%J6Z^S54}IN=`UAQ&G}yzm&M$`JXHLU)5gAd?%oI
zo$%ctPkJ;uU&<hm$Ci@+-Nb23LW$wWkG`UwC@M0KX>gg}n<SE{Os(atHN7UgshuUM
z<nT0K^RuE`4)5G{1Om;)tKSO({-oyQ&TF$h&Z>9Z3-t178_$W&3Sq-Om2+z?KG#nY
zcJ&U^SKi}1%2OlZ=;=}E{jEhwR}oyuXMA{Ew$MCVuhe}TRhV$m8A!+raYW!5Wg?>s
zxca*V1rL3TYqDws1=#g2+X}}zqu3oluzGCcvAEi8J7ByJ0>PMk05^kgRIHD2Qi4!z
zLKkaly77%+9Eso9bj0F%4tVU>f@uWgf@G^Y@NR%+y#t8COkgud&HPn)*I;rh!nF9h
z>8<x4YJ2J}ezkXLKreeJ%O=;)YjUg7i;Psgu^PPO4J0Y6J-<&q5<5ce%D>f5OE>tv
z|2rady~jyZxsvk}+oK`{V8PdJDhBiKf_Lsw=bI;$75(?b-BHUqe9I{JEn!oyGK!TN
z(s1i@pJ5hQr7h)ZZaS;_*etgM$XKfa+0&n9Tu}$oiZF`h$EwAVyneXx3W;&CmUDQ+
z7EwZG2s-yOTqS`%oDG@zfdr?nmjdO61yAw(Ugx^GtGVUm%f71dBPxg6PuQaPUJ}Dq
zIy*jO{;Yl%IV>zYkd|#%%ZF}sPRnyO$;a-!+%>8{o~?+sYe<4Yt>2qhH}~|ppCT9Y
zYPLh#dHa2Lj4yfHyC(|6*M*-wP!&l>c8}ZIFMZ9hM?*>0I#^N$p-yvYWd7S+G)wtG
zatc}>zm%8VuRXRihR~Bqx}Q#*?yo4%sY4GrW~^-6bqsfO4YA`zT$xy#J>g|#6py$(
zgZ*h8zJ&-PZ!B|Y{{D6+B3zcHA>bFp?fgXA&o8#~^9Ua@zW*Ju5iaL$RgsR6WjB@3
zR%C=qVxwgByJ$8+rk_21GQ+`Bop)geD!pf`!aD_Jy@j<@L1PH?@nUzM{Uu6C_Khul
zkEULW&!NX9!@-v)eQ$IcE^N^+;*YmTibA7~k2^n9DDY%^<`#IOFDriRCqyPr4`x#r
zC{O6&Ss*+c(P5|im0Q&!vl>M1`=x#Dcpq9@TW9i!IIEhr-0ruIj+J9lo7}K?n|iGK
z8(~kdig|aOjPN4<Gfw&yCU=l9clKId<RB6Zu=thlyQ5?$Y|_;H`gQscMp*KX7@E+1
zCRkWv#fPi#d6yOAp21*B?fF|VMZGAw+CFhIM7gH40T+70w8cPk(jsBm2tqzoUC{9X
zre@>(4H+2CChR8BW%>0_Qlv_qA|L#qp+Cw6?@TtUH7aNo+46^sJbGAd0<}{8J?5=t
z+$nbCsPL@v7tQoW(cP-HWIO*mGO5KbrYr6dMRb>L^}@@1=iB)kcV~EB$reQC*ECZ;
z(29-9`qsee`f(601lfN>`y?~PY*h8l>GGviUXr}FgWu;`ry*OVgZ`I~56;*tH@;uT
zXKz#Pg*-LXEf><ImpPBIs@c+Et*A9<2~trtlZ-XqJPgy0*WFwZ-JWgdL;lDhr>EiE
zFnwV%Rqo<lAAi8)dUm0yMYb{e*dfJH2P^G8^0#h&R5tfK`{haKx?R<S))$&JHJf`~
z2Oao3ro$74@X^KyDr@iuMr60La+*&NQjgLP{>#I+hA;FW=C%1{NULE@K0_Z4d(Yun
zffDcj_w$h~rNpn={ARNH-m@+!a&5P+B&3m~uS-`9{2QP`!}FZ~nt}(MjV`gy^@|+*
zrlI~c9fq`E)8*&m%QbcIo^}4iI%6|+p8Y`2nhaSE(cj?(3M|D}aebF{+}e<Boq~@j
z_lfqlzCKFk3N@&pVNJc(fl9+}KA()NEU)*lmdM$e7_Z0Xhi&(bN?xT8dtX{floTZe
zv<24niD#X@cXqN**Gx19;n@9|qVMZZDf+9R=!w2n{mkb|tB+jMm3^PjdpOzH273f%
zH*rRbb&G-A{^yS$rXbVEEsap=pXr9zylL<6c3sv~GP<S_V`_|pZ)BVI8^0yA#&8u(
zm|Zg^siLOF4#cxpv3CT?Mzt4p(gwm6D3PL4W-=LweK}BZD`(`bsK0-o2L72+KN?d!
zRK^s<w+yGO@LcgYNmE9eeOB|!B8Mqs536qxH6F;zTM9O0amQ)1)Mgv~gxnp21rP*s
z@S&O3OHFk8(d8bB9?fjf<DWNSIx49IYAK75p*~96v!h1q+8tKrAQj7O{i!mn(gvs-
z<WKnX^Q{R1-aqkOBL%g@B=L64xgT4lv!xuq%J;ugyLh`(e^EFJ)5<?u;-&n8a_G+u
zbk$AWJMgS$R~qldNkkMGB+|Z+G$<n?p?kXbe7W#Q%dk&GiE14h_5FKla=okB?gjpO
zTjO*F)lQ=sUW2rEk{fI8u`XB778{pFp2s>g^TXvxrC2YDxFdNSX}JigZ}dAB^C(ag
z>wQX2!BbI}+Fd=xJang)ZEk5v$IU6eR|M)yL^A1?7<K&ZTgXtJiFR(WSR5N)^rOso
z@^j8THLyy<tueKei^dc86_SSARzKCxufG`P8&s>_^WkdXx!?B$84;g8KK|FM1X4W>
zSO228UCJ4r1vW}L8QHg!riYFkmg=Sbynptl=r;yYeX7NDGqS1AhLsC~xJPJD*J=nV
z*ZsSCK~*vw`6K!iQZQDa`59&<pvh#^VD8J$YZ_pgGE$T85D(nd(+7Mjl|L;n()Nmb
z9BLUu#YUl{qoYEM8y|HK4h{%!d>tPDq*j9x>rKvJs;(|lG(Y@&+$kVM>2Z>+dbiMV
zwcg>AuJe!-Jv39LKrL=HF9k$kB>n=!fSe+2*{boQ$?x}RF!dfwIItT$|4c;-S5aW9
zT*dV&iN;Ifh$DOh0yfIJIER3D5cccW8_L;IA2)!2<OK=Rl>DVwv|Kh-Q~0y9czPD#
ztS%GVp(bJV+rd*|HTH(dX?Yrde4t&{&y#%=SAx7Bdm5xfwTSamgAOUEy}~Kt^W7MG
zFMUq3kJv~xJS%UBLF`+x+#1vr0|{o9k!u5n2m7r~`SJ#6V#<oi^5!REWDhlT6;sEO
z6W4kp$zf&7i(0QLbvo+drtd>~>&??S>D>^*bNzbxo47{_r)L_HpM!&mSEva3f6aXx
zskig!KX4MY!nWw>?9g6`*C;i}Qml~<o%>W<)Uf1!ARi)t^&{BF1?E3eMst@UqYYb=
zgG;4P#I|_Q^=B<%+-P%o$y+`#rS(6*$ol#t8|6o-4BHd>4e14}iqqm<bvJF>D0LxA
z@9}Hc92)^m3Eh@5+J(2&5c{We=cRV=X~p)}jy#R3M`|XzPb3Uq(=CR$>2vH@w|fXU
z3oWfh9PH{A5A0Y&`~A*sZDVRS*z;+oSMi5LhjJG~xfdjBSGN0&=UkbX<HgNGIIAx>
zX+3{jtkk@YGcwOB8`o<o^!AnzTD&}06`1~$JIasC%G)nLa?s%K_Aop46W6F&V{PxZ
zDay6-4GW)SM>{mW-^Mf%*MNxp#S4%74dU@`GBQ&V`r6$pQTZBk_ekxXCJ^V!x|*<X
zcmwyx7cZiOGhQ1~BpMvXn2*ZaMUJB0;Ns)g+KmFWNmGyLgHJPe4yKpf_{54|-cFNP
zvF;QwKD|i+<FM<?D}Fy)Zvq3SQO~1A`g?BxyLAs`Iju+y$n&R57)iF{bU?v2mC+`G
zVOH!VE=;=nS@uQ1tr1Xg6#^)xJP`3Jo15obHJ&>LQ}Mj^!6!My9kVd_Vp)!TKrBm0
zxIbnxBsRUtH~Y0ewn!RDQJ`|n9@&^(!9;4}XZey%lv5IyJ+pvQRQ`4|v&@JVU$=jO
zdjfjm41Ub`?D=bzqCGwTWal+bGP-Y0Bczt$eVUM+TT`F6tUFqcPn;Vfr*l&FY|Efh
zvcEW{W7Y>>HHy5u&n#f#^AU@=aLloML1Jgx%p_?Q+czp$qNq$qJ7YbqLHd5u>03w{
zAH*t}i1fsG0>L!r)W?u#A^=(_Lq2`eS>3ZD)6X@~J3Z}_<9c&%bCU8R=mnxk8++cn
zTllI9sM$Y;<=PX=U!G`2sSdMow#XFz{4``ZZZjOxR#~l=@TriMYd|ffVdIvnO8j0}
zkLJhNofKJ5x6wy&OiDg^>8sXt{DpBn#wS$lcF(yL+C!eHJjH6EZe*AcwzMzF{g?#V
zs+MmY%><cc8A_SebKTZNo^Ja08$3dvIe*cVrzs=ihWxhVw=k)+5^*&@y0#wS5;T(W
zu7WVo9s0@-x1cFe%<@NRnNmsetjM9Lb)!_@ONXa(lw3v1FTbR)ne%(#30$n$mA4+E
zh@LpbA>%nBWi^s_3W{7-zGUzocdR;ehe<tREzNnr*dmY&QOM=2IS~^6#$lyAJk^96
z)wDK~U7#k*+}ijYd)N)~Z`M7=>TOp13nnlhjpUlpTymOD9BP=4Miq=$G%{u0_ci@?
zLGFbkV^BzlRi5P0u#$YWO)T+R#VtvA25Ut@+VF@#zEX@cK!9}NI$HcyzEvO<y1iGd
zZIa)>F<295P8qvr(P~(0)_Cr})}FFreg-31J4!>OC&Dhq4^x&j2GwbL#7a%-EO<Az
zS(tNm!?~WDvhPnEltX4tmYHg7wM`WWiMgXTv>>v9yo>5pre9BP2`l-W<Wy&95}LWJ
zhM#_1JG*_#>S-1NL~6#{sGpsMK{G4eaIBxiBY&o25Z1<tSj^8xm6euyZwj9=%#rg4
zBfj<=TE4JbD4lUQsV18ye_~9$X>6URp;mOnu-=Zo>{EmH-b2^TyqY>vt#J&#_|x%#
zwJ=9INS6G0`EkI@Jof>~@|ZktD(1&#h-+kbEVj0`@Z%R9-^s0K_{buxe*QK>-l5#a
z(^RUK%X|B25Pdn2|3LTEJEuPsvu6p&>51{&wUvTNq2mVpxK3{Z0{kinw$F>69Kmgq
z&;E!9sS~aabM{%%PJ?y0zP^tpZYmu>WE4idYG4u`#;{FQ%`GDH8m=B|L?7ME7SCf`
zJl|uAADd&UQS6U+6~nSm|HNo#Vo|MA+a0>pEGFac&z{n=PAR{9%&xn$4LLXVEb!==
zgj+%6Co4G*cl3Z>vMAnSwKvI#{r1YzQk7Y<Z71tCS*?iKNF0U?pIUIj=F+M~$h%^E
z+DOMGu=&S7Rsz>|b)e5BNTiC4jm-s!47F-xH&5R%VB{vSM_A@sAbe`(7UNl2HDIu>
z9v{$6sSISZ-xL61>w(M{9u`OgAT=vchNPs5U9Q`Hu#6ynx{!*Hp&4^S`8A)B_bYF3
zPJ8Y$%n@gYB0fDWW)kys%YOSV;l*oWc!S&4aaHUam@Yf5z$U}bR|)em#Mt~|EQjt>
zJ;`N^gdtxBE&^y_F&C#klC2LkI17qkPNygtU2+H6z#C-(6-ho$)q?c2In(60gknd^
zWELAp;ZnZ~X#FXx;k@YfBwnNVhq5+iv5}E6wlb+gRW9B1@NnCRNQhP6hE-4sP1~AZ
zv2@UAm9XpKm*IRZ-KD|eQdJjYfd?bH#f|%k1}!g!^(d_(z+|OQd?Xg>NB)&rB33D*
ztdp5u%CO#r*`Qk+qB5-&+%Hfm%m4A#NnT!cN)yA-C<XuNLmXcG_w^<%qSu4771L)V
zTQ-HP%~3`CtJ7JqhT1OZ9E~O{2a4Dl^ZNdV*7?`%K^l5?w#n{-ye2<3n7Q_WD<5tE
zd%b)(62f*c;5lo{WsM`1!mSuUXaD_h#)+Pon)eM<(XEy+<*<&pdm=x=QtJ0itpId#
zb&zOR6y$DLA^CCWsHyV{3m>0@7NJ1%0FKFucBQ~Ew;G01!T6J_smV7+7{(b~?W-n#
zs0Bkio?H>2m`_~O2ZRJ5C|+(ut%_ZKINfSYF)%bBNVCxQvxx1$%eWKa#{T%>8YNrS
zF}5M!h>Av7rJ_+5Gi()6<obuc4_P?C!p{3kbrhvS0THd9AW49s1XLFCyVR;6cYfDe
z9BR0=_=jlORHSLR6sXleHfY=>o}My29FI|#c_;JzyuFE8X`zqunSG4a?;gB1cgw@g
z<h9;Yd}kG8rbAQ%n~T`vZY32X_ydC${tZJPld#+OHB6*glb=1)e*eCK;rFQT&zd&0
zEtGO}nEl6*%1B(G12OR)Ng!|gJEMBfEkseb8Wq>@U&p_F6kliuv#wBP22NMktk*yg
zc|r5yJiXK@p<QP2fnkmXj|KFlY9|8B-)ZuEqqLbG%v#B_%bBUI?(-+ynw;d|cD7s4
zb88U%a#H^4hJq3lUMu!+IGSa;gpV)odkVp0I;Xw$LHdhAKw%$dVR|q44%(MnUzS!R
zO;k=9D<bBwk(`?Q%LX@APtQTcPxO3OY<n5*yioP$#IsTG-3t=om-@zqI$!#Q8!J6r
zJ)P#<QNe&!u=IHjaiVt>v1DA6A}4a7EVXzsi&lNOf@u=bsNr>Op_n-nb1jZ0bYA#7
zlm-y|>$mICIv^=r6R3-aVst(7#&n>vS41%`dxTrSq?KFclY+m<+%-!rI{1U12trd|
zC)y-}R#K)vorkY$o0B72AYN}wRqZBEUhOrd9+(9@4?4d7<`rBy;`GCBNJc5&=vZEU
zdTw<iG5L-21Rvvto-}S<UyBS)&x@?%^j~W$O}Yhv-ofw&FD;#B4L$@R+eO{&x!ad3
zZW*nT<m2IxsXeXDq_pPdBJaIUyjL}Z4hX_js@Rm`FxdJOU;o}{jr^R45sXXxuO$<f
zI(>+FuHF5X3SK4FzWw??6U1Z3hZd%lI=IK|D%Of$78>*ulsxuGOfOc)Rysdh?o3ak
zM;T|P`80(Z_^^J+&RUbD7^6nJYuiL?5k1Lf*ALb`FVZrkl418yxkkpu`3BJHy}dn|
zsMqp&fQ+`MGVX5Y_2kRO^s6TW?+N);gbLWD4_cHWW+3~=F&iP8)~c^HxP}_IGS?2O
zE1?>?8(LN^*&sUv=m{D<>VGdTYJ2S#)ov^1$R#0!zSLD7KfwfQ8g~UntfuwPD2zpH
z?cLpc(n;=45Wt}2Rf0f_`ndybu01$qA$J*XjWwKZzWd9FjD2mDKD8*UnN3SA>y#e)
zI<B5f+3>86G^+k5k=bOwyv>{3^bEthG&F{i@qd_?$V}LZk00pq-(CLvv1d+TV1}7w
z;z`vFJ@=~h%Hxz>!~>O4EzRD8355RC3c~7w=8h*vrBz;Nbdbi@Q9`GKW6+Hd1+N4j
zf_OOLLqv^z#tehf@srVetQ>ht;<08KZNfA6l&1pu>xA7?beb$%-_M<l?^yQ6AuPXe
zn=G^tQ(Cv{$il4q;X3`c?4vfqH4{HL5;jcj+64w)CcHS5E3hB_QqF6wTDE=E)#JLA
zBtNa9edo@|PhZ&$%P;UU#RA!%LnkZZ`i6!+qZE|YG4;>5AB`&?%DlIKSvBjrPJli+
zX~z}%IOpMZuoHI9QQF9UmE@Hzo3PRn$1f9`l(gm19za6BU06RyhxQY|un~*v2?KGX
z6+U$(#+`Uew#k2nT6Uxy<OJ7)*zOweccjtN6J*d;rOk@2JJy2`A3}f>ubY>4OK7#C
z3MJSbPt{hIi6kPuCHBeJKa<G<rBGNuvngaTX59Mnu+4Q!F2QEXn0lWFiW}eQ=ZJz7
z4Vs`6G!-pnqt20#u`SC5n4pR32i0}Xvc5N6D?O|ay7y6CD2V-iX)~y$A5xYFi~q<Z
z0kWNuHN!9Lz~{gQZx_PP(@%2X7KnA><2%Y{$HVojs5YEx#5=;TPI#UXO|j{I{fwNB
z?!ISj^la=FZqMT3g_S!m%w3DIAxKiDYS>Cvv)X_AchU)hd^cfZj*7RV=;g}1&%tzo
zwb`Z#&wg*M^~ONXMN#@0v4G=FT&6nBBi?3B%`_Va{WPuQ{)z!TNq_ce4hKp!eMu-q
z_vzb!WRECSC>rs5@j<sk_MMb12-hSvHT7Lm(p2!m)CTHGX&IT}-#@{TL5d`Y8^FnN
z@$j}su)6BkKI!HE^Sarz2TMyhDfSko*0HxX<Ge~fHIMN(9nW(I=+Q!e^qaLj;A@nP
zd-@85nb|i>a@~MKUXMI+{e!K`r!r#I1e!3Kw0ITUQxx~6U#fQsSCC7vx#b1<;riu6
zSaipqFzB_4osRGywOFzTNxP55(Ri@FUQwaaDt8P{@KjQI(beMj3NNqa;i><@PTD-T
zu6Qr*rbf|tiDA2{_G+zwK(WHe$N?cix#4Nn?KjKh%SCB8L%Q$Z`ozl^VlfYoDU|op
zlJH=)ZOyqe-%blF`a1bqSaEI?rdCFXiZ&Y_7eg*g6{)F<8`>T9B%?d3#EnoK4WYzn
z0fC`C{npI)*^*f^2xglJTSMWgKa!b_+5Ec{)VE=VQi=H)A;J=1K*mhwkx)$Ea4Dhd
z@h5IJ<uFbaHqGrFIcr9^Z#`JX^iFw9E3RK-e0RP{;?#6I(aiPqT%LD3QEAD9EKc*!
zw6$ry;m!v&8oI)wqS4H^5gN>f1wVUJ#B{IZ*9EUli>DBCQPJ7s7+649IQ)0Uce%dO
z(5_%8t--Aqmm({X;HTOD`t92=2m;>5_SI+JjRM*L;0+6=6;=gW_eMNo>ZPLc`xJ;^
z+_N)iGdIojgv$c0Zmi{Ea^*t82NN33Jrt3$w1%~lp@NOgyX(tQ4WvumJH`dmI7jI(
zdc+8<?q@DTx+*@X<sFw_u1@ChEihXL-Q@QcMHwli%m&_s_jUIn(JnDH4C*dsaWx5&
zp1Lx};(jDWDl!IRuzc6J%Ex1HGODFwce2kFab@%0ZD8G8(Z53##(EnRl8FzFvA@#P
z%<Lyyb7-ang#_8^7MLT+P35KtzaI2pRl>7WkdyF)7U(NN%{hej=_s7hT8CkxH|@as
zRcaniT;k+dz1%&)PUU-AIV#7;8WoSGa0na6Do8Fe<Qp%VWkvD}@^aO*^dx-`Z(G>2
ztEnrl^wtX=yhsu@&V2CVtP*)_Bd~>K&0lC?m<RYE`9!YhjWKy(1mJw`yp|S#1avaH
z^8E`=v==K6E{0ulya)TDw%W4>gT)w>Fyr3X{QJf}Eco|qysq+WIdtmO!SFW>mTOWe
zcJU{ajh)@jn?aK`80JIB8!)7J`mu^2_F1C!1LnJx2pjldxG<zGk_B%1Hdz=nvlE<(
z^j;NR9R5C4)Cvz&EjITixV48Xi>B(=<rE#iR|Tm~JqV#vlU){ih2DmQaE>{ZuO9bW
zamtv4oW_}`2E$Km+jyNUwPpQID=J^UlFA)*7hXTQ9~gA#cZtYRPone>+8ESUwHO)X
z3;eq4$N5eb6wU?v$C2%Di!AF|{x1-1e%CmcsU6KrClu;hMuNJOGY{&qu39$0t-!Qv
z9W&HGRt_MuyYm}!-VPg(ez(I#!(4Yf+K5a-=WMjoU*w!xHNIMg$T;_lY25d2@Qg;N
zFtM|_ZwQ}nd|=~i7Ob6s&(iRpZXP8_f4c<HFZLjJr%RO<1URWGNA65`fID=TjBGKv
zG>KAgmL@Zf5kqIU;tEEu;RD5R6U9?~h{jVRDR0z*mzTr-fD}7BdzZ2uDgtKD2R*Tu
zO@2PnGe|_^xXZdT(kjo_46}Nz_sOc-KxX~9=0ss$nrg5_Qev0z&Z(r!N-niP*x(-S
zlDlt;EYE^O`N0Nt;a)r*y8F#a3fYFccX2bbxM?MaQN8<WymDDXoA&AcyGt9(;{@{<
z;)EN8lc~wU6C6Fs8B=r~Z=bx)>+I`tin?ie{ry5(QBo_(WMj2rQl3HO2tkV~qh;^j
zPe){WMz82(#fSXds@@_?K4tdIa%(GHsBo84cSC}Qg)Rq|QqrL7L}S8%(a)2M+8tiN
zgggf+EF8rX#-5{_g88}m@Jgqup3^M_B^dLZOOlY&cD|AvT^<NqlWV7QN_-tmoyDnL
zW7-*@D-@IcTDN}?Z?R6#NLi-vkk&T!f>%F0yW!#+>z^t)kvkExHoZ2nOr>M5)Z>=3
z^7A03{N`}g9;w3$5=uJWzFuHxasVM_wd+yQ(N}&ezZ>)*V3QW8>9(m*Y-!tOc-@$E
zBaWfKurRYISNzYfKL)QRIkFNg78=#BAt9q6e}4W1;MMK!M|F40%m7DQJjf>#p1t$e
zq*+GVLJHB@$;UWPJ0X~6v9h*9k2=|4r&{GU0ms4sQ*~El{IE(yQT@xI#$?O<Gu+r~
zF)41Go8=4j7M&anO}a!To-n&MZR<O3B5>PdMV^nk>P1SDTpZm!L+?$rvoD}Z)5-|u
zCbh^$E$GSNz&C-EVWQ&3<!vHU56=3AEfaCQ)Q%n45F>hSz33|>|GlgaK}7ZQxW>E!
z(+v{ofVgXEGyGxR_U)eQJ$USv3qQQRKcW@df9B+(?)<UKl3g{b>O6?67C`udwEg60
zLLeflG>-fEE%p23B0}>`*ZG`x^@ypSW-jxMZ|(>jDU!wStDJ3`dg?k_LifE1cPmvm
zXb#Q=bT<O%8^%cHJd3#+jyeUQ7bBG`-@eAw@bRfU?166Ul#7oR7L8U~y$GPsAhnwr
zRDlQHAa)$Xi8UE`r5Lez_s$ZSp&xjXS?O)<_Yfs(BmkzZ6uVlHva4%NOKYok(`lrV
zTo|#tTLM&P0%J)+%Ovh)BlULh7KXLV&>w<RN18?~P=EA0s1u}h6O&Au`vRcwU|vpg
zKET^oUHeY_x^zn#i*n$^ftEi2Ynd`PLMmlza*rg~HidJ3Oub-a8EgBrG=O+iD&?{d
zw{_EQ;KXRrpxneGyF5g&TRVXip|er2VOi8~`KPo<HIY+r=kcomyc(NW$efdF`Oe`*
z;;VO&@rkK_4Eu(axa0>;^5cU~5Q~r4b+T$NY$NF0FXoU#EVA#^3hgZ?KRNI({M>x?
zF6z^!b%nLDuCDHE6aN%yMJ^VLZ{k;i{n7jOn!e80y3RelIb{_JUpwlv!sBYrNCZp=
z_ON+W$!aW?$@TIdO^VM93tSYjvrOl7OPuBxQ`u>xh)T=Kj?ACmve~*gZhki`!asdb
z$)~!V?YKYsF(R5!;qv18bnc1qErpND6+#Zk%&K1P$mHnE)t!{ob=?W`;D&4YNjc~;
zV~OVG?b%l==(f@H%?S>5Ae!XFq8`*z*(-ta$oRco{D@d-@7dZhvxdFMyviH7IIL`}
zp8E|#mqz&UIV^Jl&cL?dvf+@IaRn1=Kv*sH*mJ$gPB;yNN)bFD-r8LAelfiwXe}nT
z1oi*J0#K6J#1{c5Ip)j}DZrMu;$BU1N(QHz>>};jn)yKDixP)>Sk};hd$yTYHJdUs
z2TKXaxtvOhrN^K2ivr;VVD6hEO{9kOWh5D``ZKofYZ#)8w$hg2YhjKm`~c%Jb}y`@
zbMBU{Q48(uWPjv{p6pkWRLn11F<GB~Pigk!iBuJ&PSo>lhbrMs!dnUwpR&T;97c^+
zQ$UwNMAjr!^h3SU9ogqFiRvJVwQ8xN0VkrY;R<CkTkXvggyqylty7@lrv`hJ3T1)P
z$6v+nuc0b?7QCE%b|u?&7fv<Dv#XI4T(YQg%G%WVK%;k&k%OA_jmL?DJsWB5DI*K`
z;DoFFdssoO;B(#b$&Ro!vbRwrZ#?;}2CowW8DE}yk@f_s9kHR_`|JP*ZD!{@mE>g4
zu~{S_%qq53ekoyfjY)+#pG`N1kcX<4Giv11_R*h!otzw9_ZLzmA}_Ute#V)*>KAny
zL7_>~fr0yrPP!Y>UC@Qm{P2<d@+hVr3QF=k1C&e4KmaTA^qC!;!13gGtGZF7XfT@~
z1>{u46m{xp#JjAl^f}#^JUs>}^z4j`i)x~CA<>x6m=U1cC(zL%f${CU2u7|klsa+T
z&B`|uM72SHk4h+=NMv$yQ3?>l3C!3>(7A0s@$)^K^ipj{BTadBN5{mtmDRL_2XJqc
zLq126Qf8mQRXDrhqrUiz1~s{w7P-ms?kR5YBoj%4Kx(#k{DdSYem@>@R!A^6=A2%-
zCmFQ*AlT+VvUg0xs(*J$Mw*)|o8<SxNY*oFvnA(N=^M6mEKlXPlG3MtGP{o@BFgW>
zGl%Va5`^XPlU>8)1g&CgjUcT-mQ&~kHyw`)iJG;}jeTDN(%!xzRSjD%4xQ*#N#Cv*
z&i8$pAIUj%v&FPNl{#&_PGPMdifptfB_cUFooXy)CPt>DPl)x7k`>p%yv;;pnTrPC
zCaZ%3{Ff^ZB@$hYI(BJR&|O^O?zMvI4?$W@<=F<XmULnE+;sIAon0D%`qmKYqR3>C
zyLU-*I|HBA9~W0@X4BG8Wry!cqn^i~1bgTcnyZ8MzHN&Q+RP{Va5}ka0$GHxT?Uk9
zKHx7G_z4t6(Yx~?0Vf;y!mAe>507Wb&SNoA8aMyCI)b)^VJ5XXvg#EOPLc+}o?eAO
zL4JL|Pk8H=qjxlTQ3IBH9>TcA7j*TY@8->{Z<LK|#RNIV(bAOhW{o(mpH$Dv*yaxu
z4+OXR_q$W&That*>k41!K=Ia5=p57Ww<eFO=B{PEj$s}1{k^IBUNtjo*;`s}9kyHY
z|FrfVKv8a8*03T-k|ZifQdAT{qU2;Ff(nu(G?EdOoO2dIQ4}LN3z9REp-Czz8Cqy^
z5XqrILX-J--<f}E<}K;>oBF<6b#GDLmVTad_St9cw3eFiPfT-*j;z0bW=8Ja;oynP
z98s;&76E4Wxu2+r_v5BQR_jvI%d-O#_iy<*4aSQ4*tmXn5*W`<#)<l0W@a12CI)C$
z&HL$=ROrx|um{f!8Z5_|-brj4S<|v>P}eO~fF`pF<7k5;UViPrHA#>$g@KQ}cG}2O
z6^HnO7#7N;%fqFykF9>-COy7gT0{TLOS4+~*a*_ILj2J5+-5Y&t7}moFs5FhsQMh4
zoRNww^DKT+pY*d_BO98?iy!>BkB&gUH&P3H_F%mm1OT1CwYpi&+j*Pt^BwEUoC`N#
z=3TXU^f-pmwE3xxTa{I-t`2vCTXS6ra(})O)p}#YyS-A<3e#L!(>>8zXX-~^RJAcX
zXYknGR{Nb`7do`qzMwMS(x8B;{#;mmuSVE}{FY_IrL9aYdO_K`y_wrwEk<L|7pG~8
zh@@tW&4BTLL!8WJ=Cf5**OlI1PTdu))FpP9#%Fl_?elsI-L^mlx)_-w<=%Ds(hR62
zBum=nr4VH&j}oeKyFLM+7x!5410kS?@H(E)eu`P`G?07XN2{*3iOB&mf^#?7RY5`L
zFI1xG$UH*{U;`h_w_&tWrJ~!~+`MkD{*F#jdBJ9K&TMiv@4MPc`y&te$_K+eB0a16
z5iD6MzGJh4#`SXkb$_m&96BXWJiu;)e#G4n#ewdiZ=BxsL#2Oc&>vkqBWC;<CI~cu
zTR1Z_tGGoIGcb6{n(L_ROqZ5`KxdQSSn7K%kBX_~2$vt?t^Q(jML%M8AKW*#RD7YH
zP9D-7Q%)T8)T*wkoXL4(d20yeX3?wOXzpS7@#urqP9RJzsxHh_R`R7dcI>Wo8t-g>
z%7@7quZ8vDw2|q@hckG(clrl^SKI2e-})S%u?UDTR67!dSQ)glbkaIP)mt5O45PZg
zeJ738`4c70`fV&<O@qXEvBF#v#=^ukqf)wqn1>lg8LA$IZL^&?ksVp4a#4*jts<Dn
z$bG3n(i!vB>cstuA``WNn*%(x*#$%QC0sPrZe;6ye*XQIo3+*6Fp=DKA6%oWfPaHI
zE?ePQp9p2iuktmGvU};HnK#zR?CvsrRuLgSefspTMNz7<5|k*PdEa>sxofSlAAP80
zngU5N(IX*;b&U*jfmBQj3h-wgOFRsrXHKuG{(8$*>n}kU^Yx2T)hG);pFF{mq+(E!
z0h&dYnU~$h>IyJB@)1VvC3BfSs_X_oi#~b1J3~Um-RflerEkP{I|pRy=JrkjJK@|#
z-1qZuI6)C&SA?EzzIU#5`e24Qb1Ym%1KSh=GKB6TV^T8r!znO~K3%=Nh<3pkq#eF!
z4ARb0NdG0!@zMefN`+U9CQp=8dHdLy&ShuiI7ELo+s(h-?Md(3-xour(^?w$y9E<n
z5|^VtN@Tvc)RUTJz0sT-_2Pb<`_|^x-rR*D{=IX`+ph6e7dg+VSXjK^{rM<sL^v`c
z#HR0U3>9zR?31twt76B8@qduf8p{D|ZAu?pnwI4Z%B+;yuWOhFg!dV?==a<5wHalm
zvGKD@Ys}c4fqxCd^Xe0F0vS&*b{zNoynxX}TFM(%_hh$;wmz8skZ0K08AR=1dNsg$
zz`5DYPTFs0Y-+B&qNr-3BE+qwDkPk0i%P;ivihDy!)C8swEL7CPsEyt$ql`aowlyt
zuAlwnTx&{F6`RASGSWL3IKBU*h`NmJGbg`A(8mv0bCh2Ui!3f47<@!pS@X3zDyJlO
zxb$<B+W>a9+^Fnx4i?8-TGz^BqpVD|#not7aO>h9Orggv2D86Yj(bWL@{U|*^3iU3
z&7CqszTNHQa4+fe3`{~Rwhn@GVJA8VNUmkw`Oa_muv#&gV#w!>)OK`3yj$wIJ6(=W
zvd!VpVfY$%thXtzbi}vP(0z=g&oU1t0~J+N!l`KYM)r3THe>D#)UR~OUTV)j*g_DA
z2Ee3Z9noB$NH~(=9)0R<&1t@~vE0<$j0P#aY~S523lLkwr*yx+JHH0HR94VO$=mzu
zDYe`DEmu3MxL;nDJKf03ZJL!<=1bT0d@1-(7Z(QWev_9MqOotp$gk)gBY)G8BdVYL
zEb-Rnb}@yONKcjwr}oFXYQOr=<+V9ORrWC<6$@_P)jj9N?SxIY8a+YWX|3gD9`~h2
z<eIh8LY&|vONh8nk&4(JqYL)98E>)a3dvOe@Kgwo*p<7bgYG$(aSSFzuB}c2?K&uO
z;)d1PtcnT+D#5V5KjFMx*9^V1R8{w07K&<+JM=DJnu~>=<Fr>&Fnf6Cn*_aek!&N6
zfO9bR<A{+<*!{}LwQO8YT1|$Oj+SBOC)w?iic)3nM?@vJ5~;jglyCL$xJjjVn#CvY
zSBYxnRWF75>c$SZHZl8Lv)*_iF}{ix{_}}GEIxX=ZIj3$hFWrKlXUvIdW{B7PEk2U
zMx(PMkYV9b)`i^5hFKfD0*l*|!#hWaT<Rx2gqD}wHJRL8TBPCcNr8dgm&XQLa;iN@
zk3OBrqqkFYG0petLFF4IdMr_5a*_IXHZEdCTP2f+cX8cU^LCV`{MIvuW47YiJa;U3
zehd}9!;C@$K+4sI*j%)VwEXV&r?M|zp6(qgU3=BTaQ=B@7xs3ytv~@9&zIxeYZ4@m
z<f5r)^e2RSdw&r5PM!(!-j^u;AerPr$l)CFAL1L;YSe{U>$aLvZ`8`VBz~e5*l9Gi
zwI{FhjQHT<)<^vO=<}`A9+Qg|xLi1F^iY~FQqu@&nn{uS^DceAUWxb93}5ZcrcBEi
z3QcpUhbedeh({d{d;dP^tD*EsHl|+}trF;&6$c%k|J=K38e=@%o-V?sx*Xlz)ZUI%
zcX-hgmM2Ole_7(9%21^n+^VP(tTU8_<$KDWHqAM9%KO)tJKCw;{pg3u^?2<13R83o
zA7m)Lia@gRUl6*pJmeM0<#-u*nl$e?^%ikVn^#HvnanaNpAjz-Db%`z%;Vxe$&HN8
ze77FOr4i<lYB@JMxSFH!;6bS8g$tZ@Rd{wOqG0vKSez<a&o@^hH7PDeG|w#FLm|S@
zGb2k%%x}*d-;Llj+0r@w=2~tuUrp7w`pRn4wnzes+mJ=aGkK|N2RjfP(3HGYOL?^a
zY(!3AF=#B~3(UpE#k?mTR7Q!~#Z%U}V-^#0EgmtD_o~J0jy(62t<PELIr?qBBnP*9
zcbk`X+Kk9QrY)^_aQMMiX+bUPke?E1OkcqmAH$*TZymp$9WBAQ%TcmgwO{RzFWwZ!
zxe{~W=7p{e;*-*Cpu_EPk`%Qx%2PU+G+<lVDm{>MB#PC<_toF&^Zvt-BuW51y+--I
zVk1;N@8vzr$A~WoKH)8S2b^q}p5T+*gK0UjVej6JWgfRxHUBQ$MLklbXtn-%?a}N)
z@m_@n&So^-#m#WU^@gP52}Ap4@S4G9wk)le7RpPeP}{yU=&QTm=Aw^0iK$q`tkz_#
zm*659j;$`@?zo1AVQg>iT5sR!^Ke(NRS|jBXX&``&_IvMB4|-0IzP9Dys>{_4P%4>
z<#qINww9Kb&|Ov(h*Yk2e4)84b;bM5w)D`)NTI*Vc>E`op`<)C4XBu;s1rI+iMy2U
zTKSJ!qf>U*2imE`WMmBM>gxVn4}`F?8_0k4r@yt2Gz_{vsLI)87Pt<-%Gil$*e+cf
z`;>HhZSE3ZB+9ssC=M8eK)ojo($I45_D*kE2owPP<G4n*jo24|@|v>{+7U#eG(~Ub
z6Olt#VTj3RrB&4SITR$I(fuxPKyAy|k0S7i+d_<paCFoC5=S<CKXZNrWf3(^H4JA$
z3np-6i&D_MW|P)cm0Bhqt3&PFGa*3gIByGaTBR4s^cg}=)f+-&_<U(JfTjnea#Na`
z6dBG!iA!5iF_<}uim@$L9L;bJ#?`L}Ryx#8Gr`DSC1P%A6s>wKXQlm`5l}Aa!eqRl
zpx^^;8W>Z0;W-&)c7lN+?b)-Vxb5-*(zZhc?o#8t6K4@+NM6Yg1jY@ZY(}=Rxmm6l
z7{un84ojf~wP$naILyq-(zt&=sdDM99Cas<OD$5?ZM>izJ1Vmdd&+lwsXjpD#0H2c
zn*$pjuTYu&*mY=(fKrSS2)m&{sxQ4QPO@^z7=frYyzo_%5H3IgO`f$KcfC7-cY(~-
z6<~gXwOsl_g8}lVF@=1`2}K+bk0ARnAgi7M%x=iZ+3-2HWwjY<*pglwB14WkU@2FQ
z6;t=yLMI5pC>jG(Q5fk|dqUp$Ye|*;ovCZxIeMb?0hKl>(}X0Fbt&NqbLwOWC0Fw!
zD2k}**c`snMT<M7e$WA~8fc=|*Qy8BFsq;G>YnR;W<%nBetyVudp-`+ey~1pdrOHq
z7j*RXvq2MF(QU{jf|8~UymQK*Q8>uS5WyQPFE1~azH18b>O4|UU=__9@%VfB7rzjp
z(`$_U=NX}55H0DJJLe1iiL-s5)55RZOM+{7?!6Lkr_ufvvX4t&<c4{Gur&mbweg%C
zKY#u_ezc{vwR^fVd2MH<y|N>biiVm+tV4^9<(h9*y!Y&Fm&L)p-HZJr3L=EQKT(=&
zBg${d+>+*q$uUCF=^>(pn~4PlollS0nA^8R3PcNAX)6`y96oaN`%yFAs-^2gURV^A
zII}2w-4B0Vze=fqCzQ0Vd5n`Z*Nfb2y~FA_&7NBT!0|FDhzA^{>WUS25_0%;LphRP
zmYtoQSL)V8-Gb<p3W2BXUB>s)RbA#Gc)@uEKF+yf9>5Qy=uALNm8ufge?0O>ON+Bs
zDYeuR0^ih;%M=mkJXhPw=3jdO&Q9KmCExw|-}u4b%Cp5os<&^eL%|P(+;Zh#o|^F|
zW$VED?R(+$eqa+$-Y3ui>c4&wn2Aw2Wa9*@;{ER)GbCN+=0<~%a3&~PL26Ns^3)YI
zUEOG)A|EurwlR7n&c2@9Hi1@IQWx<I7INSMZ25)lKR6uH#if`HicAK6yK9g!*SdZC
z1&|vTdv7{oCYkN3K7uOyz`{ypsd9@xApzV<HMm-MzortP9|jJw^AzrNkrfpZ(#v1z
zbNjV{7aF|x2^N;@wK+`l(PK6plVG6gw{AVpx-mU9b!q#b#gTaOn2Nf;b<ei%?LYTC
z^se<iP5oS0h)-}nrDUkElG&cW3R)d43j^C5IZh|42()G+B*A0$QZqbdC-5P#P32lj
zx_$@LN?WDGLXo=dbErl;$i~1y=LTzI(6{%8#=TE~3XtELvwn9EPkzC>Hvb+X!(uJ3
zmS;zR27=SAUt7O;tPV(_Ef)vNnFJp^H}u*SUc+KWb{qO$lF>+T5n>5XjKjxLX_Q~`
z3Hr?Siyaa-@PaQh;HaJDSon<}1F3f!Bnev+u8pw9fHKc(sXw<$M<gQA!;@d(DUGqG
z^4ZP!ru8*6lELX4;#&aaZo|%l3iRE(clDny{d&pQ!wTF6wnG)_4_&an){)W&yG2&T
z+8Vi#@H&D=h-_ZuF!)7=q5|3aBh+Gu=5QV~C}~5Y4CK0yAbDs#+F)Dai8=p9Dhd2K
z2{Cb5ehAe}K7NlD<ZJiB`)2*uOI!Ei4P5&k@=BTewF6VsAXXb}my$*$Ug{qXKbYiF
zD?$Y|1uQ(|I8BIu%=-3Yia@=tF_weh3hx##l2lm+hJ}TB0&$niLNTU-Um0))u+)V?
z5BB`Lb(~Ajy=Wne_g!eTf#k4HjCE)L{;%=Unj5%uxZ?Imu~uJipVx1PBo8nDv`>Ek
zp7!Up^tz5){0M(zEum>EXFPc}t9bz<7okV&h$q%1wXm+81k~g9rMac$=g#KJ!z_0m
zo%~u>FL+|mQf9<Y++-S-I5Kos_M<HYPZ6(E`}fr7WohSh$<auEf^uZzE*l32hed0&
zaG~rp^j3v12`kb_Ej@-_LYCK5Y=0_?-J~wH985yyFMT_4{3uyWi{Qq>ZKZ;k$u2|I
zfw?kQv|uL>QKjbNni_*9RHO5{ReX$*6PE4B_Z$5whuR-i>W8BqsY&^Hwcf?9zxb2A
zu+Gstezf*#aU+jKPy%iHgCL`NYH5Gg&7Ixo65m!7tLI_Ho!k@VtPS_7+zV{0mKC5G
z>)TUO8`?`CkVZvC1+f@Lp26S~IsHXW&{Lr5WTPP?>ka!dR9(G3S(AeDShPtvb)`Sp
zIUQ@0Mco!DAP3WMMKJ+6B9SpMb6jco_I*<kF)`agF?pb%^;}frZZ&qxtS#B0ww>wc
zi5mzfpHFwy#g&(fh`Lp+p(IWH+}0|uPF{~WKG(OGK-81Io2P!0nY~@}rk+4Ur6h^#
z<VbUywU<{*|A2dm8TH`G9Em%%FN&S#YzG@j$-14FRi4!wrw4Zykj6J<kdlQtIdlWv
zyEd(nu4}@2R{6ykoBKPgqKL8=KkNx=1t5$u0CFcaH8rOpae~=c9v?z%0TO5aUeHZ8
z)fzMPy6^GFocWWCjMGoV*Ar`MY9t%~!N$oXx}<RsuI7O3pl<1~XV%<BX=wwc@GI|j
zSACOZK$JDy-b79=nOtH8R4p-qfD3_h;_v@4#sJ0}bm>_Q{Qr5=|JD{c-$|4sCt>8b
zTg+QFO2ngEbgQHS198<)0C_n^HHIaEV<{1anO1qIo~N!?f>D_E_IA{|`Gt$X>Rx##
z(WR_!Q8h+H8T?i?zMcJgD_qJz9IXN30w9!-1v1QCTIvhkSrNJ;mCZ-*+$4lRYE@_f
zJkzUL9BkTnkf}#vJ>6g{a!f~4^Ai}1CVuu-vIq2fc?>Ev*PS4-vDkaHT`CzaN<DRT
z^+m5a+9b(;PIrC?k<AyslKRA59?zvZQUj%!EuJmtzs~?V=2A@sj*hC3X?;Q*-V545
zYh7u;bd*p~N9KITzho>9WU;J(s5_U!WPfkhfTSLTB7}v6%qN<{m}I=m@VC_$YRMMm
zNXtN0r=iorL<_QsE@XY$Qa+$?vo<iY*Fy#C?+f`j4dCNeR8rEqdpF5pykVwdE>{D9
zL}lvQ?t+QTD?+T#v>U~Mr~Gox;s~%U<3ZfrL>F2-)r{)3-J**svD3M&-@mKDEdb)Y
z;BO~h4>_ZiD<HJ}2?AL-)W-tZJ>R|D=&_5Eqi4Y%c3d&`vzwp9VzDxKA!y{TbAORV
z@QWAfP^K$(UC`yYaKU`I%40G5vPP;oz;aDiXC^|Bpf(;P2JKZ1?oART`Ybx)U(!u>
zZGXqfz~S3T-dfXuCnXdnK0YY8ib5exps)k?=4=sKMZ?*-XxlbG*4NjUn0%nlQ;?Xr
zKL#-{63L+yJ`IYM-EnTiGtVr)G&M)?A=~4niy^Rbn{VRI`zegkA17*AN6h7au6#@=
zKZY=-IS#f<%5zbJFfz<S%sp0daCl+pG4XJBjK<IY%K|1Zfr5epf8g+8V0We#-ac%r
zHy;6lx+5zqyI9d<Q-tvl<OSOoCb9_#07a!vJv&qiSVQ^YRqTjSN=nKi?)=%a2&D*K
zEwBxIahVlJI}01hE@7jKlNb(g5qRIxi^4<hylW_eCgK%>7^rQp@>p5zkfSNLG&#i%
zehEN>2H;txlziZcK$PhA9wucO<)SUIG0m$pO(HuxO5DG9w6|j!7%<bb@~U-#!!&sA
zL|WuDBS<Q8va`zqCbq|c?wTLkV=68UdbY~2#P2-_<*JSCAO%)dnk}?)u+SsCRsRdb
zTqb@D8<g<g2<^=->&8~<KwS^2Q<^ZkitjD~ydXM@m$qk;bj=33+aX*Ddy=c5@G}s(
zk-VJ<ZM(|KA^6yQ$Zvml3$h9Nc_M+<+>s^J)P^9|o!dW?C>t;+oa5)`+NEYea0J^N
zi4PRJ9r+mv>;u3+I&*V#H3Z^u%o4<2t9YSyExOO7*0kvr75#CP<mA8@^Kx(xj5P!A
z+CYGD(Q82Mo#c18I_3q4Z1x)#unjFySJwc2%ylD;Tvl4(6hpo5zNu-k=b9yG?Y3$0
zpdg7P405gDr!#CMy^hh+6Es*~SqLNe4mm)c<nPzaKlhLE6nPQVT5sa0Q@eB;9>KWu
z*ZBE?>$nWE^(2oW*!}eyf}Q}0-Bom0Z0tM?u|WdlM|CfRAf}Y=e(1fuJ==33${|~0
z+h<lmo_Odf>4GdXOOZ+4=%{gD(-SZ?Ck#XtpC@r9MZbPYY%U5<?d&dKiE5~*0|_0>
z-Yl32Sk!86eLx@`a>#%EGIWFI;O~ZBJO~pVcK<@vt9_y9WCIASXliMt03Vav4&*#K
zfibG<_=O@;ALxKwALIZ(h9Es|&didXmj?yp&#T}z%>VrUVS8~MmsnWXwfm@d_6cy8
zFK*xgJS<P?1TJv_t4Mm^IGx~KNKFrh{)N+mFwhvqQ1sTmK{{ju4-cLv9N(*}94FB&
zY{Pv#_ugj(kZR-N<g{l$=T)zLg+<!42uh6ug2eT5JSXPQb}W+gA0@T2vRcE3D^D2=
zJK)+JZ%6>a1Fu0tW;V8eg1K>6jO4a!``*ZR9c=ki5BFA_v`B~WFHQhgc;!Gw7v(w=
zCH7amykCRz3hB(^!X2vij4HW`x<hGWVWD)n2pz7Sb+$B|g7}*fk*v_q8_&<YB26~>
z`ZdyAig@k9ed-sTd<~3_qsI4xgOkV^EXaeO^Mv(3Gn_eT9u;2Fv3;^lYOc(1B&rRO
zwlLt4w&NPr=aq+A@3-1tALfYO@c@M%#N$K$TPLO&F9a)^g8R93ZKIB+3(nP_Pv>uy
zfnpoWIZGQGWv})59}BoaC)KTavuiN{H#nYi-qJ~E@5?3&M0h6@gkoJl2Xj->Z`6<N
z7R??uV6*r4j}Pc~=WqU52d~ftU85`Oa89GDcP9AKnt3a)VBK~q&x>wBy7w^nf`1<4
zfBxW}KuJbh-EMTKRQ15mq$B-bn<PTJathvWiQg*o-uxrAKz3YVG`*lefK|-?ENW{u
zt9%#6nt(CPRj&dDS<sLmcGM&1lGiHSFl9$1nh{I*4hXyi{_Ru{bZ?(AyS9DL6X+ZN
zeAU&}b+qT-qG1usKhCn#6;U1fYYO^YR3RX2_Zi>jW&b(|@}hr#dRSJ(DcZBE=l=3$
z_$9~xwV%a^#(Z_+ka+JuKUN_Tb1g@w;9R@(69x4Q{>%^ZZ_R<sv3&Qn<RZkzzFrl7
znz%KboSY_Pl2sFAYy|2{&QKmEGE+z#FJ(avRe3mhLR&6c6_Sia4}QFtdPjEj=Giju
zWM&cT?+b2&4qjVt_RFsNwL=tA-dY-adIxlL4_JEV%aDKI2s!fCZTXLfU%SvD;C(_C
zI*b@n6Lx-In&I=?REnPsy{yqy7eMO7QJ5}O=DN^7=-aJ@Op(M^UB%~aEPj1`5jGIK
zq<)1fLhF__tym7xL?w?&E#nRpRA&HGE5e|KdByf(B{wEU!o{*5gvzLi&PaO-1yPQV
zVyf4RSD*5Ev*QEo1+HN2H}_6|JxXBtB@Z92cV%(?n{EB)4$K-P62DiRw!<wB&ER!g
zEB5!c(eT5Z)Gp+x(x%-umd02VxMb_aHiodi(4>Y|wwP>*$^hHK@tIOwct~AC7F&og
z8yf`a!8AymrEIQDrIDWT<~KTDT?b%fV$=@U#`;Ta^gN*!uu@>>GpA<(z|W#5`(D`F
zyx@Se9rI%c?n6~OF)`VQ8O`7VAgKd3tL>Ek@hxuI`gAGAu}?;Oe<Ef8y?a!*LVLrf
z$;n9;6(%uzV^0XQyMR^hPXT}=VIR;+QH4T)3)3}U@24rm34!F?7evTn-y$|IX4S-{
zi<CiSrO3GM$*R%*T0qI;(RHaF2wFpvMhZ+D9pAbEUJtVx-2UQ)Ru&xzO;t@Ww4i6n
zR_i_R8OfZLAV;XDF98l5{~B==Rp_4nH1v7wkUQ5@HE!CIR?OotcJjx7_-E8(w+vJe
zYU}utZx3dLpBaC;#43qZrfSSoA7*Qa<K{ijEvA-|#r~GmyRO7>%l-HCyCUztKdUfe
zAmfAe8p#^m{h6WRBwr7?<f)R`%)n0UhlHI6(E_Fl!CdAKXWsFT-IfRy*P|EvKs2%a
z(kk4Jza;tnC?#Lj+nO)Or$g2)(5Vwx{;h`cxt^StlP5-|L~Ax%SC`-TNf`i9b~%qP
zIkh&YHSM&A|KiT}%+OZ#K*8eR#0*o~R<uD#pO)8Jd2#Pz#$3-Y!&g!7r|#|B`I~9(
zx2Ko3c1U&)#7Azfe?suoMCiWu5qz{JlJKFNbSk#uF>drHRR|)HjYMU2K&I1o&Hc@!
zW(`r=3Q8i*H12tCRQ2$SmYF*^arFTD1<a2f5;95I&Kn1q1Q>kBHnHN{42iErFqOah
z`-5ugnceA|7T``cQz4j%Ja@x=b-Gi3(;A(sJX7m`WV06()kBj6#~?p_SM$~!CeMiE
z9BEYlo|3N5R{Xr5a+Y8y6%k4|(c8*_zI#MZ6Q^HrUp`j^h)?##ic3l+w_}AY?pm6g
zr)v_0bQqIQ4Z9B5%s>aJ>Swcdm8p0y+eM>>JT}QQOD_*_Ip8G|2Z)FQhb}sSyw^dF
z2O&-Ad`hOj!1ShWmAk`MtDWx$-{qG^nyDjQUGJ$`B{az?!rz)WZ!{sR-^;*-kVfOT
z@x=m4Lm8?Gex#&I8<*<?mm9B-S~GBtXbqaV<YPgWwmf(gs$2<x6UJ7*(yMB6LL=Jy
zEGh+B(dvY|HvAGdy4yFZffhRIC^buD`{fa>wT-YkYXWXPHWUEj?E>)^1m1O+L~-=;
z6D5uv1}#!#u6~r93N(5cdG4-ZR%~uOErJrm?|co-OF*_`*AGfd6Q^pHL+n05vReRh
zVBA3elG??_%(1HJ6X(i0PdlALG{GD^gACfDJ|hzgtxU0dd$^i3NCgN%inYcuNWJ`O
z^;0p?>Wo>61kn+1r)W_-Lnyx3M)R9opNQRf=6&rXHS<BMe#jrqbr#{SD^8_wu*Ipp
zA>ts@Vtw+DuN!;H&;@x?N2oiM1(6BMPZSkfVYIJ5>D-IMdS5btykEIve{X?laz-H;
zJshUh>;4-m_b<=QVkh7xuo!O$*^GI?6#yAN#02#vFj$y`3q6-O(9!W03O;WG0#d$6
z;|4#-tYxUCoWA<#Q)+5zS8NS;T^&Ub)xpN24BphL-cs$rPaN|1Ji#ejKihGaI2j!D
zhj@?4D13C6f>**0%P1`>(!8!hcTvCCQforT+IxFoL<N7YocOuw13S~MgjuD?T;4}(
zhqYc$942n^Vp_?hKGxt%eE7T&j5_e8l2D%d1Y>>IqE`fccQ%Bar#nuJsCuh5zGhW|
z6UP^XW~kZt<_z~l3U_Xqp!`Uo=JgVv0j_|CAQSe3+&>v@dIlt5ls%|a2<%NB5r>!-
zYc#&QrAvtq6&kO*q*<|j4Qng91__AYZ#7rnB#r_^8(`g^Mb<<ETB;C&kXp#3KJaI6
zZ||ZzhgkQilHl5~rwCQDuU==Ava<q;9`aVYE;Py3rnhZEc$GG?yXZEdMomP`CM6bh
zbX@YeKu?YyQrs7sI6pz#15az5q^N=S@;8gx$A>p{HhUy04JRHPY;%W+gy}%Hj66#g
za&`y3z2{2=ax4`%#)_=_3XAN=>Q}#<*~@p71dL<R_35_w9mWv4Pr<ZW<YWp1(0=j$
z+#Q#`hY=HJyVKQ^`=1_d7EaDn)8f>zysWlctws81JQ~KTRX`F!8Kz%ax<$|PGh%)2
zC3zYLnk3g76PuZ4LtUqwMFsEFRwi4OpjqX%Mw*JU+_PgDEZieE8m+V?2;73S>E*Ch
ztuG7?-YG<4DOqTuR%0zXoJX$<4@co1u6G{s*&kYTg;|MkIW4;I;FYA{F_4NeoT0aY
zLMaBVg)|5QA*gp*Wso1qc9arnaxv9Q<Ueuc5;raO?v;l_%LcD;&R}QdO`}~YN@$3c
zW7s^WKe|S|d~B^r^QxMT>DAIGh_7+`<W_IZI)j;{TIH5sR8EkQ78Vsnz7BKi^U`N8
zfWY?v-#o1jSc`4K&4JL_Iys%~sT-Jl?hfP0e*DpL#-eZ~F?%3Nqfc%q|Cp-*l);oM
zW$+#2xhn2}2UEkt!-ZVud!h3CGgoy!bgr?4Uz<}$f+F;-@x8|7*Zy_p1LaO;p1>yH
z7*_Y~<*Bqyns!y_y0K(wY6j1a4kV}l<NE5PDG2sT{uA`fzUvw+cXE2zde_1puw9s`
zgUXJ(DjxkDXk;$u&mwe0-_+kY_#?!#>WP8L_iek!vd!%vR^ryqzSR!XFP^{O-R#28
zhBoos;Ix8k$m7}*Er&$_$mnNO%v?VA$0uX#{;{SrJENp%e82=cDP0{O<p$PX#Laqq
zbuS2Y8D5^tW_a#)HoP#`_e^u^%_SkC06N-NOS9135D5w!8LRb_e4)G^tYh6`*R~qH
zoZ)6Kg0h&aPg2w9C7I<HtMA@;Uyv8mPN{R1A^?U_*8!s;r7nH|rP+hFIi1vhme#0o
zsVBy+ItutC6CjQ8{uHl%r0-gmQE|*4(5^-UoZt@Y|1}yf?bQVyU|?;#w^1fMw_-L^
zF_HiJ^YaR?Zo%<f*!rfj=B*f+pZ#Vo`y+;|sCxw@%J!)#8oq9?E`0c<+V~K1#4{nH
z!?$9L`eL>7bmPK#4Wilnc9vHm1S_4BfCIim9kyh`@+xucHLGO*TIF1B<z3CwJGG=T
zZ?lers;Bnr2prF_0QTO~ZwH47iMb@8z_Ya+$#Q^cgY!Y4D0ciJxgOzEDw_g39ii*9
z=wWks5hyeknRh0w_L{y)fo#7FwN^NI(@#+DpP;bsWE@}UFXj%a<BIDSiH?r$f=r=f
zqCKR6FF$z>lTU_BBGx*yBQ<_5m@0$oh7$;K&oCE@(p(z<*X`Vox&>l&A2FT0GS2#<
z!y-^CdF!F(sU7fbY89G29QjOC6Mc<d<q%&eCiHF$PRT^%f^|E?iJ9aINWS?dclFKq
zLtg=f)0g^r4!qP46QSf_$DwZanb3}#`jg%Jc6_ewiMD#2J-|irrDFHxU#pOf7r`P&
z?h;cZHyNMiehs1aXjv_?$jI>r$4s<U?(M6OT5dTElQ8JNRd~%36&(|UhBQD@vx5@(
z6Rk6x{`rNuGLN=b$uzIE&n_^cvJ#C~2TJXX^mOdaENzCuNBqf>dG$)J;L!{E#WycC
zR?ZMJCeyE8NR&PVk~7bkZNK~1;oZaHj)R4o>9*S>4AHlxIj{2~-#m;t$bJE2?%}t4
z|8x{Pf$ip_Pp6(+n;Fn9&sk8tcP@6Vf!Xf2S}*?Q#2Y*yMU2HjNlzC?9{ALlBmO?y
zt2W&1IIJ9GOO!ztZqMyYP06_%VrFfzLU2du-?ps}Brm@^22@y1#r0&DT#G}E_3lOZ
zcGuO<E;#P&RxeI>JM7;ea;G~!gz|C&aUQP$$$TE0-h6h*Q1U_%M+lia-%=K+yi)Kz
zw*+<O<{LI;D@?8p10rM`THciDn07jXWJ00sBf8<unS_xb@5LJ5Z&l5Mst?+_r~08o
z<DeBuw*$w$<ty_D)L#!;5&KhQnxsV%+HsPu^E&<DaH&ahb&I)>QC`qYgoXs3+hE*H
z&V0ze8iaje+y(?E?(8~9ZbPM>vIM!mmXF||s`7a>#Uuc?ipb~lbDaVd$B&empC6np
zne|Gy#WG%*FEbh{6}5>#7(_WW?vgD`n49aR)ZlahPDBE-4^42=O!i*uMmiZUO+*;A
zwdZ7IJ^^w>8!v5Bt}v2jmS1uBCM@bC*Q#|hnUyH#ZzqwTqHNlI9QCy7kKf2yMD7BO
zTGm7B{|rI@axB_pU@1Ohqbkl5xWpt*akA&@xSbph4tCC~+4Iz`@%0H-8~gLH8EyLJ
zS~!Srdk)6QPt=heUZ2D8A>X|eNNzIOxuL_8$?96H54~08Tn4Y`WQ)^P7(N!Sv`O+o
z(<`T)sEEj9K_&CCZ0Zabm)+U*#n(nYi<LGEShqR)#-_FAE!0-TINc=W98f@hg6z|j
z<r5ROc6-3d;+$pRhV<{*LneHpXuOAxnrh`Ze~8D|LDQXdiPKoQ#tGo|`{#~{(09CT
zX<>1DndN2(Q`oO47ybLM3%-^Op&DPC_FX#IM5d)7E<;V-i@JP}fgm2&-s4mwvVCYk
z^q{+x>EzM#$I8G#vMB0Ry4nC4sl0BPy$N_e4e)i+kLDwVoWFM{PE?S+l7D=qK?XAK
zxzBK5C@gM<jnD8QPMqJ~rUhJM_<WHC43$~@{{GIR=Ho|pD!`UV!FlkS)!M|P_qVNe
zlI|Pt1nOzhz6$m$c%4AzSiRPxSDrKq*Xy5kAeTqK=TI76>p4GtTDH|bliIuC^P2>4
zkg4g4y?ugkJe^_e5#)=~(q8gba0Zc_pBA_7%~v_%PZSV$+4B5>Yf`n3Pt5qW53(L?
zPGmm|5ah?hU63co71Q~-(0Ke&UT;8583FfLyzkZwFP6XFjLw*Qyun4WmcNINe-O?+
z^%Ym~TiyOE?Pmr~1vAG4Jfjn2k@0qCt0^xRM}B$PVG=lTP73q$XQ<qBb#}holl~22
z+C<Nf96k1Zpz~Ctq(Oi5faUZ=t$|si5-p#1lWN9s#*Y=f!{A!?#G(0=np|N3IwDt8
zHK|{X8bh9&+U(i4KNHQ8m6~ZbU{1|p%;RkLUu>s~yk00%koue(u4h}$fe$(H&|SRj
zG<zGQbW<iL+rB)(Rt=p(SZ~uS>E|g`=JKY;9q2$1quD2E&q`UH$zeWtO=-pSh|f8n
zy7q8}>w@e2LW%w0u#W}!S3Cyz&R*OaBRZAo3Plek5HP%RItjf7y@?v+hZKSw<L;vP
z`_EZ3IK6Pu92<aKn@~cRpmlEt@c7Elz(7x{7S(xcom^J-FNFp@4h4}K0xw+p-nbAS
z!Oi!52zU!^CK4&-VIR)3oUUsYOwfs#YpnWJQ9vDmKWO~Fpr5LFCN9?wwbmo_uqpH>
zWE#%7Gs@Pv9|b7$-K4oqC3r5BBbPzxUWBXF!JgwVkv!bCw{!>?4DGZ$5uG9T;S#|G
zvSOE#8`IY9!_wmVjCJ+tC8dy+ViD8_fZSjBP-zSDF1>vjjm6Lh!xc1;$xW(|R;ECX
zaf#LIdt+~~`C?C<o&Sk1U0K!yEJVKkCjTUh(<_(0MRV<SB{jZv({1RX+`Ke-=Hm}w
zk*%HzO;e4Df7BBD4w@S4^>5qb&mK&^h;yEX$?^bFx6>zH)itx+uM8w^mgv9o7vK3`
z*mxK+eM_i776Sg{Y=;uDVq$)_X+NEqS82yR;_-9eaR7uT&yGMPX2q5Kv_h>NwC`@3
z;nUxlMs8xD@c5n^CoC+Sg3sxV8b)bko8~_BO+mdf>Tlkw%xM;z7&bLP8RVX{p=)`0
z)_4#HxlYG#_4MS#+D3lhcr2iKv)pqua;4$Z*!gEuZ;b;_o`29cI2bGU67CRXsv}Hy
zM`YrHBu!gp%Nu-e2AO|8FdTrF7ds6X#RqjK>Vy5^A%DXQYOJ5Q(Y#|-g}e)KIZ#7*
z`^A;6@TKwCN4X%!-u&WX;RT>tBwd0lBbu8@VFY?xxNQc@1b|nj?DN=cA^hxM(G+_5
za*z6H{wHtfXj#M^A29LTBP7heirduHc3L3x82MknVH7wAO%%WFA7qbM&0M*l(<c7T
zOl?b-pq;&jIMl6Z71$aMJhS%U<j$vfuax!<DY~n7^EJF|^4-Q^RUtrb3)@SQ<~psQ
z7f3Viu6g*?Y!Dsd)jAnlLxK6ry@%O?HG*k{BLdD0+dkXtttY9W-yTVh6BZHqVRn=H
z&>>Qj+c#u2foD$>aix*;7~|UjKf2>r7SvfCMr-{uG72uQ&5iIO55L;GRPnW{X|PGW
z+bMgPw=su67J%%hE*!0%`UZkV*G!_wpPMaN8Mhd?AR$@9HXuPs67Hc*N|aUF>_G6~
zu0b1t4vlIZ%YRw<Uw()sA!0r9j1^Z|@lE&Wl8QTZhH9{1)7@tAFe`#*KD`+BBIjwy
z!8NV}vmgKU6rPAgI~sj72cb10WYG9;@MnT*TMuLJ5~0)mU*Gum9}+LYwdi$yNcjKa
zK@cGT(5;SHyAyJy|K=Gx=mD`ve_V|IH=iS5{)of|_#MJWMWhHE@_+Zgrpduk#H+a}
z|6ja|nkoDarX$Sp2cA?yZ}A`Jdo>V&rJ}7y)9ag!3D0#G7*4sIswT3<=cm);M>Y3`
zWx||Pn}1VXPozAIeZ;^YO}?X4E9&T4MG-&Vx6Cp(!&{}Xwkp)ZL0t7=I3WJS(%#yq
zYAf8u!y}4Qs#)>+vlhH@R&nLpr_9>=!yqH63Y8J*4O^d)1s%7=9p?}YpVr)l`ApQ-
zpsqFUr;C*XU&HFY#_BV-T2Tyh{9SBxvRkH`G~efid;Yq<e8nu=4}Q+t$Xs%wX%lxj
zjIGOHX7Wc!Q^Zb}`XuenF0-{}_>!nhdAUe5O3)Qt^+C}`p`#X^l8#>L&-<{6^GLIq
z`D8%<FMHF$>c3%x@u_fnQvJU$3jcnJ)nSUjViy64|M~l-;~y^><EmB(L{|TLY%O`g
zi#Xk9_}4%G`%(J4V>UB{+qEU8^4$M?n*Y_W{69!S{{74U+q%VifKgtxTMYhhfA;Sj
z%)dTz;w1inU2^@`KmWI1{@=dHeiEETdsR92!S&I9yS)C<c*hspOY(0&dGM3gMlk@s
rU75_i^}l)ge>u4SZwzE~|Ikg&^t+Ag?`#jjKey#oZscA!e)9hTE?}VK

literal 0
HcmV?d00001

diff --git a/fluss-rust/docs/creating-a-release.md b/fluss-rust/docs/creating-a-release.md
new file mode 100644
index 0000000000..95714d9824
--- /dev/null
+++ b/fluss-rust/docs/creating-a-release.md
@@ -0,0 +1,453 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# Creating a Fluss Rust Client Release
+
+This document describes in detail how to create a release of the **Fluss clients** (fluss-rust, fluss-python, fluss-cpp) from the [fluss-rust](https://github.com/apache/fluss-rust) repository. It is based on the [Creating a Fluss Release](https://fluss.apache.org/community/how-to-release/creating-a-fluss-release/) guide of the Apache Fluss project and the [release guide of Apache OpenDAL](https://nightlies.apache.org/opendal/opendal-docs-stable/community/release/). A release consists of source archives plus packages that CI publishes to crates.io and PyPI.
+
+Publishing software has legal consequences. This guide complements the foundation-wide [Product Release Policy](https://www.apache.org/legal/release-policy.html) and [Release Distribution Policy](https://infra.apache.org/release-distribution.html).
+
+## Overview
+
+![Release process overview](assets/release-guide.png)
+
+The release process consists of:
+
+1. [Decide to release](#decide-to-release)
+2. [Prepare for the release](#prepare-for-the-release)
+3. [Build a release candidate](#build-a-release-candidate)
+4. [Vote on the release candidate](#vote-on-the-release-candidate)
+5. [If necessary, fix any issues and go back to step 3](#fix-any-issues)
+6. [Finalize the release](#finalize-the-release)
+7. [Promote the release](#promote-the-release)
+
+## Decide to release
+
+Deciding to release and selecting a Release Manager is the first step. This is a consensus-based decision of the community.
+
+Anybody can propose a release (e.g. on the dev mailing list), giving a short rationale and nominating a committer as Release Manager (including themselves). Any objections should be resolved by consensus before starting.
+
+**Checklist to proceed**
+
+- [ ] Community agrees to release
+- [ ] A Release Manager is selected
+
+## Prepare for the release
+
+### 0. One-time Release Manager setup
+
+Before your first release, perform one-time configuration. See **[Release Manager Preparation](https://fluss.apache.org/community/how-to-release/release-manager-preparation/)** (GPG key, etc.). For fluss-rust you do **not** need Nexus/Maven; you only need GPG for signing the source archive and (optionally) git signing.
+
+**Checklist (one-time)**
+
+- [ ] GPG key set up and published to [KEYS](https://downloads.apache.org/incubator/fluss/KEYS) or Apache account
+- [ ] Git configured to use your GPG key for signing tags
+
+### 1. Install Rust (and optional: just)
+
+The release script (`just release` or `./scripts/release.sh`) uses `git archive` and `gpg`; building or verifying the project locally requires **Rust**. Install the [Rust toolchain](https://rustup.rs/) (the version should match [rust-toolchain.toml](https://github.com/apache/fluss-rust/blob/main/rust-toolchain.toml) in the repo). The dependency list script (`scripts/dependencies.py`) requires **Python 3.11+**.
+
+```bash
+rustc --version
+cargo --version
+```
+
+To use `just release`, install [just](https://github.com/casey/just) (e.g. `cargo install just` or your system package manager). If you prefer not to use just, run `./scripts/release.sh $RELEASE_VERSION` instead.
+
+### 2. Optional: Create a new Milestone in GitHub
+
+If the project uses GitHub milestones for release tracking, create a new milestone for the **next** version (e.g. `v0.2` if you are releasing `0.1.x`). This helps contributors target issues to the correct release.
+
+### 3. Optional: Triage release-blocking issues
+
+Check open issues that might block the release. Resolve, defer to the next milestone, or mark as blocker and do not proceed until they are fixed.
+
+### 4. Clone fluss-rust into a fresh workspace
+
+Use a clean clone to avoid local changes affecting the release.
+
+```bash
+git clone https://github.com/apache/fluss-rust.git
+cd fluss-rust
+```
+
+### 5. Set up environment variables
+
+Set these once and use them in all following commands. (Bash syntax.)
+
+```bash
+export RELEASE_VERSION="0.1.0"
+export RELEASE_TAG="v${RELEASE_VERSION}"
+export SVN_RELEASE_DIR="fluss-rust-${RELEASE_VERSION}"
+# Only set if there is a previous release (for compare link in DISCUSS / release notes)
+export LAST_VERSION="0.0.9"
+export NEXT_VERSION="0.2.0"
+```
+
+For the **first release** there is no previous version: leave `LAST_VERSION` unset and omit the compare link from the DISCUSS thread and the release notes.
+
+### 6. Generate dependencies list
+
+[ASF release policy](https://www.apache.org/legal/release-policy.html) requires that every release comply with [ASF licensing policy](https://www.apache.org/legal/resolved.html) and that an **audit be performed before a full release**. Generating and committing a dependency list (and using cargo-deny) documents third-party components and supports this requirement.
+
+Do this on `main` **before** creating the release branch. Then both the release branch (when created from `main`) and `main` will have the same dependency list.
+
+1. Download and set up [cargo-deny](https://embarkstudios.github.io/cargo-deny/cli/index.html) (see cargo-deny docs).
+2. Run the script to update the dependency list (requires **Python 3.11+** for the release tooling), then commit on `main`:
+
+```bash
+git checkout main
+git pull
+python3 scripts/dependencies.py generate
+# Bash: run  shopt -s globstar  before the next command so that ** also matches nested subdirectories
+git add **/DEPENDENCIES*.tsv
+git commit -m "chore: update dependency list for release ${RELEASE_VERSION}"
+git push origin main
+```
+
+To only check licenses (no file update): `python3 scripts/dependencies.py check`.
+
+### 7. Optional: Start a [DISCUSS] thread
+
+On [Fluss Discussions](https://github.com/apache/fluss-rust/discussions) or the dev list:
+
+- **Subject:** `[DISCUSS] Release Apache Fluss clients (fluss-rust, fluss-python, fluss-cpp) $RELEASE_VERSION`
+- **Body:** Short rationale; if there is a previous release, add compare link: `https://github.com/apache/fluss-rust/compare/v${LAST_VERSION}...main`. Ask for comments.
+
+### 8. Create a release branch
+
+From `main`, create a release branch. All release artifacts will be built from this branch. The tag (RC or release) is created later when building the release candidate.
+
+```bash
+git checkout main
+git pull
+git checkout -b release-${RELEASE_VERSION}
+git push origin release-${RELEASE_VERSION}
+```
+
+Do **not** create or push the release/RC tag yet; that happens in step 2 of [Build a release candidate](#build-a-release-candidate), before the source release artifacts are created.
+
+### 9. Bump version on main for the next development cycle
+
+So that `main` moves to the next version immediately after the release branch is cut, run the bump script and commit:
+
+```bash
+git checkout main
+git pull
+
+./scripts/bump-version.sh $RELEASE_VERSION $NEXT_VERSION
+
+git add Cargo.toml
+git commit -m "Bump version to ${NEXT_VERSION}"
+git push origin main
+```
+
+The script updates the root `Cargo.toml` (`[workspace.package]` and the `fluss-rs` entry under `[workspace.dependencies]`). `crates/fluss` and the bindings inherit `version` from the workspace.
+
+### 10. Optional: Create PRs for release blog and download page
+
+You can open a pull request in the **Apache Fluss** repository for the release blog (announcement). If the project website has a download page, also create a PR to add the new version there. **Do not merge these PRs until the release is finalized.**
+
+---
+
+**Checklist to proceed to the next step**
+
+- [ ] Rust (and optionally just) installed and on PATH
+- [ ] Python 3.11+ for dependency list script
+- [ ] No release-blocking issues (or triaged)
+- [ ] Environment variables set
+- [ ] Release branch created and pushed
+- [ ] Main branch bumped to `NEXT_VERSION` and pushed
+- [ ] Dependencies list generated and committed on main
+- [ ] (Optional) DISCUSS thread and/or tracking issue created
+- [ ] (Optional) PRs for blog and download page created but not merged
+
+## Build a release candidate
+
+Each release candidate is built from the release branch, signed, and staged to the dev area of dist.apache.org. If an RC fails the vote, fix issues and repeat this section with an incremented `RC_NUM` (see [Fix any issues](#fix-any-issues)).
+
+### 1. Set RC environment variables
+
+Set these when building a **release candidate**. Start with `RC_NUM=1`; if the vote fails and you build a new candidate, increment to `2`, then `3`, etc.
+
+```bash
+export RC_NUM="1"
+export RC_TAG="v${RELEASE_VERSION}-rc${RC_NUM}"
+export SVN_RC_DIR="fluss-rust-${RELEASE_VERSION}-rc${RC_NUM}"
+```
+
+For a **direct release** (no RC), skip these and use `RELEASE_TAG` and `SVN_RELEASE_DIR` from the Prepare step instead.
+
+### 2. Check out the release branch and create the tag
+
+Check out the release branch at the commit you want to release, create the signed tag, then push it. Use `RC_TAG` for a release candidate or `RELEASE_TAG` for a direct release. Pushing the tag triggers GitHub Actions (for an RC tag, fluss-python is published to TestPyPI).
+
+```bash
+git checkout release-${RELEASE_VERSION}
+git pull
+git tag -s $RC_TAG -m "${RC_TAG}"
+git push origin $RC_TAG
+```
+
+Check CI: [Actions](https://github.com/apache/fluss-rust/actions) (Release Rust, Release Python).
+
+### 3. Create source release artifacts
+
+From the repository root (on the release branch, at the commit you tagged):
+
+```bash
+just release $RELEASE_VERSION
+# Or: ./scripts/release.sh $RELEASE_VERSION
+```
+
+This creates under `dist/`:
+
+- `fluss-rust-${RELEASE_VERSION}.tar.gz`
+- `fluss-rust-${RELEASE_VERSION}.tar.gz.sha512`
+- `fluss-rust-${RELEASE_VERSION}.tar.gz.asc`
+
+Verify with: `gpg --verify dist/fluss-rust-${RELEASE_VERSION}.tar.gz.asc dist/fluss-rust-${RELEASE_VERSION}.tar.gz`
+
+### 4. Stage artifacts to SVN (dist.apache.org dev)
+
+From the **fluss-rust** repo root, check out the Fluss dev area and add the release artifacts.
+
+```bash
+svn checkout https://dist.apache.org/repos/dist/dev/incubator/fluss fluss-dist-dev --depth=immediates
+cd fluss-dist-dev
+mkdir $SVN_RC_DIR
+cp ../dist/fluss-rust-${RELEASE_VERSION}.* $SVN_RC_DIR/
+svn add $SVN_RC_DIR
+svn status
+svn commit -m "Add fluss-rust ${RELEASE_VERSION} RC${RC_NUM}"
+```
+
+Verify: [https://dist.apache.org/repos/dist/dev/incubator/fluss/](https://dist.apache.org/repos/dist/dev/incubator/fluss/)
+
+---
+
+**Checklist to proceed to the next step**
+
+- [ ] Source distribution built and signed under `dist/`
+- [ ] Artifacts staged to [dist.apache.org dev](https://dist.apache.org/repos/dist/dev/incubator/fluss/) under `$SVN_RC_DIR`
+- [ ] RC (or release) tag pushed to GitHub
+- [ ] CI for Release Rust / Release Python succeeded
+
+## Vote on the release candidate
+
+Share the release candidate for community review. If the project is in incubation, a [two-phase vote](https://incubator.apache.org/cookbook/#two_phase_vote_on_podling_releases) (Fluss community then Incubator PMC) may be required; otherwise one community vote is enough.
+
+### Fluss community vote
+
+Start the vote on the dev@ mailing list.
+
+**Subject:** `[VOTE] Release Apache Fluss clients (fluss-rust, fluss-python, fluss-cpp) ${RELEASE_VERSION} (RC${RC_NUM})`
+
+**Body template:**
+
+```
+Hi everyone,
+
+Please review and vote on release candidate #${RC_NUM} for Apache Fluss clients (fluss-rust, fluss-python, fluss-cpp) ${RELEASE_VERSION}.
+
+[ ] +1 Approve the release
+[ ] +0 No opinion
+[ ] -1 Do not approve (please provide specific comments)
+
+The release candidate (source distribution) is available at:
+* https://dist.apache.org/repos/dist/dev/incubator/fluss/$SVN_RC_DIR/
+
+KEYS for signature verification:
+* https://downloads.apache.org/incubator/fluss/KEYS
+
+Git tag:
+* https://github.com/apache/fluss-rust/releases/tag/$RC_TAG
+
+PyPI (release) / TestPyPI (RC):
+* https://pypi.org/project/pyfluss/
+* https://test.pypi.org/project/pyfluss/
+
+Please download, verify, and test. Verification steps: https://fluss.apache.org/community/how-to-release/verifying-a-fluss-release/ (adapt for the fluss-rust source tarball).
+
+The vote will be open for at least 72 hours. It is adopted by majority approval with at least 3 PPMC affirmative votes (or as per project policy).
+
+Thanks,
+Release Manager
+```
+
+If issues are found, cancel the vote and go to [Fix any issues](#fix-any-issues). If the vote passes, close it and tally the result in a follow-up:
+
+**Subject:** `[RESULT][VOTE] Release Apache Fluss clients (fluss-rust, fluss-python, fluss-cpp) ${RELEASE_VERSION} (RC${RC_NUM})`
+
+**Body:** Summarize binding and non-binding votes and link to the vote thread.
+
+### Incubator PMC vote (if applicable)
+
+If the project is in incubation, start a vote on general@incubator.apache.org after the Fluss community vote passes. Use the same structure: link to the community vote thread, release candidate URL, KEYS, tag, and ask IPMC to vote within 72 hours. Then send the result to the same list.
+
+---
+
+**Checklist to proceed to finalization**
+
+- [ ] Community vote passed (at least 3 binding +1, more +1 than -1)
+- [ ] (If incubating) Incubator PMC vote passed
+
+## Fix any issues
+
+If the vote revealed issues:
+
+1. Fix them on `main` (or the release branch) via normal PRs; cherry-pick fixes into the release branch as needed.
+2. Remove the old RC from dist.apache.org dev (optional but recommended):
+
+```bash
+svn checkout https://dist.apache.org/repos/dist/dev/incubator/fluss fluss-dist-dev --depth=immediates
+cd fluss-dist-dev
+svn remove $SVN_RC_DIR
+svn commit -m "Remove fluss-rust ${RELEASE_VERSION} RC${RC_NUM} (superseded)"
+```
+
+3. Increment `RC_NUM` (e.g. set `RC_NUM="2"`), recreate `RC_TAG` and `SVN_RC_DIR`, then go back to [Build a release candidate](#build-a-release-candidate) and repeat until a candidate is approved.
+
+**Checklist**
+
+- [ ] Issues resolved and changes merged/cherry-picked to the release branch
+- [ ] New RC built and voted on (or same RC re-voted if only minor fixes)
+
+## Finalize the release
+
+Once a release candidate has been approved, finalize the release.
+
+### 1. Push the release git tag (if the vote was on an RC)
+
+If the community voted on an RC tag, create and push the formal release tag so CI publishes to crates.io and PyPI:
+
+```bash
+git checkout $RC_TAG
+git tag -s $RELEASE_TAG -m "Release fluss-rust, fluss-python, fluss-cpp ${RELEASE_VERSION}"
+git push origin $RELEASE_TAG
+```
+
+### 2. Deploy source artifacts to the release repository
+
+Move the staged artifacts from dev to release:
+
+```bash
+svn mv -m "Release fluss-rust ${RELEASE_VERSION}" \
+  https://dist.apache.org/repos/dist/dev/incubator/fluss/$SVN_RC_DIR \
+  https://dist.apache.org/repos/dist/release/incubator/fluss/$SVN_RELEASE_DIR
+```
+
+(Only PPMC members may have write access to the release repository; if you get permission errors, ask on the mailing list.)
+
+### 3. Remove old RC(s) from dev (optional)
+
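+Step 2 already moved the approved RC directory out of dev. If directories from earlier, superseded RCs are still there, run `svn update` in the working copy and remove each one (set `SVN_RC_DIR` to the old directory name first):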
+
+```bash
+cd fluss-dist-dev
+svn remove $SVN_RC_DIR
+svn commit -m "Remove RC after release fluss-rust ${RELEASE_VERSION}"
+```
+
+### 4. Verify language artifacts
+
+- **fluss-rust:** [crates.io/crates/fluss-rs](https://crates.io/crates/fluss-rs) shows version `$RELEASE_VERSION`
+- **fluss-python:** [PyPI – pyfluss](https://pypi.org/project/pyfluss/) shows version `$RELEASE_VERSION`
+- **fluss-cpp:** Distributed via the source archive; no separate registry
+
+### 5. Create GitHub Release
+
+1. Go to [Releases → New release](https://github.com/apache/fluss-rust/releases/new).
+2. Choose tag `$RELEASE_TAG`.
+3. Set the target to the release branch `release-${RELEASE_VERSION}` (i.e., the branch/commit used to create `$RELEASE_TAG`).
+4. Click **Generate release notes**, then add: notable changes, breaking changes (if any) from component upgrade docs, **official download link** (source archive and verification), and install instructions for fluss-rust, fluss-python, fluss-cpp.
+   - **Download link:** `https://downloads.apache.org/incubator/fluss/fluss-rust-${RELEASE_VERSION}/` (or the project download page). In the release description, include checksums and GPG verification steps.
+5. Click **Publish release**.
+
+### 6. Update CHANGELOG.md on main
+
+Add an entry for `$RELEASE_VERSION` with the list of changes (use [Generate Release Note](generate-release-note.md) from the release tag). Commit and push to `main`.
+
+---
+
+**Checklist to proceed to promotion**
+
+- [ ] Release tag pushed; CI published to crates.io and PyPI
+- [ ] Source artifacts in [dist release](https://dist.apache.org/repos/dist/release/incubator/fluss/)
+- [ ] GitHub Release created
+- [ ] CHANGELOG.md updated on main
+
+## Promote the release
+
+### Merge website PRs
+
+Merge the pull requests for the release blog and download page that were created in [Prepare for the release](#10-optional-create-prs-for-release-blog-and-download-page).
+
+### Announce the release
+
+Wait at least 24 hours after finalizing, per [ASF release policy](https://www.apache.org/legal/release-policy.html#release-announcements).
+
+- Announce on the dev mailing list that the release is complete.
+- Announce on [Fluss Discussions – Announcements](https://github.com/apache/fluss-rust/discussions) (if that category exists).
+- Send the release announcement to **announce@apache.org**.
+
+Use the `@apache.org` email address and **plain text** for the body; otherwise the list may reject the message.
+
+**Subject:** `[ANNOUNCE] Release Apache Fluss clients (fluss-rust, fluss-python, fluss-cpp) ${RELEASE_VERSION}`
+
+**Body template:**
+
+```
+The Apache Fluss community is pleased to announce the release of Apache Fluss clients (fluss-rust, fluss-python, fluss-cpp) ${RELEASE_VERSION}.
+
+This release includes ...
+(Notable changes; link to CHANGELOG or release notes.)
+
+Download and verification:
+* https://downloads.apache.org/incubator/fluss/$SVN_RELEASE_DIR/
+* KEYS: https://downloads.apache.org/incubator/fluss/KEYS (or https://downloads.apache.org/fluss/KEYS after graduation)
+
+Rust:    cargo add fluss-rs
+Python:  pip install pyfluss
+C++:     build from source (see project documentation)
+
+Release notes: https://github.com/apache/fluss-rust/releases/tag/$RELEASE_TAG
+
+Thanks to all contributors!
+
+Release Manager
+```
+
+---
+
+**Checklist to declare the process completed**
+
+- [ ] Release announced on dev list and (if applicable) user list
+- [ ] Release announced on announce@apache.org
+- [ ] Release blog published (if applicable)
+- [ ] Download page updated (if applicable)
+
+## Improve the process
+
+After finishing the release, consider what could be improved (simplifications, clearer steps, automation). Propose changes on the dev list or via a pull request to this guide.
+
+## See also
+
+- [Release Manager Preparation](https://fluss.apache.org/community/how-to-release/release-manager-preparation/) — GPG and one-time setup
+- [Verifying a Fluss Release](https://fluss.apache.org/community/how-to-release/verifying-a-fluss-release/) — How to verify artifacts (adapt for fluss-rust source tarball)
+- [ASF Release Policy](https://www.apache.org/legal/release-policy.html)
diff --git a/fluss-rust/docs/generate-release-note.md b/fluss-rust/docs/generate-release-note.md
new file mode 100644
index 0000000000..1167f4cdb7
--- /dev/null
+++ b/fluss-rust/docs/generate-release-note.md
@@ -0,0 +1,28 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# Generate Release Note
+
+Use GitHub's **Generate release notes** to produce a draft from merged PRs between tags. Categories (Added, Fixed, Docs, etc.) are configured in [.github/release.yml](../.github/release.yml).
+
+1. Go to [Create a new release](https://github.com/apache/fluss-rust/releases/new).
+2. In **Choose a tag**, pick the release tag (e.g. `v0.1.0`).
+3. Click **Generate release notes**.
+4. Copy the generated content for **CHANGELOG.md** or the GitHub Release description. When publishing the release, add the official download link, checksums/verification, and install instructions (see [creating-a-release.md](creating-a-release.md)).
+
+See [creating-a-release.md](creating-a-release.md) and [GitHub: Automatically generated release notes](https://docs.github.com/en/repositories/releasing-projects-on-github/automatically-generated-release-notes).
diff --git a/fluss-rust/justfile b/fluss-rust/justfile
new file mode 100644
index 0000000000..c4e1a763ac
--- /dev/null
+++ b/fluss-rust/justfile
@@ -0,0 +1,28 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to you under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# Create ASF source release artifacts under dist/.
+# Check out the release tag first (e.g. git checkout v0.1.0-rc1).
+# Usage: just release [version]
+#   If version is omitted, read from Cargo.toml.
+
+# version: optional; when omitted (empty default), the script reads it from Cargo.toml
+release version="":
+    ./scripts/release.sh {{version}}
+
+# Bump the version in the root Cargo.toml for the next development cycle. Run on main after cutting the release branch.
+# Usage: just bump-version <current> <next>   e.g. just bump-version 0.1.0 0.1.1
+bump-version from to:
+    ./scripts/bump-version.sh {{from}} {{to}}
diff --git a/fluss-rust/scripts/bump-version.sh b/fluss-rust/scripts/bump-version.sh
new file mode 100755
index 0000000000..347b2863d9
--- /dev/null
+++ b/fluss-rust/scripts/bump-version.sh
@@ -0,0 +1,54 @@
+#!/usr/bin/env bash
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to you under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# Bump version in root Cargo.toml ([workspace.package] and [workspace.dependencies] fluss-rs).
+# Run from repo root. Use after cutting a release branch so main is set to the next version.
+#
+# Usage: ./scripts/bump-version.sh <current_version> <next_version>
+#   e.g. ./scripts/bump-version.sh 0.1.0 0.1.1
+#   Or with env vars: ./scripts/bump-version.sh $RELEASE_VERSION $NEXT_VERSION
+
+set -e
+
+if [ -z "$1" ] || [ -z "$2" ]; then
+  echo "Usage: $0 <current_version> <next_version>"
+  echo "  e.g. $0 0.1.0 0.1.1"
+  exit 1
+fi
+
+FROM_VERSION="$1"
+TO_VERSION="$2"
+
+REPO_ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
+cd "$REPO_ROOT"
+
+if [ ! -f Cargo.toml ]; then
+  echo "Cargo.toml not found. Run from repo root."
+  exit 1
+fi
+
+# Escape regex metacharacters so FROM_VERSION matches literally (a bare "." matches any character).
+FROM_PATTERN="version = \"$(printf '%s\n' "$FROM_VERSION" | sed 's/[][\.*^$/]/\\&/g')\""
+if ! grep -q "$FROM_PATTERN" Cargo.toml; then
+  echo "No version = \"${FROM_VERSION}\" entry found in Cargo.toml; nothing bumped." >&2
+  exit 1
+fi
+
+# Replace every occurrence; -i.bak (then deleting the backup) works with both GNU and BSD sed.
+sed -i.bak "s/${FROM_PATTERN}/version = \"${TO_VERSION}\"/g" Cargo.toml && rm -f Cargo.toml.bak
+
+echo "Bumped version from ${FROM_VERSION} to ${TO_VERSION} in Cargo.toml"
+echo "Review with: git diff Cargo.toml"
diff --git a/fluss-rust/scripts/constants.py b/fluss-rust/scripts/constants.py
new file mode 100644
index 0000000000..4a23e6a53e
--- /dev/null
+++ b/fluss-rust/scripts/constants.py
@@ -0,0 +1,45 @@
+#!/usr/bin/env python3
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+import tomllib
+from pathlib import Path
+
+ROOT_DIR = Path(__file__).resolve().parent.parent
+
+
+def list_packages():
+    """Package directories from [workspace].members in root Cargo.toml, plus workspace root.
+    Each gets a DEPENDENCIES.rust.tsv. Avoids scanning target/, .git/, etc.
+    Requires Python 3.11+ (tomllib).
+    """
+    root_cargo = ROOT_DIR / "Cargo.toml"
+    if not root_cargo.exists():
+        return ["."]
+    with open(root_cargo, "rb") as f:
+        data = tomllib.load(f)
+    members = data.get("workspace", {}).get("members", [])
+    if not isinstance(members, list):
+        return ["."]
+    packages = ["."]
+    for m in members:
+        if isinstance(m, str) and m:
+            packages.append(m)
+    return packages
+
+
+PACKAGES = list_packages()
diff --git a/fluss-rust/scripts/dependencies.py b/fluss-rust/scripts/dependencies.py
new file mode 100644
index 0000000000..ec77469f15
--- /dev/null
+++ b/fluss-rust/scripts/dependencies.py
@@ -0,0 +1,96 @@
+#!/usr/bin/env python3
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+#
+# Release tooling: requires Python 3.11+ (constants.py uses tomllib).
+
+import sys
+
+if sys.version_info < (3, 11):
+    sys.exit(
+        "This script requires Python 3.11 or newer (uses tomllib). "
+        f"Current: {sys.version}. Use python3.11+ or see docs for release requirements."
+    )
+
+import subprocess
+from argparse import ArgumentParser, ArgumentDefaultsHelpFormatter
+
+from constants import PACKAGES, ROOT_DIR
+
+
+def check_single_package(root):
+    pkg_dir = ROOT_DIR / root if root != "." else ROOT_DIR
+    if (pkg_dir / "Cargo.toml").exists():
+        print(f"Checking dependencies of {root}")
+        subprocess.run(
+            ["cargo", "deny", "check", "license"],
+            cwd=pkg_dir,
+            check=True,
+        )
+    else:
+        print(f"Skipping {root} as Cargo.toml does not exist")
+
+
+def check_deps():
+    for d in PACKAGES:
+        check_single_package(d)
+
+
+def generate_single_package(root):
+    pkg_dir = ROOT_DIR / root if root != "." else ROOT_DIR
+    if (pkg_dir / "Cargo.toml").exists():
+        print(f"Generating dependencies {root}")
+        result = subprocess.run(
+            ["cargo", "deny", "list", "-f", "tsv", "-t", "0.6"],
+            cwd=pkg_dir,
+            capture_output=True,
+            text=True,
+        )
+        if result.returncode != 0:
+            raise RuntimeError(
+                f"cargo deny list failed in {root}: {result.stderr or result.stdout}"
+            )
+        out_file = pkg_dir / "DEPENDENCIES.rust.tsv"
+        out_file.write_text(result.stdout)
+    else:
+        print(f"Skipping {root} as Cargo.toml does not exist")
+
+
+def generate_deps():
+    for d in PACKAGES:
+        generate_single_package(d)
+
+
+if __name__ == "__main__":
+    parser = ArgumentParser(formatter_class=ArgumentDefaultsHelpFormatter)
+    parser.set_defaults(func=parser.print_help)
+    subparsers = parser.add_subparsers()
+
+    parser_check = subparsers.add_parser(
+        "check", description="Check dependencies", help="Check dependencies"
+    )
+    parser_check.set_defaults(func=check_deps)
+
+    parser_generate = subparsers.add_parser(
+        "generate", description="Generate dependencies", help="Generate dependencies"
+    )
+    parser_generate.set_defaults(func=generate_deps)
+
+    args = parser.parse_args()
+    arg_dict = dict(vars(args))
+    del arg_dict["func"]
+    args.func(**arg_dict)
diff --git a/fluss-rust/scripts/release.sh b/fluss-rust/scripts/release.sh
new file mode 100755
index 0000000000..8187d1fd44
--- /dev/null
+++ b/fluss-rust/scripts/release.sh
@@ -0,0 +1,66 @@
+#!/usr/bin/env bash
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to you under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# Create ASF source release artifacts under dist/:
+#   fluss-rust-{version}.tar.gz
+#   fluss-rust-{version}.tar.gz.asc
+#   fluss-rust-{version}.tar.gz.sha512
+# Run from repo root. Check out the release tag first (e.g. git checkout v0.1.0-rc1).
+# Usage: ./scripts/release.sh [version]
+#   If version is omitted, it is read from Cargo.toml (workspace.package.version).
+
+set -e
+
+REPO_ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
+cd "$REPO_ROOT"
+
+# Version: first argument, else the first line-initial `version = "..."` in the root Cargo.toml.
+VERSION="$1"
+if [ -z "$VERSION" ]; then
+  VERSION=$(grep -E '^version\s*=' Cargo.toml | head -1 | sed 's/.*"\([^"]*\)".*/\1/')
+fi
+if [ -z "$VERSION" ]; then
+  echo "Could not read version from Cargo.toml. Pass version as argument: $0 <version>"
+  exit 1
+fi
+
+PREFIX="fluss-rust-${VERSION}"
+TARBALL="${PREFIX}.tar.gz"
+DIST_DIR="${REPO_ROOT}/dist"
+
+echo "Creating ASF source release for fluss-rust ${VERSION}"
+mkdir -p "$DIST_DIR"
+
+echo "Creating source archive: ${TARBALL}"
+git archive --format=tar.gz --prefix="${PREFIX}/" -o "${DIST_DIR}/${TARBALL}" HEAD
+
+# Checksum and signature are produced from inside dist/ (each step in its own subshell).
+echo "Generating SHA-512 checksum: ${TARBALL}.sha512"
+if ! command -v shasum >/dev/null 2>&1; then
+  (cd "$DIST_DIR" && sha512sum "$TARBALL" > "${TARBALL}.sha512")
+else
+  (cd "$DIST_DIR" && shasum -a 512 "$TARBALL" > "${TARBALL}.sha512")
+fi
+
+echo "Signing with GPG: ${TARBALL}.asc"
+(cd "$DIST_DIR" && gpg --armor --detach-sig "$TARBALL")
+
+echo "Verifying signature"
+(cd "$DIST_DIR" && gpg --verify "${TARBALL}.asc" "$TARBALL")
+
+echo "Done. Artifacts in dist/:"
+ls -la "${DIST_DIR}/"
+printf '\n%s\n' "Next: upload contents of dist/ to SVN (see docs/creating-a-release.md)."

From e9e3db4fcd9068eaac83562e47576d656cf13e4e Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 8 Feb 2026 01:06:03 +0000
Subject: [PATCH 123/287] feat: support temporal types in CPP (#266)

---
 fluss-rust/bindings/cpp/examples/example.cpp | 229 +++++++++++--------
 fluss-rust/bindings/cpp/include/fluss.hpp    | 114 +++++++++
 fluss-rust/bindings/cpp/src/lib.rs           |  38 ++-
 fluss-rust/bindings/cpp/src/table.cpp        |  48 ++++
 fluss-rust/bindings/cpp/src/types.rs         | 136 ++++++-----
 5 files changed, 422 insertions(+), 143 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 10266c7522..92ebe9cfbe 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -42,7 +42,7 @@ int main() {
     check("get_admin", conn.GetAdmin(admin));
 
     fluss::TablePath table_path("fluss", "sample_table_cpp_v1");
-    
+
     // 2.1) Drop table if exists
     std::cout << "Dropping table if exists..." << std::endl;
     auto drop_result = admin.DropTable(table_path, true);
@@ -52,12 +52,16 @@ int main() {
         std::cout << "Table drop result: " << drop_result.error_message << std::endl;
     }
 
-    // 3) Schema & descriptor
+    // 3) Schema with scalar and temporal columns
     auto schema = fluss::Schema::NewBuilder()
                         .AddColumn("id", fluss::DataType::Int)
                         .AddColumn("name", fluss::DataType::String)
                         .AddColumn("score", fluss::DataType::Float)
                         .AddColumn("age", fluss::DataType::Int)
+                        .AddColumn("event_date", fluss::DataType::Date)
+                        .AddColumn("event_time", fluss::DataType::Time)
+                        .AddColumn("created_at", fluss::DataType::Timestamp)
+                        .AddColumn("updated_at", fluss::DataType::TimestampLtz)
                         .Build();
 
     auto descriptor = fluss::TableDescriptor::NewBuilder()
@@ -66,7 +70,6 @@ int main() {
                           .SetComment("cpp example table with 3 buckets")
                           .Build();
 
-    // 3.1) Create table with 3 buckets
     std::cout << "Creating table with 3 buckets..." << std::endl;
     check("create_table", admin.CreateTable(table_path, descriptor, false));
 
@@ -74,7 +77,7 @@ int main() {
     fluss::Table table;
     check("get_table", conn.GetTable(table_path, table));
 
-    // 5) Writer
+    // 5) Write rows with scalar and temporal values
     fluss::AppendWriter writer;
     check("new_append_writer", table.NewAppendWriter(writer));
 
@@ -83,12 +86,26 @@ int main() {
         const char* name;
         float score;
         int age;
+        fluss::Date date;
+        fluss::Time time;
+        fluss::Timestamp ts_ntz;
+        fluss::Timestamp ts_ltz;
     };
 
+    auto tp_now = std::chrono::system_clock::now();
     std::vector<RowData> rows = {
-        {1, "Alice", 95.2f, 25},
-        {2, "Bob", 87.2f, 30},
-        {3, "Charlie", 92.1f, 35},
+        {1, "Alice", 95.2f, 25,
+         fluss::Date::FromYMD(2024, 6, 15), fluss::Time::FromHMS(14, 30, 45),
+         fluss::Timestamp::FromTimePoint(tp_now),
+         fluss::Timestamp::FromMillis(1718467200000)},
+        {2, "Bob", 87.2f, 30,
+         fluss::Date::FromYMD(2025, 1, 1), fluss::Time::FromHMS(0, 0, 0),
+         fluss::Timestamp::FromMillis(1735689600000),
+         fluss::Timestamp::FromMillisNanos(1735689600000, 500000)},
+        {3, "Charlie", 92.1f, 35,
+         fluss::Date::FromYMD(1999, 12, 31), fluss::Time::FromHMS(23, 59, 59),
+         fluss::Timestamp::FromMillis(946684799999),
+         fluss::Timestamp::FromMillis(946684799999)},
     };
 
     // Fire-and-forget: queue rows, flush at end
@@ -98,6 +115,10 @@ int main() {
         row.SetString(1, r.name);
         row.SetFloat32(2, r.score);
         row.SetInt32(3, r.age);
+        row.SetDate(4, r.date);
+        row.SetTime(5, r.time);
+        row.SetTimestampNtz(6, r.ts_ntz);
+        row.SetTimestampLtz(7, r.ts_ltz);
         check("append", writer.Append(row));
     }
     check("flush", writer.Flush());
@@ -116,7 +137,7 @@ int main() {
         std::cout << "Row acknowledged by server" << std::endl;
     }
 
-    // 6) Scan
+    // 6) Full scan — verify all column types including temporal
     fluss::LogScanner scanner;
     check("new_log_scanner", table.NewScan().CreateLogScanner(scanner));
 
@@ -129,188 +150,216 @@ int main() {
     fluss::ScanRecords records;
     check("poll", scanner.Poll(5000, records));
 
-    std::cout << "Scanned records: " << records.records.size() << std::endl;
+    std::cout << "Scanned records: " << records.Size() << std::endl;
+    bool scan_ok = true;
     for (const auto& rec : records.records) {
-        std::cout << " offset=" << rec.offset << " id=" << rec.row.fields[0].i32_val
-                  << " name=" << rec.row.fields[1].string_val
-                  << " score=" << rec.row.fields[2].f32_val << " age=" << rec.row.fields[3].i32_val
-                  << " ts=" << rec.timestamp << std::endl;
+        const auto& f = rec.row.fields;
+
+        if (f[4].type != fluss::DatumType::Date) {
+            std::cerr << "ERROR: field 4 expected Date, got "
+                      << static_cast<int>(f[4].type) << std::endl;
+            scan_ok = false;
+        }
+        if (f[5].type != fluss::DatumType::Time) {
+            std::cerr << "ERROR: field 5 expected Time, got "
+                      << static_cast<int>(f[5].type) << std::endl;
+            scan_ok = false;
+        }
+        if (f[6].type != fluss::DatumType::TimestampNtz) {
+            std::cerr << "ERROR: field 6 expected TimestampNtz, got "
+                      << static_cast<int>(f[6].type) << std::endl;
+            scan_ok = false;
+        }
+        if (f[7].type != fluss::DatumType::TimestampLtz) {
+            std::cerr << "ERROR: field 7 expected TimestampLtz, got "
+                      << static_cast<int>(f[7].type) << std::endl;
+            scan_ok = false;
+        }
+
+        auto date = f[4].GetDate();
+        auto time = f[5].GetTime();
+        auto ts_ntz = f[6].GetTimestamp();
+        auto ts_ltz = f[7].GetTimestamp();
+
+        std::cout << "  id=" << f[0].i32_val
+                  << " name=" << f[1].string_val
+                  << " score=" << f[2].f32_val
+                  << " age=" << f[3].i32_val
+                  << " date=" << date.Year() << "-" << date.Month() << "-" << date.Day()
+                  << " time=" << time.Hour() << ":" << time.Minute() << ":" << time.Second()
+                  << " ts_ntz=" << ts_ntz.epoch_millis
+                  << " ts_ltz=" << ts_ltz.epoch_millis
+                  << "+" << ts_ltz.nano_of_millisecond << "ns"
+                  << std::endl;
+    }
+
+    if (!scan_ok) {
+        std::cerr << "Full scan type verification FAILED!" << std::endl;
+        std::exit(1);
     }
-    
-    // 7) Project only id (0) and name (1) columns
-    std::vector<size_t> projected_columns = {0, 1};
+
+    // 7) Projected scan — project [id, updated_at(TimestampLtz)] to verify
+    //    NTZ/LTZ disambiguation works with column index remapping
+    std::vector<size_t> projected_columns = {0, 7};
     fluss::LogScanner projected_scanner;
     check("new_log_scanner_with_projection",
           table.NewScan().Project(projected_columns).CreateLogScanner(projected_scanner));
-    
+
     for (int b = 0; b < buckets; ++b) {
         check("subscribe_projected", projected_scanner.Subscribe(b, 0));
     }
-    
+
     fluss::ScanRecords projected_records;
     check("poll_projected", projected_scanner.Poll(5000, projected_records));
-    
-    std::cout << "Projected records: " << projected_records.records.size() << std::endl;
-    
-    bool projection_verified = true;
-    for (size_t i = 0; i < projected_records.records.size(); ++i) {
-        const auto& rec = projected_records.records[i];
-        const auto& row = rec.row;
-        
-        if (row.fields.size() != projected_columns.size()) {
-            std::cerr << "ERROR: Record " << i << " has " << row.fields.size() 
-                      << " fields, expected " << projected_columns.size() << std::endl;
-            projection_verified = false;
+
+    std::cout << "Projected records: " << projected_records.Size() << std::endl;
+    for (const auto& rec : projected_records.records) {
+        const auto& f = rec.row.fields;
+
+        if (f.size() != 2) {
+            std::cerr << "ERROR: expected 2 fields, got " << f.size() << std::endl;
+            scan_ok = false;
             continue;
         }
-        
-        // Verify field types match expected columns
-        // Column 0 (id) should be Int32, Column 1 (name) should be String
-        if (row.fields[0].type != fluss::DatumType::Int32) {
-            std::cerr << "ERROR: Record " << i << " field 0 type mismatch, expected Int32" << std::endl;
-            projection_verified = false;
+        if (f[0].type != fluss::DatumType::Int32) {
+            std::cerr << "ERROR: projected field 0 expected Int32, got "
+                      << static_cast<int>(f[0].type) << std::endl;
+            scan_ok = false;
         }
-        if (row.fields[1].type != fluss::DatumType::String) {
-            std::cerr << "ERROR: Record " << i << " field 1 type mismatch, expected String" << std::endl;
-            projection_verified = false;
-        }
-        
-        // Print projected data
-        if (row.fields[0].type == fluss::DatumType::Int32 && 
-            row.fields[1].type == fluss::DatumType::String) {
-            std::cout << "  Record " << i << ": id=" << row.fields[0].i32_val 
-                      << ", name=" << row.fields[1].string_val << std::endl;
+        if (f[1].type != fluss::DatumType::TimestampLtz) {
+            std::cerr << "ERROR: projected field 1 expected TimestampLtz, got "
+                      << static_cast<int>(f[1].type) << std::endl;
+            scan_ok = false;
         }
+
+        auto ts = f[1].GetTimestamp();
+        std::cout << "  id=" << f[0].i32_val
+                  << " updated_at=" << ts.epoch_millis
+                  << "+" << ts.nano_of_millisecond << "ns" << std::endl;
     }
-    
-    if (projection_verified) {
-        std::cout << "Column pruning verification passed!" << std::endl;
+
+    if (scan_ok) {
+        std::cout << "Scan verification passed!" << std::endl;
     } else {
-        std::cerr << "Column pruning verification failed!" << std::endl;
+        std::cerr << "Scan verification FAILED!" << std::endl;
         std::exit(1);
     }
 
     // 8) List offsets examples
     std::cout << "\n=== List Offsets Examples ===" << std::endl;
-    
-    // 8.1) Query earliest offsets for all buckets
+
     std::vector<int32_t> all_bucket_ids;
     all_bucket_ids.reserve(buckets);
     for (int b = 0; b < buckets; ++b) {
         all_bucket_ids.push_back(b);
     }
-    
+
     std::unordered_map<int32_t, int64_t> earliest_offsets;
-    check("list_earliest_offsets", 
-          admin.ListOffsets(table_path, all_bucket_ids, 
-                           fluss::OffsetQuery::Earliest(), 
+    check("list_earliest_offsets",
+          admin.ListOffsets(table_path, all_bucket_ids,
+                           fluss::OffsetQuery::Earliest(),
                            earliest_offsets));
     std::cout << "Earliest offsets:" << std::endl;
     for (const auto& [bucket_id, offset] : earliest_offsets) {
         std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
     }
-    
-    // 8.2) Query latest offsets for all buckets
+
     std::unordered_map<int32_t, int64_t> latest_offsets;
-    check("list_latest_offsets", 
-          admin.ListOffsets(table_path, all_bucket_ids, 
-                           fluss::OffsetQuery::Latest(), 
+    check("list_latest_offsets",
+          admin.ListOffsets(table_path, all_bucket_ids,
+                           fluss::OffsetQuery::Latest(),
                            latest_offsets));
     std::cout << "Latest offsets:" << std::endl;
     for (const auto& [bucket_id, offset] : latest_offsets) {
         std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
     }
-    
-    // 8.3) Query offsets for a specific timestamp (current time - 1 hour)
+
     auto now = std::chrono::system_clock::now();
     auto one_hour_ago = now - std::chrono::hours(1);
     auto timestamp_ms = std::chrono::duration_cast<std::chrono::milliseconds>(
         one_hour_ago.time_since_epoch()).count();
-    
+
     std::unordered_map<int32_t, int64_t> timestamp_offsets;
-    check("list_timestamp_offsets", 
-          admin.ListOffsets(table_path, all_bucket_ids, 
-                           fluss::OffsetQuery::FromTimestamp(timestamp_ms), 
+    check("list_timestamp_offsets",
+          admin.ListOffsets(table_path, all_bucket_ids,
+                           fluss::OffsetQuery::FromTimestamp(timestamp_ms),
                            timestamp_offsets));
     std::cout << "Offsets for timestamp " << timestamp_ms << " (1 hour ago):" << std::endl;
     for (const auto& [bucket_id, offset] : timestamp_offsets) {
         std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
     }
-    
-    // 8.4) Use batch subscribe with offsets from list_offsets
+
+    // 9) Batch subscribe
     std::cout << "\n=== Batch Subscribe Example ===" << std::endl;
     fluss::LogScanner batch_scanner;
     check("new_log_scanner_for_batch", table.NewScan().CreateLogScanner(batch_scanner));
-    
+
     std::vector<fluss::BucketSubscription> subscriptions;
     for (const auto& [bucket_id, offset] : earliest_offsets) {
         subscriptions.push_back({bucket_id, offset});
-        std::cout << "Preparing subscription: bucket=" << bucket_id 
+        std::cout << "Preparing subscription: bucket=" << bucket_id
                   << ", offset=" << offset << std::endl;
     }
-    
+
     check("subscribe_buckets", batch_scanner.Subscribe(subscriptions));
     std::cout << "Batch subscribed to " << subscriptions.size() << " buckets" << std::endl;
-    
-    // 8.5) Poll and verify bucket_id in records
+
     fluss::ScanRecords batch_records;
     check("poll_batch", batch_scanner.Poll(5000, batch_records));
-    
+
     std::cout << "Scanned " << batch_records.Size() << " records from batch subscription" << std::endl;
     for (size_t i = 0; i < batch_records.Size() && i < 5; ++i) {
         const auto& rec = batch_records[i];
-        std::cout << "  Record " << i << ": bucket_id=" << rec.bucket_id 
-                  << ", offset=" << rec.offset 
+        std::cout << "  Record " << i << ": bucket_id=" << rec.bucket_id
+                  << ", offset=" << rec.offset
                   << ", timestamp=" << rec.timestamp << std::endl;
     }
     if (batch_records.Size() > 5) {
         std::cout << "  ... and " << (batch_records.Size() - 5) << " more records" << std::endl;
     }
 
-    // 9) Test the new Arrow record batch polling functionality
+    // 10) Arrow record batch polling
     std::cout << "\n=== Testing Arrow Record Batch Polling ===" << std::endl;
 
     fluss::LogScanner arrow_scanner;
     check("new_record_batch_log_scanner", table.NewScan().CreateRecordBatchScanner(arrow_scanner));
-    
-    // Subscribe to all buckets starting from offset 0
+
     for (int b = 0; b < buckets; ++b) {
         check("subscribe_arrow", arrow_scanner.Subscribe(b, 0));
     }
-    
+
     fluss::ArrowRecordBatches arrow_batches;
     check("poll_record_batch", arrow_scanner.PollRecordBatch(5000, arrow_batches));
-    
+
     std::cout << "Polled " << arrow_batches.Size() << " Arrow record batches" << std::endl;
     for (size_t i = 0; i < arrow_batches.Size(); ++i) {
         const auto& batch = arrow_batches[i];
         if (batch->Available()) {
-            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows() << " rows. " << std::endl;
+            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows() << " rows" << std::endl;
         } else {
             std::cout << "  Batch " << i << ": not available" << std::endl;
         }
     }
-    
-    // 10) Test the new Arrow record batch polling with projection
+
+    // 11) Arrow record batch polling with projection
     std::cout << "\n=== Testing Arrow Record Batch Polling with Projection ===" << std::endl;
 
     fluss::LogScanner projected_arrow_scanner;
     check("new_record_batch_log_scanner_with_projection",
           table.NewScan().Project(projected_columns).CreateRecordBatchScanner(projected_arrow_scanner));
-    
-    // Subscribe to all buckets starting from offset 0
+
     for (int b = 0; b < buckets; ++b) {
         check("subscribe_projected_arrow", projected_arrow_scanner.Subscribe(b, 0));
     }
-    
+
     fluss::ArrowRecordBatches projected_arrow_batches;
     check("poll_projected_record_batch", projected_arrow_scanner.PollRecordBatch(5000, projected_arrow_batches));
-    
+
     std::cout << "Polled " << projected_arrow_batches.Size() << " projected Arrow record batches" << std::endl;
     for (size_t i = 0; i < projected_arrow_batches.Size(); ++i) {
         const auto& batch = projected_arrow_batches[i];
         if (batch->Available()) {
-            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows() << " rows " << std::endl;
+            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows() << " rows" << std::endl;
         } else {
             std::cout << "  Batch " << i << ": not available" << std::endl;
         }
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 6c20717565..239d9a472a 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -19,6 +19,7 @@
 
 #pragma once
 
+#include <chrono>
 #include <memory>
 #include <optional>
 #include <string>
@@ -41,6 +42,64 @@ namespace ffi {
     struct LogScanner;
 }  // namespace ffi
 
+struct Date {  // Calendar date stored as one signed day count.
+    int32_t days_since_epoch{0};
+    // Factories: wrap a raw day count, or convert year/month/day (FromYMD is defined out of line).
+    static Date FromDays(int32_t days) { return {days}; }
+    static Date FromYMD(int year, int month, int day);
+    // Calendar components derived from days_since_epoch (defined out of line).
+    int Year() const;
+    int Month() const;
+    int Day() const;
+};
+
+struct Time {  // Time of day stored as milliseconds elapsed since midnight.
+    static constexpr int32_t kMillisPerSecond = 1000;
+    static constexpr int32_t kMillisPerMinute = 60 * kMillisPerSecond;
+    static constexpr int32_t kMillisPerHour = 60 * kMillisPerMinute;
+    // The only data member; the factories and accessors below just convert to/from it.
+    int32_t millis_since_midnight{0};
+    // FromHMS sums the components exactly as given; it performs no range checking.
+    static Time FromMillis(int32_t ms) { return {ms}; }
+    static Time FromHMS(int hour, int minute, int second, int millis = 0) {
+        return {hour * kMillisPerHour + minute * kMillisPerMinute +
+                second * kMillisPerSecond + millis};
+    }
+    // Accessors split the stored value using integer division and remainder.
+    int Hour() const { return millis_since_midnight / kMillisPerHour; }
+    int Minute() const { return (millis_since_midnight % kMillisPerHour) / kMillisPerMinute; }
+    int Second() const { return (millis_since_midnight % kMillisPerMinute) / kMillisPerSecond; }
+    int Millis() const { return millis_since_midnight % kMillisPerSecond; }
+};
+
+struct Timestamp {  // Instant split into whole epoch milliseconds plus a sub-millisecond nanosecond part.
+    static constexpr int32_t kMaxNanoOfMillisecond = 999999;
+    static constexpr int64_t kNanosPerMilli = 1000000;
+    // The struct carries no time-zone marker of its own; it only holds the two numeric parts.
+    int64_t epoch_millis{0};
+    int32_t nano_of_millisecond{0};
+    // FromMillisNanos clamps nanos into [0, kMaxNanoOfMillisecond] rather than rejecting it.
+    static Timestamp FromMillis(int64_t ms) { return {ms, 0}; }
+    static Timestamp FromMillisNanos(int64_t ms, int32_t nanos) {
+        if (nanos < 0) nanos = 0;
+        if (nanos > kMaxNanoOfMillisecond) nanos = kMaxNanoOfMillisecond;
+        return {ms, nanos};
+    }
+    static Timestamp FromTimePoint(std::chrono::system_clock::time_point tp) {
+        auto duration = tp.time_since_epoch();
+        auto ns =
+            std::chrono::duration_cast<std::chrono::nanoseconds>(duration)
+                .count();
+        auto ms = ns / kNanosPerMilli;  // integer division truncates toward zero
+        auto nano_of_ms = static_cast<int32_t>(ns % kNanosPerMilli);
+        if (nano_of_ms < 0) {  // negative remainder: borrow one millisecond so the nano part is non-negative
+            nano_of_ms += kNanosPerMilli;
+            ms -= 1;
+        }
+        return {ms, nano_of_ms};
+    }
+};
+
 enum class DataType {
     Boolean = 1,
     TinyInt = 2,
@@ -66,6 +125,11 @@ enum class DatumType {
     Float64 = 5,
     String = 6,
     Bytes = 7,
+    // 8-10 reserved for decimal types
+    Date = 11,
+    Time = 12,
+    TimestampNtz = 13,
+    TimestampLtz = 14,
 };
 
 constexpr int64_t EARLIEST_OFFSET = -2;
@@ -270,6 +334,36 @@ struct Datum {
         d.bytes_val = std::move(v);
         return d;
     }
+    static Datum Date(fluss::Date d) {  // Builds a Date datum.
+        Datum dat;
+        dat.type = DatumType::Date;
+        dat.i32_val = d.days_since_epoch;  // the day count travels in i32_val
+        return dat;
+    }
+    static Datum Time(fluss::Time t) {  // Builds a Time datum.
+        Datum dat;
+        dat.type = DatumType::Time;
+        dat.i32_val = t.millis_since_midnight;  // milliseconds since midnight travel in i32_val
+        return dat;
+    }
+    static Datum TimestampNtz(fluss::Timestamp ts) {  // Builds a TimestampNtz datum.
+        Datum dat;
+        dat.type = DatumType::TimestampNtz;
+        dat.i64_val = ts.epoch_millis;        // millisecond part
+        dat.i32_val = ts.nano_of_millisecond;  // sub-millisecond nanoseconds
+        return dat;
+    }
+    static Datum TimestampLtz(fluss::Timestamp ts) {  // Builds a TimestampLtz datum; same payload layout as TimestampNtz.
+        Datum dat;
+        dat.type = DatumType::TimestampLtz;
+        dat.i64_val = ts.epoch_millis;        // millisecond part
+        dat.i32_val = ts.nano_of_millisecond;  // sub-millisecond nanoseconds
+        return dat;
+    }
+
+    fluss::Date GetDate() const { return {i32_val}; }  // wraps i32_val as a day count; `type` is not checked
+    fluss::Time GetTime() const { return {i32_val}; }  // wraps i32_val as millis since midnight; `type` is not checked
+    fluss::Timestamp GetTimestamp() const { return {i64_val, i32_val}; }  // millis from i64_val, nanos from i32_val; serves both NTZ and LTZ
 };
 
 struct GenericRow {
@@ -315,6 +409,26 @@ struct GenericRow {
         fields[idx] = Datum::Bytes(std::move(v));
     }
 
+    void SetDate(size_t idx, fluss::Date d) {  // Stores a Date datum in fields[idx].
+        EnsureSize(idx);  // presumably grows `fields` so that idx is valid — confirm against EnsureSize
+        fields[idx] = Datum::Date(d);
+    }
+
+    void SetTime(size_t idx, fluss::Time t) {  // Stores a Time datum in fields[idx].
+        EnsureSize(idx);  // presumably grows `fields` so that idx is valid — confirm against EnsureSize
+        fields[idx] = Datum::Time(t);
+    }
+
+    void SetTimestampNtz(size_t idx, fluss::Timestamp ts) {  // Stores a TimestampNtz datum in fields[idx].
+        EnsureSize(idx);  // presumably grows `fields` so that idx is valid — confirm against EnsureSize
+        fields[idx] = Datum::TimestampNtz(ts);
+    }
+
+    void SetTimestampLtz(size_t idx, fluss::Timestamp ts) {  // Stores a TimestampLtz datum in fields[idx].
+        EnsureSize(idx);  // presumably grows `fields` so that idx is valid — confirm against EnsureSize
+        fields[idx] = Datum::TimestampLtz(ts);
+    }
+
 private:
     void EnsureSize(size_t idx) {
         if (fields.size() <= idx) {
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 4957c9937a..5a266135df 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -310,6 +310,9 @@ pub struct WriteResult {
 pub struct LogScanner {
     inner: Option<fcore::client::LogScanner>,
     inner_batch: Option<fcore::client::RecordBatchLogScanner>,
+    /// Fluss columns matching the projected Arrow fields (1:1 by index); for non-projected scanners
+    /// this is the full table schema columns. Passed to `types::core_scan_records_to_ffi` on poll.
+    projected_columns: Vec<fcore::metadata::Column>,
 }
 
 fn ok_result() -> ffi::FfiResult {
@@ -653,6 +656,7 @@ impl Table {
             let scanner_ptr = Box::into_raw(Box::new(LogScanner {
                 inner: Some(scanner),
                 inner_batch: None,
+                projected_columns: self.table_info.get_schema().columns().to_vec(),
             }));
 
             Ok(scanner_ptr)
@@ -670,6 +674,19 @@ impl Table {
                 self.table_info.clone(),
             );
 
+            let all_columns = self.table_info.get_schema().columns();
+            let projected_columns: Vec<_> = column_indices
+                .iter()
+                .map(|&i| {
+                    all_columns.get(i).cloned().ok_or_else(|| {
+                        format!(
+                            "Invalid column index {i}: schema has {} columns",
+                            all_columns.len()
+                        )
+                    })
+                })
+                .collect::<Result<_, String>>()?;
+
             let log_scanner = fluss_table
                 .new_scan()
                 .project(&column_indices)
@@ -680,6 +697,7 @@ impl Table {
             let scanner = Box::into_raw(Box::new(LogScanner {
                 inner: Some(log_scanner),
                 inner_batch: None,
+                projected_columns,
             }));
             Ok(scanner)
         })
@@ -701,6 +719,7 @@ impl Table {
             let scanner = Box::into_raw(Box::new(LogScanner {
                 inner: None,
                 inner_batch: Some(batch_scanner),
+                projected_columns: self.table_info.get_schema().columns().to_vec(),
             }));
             Ok(scanner)
         })
@@ -717,6 +736,19 @@ impl Table {
                 self.table_info.clone(),
             );
 
+            let all_columns = self.table_info.get_schema().columns();
+            let projected_columns: Vec<_> = column_indices
+                .iter()
+                .map(|&i| {
+                    all_columns.get(i).cloned().ok_or_else(|| {
+                        format!(
+                            "Invalid column index {i}: schema has {} columns",
+                            all_columns.len()
+                        )
+                    })
+                })
+                .collect::<Result<_, String>>()?;
+
             let batch_scanner = fluss_table
                 .new_scan()
                 .project(&column_indices)
@@ -727,6 +759,7 @@ impl Table {
             let scanner = Box::into_raw(Box::new(LogScanner {
                 inner: None,
                 inner_batch: Some(batch_scanner),
+                projected_columns,
             }));
             Ok(scanner)
         })
@@ -925,7 +958,10 @@ impl LogScanner {
             match result {
                 Ok(records) => ffi::FfiScanRecordsResult {
                     result: ok_result(),
-                    scan_records: types::core_scan_records_to_ffi(&records),
+                    scan_records: types::core_scan_records_to_ffi(
+                        &records,
+                        &self.projected_columns,
+                    ),
                 },
                 Err(e) => ffi::FfiScanRecordsResult {
                     result: err_result(1, e.to_string()),
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index 24be8d45dd..04d1846c43 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -22,12 +22,60 @@
 #include "ffi_converter.hpp"
 #include "rust/cxx.h"
 #include <arrow/c/bridge.h>
+#include <ctime>
 // todo:  bindings/cpp/BUILD.bazel still doesn’t declare Arrow include/link dependencies.
 // In environments where Bazel does not already have Arrow available, this will fail at compile/link time.
 #include <arrow/record_batch.h>
 
 namespace fluss {
 
+// Calendar <-> day-count conversions use pure integer arithmetic on the proleptic
+// Gregorian calendar (the well-known days_from_civil / civil_from_days algorithms)
+// rather than timegm()/_mkgmtime()/gmtime_s(): those are non-standard, and the
+// Windows variants reject instants before 1970-01-01.
+
+// Integer division rounding toward negative infinity; `b` must be positive.
+static constexpr int64_t floor_div(int64_t a, int64_t b) {
+    return a / b - ((a % b != 0 && a < 0) ? 1 : 0);
+}
+
+// Days from 1970-01-01 to the given date. Out-of-range month/day values roll
+// over into adjacent months/years, as timegm() normalization did.
+static int64_t days_from_civil(int64_t y, int64_t m, int64_t d) {
+    const int64_t year_carry = floor_div(m - 1, 12);
+    y += year_carry;
+    m -= year_carry * 12;  // now in [1, 12]
+    if (m <= 2) y -= 1;    // count Jan/Feb as the tail of the previous year
+    const int64_t era = floor_div(y, 400);  // 400-year cycle index
+    const int64_t yoe = y - era * 400;      // year of era, [0, 399]
+    const int64_t doy = (153 * (m > 2 ? m - 3 : m + 9) + 2) / 5 + d - 1;  // March-based day of year
+    return era * 146097 + yoe * 365 + yoe / 4 - yoe / 100 + doy - 719468;
+}
+
+namespace {
+struct CivilDate { int year, month, day; };
+}  // namespace
+
+// Inverse of days_from_civil: calendar date for a day count relative to 1970-01-01.
+static CivilDate civil_from_days(int64_t z) {
+    z += 719468;  // re-base onto 0000-03-01 so each leap day closes its year
+    const int64_t era = floor_div(z, 146097);
+    const int64_t doe = z - era * 146097;                                       // [0, 146096]
+    const int64_t yoe = (doe - doe / 1460 + doe / 36524 - doe / 146096) / 365;  // [0, 399]
+    const int64_t doy = doe - (365 * yoe + yoe / 4 - yoe / 100);                // [0, 365]
+    const int64_t mp = (5 * doy + 2) / 153;                                     // [0, 11], March == 0
+    const int64_t m = mp < 10 ? mp + 3 : mp - 9;
+    return {static_cast<int>(yoe + era * 400 + (m <= 2 ? 1 : 0)), static_cast<int>(m),
+            static_cast<int>(doy - (153 * mp + 2) / 5 + 1)};
+}
+
+Date Date::FromYMD(int year, int month, int day) {
+    return {static_cast<int32_t>(days_from_civil(year, month, day))};
+}
+int Date::Year() const { return civil_from_days(days_since_epoch).year; }
+int Date::Month() const { return civil_from_days(days_since_epoch).month; }
+int Date::Day() const { return civil_from_days(days_since_epoch).day; }
+
 Table::Table() noexcept = default;
 
 Table::Table(ffi::Table* table) noexcept : table_(table) {}
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 91d6e260ba..f546b6824c 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -52,6 +52,15 @@ pub const DATUM_TYPE_FLOAT32: i32 = 4;
 pub const DATUM_TYPE_FLOAT64: i32 = 5;
 pub const DATUM_TYPE_STRING: i32 = 6;
 pub const DATUM_TYPE_BYTES: i32 = 7;
+pub const DATUM_TYPE_DATE: i32 = 11; // same value as C++ `DatumType::Date`
+pub const DATUM_TYPE_TIME: i32 = 12; // same value as C++ `DatumType::Time`
+pub const DATUM_TYPE_TIMESTAMP_NTZ: i32 = 13; // same value as C++ `DatumType::TimestampNtz`
+pub const DATUM_TYPE_TIMESTAMP_LTZ: i32 = 14; // same value as C++ `DatumType::TimestampLtz`
+// Unit-conversion factors used when converting Arrow temporal values into FFI datums.
+const MILLIS_PER_SECOND: i64 = 1_000;
+const MICROS_PER_MILLI: i64 = 1_000;
+const NANOS_PER_MICRO: i64 = 1_000;
+const NANOS_PER_MILLI: i64 = 1_000_000;
 
 fn ffi_data_type_to_core(dt: i32) -> Result<fcore::metadata::DataType> {
     match dt {
@@ -224,6 +233,16 @@ pub fn ffi_row_to_core(row: &ffi::FfiGenericRow) -> fcore::row::GenericRow<'_> {
             DATUM_TYPE_FLOAT64 => Datum::Float64(field.f64_val.into()),
             DATUM_TYPE_STRING => Datum::String(Cow::Borrowed(field.string_val.as_str())),
             DATUM_TYPE_BYTES => Datum::Blob(Cow::Borrowed(field.bytes_val.as_slice())),
+            DATUM_TYPE_DATE => Datum::Date(fcore::row::Date::new(field.i32_val)),
+            DATUM_TYPE_TIME => Datum::Time(fcore::row::Time::new(field.i32_val)),
+            DATUM_TYPE_TIMESTAMP_NTZ => Datum::TimestampNtz(
+                fcore::row::TimestampNtz::from_millis_nanos(field.i64_val, field.i32_val)
+                    .unwrap_or_else(|_| fcore::row::TimestampNtz::new(field.i64_val)),
+            ),
+            DATUM_TYPE_TIMESTAMP_LTZ => Datum::TimestampLtz(
+                fcore::row::TimestampLtz::from_millis_nanos(field.i64_val, field.i32_val)
+                    .unwrap_or_else(|_| fcore::row::TimestampLtz::new(field.i64_val)),
+            ),
             _ => Datum::Null,
         };
         generic_row.set_field(idx, datum);
@@ -232,7 +251,10 @@ pub fn ffi_row_to_core(row: &ffi::FfiGenericRow) -> fcore::row::GenericRow<'_> {
     generic_row
 }
 
-pub fn core_scan_records_to_ffi(records: &fcore::record::ScanRecords) -> ffi::FfiScanRecords {
+pub fn core_scan_records_to_ffi(
+    records: &fcore::record::ScanRecords,
+    columns: &[fcore::metadata::Column],
+) -> ffi::FfiScanRecords {
     let mut ffi_records = Vec::new();
 
     // Iterate over all buckets and their records
@@ -240,7 +262,7 @@ pub fn core_scan_records_to_ffi(records: &fcore::record::ScanRecords) -> ffi::Ff
         let bucket_id = table_bucket.bucket_id();
         for record in bucket_records {
             let row = record.row();
-            let fields = core_row_to_ffi_fields(row);
+            let fields = core_row_to_ffi_fields(row, columns);
 
             ffi_records.push(ffi::FfiScanRecord {
                 bucket_id,
@@ -256,7 +278,10 @@ pub fn core_scan_records_to_ffi(records: &fcore::record::ScanRecords) -> ffi::Ff
     }
 }
 
-fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
+fn core_row_to_ffi_fields(
+    row: &fcore::row::ColumnarRow,
+    columns: &[fcore::metadata::Column],
+) -> Vec<ffi::FfiDatum> {
     fn new_datum(datum_type: i32) -> ffi::FfiDatum {
         ffi::FfiDatum {
             datum_type,
@@ -361,52 +386,59 @@ fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
                     .as_any()
                     .downcast_ref::<Date32Array>()
                     .expect("Date32 column expected");
-                let mut datum = new_datum(DATUM_TYPE_INT32);
+                let mut datum = new_datum(DATUM_TYPE_DATE);
                 datum.i32_val = array.value(row_id);
                 datum
             }
-            ArrowDataType::Timestamp(unit, _) => match unit {
-                TimeUnit::Second => {
-                    let array = record_batch
-                        .column(i)
-                        .as_any()
-                        .downcast_ref::<TimestampSecondArray>()
-                        .expect("Timestamp(second) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_INT64);
-                    datum.i64_val = array.value(row_id);
-                    datum
-                }
-                TimeUnit::Millisecond => {
-                    let array = record_batch
-                        .column(i)
-                        .as_any()
-                        .downcast_ref::<TimestampMillisecondArray>()
-                        .expect("Timestamp(millisecond) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_INT64);
-                    datum.i64_val = array.value(row_id);
-                    datum
+            ArrowDataType::Timestamp(unit, _tz) => {
+                let datum_type = match columns.get(i).map(|c| c.data_type()) {
+                    Some(fcore::metadata::DataType::TimestampLTz(_)) => DATUM_TYPE_TIMESTAMP_LTZ,
+                    _ => DATUM_TYPE_TIMESTAMP_NTZ,
+                };
+                let mut datum = new_datum(datum_type);
+                match unit {
+                    TimeUnit::Second => {
+                        let array = record_batch
+                            .column(i)
+                            .as_any()
+                            .downcast_ref::<TimestampSecondArray>()
+                            .expect("Timestamp(second) column expected");
+                        datum.i64_val = array.value(row_id) * MILLIS_PER_SECOND;
+                        datum.i32_val = 0;
+                    }
+                    TimeUnit::Millisecond => {
+                        let array = record_batch
+                            .column(i)
+                            .as_any()
+                            .downcast_ref::<TimestampMillisecondArray>()
+                            .expect("Timestamp(millisecond) column expected");
+                        datum.i64_val = array.value(row_id);
+                        datum.i32_val = 0;
+                    }
+                    TimeUnit::Microsecond => {
+                        let array = record_batch
+                            .column(i)
+                            .as_any()
+                            .downcast_ref::<TimestampMicrosecondArray>()
+                            .expect("Timestamp(microsecond) column expected");
+                        let micros = array.value(row_id);
+                        datum.i64_val = micros.div_euclid(MICROS_PER_MILLI);
+                        datum.i32_val =
+                            (micros.rem_euclid(MICROS_PER_MILLI) * NANOS_PER_MICRO) as i32;
+                    }
+                    TimeUnit::Nanosecond => {
+                        let array = record_batch
+                            .column(i)
+                            .as_any()
+                            .downcast_ref::<TimestampNanosecondArray>()
+                            .expect("Timestamp(nanosecond) column expected");
+                        let nanos = array.value(row_id);
+                        datum.i64_val = nanos.div_euclid(NANOS_PER_MILLI);
+                        datum.i32_val = nanos.rem_euclid(NANOS_PER_MILLI) as i32;
+                    }
                 }
-                TimeUnit::Microsecond => {
-                    let array = record_batch
-                        .column(i)
-                        .as_any()
-                        .downcast_ref::<TimestampMicrosecondArray>()
-                        .expect("Timestamp(microsecond) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_INT64);
-                    datum.i64_val = array.value(row_id);
-                    datum
-                }
-                TimeUnit::Nanosecond => {
-                    let array = record_batch
-                        .column(i)
-                        .as_any()
-                        .downcast_ref::<TimestampNanosecondArray>()
-                        .expect("Timestamp(nanosecond) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_INT64);
-                    datum.i64_val = array.value(row_id);
-                    datum
-                }
-            },
+                datum
+            }
             ArrowDataType::Time32(unit) => match unit {
                 TimeUnit::Second => {
                     let array = record_batch
@@ -414,8 +446,8 @@ fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
                         .as_any()
                         .downcast_ref::<Time32SecondArray>()
                         .expect("Time32(second) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_INT32);
-                    datum.i32_val = array.value(row_id);
+                    let mut datum = new_datum(DATUM_TYPE_TIME);
+                    datum.i32_val = array.value(row_id) * MILLIS_PER_SECOND as i32;
                     datum
                 }
                 TimeUnit::Millisecond => {
@@ -424,7 +456,7 @@ fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
                         .as_any()
                         .downcast_ref::<Time32MillisecondArray>()
                         .expect("Time32(millisecond) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_INT32);
+                    let mut datum = new_datum(DATUM_TYPE_TIME);
                     datum.i32_val = array.value(row_id);
                     datum
                 }
@@ -437,8 +469,8 @@ fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
                         .as_any()
                         .downcast_ref::<Time64MicrosecondArray>()
                         .expect("Time64(microsecond) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_INT64);
-                    datum.i64_val = array.value(row_id);
+                    let mut datum = new_datum(DATUM_TYPE_TIME);
+                    datum.i32_val = (array.value(row_id) / MICROS_PER_MILLI) as i32;
                     datum
                 }
                 TimeUnit::Nanosecond => {
@@ -447,8 +479,8 @@ fn core_row_to_ffi_fields(row: &fcore::row::ColumnarRow) -> Vec<ffi::FfiDatum> {
                         .as_any()
                         .downcast_ref::<Time64NanosecondArray>()
                         .expect("Time64(nanosecond) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_INT64);
-                    datum.i64_val = array.value(row_id);
+                    let mut datum = new_datum(DATUM_TYPE_TIME);
+                    datum.i32_val = (array.value(row_id) / NANOS_PER_MILLI) as i32;
                     datum
                 }
                 _ => panic!("Will never come here. Unsupported Time64 unit for column {i}"),

From c68ef0322dac6090a979e4d6951c5c4fe76a3964 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 8 Feb 2026 03:24:59 +0000
Subject: [PATCH 124/287] feat: support decimals in cpp binding (#265)

---
 fluss-rust/Cargo.toml                         |   1 +
 fluss-rust/bindings/cpp/Cargo.toml            |   1 +
 fluss-rust/bindings/cpp/examples/example.cpp  |  95 +++++++++++--
 fluss-rust/bindings/cpp/include/fluss.hpp     | 121 +++++++++++++++-
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |  14 +-
 fluss-rust/bindings/cpp/src/lib.rs            |  15 +-
 fluss-rust/bindings/cpp/src/types.rs          | 133 ++++++++++++++++--
 fluss-rust/crates/fluss/Cargo.toml            |   2 +-
 8 files changed, 352 insertions(+), 30 deletions(-)

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index dfddd8d48a..77d714006a 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -37,6 +37,7 @@ tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
 arrow = { version = "57.0.0", features = ["ipc_compression"] }
 
+bigdecimal = "0.4"
 serde = { version = "1.0", features = ["derive"] }
 serde_json = "1.0"
 opendal = "0.53"
diff --git a/fluss-rust/bindings/cpp/Cargo.toml b/fluss-rust/bindings/cpp/Cargo.toml
index 8606a226e0..26816522fe 100644
--- a/fluss-rust/bindings/cpp/Cargo.toml
+++ b/fluss-rust/bindings/cpp/Cargo.toml
@@ -29,6 +29,7 @@ crate-type = ["staticlib"]
 [dependencies]
 anyhow = "1.0"
 arrow = { workspace = true, features = ["ffi"] }
+bigdecimal = { workspace = true }
 cxx = "1.0"
 fluss = { workspace = true, features = ["storage-all"] }
 tokio = { workspace = true, features = ["rt-multi-thread", "macros"] }
diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 92ebe9cfbe..efdf2e80ba 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -54,14 +54,14 @@ int main() {
 
     // 3) Schema with scalar and temporal columns
     auto schema = fluss::Schema::NewBuilder()
-                        .AddColumn("id", fluss::DataType::Int)
-                        .AddColumn("name", fluss::DataType::String)
-                        .AddColumn("score", fluss::DataType::Float)
-                        .AddColumn("age", fluss::DataType::Int)
-                        .AddColumn("event_date", fluss::DataType::Date)
-                        .AddColumn("event_time", fluss::DataType::Time)
-                        .AddColumn("created_at", fluss::DataType::Timestamp)
-                        .AddColumn("updated_at", fluss::DataType::TimestampLtz)
+                        .AddColumn("id", fluss::DataType::Int())
+                        .AddColumn("name", fluss::DataType::String())
+                        .AddColumn("score", fluss::DataType::Float())
+                        .AddColumn("age", fluss::DataType::Int())
+                        .AddColumn("event_date", fluss::DataType::Date())
+                        .AddColumn("event_time", fluss::DataType::Time())
+                        .AddColumn("created_at", fluss::DataType::Timestamp())
+                        .AddColumn("updated_at", fluss::DataType::TimestampLtz())
                         .Build();
 
     auto descriptor = fluss::TableDescriptor::NewBuilder()
@@ -131,6 +131,10 @@ int main() {
         row.SetString(1, "AckTest");
         row.SetFloat32(2, 99.9f);
         row.SetInt32(3, 42);
+        row.SetDate(4, fluss::Date::FromYMD(2025, 3, 1));
+        row.SetTime(5, fluss::Time::FromHMS(12, 0, 0));
+        row.SetTimestampNtz(6, fluss::Timestamp::FromMillis(1740787200000));
+        row.SetTimestampLtz(7, fluss::Timestamp::FromMillis(1740787200000));
         fluss::WriteResult wr;
         check("append", writer.Append(row, wr));
         check("wait", wr.Wait());
@@ -365,5 +369,80 @@ int main() {
         }
     }
 
+    // 12) Decimal support example
+    std::cout << "\n=== Decimal Support Example ===" << std::endl;
+
+    fluss::TablePath decimal_table_path("fluss", "decimal_table_cpp_v1");
+
+    // Drop table if exists
+    admin.DropTable(decimal_table_path, true);
+
+    // Create schema with decimal columns
+    auto decimal_schema = fluss::Schema::NewBuilder()
+                              .AddColumn("id", fluss::DataType::Int())
+                              .AddColumn("price", fluss::DataType::Decimal(10, 2))    // compact
+                              .AddColumn("amount", fluss::DataType::Decimal(28, 8))   // i128
+                              .Build();
+
+    auto decimal_descriptor = fluss::TableDescriptor::NewBuilder()
+                                  .SetSchema(decimal_schema)
+                                  .SetBucketCount(1)
+                                  .SetComment("cpp decimal example table")
+                                  .Build();
+
+    check("create_decimal_table", admin.CreateTable(decimal_table_path, decimal_descriptor, false));
+
+    // Get table and writer
+    fluss::Table decimal_table;
+    check("get_decimal_table", conn.GetTable(decimal_table_path, decimal_table));
+
+    fluss::AppendWriter decimal_writer;
+    check("new_decimal_writer", decimal_table.NewAppendWriter(decimal_writer));
+
+    // Just provide the value — Rust resolves (p,s) from schema
+    {
+        fluss::GenericRow row;
+        row.SetInt32(0, 1);
+        row.SetDecimal(1, "123.45");       // Rust knows DECIMAL(10,2)
+        row.SetDecimal(2, "1.00000000");   // Rust knows DECIMAL(28,8)
+        check("append_decimal", decimal_writer.Append(row));
+    }
+    {
+        fluss::GenericRow row;
+        row.SetInt32(0, 2);
+        row.SetDecimal(1, "-999.99");
+        row.SetDecimal(2, "3.14159265");
+        check("append_decimal", decimal_writer.Append(row));
+    }
+    {
+        fluss::GenericRow row;
+        row.SetInt32(0, 3);
+        row.SetDecimal(1, "500.00");
+        row.SetDecimal(2, "2.71828182");
+        check("append_decimal", decimal_writer.Append(row));
+    }
+    check("flush_decimal", decimal_writer.Flush());
+    std::cout << "Wrote 3 decimal rows" << std::endl;
+
+    // Scan and read back
+    fluss::LogScanner decimal_scanner;
+    check("new_decimal_scanner", decimal_table.NewScan().CreateLogScanner(decimal_scanner));
+    check("subscribe_decimal", decimal_scanner.Subscribe(0, 0));
+
+    fluss::ScanRecords decimal_records;
+    check("poll_decimal", decimal_scanner.Poll(5000, decimal_records));
+
+    std::cout << "Scanned decimal records: " << decimal_records.Size() << std::endl;
+    for (const auto& rec : decimal_records) {
+        auto& price = rec.row.fields[1];
+        auto& amount = rec.row.fields[2];
+        std::cout << "  id=" << rec.row.fields[0].i32_val
+                  << " price=" << price.DecimalToString()
+                  << " (raw=" << price.i64_val << ")"
+                  << " amount=" << amount.DecimalToString()
+                  << " is_decimal=" << price.IsDecimal()
+                  << std::endl;
+    }
+
     return 0;
 }
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 239d9a472a..8125c49cda 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -20,8 +20,8 @@
 #pragma once
 
 #include <chrono>
+#include <cstdint>
 #include <memory>
-#include <optional>
 #include <string>
 #include <unordered_map>
 #include <vector>
@@ -100,7 +100,7 @@ struct Timestamp {
     }
 };
 
-enum class DataType {
+enum class TypeId {
     Boolean = 1,
     TinyInt = 2,
     SmallInt = 3,
@@ -114,6 +114,43 @@ enum class DataType {
     Time = 11,
     Timestamp = 12,
     TimestampLtz = 13,
+    Decimal = 14,
+};
+
+class DataType {
+public:
+    explicit DataType(TypeId id, int32_t p = 0, int32_t s = 0)
+        : id_(id), precision_(p), scale_(s) {}
+
+    static DataType Boolean() { return DataType(TypeId::Boolean); }
+    static DataType TinyInt() { return DataType(TypeId::TinyInt); }
+    static DataType SmallInt() { return DataType(TypeId::SmallInt); }
+    static DataType Int() { return DataType(TypeId::Int); }
+    static DataType BigInt() { return DataType(TypeId::BigInt); }
+    static DataType Float() { return DataType(TypeId::Float); }
+    static DataType Double() { return DataType(TypeId::Double); }
+    static DataType String() { return DataType(TypeId::String); }
+    static DataType Bytes() { return DataType(TypeId::Bytes); }
+    static DataType Date() { return DataType(TypeId::Date); }
+    static DataType Time() { return DataType(TypeId::Time); }
+    static DataType Timestamp(int32_t precision = 6) {
+        return DataType(TypeId::Timestamp, precision, 0);
+    }
+    static DataType TimestampLtz(int32_t precision = 6) {
+        return DataType(TypeId::TimestampLtz, precision, 0);
+    }
+    static DataType Decimal(int32_t precision, int32_t scale) {
+        return DataType(TypeId::Decimal, precision, scale);
+    }
+
+    TypeId id() const { return id_; }
+    int32_t precision() const { return precision_; }
+    int32_t scale() const { return scale_; }
+
+private:
+    TypeId id_;
+    int32_t precision_{0};
+    int32_t scale_{0};
 };
 
 enum class DatumType {
@@ -125,7 +162,9 @@ enum class DatumType {
     Float64 = 5,
     String = 6,
     Bytes = 7,
-    // 8-10 reserved for decimal types
+    DecimalI64 = 8,
+    DecimalI128 = 9,
+    DecimalString = 10,
     Date = 11,
     Time = 12,
     TimestampNtz = 13,
@@ -182,7 +221,7 @@ struct Schema {
     public:
         Builder& AddColumn(std::string name, DataType type,
                            std::string comment = "") {
-            columns_.push_back({std::move(name), type, std::move(comment)});
+            columns_.push_back({std::move(name), std::move(type), std::move(comment)});
             return *this;
         }
 
@@ -290,6 +329,10 @@ struct Datum {
     double f64_val{0.0};
     std::string string_val;
     std::vector<uint8_t> bytes_val;
+    int32_t decimal_precision{0};  // Decimal: precision (total digits)
+    int32_t decimal_scale{0};      // Decimal: scale (digits after decimal point)
+    int64_t i128_hi{0};            // Decimal (i128): high 64 bits of unscaled value
+    int64_t i128_lo{0};            // Decimal (i128): low 64 bits of unscaled value
 
     static Datum Null() { return {}; }
     static Datum Bool(bool v) {
@@ -360,10 +403,75 @@ struct Datum {
         dat.i32_val = ts.nano_of_millisecond;
         return dat;
     }
+    // Stores the decimal string as-is. Rust side will parse via BigDecimal,
+    // look up (p,s) from the schema, validate, and create the Decimal.
+    static Datum DecimalString(std::string str) {
+        Datum d;
+        d.type = DatumType::DecimalString;
+        d.string_val = std::move(str);
+        return d;
+    }
 
     fluss::Date GetDate() const { return {i32_val}; }
     fluss::Time GetTime() const { return {i32_val}; }
     fluss::Timestamp GetTimestamp() const { return {i64_val, i32_val}; }
+
+    bool IsDecimal() const {
+        return type == DatumType::DecimalI64 || type == DatumType::DecimalI128
+            || type == DatumType::DecimalString;
+    }
+
+    std::string DecimalToString() const {
+        if (type == DatumType::DecimalI64) {
+            return FormatUnscaled64(i64_val, decimal_scale);
+        } else if (type == DatumType::DecimalI128) {
+            unsigned __int128 uval = (static_cast<unsigned __int128>(static_cast<uint64_t>(i128_hi)) << 64) |
+                                     static_cast<unsigned __int128>(static_cast<uint64_t>(i128_lo));
+            __int128 val = static_cast<__int128>(uval);
+            return FormatUnscaled128(val, decimal_scale);
+        } else if (type == DatumType::DecimalString) {
+            return string_val;
+        }
+        return "";
+    }
+
+private:
+    static std::string FormatUnscaled64(int64_t unscaled, int32_t scale) {
+        bool negative = unscaled < 0;
+        uint64_t abs_val = negative ? -static_cast<uint64_t>(unscaled) : static_cast<uint64_t>(unscaled);
+        std::string digits = std::to_string(abs_val);
+        if (scale <= 0) {
+            return (negative ? "-" : "") + digits;
+        }
+        while (static_cast<int32_t>(digits.size()) <= scale) {
+            digits = "0" + digits;
+        }
+        auto pos = digits.size() - static_cast<size_t>(scale);
+        return (negative ? "-" : "") + digits.substr(0, pos) + "." + digits.substr(pos);
+    }
+
+    static std::string FormatUnscaled128(__int128 val, int32_t scale) {
+        bool negative = val < 0;
+        unsigned __int128 abs_val = negative ? -static_cast<unsigned __int128>(val)
+                                             : static_cast<unsigned __int128>(val);
+        std::string digits;
+        if (abs_val == 0) {
+            digits = "0";
+        } else {
+            while (abs_val > 0) {
+                digits = static_cast<char>('0' + static_cast<int>(abs_val % 10)) + digits;
+                abs_val /= 10;
+            }
+        }
+        if (scale <= 0) {
+            return (negative ? "-" : "") + digits;
+        }
+        while (static_cast<int32_t>(digits.size()) <= scale) {
+            digits = "0" + digits;
+        }
+        auto pos = digits.size() - static_cast<size_t>(scale);
+        return (negative ? "-" : "") + digits.substr(0, pos) + "." + digits.substr(pos);
+    }
 };
 
 struct GenericRow {
@@ -429,6 +537,11 @@ struct GenericRow {
         fields[idx] = Datum::TimestampLtz(ts);
     }
 
+    void SetDecimal(size_t idx, const std::string& value) {
+        EnsureSize(idx);
+        fields[idx] = Datum::DecimalString(value);
+    }
+
 private:
     void EnsureSize(size_t idx) {
         if (fields.size() <= idx) {
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 63a2e91a7b..e3e63a855c 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -47,8 +47,10 @@ inline ffi::FfiTablePath to_ffi_table_path(const TablePath& path) {
 inline ffi::FfiColumn to_ffi_column(const Column& col) {
     ffi::FfiColumn ffi_col;
     ffi_col.name = rust::String(col.name);
-    ffi_col.data_type = static_cast<int32_t>(col.data_type);
+    ffi_col.data_type = static_cast<int32_t>(col.data_type.id());
     ffi_col.comment = rust::String(col.comment);
+    ffi_col.precision = col.data_type.precision();
+    ffi_col.scale = col.data_type.scale();
     return ffi_col;
 }
 
@@ -112,6 +114,10 @@ inline ffi::FfiDatum to_ffi_datum(const Datum& datum) {
     ffi_datum.f32_val = datum.f32_val;
     ffi_datum.f64_val = datum.f64_val;
     ffi_datum.string_val = rust::String(datum.string_val);
+    ffi_datum.decimal_precision = datum.decimal_precision;
+    ffi_datum.decimal_scale = datum.decimal_scale;
+    ffi_datum.i128_hi = datum.i128_hi;
+    ffi_datum.i128_lo = datum.i128_lo;
 
     rust::Vec<uint8_t> bytes;
     for (auto b : datum.bytes_val) {
@@ -137,7 +143,7 @@ inline ffi::FfiGenericRow to_ffi_generic_row(const GenericRow& row) {
 inline Column from_ffi_column(const ffi::FfiColumn& ffi_col) {
     return Column{
         std::string(ffi_col.name),
-        static_cast<DataType>(ffi_col.data_type),
+        DataType(static_cast<TypeId>(ffi_col.data_type), ffi_col.precision, ffi_col.scale),
         std::string(ffi_col.comment)};
 }
 
@@ -202,6 +208,10 @@ inline Datum from_ffi_datum(const ffi::FfiDatum& ffi_datum) {
     datum.f64_val = ffi_datum.f64_val;
     // todo: avoid copy string
     datum.string_val = std::string(ffi_datum.string_val);
+    datum.decimal_precision = ffi_datum.decimal_precision;
+    datum.decimal_scale = ffi_datum.decimal_scale;
+    datum.i128_hi = ffi_datum.i128_hi;
+    datum.i128_lo = ffi_datum.i128_lo;
 
     for (auto b : ffi_datum.bytes_val) {
         datum.bytes_val.push_back(b);
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 5a266135df..4aeb13dbe8 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -51,6 +51,8 @@ mod ffi {
         name: String,
         data_type: i32,
         comment: String,
+        precision: i32,
+        scale: i32,
     }
 
     struct FfiSchema {
@@ -98,6 +100,10 @@ mod ffi {
         f64_val: f64,
         string_val: String,
         bytes_val: Vec<u8>,
+        decimal_precision: i32,
+        decimal_scale: i32,
+        i128_hi: i64,
+        i128_lo: i64,
     }
 
     struct FfiGenericRow {
@@ -301,6 +307,7 @@ pub struct Table {
 
 pub struct AppendWriter {
     inner: fcore::client::AppendWriter,
+    table_info: fcore::metadata::TableInfo,
 }
 
 pub struct WriteResult {
@@ -636,7 +643,10 @@ impl Table {
             Ok(w) => w,
             Err(e) => return Err(format!("Failed to create writer: {e}")),
         };
-        let writer = Box::into_raw(Box::new(AppendWriter { inner: writer }));
+        let writer = Box::into_raw(Box::new(AppendWriter {
+            inner: writer,
+            table_info: self.table_info.clone(),
+        }));
         Ok(writer)
     }
 
@@ -792,7 +802,8 @@ unsafe fn delete_append_writer(writer: *mut AppendWriter) {
 
 impl AppendWriter {
     fn append(&mut self, row: &ffi::FfiGenericRow) -> Result<Box<WriteResult>, String> {
-        let generic_row = types::ffi_row_to_core(row);
+        let schema = self.table_info.get_schema();
+        let generic_row = types::ffi_row_to_core(row, Some(schema)).map_err(|e| e.to_string())?;
 
         let result_future = self
             .inner
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index f546b6824c..7837032eab 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -18,8 +18,8 @@
 use crate::ffi;
 use anyhow::{Result, anyhow};
 use arrow::array::{
-    Date32Array, LargeBinaryArray, LargeStringArray, Time32MillisecondArray, Time32SecondArray,
-    Time64MicrosecondArray, Time64NanosecondArray, TimestampMicrosecondArray,
+    Date32Array, Decimal128Array, LargeBinaryArray, LargeStringArray, Time32MillisecondArray,
+    Time32SecondArray, Time64MicrosecondArray, Time64NanosecondArray, TimestampMicrosecondArray,
     TimestampMillisecondArray, TimestampNanosecondArray, TimestampSecondArray,
 };
 use arrow::datatypes::{DataType as ArrowDataType, TimeUnit};
@@ -27,6 +27,7 @@ use arrow::ffi::{FFI_ArrowArray, FFI_ArrowSchema};
 use fcore::row::InternalRow;
 use fluss as fcore;
 use std::borrow::Cow;
+use std::str::FromStr;
 
 use arrow::array::Array;
 
@@ -43,6 +44,7 @@ pub const DATA_TYPE_DATE: i32 = 10;
 pub const DATA_TYPE_TIME: i32 = 11;
 pub const DATA_TYPE_TIMESTAMP: i32 = 12;
 pub const DATA_TYPE_TIMESTAMP_LTZ: i32 = 13;
+pub const DATA_TYPE_DECIMAL: i32 = 14;
 
 pub const DATUM_TYPE_NULL: i32 = 0;
 pub const DATUM_TYPE_BOOL: i32 = 1;
@@ -52,6 +54,9 @@ pub const DATUM_TYPE_FLOAT32: i32 = 4;
 pub const DATUM_TYPE_FLOAT64: i32 = 5;
 pub const DATUM_TYPE_STRING: i32 = 6;
 pub const DATUM_TYPE_BYTES: i32 = 7;
+pub const DATUM_TYPE_DECIMAL_I64: i32 = 8;
+pub const DATUM_TYPE_DECIMAL_I128: i32 = 9;
+pub const DATUM_TYPE_DECIMAL_STRING: i32 = 10;
 pub const DATUM_TYPE_DATE: i32 = 11;
 pub const DATUM_TYPE_TIME: i32 = 12;
 pub const DATUM_TYPE_TIMESTAMP_NTZ: i32 = 13;
@@ -62,7 +67,7 @@ const MICROS_PER_MILLI: i64 = 1_000;
 const NANOS_PER_MICRO: i64 = 1_000;
 const NANOS_PER_MILLI: i64 = 1_000_000;
 
-fn ffi_data_type_to_core(dt: i32) -> Result<fcore::metadata::DataType> {
+fn ffi_data_type_to_core(dt: i32, precision: u32, scale: u32) -> Result<fcore::metadata::DataType> {
     match dt {
         DATA_TYPE_BOOLEAN => Ok(fcore::metadata::DataTypes::boolean()),
         DATA_TYPE_TINYINT => Ok(fcore::metadata::DataTypes::tinyint()),
@@ -75,8 +80,16 @@ fn ffi_data_type_to_core(dt: i32) -> Result<fcore::metadata::DataType> {
         DATA_TYPE_BYTES => Ok(fcore::metadata::DataTypes::bytes()),
         DATA_TYPE_DATE => Ok(fcore::metadata::DataTypes::date()),
         DATA_TYPE_TIME => Ok(fcore::metadata::DataTypes::time()),
-        DATA_TYPE_TIMESTAMP => Ok(fcore::metadata::DataTypes::timestamp()),
-        DATA_TYPE_TIMESTAMP_LTZ => Ok(fcore::metadata::DataTypes::timestamp_ltz()),
+        DATA_TYPE_TIMESTAMP => Ok(fcore::metadata::DataTypes::timestamp_with_precision(
+            precision,
+        )),
+        DATA_TYPE_TIMESTAMP_LTZ => Ok(fcore::metadata::DataTypes::timestamp_ltz_with_precision(
+            precision,
+        )),
+        DATA_TYPE_DECIMAL => {
+            let dt = fcore::metadata::DecimalType::new(precision, scale)?;
+            Ok(fcore::metadata::DataType::Decimal(dt))
+        }
         _ => Err(anyhow!("Unknown data type: {dt}")),
     }
 }
@@ -96,6 +109,7 @@ fn core_data_type_to_ffi(dt: &fcore::metadata::DataType) -> i32 {
         fcore::metadata::DataType::Time(_) => DATA_TYPE_TIME,
         fcore::metadata::DataType::Timestamp(_) => DATA_TYPE_TIMESTAMP,
         fcore::metadata::DataType::TimestampLTz(_) => DATA_TYPE_TIMESTAMP_LTZ,
+        fcore::metadata::DataType::Decimal(_) => DATA_TYPE_DECIMAL,
         _ => 0,
     }
 }
@@ -106,7 +120,13 @@ pub fn ffi_descriptor_to_core(
     let mut schema_builder = fcore::metadata::Schema::builder();
 
     for col in &descriptor.schema.columns {
-        let dt = ffi_data_type_to_core(col.data_type)?;
+        if col.precision < 0 || col.scale < 0 {
+            return Err(anyhow!(
+                "Column '{}': precision and scale must be non-negative",
+                col.name
+            ));
+        }
+        let dt = ffi_data_type_to_core(col.data_type, col.precision as u32, col.scale as u32)?;
         schema_builder = schema_builder.column(&col.name, dt);
         if !col.comment.is_empty() {
             schema_builder = schema_builder.with_comment(&col.comment);
@@ -148,10 +168,22 @@ pub fn core_table_info_to_ffi(info: &fcore::metadata::TableInfo) -> ffi::FfiTabl
     let columns: Vec<ffi::FfiColumn> = schema
         .columns()
         .iter()
-        .map(|col| ffi::FfiColumn {
-            name: col.name().to_string(),
-            data_type: core_data_type_to_ffi(col.data_type()),
-            comment: col.comment().unwrap_or("").to_string(),
+        .map(|col| {
+            let (precision, scale) = match col.data_type() {
+                fcore::metadata::DataType::Decimal(dt) => {
+                    (dt.precision() as i32, dt.scale() as i32)
+                }
+                fcore::metadata::DataType::Timestamp(dt) => (dt.precision() as i32, 0),
+                fcore::metadata::DataType::TimestampLTz(dt) => (dt.precision() as i32, 0),
+                _ => (0, 0),
+            };
+            ffi::FfiColumn {
+                name: col.name().to_string(),
+                data_type: core_data_type_to_ffi(col.data_type()),
+                comment: col.comment().unwrap_or("").to_string(),
+                precision,
+                scale,
+            }
         })
         .collect();
 
@@ -218,7 +250,21 @@ pub fn empty_table_info() -> ffi::FfiTableInfo {
     }
 }
 
-pub fn ffi_row_to_core(row: &ffi::FfiGenericRow) -> fcore::row::GenericRow<'_> {
+/// Look up decimal (precision, scale) from schema for column `idx`.
+fn get_decimal_type(idx: usize, schema: Option<&fcore::metadata::Schema>) -> Result<(u32, u32)> {
+    let col = schema
+        .and_then(|s| s.columns().get(idx))
+        .ok_or_else(|| anyhow!("Schema not available for decimal column {idx}"))?;
+    match col.data_type() {
+        fcore::metadata::DataType::Decimal(dt) => Ok((dt.precision(), dt.scale())),
+        other => Err(anyhow!("Column {idx} is {:?}, not Decimal", other)),
+    }
+}
+
+pub fn ffi_row_to_core<'a>(
+    row: &'a ffi::FfiGenericRow,
+    schema: Option<&fcore::metadata::Schema>,
+) -> Result<fcore::row::GenericRow<'a>> {
     use fcore::row::Datum;
 
     let mut generic_row = fcore::row::GenericRow::new(row.fields.len());
@@ -233,6 +279,40 @@ pub fn ffi_row_to_core(row: &ffi::FfiGenericRow) -> fcore::row::GenericRow<'_> {
             DATUM_TYPE_FLOAT64 => Datum::Float64(field.f64_val.into()),
             DATUM_TYPE_STRING => Datum::String(Cow::Borrowed(field.string_val.as_str())),
             DATUM_TYPE_BYTES => Datum::Blob(Cow::Borrowed(field.bytes_val.as_slice())),
+            DATUM_TYPE_DECIMAL_STRING => {
+                let (precision, scale) = get_decimal_type(idx, schema)?;
+                let bd =
+                    bigdecimal::BigDecimal::from_str(field.string_val.as_str()).map_err(|e| {
+                        anyhow!(
+                            "Column {idx}: invalid decimal string '{}': {e}",
+                            field.string_val
+                        )
+                    })?;
+                let decimal = fcore::row::Decimal::from_big_decimal(bd, precision, scale)
+                    .map_err(|e| anyhow!("Column {idx}: {e}"))?;
+                Datum::Decimal(decimal)
+            }
+            DATUM_TYPE_DECIMAL_I64 => {
+                let precision = field.decimal_precision as u32;
+                let scale = field.decimal_scale as u32;
+                let decimal =
+                    fcore::row::Decimal::from_unscaled_long(field.i64_val, precision, scale)
+                        .map_err(|e| anyhow!("Column {idx}: {e}"))?;
+                Datum::Decimal(decimal)
+            }
+            DATUM_TYPE_DECIMAL_I128 => {
+                let precision = field.decimal_precision as u32;
+                let scale = field.decimal_scale as u32;
+                let i128_val = ((field.i128_hi as i128) << 64) | (field.i128_lo as u64 as i128);
+                let decimal = fcore::row::Decimal::from_arrow_decimal128(
+                    i128_val,
+                    scale as i64,
+                    precision,
+                    scale,
+                )
+                .map_err(|e| anyhow!("Column {idx}: {e}"))?;
+                Datum::Decimal(decimal)
+            }
             DATUM_TYPE_DATE => Datum::Date(fcore::row::Date::new(field.i32_val)),
             DATUM_TYPE_TIME => Datum::Time(fcore::row::Time::new(field.i32_val)),
             DATUM_TYPE_TIMESTAMP_NTZ => Datum::TimestampNtz(
@@ -243,12 +323,12 @@ pub fn ffi_row_to_core(row: &ffi::FfiGenericRow) -> fcore::row::GenericRow<'_> {
                 fcore::row::TimestampLtz::from_millis_nanos(field.i64_val, field.i32_val)
                     .unwrap_or_else(|_| fcore::row::TimestampLtz::new(field.i64_val)),
             ),
-            _ => Datum::Null,
+            other => return Err(anyhow!("Column {idx}: unknown datum type {other}")),
         };
         generic_row.set_field(idx, datum);
     }
 
-    generic_row
+    Ok(generic_row)
 }
 
 pub fn core_scan_records_to_ffi(
@@ -292,6 +372,10 @@ fn core_row_to_ffi_fields(
             f64_val: 0.0,
             string_val: String::new(),
             bytes_val: vec![],
+            decimal_precision: 0,
+            decimal_scale: 0,
+            i128_hi: 0,
+            i128_lo: 0,
         }
     }
 
@@ -485,6 +569,29 @@ fn core_row_to_ffi_fields(
                 }
                 _ => panic!("Will never come here. Unsupported Time64 unit for column {i}"),
             },
+            ArrowDataType::Decimal128(precision, scale) => {
+                let array = record_batch
+                    .column(i)
+                    .as_any()
+                    .downcast_ref::<Decimal128Array>()
+                    .expect("Decimal128 column expected");
+                let i128_val = array.value(row_id);
+
+                if fcore::row::Decimal::is_compact_precision(*precision as u32) {
+                    let mut datum = new_datum(DATUM_TYPE_DECIMAL_I64);
+                    datum.i64_val = i128_val as i64;
+                    datum.decimal_precision = *precision as i32;
+                    datum.decimal_scale = *scale as i32;
+                    datum
+                } else {
+                    let mut datum = new_datum(DATUM_TYPE_DECIMAL_I128);
+                    datum.i128_hi = (i128_val >> 64) as i64;
+                    datum.i128_lo = i128_val as i64;
+                    datum.decimal_precision = *precision as i32;
+                    datum.decimal_scale = *scale as i32;
+                    datum
+                }
+            }
             other => panic!(
                 "Will never come here. Unsupported Arrow data type for column {i}: {other:?}"
             ),
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 4d9be026f5..db1348a086 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -59,7 +59,7 @@ tokio = { workspace = true }
 parking_lot = "0.12"
 bytes = "1.10.1"
 dashmap = "6.1.0"
-bigdecimal = { version = "0.4", features = ["serde"] }
+bigdecimal = { workspace = true, features = ["serde"] }
 ordered-float = { version = "5", features = ["serde"] }
 parse-display = "0.10"
 jiff = { workspace = true }

From ac28f8ee5acc2bc756097ebbf47a8103ae292894 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 8 Feb 2026 04:06:16 +0000
Subject: [PATCH 125/287] feat: Add subscribe_partition_buckets method and
 partitions support (#273)

---
 fluss-rust/bindings/cpp/examples/example.cpp  | 253 +++++++++++++-----
 fluss-rust/bindings/cpp/include/fluss.hpp     | 157 ++++++-----
 fluss-rust/bindings/cpp/src/admin.cpp         |  21 ++
 fluss-rust/bindings/cpp/src/lib.rs            |  83 ++++++
 fluss-rust/bindings/cpp/src/table.cpp         |  71 +++--
 fluss-rust/bindings/python/example/example.py |  12 +
 fluss-rust/bindings/python/fluss/__init__.pyi |  10 +
 fluss-rust/bindings/python/src/table.rs       |  26 +-
 .../crates/fluss/src/client/table/scanner.rs  |  71 ++++-
 .../fluss/tests/integration/log_table.rs      |  49 ++++
 10 files changed, 556 insertions(+), 197 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index efdf2e80ba..e6f9619b21 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -26,8 +26,8 @@
 
 static void check(const char* step, const fluss::Result& r) {
     if (!r.Ok()) {
-        std::cerr << step << " failed: code=" << r.error_code
-                  << " msg=" << r.error_message << std::endl;
+        std::cerr << step << " failed: code=" << r.error_code << " msg=" << r.error_message
+                  << std::endl;
         std::exit(1);
     }
 }
@@ -54,15 +54,15 @@ int main() {
 
     // 3) Schema with scalar and temporal columns
     auto schema = fluss::Schema::NewBuilder()
-                        .AddColumn("id", fluss::DataType::Int())
-                        .AddColumn("name", fluss::DataType::String())
-                        .AddColumn("score", fluss::DataType::Float())
-                        .AddColumn("age", fluss::DataType::Int())
-                        .AddColumn("event_date", fluss::DataType::Date())
-                        .AddColumn("event_time", fluss::DataType::Time())
-                        .AddColumn("created_at", fluss::DataType::Timestamp())
-                        .AddColumn("updated_at", fluss::DataType::TimestampLtz())
-                        .Build();
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .AddColumn("score", fluss::DataType::Float())
+                      .AddColumn("age", fluss::DataType::Int())
+                      .AddColumn("event_date", fluss::DataType::Date())
+                      .AddColumn("event_time", fluss::DataType::Time())
+                      .AddColumn("created_at", fluss::DataType::Timestamp())
+                      .AddColumn("updated_at", fluss::DataType::TimestampLtz())
+                      .Build();
 
     auto descriptor = fluss::TableDescriptor::NewBuilder()
                           .SetSchema(schema)
@@ -94,17 +94,13 @@ int main() {
 
     auto tp_now = std::chrono::system_clock::now();
     std::vector<RowData> rows = {
-        {1, "Alice", 95.2f, 25,
-         fluss::Date::FromYMD(2024, 6, 15), fluss::Time::FromHMS(14, 30, 45),
-         fluss::Timestamp::FromTimePoint(tp_now),
-         fluss::Timestamp::FromMillis(1718467200000)},
-        {2, "Bob", 87.2f, 30,
-         fluss::Date::FromYMD(2025, 1, 1), fluss::Time::FromHMS(0, 0, 0),
+        {1, "Alice", 95.2f, 25, fluss::Date::FromYMD(2024, 6, 15), fluss::Time::FromHMS(14, 30, 45),
+         fluss::Timestamp::FromTimePoint(tp_now), fluss::Timestamp::FromMillis(1718467200000)},
+        {2, "Bob", 87.2f, 30, fluss::Date::FromYMD(2025, 1, 1), fluss::Time::FromHMS(0, 0, 0),
          fluss::Timestamp::FromMillis(1735689600000),
          fluss::Timestamp::FromMillisNanos(1735689600000, 500000)},
-        {3, "Charlie", 92.1f, 35,
-         fluss::Date::FromYMD(1999, 12, 31), fluss::Time::FromHMS(23, 59, 59),
-         fluss::Timestamp::FromMillis(946684799999),
+        {3, "Charlie", 92.1f, 35, fluss::Date::FromYMD(1999, 12, 31),
+         fluss::Time::FromHMS(23, 59, 59), fluss::Timestamp::FromMillis(946684799999),
          fluss::Timestamp::FromMillis(946684799999)},
     };
 
@@ -160,23 +156,23 @@ int main() {
         const auto& f = rec.row.fields;
 
         if (f[4].type != fluss::DatumType::Date) {
-            std::cerr << "ERROR: field 4 expected Date, got "
-                      << static_cast<int>(f[4].type) << std::endl;
+            std::cerr << "ERROR: field 4 expected Date, got " << static_cast<int>(f[4].type)
+                      << std::endl;
             scan_ok = false;
         }
         if (f[5].type != fluss::DatumType::Time) {
-            std::cerr << "ERROR: field 5 expected Time, got "
-                      << static_cast<int>(f[5].type) << std::endl;
+            std::cerr << "ERROR: field 5 expected Time, got " << static_cast<int>(f[5].type)
+                      << std::endl;
             scan_ok = false;
         }
         if (f[6].type != fluss::DatumType::TimestampNtz) {
-            std::cerr << "ERROR: field 6 expected TimestampNtz, got "
-                      << static_cast<int>(f[6].type) << std::endl;
+            std::cerr << "ERROR: field 6 expected TimestampNtz, got " << static_cast<int>(f[6].type)
+                      << std::endl;
             scan_ok = false;
         }
         if (f[7].type != fluss::DatumType::TimestampLtz) {
-            std::cerr << "ERROR: field 7 expected TimestampLtz, got "
-                      << static_cast<int>(f[7].type) << std::endl;
+            std::cerr << "ERROR: field 7 expected TimestampLtz, got " << static_cast<int>(f[7].type)
+                      << std::endl;
             scan_ok = false;
         }
 
@@ -185,15 +181,11 @@ int main() {
         auto ts_ntz = f[6].GetTimestamp();
         auto ts_ltz = f[7].GetTimestamp();
 
-        std::cout << "  id=" << f[0].i32_val
-                  << " name=" << f[1].string_val
-                  << " score=" << f[2].f32_val
-                  << " age=" << f[3].i32_val
-                  << " date=" << date.Year() << "-" << date.Month() << "-" << date.Day()
-                  << " time=" << time.Hour() << ":" << time.Minute() << ":" << time.Second()
-                  << " ts_ntz=" << ts_ntz.epoch_millis
-                  << " ts_ltz=" << ts_ltz.epoch_millis
-                  << "+" << ts_ltz.nano_of_millisecond << "ns"
+        std::cout << "  id=" << f[0].i32_val << " name=" << f[1].string_val
+                  << " score=" << f[2].f32_val << " age=" << f[3].i32_val << " date=" << date.Year()
+                  << "-" << date.Month() << "-" << date.Day() << " time=" << time.Hour() << ":"
+                  << time.Minute() << ":" << time.Second() << " ts_ntz=" << ts_ntz.epoch_millis
+                  << " ts_ltz=" << ts_ltz.epoch_millis << "+" << ts_ltz.nano_of_millisecond << "ns"
                   << std::endl;
     }
 
@@ -237,9 +229,8 @@ int main() {
         }
 
         auto ts = f[1].GetTimestamp();
-        std::cout << "  id=" << f[0].i32_val
-                  << " updated_at=" << ts.epoch_millis
-                  << "+" << ts.nano_of_millisecond << "ns" << std::endl;
+        std::cout << "  id=" << f[0].i32_val << " updated_at=" << ts.epoch_millis << "+"
+                  << ts.nano_of_millisecond << "ns" << std::endl;
     }
 
     if (scan_ok) {
@@ -260,19 +251,16 @@ int main() {
 
     std::unordered_map<int32_t, int64_t> earliest_offsets;
     check("list_earliest_offsets",
-          admin.ListOffsets(table_path, all_bucket_ids,
-                           fluss::OffsetQuery::Earliest(),
-                           earliest_offsets));
+          admin.ListOffsets(table_path, all_bucket_ids, fluss::OffsetQuery::Earliest(),
+                            earliest_offsets));
     std::cout << "Earliest offsets:" << std::endl;
     for (const auto& [bucket_id, offset] : earliest_offsets) {
         std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
     }
 
     std::unordered_map<int32_t, int64_t> latest_offsets;
-    check("list_latest_offsets",
-          admin.ListOffsets(table_path, all_bucket_ids,
-                           fluss::OffsetQuery::Latest(),
-                           latest_offsets));
+    check("list_latest_offsets", admin.ListOffsets(table_path, all_bucket_ids,
+                                                   fluss::OffsetQuery::Latest(), latest_offsets));
     std::cout << "Latest offsets:" << std::endl;
     for (const auto& [bucket_id, offset] : latest_offsets) {
         std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
@@ -280,14 +268,14 @@ int main() {
 
     auto now = std::chrono::system_clock::now();
     auto one_hour_ago = now - std::chrono::hours(1);
-    auto timestamp_ms = std::chrono::duration_cast<std::chrono::milliseconds>(
-        one_hour_ago.time_since_epoch()).count();
+    auto timestamp_ms =
+        std::chrono::duration_cast<std::chrono::milliseconds>(one_hour_ago.time_since_epoch())
+            .count();
 
     std::unordered_map<int32_t, int64_t> timestamp_offsets;
     check("list_timestamp_offsets",
           admin.ListOffsets(table_path, all_bucket_ids,
-                           fluss::OffsetQuery::FromTimestamp(timestamp_ms),
-                           timestamp_offsets));
+                            fluss::OffsetQuery::FromTimestamp(timestamp_ms), timestamp_offsets));
     std::cout << "Offsets for timestamp " << timestamp_ms << " (1 hour ago):" << std::endl;
     for (const auto& [bucket_id, offset] : timestamp_offsets) {
         std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
@@ -301,8 +289,8 @@ int main() {
     std::vector<fluss::BucketSubscription> subscriptions;
     for (const auto& [bucket_id, offset] : earliest_offsets) {
         subscriptions.push_back({bucket_id, offset});
-        std::cout << "Preparing subscription: bucket=" << bucket_id
-                  << ", offset=" << offset << std::endl;
+        std::cout << "Preparing subscription: bucket=" << bucket_id << ", offset=" << offset
+                  << std::endl;
     }
 
     check("subscribe_buckets", batch_scanner.Subscribe(subscriptions));
@@ -311,12 +299,12 @@ int main() {
     fluss::ScanRecords batch_records;
     check("poll_batch", batch_scanner.Poll(5000, batch_records));
 
-    std::cout << "Scanned " << batch_records.Size() << " records from batch subscription" << std::endl;
+    std::cout << "Scanned " << batch_records.Size() << " records from batch subscription"
+              << std::endl;
     for (size_t i = 0; i < batch_records.Size() && i < 5; ++i) {
         const auto& rec = batch_records[i];
         std::cout << "  Record " << i << ": bucket_id=" << rec.bucket_id
-                  << ", offset=" << rec.offset
-                  << ", timestamp=" << rec.timestamp << std::endl;
+                  << ", offset=" << rec.offset << ", timestamp=" << rec.timestamp << std::endl;
     }
     if (batch_records.Size() > 5) {
         std::cout << "  ... and " << (batch_records.Size() - 5) << " more records" << std::endl;
@@ -339,7 +327,8 @@ int main() {
     for (size_t i = 0; i < arrow_batches.Size(); ++i) {
         const auto& batch = arrow_batches[i];
         if (batch->Available()) {
-            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows() << " rows" << std::endl;
+            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows()
+                      << " rows" << std::endl;
         } else {
             std::cout << "  Batch " << i << ": not available" << std::endl;
         }
@@ -350,20 +339,25 @@ int main() {
 
     fluss::LogScanner projected_arrow_scanner;
     check("new_record_batch_log_scanner_with_projection",
-          table.NewScan().Project(projected_columns).CreateRecordBatchScanner(projected_arrow_scanner));
+          table.NewScan()
+              .Project(projected_columns)
+              .CreateRecordBatchScanner(projected_arrow_scanner));
 
     for (int b = 0; b < buckets; ++b) {
         check("subscribe_projected_arrow", projected_arrow_scanner.Subscribe(b, 0));
     }
 
     fluss::ArrowRecordBatches projected_arrow_batches;
-    check("poll_projected_record_batch", projected_arrow_scanner.PollRecordBatch(5000, projected_arrow_batches));
+    check("poll_projected_record_batch",
+          projected_arrow_scanner.PollRecordBatch(5000, projected_arrow_batches));
 
-    std::cout << "Polled " << projected_arrow_batches.Size() << " projected Arrow record batches" << std::endl;
+    std::cout << "Polled " << projected_arrow_batches.Size() << " projected Arrow record batches"
+              << std::endl;
     for (size_t i = 0; i < projected_arrow_batches.Size(); ++i) {
         const auto& batch = projected_arrow_batches[i];
         if (batch->Available()) {
-            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows() << " rows" << std::endl;
+            std::cout << "  Batch " << i << ": " << batch->GetArrowRecordBatch()->num_rows()
+                      << " rows" << std::endl;
         } else {
             std::cout << "  Batch " << i << ": not available" << std::endl;
         }
@@ -380,8 +374,8 @@ int main() {
     // Create schema with decimal columns
     auto decimal_schema = fluss::Schema::NewBuilder()
                               .AddColumn("id", fluss::DataType::Int())
-                              .AddColumn("price", fluss::DataType::Decimal(10, 2))    // compact
-                              .AddColumn("amount", fluss::DataType::Decimal(28, 8))   // i128
+                              .AddColumn("price", fluss::DataType::Decimal(10, 2))   // compact
+                              .AddColumn("amount", fluss::DataType::Decimal(28, 8))  // i128
                               .Build();
 
     auto decimal_descriptor = fluss::TableDescriptor::NewBuilder()
@@ -403,8 +397,8 @@ int main() {
     {
         fluss::GenericRow row;
         row.SetInt32(0, 1);
-        row.SetDecimal(1, "123.45");       // Rust knows DECIMAL(10,2)
-        row.SetDecimal(2, "1.00000000");   // Rust knows DECIMAL(28,8)
+        row.SetDecimal(1, "123.45");      // Rust knows DECIMAL(10,2)
+        row.SetDecimal(2, "1.00000000");  // Rust knows DECIMAL(28,8)
         check("append_decimal", decimal_writer.Append(row));
     }
     {
@@ -436,13 +430,134 @@ int main() {
     for (const auto& rec : decimal_records) {
         auto& price = rec.row.fields[1];
         auto& amount = rec.row.fields[2];
-        std::cout << "  id=" << rec.row.fields[0].i32_val
-                  << " price=" << price.DecimalToString()
+        std::cout << "  id=" << rec.row.fields[0].i32_val << " price=" << price.DecimalToString()
                   << " (raw=" << price.i64_val << ")"
-                  << " amount=" << amount.DecimalToString()
-                  << " is_decimal=" << price.IsDecimal()
+                  << " amount=" << amount.DecimalToString() << " is_decimal=" << price.IsDecimal()
                   << std::endl;
     }
 
+    // 13) Partitioned table example
+    std::cout << "\n=== Partitioned Table Example ===" << std::endl;
+
+    fluss::TablePath partitioned_table_path("fluss", "partitioned_table_cpp_v1");
+
+    // Drop if exists
+    check("drop_partitioned_table_if_exists", admin.DropTable(partitioned_table_path, true));
+
+    // Create a partitioned table with a "region" partition key
+    auto partitioned_schema = fluss::Schema::NewBuilder()
+                                  .AddColumn("id", fluss::DataType::Int())
+                                  .AddColumn("region", fluss::DataType::String())
+                                  .AddColumn("value", fluss::DataType::BigInt())
+                                  .Build();
+
+    auto partitioned_descriptor = fluss::TableDescriptor::NewBuilder()
+                                      .SetSchema(partitioned_schema)
+                                      .SetPartitionKeys({"region"})
+                                      .SetBucketCount(1)
+                                      .SetComment("cpp partitioned table example")
+                                      .Build();
+
+    check("create_partitioned_table",
+          admin.CreateTable(partitioned_table_path, partitioned_descriptor, false));
+    std::cout << "Created partitioned table" << std::endl;
+
+    // Create partitions
+    check("create_partition_US",
+          admin.CreatePartition(partitioned_table_path, {{"region", "US"}}, true));
+    check("create_partition_EU",
+          admin.CreatePartition(partitioned_table_path, {{"region", "EU"}}, true));
+    std::cout << "Created partitions: US, EU" << std::endl;
+
+    // List partitions
+    std::vector<fluss::PartitionInfo> partition_infos;
+    check("list_partition_infos",
+          admin.ListPartitionInfos(partitioned_table_path, partition_infos));
+    for (const auto& pi : partition_infos) {
+        std::cout << "  Partition: " << pi.partition_name << " (id=" << pi.partition_id << ")"
+                  << std::endl;
+    }
+
+    // Write data to partitioned table
+    fluss::Table partitioned_table;
+    check("get_partitioned_table", conn.GetTable(partitioned_table_path, partitioned_table));
+
+    fluss::AppendWriter partitioned_writer;
+    check("new_partitioned_writer", partitioned_table.NewAppendWriter(partitioned_writer));
+
+    struct PartitionedRow {
+        int id;
+        const char* region;
+        int64_t value;
+    };
+
+    std::vector<PartitionedRow> partitioned_rows = {
+        {1, "US", 100},
+        {2, "US", 200},
+        {3, "EU", 300},
+        {4, "EU", 400},
+    };
+
+    for (const auto& r : partitioned_rows) {
+        fluss::GenericRow row;
+        row.SetInt32(0, r.id);
+        row.SetString(1, r.region);
+        row.SetInt64(2, r.value);
+        check("append_partitioned", partitioned_writer.Append(row));
+    }
+    check("flush_partitioned", partitioned_writer.Flush());
+    std::cout << "Wrote " << partitioned_rows.size() << " rows to partitioned table" << std::endl;
+
+    // 13.1) subscribe_partition_buckets: subscribe to each partition individually
+    std::cout << "\n--- Testing SubscribePartitionBuckets ---" << std::endl;
+    fluss::LogScanner partition_scanner;
+    check("new_partition_scanner", partitioned_table.NewScan().CreateLogScanner(partition_scanner));
+
+    for (const auto& pi : partition_infos) {
+        check("subscribe_partition_buckets",
+              partition_scanner.SubscribePartitionBuckets(pi.partition_id, 0, 0));
+        std::cout << "Subscribed to partition " << pi.partition_name << std::endl;
+    }
+
+    fluss::ScanRecords partition_records;
+    check("poll_partitioned", partition_scanner.Poll(5000, partition_records));
+    std::cout << "Scanned " << partition_records.Size() << " records from partitioned table"
+              << std::endl;
+    for (size_t i = 0; i < partition_records.Size(); ++i) {
+        const auto& rec = partition_records[i];
+        std::cout << "  Record " << i << ": id=" << rec.row.fields[0].i32_val
+                  << ", region=" << rec.row.fields[1].string_val
+                  << ", value=" << rec.row.fields[2].i64_val << std::endl;
+    }
+
+    // 13.2) subscribe_partition_buckets: batch subscribe to all partitions at once
+    std::cout << "\n--- Testing SubscribePartitionBuckets (batch) ---" << std::endl;
+    fluss::LogScanner partition_batch_scanner;
+    check("new_partition_batch_scanner",
+          partitioned_table.NewScan().CreateLogScanner(partition_batch_scanner));
+
+    std::vector<fluss::PartitionBucketSubscription> partition_subs;
+    for (const auto& pi : partition_infos) {
+        partition_subs.push_back({pi.partition_id, 0, 0});
+    }
+    check("subscribe_partition_buckets",
+          partition_batch_scanner.SubscribePartitionBuckets(partition_subs));
+    std::cout << "Batch subscribed to " << partition_subs.size() << " partition+bucket combinations"
+              << std::endl;
+
+    fluss::ScanRecords partition_batch_records;
+    check("poll_partition_batch", partition_batch_scanner.Poll(5000, partition_batch_records));
+    std::cout << "Scanned " << partition_batch_records.Size()
+              << " records from batch partition subscription" << std::endl;
+    for (size_t i = 0; i < partition_batch_records.Size(); ++i) {
+        const auto& rec = partition_batch_records[i];
+        std::cout << "  Record " << i << ": id=" << rec.row.fields[0].i32_val
+                  << ", region=" << rec.row.fields[1].string_val
+                  << ", value=" << rec.row.fields[2].i64_val << std::endl;
+    }
+
+    // Cleanup
+    check("drop_partitioned_table", admin.DropTable(partitioned_table_path, true));
+    std::cout << "Dropped partitioned table" << std::endl;
     return 0;
 }
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 8125c49cda..3a10445516 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -28,18 +28,18 @@
 
 // Forward declare Arrow classes to avoid including heavy Arrow headers in header
 namespace arrow {
-    class RecordBatch;
+class RecordBatch;
 }
 
 namespace fluss {
 
 namespace ffi {
-    struct Connection;
-    struct Admin;
-    struct Table;
-    struct AppendWriter;
-    struct WriteResult;
-    struct LogScanner;
+struct Connection;
+struct Admin;
+struct Table;
+struct AppendWriter;
+struct WriteResult;
+struct LogScanner;
 }  // namespace ffi
 
 struct Date {
@@ -62,8 +62,8 @@ struct Time {
 
     static Time FromMillis(int32_t ms) { return {ms}; }
     static Time FromHMS(int hour, int minute, int second, int millis = 0) {
-        return {hour * kMillisPerHour + minute * kMillisPerMinute +
-                second * kMillisPerSecond + millis};
+        return {hour * kMillisPerHour + minute * kMillisPerMinute + second * kMillisPerSecond +
+                millis};
     }
 
     int Hour() const { return millis_since_midnight / kMillisPerHour; }
@@ -87,9 +87,7 @@ struct Timestamp {
     }
     static Timestamp FromTimePoint(std::chrono::system_clock::time_point tp) {
         auto duration = tp.time_since_epoch();
-        auto ns =
-            std::chrono::duration_cast<std::chrono::nanoseconds>(duration)
-                .count();
+        auto ns = std::chrono::duration_cast<std::chrono::nanoseconds>(duration).count();
         auto ms = ns / kNanosPerMilli;
         auto nano_of_ms = static_cast<int32_t>(ns % kNanosPerMilli);
         if (nano_of_ms < 0) {
@@ -118,7 +116,7 @@ enum class TypeId {
 };
 
 class DataType {
-public:
+   public:
     explicit DataType(TypeId id, int32_t p = 0, int32_t s = 0)
         : id_(id), precision_(p), scale_(s) {}
 
@@ -147,7 +145,7 @@ class DataType {
     int32_t precision() const { return precision_; }
     int32_t scale() const { return scale_; }
 
-private:
+   private:
     TypeId id_;
     int32_t precision_{0};
     int32_t scale_{0};
@@ -218,9 +216,8 @@ struct Schema {
     std::vector<std::string> primary_keys;
 
     class Builder {
-    public:
-        Builder& AddColumn(std::string name, DataType type,
-                           std::string comment = "") {
+       public:
+        Builder& AddColumn(std::string name, DataType type, std::string comment = "") {
             columns_.push_back({std::move(name), std::move(type), std::move(comment)});
             return *this;
         }
@@ -230,11 +227,9 @@ struct Schema {
             return *this;
         }
 
-        Schema Build() {
-            return Schema{std::move(columns_), std::move(primary_keys_)};
-        }
+        Schema Build() { return Schema{std::move(columns_), std::move(primary_keys_)}; }
 
-    private:
+       private:
         std::vector<Column> columns_;
         std::vector<std::string> primary_keys_;
     };
@@ -251,7 +246,7 @@ struct TableDescriptor {
     std::string comment;
 
     class Builder {
-    public:
+       public:
         Builder& SetSchema(Schema s) {
             schema_ = std::move(s);
             return *this;
@@ -283,15 +278,12 @@ struct TableDescriptor {
         }
 
         TableDescriptor Build() {
-            return TableDescriptor{std::move(schema_),
-                                   std::move(partition_keys_),
-                                   bucket_count_,
-                                   std::move(bucket_keys_),
-                                   std::move(properties_),
-                                   std::move(comment_)};
+            return TableDescriptor{std::move(schema_),     std::move(partition_keys_),
+                                   bucket_count_,          std::move(bucket_keys_),
+                                   std::move(properties_), std::move(comment_)};
         }
 
-    private:
+       private:
         Schema schema_;
         std::vector<std::string> partition_keys_;
         int32_t bucket_count_{0};
@@ -417,16 +409,17 @@ struct Datum {
     fluss::Timestamp GetTimestamp() const { return {i64_val, i32_val}; }
 
     bool IsDecimal() const {
-        return type == DatumType::DecimalI64 || type == DatumType::DecimalI128
-            || type == DatumType::DecimalString;
+        return type == DatumType::DecimalI64 || type == DatumType::DecimalI128 ||
+               type == DatumType::DecimalString;
     }
 
     std::string DecimalToString() const {
         if (type == DatumType::DecimalI64) {
             return FormatUnscaled64(i64_val, decimal_scale);
         } else if (type == DatumType::DecimalI128) {
-            unsigned __int128 uval = (static_cast<unsigned __int128>(static_cast<uint64_t>(i128_hi)) << 64) |
-                                     static_cast<unsigned __int128>(static_cast<uint64_t>(i128_lo));
+            unsigned __int128 uval =
+                (static_cast<unsigned __int128>(static_cast<uint64_t>(i128_hi)) << 64) |
+                static_cast<unsigned __int128>(static_cast<uint64_t>(i128_lo));
             __int128 val = static_cast<__int128>(uval);
             return FormatUnscaled128(val, decimal_scale);
         } else if (type == DatumType::DecimalString) {
@@ -435,10 +428,11 @@ struct Datum {
         return "";
     }
 
-private:
+   private:
     static std::string FormatUnscaled64(int64_t unscaled, int32_t scale) {
         bool negative = unscaled < 0;
-        uint64_t abs_val = negative ? -static_cast<uint64_t>(unscaled) : static_cast<uint64_t>(unscaled);
+        uint64_t abs_val =
+            negative ? -static_cast<uint64_t>(unscaled) : static_cast<uint64_t>(unscaled);
         std::string digits = std::to_string(abs_val);
         if (scale <= 0) {
             return (negative ? "-" : "") + digits;
@@ -452,8 +446,8 @@ struct Datum {
 
     static std::string FormatUnscaled128(__int128 val, int32_t scale) {
         bool negative = val < 0;
-        unsigned __int128 abs_val = negative ? -static_cast<unsigned __int128>(val)
-                                             : static_cast<unsigned __int128>(val);
+        unsigned __int128 abs_val =
+            negative ? -static_cast<unsigned __int128>(val) : static_cast<unsigned __int128>(val);
         std::string digits;
         if (abs_val == 0) {
             digits = "0";
@@ -542,7 +536,7 @@ struct GenericRow {
         fields[idx] = Datum::DecimalString(value);
     }
 
-private:
+   private:
     void EnsureSize(size_t idx) {
         if (fields.size() <= idx) {
             fields.resize(idx + 1);
@@ -569,15 +563,14 @@ struct ScanRecords {
 };
 
 class ArrowRecordBatch {
-public:
-
+   public:
     std::shared_ptr<arrow::RecordBatch> GetArrowRecordBatch() const { return batch_; }
 
     bool Available() const;
 
     // Get number of rows in the batch
     int64_t NumRows() const;
-    
+
     // Get ScanBatch metadata
     int64_t GetTableId() const;
     int64_t GetPartitionId() const;
@@ -585,14 +578,11 @@ class ArrowRecordBatch {
     int64_t GetBaseOffset() const;
     int64_t GetLastOffset() const;
 
-private:
+   private:
     friend class LogScanner;
-    explicit ArrowRecordBatch(
-        std::shared_ptr<arrow::RecordBatch> batch,
-        int64_t table_id,
-        int64_t partition_id,
-        int32_t bucket_id,
-        int64_t base_offset) noexcept;
+    explicit ArrowRecordBatch(std::shared_ptr<arrow::RecordBatch> batch, int64_t table_id,
+                              int64_t partition_id, int32_t bucket_id,
+                              int64_t base_offset) noexcept;
 
     std::shared_ptr<arrow::RecordBatch> batch_{nullptr};
 
@@ -602,7 +592,6 @@ class ArrowRecordBatch {
     int64_t base_offset_;
 };
 
-
 struct ArrowRecordBatches {
     std::vector<std::unique_ptr<ArrowRecordBatch>> batches;
 
@@ -626,6 +615,12 @@ struct BucketSubscription {
     int64_t offset;
 };
 
+struct PartitionBucketSubscription {
+    int64_t partition_id;
+    int32_t bucket_id;
+    int64_t offset;
+};
+
 struct LakeSnapshot {
     int64_t snapshot_id;
     std::vector<BucketOffset> bucket_offsets;
@@ -644,7 +639,7 @@ class Table;
 class TableScan;
 
 class Connection {
-public:
+   public:
     Connection() noexcept;
     ~Connection() noexcept;
 
@@ -660,13 +655,13 @@ class Connection {
     Result GetAdmin(Admin& out);
     Result GetTable(const TablePath& table_path, Table& out);
 
-private:
+   private:
     void Destroy() noexcept;
     ffi::Connection* conn_{nullptr};
 };
 
 class Admin {
-public:
+   public:
     Admin() noexcept;
     ~Admin() noexcept;
 
@@ -677,8 +672,7 @@ class Admin {
 
     bool Available() const;
 
-    Result CreateTable(const TablePath& table_path,
-                       const TableDescriptor& descriptor,
+    Result CreateTable(const TablePath& table_path, const TableDescriptor& descriptor,
                        bool ignore_if_exists = false);
 
     Result DropTable(const TablePath& table_path, bool ignore_if_not_exists = false);
@@ -687,26 +681,24 @@ class Admin {
 
     Result GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& out);
 
-    Result ListOffsets(const TablePath& table_path,
-                       const std::vector<int32_t>& bucket_ids,
-                       const OffsetQuery& offset_query,
-                       std::unordered_map<int32_t, int64_t>& out);
+    Result ListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
+                       const OffsetQuery& offset_query, std::unordered_map<int32_t, int64_t>& out);
+
+    Result ListPartitionOffsets(const TablePath& table_path, const std::string& partition_name,
+                                const std::vector<int32_t>& bucket_ids,
+                                const OffsetQuery& offset_query,
+                                std::unordered_map<int32_t, int64_t>& out);
 
-    Result ListPartitionOffsets(const TablePath& table_path,
-                              const std::string& partition_name,
-                              const std::vector<int32_t>& bucket_ids,
-                              const OffsetQuery& offset_query,
-                              std::unordered_map<int32_t, int64_t>& out);
+    Result ListPartitionInfos(const TablePath& table_path, std::vector<PartitionInfo>& out);
 
-    Result ListPartitionInfos(const TablePath& table_path,
-                             std::vector<PartitionInfo>& out);
+    Result CreatePartition(const TablePath& table_path,
+                           const std::unordered_map<std::string, std::string>& partition_spec,
+                           bool ignore_if_exists = false);
 
-private:
-    Result DoListOffsets(const TablePath& table_path,
-                       const std::vector<int32_t>& bucket_ids,
-                       const OffsetQuery& offset_query,
-                       std::unordered_map<int32_t, int64_t>& out,
-                       const std::string* partition_name = nullptr);
+   private:
+    Result DoListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
+                         const OffsetQuery& offset_query, std::unordered_map<int32_t, int64_t>& out,
+                         const std::string* partition_name = nullptr);
 
     friend class Connection;
     Admin(ffi::Admin* admin) noexcept;
@@ -716,7 +708,7 @@ class Admin {
 };
 
 class Table {
-public:
+   public:
     Table() noexcept;
     ~Table() noexcept;
 
@@ -734,7 +726,7 @@ class Table {
     TablePath GetTablePath() const;
     bool HasPrimaryKey() const;
 
-private:
+   private:
     friend class Connection;
     friend class TableScan;
     Table(ffi::Table* table) noexcept;
@@ -744,7 +736,7 @@ class Table {
 };
 
 class TableScan {
-public:
+   public:
     TableScan(const TableScan&) = delete;
     TableScan& operator=(const TableScan&) = delete;
     TableScan(TableScan&&) noexcept = default;
@@ -755,7 +747,7 @@ class TableScan {
     Result CreateLogScanner(LogScanner& out);
     Result CreateRecordBatchScanner(LogScanner& out);
 
-private:
+   private:
     friend class Table;
     explicit TableScan(ffi::Table* table) noexcept;
 
@@ -764,7 +756,7 @@ class TableScan {
 };
 
 class WriteResult {
-public:
+   public:
     WriteResult() noexcept;
     ~WriteResult() noexcept;
 
@@ -779,7 +771,7 @@ class WriteResult {
     /// For fire-and-forget, simply let the WriteResult go out of scope.
     Result Wait();
 
-private:
+   private:
     friend class AppendWriter;
     WriteResult(ffi::WriteResult* inner) noexcept;
 
@@ -788,7 +780,7 @@ class WriteResult {
 };
 
 class AppendWriter {
-public:
+   public:
     AppendWriter() noexcept;
     ~AppendWriter() noexcept;
 
@@ -803,7 +795,7 @@ class AppendWriter {
     Result Append(const GenericRow& row, WriteResult& out);
     Result Flush();
 
-private:
+   private:
     friend class Table;
     AppendWriter(ffi::AppendWriter* writer) noexcept;
 
@@ -812,7 +804,7 @@ class AppendWriter {
 };
 
 class LogScanner {
-public:
+   public:
     LogScanner() noexcept;
     ~LogScanner() noexcept;
 
@@ -825,12 +817,13 @@ class LogScanner {
 
     Result Subscribe(int32_t bucket_id, int64_t start_offset);
     Result Subscribe(const std::vector<BucketSubscription>& bucket_offsets);
-    Result SubscribePartition(int64_t partition_id, int32_t bucket_id, int64_t start_offset);
+    Result SubscribePartitionBuckets(int64_t partition_id, int32_t bucket_id, int64_t start_offset);
+    Result SubscribePartitionBuckets(const std::vector<PartitionBucketSubscription>& subscriptions);
     Result UnsubscribePartition(int64_t partition_id, int32_t bucket_id);
     Result Poll(int64_t timeout_ms, ScanRecords& out);
     Result PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out);
 
-private:
+   private:
     friend class Table;
     friend class TableScan;
     LogScanner(ffi::LogScanner* scanner) noexcept;
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index d19e444cd2..4aed78db8b 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -183,4 +183,30 @@ Result Admin::ListPartitionInfos(const TablePath& table_path,
     return result;
 }
 
+// Creates a partition of `table_path` from `partition_spec` (partition key -> value).
+// `ignore_if_exists` is passed through unchanged to `admin_->create_partition`.
+// Returns an error Result without calling into Rust when this Admin is not available.
+Result Admin::CreatePartition(const TablePath& table_path,
+                              const std::unordered_map<std::string, std::string>& partition_spec,
+                              bool ignore_if_exists) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_path = utils::to_ffi_table_path(table_path);
+
+    // Flatten the map into the key/value vector that the FFI signature takes.
+    rust::Vec<ffi::FfiPartitionKeyValue> rust_spec;
+    rust_spec.reserve(partition_spec.size());  // final size is known; allocate once
+    for (const auto& [key, value] : partition_spec) {
+        ffi::FfiPartitionKeyValue kv;
+        kv.key = rust::String(key);
+        kv.value = rust::String(value);
+        rust_spec.push_back(std::move(kv));
+    }
+
+    auto ffi_result = admin_->create_partition(ffi_path, std::move(rust_spec), ignore_if_exists);
+    return utils::from_ffi_result(ffi_result);
+}
+
 }  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 4aeb13dbe8..235d282fc5 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -166,6 +166,12 @@ mod ffi {
         offset: i64,
     }
 
+    struct FfiPartitionBucketSubscription {
+        partition_id: i64,
+        bucket_id: i32,
+        offset: i64,
+    }
+
     struct FfiBucketOffsetPair {
         bucket_id: i32,
         offset: i64,
@@ -181,6 +187,11 @@ mod ffi {
         lake_snapshot: FfiLakeSnapshot,
     }
 
+    struct FfiPartitionKeyValue {
+        key: String,
+        value: String,
+    }
+
     struct FfiPartitionInfo {
         partition_id: i64,
         partition_name: String,
@@ -240,6 +251,12 @@ mod ffi {
             self: &Admin,
             table_path: &FfiTablePath,
         ) -> FfiListPartitionInfosResult;
+        fn create_partition(
+            self: &Admin,
+            table_path: &FfiTablePath,
+            partition_spec: Vec<FfiPartitionKeyValue>,
+            ignore_if_exists: bool,
+        ) -> FfiResult;
 
         // Table
         unsafe fn delete_table(table: *mut Table);
@@ -279,6 +296,10 @@ mod ffi {
             bucket_id: i32,
             start_offset: i64,
         ) -> FfiResult;
+        fn subscribe_partition_buckets(
+            self: &LogScanner,
+            subscriptions: Vec<FfiPartitionBucketSubscription>,
+        ) -> FfiResult;
         fn unsubscribe_partition(self: &LogScanner, partition_id: i64, bucket_id: i32)
         -> FfiResult;
         fn poll(self: &LogScanner, timeout_ms: i64) -> FfiScanRecordsResult;
@@ -613,6 +634,33 @@ impl Admin {
             },
         }
     }
+    fn create_partition(
+        &self,
+        table_path: &ffi::FfiTablePath,
+        partition_spec: Vec<ffi::FfiPartitionKeyValue>,
+        ignore_if_exists: bool,
+    ) -> ffi::FfiResult {
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+        let spec_map: std::collections::HashMap<String, String> = partition_spec
+            .into_iter()
+            .map(|kv| (kv.key, kv.value))
+            .collect();
+        let partition_spec = fcore::metadata::PartitionSpec::new(spec_map);
+
+        let result = RUNTIME.block_on(async {
+            self.inner
+                .create_partition(&path, &partition_spec, ignore_if_exists)
+                .await
+        });
+
+        match result {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
 }
 
 // Table implementation
@@ -939,6 +987,46 @@ impl LogScanner {
         self.do_subscribe(Some(partition_id), bucket_id, start_offset)
     }
 
+    /// Subscribes to several (partition, bucket) pairs in one call.
+    ///
+    /// The entries are keyed by `(partition_id, bucket_id)`, so when the same pair appears more
+    /// than once the last offset wins. Delegates to whichever scanner (`inner` or `inner_batch`)
+    /// is set and returns an error result when neither is.
+    fn subscribe_partition_buckets(
+        &self,
+        subscriptions: Vec<ffi::FfiPartitionBucketSubscription>,
+    ) -> ffi::FfiResult {
+        use std::collections::HashMap;
+        let partition_bucket_offsets: HashMap<(PartitionId, i32), i64> = subscriptions
+            .into_iter()
+            .map(|sub| ((sub.partition_id, sub.bucket_id), sub.offset))
+            .collect();
+
+        if let Some(ref inner) = self.inner {
+            let result = RUNTIME.block_on(async {
+                inner
+                    .subscribe_partition_buckets(&partition_bucket_offsets)
+                    .await
+            });
+            match result {
+                Ok(_) => ok_result(),
+                Err(e) => err_result(1, e.to_string()),
+            }
+        } else if let Some(ref inner_batch) = self.inner_batch {
+            let result = RUNTIME.block_on(async {
+                inner_batch
+                    .subscribe_partition_buckets(&partition_bucket_offsets)
+                    .await
+            });
+            match result {
+                Ok(_) => ok_result(),
+                Err(e) => err_result(1, e.to_string()),
+            }
+        } else {
+            err_result(1, "LogScanner not initialized".to_string())
+        }
+    }
+
     fn unsubscribe_partition(&self, partition_id: PartitionId, bucket_id: i32) -> ffi::FfiResult {
         if let Some(ref inner) = self.inner {
             match RUNTIME
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index 04d1846c43..4425b5fbfa 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -17,14 +17,17 @@
  * under the License.
  */
 
+#include <arrow/c/bridge.h>
+
+#include <ctime>
+
+#include "ffi_converter.hpp"
 #include "fluss.hpp"
 #include "lib.rs.h"
-#include "ffi_converter.hpp"
 #include "rust/cxx.h"
-#include <arrow/c/bridge.h>
-#include <ctime>
 // todo:  bindings/cpp/BUILD.bazel still doesn’t declare Arrow include/link dependencies.
-// In environments where Bazel does not already have Arrow available, this will fail at compile/link time.
+// In environments where Bazel does not already have Arrow available, this will fail at compile/link
+// time.
 #include <arrow/record_batch.h>
 
 namespace fluss {
@@ -89,9 +92,7 @@ void Table::Destroy() noexcept {
     }
 }
 
-Table::Table(Table&& other) noexcept : table_(other.table_) {
-    other.table_ = nullptr;
-}
+Table::Table(Table&& other) noexcept : table_(other.table_) { other.table_ = nullptr; }
 
 Table& Table::operator=(Table&& other) noexcept {
     if (this != &other) {
@@ -119,9 +120,7 @@ Result Table::NewAppendWriter(AppendWriter& out) {
     }
 }
 
-TableScan Table::NewScan() {
-    return TableScan(table_);
-}
+TableScan Table::NewScan() { return TableScan(table_); }
 
 // TableScan implementation
 TableScan::TableScan(ffi::Table* table) noexcept : table_(table) {}
@@ -167,7 +166,8 @@ Result TableScan::CreateRecordBatchScanner(LogScanner& out) {
             for (size_t idx : projection_) {
                 rust_indices.push_back(idx);
             }
-            out.scanner_ = table_->new_record_batch_log_scanner_with_projection(std::move(rust_indices));
+            out.scanner_ =
+                table_->new_record_batch_log_scanner_with_projection(std::move(rust_indices));
         }
         return utils::make_ok();
     } catch (const rust::Error& e) {
@@ -354,7 +354,8 @@ Result LogScanner::Subscribe(const std::vector<BucketSubscription>& bucket_offse
     return utils::from_ffi_result(ffi_result);
 }
 
-Result LogScanner::SubscribePartition(int64_t partition_id, int32_t bucket_id, int64_t start_offset) {
+Result LogScanner::SubscribePartitionBuckets(int64_t partition_id, int32_t bucket_id,
+                                             int64_t start_offset) {
     if (!Available()) {
         return utils::make_error(1, "LogScanner not available");
     }
@@ -363,6 +364,30 @@ Result LogScanner::SubscribePartition(int64_t partition_id, int32_t bucket_id, i
     return utils::from_ffi_result(ffi_result);
 }
 
+// Subscribes to several (partition, bucket) pairs with a single FFI call.
+// Each entry supplies the partition id, bucket id and offset handed to the Rust scanner.
+// Returns an error Result without calling into Rust when this scanner is not available.
+Result LogScanner::SubscribePartitionBuckets(
+    const std::vector<PartitionBucketSubscription>& subscriptions) {
+    if (!Available()) {
+        return utils::make_error(1, "LogScanner not available");
+    }
+
+    // Copy each subscription field by field into its FFI counterpart.
+    rust::Vec<ffi::FfiPartitionBucketSubscription> rust_subs;
+    rust_subs.reserve(subscriptions.size());  // final size is known; allocate once
+    for (const auto& sub : subscriptions) {
+        ffi::FfiPartitionBucketSubscription ffi_sub;
+        ffi_sub.partition_id = sub.partition_id;
+        ffi_sub.bucket_id = sub.bucket_id;
+        ffi_sub.offset = sub.offset;
+        rust_subs.push_back(ffi_sub);
+    }
+
+    auto ffi_result = scanner_->subscribe_partition_buckets(std::move(rust_subs));
+    return utils::from_ffi_result(ffi_result);
+}
+
 Result LogScanner::UnsubscribePartition(int64_t partition_id, int32_t bucket_id) {
     if (!Available()) {
         return utils::make_error(1, "LogScanner not available");
@@ -387,12 +407,9 @@ Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
     return utils::make_ok();
 }
 
-ArrowRecordBatch::ArrowRecordBatch(
-    std::shared_ptr<arrow::RecordBatch> batch,
-    int64_t table_id,
-    int64_t partition_id,
-    int32_t bucket_id,
-    int64_t base_offset) noexcept
+ArrowRecordBatch::ArrowRecordBatch(std::shared_ptr<arrow::RecordBatch> batch, int64_t table_id,
+                                   int64_t partition_id, int32_t bucket_id,
+                                   int64_t base_offset) noexcept
     : batch_(std::move(batch)),
       table_id_(table_id),
       partition_id_(partition_id),
@@ -406,7 +423,6 @@ int64_t ArrowRecordBatch::NumRows() const {
     return batch_->num_rows();
 }
 
-
 int64_t ArrowRecordBatch::GetTableId() const {
     if (!Available()) return 0;
     return this->table_id_;
@@ -453,26 +469,23 @@ Result LogScanner::PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out)
         if (import_result.ok()) {
             auto batch_ptr = import_result.ValueOrDie();
             auto batch_wrapper = std::unique_ptr<ArrowRecordBatch>(new ArrowRecordBatch(
-                std::move(batch_ptr),
-                ffi_batch.table_id,
-                ffi_batch.partition_id,
-                ffi_batch.bucket_id,
-                ffi_batch.base_offset
-            ));
+                std::move(batch_ptr), ffi_batch.table_id, ffi_batch.partition_id,
+                ffi_batch.bucket_id, ffi_batch.base_offset));
             out.batches.push_back(std::move(batch_wrapper));
-            
+
             // Free the container structures that were allocated in Rust after successful import
             ffi::free_arrow_ffi_structures(ffi_batch.array_ptr, ffi_batch.schema_ptr);
         } else {
             // Import failed, free the container structures to avoid leaks and return error
             ffi::free_arrow_ffi_structures(ffi_batch.array_ptr, ffi_batch.schema_ptr);
-            
+
             // Return an error indicating that the import failed
-            std::string error_msg = "Failed to import Arrow record batch: " + import_result.status().ToString();
+            std::string error_msg =
+                "Failed to import Arrow record batch: " + import_result.status().ToString();
             return utils::make_error(1, error_msg);
         }
     }
-    
+
     return utils::make_ok();
 }
 
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index dd7f1b14a8..732b7dff76 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -717,6 +717,18 @@ async def main():
         print(f"\nto_arrow() returned {partitioned_arrow.num_rows} records from partitioned table:")
         print(partitioned_arrow.to_pandas())
 
+        # Demo: subscribe_partition_buckets for batch subscribing to multiple partitions at once
+        print("\n--- Testing subscribe_partition_buckets + to_arrow() ---")
+        partitioned_scanner_batch = await partitioned_table.new_scan().create_batch_scanner()
+        partition_bucket_offsets = {
+            (p.partition_id, 0): fluss.EARLIEST_OFFSET for p in partition_infos
+        }
+        partitioned_scanner_batch.subscribe_partition_buckets(partition_bucket_offsets)
+        print(f"Batch subscribed to {len(partition_bucket_offsets)} partition+bucket combinations")
+        partitioned_batch_arrow = partitioned_scanner_batch.to_arrow()
+        print(f"to_arrow() returned {partitioned_batch_arrow.num_rows} records:")
+        print(partitioned_batch_arrow.to_pandas())
+
         # Demo: unsubscribe_partition - unsubscribe from one partition, read remaining
         print("\n--- Testing unsubscribe_partition ---")
         partitioned_scanner3 = await partitioned_table.new_scan().create_batch_scanner()
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 526dad7840..ceef1553a3 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -420,6 +420,16 @@ class LogScanner:
             start_offset: The offset to start reading from (use EARLIEST_OFFSET for beginning)
         """
         ...
+    def subscribe_partition_buckets(
+        self, partition_bucket_offsets: Dict[Tuple[int, int], int]
+    ) -> None:
+        """Subscribe to multiple partition+bucket combinations at once (partitioned tables only).
+
+        Args:
+            partition_bucket_offsets: Dict mapping (partition_id, bucket_id) tuples to start_offsets.
+                Example: {(partition_id_1, 0): EARLIEST_OFFSET, (partition_id_2, 1): 100}
+        """
+        ...
     def unsubscribe_partition(self, partition_id: int, bucket_id: int) -> None:
         """Unsubscribe from a specific partition bucket (partitioned tables only).
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 1a7dbdcecd..d92659634b 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -1657,6 +1657,26 @@ impl LogScanner {
         })
     }
 
+    /// Subscribe to multiple partition+bucket combinations at once (partitioned tables only).
+    ///
+    /// Args:
+    ///     partition_bucket_offsets: A dict mapping (partition_id, bucket_id) tuples to start_offsets
+    fn subscribe_partition_buckets(
+        &self,
+        py: Python,
+        partition_bucket_offsets: HashMap<(i64, i32), i64>,
+    ) -> PyResult<()> {
+        py.detach(|| {
+            TOKIO_RUNTIME.block_on(async {
+                with_scanner!(
+                    &self.scanner,
+                    subscribe_partition_buckets(&partition_bucket_offsets)
+                )
+                .map_err(|e| FlussError::new_err(e.to_string()))
+            })
+        })
+    }
+
     /// Unsubscribe from a specific partition bucket (partitioned tables only).
     ///
     /// Args:
@@ -1813,7 +1833,7 @@ impl LogScanner {
     /// Reads from currently subscribed buckets until reaching their latest offsets.
     /// Works for both partitioned and non-partitioned tables.
     ///
-    /// You must call subscribe(), subscribe_buckets(), or subscribe_partition() first.
+    /// You must call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.
     ///
     /// Returns:
     ///     PyArrow Table containing all data from subscribed buckets
@@ -1822,7 +1842,7 @@ impl LogScanner {
         let subscribed = scanner.get_subscribed_buckets();
         if subscribed.is_empty() {
             return Err(FlussError::new_err(
-                "No buckets subscribed. Call subscribe(), subscribe_buckets(), or subscribe_partition() first.",
+                "No buckets subscribed. Call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.",
             ));
         }
 
@@ -1838,7 +1858,7 @@ impl LogScanner {
     /// Reads from currently subscribed buckets until reaching their latest offsets.
     /// Works for both partitioned and non-partitioned tables.
     ///
-    /// You must call subscribe(), subscribe_buckets(), or subscribe_partition() first.
+    /// You must call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.
     ///
     /// Returns:
     ///     Pandas DataFrame containing all data from subscribed buckets
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 26f54da8fb..57f90a1e5a 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -361,29 +361,17 @@ impl LogScannerInner {
         if self.is_partitioned_table {
             return Err(Error::UnsupportedOperation {
                 message:
-                    "The table is a partitioned table, subscribe_buckets is not supported currently."
+                    "The table is a partitioned table, please use \"subscribe_partition_buckets\" instead."
                         .to_string(),
             });
         }
-        self.metadata
-            .check_and_update_table_metadata(from_ref(&self.table_path))
-            .await?;
-        if bucket_offsets.is_empty() {
-            return Err(Error::UnexpectedError {
-                message: "Bucket offsets are empty.".to_string(),
-                source: None,
-            });
-        }
 
         let mut scan_bucket_offsets = HashMap::new();
         for (bucket_id, offset) in bucket_offsets {
             let table_bucket = TableBucket::new(self.table_id, *bucket_id);
             scan_bucket_offsets.insert(table_bucket, *offset);
         }
-
-        self.log_scanner_status
-            .assign_scan_buckets(scan_bucket_offsets);
-        Ok(())
+        self.do_subscribe_buckets(scan_bucket_offsets).await
     }
 
     async fn subscribe_partition(
@@ -409,6 +397,51 @@ impl LogScannerInner {
         Ok(())
     }
 
+    /// Subscribes to several buckets of a partitioned table in one call.
+    ///
+    /// `partition_bucket_offsets` maps `(partition_id, bucket_id)` to the offset to start from.
+    /// Returns `Error::UnsupportedOperation` when the table is not partitioned.
+    async fn subscribe_partition_buckets(
+        &self,
+        partition_bucket_offsets: &HashMap<(PartitionId, i32), i64>,
+    ) -> Result<()> {
+        if !self.is_partitioned_table {
+            return Err(Error::UnsupportedOperation {
+                message: "The table is not a partitioned table, please use \"subscribe_buckets\" \
+                    to subscribe to non-partitioned buckets instead."
+                    .to_string(),
+            });
+        }
+
+        let mut scan_bucket_offsets = HashMap::new();
+        for (&(partition_id, bucket_id), &offset) in partition_bucket_offsets {
+            let table_bucket =
+                TableBucket::new_with_partition(self.table_id, Some(partition_id), bucket_id);
+            scan_bucket_offsets.insert(table_bucket, offset);
+        }
+        self.do_subscribe_buckets(scan_bucket_offsets).await
+    }
+
+    /// Common final step for the bucket-subscription methods of this type.
+    ///
+    /// Rejects an empty map, calls `check_and_update_table_metadata` for this table, then hands
+    /// the offsets to `log_scanner_status.assign_scan_buckets`.
+    async fn do_subscribe_buckets(&self, bucket_offsets: HashMap<TableBucket, i64>) -> Result<()> {
+        if bucket_offsets.is_empty() {
+            return Err(Error::UnexpectedError {
+                message: "Bucket offsets are empty.".to_string(),
+                source: None,
+            });
+        }
+
+        self.metadata
+            .check_and_update_table_metadata(from_ref(&self.table_path))
+            .await?;
+
+        self.log_scanner_status.assign_scan_buckets(bucket_offsets);
+        Ok(())
+    }
+
     async fn unsubscribe_partition(&self, partition_id: PartitionId, bucket: i32) -> Result<()> {
         if !self.is_partitioned_table {
             return Err(Error::UnsupportedOperation {
@@ -501,6 +526,15 @@ impl LogScanner {
             .await
     }
 
+    pub async fn subscribe_partition_buckets(
+        &self,
+        partition_bucket_offsets: &HashMap<(PartitionId, i32), i64>,
+    ) -> Result<()> {
+        self.inner
+            .subscribe_partition_buckets(partition_bucket_offsets)
+            .await
+    }
+
     pub async fn unsubscribe_partition(
         &self,
         partition_id: PartitionId,
@@ -546,6 +580,15 @@ impl RecordBatchLogScanner {
         self.inner.log_scanner_status.get_all_subscriptions()
     }
 
+    pub async fn subscribe_partition_buckets(
+        &self,
+        partition_bucket_offsets: &HashMap<(PartitionId, i32), i64>,
+    ) -> Result<()> {
+        self.inner
+            .subscribe_partition_buckets(partition_bucket_offsets)
+            .await
+    }
+
     pub async fn unsubscribe_partition(
         &self,
         partition_id: PartitionId,
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 82f8135206..d80ce791a6 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -1200,6 +1200,55 @@ mod table_test {
             records_after_unsubscribe.len()
         );
 
+        // Test subscribe_partition_buckets: batch subscribe to all partitions at once
+        let log_scanner_batch = table
+            .new_scan()
+            .create_log_scanner()
+            .expect("Failed to create log scanner for batch partition subscribe test");
+        let partition_infos = admin
+            .list_partition_infos(&table_path)
+            .await
+            .expect("Failed to list partition infos");
+        let partition_bucket_offsets: HashMap<(i64, i32), i64> = partition_infos
+            .iter()
+            .map(|p| ((p.get_partition_id(), 0), 0i64))
+            .collect();
+        log_scanner_batch
+            .subscribe_partition_buckets(&partition_bucket_offsets)
+            .await
+            .expect("Failed to batch subscribe to partitions");
+
+        let mut batch_collected: Vec<(i32, String, i64)> = Vec::new();
+        let batch_start = std::time::Instant::now();
+        while batch_collected.len() < expected_records.len()
+            && batch_start.elapsed() < Duration::from_secs(10)
+        {
+            let records = log_scanner_batch
+                .poll(Duration::from_millis(500))
+                .await
+                .expect("Failed to poll after batch partition subscribe");
+            for rec in records {
+                let row = rec.row();
+                batch_collected.push((
+                    row.get_int(0),
+                    row.get_string(1).to_string(),
+                    row.get_long(2),
+                ));
+            }
+        }
+        assert_eq!(
+            batch_collected.len(),
+            expected_records.len(),
+            "Did not receive all records in time, expect receive {} records, but got {} records",
+            expected_records.len(),
+            batch_collected.len()
+        );
+        batch_collected.sort_by_key(|r| r.0);
+        assert_eq!(
+            batch_collected, expected_records,
+            "subscribe_partition_buckets should receive the same records as subscribe_partition loop"
+        );
+
         admin
             .drop_table(&table_path, false)
             .await

From a056cfd054f457f1b71ca502781ecf254b638b23 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 8 Feb 2026 12:21:37 +0800
Subject: [PATCH 126/287] chore: remove async for upsert/delete/append in
 python (#280)

---
 fluss-rust/bindings/python/fluss/__init__.pyi | 33 +++++++++++++++----
 1 file changed, 26 insertions(+), 7 deletions(-)

diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index ceef1553a3..50f3b20b3a 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -301,13 +301,16 @@ class FlussTable:
     def __repr__(self) -> str: ...
 
 class AppendWriter:
-    async def append(self, row: dict | list | tuple) -> None:
+    def append(self, row: dict | list | tuple) -> WriteResultHandle:
         """Append a single row to the table.
 
         Args:
             row: Dictionary mapping field names to values, or
                  list/tuple of values in schema order
 
+        Returns:
+            WriteResultHandle: Ignore for fire-and-forget, or await handle.wait() for acknowledgement.
+
         Supported Types:
             Currently supports primitive types only:
             - Boolean, TinyInt, SmallInt, Int, BigInt (integers)
@@ -319,8 +322,8 @@ class AppendWriter:
             Temporal types (Date, Timestamp, Decimal) are not yet supported.
 
         Example:
-            await writer.append({'id': 1, 'name': 'Alice', 'score': 95.5})
-            await writer.append([1, 'Alice', 95.5])
+            writer.append({'id': 1, 'name': 'Alice', 'score': 95.5})
+            writer.append([1, 'Alice', 95.5])
 
         Note:
             For high-throughput bulk loading, prefer write_arrow_batch().
@@ -328,15 +331,15 @@ class AppendWriter:
         """
         ...
     def write_arrow(self, table: pa.Table) -> None: ...
-    def write_arrow_batch(self, batch: pa.RecordBatch) -> None: ...
+    def write_arrow_batch(self, batch: pa.RecordBatch) -> WriteResultHandle: ...
     def write_pandas(self, df: pd.DataFrame) -> None: ...
-    def flush(self) -> None: ...
+    async def flush(self) -> None: ...
     def __repr__(self) -> str: ...
 
 class UpsertWriter:
     """Writer for upserting and deleting data in a Fluss primary key table."""
 
-    async def upsert(self, row: dict | list | tuple) -> None:
+    def upsert(self, row: dict | list | tuple) -> WriteResultHandle:
         """Upsert a row into the table.
 
         If a row with the same primary key exists, it will be updated.
@@ -345,14 +348,20 @@ class UpsertWriter:
         Args:
             row: Dictionary mapping field names to values, or
                  list/tuple of values in schema order
+
+        Returns:
+            WriteResultHandle: Ignore for fire-and-forget, or await handle.wait() for ack.
         """
         ...
-    async def delete(self, pk: dict | list | tuple) -> None:
+    def delete(self, pk: dict | list | tuple) -> WriteResultHandle:
         """Delete a row from the table by primary key.
 
         Args:
             pk: Dictionary with PK column names as keys, or
                 list/tuple of PK values in PK column order
+
+        Returns:
+            WriteResultHandle: Ignore for fire-and-forget, or await handle.wait() for ack.
         """
         ...
     async def flush(self) -> None:
@@ -360,6 +369,16 @@ class UpsertWriter:
         ...
     def __repr__(self) -> str: ...
 
+
+class WriteResultHandle:
+    """Handle for a pending write (append/upsert/delete). Ignore for fire-and-forget, or await handle.wait() for ack."""
+
+    async def wait(self) -> None:
+        """Wait for server acknowledgment of this write."""
+        ...
+    def __repr__(self) -> str: ...
+
+
 class Lookuper:
     """Lookuper for performing primary key lookups on a Fluss table."""
 

From 6e7aa7c129ffd1186a62ca0e54e39cfd33093774 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 8 Feb 2026 12:59:34 +0800
Subject: [PATCH 127/287] feat: support database-level ops in python (#279)

---
 fluss-rust/bindings/cpp/src/types.rs          |   2 +-
 fluss-rust/bindings/python/fluss/__init__.pyi |  66 +++++
 fluss-rust/bindings/python/src/admin.rs       | 227 +++++++++++++++++-
 fluss-rust/bindings/python/src/lib.rs         |   2 +
 fluss-rust/bindings/python/src/metadata.rs    | 104 +++++++-
 fluss-rust/bindings/python/src/table.rs       |   6 +-
 6 files changed, 398 insertions(+), 9 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 7837032eab..05d3d6a1d2 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -257,7 +257,7 @@ fn get_decimal_type(idx: usize, schema: Option<&fcore::metadata::Schema>) -> Res
         .ok_or_else(|| anyhow!("Schema not available for decimal column {idx}"))?;
     match col.data_type() {
         fcore::metadata::DataType::Decimal(dt) => Ok((dt.precision(), dt.scale())),
-        other => Err(anyhow!("Column {idx} is {:?}, not Decimal", other)),
+        other => Err(anyhow!("Column {idx} is {other:?}, not Decimal")),
     }
 }
 
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 50f3b20b3a..a9ef828aac 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -121,6 +121,45 @@ class FlussConnection:
     def __repr__(self) -> str: ...
 
 class FlussAdmin:
+    async def create_database(
+        self,
+        database_name: str,
+        ignore_if_exists: bool = False,
+        database_descriptor: Optional["DatabaseDescriptor"] = None,
+    ) -> None:
+        """Create a database."""
+        ...
+    async def drop_database(
+        self,
+        database_name: str,
+        ignore_if_not_exists: bool = False,
+        cascade: bool = True,
+    ) -> None:
+        """Drop a database."""
+        ...
+    async def list_databases(self) -> List[str]:
+        """List all databases."""
+        ...
+    async def database_exists(self, database_name: str) -> bool:
+        """Check if a database exists."""
+        ...
+    async def get_database_info(self, database_name: str) -> "DatabaseInfo":
+        """Get database information."""
+        ...
+    async def list_tables(self, database_name: str) -> List[str]:
+        """List all tables in a database."""
+        ...
+    async def table_exists(self, table_path: TablePath) -> bool:
+        """Check if a table exists."""
+        ...
+    async def drop_partition(
+        self,
+        table_path: TablePath,
+        partition_spec: Dict[str, str],
+        ignore_if_not_exists: bool = False,
+    ) -> None:
+        """Drop a partition from a partitioned table."""
+        ...
     async def create_table(
         self,
         table_path: TablePath,
@@ -203,6 +242,33 @@ class FlussAdmin:
         ...
     def __repr__(self) -> str: ...
 
+
+class DatabaseDescriptor:
+    """Descriptor for a Fluss database: an optional comment plus custom properties."""
+
+    def __init__(
+        self,
+        comment: Optional[str] = None,
+        custom_properties: Optional[Dict[str, str]] = None,
+    ) -> None: ...
+    @property
+    def comment(self) -> Optional[str]: ...
+    def get_custom_properties(self) -> Dict[str, str]: ...
+    def __repr__(self) -> str: ...
+
+
+class DatabaseInfo:
+    """Metadata of a Fluss database: name, descriptor, and created/modified times."""
+
+    @property
+    def database_name(self) -> str: ...
+    def get_database_descriptor(self) -> DatabaseDescriptor: ...
+    @property
+    def created_time(self) -> int: ...
+    @property
+    def modified_time(self) -> int: ...
+    def __repr__(self) -> str: ...
+
 class TableScan:
     """Builder for creating log scanners with flexible configuration.
 
diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
index d28c9c066e..335aa248ad 100644
--- a/fluss-rust/bindings/python/src/admin.rs
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -17,6 +17,7 @@
 
 use crate::*;
 use fcore::rpc::message::OffsetSpec;
+use pyo3::conversion::IntoPyObject;
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::sync::Arc;
 
@@ -38,8 +39,7 @@ fn parse_offset_spec(offset_type: &str, timestamp: Option<i64>) -> PyResult<Offs
             Ok(OffsetSpec::Timestamp(ts))
         }
         _ => Err(FlussError::new_err(format!(
-            "Invalid offset_type: '{}'. Must be 'earliest', 'latest', or 'timestamp'",
-            offset_type
+            "Invalid offset_type: '{offset_type}'. Must be 'earliest', 'latest', or 'timestamp'"
         ))),
     }
 }
@@ -49,8 +49,7 @@ fn validate_bucket_ids(bucket_ids: &[i32]) -> PyResult<()> {
     for &bucket_id in bucket_ids {
         if bucket_id < 0 {
             return Err(FlussError::new_err(format!(
-                "Invalid bucket_id: {}. Bucket IDs must be non-negative",
-                bucket_id
+                "Invalid bucket_id: {bucket_id}. Bucket IDs must be non-negative"
             )));
         }
     }
@@ -59,6 +58,226 @@ fn validate_bucket_ids(bucket_ids: &[i32]) -> PyResult<()> {
 
 #[pymethods]
 impl FlussAdmin {
+    /// Create a new database.
+    ///
+    /// Args:
+    ///     database_name: Name of the database to create
+    ///     ignore_if_exists: If True, an already existing database is not treated as an error
+    ///     database_descriptor: Optional descriptor carrying comment and custom_properties
+    ///
+    /// Returns:
+    ///     None (once the returned awaitable completes)
+    #[pyo3(signature = (database_name, ignore_if_exists=false, database_descriptor=None))]
+    pub fn create_database<'py>(
+        &self,
+        py: Python<'py>,
+        database_name: &str,
+        ignore_if_exists: bool,
+        database_descriptor: Option<&DatabaseDescriptor>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        // Take owned copies so the `async move` block captures no borrowed arguments.
+        let core_descriptor = database_descriptor.map(DatabaseDescriptor::to_core).cloned();
+        let db_name = database_name.to_owned();
+        let client = self.__admin.clone();
+        future_into_py(py, async move {
+            let outcome = client
+                .create_database(&db_name, ignore_if_exists, core_descriptor.as_ref())
+                .await;
+            outcome.map_err(|e| FlussError::new_err(format!("Failed to create database: {e}")))?;
+
+            Python::attach(|py| Ok(py.None()))
+        })
+    }
+
+    /// Drop an existing database.
+    ///
+    /// Args:
+    ///     database_name: Name of the database to drop
+    ///     ignore_if_not_exists: If True, a missing database is not treated as an error
+    ///     cascade: If True, drop tables in the database first
+    ///
+    /// Returns:
+    ///     None (once the returned awaitable completes)
+    #[pyo3(signature = (database_name, ignore_if_not_exists=false, cascade=true))]
+    pub fn drop_database<'py>(
+        &self,
+        py: Python<'py>,
+        database_name: &str,
+        ignore_if_not_exists: bool,
+        cascade: bool,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let db_name = database_name.to_owned();
+        let client = self.__admin.clone();
+
+        future_into_py(py, async move {
+            let outcome = client
+                .drop_database(&db_name, ignore_if_not_exists, cascade)
+                .await;
+            outcome.map_err(|e| FlussError::new_err(format!("Failed to drop database: {e}")))?;
+
+            Python::attach(|py| Ok(py.None()))
+        })
+    }
+
+    /// Fetch the names of all databases.
+    ///
+    /// Returns:
+    ///     List[str]: Names of all databases
+    pub fn list_databases<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let client = self.__admin.clone();
+
+        future_into_py(py, async move {
+            // Any failure from the admin client is re-raised in Python as a FlussError.
+            let fetched = client.list_databases().await;
+            let db_names = fetched
+                .map_err(|e| FlussError::new_err(format!("Failed to list databases: {e}")))?;
+
+            Python::attach(|py| {
+                let py_names = pyo3::types::PyList::empty(py);
+                db_names
+                    .into_iter()
+                    .try_for_each(|db_name| py_names.append(db_name))?;
+                Ok(py_names.unbind())
+            })
+        })
+    }
+
+    /// Report whether a database with the given name exists.
+    ///
+    /// Args:
+    ///     database_name: Name of the database to look up
+    ///
+    /// Returns:
+    ///     bool: True if the database exists
+    pub fn database_exists<'py>(
+        &self,
+        py: Python<'py>,
+        database_name: &str,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let db_name = database_name.to_owned();
+        let client = self.__admin.clone();
+
+        future_into_py(py, async move {
+            let lookup = client.database_exists(&db_name).await;
+            let found = lookup
+                .map_err(|e| FlussError::new_err(format!("Failed to check database exists: {e}")))?;
+
+            Python::attach(|py| Ok(found.into_pyobject(py)?.to_owned().into_any().unbind()))
+        })
+    }
+
+    /// Fetch the metadata of a database.
+    ///
+    /// Args:
+    ///     database_name: Name of the database to describe
+    ///
+    /// Returns:
+    ///     DatabaseInfo: Database metadata
+    pub fn get_database_info<'py>(
+        &self,
+        py: Python<'py>,
+        database_name: &str,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let db_name = database_name.to_owned();
+        let client = self.__admin.clone();
+
+        future_into_py(py, async move {
+            let fetched = client.get_database_info(&db_name).await;
+            let core_info = fetched
+                .map_err(|e| FlussError::new_err(format!("Failed to get database info: {e}")))?;
+            let py_info = DatabaseInfo::from_core(core_info);
+
+            Python::attach(|py| Py::new(py, py_info))
+        })
+    }
+
+    /// Fetch the names of all tables in a database.
+    ///
+    /// Args:
+    ///     database_name: Name of the database whose tables are listed
+    ///
+    /// Returns:
+    ///     List[str]: Names of all tables in the database
+    pub fn list_tables<'py>(
+        &self,
+        py: Python<'py>,
+        database_name: &str,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let db_name = database_name.to_owned();
+        let client = self.__admin.clone();
+
+        future_into_py(py, async move {
+            let fetched = client.list_tables(&db_name).await;
+            let table_names = fetched
+                .map_err(|e| FlussError::new_err(format!("Failed to list tables: {e}")))?;
+
+            // Copy the names into a fresh Python list, stopping at the first append error.
+            Python::attach(|py| {
+                let py_names = pyo3::types::PyList::empty(py);
+                table_names
+                    .into_iter()
+                    .try_for_each(|table_name| py_names.append(table_name))?;
+                Ok(py_names.unbind())
+            })
+        })
+    }
+
+    /// Report whether a table exists at the given path.
+    ///
+    /// Args:
+    ///     table_path: Path to the table (database, table)
+    ///
+    /// Returns:
+    ///     bool: True if the table exists
+    pub fn table_exists<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let client = self.__admin.clone();
+        let core_path = table_path.to_core();
+
+        future_into_py(py, async move {
+            let lookup = client.table_exists(&core_path).await;
+            let found = lookup
+                .map_err(|e| FlussError::new_err(format!("Failed to check table exists: {e}")))?;
+
+            // Convert the Rust bool into a Python object for the awaiting caller.
+            Python::attach(|py| Ok(found.into_pyobject(py)?.to_owned().into_any().unbind()))
+        })
+    }
+
+    /// Remove one partition of a partitioned table.
+    ///
+    /// Args:
+    ///     table_path: Path to the table
+    ///     partition_spec: Dict mapping partition column name to value (e.g., {"region": "US"})
+    ///     ignore_if_not_exists: If True, a missing partition is not treated as an error
+    ///
+    /// Returns:
+    ///     None (once the returned awaitable completes)
+    #[pyo3(signature = (table_path, partition_spec, ignore_if_not_exists=false))]
+    pub fn drop_partition<'py>(
+        &self,
+        py: Python<'py>,
+        table_path: &TablePath,
+        partition_spec: std::collections::HashMap<String, String>,
+        ignore_if_not_exists: bool,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let spec = fcore::metadata::PartitionSpec::new(partition_spec);
+        let core_path = table_path.to_core();
+        let client = self.__admin.clone();
+
+        future_into_py(py, async move {
+            let outcome = client
+                .drop_partition(&core_path, &spec, ignore_if_not_exists)
+                .await;
+            outcome.map_err(|e| FlussError::new_err(format!("Failed to drop partition: {e}")))?;
+
+            Python::attach(|py| Ok(py.None()))
+        })
+    }
+
     /// Create a table with the given schema
     #[pyo3(signature = (table_path, table_descriptor, ignore_if_exists=None))]
     pub fn create_table<'py>(
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index f1f4ee6b61..41f8de5447 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -91,6 +91,8 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<PartitionInfo>()?;
     m.add_class::<OffsetType>()?;
     m.add_class::<WriteResultHandle>()?;
+    m.add_class::<DatabaseDescriptor>()?;
+    m.add_class::<DatabaseInfo>()?;
 
     // Register constants
     m.add("EARLIEST_OFFSET", fcore::client::EARLIEST_OFFSET)?;
diff --git a/fluss-rust/bindings/python/src/metadata.rs b/fluss-rust/bindings/python/src/metadata.rs
index f39f9d441b..d6b122d27b 100644
--- a/fluss-rust/bindings/python/src/metadata.rs
+++ b/fluss-rust/bindings/python/src/metadata.rs
@@ -53,7 +53,7 @@ impl ChangeType {
     }
 
     fn __repr__(&self) -> String {
-        format!("ChangeType.{:?}", self)
+        format!("ChangeType.{self:?}")
     }
 }
 
@@ -657,3 +657,105 @@ impl LakeSnapshot {
         }
     }
 }
+
+/// Python-facing wrapper around the core `DatabaseDescriptor` (comment and custom properties)
+#[pyclass]
+#[derive(Clone)]
+pub struct DatabaseDescriptor {
+    __descriptor: fcore::metadata::DatabaseDescriptor,
+}
+
+#[pymethods]
+impl DatabaseDescriptor {
+    /// Build a descriptor; `comment` and `custom_properties` are applied only when provided
+    #[new]
+    #[pyo3(signature = (comment=None, custom_properties=None))]
+    pub fn new(
+        comment: Option<String>,
+        custom_properties: Option<HashMap<String, String>>,
+    ) -> PyResult<Self> {
+        let mut builder = fcore::metadata::DatabaseDescriptor::builder();
+        if let Some(c) = comment {
+            builder = builder.comment(&c);
+        }
+        if let Some(props) = custom_properties {
+            builder = builder.custom_properties(props);
+        }
+        let __descriptor = builder.build();
+        Ok(Self { __descriptor })
+    }
+
+    /// Return the comment as an owned `String`, or `None` when the descriptor has none
+    #[getter]
+    pub fn comment(&self) -> Option<String> {
+        self.__descriptor.comment().map(|s| s.to_string())
+    }
+
+    /// Return a cloned copy of the custom properties map
+    pub fn get_custom_properties(&self) -> HashMap<String, String> {
+        self.__descriptor.custom_properties().clone()
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "DatabaseDescriptor(comment={:?}, custom_properties={:?})",
+            self.comment(),
+            self.get_custom_properties()
+        )
+    }
+}
+
+impl DatabaseDescriptor {
+    pub fn to_core(&self) -> &fcore::metadata::DatabaseDescriptor {
+        &self.__descriptor
+    }
+}
+
+/// Python-facing wrapper around the core `DatabaseInfo`
+#[pyclass]
+pub struct DatabaseInfo {
+    __info: fcore::metadata::DatabaseInfo,
+}
+
+#[pymethods]
+impl DatabaseInfo {
+    /// Return the database name as an owned `String`
+    #[getter]
+    pub fn database_name(&self) -> String {
+        self.__info.database_name().to_string()
+    }
+
+    /// Return a new `DatabaseDescriptor` holding a clone of the core descriptor
+    pub fn get_database_descriptor(&self) -> DatabaseDescriptor {
+        DatabaseDescriptor {
+            __descriptor: self.__info.database_descriptor().clone(),
+        }
+    }
+
+    /// Return the creation time as the raw `i64` from the core type (unit not visible here)
+    #[getter]
+    pub fn created_time(&self) -> i64 {
+        self.__info.created_time()
+    }
+
+    /// Return the modification time as the raw `i64` from the core type (unit not visible here)
+    #[getter]
+    pub fn modified_time(&self) -> i64 {
+        self.__info.modified_time()
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "DatabaseInfo(database_name='{}', created_time={}, modified_time={})",
+            self.database_name(),
+            self.created_time(),
+            self.modified_time()
+        )
+    }
+}
+
+impl DatabaseInfo {
+    pub fn from_core(info: fcore::metadata::DatabaseInfo) -> Self {
+        Self { __info: info }
+    }
+}
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index d92659634b..cb203dc67a 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -315,7 +315,7 @@ fn resolve_projection_indices(
                 let idx = columns
                     .iter()
                     .position(|c| c.name() == name)
-                    .ok_or_else(|| FlussError::new_err(format!("Column '{}' not found", name)))?;
+                    .ok_or_else(|| FlussError::new_err(format!("Column '{name}' not found")))?;
                 indices.push(idx);
             }
             Ok(Some(indices))
@@ -796,9 +796,9 @@ pub fn python_pk_to_generic_row(
                 let field: &fcore::metadata::DataField = &fields[*pk_idx];
                 let value = dict
                     .get_item(pk_name)?
-                    .ok_or_else(|| FlussError::new_err(format!("Missing PK field: {}", pk_name)))?;
+                    .ok_or_else(|| FlussError::new_err(format!("Missing PK field: {pk_name}")))?;
                 datums[*pk_idx] = python_value_to_datum(&value, field.data_type())
-                    .map_err(|e| FlussError::new_err(format!("PK field '{}': {}", pk_name, e)))?;
+                    .map_err(|e| FlussError::new_err(format!("PK field '{pk_name}': {e}")))?;
             }
         }
 

From db996f870f979c4b46917f40ce5ddb47c894fb89 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 8 Feb 2026 06:56:25 +0000
Subject: [PATCH 128/287] chore: introduce getters in CPP Datum (#281)

---
 fluss-rust/bindings/cpp/examples/example.cpp  |  87 +++++----
 fluss-rust/bindings/cpp/include/fluss.hpp     | 106 +++++++++--
 fluss-rust/bindings/cpp/src/ffi_converter.hpp | 165 ++++++++++--------
 3 files changed, 228 insertions(+), 130 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index e6f9619b21..f568422e6b 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -153,40 +153,38 @@ int main() {
     std::cout << "Scanned records: " << records.Size() << std::endl;
     bool scan_ok = true;
     for (const auto& rec : records.records) {
-        const auto& f = rec.row.fields;
-
-        if (f[4].type != fluss::DatumType::Date) {
-            std::cerr << "ERROR: field 4 expected Date, got " << static_cast<int>(f[4].type)
-                      << std::endl;
+        if (rec.row.GetType(4) != fluss::DatumType::Date) {
+            std::cerr << "ERROR: field 4 expected Date, got "
+                      << static_cast<int>(rec.row.GetType(4)) << std::endl;
             scan_ok = false;
         }
-        if (f[5].type != fluss::DatumType::Time) {
-            std::cerr << "ERROR: field 5 expected Time, got " << static_cast<int>(f[5].type)
-                      << std::endl;
+        if (rec.row.GetType(5) != fluss::DatumType::Time) {
+            std::cerr << "ERROR: field 5 expected Time, got "
+                      << static_cast<int>(rec.row.GetType(5)) << std::endl;
             scan_ok = false;
         }
-        if (f[6].type != fluss::DatumType::TimestampNtz) {
-            std::cerr << "ERROR: field 6 expected TimestampNtz, got " << static_cast<int>(f[6].type)
-                      << std::endl;
+        if (rec.row.GetType(6) != fluss::DatumType::TimestampNtz) {
+            std::cerr << "ERROR: field 6 expected TimestampNtz, got "
+                      << static_cast<int>(rec.row.GetType(6)) << std::endl;
             scan_ok = false;
         }
-        if (f[7].type != fluss::DatumType::TimestampLtz) {
-            std::cerr << "ERROR: field 7 expected TimestampLtz, got " << static_cast<int>(f[7].type)
-                      << std::endl;
+        if (rec.row.GetType(7) != fluss::DatumType::TimestampLtz) {
+            std::cerr << "ERROR: field 7 expected TimestampLtz, got "
+                      << static_cast<int>(rec.row.GetType(7)) << std::endl;
             scan_ok = false;
         }
 
-        auto date = f[4].GetDate();
-        auto time = f[5].GetTime();
-        auto ts_ntz = f[6].GetTimestamp();
-        auto ts_ltz = f[7].GetTimestamp();
-
-        std::cout << "  id=" << f[0].i32_val << " name=" << f[1].string_val
-                  << " score=" << f[2].f32_val << " age=" << f[3].i32_val << " date=" << date.Year()
-                  << "-" << date.Month() << "-" << date.Day() << " time=" << time.Hour() << ":"
-                  << time.Minute() << ":" << time.Second() << " ts_ntz=" << ts_ntz.epoch_millis
-                  << " ts_ltz=" << ts_ltz.epoch_millis << "+" << ts_ltz.nano_of_millisecond << "ns"
-                  << std::endl;
+        auto date = rec.row.GetDate(4);
+        auto time = rec.row.GetTime(5);
+        auto ts_ntz = rec.row.GetTimestamp(6);
+        auto ts_ltz = rec.row.GetTimestamp(7);
+
+        std::cout << "  id=" << rec.row.GetInt32(0) << " name=" << rec.row.GetString(1)
+                  << " score=" << rec.row.GetFloat32(2) << " age=" << rec.row.GetInt32(3)
+                  << " date=" << date.Year() << "-" << date.Month() << "-" << date.Day()
+                  << " time=" << time.Hour() << ":" << time.Minute() << ":" << time.Second()
+                  << " ts_ntz=" << ts_ntz.epoch_millis << " ts_ltz=" << ts_ltz.epoch_millis << "+"
+                  << ts_ltz.nano_of_millisecond << "ns" << std::endl;
     }
 
     if (!scan_ok) {
@@ -210,26 +208,24 @@ int main() {
 
     std::cout << "Projected records: " << projected_records.Size() << std::endl;
     for (const auto& rec : projected_records.records) {
-        const auto& f = rec.row.fields;
-
-        if (f.size() != 2) {
-            std::cerr << "ERROR: expected 2 fields, got " << f.size() << std::endl;
+        if (rec.row.FieldCount() != 2) {
+            std::cerr << "ERROR: expected 2 fields, got " << rec.row.FieldCount() << std::endl;
             scan_ok = false;
             continue;
         }
-        if (f[0].type != fluss::DatumType::Int32) {
+        if (rec.row.GetType(0) != fluss::DatumType::Int32) {
             std::cerr << "ERROR: projected field 0 expected Int32, got "
-                      << static_cast<int>(f[0].type) << std::endl;
+                      << static_cast<int>(rec.row.GetType(0)) << std::endl;
             scan_ok = false;
         }
-        if (f[1].type != fluss::DatumType::TimestampLtz) {
+        if (rec.row.GetType(1) != fluss::DatumType::TimestampLtz) {
             std::cerr << "ERROR: projected field 1 expected TimestampLtz, got "
-                      << static_cast<int>(f[1].type) << std::endl;
+                      << static_cast<int>(rec.row.GetType(1)) << std::endl;
             scan_ok = false;
         }
 
-        auto ts = f[1].GetTimestamp();
-        std::cout << "  id=" << f[0].i32_val << " updated_at=" << ts.epoch_millis << "+"
+        auto ts = rec.row.GetTimestamp(1);
+        std::cout << "  id=" << rec.row.GetInt32(0) << " updated_at=" << ts.epoch_millis << "+"
                   << ts.nano_of_millisecond << "ns" << std::endl;
     }
 
@@ -428,12 +424,9 @@ int main() {
 
     std::cout << "Scanned decimal records: " << decimal_records.Size() << std::endl;
     for (const auto& rec : decimal_records) {
-        auto& price = rec.row.fields[1];
-        auto& amount = rec.row.fields[2];
-        std::cout << "  id=" << rec.row.fields[0].i32_val << " price=" << price.DecimalToString()
-                  << " (raw=" << price.i64_val << ")"
-                  << " amount=" << amount.DecimalToString() << " is_decimal=" << price.IsDecimal()
-                  << std::endl;
+        std::cout << "  id=" << rec.row.GetInt32(0) << " price=" << rec.row.DecimalToString(1)
+                  << " amount=" << rec.row.DecimalToString(2)
+                  << " is_decimal=" << rec.row.IsDecimal(1) << std::endl;
     }
 
     // 13) Partitioned table example
@@ -525,9 +518,9 @@ int main() {
               << std::endl;
     for (size_t i = 0; i < partition_records.Size(); ++i) {
         const auto& rec = partition_records[i];
-        std::cout << "  Record " << i << ": id=" << rec.row.fields[0].i32_val
-                  << ", region=" << rec.row.fields[1].string_val
-                  << ", value=" << rec.row.fields[2].i64_val << std::endl;
+        std::cout << "  Record " << i << ": id=" << rec.row.GetInt32(0)
+                  << ", region=" << rec.row.GetString(1) << ", value=" << rec.row.GetInt64(2)
+                  << std::endl;
     }
 
     // 13.2) subscribe_partition_buckets: batch subscribe to all partitions at once
@@ -551,9 +544,9 @@ int main() {
               << " records from batch partition subscription" << std::endl;
     for (size_t i = 0; i < partition_batch_records.Size(); ++i) {
         const auto& rec = partition_batch_records[i];
-        std::cout << "  Record " << i << ": id=" << rec.row.fields[0].i32_val
-                  << ", region=" << rec.row.fields[1].string_val
-                  << ", value=" << rec.row.fields[2].i64_val << std::endl;
+        std::cout << "  Record " << i << ": id=" << rec.row.GetInt32(0)
+                  << ", region=" << rec.row.GetString(1) << ", value=" << rec.row.GetInt64(2)
+                  << std::endl;
     }
 
     // Cleanup
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 3a10445516..6b9d479a7b 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -22,6 +22,7 @@
 #include <chrono>
 #include <cstdint>
 #include <memory>
+#include <stdexcept>
 #include <string>
 #include <unordered_map>
 #include <vector>
@@ -312,19 +313,13 @@ struct TableInfo {
     Schema schema;
 };
 
+namespace detail {
+struct FfiAccess;
+}
+
 struct Datum {
-    DatumType type{DatumType::Null};
-    bool bool_val{false};
-    int32_t i32_val{0};
-    int64_t i64_val{0};
-    float f32_val{0.0F};
-    double f64_val{0.0};
-    std::string string_val;
-    std::vector<uint8_t> bytes_val;
-    int32_t decimal_precision{0};  // Decimal: precision (total digits)
-    int32_t decimal_scale{0};      // Decimal: scale (digits after decimal point)
-    int64_t i128_hi{0};            // Decimal (i128): high 64 bits of unscaled value
-    int64_t i128_lo{0};            // Decimal (i128): low 64 bits of unscaled value
+    friend struct GenericRow;
+    friend struct detail::FfiAccess;
 
     static Datum Null() { return {}; }
     static Datum Bool(bool v) {
@@ -404,6 +399,29 @@ struct Datum {
         return d;
     }
 
+   private:
+    DatumType type{DatumType::Null};
+    bool bool_val{false};
+    int32_t i32_val{0};
+    int64_t i64_val{0};
+    float f32_val{0.0F};
+    double f64_val{0.0};
+    std::string string_val;
+    std::vector<uint8_t> bytes_val;
+    int32_t decimal_precision{0};  // Decimal: precision (total digits)
+    int32_t decimal_scale{0};      // Decimal: scale (digits after decimal point)
+    int64_t i128_hi{0};            // Decimal (i128): high 64 bits of unscaled value
+    int64_t i128_lo{0};            // Decimal (i128): low 64 bits of unscaled value
+
+    DatumType GetType() const { return type; }
+    bool IsNull() const { return type == DatumType::Null; }
+    bool GetBool() const { return bool_val; }
+    int32_t GetInt32() const { return i32_val; }
+    int64_t GetInt64() const { return i64_val; }
+    float GetFloat32() const { return f32_val; }
+    double GetFloat64() const { return f64_val; }
+    const std::string& GetString() const { return string_val; }
+    const std::vector<uint8_t>& GetBytes() const { return bytes_val; }
     fluss::Date GetDate() const { return {i32_val}; }
     fluss::Time GetTime() const { return {i32_val}; }
     fluss::Timestamp GetTimestamp() const { return {i64_val, i32_val}; }
@@ -428,7 +446,6 @@ struct Datum {
         return "";
     }
 
-   private:
     static std::string FormatUnscaled64(int64_t unscaled, int32_t scale) {
         bool negative = unscaled < 0;
         uint64_t abs_val =
@@ -469,7 +486,47 @@ struct Datum {
 };
 
 struct GenericRow {
-    std::vector<Datum> fields;
+    friend struct detail::FfiAccess;
+
+    size_t FieldCount() const { return fields.size(); }
+
+    DatumType GetType(size_t idx) const { return GetField(idx).GetType(); }
+    bool IsNull(size_t idx) const { return GetField(idx).IsNull(); }
+    bool GetBool(size_t idx) const { return GetTypedField(idx, DatumType::Bool).GetBool(); }
+    int32_t GetInt32(size_t idx) const { return GetTypedField(idx, DatumType::Int32).GetInt32(); }
+    int64_t GetInt64(size_t idx) const { return GetTypedField(idx, DatumType::Int64).GetInt64(); }
+    float GetFloat32(size_t idx) const {
+        return GetTypedField(idx, DatumType::Float32).GetFloat32();
+    }
+    double GetFloat64(size_t idx) const {
+        return GetTypedField(idx, DatumType::Float64).GetFloat64();
+    }
+    const std::string& GetString(size_t idx) const {
+        return GetTypedField(idx, DatumType::String).GetString();
+    }
+    const std::vector<uint8_t>& GetBytes(size_t idx) const {
+        return GetTypedField(idx, DatumType::Bytes).GetBytes();
+    }
+    fluss::Date GetDate(size_t idx) const { return GetTypedField(idx, DatumType::Date).GetDate(); }
+    fluss::Time GetTime(size_t idx) const { return GetTypedField(idx, DatumType::Time).GetTime(); }
+    fluss::Timestamp GetTimestamp(size_t idx) const {
+        const Datum& datum = GetField(idx);
+        const DatumType kind = datum.GetType();
+        if (kind == DatumType::TimestampNtz || kind == DatumType::TimestampLtz) {
+            return datum.GetTimestamp();
+        }
+        throw std::runtime_error("GenericRow: field " + std::to_string(idx) +
+                                 " is not a Timestamp type");
+    }
+    bool IsDecimal(size_t idx) const { return GetField(idx).IsDecimal(); }
+    std::string DecimalToString(size_t idx) const {
+        const Datum& datum = GetField(idx);
+        if (datum.IsDecimal()) {
+            return datum.DecimalToString();
+        }
+        throw std::runtime_error("GenericRow: field " + std::to_string(idx) +
+                                 " is not a Decimal type");
+    }
 
     void SetNull(size_t idx) {
         EnsureSize(idx);
@@ -537,6 +594,27 @@ struct GenericRow {
     }
 
    private:
+    std::vector<Datum> fields;
+
+    const Datum& GetField(size_t idx) const {
+        if (idx < fields.size()) {
+            return fields[idx];
+        }
+        throw std::runtime_error("GenericRow: index " + std::to_string(idx) +
+                                 " out of bounds (size=" + std::to_string(fields.size()) + ")");
+    }
+
+    const Datum& GetTypedField(size_t idx, DatumType expected) const {
+        const Datum& datum = GetField(idx);
+        if (datum.GetType() == expected) {
+            return datum;
+        }
+        throw std::runtime_error("GenericRow: field " + std::to_string(idx) +
+                                 " type mismatch: expected " +
+                                 std::to_string(static_cast<int>(expected)) + ", got " +
+                                 std::to_string(static_cast<int>(datum.GetType())));
+    }
+
     void EnsureSize(size_t idx) {
         if (fields.size() <= idx) {
             fields.resize(idx + 1);
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index e3e63a855c..8adcd01bb5 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -23,15 +23,94 @@
 #include "lib.rs.h"
 
 namespace fluss {
+
+namespace detail {
+// Declared a friend by Datum and GenericRow so FFI conversion can reach their private members.
+struct FfiAccess {
+    static const std::vector<Datum>& fields(const GenericRow& row) { return row.fields; }
+    static std::vector<Datum>& fields(GenericRow& row) { return row.fields; }
+    // Copy every field of `datum` into a flat FfiDatum, whatever its type tag is.
+    static ffi::FfiDatum to_ffi_datum(const Datum& datum) {
+        ffi::FfiDatum ffi_datum;
+        ffi_datum.datum_type = static_cast<int32_t>(datum.type);
+        ffi_datum.bool_val = datum.bool_val;
+        ffi_datum.i32_val = datum.i32_val;
+        ffi_datum.i64_val = datum.i64_val;
+        ffi_datum.f32_val = datum.f32_val;
+        ffi_datum.f64_val = datum.f64_val;
+        ffi_datum.string_val = rust::String(datum.string_val);
+        ffi_datum.decimal_precision = datum.decimal_precision;
+        ffi_datum.decimal_scale = datum.decimal_scale;
+        ffi_datum.i128_hi = datum.i128_hi;
+        ffi_datum.i128_lo = datum.i128_lo;
+
+        // Reserve the full size first so the copy loop does not reallocate repeatedly.
+        rust::Vec<uint8_t> bytes;
+        bytes.reserve(datum.bytes_val.size());
+        for (auto b : datum.bytes_val) {
+            bytes.push_back(b);
+        }
+        ffi_datum.bytes_val = std::move(bytes);
+
+        return ffi_datum;
+    }
+    // Rebuild a Datum from its FFI form, dispatching on the transmitted type tag.
+    static Datum from_ffi_datum(const ffi::FfiDatum& ffi_datum) {
+        auto dtype = static_cast<DatumType>(ffi_datum.datum_type);
+        switch (dtype) {
+            case DatumType::Null:
+                return Datum::Null();
+            case DatumType::Bool:
+                return Datum::Bool(ffi_datum.bool_val);
+            case DatumType::Int32:
+                return Datum::Int32(ffi_datum.i32_val);
+            case DatumType::Int64:
+                return Datum::Int64(ffi_datum.i64_val);
+            case DatumType::Float32:
+                return Datum::Float32(ffi_datum.f32_val);
+            case DatumType::Float64:
+                return Datum::Float64(ffi_datum.f64_val);
+            case DatumType::String:
+                return Datum::String(std::string(ffi_datum.string_val));
+            case DatumType::Bytes: {
+                std::vector<uint8_t> bytes(ffi_datum.bytes_val.begin(), ffi_datum.bytes_val.end());
+                return Datum::Bytes(std::move(bytes));
+            }
+            case DatumType::Date:
+                return Datum::Date(fluss::Date{ffi_datum.i32_val});
+            case DatumType::Time:
+                return Datum::Time(fluss::Time{ffi_datum.i32_val});
+            case DatumType::TimestampNtz:
+                return Datum::TimestampNtz(fluss::Timestamp{ffi_datum.i64_val, ffi_datum.i32_val});
+            case DatumType::TimestampLtz:
+                return Datum::TimestampLtz(fluss::Timestamp{ffi_datum.i64_val, ffi_datum.i32_val});
+            case DatumType::DecimalI64:
+            case DatumType::DecimalI128:
+            case DatumType::DecimalString: {
+                Datum d;
+                d.type = dtype;
+                d.i64_val = ffi_datum.i64_val;
+                d.decimal_precision = ffi_datum.decimal_precision;
+                d.decimal_scale = ffi_datum.decimal_scale;
+                d.i128_hi = ffi_datum.i128_hi;
+                d.i128_lo = ffi_datum.i128_lo;
+                if (dtype == DatumType::DecimalString) {
+                    d.string_val = std::string(ffi_datum.string_val);
+                }
+                return d;
+            }
+            default:  // unrecognised type tags are surfaced as a Null datum
+                return Datum::Null();
+        }
+    }
+};
+}  // namespace detail
+
 namespace utils {
 
-inline Result make_error(int32_t code, std::string msg) {
-    return Result{code, std::move(msg)};
-}
+inline Result make_error(int32_t code, std::string msg) { return Result{code, std::move(msg)}; }
 
-inline Result make_ok() {
-    return Result{0, {}};
-}
+inline Result make_ok() { return Result{0, {}}; }
 
 inline Result from_ffi_result(const ffi::FfiResult& ffi_result) {
     return Result{ffi_result.error_code, std::string(ffi_result.error_message)};
@@ -105,37 +184,14 @@ inline ffi::FfiTableDescriptor to_ffi_table_descriptor(const TableDescriptor& de
     return ffi_desc;
 }
 
-inline ffi::FfiDatum to_ffi_datum(const Datum& datum) {
-    ffi::FfiDatum ffi_datum;
-    ffi_datum.datum_type = static_cast<int32_t>(datum.type);
-    ffi_datum.bool_val = datum.bool_val;
-    ffi_datum.i32_val = datum.i32_val;
-    ffi_datum.i64_val = datum.i64_val;
-    ffi_datum.f32_val = datum.f32_val;
-    ffi_datum.f64_val = datum.f64_val;
-    ffi_datum.string_val = rust::String(datum.string_val);
-    ffi_datum.decimal_precision = datum.decimal_precision;
-    ffi_datum.decimal_scale = datum.decimal_scale;
-    ffi_datum.i128_hi = datum.i128_hi;
-    ffi_datum.i128_lo = datum.i128_lo;
-
-    rust::Vec<uint8_t> bytes;
-    for (auto b : datum.bytes_val) {
-        bytes.push_back(b);
-    }
-    ffi_datum.bytes_val = std::move(bytes);
-
-    return ffi_datum;
-}
-
 inline ffi::FfiGenericRow to_ffi_generic_row(const GenericRow& row) {
     ffi::FfiGenericRow ffi_row;
 
-    rust::Vec<ffi::FfiDatum> fields;
-    for (const auto& field : row.fields) {
-        fields.push_back(to_ffi_datum(field));
+    rust::Vec<ffi::FfiDatum> ffi_fields;
+    for (const auto& field : detail::FfiAccess::fields(row)) {
+        ffi_fields.push_back(detail::FfiAccess::to_ffi_datum(field));
     }
-    ffi_row.fields = std::move(fields);
+    ffi_row.fields = std::move(ffi_fields);
 
     return ffi_row;
 }
@@ -166,9 +222,8 @@ inline TableInfo from_ffi_table_info(const ffi::FfiTableInfo& ffi_info) {
 
     info.table_id = ffi_info.table_id;
     info.schema_id = ffi_info.schema_id;
-    info.table_path = TablePath{
-        std::string(ffi_info.table_path.database_name),
-        std::string(ffi_info.table_path.table_name)};
+    info.table_path = TablePath{std::string(ffi_info.table_path.database_name),
+                                std::string(ffi_info.table_path.table_name)};
     info.created_time = ffi_info.created_time;
     info.modified_time = ffi_info.modified_time;
 
@@ -198,44 +253,19 @@ inline TableInfo from_ffi_table_info(const ffi::FfiTableInfo& ffi_info) {
     return info;
 }
 
-inline Datum from_ffi_datum(const ffi::FfiDatum& ffi_datum) {
-    Datum datum;
-    datum.type = static_cast<DatumType>(ffi_datum.datum_type);
-    datum.bool_val = ffi_datum.bool_val;
-    datum.i32_val = ffi_datum.i32_val;
-    datum.i64_val = ffi_datum.i64_val;
-    datum.f32_val = ffi_datum.f32_val;
-    datum.f64_val = ffi_datum.f64_val;
-    // todo: avoid copy string
-    datum.string_val = std::string(ffi_datum.string_val);
-    datum.decimal_precision = ffi_datum.decimal_precision;
-    datum.decimal_scale = ffi_datum.decimal_scale;
-    datum.i128_hi = ffi_datum.i128_hi;
-    datum.i128_lo = ffi_datum.i128_lo;
-
-    for (auto b : ffi_datum.bytes_val) {
-        datum.bytes_val.push_back(b);
-    }
-
-    return datum;
-}
-
 inline GenericRow from_ffi_generic_row(const ffi::FfiGenericRow& ffi_row) {
     GenericRow row;
 
     for (const auto& field : ffi_row.fields) {
-        row.fields.push_back(from_ffi_datum(field));
+        detail::FfiAccess::fields(row).push_back(detail::FfiAccess::from_ffi_datum(field));
     }
 
     return row;
 }
 
 inline ScanRecord from_ffi_scan_record(const ffi::FfiScanRecord& ffi_record) {
-    return ScanRecord{
-        ffi_record.bucket_id,
-        ffi_record.offset,
-        ffi_record.timestamp,
-        from_ffi_generic_row(ffi_record.row)};
+    return ScanRecord{ffi_record.bucket_id, ffi_record.offset, ffi_record.timestamp,
+                      from_ffi_generic_row(ffi_record.row)};
 }
 
 inline ScanRecords from_ffi_scan_records(const ffi::FfiScanRecords& ffi_records) {
@@ -253,11 +283,8 @@ inline LakeSnapshot from_ffi_lake_snapshot(const ffi::FfiLakeSnapshot& ffi_snaps
     snapshot.snapshot_id = ffi_snapshot.snapshot_id;
 
     for (const auto& offset : ffi_snapshot.bucket_offsets) {
-        snapshot.bucket_offsets.push_back(BucketOffset{
-            offset.table_id,
-            offset.partition_id,
-            offset.bucket_id,
-            offset.offset});
+        snapshot.bucket_offsets.push_back(
+            BucketOffset{offset.table_id, offset.partition_id, offset.bucket_id, offset.offset});
     }
 
     return snapshot;

From 1c0b97ae8b8b433e95b41ddc60f403f2da7fef29 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 8 Feb 2026 20:21:19 +0800
Subject: [PATCH 129/287] feat: introduce database level ops for cpp bindings
 (#286)

---
 fluss-rust/bindings/cpp/BUILD.bazel           |  33 +++
 fluss-rust/bindings/cpp/CMakeLists.txt        |   6 +
 .../bindings/cpp/examples/admin_example.cpp   | 121 ++++++++++
 fluss-rust/bindings/cpp/include/fluss.hpp     |  36 +++
 fluss-rust/bindings/cpp/src/admin.cpp         | 120 ++++++++++
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |  25 +++
 fluss-rust/bindings/cpp/src/lib.rs            | 208 ++++++++++++++++++
 fluss-rust/bindings/cpp/src/types.rs          |  43 ++++
 8 files changed, 592 insertions(+)
 create mode 100644 fluss-rust/bindings/cpp/examples/admin_example.cpp

diff --git a/fluss-rust/bindings/cpp/BUILD.bazel b/fluss-rust/bindings/cpp/BUILD.bazel
index 81d483cb72..aff8f504fd 100644
--- a/fluss-rust/bindings/cpp/BUILD.bazel
+++ b/fluss-rust/bindings/cpp/BUILD.bazel
@@ -340,3 +340,36 @@ cc_binary(
     visibility = ["//visibility:public"],
 )
 
+cc_binary(
+    name = "fluss_cpp_admin_example",
+    srcs = [
+        "examples/admin_example.cpp",
+    ],
+    deps = [":fluss_cpp"],
+    copts = [
+        "-std=c++17",
+    ] + select({
+        ":debug_mode": [
+            "-g3",
+            "-O0",
+            "-ggdb",
+            "-fno-omit-frame-pointer",
+            "-DDEBUG",
+        ],
+        ":fastbuild_mode": [
+            "-g",
+            "-O0",
+        ],
+        ":release_mode": [
+            "-O2",
+            "-DNDEBUG",
+        ],
+    }),
+    linkopts = select({
+        ":debug_mode": ["-g"],
+        ":fastbuild_mode": ["-g"],
+        ":release_mode": [],
+    }),
+    visibility = ["//visibility:public"],
+)
+
diff --git a/fluss-rust/bindings/cpp/CMakeLists.txt b/fluss-rust/bindings/cpp/CMakeLists.txt
index 93cfc413fe..ae70842678 100644
--- a/fluss-rust/bindings/cpp/CMakeLists.txt
+++ b/fluss-rust/bindings/cpp/CMakeLists.txt
@@ -102,6 +102,12 @@ target_link_libraries(fluss_cpp_example PRIVATE Arrow::arrow_shared)
 target_compile_definitions(fluss_cpp_example PRIVATE ARROW_FOUND)
 target_include_directories(fluss_cpp_example PUBLIC ${CPP_INCLUDE_DIR})
 
+add_executable(fluss_cpp_admin_example examples/admin_example.cpp)
+target_link_libraries(fluss_cpp_admin_example PRIVATE fluss_cpp)
+target_link_libraries(fluss_cpp_admin_example PRIVATE Arrow::arrow_shared)
+target_compile_definitions(fluss_cpp_admin_example PRIVATE ARROW_FOUND)
+target_include_directories(fluss_cpp_admin_example PUBLIC ${CPP_INCLUDE_DIR})
+
 set_target_properties(fluss_cpp
     PROPERTIES ADDITIONAL_CLEAN_FILES ${CARGO_TARGET_DIR}
 )
diff --git a/fluss-rust/bindings/cpp/examples/admin_example.cpp b/fluss-rust/bindings/cpp/examples/admin_example.cpp
new file mode 100644
index 0000000000..7b7a333b0e
--- /dev/null
+++ b/fluss-rust/bindings/cpp/examples/admin_example.cpp
@@ -0,0 +1,121 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#include <iostream>
+#include <string>
+#include <unordered_map>
+#include <vector>
+
+#include "fluss.hpp"
+
+static void check(const char* step, const fluss::Result& r) {
+    if (!r.Ok()) {
+        std::cerr << step << " failed: code=" << r.error_code << " msg=" << r.error_message
+                  << std::endl;
+        std::exit(1);
+    }
+}
+
+int main() {
+    const std::string bootstrap = "127.0.0.1:9123";
+    const std::string db_name = "admin_example_db";
+    const std::string table_name = "admin_example_table";
+
+    // 1) Connect and get Admin
+    fluss::Connection conn;
+    check("connect", fluss::Connection::Connect(bootstrap, conn));
+
+    fluss::Admin admin;
+    check("get_admin", conn.GetAdmin(admin));
+
+    // 2) Database operations
+    std::cout << "--- Database operations ---" << std::endl;
+
+    bool exists = false;
+    check("database_exists (before create)", admin.DatabaseExists(db_name, exists));
+    std::cout << "Database " << db_name << " exists before create: " << (exists ? "yes" : "no")
+              << std::endl;
+
+    fluss::DatabaseDescriptor db_desc;
+    db_desc.comment = "Example database for Admin API";
+    db_desc.properties["owner"] = "admin_example";
+    check("create_database", admin.CreateDatabase(db_name, db_desc, true));
+
+    check("database_exists (after create)", admin.DatabaseExists(db_name, exists));
+    std::cout << "Database " << db_name << " exists after create: " << (exists ? "yes" : "no")
+              << std::endl;
+
+    fluss::DatabaseInfo db_info;
+    check("get_database_info", admin.GetDatabaseInfo(db_name, db_info));
+    std::cout << "Database info: name=" << db_info.database_name
+              << " comment=" << db_info.comment << " created_time=" << db_info.created_time
+              << std::endl;
+
+    std::vector<std::string> databases;
+    check("list_databases", admin.ListDatabases(databases));
+    std::cout << "List databases (" << databases.size() << "): ";
+    for (size_t i = 0; i < databases.size(); ++i) {
+        if (i > 0) std::cout << ", ";
+        std::cout << databases[i];
+    }
+    std::cout << std::endl;
+
+    // 3) Table operations in the new database
+    std::cout << "--- Table operations ---" << std::endl;
+
+    fluss::TablePath table_path(db_name, table_name);
+
+    bool table_exists_flag = false;
+    check("table_exists (before create)", admin.TableExists(table_path, table_exists_flag));
+    std::cout << "Table " << db_name << "." << table_name
+              << " exists before create: " << (table_exists_flag ? "yes" : "no") << std::endl;
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .Build();
+    auto descriptor = fluss::TableDescriptor::NewBuilder()
+                          .SetSchema(schema)
+                          .SetBucketCount(1)
+                          .SetComment("admin example table")
+                          .Build();
+
+    check("create_table", admin.CreateTable(table_path, descriptor, true));
+
+    check("table_exists (after create)", admin.TableExists(table_path, table_exists_flag));
+    std::cout << "Table exists after create: " << (table_exists_flag ? "yes" : "no") << std::endl;
+
+    std::vector<std::string> tables;
+    check("list_tables", admin.ListTables(db_name, tables));
+    std::cout << "List tables in " << db_name << " (" << tables.size() << "): ";
+    for (size_t i = 0; i < tables.size(); ++i) {
+        if (i > 0) std::cout << ", ";
+        std::cout << tables[i];
+    }
+    std::cout << std::endl;
+
+    // 4) Cleanup: drop table, then drop database
+    std::cout << "--- Cleanup ---" << std::endl;
+    check("drop_table", admin.DropTable(table_path, true));
+    check("drop_database", admin.DropDatabase(db_name, true, true));
+
+    check("database_exists (after drop)", admin.DatabaseExists(db_name, exists));
+    std::cout << "Database exists after drop: " << (exists ? "yes" : "no") << std::endl;
+
+    std::cout << "Admin example completed successfully." << std::endl;
+    return 0;
+}
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 6b9d479a7b..50dffaefa1 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -709,6 +709,21 @@ struct PartitionInfo {
     std::string partition_name;
 };
 
+/// Optional descriptor for Admin::CreateDatabase; leave both fields empty to use the defaults.
+struct DatabaseDescriptor {
+    std::string comment;
+    std::unordered_map<std::string, std::string> properties;
+};
+
+/// Metadata returned by GetDatabaseInfo.
+struct DatabaseInfo {
+    std::string database_name;
+    std::string comment;
+    std::unordered_map<std::string, std::string> properties;
+    int64_t created_time{0};
+    int64_t modified_time{0};
+};
+
 class AppendWriter;
 class WriteResult;
 class LogScanner;
@@ -773,6 +788,27 @@ class Admin {
                            const std::unordered_map<std::string, std::string>& partition_spec,
                            bool ignore_if_exists = false);
 
+    Result DropPartition(const TablePath& table_path,
+                         const std::unordered_map<std::string, std::string>& partition_spec,
+                         bool ignore_if_not_exists = false);
+
+    Result CreateDatabase(const std::string& database_name,
+                          const DatabaseDescriptor& descriptor,
+                          bool ignore_if_exists = false);
+
+    Result DropDatabase(const std::string& database_name, bool ignore_if_not_exists = false,
+                        bool cascade = true);
+
+    Result ListDatabases(std::vector<std::string>& out);
+
+    Result DatabaseExists(const std::string& database_name, bool& out);
+
+    Result GetDatabaseInfo(const std::string& database_name, DatabaseInfo& out);
+
+    Result ListTables(const std::string& database_name, std::vector<std::string>& out);
+
+    Result TableExists(const TablePath& table_path, bool& out);
+
    private:
     Result DoListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
                          const OffsetQuery& offset_query, std::unordered_map<int32_t, int64_t>& out,
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index 4aed78db8b..77c95d317c 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -204,4 +204,124 @@ Result Admin::CreatePartition(const TablePath& table_path,
     return utils::from_ffi_result(ffi_result);
 }
 
+Result Admin::DropPartition(const TablePath& table_path,
+                            const std::unordered_map<std::string, std::string>& partition_spec,
+                            bool ignore_if_not_exists) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_path = utils::to_ffi_table_path(table_path);
+
+    rust::Vec<ffi::FfiPartitionKeyValue> rust_spec;
+    for (const auto& [key, value] : partition_spec) {
+        ffi::FfiPartitionKeyValue kv;
+        kv.key = rust::String(key);
+        kv.value = rust::String(value);
+        rust_spec.push_back(std::move(kv));
+    }
+
+    auto ffi_result =
+        admin_->drop_partition(ffi_path, std::move(rust_spec), ignore_if_not_exists);
+    return utils::from_ffi_result(ffi_result);
+}
+
+Result Admin::CreateDatabase(const std::string& database_name,
+                             const DatabaseDescriptor& descriptor,
+                             bool ignore_if_exists) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_desc = utils::to_ffi_database_descriptor(descriptor);
+    auto ffi_result =
+        admin_->create_database(rust::Str(database_name), ffi_desc, ignore_if_exists);
+    return utils::from_ffi_result(ffi_result);
+}
+
+Result Admin::DropDatabase(const std::string& database_name, bool ignore_if_not_exists,
+                           bool cascade) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_result =
+        admin_->drop_database(rust::Str(database_name), ignore_if_not_exists, cascade);
+    return utils::from_ffi_result(ffi_result);
+}
+
+Result Admin::ListDatabases(std::vector<std::string>& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_result = admin_->list_databases();
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out.clear();
+        out.reserve(ffi_result.database_names.size());
+        for (const auto& name : ffi_result.database_names) {
+            out.push_back(std::string(name));
+        }
+    }
+    return result;
+}
+
+Result Admin::DatabaseExists(const std::string& database_name, bool& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_result = admin_->database_exists(rust::Str(database_name));
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out = ffi_result.value;
+    }
+    return result;
+}
+
+Result Admin::GetDatabaseInfo(const std::string& database_name, DatabaseInfo& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_result = admin_->get_database_info(rust::Str(database_name));
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out = utils::from_ffi_database_info(ffi_result.database_info);
+    }
+    return result;
+}
+
+Result Admin::ListTables(const std::string& database_name, std::vector<std::string>& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_result = admin_->list_tables(rust::Str(database_name));
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out.clear();
+        out.reserve(ffi_result.table_names.size());
+        for (const auto& name : ffi_result.table_names) {
+            out.push_back(std::string(name));
+        }
+    }
+    return result;
+}
+
+Result Admin::TableExists(const TablePath& table_path, bool& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Admin not available");
+    }
+
+    auto ffi_path = utils::to_ffi_table_path(table_path);
+    auto ffi_result = admin_->table_exists(ffi_path);
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out = ffi_result.value;
+    }
+    return result;
+}
+
 }  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 8adcd01bb5..8fc8415543 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -290,5 +290,30 @@ inline LakeSnapshot from_ffi_lake_snapshot(const ffi::FfiLakeSnapshot& ffi_snaps
     return snapshot;
 }
 
+inline ffi::FfiDatabaseDescriptor to_ffi_database_descriptor(
+    const DatabaseDescriptor& desc) {
+    ffi::FfiDatabaseDescriptor ffi_desc;
+    ffi_desc.comment = rust::String(desc.comment);
+    for (const auto& [k, v] : desc.properties) {
+        ffi::HashMapValue kv;
+        kv.key = rust::String(k);
+        kv.value = rust::String(v);
+        ffi_desc.properties.push_back(std::move(kv));
+    }
+    return ffi_desc;
+}
+
+inline DatabaseInfo from_ffi_database_info(const ffi::FfiDatabaseInfo& ffi_info) {
+    DatabaseInfo info;
+    info.database_name = std::string(ffi_info.database_name);
+    info.comment = std::string(ffi_info.comment);
+    info.created_time = ffi_info.created_time;
+    info.modified_time = ffi_info.modified_time;
+    for (const auto& prop : ffi_info.properties) {
+        info.properties[std::string(prop.key)] = std::string(prop.value);
+    }
+    return info;
+}
+
 }  // namespace utils
 }  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 235d282fc5..5f3e7e96dd 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -202,6 +202,39 @@ mod ffi {
         partition_infos: Vec<FfiPartitionInfo>,
     }
 
+    struct FfiDatabaseDescriptor {
+        comment: String,
+        properties: Vec<HashMapValue>,
+    }
+
+    struct FfiDatabaseInfo {
+        database_name: String,
+        comment: String,
+        properties: Vec<HashMapValue>,
+        created_time: i64,
+        modified_time: i64,
+    }
+
+    struct FfiDatabaseInfoResult {
+        result: FfiResult,
+        database_info: FfiDatabaseInfo,
+    }
+
+    struct FfiListDatabasesResult {
+        result: FfiResult,
+        database_names: Vec<String>,
+    }
+
+    struct FfiListTablesResult {
+        result: FfiResult,
+        table_names: Vec<String>,
+    }
+
+    struct FfiBoolResult {
+        result: FfiResult,
+        value: bool,
+    }
+
     extern "Rust" {
         type Connection;
         type Admin;
@@ -257,6 +290,29 @@ mod ffi {
             partition_spec: Vec<FfiPartitionKeyValue>,
             ignore_if_exists: bool,
         ) -> FfiResult;
+        fn drop_partition(
+            self: &Admin,
+            table_path: &FfiTablePath,
+            partition_spec: Vec<FfiPartitionKeyValue>,
+            ignore_if_not_exists: bool,
+        ) -> FfiResult;
+        fn create_database(
+            self: &Admin,
+            database_name: &str,
+            descriptor: &FfiDatabaseDescriptor,
+            ignore_if_exists: bool,
+        ) -> FfiResult;
+        fn drop_database(
+            self: &Admin,
+            database_name: &str,
+            ignore_if_not_exists: bool,
+            cascade: bool,
+        ) -> FfiResult;
+        fn list_databases(self: &Admin) -> FfiListDatabasesResult;
+        fn database_exists(self: &Admin, database_name: &str) -> FfiBoolResult;
+        fn get_database_info(self: &Admin, database_name: &str) -> FfiDatabaseInfoResult;
+        fn list_tables(self: &Admin, database_name: &str) -> FfiListTablesResult;
+        fn table_exists(self: &Admin, table_path: &FfiTablePath) -> FfiBoolResult;
 
         // Table
         unsafe fn delete_table(table: *mut Table);
@@ -661,6 +717,158 @@ impl Admin {
             Err(e) => err_result(1, e.to_string()),
         }
     }
+
+    fn drop_partition(
+        &self,
+        table_path: &ffi::FfiTablePath,
+        partition_spec: Vec<ffi::FfiPartitionKeyValue>,
+        ignore_if_not_exists: bool,
+    ) -> ffi::FfiResult {
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+        let spec_map: std::collections::HashMap<String, String> = partition_spec
+            .into_iter()
+            .map(|kv| (kv.key, kv.value))
+            .collect();
+        let partition_spec = fcore::metadata::PartitionSpec::new(spec_map);
+
+        let result = RUNTIME.block_on(async {
+            self.inner
+                .drop_partition(&path, &partition_spec, ignore_if_not_exists)
+                .await
+        });
+
+        match result {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
+
+    fn create_database(
+        &self,
+        database_name: &str,
+        descriptor: &ffi::FfiDatabaseDescriptor,
+        ignore_if_exists: bool,
+    ) -> ffi::FfiResult {
+        let descriptor_opt = types::ffi_database_descriptor_to_core(descriptor);
+
+        let result = RUNTIME.block_on(async {
+            self.inner
+                .create_database(database_name, ignore_if_exists, descriptor_opt.as_ref())
+                .await
+        });
+
+        match result {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
+
+    fn drop_database(
+        &self,
+        database_name: &str,
+        ignore_if_not_exists: bool,
+        cascade: bool,
+    ) -> ffi::FfiResult {
+        let result = RUNTIME.block_on(async {
+            self.inner
+                .drop_database(database_name, ignore_if_not_exists, cascade)
+                .await
+        });
+
+        match result {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
+
+    fn list_databases(&self) -> ffi::FfiListDatabasesResult {
+        let result = RUNTIME.block_on(async { self.inner.list_databases().await });
+
+        match result {
+            Ok(names) => ffi::FfiListDatabasesResult {
+                result: ok_result(),
+                database_names: names,
+            },
+            Err(e) => ffi::FfiListDatabasesResult {
+                result: err_result(1, e.to_string()),
+                database_names: vec![],
+            },
+        }
+    }
+
+    fn database_exists(&self, database_name: &str) -> ffi::FfiBoolResult {
+        let result = RUNTIME.block_on(async { self.inner.database_exists(database_name).await });
+
+        match result {
+            Ok(exists) => ffi::FfiBoolResult {
+                result: ok_result(),
+                value: exists,
+            },
+            Err(e) => ffi::FfiBoolResult {
+                result: err_result(1, e.to_string()),
+                value: false,
+            },
+        }
+    }
+
+    fn get_database_info(&self, database_name: &str) -> ffi::FfiDatabaseInfoResult {
+        let result = RUNTIME.block_on(async { self.inner.get_database_info(database_name).await });
+
+        match result {
+            Ok(info) => ffi::FfiDatabaseInfoResult {
+                result: ok_result(),
+                database_info: types::core_database_info_to_ffi(&info),
+            },
+            Err(e) => ffi::FfiDatabaseInfoResult {
+                result: err_result(1, e.to_string()),
+                database_info: ffi::FfiDatabaseInfo {
+                    database_name: String::new(),
+                    comment: String::new(),
+                    properties: vec![],
+                    created_time: 0,
+                    modified_time: 0,
+                },
+            },
+        }
+    }
+
+    fn list_tables(&self, database_name: &str) -> ffi::FfiListTablesResult {
+        let result = RUNTIME.block_on(async { self.inner.list_tables(database_name).await });
+
+        match result {
+            Ok(names) => ffi::FfiListTablesResult {
+                result: ok_result(),
+                table_names: names,
+            },
+            Err(e) => ffi::FfiListTablesResult {
+                result: err_result(1, e.to_string()),
+                table_names: vec![],
+            },
+        }
+    }
+
+    fn table_exists(&self, table_path: &ffi::FfiTablePath) -> ffi::FfiBoolResult {
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+
+        let result = RUNTIME.block_on(async { self.inner.table_exists(&path).await });
+
+        match result {
+            Ok(exists) => ffi::FfiBoolResult {
+                result: ok_result(),
+                value: exists,
+            },
+            Err(e) => ffi::FfiBoolResult {
+                result: err_result(1, e.to_string()),
+                value: false,
+            },
+        }
+    }
 }
 
 // Table implementation
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 05d3d6a1d2..65b9b0409f 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -250,6 +250,49 @@ pub fn empty_table_info() -> ffi::FfiTableInfo {
     }
 }
 
+/// Convert FFI database descriptor to core. Returns None if descriptor is effectively empty
+/// (no comment and no properties), so create_database can pass Option::None to core.
+pub fn ffi_database_descriptor_to_core(
+    d: &ffi::FfiDatabaseDescriptor,
+) -> Option<fcore::metadata::DatabaseDescriptor> {
+    if d.comment.is_empty() && d.properties.is_empty() {
+        return None;
+    }
+    let mut builder = fcore::metadata::DatabaseDescriptor::builder();
+    if !d.comment.is_empty() {
+        builder = builder.comment(&d.comment);
+    }
+    if !d.properties.is_empty() {
+        let props: std::collections::HashMap<String, String> = d
+            .properties
+            .iter()
+            .map(|kv| (kv.key.clone(), kv.value.clone()))
+            .collect();
+        builder = builder.custom_properties(props);
+    }
+    Some(builder.build())
+}
+
+/// Convert core DatabaseInfo to FFI.
+pub fn core_database_info_to_ffi(info: &fcore::metadata::DatabaseInfo) -> ffi::FfiDatabaseInfo {
+    let desc = info.database_descriptor();
+    let properties: Vec<ffi::HashMapValue> = desc
+        .custom_properties()
+        .iter()
+        .map(|(k, v)| ffi::HashMapValue {
+            key: k.clone(),
+            value: v.clone(),
+        })
+        .collect();
+    ffi::FfiDatabaseInfo {
+        database_name: info.database_name().to_string(),
+        comment: desc.comment().unwrap_or("").to_string(),
+        properties,
+        created_time: info.created_time(),
+        modified_time: info.modified_time(),
+    }
+}
+
 /// Look up decimal (precision, scale) from schema for column `idx`.
 fn get_decimal_type(idx: usize, schema: Option<&fcore::metadata::Schema>) -> Result<(u32, u32)> {
     let col = schema

From ecb12288d2885274de45e68bf55c9b84e4f8793d Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Sun, 8 Feb 2026 20:51:53 +0800
Subject: [PATCH 130/287] doc: introduce how to verify a release document
 (#282)

---
 fluss-rust/bindings/cpp/README.md             |  57 +++++++
 fluss-rust/bindings/python/README.md          |   7 +
 fluss-rust/crates/fluss/README.md             |  43 ++++++
 fluss-rust/docs/creating-a-release.md         |  16 +-
 .../docs/verifying-a-release-candidate.md     | 142 ++++++++++++++++++
 fluss-rust/scripts/release.sh                 |  13 +-
 6 files changed, 265 insertions(+), 13 deletions(-)
 create mode 100644 fluss-rust/bindings/cpp/README.md
 create mode 100644 fluss-rust/crates/fluss/README.md
 create mode 100644 fluss-rust/docs/verifying-a-release-candidate.md

diff --git a/fluss-rust/bindings/cpp/README.md b/fluss-rust/bindings/cpp/README.md
new file mode 100644
index 0000000000..2556a4b6c8
--- /dev/null
+++ b/fluss-rust/bindings/cpp/README.md
@@ -0,0 +1,57 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# Apache Fluss™ C++ Bindings (Incubating)
+
+C++ bindings for Fluss, built on top of the [fluss-rust](../../crates/fluss) client. The API is exposed via a C++ header ([include/fluss.hpp](include/fluss.hpp)) and implemented with Rust FFI.
+
+## Requirements
+
+- Rust (see [rust-toolchain.toml](../../rust-toolchain.toml) at repo root)
+- C++17-capable compiler
+- CMake 3.18+ and/or Bazel
+- Apache Arrow (for Arrow-based APIs)
+
+## Build
+
+From the repository root or from `bindings/cpp`:
+
+**With CMake:**
+
+```bash
+cd bindings/cpp
+mkdir build && cd build
+cmake ..
+cmake --build .
+```
+
+**With Bazel:**
+
+```bash
+cd bindings/cpp
+bazel build //...
+```
+See [ci.sh](ci.sh) for the CI build sequence.
+
+
+## TODO
+
+- [ ] Document how to use fluss-cpp in your own project; the [OpenDAL C++ bindings README](https://github.com/apache/opendal/blob/main/bindings/cpp/README.md) is a good reference.
+- [ ] Add CMake/Bazel install and packaging instructions.
+- [ ] Document API usage and minimal example in this README.
+- [ ] Add more C++ examples (log scan, upsert, etc.).
diff --git a/fluss-rust/bindings/python/README.md b/fluss-rust/bindings/python/README.md
index 44d6099c6c..b0970397f5 100644
--- a/fluss-rust/bindings/python/README.md
+++ b/fluss-rust/bindings/python/README.md
@@ -53,6 +53,8 @@ Used for writing data to tables, supports PyArrow and Pandas
 
 Used for scanning table log data
 
+
+<!-- TODO: we may move the following part to DEVELOPMENT.md -->
 ## Development
 
 ## Requirements
@@ -143,6 +145,11 @@ bindings/python/
     └── example.py
 ```
 
+## TODO
+
+- [ ] Add basic usage examples in API Overview (code snippets for Config, FlussConnection, FlussAdmin, FlussTable).
+- [ ] Add a "Verifying a release" subsection with install-from-TestPyPI/PyPI and smoke-test steps.
+
 ## License
 
 Apache 2.0 License
diff --git a/fluss-rust/crates/fluss/README.md b/fluss-rust/crates/fluss/README.md
new file mode 100644
index 0000000000..bee8ce8450
--- /dev/null
+++ b/fluss-rust/crates/fluss/README.md
@@ -0,0 +1,43 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# Apache Fluss™ Rust Client (Incubating)
+
+Rust client library for [Apache Fluss™](https://fluss.apache.org/). This crate provides the core client used by the fluss-rust workspace and by the Python and C++ bindings.
+
+<!-- TODO: move "how to use" to the top and "how to build" to the end;
+https://github.com/apache/opendal/blob/main/core/README.md is a good reference. -->
+
+## Requirements
+
+- Rust (see [rust-toolchain.toml](../../rust-toolchain.toml) at repo root)
+- protobuf (for build)
+
+## Build
+
+From the repository root:
+
+```bash
+cargo build -p fluss-rs
+```
+
+## Quick start and examples
+
+## TODO
+- [ ] Expand API documentation and usage examples in this README.
+- [ ] Add more examples for table, log scan, and write flows.
diff --git a/fluss-rust/docs/creating-a-release.md b/fluss-rust/docs/creating-a-release.md
index 95714d9824..164b64b770 100644
--- a/fluss-rust/docs/creating-a-release.md
+++ b/fluss-rust/docs/creating-a-release.md
@@ -217,11 +217,13 @@ just release $RELEASE_VERSION
 
 This creates under `dist/`:
 
-- `fluss-rust-${RELEASE_VERSION}.tar.gz`
-- `fluss-rust-${RELEASE_VERSION}.tar.gz.sha512`
-- `fluss-rust-${RELEASE_VERSION}.tar.gz.asc`
+- `fluss-rust-${RELEASE_VERSION}-incubating.tgz`
+- `fluss-rust-${RELEASE_VERSION}-incubating.tgz.sha512`
+- `fluss-rust-${RELEASE_VERSION}-incubating.tgz.asc`
 
-Verify with: `gpg --verify dist/fluss-rust-${RELEASE_VERSION}.tar.gz.asc dist/fluss-rust-${RELEASE_VERSION}.tar.gz`
+(Incubator policy requires the word "incubating" in release artifact names.)
+
+Verify with: `gpg --verify dist/fluss-rust-${RELEASE_VERSION}-incubating.tgz.asc dist/fluss-rust-${RELEASE_VERSION}-incubating.tgz`
 
 ### 4. Stage artifacts to SVN (dist.apache.org dev)
 
@@ -231,7 +233,7 @@ From the **fluss-rust** repo root, check out the Fluss dev area and add the rele
 svn checkout https://dist.apache.org/repos/dist/dev/incubator/fluss fluss-dist-dev --depth=immediates
 cd fluss-dist-dev
 mkdir $SVN_RC_DIR
-cp ../dist/fluss-rust-${RELEASE_VERSION}.* $SVN_RC_DIR/
+cp ../dist/fluss-rust-${RELEASE_VERSION}-incubating.* $SVN_RC_DIR/
 svn add $SVN_RC_DIR
 svn status
 svn commit -m "Add fluss-rust ${RELEASE_VERSION} RC${RC_NUM}"
@@ -282,7 +284,7 @@ PyPI (release) / TestPyPI (RC):
 * https://pypi.org/project/pyfluss/
 * https://test.pypi.org/project/pyfluss/
 
-Please download, verify, and test. Verification steps are in the project docs (todo: add how to verify release).
+Please download, verify, and test. Verification steps are in [How to Verify a Release Candidate](verifying-a-release-candidate.md).
 
 The vote will be open for at least 72 hours. It is adopted by majority approval with at least 3 PPMC affirmative votes (or as per project policy).
 
@@ -449,5 +451,5 @@ After finishing the release, consider what could be improved (simplifications, c
 ## See also
 
 - [Release Manager Preparation](https://fluss.apache.org/community/how-to-release/release-manager-preparation/) — GPG and one-time setup
-- [Verifying a Fluss Release](https://fluss.apache.org/community/how-to-release/verifying-a-fluss-release/) — How to verify artifacts (adapt for fluss-rust source tarball)
+- [How to Verify a Release Candidate](verifying-a-release-candidate.md) — Verify signatures, checksums, build, and tests for a release candidate
 - [ASF Release Policy](https://www.apache.org/legal/release-policy.html)
diff --git a/fluss-rust/docs/verifying-a-release-candidate.md b/fluss-rust/docs/verifying-a-release-candidate.md
new file mode 100644
index 0000000000..e67d4efc7b
--- /dev/null
+++ b/fluss-rust/docs/verifying-a-release-candidate.md
@@ -0,0 +1,142 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# How to Verify a Release Candidate
+
+This document describes how to verify a release candidate (RC) of the **Fluss clients** (fluss-rust, fluss-python, fluss-cpp) from the [fluss-rust](https://github.com/apache/fluss-rust) repository. It is intended for anyone participating in the release vote (binding or non-binding) and is based on [Verifying a Fluss Release](https://fluss.apache.org/community/how-to-release/verifying-a-fluss-release/) of the Apache Fluss project, adapted for the fluss-rust source distribution and tooling (Rust, Python, C++).
+
+## Validating distributions
+
+The release vote email includes links to:
+
+- **Distribution archive:** source tarball (`fluss-rust-${RELEASE_VERSION}-incubating.tgz`) on [dist.apache.org dev](https://dist.apache.org/repos/dist/dev/incubator/fluss/)
+- **Signature file:** `fluss-rust-${RELEASE_VERSION}-incubating.tgz.asc`
+- **Checksum file:** `fluss-rust-${RELEASE_VERSION}-incubating.tgz.sha512`
+- **KEYS file:** [https://downloads.apache.org/incubator/fluss/KEYS](https://downloads.apache.org/incubator/fluss/KEYS)
+
+Download the archive (`.tgz`), `.asc`, and `.sha512` from the RC directory (e.g. `fluss-rust-0.1.0-rc1/`) and the KEYS file. Then follow the steps below to verify signatures and checksums.
+
+## Verifying signatures
+
+First, import the keys into your local keyring:
+
+```bash
+curl https://downloads.apache.org/incubator/fluss/KEYS -o KEYS
+gpg --import KEYS
+```
+
+Next, verify all `.asc` files:
+
+```bash
+for i in *.tgz; do echo $i; gpg --verify $i.asc $i; done
+```
+
+If verification succeeds, you will see a message like:
+
+```text
+gpg: Signature made ...
+gpg: using RSA key ...
+gpg: Good signature from "Release Manager Name (CODE SIGNING KEY) <...@apache.org>"
+```
+
+## Verifying checksums
+
+Next, verify the tarball(s) using the provided `.sha512` file(s). Each `.sha512` file lists the expected SHA-512 hash for the corresponding archive; `-c` reads that file and checks the archive.
+
+**On macOS (shasum):**
+
+```bash
+shasum -a 512 -c fluss-rust-${RELEASE_VERSION}-incubating.tgz.sha512
+```
+
+**On Linux (sha512sum):**
+
+```bash
+sha512sum -c fluss-rust-${RELEASE_VERSION}-incubating.tgz.sha512
+```
+
+If you have multiple archives, run `-c` on each `.sha512` file (or use `shasum -a 512 -c *.sha512` / `sha512sum -c *.sha512`).
+
+If the verification is successful, you will see a message like this:
+
+```text
+fluss-rust-0.1.0-incubating.tgz: OK
+```
+
+## Verifying build
+
+Extract the source release archive and verify that it builds (and optionally that tests pass). You need **Rust** (see [rust-toolchain.toml](https://github.com/apache/fluss-rust/blob/main/rust-toolchain.toml) for the expected version) and, for full builds, **protobuf** and **Python 3.9+** for bindings.
+
+```bash
+tar -xzf fluss-rust-${RELEASE_VERSION}-incubating.tgz
+cd fluss-rust-${RELEASE_VERSION}-incubating
+```
+
+Build the workspace:
+
+```bash
+cargo build --workspace --release
+```
+
+For Python bindings, see the project [README](https://github.com/apache/fluss-rust#readme) and [Development Guide](https://github.com/apache/fluss-rust/blob/main/DEVELOPMENT.md). For C++ bindings, see `bindings/cpp/`.
+
+## Verifying LICENSE and NOTICE
+
+Extract the source release archive and verify that:
+
+1. The **LICENSE** and **NOTICE** files in the root directory are correct and refer to dependencies in the source release (e.g. files in the repository such as fonts, CSS, JavaScript, images).
+2. All files that need it have ASF license headers.
+3. All dependencies have been checked for their license and the license is ASL 2.0 compatible ([ASF third-party license policy](http://www.apache.org/legal/resolved.html#category-x)).
+4. Compatible non-ASL 2.0 licenses are documented (e.g. in NOTICE or in dependency audit files such as `DEPENDENCIES*.tsv`).
+
+The project uses [cargo-deny](https://embarkstudios.github.io/cargo-deny/) for license checks; see [Creating a Fluss Rust Client Release](creating-a-release.md) for how the dependency list is generated before a release.
+
+## Testing features
+
+For any user-facing feature included in a release, we aim to ensure it is functional, usable, and well-documented. Release managers may create testing issues that outline key scenarios to validate; these are open to all community members.
+
+**Per-language verification:** For **Rust** and **C++**, build from the source release and write your own test cases to verify. For **Python**, the RC is published to **TestPyPI**; install the client from TestPyPI and write your own test cases (e.g. connect, create table, read/write) to verify. Use the README in each component as the entry point:
+
+- **Rust client:** You can depend on the RC via its git tag (e.g. in your `Cargo.toml`: `fluss-rs = { git = "https://github.com/apache/fluss-rust", tag = "v${RELEASE_VERSION}-rc${RC_NUM}" }`) and build your own test project to verify. Alternatively, build from the source release; see [crates/fluss/README.md](../crates/fluss/README.md).
+- **Python bindings:** See [bindings/python/README.md](../bindings/python/README.md) for how to add the Python client (for an RC, install from **TestPyPI**: `pip install -i https://test.pypi.org/simple/ pyfluss==${RELEASE_VERSION}`); then write test cases to verify.
+- **C++ bindings:** See [bindings/cpp/README.md](../bindings/cpp/README.md) for how to build and link the C++ client; then write test cases to verify.
+
+## Incubator release checklist
+
+If the project is in incubation, the ASF Incubator provides a release checklist. You can refer to it when verifying the release:
+
+- [Incubator Release Checklist](https://cwiki.apache.org/confluence/display/INCUBATOR/Incubator+Release+Checklist)
+
+## Voting
+
+Votes are cast by replying to the vote email on the dev mailing list with **+1**, **0**, or **-1**.
+
+In addition to your vote, it is customary to state whether your vote is **binding** or **non-binding**. Only members of the PPMC and mentors have formally binding votes (and the IPMC on the Incubator general list). If unsure, you can state that your vote is non-binding. See [Apache Foundation Voting](https://www.apache.org/foundation/voting.html).
+
+It is recommended to include a short list of what you verified (e.g. signatures, checksums, build, tests, LICENSE/NOTICE). This helps the community see what has been checked and what might still be missing.
+
+**Checklist you can reference in your vote:**
+
+- [ ] [Validating distributions](#validating-distributions)
+- [ ] [Verifying signatures](#verifying-signatures)
+- [ ] [Verifying checksums](#verifying-checksums)
+- [ ] [Verifying build](#verifying-build)
+- [ ] [Verifying LICENSE and NOTICE](#verifying-license-and-notice)
+- [ ] [Testing features](#testing-features)
+- [ ] [Incubator release checklist](#incubator-release-checklist) (if applicable)
+
diff --git a/fluss-rust/scripts/release.sh b/fluss-rust/scripts/release.sh
index 8187d1fd44..e4e6b07939 100755
--- a/fluss-rust/scripts/release.sh
+++ b/fluss-rust/scripts/release.sh
@@ -14,10 +14,11 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
-# Create ASF source release artifacts under dist/:
-#   fluss-rust-{version}.tar.gz
-#   fluss-rust-{version}.tar.gz.asc
-#   fluss-rust-{version}.tar.gz.sha512
+# Create ASF source release artifacts under dist/ (aligned with Fluss release package format):
+#   fluss-rust-{version}-incubating.tgz
+#   fluss-rust-{version}-incubating.tgz.asc
+#   fluss-rust-{version}-incubating.tgz.sha512
+# (Incubator policy requires "incubating" in the artifact name.)
 # Run from repo root. Check out the release tag first (e.g. git checkout v0.1.0-rc1).
 # Usage: ./scripts/release.sh [version]
 #   If version is omitted, it is read from Cargo.toml (workspace.package.version).
@@ -37,9 +38,9 @@ else
   fi
 fi
 
-PREFIX="fluss-rust-${VERSION}"
+PREFIX="fluss-rust-${VERSION}-incubating"
 DIST_DIR="${REPO_ROOT}/dist"
-TARBALL="${PREFIX}.tar.gz"
+TARBALL="${PREFIX}.tgz"
 
 echo "Creating ASF source release for fluss-rust ${VERSION}"
 mkdir -p "$DIST_DIR"

From f3a42f1d9d20a7443a26928003fca39cf7309a76 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 9 Feb 2026 07:14:26 +0000
Subject: [PATCH 131/287] chore: cleanup and fix partial update in python
 (#292)

---
 fluss-rust/bindings/python/example/example.py |  43 ++++
 fluss-rust/bindings/python/fluss/__init__.pyi |   7 +-
 fluss-rust/bindings/python/src/lib.rs         |   1 +
 fluss-rust/bindings/python/src/lookup.rs      |   5 +-
 fluss-rust/bindings/python/src/table.rs       | 195 +++++-------------
 fluss-rust/bindings/python/src/upsert.rs      |  41 +++-
 .../crates/fluss/src/client/table/mod.rs      |   1 +
 7 files changed, 128 insertions(+), 165 deletions(-)

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 732b7dff76..9f8cafa33a 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -569,6 +569,49 @@ async def main():
         print(f"Error during delete: {e}")
         traceback.print_exc()
 
+    # --- Test Partial Update by column names ---
+    print("\n--- Testing Partial Update (by column names) ---")
+    try:
+        partial_writer = pk_table.new_upsert(columns=["user_id", "balance"])
+        handle = partial_writer.upsert({"user_id": 1, "balance": Decimal("9999.99")})
+        await handle.wait()
+        print("Partial update: set balance=9999.99 for user_id=1")
+
+        lookuper = pk_table.new_lookup()
+        result = await lookuper.lookup({"user_id": 1})
+        if result:
+            print(f"Partial update verified:"
+                  f"\n  name={result['name']} (unchanged)"
+                  f"\n  balance={result['balance']} (updated)")
+        else:
+            print("ERROR: Expected to find user_id=1")
+
+    except Exception as e:
+        print(f"Error during partial update by names: {e}")
+        traceback.print_exc()
+
+    # --- Test Partial Update by column indices ---
+    print("\n--- Testing Partial Update (by column indices) ---")
+    try:
+        # Columns: 0=user_id (PK), 1=name — update name only
+        partial_writer_idx = pk_table.new_upsert(column_indices=[0, 1])
+        handle = partial_writer_idx.upsert([1, "Alice Renamed"])
+        await handle.wait()
+        print("Partial update by indices: set name='Alice Renamed' for user_id=1")
+
+        lookuper = pk_table.new_lookup()
+        result = await lookuper.lookup({"user_id": 1})
+        if result:
+            print(f"Partial update by indices verified:"
+                  f"\n  name={result['name']} (updated)"
+                  f"\n  balance={result['balance']} (unchanged)")
+        else:
+            print("ERROR: Expected to find user_id=1")
+
+    except Exception as e:
+        print(f"Error during partial update by indices: {e}")
+        traceback.print_exc()
+
     # Demo: Column projection using builder pattern
     print("\n--- Testing Column Projection ---")
     try:
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index a9ef828aac..cc7053e4e2 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -378,15 +378,14 @@ class AppendWriter:
             WriteResultHandle: Ignore for fire-and-forget, or await handle.wait() for acknowledgement.
 
         Supported Types:
-            Currently supports primitive types only:
             - Boolean, TinyInt, SmallInt, Int, BigInt (integers)
             - Float, Double (floating point)
             - String, Char (text)
             - Bytes, Binary (binary data)
+            - Date, Time, Timestamp, TimestampLTZ (temporal)
+            - Decimal (arbitrary precision)
             - Null values
 
-            Temporal types (Date, Timestamp, Decimal) are not yet supported.
-
         Example:
             writer.append({'id': 1, 'name': 'Alice', 'score': 95.5})
             writer.append([1, 'Alice', 95.5])
@@ -712,5 +711,7 @@ class OffsetType:
 
 # Constant for earliest offset (-2)
 EARLIEST_OFFSET: int
+# Constant for latest offset (-1)
+LATEST_OFFSET: int
 
 __version__: str
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 41f8de5447..094dc0062f 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -96,6 +96,7 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
 
     // Register constants
     m.add("EARLIEST_OFFSET", fcore::client::EARLIEST_OFFSET)?;
+    m.add("LATEST_OFFSET", fcore::client::LATEST_OFFSET)?;
 
     // Register exception types
     m.add_class::<FlussError>()?;
diff --git a/fluss-rust/bindings/python/src/lookup.rs b/fluss-rust/bindings/python/src/lookup.rs
index 8d91a6198b..e5c1f62313 100644
--- a/fluss-rust/bindings/python/src/lookup.rs
+++ b/fluss-rust/bindings/python/src/lookup.rs
@@ -15,7 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::table::{internal_row_to_dict, python_pk_to_generic_row};
+use crate::table::{internal_row_to_dict, python_to_sparse_generic_row};
 use crate::*;
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::sync::Arc;
@@ -52,7 +52,8 @@ impl Lookuper {
         py: Python<'py>,
         pk: &Bound<'_, PyAny>,
     ) -> PyResult<Bound<'py, PyAny>> {
-        let generic_row = python_pk_to_generic_row(pk, &self.table_info)?;
+        let pk_indices = self.table_info.get_schema().primary_key_indexes();
+        let generic_row = python_to_sparse_generic_row(pk, &self.table_info, &pk_indices)?;
         let inner = self.inner.clone();
         let table_info = self.table_info.clone();
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index cb203dc67a..81acf0083d 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -639,124 +639,51 @@ enum RowInput<'py> {
     List(Bound<'py, pyo3::types::PyList>),
 }
 
-/// Helper function to process sequence types (list/tuple) into datums
-fn process_sequence_to_datums<'a, I>(
-    values: I,
-    len: usize,
-    fields: &[fcore::metadata::DataField],
-) -> PyResult<Vec<fcore::row::Datum<'static>>>
-where
-    I: Iterator<Item = Bound<'a, PyAny>>,
-{
-    if len != fields.len() {
-        return Err(FlussError::new_err(format!(
-            "Expected {} values, got {}",
-            fields.len(),
-            len
-        )));
-    }
-
-    let mut datums = Vec::with_capacity(fields.len());
-    for (i, (field, value)) in fields.iter().zip(values).enumerate() {
-        datums.push(
-            python_value_to_datum(&value, field.data_type()).map_err(|e| {
-                FlussError::new_err(format!("Field '{}' (index {}): {}", field.name(), i, e))
-            })?,
-        );
-    }
-    Ok(datums)
-}
-
-/// Convert Python row (dict/list/tuple) to GenericRow based on schema
+/// Convert Python row (dict/list/tuple) to GenericRow requiring all schema columns.
 pub fn python_to_generic_row(
     row: &Bound<PyAny>,
     table_info: &fcore::metadata::TableInfo,
 ) -> PyResult<fcore::row::GenericRow<'static>> {
-    // Extract with user-friendly error message
-    let row_input: RowInput = row.extract().map_err(|_| {
-        let type_name = row
-            .get_type()
-            .name()
-            .map(|n| n.to_string())
-            .unwrap_or_else(|_| "unknown".to_string());
-        FlussError::new_err(format!(
-            "Row must be a dict, list, or tuple; got {type_name}"
-        ))
-    })?;
-    let schema = table_info.row_type();
-    let fields = schema.fields();
-
-    let datums = match row_input {
-        RowInput::Dict(dict) => {
-            // Strict: reject unknown keys (and also reject non-str keys nicely)
-            for (k, _) in dict.iter() {
-                let key_str = k.extract::<&str>().map_err(|_| {
-                    let key_type = k
-                        .get_type()
-                        .name()
-                        .map(|n| n.to_string())
-                        .unwrap_or_else(|_| "unknown".to_string());
-                    FlussError::new_err(format!("Row dict keys must be strings; got {key_type}"))
-                })?;
-
-                if fields.iter().all(|f| f.name() != key_str) {
-                    let expected = fields
-                        .iter()
-                        .map(|f| f.name())
-                        .collect::<Vec<_>>()
-                        .join(", ");
-                    return Err(FlussError::new_err(format!(
-                        "Unknown field '{key_str}'. Expected fields: {expected}"
-                    )));
-                }
-            }
-
-            let mut datums = Vec::with_capacity(fields.len());
-            for field in fields {
-                let value = dict.get_item(field.name())?.ok_or_else(|| {
-                    FlussError::new_err(format!("Missing field: {}", field.name()))
-                })?;
-                datums.push(
-                    python_value_to_datum(&value, field.data_type()).map_err(|e| {
-                        FlussError::new_err(format!("Field '{}': {}", field.name(), e))
-                    })?,
-                );
-            }
-            datums
-        }
-
-        RowInput::List(list) => process_sequence_to_datums(list.iter(), list.len(), fields)?,
-
-        RowInput::Tuple(tuple) => process_sequence_to_datums(tuple.iter(), tuple.len(), fields)?,
-    };
+    let all_indices: Vec<usize> = (0..table_info.row_type().fields().len()).collect();
+    python_to_sparse_generic_row(row, table_info, &all_indices)
+}
 
-    Ok(fcore::row::GenericRow { values: datums })
+/// Process a Python sequence (list or tuple) into datums at the target column positions.
+fn process_sequence(
+    seq: &Bound<pyo3::types::PySequence>,
+    target_indices: &[usize],
+    fields: &[fcore::metadata::DataField],
+    datums: &mut [fcore::row::Datum<'static>],
+) -> PyResult<()> {
+    if seq.len()? != target_indices.len() {
+        return Err(FlussError::new_err(format!(
+            "Expected {} elements, got {}",
+            target_indices.len(),
+            seq.len()?
+        )));
+    }
+    for (i, &col_idx) in target_indices.iter().enumerate() {
+        let field = &fields[col_idx];
+        let value = seq.get_item(i)?;
+        datums[col_idx] = python_value_to_datum(&value, field.data_type())
+            .map_err(|e| FlussError::new_err(format!("Field '{}': {}", field.name(), e)))?;
+    }
+    Ok(())
 }
 
-/// Convert Python primary key values (dict/list/tuple) to GenericRow.
-/// Only requires PK columns; non-PK columns are filled with Null.
-/// For dict: keys should be PK column names.
-/// For list/tuple: values should be PK values in PK column order.
-pub fn python_pk_to_generic_row(
+/// Build a full-width GenericRow filling only the specified column
+/// indices from user input; all other columns are set to Null.
+pub fn python_to_sparse_generic_row(
     row: &Bound<PyAny>,
     table_info: &fcore::metadata::TableInfo,
+    target_indices: &[usize],
 ) -> PyResult<fcore::row::GenericRow<'static>> {
-    let schema = table_info.get_schema();
     let row_type = table_info.row_type();
     let fields = row_type.fields();
-    let pk_indexes = schema.primary_key_indexes();
-    let pk_names: Vec<&str> = schema.primary_key_column_names();
-
-    if pk_indexes.is_empty() {
-        return Err(FlussError::new_err(
-            "Table has no primary key; cannot use PK-only row",
-        ));
-    }
+    let target_names: Vec<&str> = target_indices.iter().map(|&i| fields[i].name()).collect();
 
-    // Initialize all datums as Null
     let mut datums: Vec<fcore::row::Datum<'static>> = vec![fcore::row::Datum::Null; fields.len()];
 
-    // Extract with user-friendly error message
     let row_input: RowInput = row.extract().map_err(|_| {
         let type_name = row
             .get_type()
@@ -764,13 +691,12 @@ pub fn python_pk_to_generic_row(
             .map(|n| n.to_string())
             .unwrap_or_else(|_| "unknown".to_string());
         FlussError::new_err(format!(
-            "PK row must be a dict, list, or tuple; got {type_name}"
+            "Row must be a dict, list, or tuple; got {type_name}"
         ))
     })?;
 
     match row_input {
         RowInput::Dict(dict) => {
-            // Validate keys are PK columns
             for (k, _) in dict.iter() {
                 let key_str = k.extract::<&str>().map_err(|_| {
                     let key_type = k
@@ -778,64 +704,35 @@ pub fn python_pk_to_generic_row(
                         .name()
                         .map(|n| n.to_string())
                         .unwrap_or_else(|_| "unknown".to_string());
-                    FlussError::new_err(format!("PK dict keys must be strings; got {key_type}"))
+                    FlussError::new_err(format!("Dict keys must be strings; got {key_type}"))
                 })?;
-
-                if !pk_names.contains(&key_str) {
+                if !target_names.contains(&key_str) {
                     return Err(FlussError::new_err(format!(
-                        "Unknown PK field '{}'. Expected PK fields: {}",
+                        "Unknown field '{}'. Expected: {}",
                         key_str,
-                        pk_names.join(", ")
+                        target_names.join(", ")
                     )));
                 }
             }
-
-            // Extract PK values
-            for (i, pk_idx) in pk_indexes.iter().enumerate() {
-                let pk_name = pk_names[i];
-                let field: &fcore::metadata::DataField = &fields[*pk_idx];
+            for (i, &col_idx) in target_indices.iter().enumerate() {
+                let name = target_names[i];
+                let field = &fields[col_idx];
                 let value = dict
-                    .get_item(pk_name)?
-                    .ok_or_else(|| FlussError::new_err(format!("Missing PK field: {pk_name}")))?;
-                datums[*pk_idx] = python_value_to_datum(&value, field.data_type())
-                    .map_err(|e| FlussError::new_err(format!("PK field '{pk_name}': {e}")))?;
+                    .get_item(name)?
+                    .ok_or_else(|| FlussError::new_err(format!("Missing field: {name}")))?;
+                datums[col_idx] = python_value_to_datum(&value, field.data_type())
+                    .map_err(|e| FlussError::new_err(format!("Field '{name}': {e}")))?;
             }
         }
 
         RowInput::List(list) => {
-            if list.len() != pk_indexes.len() {
-                return Err(FlussError::new_err(format!(
-                    "PK list must have {} elements (PK columns), got {}",
-                    pk_indexes.len(),
-                    list.len()
-                )));
-            }
-            for (i, pk_idx) in pk_indexes.iter().enumerate() {
-                let field: &fcore::metadata::DataField = &fields[*pk_idx];
-                let value = list.get_item(i)?;
-                datums[*pk_idx] =
-                    python_value_to_datum(&value, field.data_type()).map_err(|e| {
-                        FlussError::new_err(format!("PK field '{}': {}", field.name(), e))
-                    })?;
-            }
+            let seq = list.as_sequence();
+            process_sequence(seq, target_indices, fields, &mut datums)?;
         }
 
         RowInput::Tuple(tuple) => {
-            if tuple.len() != pk_indexes.len() {
-                return Err(FlussError::new_err(format!(
-                    "PK tuple must have {} elements (PK columns), got {}",
-                    pk_indexes.len(),
-                    tuple.len()
-                )));
-            }
-            for (i, pk_idx) in pk_indexes.iter().enumerate() {
-                let field: &fcore::metadata::DataField = &fields[*pk_idx];
-                let value = tuple.get_item(i)?;
-                datums[*pk_idx] =
-                    python_value_to_datum(&value, field.data_type()).map_err(|e| {
-                        FlussError::new_err(format!("PK field '{}': {}", field.name(), e))
-                    })?;
-            }
+            let seq = tuple.as_sequence();
+            process_sequence(seq, target_indices, fields, &mut datums)?;
         }
     }
 
diff --git a/fluss-rust/bindings/python/src/upsert.rs b/fluss-rust/bindings/python/src/upsert.rs
index 0aa69d747d..745163e3dd 100644
--- a/fluss-rust/bindings/python/src/upsert.rs
+++ b/fluss-rust/bindings/python/src/upsert.rs
@@ -15,7 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::table::{python_pk_to_generic_row, python_to_generic_row};
+use crate::table::{python_to_generic_row, python_to_sparse_generic_row};
 use crate::*;
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::sync::{Arc, Mutex};
@@ -46,6 +46,8 @@ struct UpsertWriterInner {
     /// Lazily initialized writer - created on first write operation
     writer: Mutex<Option<Arc<fcore::client::UpsertWriter>>>,
     table_info: fcore::metadata::TableInfo,
+    /// Column indices for partial updates (None = full row)
+    target_columns: Option<Vec<usize>>,
 }
 
 #[pymethods]
@@ -62,7 +64,11 @@ impl UpsertWriter {
     ///          For dict: keys are column names, values are column values.
     ///          For list/tuple: values must be in schema order.
     pub fn upsert(&self, row: &Bound<'_, PyAny>) -> PyResult<WriteResultHandle> {
-        let generic_row = python_to_generic_row(row, &self.inner.table_info)?;
+        let generic_row = if let Some(target_cols) = &self.inner.target_columns {
+            python_to_sparse_generic_row(row, &self.inner.table_info, target_cols)?
+        } else {
+            python_to_generic_row(row, &self.inner.table_info)?
+        };
 
         let writer = self.inner.get_or_create_writer()?;
         let result_future = writer
@@ -80,7 +86,8 @@ impl UpsertWriter {
     ///         For dict: keys are PK column names.
     ///         For list/tuple: values in PK column order.
     pub fn delete(&self, pk: &Bound<'_, PyAny>) -> PyResult<WriteResultHandle> {
-        let generic_row = python_pk_to_generic_row(pk, &self.inner.table_info)?;
+        let pk_indices = self.inner.table_info.get_schema().primary_key_indexes();
+        let generic_row = python_to_sparse_generic_row(pk, &self.inner.table_info, &pk_indices)?;
 
         let writer = self.inner.get_or_create_writer()?;
         let result_future = writer
@@ -134,15 +141,26 @@ impl UpsertWriter {
         columns: Option<Vec<String>>,
         column_indices: Option<Vec<usize>>,
     ) -> PyResult<Self> {
-        // Apply partial update configuration if specified
-        let table_upsert = if let Some(cols) = columns {
-            let col_refs: Vec<&str> = cols.iter().map(|s| s.as_str()).collect();
-            table_upsert
-                .partial_update_with_column_names(&col_refs)
-                .map_err(|e| FlussError::new_err(e.to_string()))?
-        } else if let Some(indices) = column_indices {
+        // Resolve target column indices (names → indices, or use provided indices directly)
+        let target_columns = if let Some(cols) = columns {
+            let row_type = table_info.row_type();
+            Some(
+                cols.iter()
+                    .map(|name| {
+                        row_type
+                            .get_field_index(name)
+                            .ok_or_else(|| FlussError::new_err(format!("Unknown column: {name}")))
+                    })
+                    .collect::<PyResult<Vec<usize>>>()?,
+            )
+        } else {
+            column_indices
+        };
+
+        // Apply partial update to the Rust core using resolved indices
+        let table_upsert = if let Some(ref indices) = target_columns {
             table_upsert
-                .partial_update(Some(indices))
+                .partial_update(Some(indices.clone()))
                 .map_err(|e| FlussError::new_err(e.to_string()))?
         } else {
             table_upsert
@@ -153,6 +171,7 @@ impl UpsertWriter {
                 table_upsert,
                 writer: Mutex::new(None),
                 table_info,
+                target_columns,
             }),
         })
     }
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 37e9b45b14..62f51b476d 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -22,6 +22,7 @@ use crate::metadata::{TableInfo, TablePath};
 use std::sync::Arc;
 
 pub const EARLIEST_OFFSET: i64 = -2;
+pub const LATEST_OFFSET: i64 = -1;
 
 mod append;
 mod lookup;

From d44898ecf697db1d3cf6e9b9fcb1dab67361a279 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 9 Feb 2026 12:41:14 +0000
Subject: [PATCH 132/287] feat: support kv tables in CPP (#288)

---
 fluss-rust/bindings/cpp/BUILD.bazel           |  33 ++
 fluss-rust/bindings/cpp/CMakeLists.txt        |   6 +
 .../bindings/cpp/examples/admin_example.cpp   |   5 +-
 .../bindings/cpp/examples/kv_example.cpp      | 488 ++++++++++++++++++
 fluss-rust/bindings/cpp/include/fluss.hpp     | 134 ++++-
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |   3 +-
 fluss-rust/bindings/cpp/src/lib.rs            | 295 ++++++++++-
 fluss-rust/bindings/cpp/src/table.cpp         | 235 ++++++++-
 fluss-rust/bindings/cpp/src/types.rs          | 432 +++++++++++-----
 9 files changed, 1483 insertions(+), 148 deletions(-)
 create mode 100644 fluss-rust/bindings/cpp/examples/kv_example.cpp

diff --git a/fluss-rust/bindings/cpp/BUILD.bazel b/fluss-rust/bindings/cpp/BUILD.bazel
index aff8f504fd..0ae2ce329b 100644
--- a/fluss-rust/bindings/cpp/BUILD.bazel
+++ b/fluss-rust/bindings/cpp/BUILD.bazel
@@ -373,3 +373,36 @@ cc_binary(
     visibility = ["//visibility:public"],
 )
 
+# KV-table example binary built from examples/kv_example.cpp and linked against :fluss_cpp.
+# Compile and link flags are picked per build mode through select().
+cc_binary(
+    name = "fluss_cpp_kv_example",
+    srcs = ["examples/kv_example.cpp"],
+    copts = [
+        "-std=c++17",
+    ] + select({
+        ":debug_mode": [
+            "-g3",
+            "-O0",
+            "-ggdb",
+            "-fno-omit-frame-pointer",
+            "-DDEBUG",
+        ],
+        ":fastbuild_mode": [
+            "-g",
+            "-O0",
+        ],
+        ":release_mode": [
+            "-O2",
+            "-DNDEBUG",
+        ],
+    }),
+    linkopts = select({
+        ":debug_mode": ["-g"],
+        ":fastbuild_mode": ["-g"],
+        ":release_mode": [],
+    }),
+    visibility = ["//visibility:public"],
+    deps = [":fluss_cpp"],
+)
+
diff --git a/fluss-rust/bindings/cpp/CMakeLists.txt b/fluss-rust/bindings/cpp/CMakeLists.txt
index ae70842678..05c58ea73d 100644
--- a/fluss-rust/bindings/cpp/CMakeLists.txt
+++ b/fluss-rust/bindings/cpp/CMakeLists.txt
@@ -108,6 +108,12 @@ target_link_libraries(fluss_cpp_admin_example PRIVATE Arrow::arrow_shared)
 target_compile_definitions(fluss_cpp_admin_example PRIVATE ARROW_FOUND)
 target_include_directories(fluss_cpp_admin_example PUBLIC ${CPP_INCLUDE_DIR})
 
+# KV table example binary built from examples/kv_example.cpp.
+add_executable(fluss_cpp_kv_example examples/kv_example.cpp)
+target_link_libraries(fluss_cpp_kv_example PRIVATE fluss_cpp Arrow::arrow_shared)
+target_compile_definitions(fluss_cpp_kv_example PRIVATE ARROW_FOUND)
+target_include_directories(fluss_cpp_kv_example PUBLIC ${CPP_INCLUDE_DIR})
+
 set_target_properties(fluss_cpp
     PROPERTIES ADDITIONAL_CLEAN_FILES ${CARGO_TARGET_DIR}
 )
diff --git a/fluss-rust/bindings/cpp/examples/admin_example.cpp b/fluss-rust/bindings/cpp/examples/admin_example.cpp
index 7b7a333b0e..196fe975d6 100644
--- a/fluss-rust/bindings/cpp/examples/admin_example.cpp
+++ b/fluss-rust/bindings/cpp/examples/admin_example.cpp
@@ -61,9 +61,8 @@ int main() {
 
     fluss::DatabaseInfo db_info;
     check("get_database_info", admin.GetDatabaseInfo(db_name, db_info));
-    std::cout << "Database info: name=" << db_info.database_name
-              << " comment=" << db_info.comment << " created_time=" << db_info.created_time
-              << std::endl;
+    std::cout << "Database info: name=" << db_info.database_name << " comment=" << db_info.comment
+              << " created_time=" << db_info.created_time << std::endl;
 
     std::vector<std::string> databases;
     check("list_databases", admin.ListDatabases(databases));
diff --git a/fluss-rust/bindings/cpp/examples/kv_example.cpp b/fluss-rust/bindings/cpp/examples/kv_example.cpp
new file mode 100644
index 0000000000..daebfb2655
--- /dev/null
+++ b/fluss-rust/bindings/cpp/examples/kv_example.cpp
@@ -0,0 +1,488 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#include <cstdlib>
+#include <iostream>
+#include <string>
+#include <vector>
+
+#include "fluss.hpp"
+
+static void check(const char* step, const fluss::Result& r) {  // abort the example on error
+    if (r.Ok()) return;
+    std::cerr << step << " failed: code=" << r.error_code << " msg=" << r.error_message
+              << std::endl;
+    std::exit(1);  // declared in <cstdlib>
+}
+
+int main() {  // end-to-end KV table walkthrough against the server at `bootstrap`
+    const std::string bootstrap = "127.0.0.1:9123";
+
+    // 1) Connect and get Admin
+    fluss::Connection conn;
+    check("connect", fluss::Connection::Connect(bootstrap, conn));
+
+    fluss::Admin admin;
+    check("get_admin", conn.GetAdmin(admin));
+
+    fluss::TablePath kv_table_path("fluss", "kv_table_cpp_v1");
+
+    // Drop any table left over from a previous run (the returned Result is not checked)
+    admin.DropTable(kv_table_path, true);
+
+    // 2) Create a KV table with primary key, including decimal and temporal types
+    auto kv_schema = fluss::Schema::NewBuilder()
+                         .AddColumn("user_id", fluss::DataType::Int())
+                         .AddColumn("name", fluss::DataType::String())
+                         .AddColumn("email", fluss::DataType::String())
+                         .AddColumn("score", fluss::DataType::Float())
+                         .AddColumn("balance", fluss::DataType::Decimal(10, 2))
+                         .AddColumn("birth_date", fluss::DataType::Date())
+                         .AddColumn("login_time", fluss::DataType::Time())
+                         .AddColumn("created_at", fluss::DataType::Timestamp())
+                         .AddColumn("last_seen", fluss::DataType::TimestampLtz())
+                         .SetPrimaryKeys({"user_id"})
+                         .Build();
+
+    auto kv_descriptor = fluss::TableDescriptor::NewBuilder()
+                             .SetSchema(kv_schema)
+                             .SetBucketCount(3)
+                             .SetComment("cpp kv table example")
+                             .Build();
+
+    check("create_kv_table", admin.CreateTable(kv_table_path, kv_descriptor, false));
+    std::cout << "Created KV table with primary key" << std::endl;
+
+    fluss::Table kv_table;
+    check("get_kv_table", conn.GetTable(kv_table_path, kv_table));
+
+    // 3) Upsert rows using name-based Set()
+    //    - Set("balance", "1234.56") auto-routes to SetDecimal (schema-aware)
+    //    - Set("created_at", ts) auto-routes to SetTimestampNtz (schema-aware)
+    //    - Set("last_seen", ts) auto-routes to SetTimestampLtz (schema-aware)
+    std::cout << "\n--- Upsert Rows ---" << std::endl;
+    fluss::UpsertWriter upsert_writer;
+    check("new_upsert_writer", kv_table.NewUpsertWriter(upsert_writer));
+
+    // Fire-and-forget upserts: no WriteResult is requested; Flush() is called after all three rows
+    {
+        auto row = kv_table.NewRow();
+        row.Set("user_id", 1);
+        row.Set("name", "Alice");
+        row.Set("email", "alice@example.com");
+        row.Set("score", 95.5f);
+        row.Set("balance", "1234.56");
+        row.Set("birth_date", fluss::Date::FromYMD(1990, 3, 15));
+        row.Set("login_time", fluss::Time::FromHMS(9, 30, 0));
+        row.Set("created_at", fluss::Timestamp::FromMillis(1700000000000));
+        row.Set("last_seen", fluss::Timestamp::FromMillis(1700000060000));
+        check("upsert_1", upsert_writer.Upsert(row));
+    }
+    {
+        auto row = kv_table.NewRow();
+        row.Set("user_id", 2);
+        row.Set("name", "Bob");
+        row.Set("email", "bob@example.com");
+        row.Set("score", 87.3f);
+        row.Set("balance", "567.89");
+        row.Set("birth_date", fluss::Date::FromYMD(1985, 7, 22));
+        row.Set("login_time", fluss::Time::FromHMS(14, 15, 30));
+        row.Set("created_at", fluss::Timestamp::FromMillis(1700000100000));
+        row.Set("last_seen", fluss::Timestamp::FromMillis(1700000200000));
+        check("upsert_2", upsert_writer.Upsert(row));
+    }
+
+    // Per-record acknowledgment: request a WriteResult and Wait() on it before continuing
+    {
+        auto row = kv_table.NewRow();
+        row.Set("user_id", 3);
+        row.Set("name", "Charlie");
+        row.Set("email", "charlie@example.com");
+        row.Set("score", 92.0f);
+        row.Set("balance", "99999.99");
+        row.Set("birth_date", fluss::Date::FromYMD(2000, 1, 1));
+        row.Set("login_time", fluss::Time::FromHMS(23, 59, 59));
+        row.Set("created_at", fluss::Timestamp::FromMillis(1700000300000));
+        row.Set("last_seen", fluss::Timestamp::FromMillis(1700000400000));
+        fluss::WriteResult wr;
+        check("upsert_3", upsert_writer.Upsert(row, wr));
+        check("upsert_3_wait", wr.Wait());
+        std::cout << "Upsert acknowledged by server" << std::endl;
+    }
+
+    check("upsert_flush", upsert_writer.Flush());
+    std::cout << "Upserted 3 rows" << std::endl;
+
+    // 4) Lookup by primary key — verify all types round-trip
+    std::cout << "\n--- Lookup by Primary Key ---" << std::endl;
+    fluss::Lookuper lookuper;
+    check("new_lookuper", kv_table.NewLookuper(lookuper));
+
+    // Lookup existing key
+    {
+        auto pk_row = kv_table.NewRow();
+        pk_row.Set("user_id", 1);
+
+        bool found = false;
+        fluss::GenericRow result_row;
+        check("lookup_1", lookuper.Lookup(pk_row, found, result_row));
+        if (found) {
+            auto date = result_row.GetDate(5);
+            auto time = result_row.GetTime(6);
+            auto created = result_row.GetTimestamp(7);
+            auto seen = result_row.GetTimestamp(8);
+            std::cout << "Found user_id=1:"
+                      << "\n  name=" << result_row.GetString(1)
+                      << "\n  email=" << result_row.GetString(2)
+                      << "\n  score=" << result_row.GetFloat32(3)
+                      << "\n  balance=" << result_row.DecimalToString(4)
+                      << "\n  birth_date=" << date.Year() << "-" << date.Month() << "-"
+                      << date.Day() << "\n  login_time=" << time.Hour() << ":" << time.Minute()
+                      << ":" << time.Second() << "\n  created_at(ms)=" << created.epoch_millis
+                      << "\n  last_seen(ms)=" << seen.epoch_millis << std::endl;
+        } else {
+            std::cerr << "ERROR: Expected to find user_id=1" << std::endl;
+            std::exit(1);
+        }
+    }
+
+    // Lookup non-existing key
+    {
+        auto pk_row = kv_table.NewRow();
+        pk_row.Set("user_id", 999);
+
+        bool found = false;
+        fluss::GenericRow result_row;
+        check("lookup_999", lookuper.Lookup(pk_row, found, result_row));
+        if (!found) {
+            std::cout << "user_id=999 not found (expected)" << std::endl;
+        } else {
+            std::cerr << "ERROR: Expected user_id=999 to not be found" << std::endl;
+            std::exit(1);
+        }
+    }
+
+    // 5) Update via upsert (overwrite existing key)
+    std::cout << "\n--- Update via Upsert ---" << std::endl;
+    {
+        auto row = kv_table.NewRow();
+        row.Set("user_id", 1);
+        row.Set("name", "Alice Updated");
+        row.Set("email", "alice.new@example.com");
+        row.Set("score", 99.0f);
+        row.Set("balance", "9999.00");
+        row.Set("birth_date", fluss::Date::FromYMD(1990, 3, 15));
+        row.Set("login_time", fluss::Time::FromHMS(10, 0, 0));
+        row.Set("created_at", fluss::Timestamp::FromMillis(1700000000000));
+        row.Set("last_seen", fluss::Timestamp::FromMillis(1700000500000));
+        fluss::WriteResult wr;
+        check("upsert_update", upsert_writer.Upsert(row, wr));
+        check("upsert_update_wait", wr.Wait());
+    }
+
+    // Verify update
+    {
+        auto pk_row = kv_table.NewRow();
+        pk_row.Set("user_id", 1);
+
+        bool found = false;
+        fluss::GenericRow result_row;
+        check("lookup_updated", lookuper.Lookup(pk_row, found, result_row));
+        if (found && result_row.GetString(1) == "Alice Updated") {
+            std::cout << "Update verified: name=" << result_row.GetString(1)
+                      << " balance=" << result_row.DecimalToString(4)
+                      << " last_seen(ms)=" << result_row.GetTimestamp(8).epoch_millis << std::endl;
+        } else {
+            std::cerr << "ERROR: Update verification failed" << std::endl;
+            std::exit(1);
+        }
+    }
+
+    // 6) Delete by primary key
+    std::cout << "\n--- Delete by Primary Key ---" << std::endl;
+    {
+        auto pk_row = kv_table.NewRow();
+        pk_row.Set("user_id", 2);
+        fluss::WriteResult wr;
+        check("delete_2", upsert_writer.Delete(pk_row, wr));
+        check("delete_2_wait", wr.Wait());
+        std::cout << "Deleted user_id=2" << std::endl;
+    }
+
+    // Verify deletion
+    {
+        auto pk_row = kv_table.NewRow();
+        pk_row.Set("user_id", 2);
+
+        bool found = false;
+        fluss::GenericRow result_row;
+        check("lookup_deleted", lookuper.Lookup(pk_row, found, result_row));
+        if (!found) {
+            std::cout << "Delete verified: user_id=2 not found" << std::endl;
+        } else {
+            std::cerr << "ERROR: Expected user_id=2 to be deleted" << std::endl;
+            std::exit(1);
+        }
+    }
+
+    // 7) Partial update by column names
+    std::cout << "\n--- Partial Update by Column Names ---" << std::endl;
+    fluss::UpsertWriter partial_writer;
+    check("new_partial_upsert_writer",
+          kv_table.NewUpsertWriter(partial_writer,
+                                   std::vector<std::string>{"user_id", "balance", "last_seen"}));
+
+    {
+        auto row = kv_table.NewRow();
+        row.Set("user_id", 3);
+        row.Set("balance", "50000.00");
+        row.Set("last_seen", fluss::Timestamp::FromMillis(1700000999000));
+        fluss::WriteResult wr;
+        check("partial_upsert", partial_writer.Upsert(row, wr));
+        check("partial_upsert_wait", wr.Wait());
+        std::cout << "Partial update: set balance=50000.00, last_seen for user_id=3" << std::endl;
+    }
+
+    // Read back after the partial update (values are printed for inspection, not asserted)
+    {
+        auto pk_row = kv_table.NewRow();
+        pk_row.Set("user_id", 3);
+
+        bool found = false;
+        fluss::GenericRow result_row;
+        check("lookup_partial", lookuper.Lookup(pk_row, found, result_row));
+        if (found) {
+            std::cout << "Partial update verified:"
+                      << "\n  name=" << result_row.GetString(1) << " (unchanged)"
+                      << "\n  balance=" << result_row.DecimalToString(4) << " (updated)"
+                      << "\n  last_seen(ms)=" << result_row.GetTimestamp(8).epoch_millis
+                      << " (updated)" << std::endl;
+        } else {
+            std::cerr << "ERROR: Expected to find user_id=3" << std::endl;
+            std::exit(1);
+        }
+    }
+
+    // 8) Partial update by column indices (using index-based setters for lower overhead)
+    std::cout << "\n--- Partial Update by Column Indices ---" << std::endl;
+    fluss::UpsertWriter partial_writer_idx;
+    // Columns: 0=user_id (PK), 1=name — update name only
+    check("new_partial_upsert_writer_idx",
+          kv_table.NewUpsertWriter(partial_writer_idx, std::vector<size_t>{0, 1}));
+
+    {
+        // Index-based setters: lighter than name-based, useful for hot paths
+        fluss::GenericRow row;
+        row.SetInt32(0, 3);                   // user_id (PK)
+        row.SetString(1, "Charlie Updated");  // name
+        fluss::WriteResult wr;
+        check("partial_upsert_idx", partial_writer_idx.Upsert(row, wr));
+        check("partial_upsert_idx_wait", wr.Wait());
+        std::cout << "Partial update by indices: set name='Charlie Updated' for user_id=3"
+                  << std::endl;
+    }
+
+    // Read back: expect new name, balance/last_seen as left by step 7 (printed, not asserted)
+    {
+        auto pk_row = kv_table.NewRow();
+        pk_row.Set("user_id", 3);
+
+        bool found = false;
+        fluss::GenericRow result_row;
+        check("lookup_partial_idx", lookuper.Lookup(pk_row, found, result_row));
+        if (found) {
+            std::cout << "Partial update by indices verified:"
+                      << "\n  name=" << result_row.GetString(1) << " (updated)"
+                      << "\n  balance=" << result_row.DecimalToString(4) << " (unchanged)"
+                      << "\n  last_seen(ms)=" << result_row.GetTimestamp(8).epoch_millis
+                      << " (unchanged)" << std::endl;
+        } else {
+            std::cerr << "ERROR: Expected to find user_id=3" << std::endl;
+            std::exit(1);
+        }
+    }
+
+    // Cleanup: drop the first table before the partitioned scenario
+    check("drop_kv_table", admin.DropTable(kv_table_path, true));
+
+    // 9) Partitioned KV table
+    std::cout << "\n--- Partitioned KV Table ---" << std::endl;
+    fluss::TablePath part_kv_path("fluss", "partitioned_kv_cpp_v1");
+    admin.DropTable(part_kv_path, true);
+
+    auto part_kv_schema = fluss::Schema::NewBuilder()
+                              .AddColumn("region", fluss::DataType::String())
+                              .AddColumn("user_id", fluss::DataType::Int())
+                              .AddColumn("name", fluss::DataType::String())
+                              .AddColumn("score", fluss::DataType::BigInt())
+                              .SetPrimaryKeys({"region", "user_id"})
+                              .Build();
+
+    auto part_kv_descriptor = fluss::TableDescriptor::NewBuilder()
+                                  .SetSchema(part_kv_schema)
+                                  .SetPartitionKeys({"region"})
+                                  .SetComment("partitioned kv table example")
+                                  .Build();
+
+    check("create_part_kv", admin.CreateTable(part_kv_path, part_kv_descriptor, false));
+    std::cout << "Created partitioned KV table" << std::endl;
+
+    // Create partitions
+    check("create_US", admin.CreatePartition(part_kv_path, {{"region", "US"}}));
+    check("create_EU", admin.CreatePartition(part_kv_path, {{"region", "EU"}}));
+    check("create_APAC", admin.CreatePartition(part_kv_path, {{"region", "APAC"}}));
+    std::cout << "Created partitions: US, EU, APAC" << std::endl;
+
+    fluss::Table part_kv_table;
+    check("get_part_kv_table", conn.GetTable(part_kv_path, part_kv_table));
+
+    fluss::UpsertWriter part_writer;
+    check("new_part_writer", part_kv_table.NewUpsertWriter(part_writer));
+
+    // Upsert rows across partitions
+    struct TestRow {
+        const char* region;
+        int32_t user_id;
+        const char* name;
+        int64_t score;
+    };
+    TestRow test_data[] = {
+        {"US", 1, "Gustave", 100}, {"US", 2, "Lune", 200},   {"EU", 1, "Sciel", 150},
+        {"EU", 2, "Maelle", 250},  {"APAC", 1, "Noco", 300},
+    };
+
+    for (const auto& td : test_data) {
+        auto row = part_kv_table.NewRow();
+        row.Set("region", td.region);
+        row.Set("user_id", td.user_id);
+        row.Set("name", td.name);
+        row.Set("score", td.score);
+        check("part_upsert", part_writer.Upsert(row));
+    }
+    check("part_flush", part_writer.Flush());
+    std::cout << "Upserted 5 rows across 3 partitions" << std::endl;
+
+    // Look up every upserted row and compare name/score with test_data
+    fluss::Lookuper part_lookuper;
+    check("new_part_lookuper", part_kv_table.NewLookuper(part_lookuper));
+
+    for (const auto& td : test_data) {
+        auto pk = part_kv_table.NewRow();
+        pk.Set("region", td.region);
+        pk.Set("user_id", td.user_id);
+
+        bool found = false;
+        fluss::GenericRow result;
+        check("part_lookup", part_lookuper.Lookup(pk, found, result));
+        if (!found) {
+            std::cerr << "ERROR: Expected to find region=" << td.region << " user_id=" << td.user_id
+                      << std::endl;
+            std::exit(1);
+        }
+        if (result.GetString(2) != td.name || result.GetInt64(3) != td.score) {
+            std::cerr << "ERROR: Data mismatch for region=" << td.region
+                      << " user_id=" << td.user_id << std::endl;
+            std::exit(1);
+        }
+    }
+    std::cout << "All 5 rows verified across partitions" << std::endl;
+
+    // Update within a partition
+    {
+        auto row = part_kv_table.NewRow();
+        row.Set("region", "US");
+        row.Set("user_id", 1);
+        row.Set("name", "Gustave Updated");
+        row.Set("score", static_cast<int64_t>(999));
+        fluss::WriteResult wr;
+        check("part_update", part_writer.Upsert(row, wr));
+        check("part_update_wait", wr.Wait());
+    }
+    {
+        auto pk = part_kv_table.NewRow();
+        pk.Set("region", "US");
+        pk.Set("user_id", 1);
+        bool found = false;
+        fluss::GenericRow result;
+        check("part_lookup_updated", part_lookuper.Lookup(pk, found, result));
+        if (!found || result.GetString(2) != "Gustave Updated" || result.GetInt64(3) != 999) {
+            std::cerr << "ERROR: Partition update verification failed" << std::endl;
+            std::exit(1);
+        }
+        std::cout << "Update verified: US/1 name=" << result.GetString(2)
+                  << " score=" << result.GetInt64(3) << std::endl;
+    }
+
+    // Lookup in non-existent partition
+    {
+        auto pk = part_kv_table.NewRow();
+        pk.Set("region", "UNKNOWN");
+        pk.Set("user_id", 1);
+        bool found = false;
+        fluss::GenericRow result;
+        check("part_lookup_unknown", part_lookuper.Lookup(pk, found, result));
+        if (found) {
+            std::cerr << "ERROR: Expected UNKNOWN partition lookup to return not found"
+                      << std::endl;
+            std::exit(1);
+        }
+        std::cout << "UNKNOWN partition lookup: not found (expected)" << std::endl;
+    }
+
+    // Delete within a partition
+    {
+        auto pk = part_kv_table.NewRow();
+        pk.Set("region", "EU");
+        pk.Set("user_id", 1);
+        fluss::WriteResult wr;
+        check("part_delete", part_writer.Delete(pk, wr));
+        check("part_delete_wait", wr.Wait());
+    }
+    {
+        auto pk = part_kv_table.NewRow();
+        pk.Set("region", "EU");
+        pk.Set("user_id", 1);
+        bool found = false;
+        fluss::GenericRow result;
+        check("part_lookup_deleted", part_lookuper.Lookup(pk, found, result));
+        if (found) {
+            std::cerr << "ERROR: Expected EU/1 to be deleted" << std::endl;
+            std::exit(1);
+        }
+        std::cout << "Delete verified: EU/1 not found" << std::endl;
+    }
+
+    // Verify other record in same partition still exists
+    {
+        auto pk = part_kv_table.NewRow();
+        pk.Set("region", "EU");
+        pk.Set("user_id", 2);
+        bool found = false;
+        fluss::GenericRow result;
+        check("part_lookup_eu2", part_lookuper.Lookup(pk, found, result));
+        if (!found || result.GetString(2) != "Maelle") {
+            std::cerr << "ERROR: Expected EU/2 (Maelle) to still exist" << std::endl;
+            std::exit(1);
+        }
+        std::cout << "EU/2 still exists: name=" << result.GetString(2) << std::endl;
+    }
+
+    check("drop_part_kv", admin.DropTable(part_kv_path, true));
+    std::cout << "\nKV table example completed successfully!" << std::endl;
+
+    return 0;
+}
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 50dffaefa1..c635c81adf 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -41,6 +41,8 @@ struct Table;
 struct AppendWriter;
 struct WriteResult;
 struct LogScanner;
+struct UpsertWriter;
+struct Lookuper;
 }  // namespace ffi
 
 struct Date {
@@ -490,6 +492,7 @@ struct GenericRow {
 
     size_t FieldCount() const { return fields.size(); }
 
+    // ── Index-based getters ──────────────────────────────────────────
     DatumType GetType(size_t idx) const { return GetField(idx).GetType(); }
     bool IsNull(size_t idx) const { return GetField(idx).IsNull(); }
     bool GetBool(size_t idx) const { return GetTypedField(idx, DatumType::Bool).GetBool(); }
@@ -528,6 +531,7 @@ struct GenericRow {
         return d.DecimalToString();
     }
 
+    // ── Index-based setters ──────────────────────────────────────────
     void SetNull(size_t idx) {
         EnsureSize(idx);
         fields[idx] = Datum::Null();
@@ -593,8 +597,77 @@ struct GenericRow {
         fields[idx] = Datum::DecimalString(value);
     }
 
+    // ── Name-based setters (throw std::runtime_error without a schema — use Table::NewRow()) ───
+    void Set(const std::string& name, std::nullptr_t) { SetNull(Resolve(name)); }
+    void Set(const std::string& name, bool v) { SetBool(Resolve(name), v); }
+    void Set(const std::string& name, int32_t v) { SetInt32(Resolve(name), v); }
+    void Set(const std::string& name, int64_t v) { SetInt64(Resolve(name), v); }
+    void Set(const std::string& name, float v) { SetFloat32(Resolve(name), v); }
+    void Set(const std::string& name, double v) { SetFloat64(Resolve(name), v); }
+    // const char* overload to prevent "string literal" → bool conversion.
+    // A null pointer is rejected with std::runtime_error: building a std::string from nullptr
+    // is undefined behavior, and Set(name, nullptr) already exists for writing NULL.
+    void Set(const std::string& name, const char* v) {
+        if (v == nullptr) {
+            throw std::runtime_error("GenericRow::Set: null const char* passed for column '" +
+                                     name + "'; use Set(name, nullptr) to write NULL");
+        }
+        // Forward to the std::string overload, which routes to SetDecimal or SetString by
+        // schema type and throws for any other column type.
+        Set(name, std::string(v));
+    }
+    void Set(const std::string& name, std::string v) {
+        const auto [pos, kind] = ResolveColumn(name);  // throws if the column cannot be resolved
+        if (kind == TypeId::String) {
+            SetString(pos, std::move(v));  // v is our own by-value copy, so hand it over
+        } else if (kind == TypeId::Decimal) {
+            SetDecimal(pos, v);
+        } else {
+            throw std::runtime_error("GenericRow::Set: column '" + name +
+                                     "' is not a string or decimal column");
+        }
+    }
+    void Set(const std::string& name, std::vector<uint8_t> v) {
+        SetBytes(Resolve(name), std::move(v));
+    }
+    void Set(const std::string& name, fluss::Date d) { SetDate(Resolve(name), d); }
+    void Set(const std::string& name, fluss::Time t) { SetTime(Resolve(name), t); }
+    void Set(const std::string& name, fluss::Timestamp ts) {
+        const ColumnInfo& col = ResolveColumn(name);  // throws if the column cannot be resolved
+        if (col.type_id == TypeId::Timestamp) {
+            SetTimestampNtz(col.index, ts);
+        } else if (col.type_id == TypeId::TimestampLtz) {
+            SetTimestampLtz(col.index, ts);
+        } else {
+            throw std::runtime_error("GenericRow::Set: column '" + name +
+                                     "' is not a timestamp column");
+        }
+    }
+
    private:
+    friend class Table;
+    struct ColumnInfo {
+        size_t index;    // position passed to the index-based setters
+        TypeId type_id;  // schema type, used by Set() to pick the matching typed setter
+    };
+    using ColumnMap = std::unordered_map<std::string, ColumnInfo>;
     std::vector<Datum> fields;
+    std::shared_ptr<ColumnMap> column_map_;
+
+    size_t Resolve(const std::string& name) const { return ResolveColumn(name).index; }
+
+    // Looks up `name` in the schema map; throws std::runtime_error when the row has no schema
+    // or the column is unknown. The returned reference points into *column_map_.
+    const ColumnInfo& ResolveColumn(const std::string& name) const {
+        if (column_map_ == nullptr) {
+            throw std::runtime_error(
+                "GenericRow: name-based Set() requires a schema. "
+                "Use Table::NewRow() to create a schema-aware row.");
+        }
+        const auto entry = column_map_->find(name);
+        if (entry != column_map_->end()) return entry->second;
+        throw std::runtime_error("GenericRow: unknown column '" + name + "'");
+    }
 
     const Datum& GetField(size_t idx) const {
         if (idx >= fields.size()) {
@@ -725,6 +798,8 @@ struct DatabaseInfo {
 };
 
 class AppendWriter;
+class UpsertWriter;
+class Lookuper;
 class WriteResult;
 class LogScanner;
 class Admin;
@@ -792,8 +867,7 @@ class Admin {
                          const std::unordered_map<std::string, std::string>& partition_spec,
                          bool ignore_if_not_exists = false);
 
-    Result CreateDatabase(const std::string& database_name,
-                          const DatabaseDescriptor& descriptor,
+    Result CreateDatabase(const std::string& database_name, const DatabaseDescriptor& descriptor,
                           bool ignore_if_exists = false);
 
     Result DropDatabase(const std::string& database_name, bool ignore_if_not_exists = false,
@@ -833,7 +907,13 @@ class Table {
 
     bool Available() const;
 
+    GenericRow NewRow() const;
+
     Result NewAppendWriter(AppendWriter& out);
+    Result NewUpsertWriter(UpsertWriter& out);
+    Result NewUpsertWriter(UpsertWriter& out, const std::vector<std::string>& column_names);
+    Result NewUpsertWriter(UpsertWriter& out, const std::vector<size_t>& column_indices);
+    Result NewLookuper(Lookuper& out);
     TableScan NewScan();
 
     TableInfo GetTableInfo() const;
@@ -846,7 +926,10 @@ class Table {
     Table(ffi::Table* table) noexcept;
 
     void Destroy() noexcept;
+    const std::shared_ptr<GenericRow::ColumnMap>& GetColumnMap() const;
+
     ffi::Table* table_{nullptr};
+    mutable std::shared_ptr<GenericRow::ColumnMap> column_map_;
 };
 
 class TableScan {
@@ -887,6 +970,7 @@ class WriteResult {
 
    private:
     friend class AppendWriter;
+    friend class UpsertWriter;
     WriteResult(ffi::WriteResult* inner) noexcept;
 
     void Destroy() noexcept;
@@ -917,6 +1001,52 @@ class AppendWriter {
     ffi::AppendWriter* writer_{nullptr};
 };
 
+class UpsertWriter {
+   public:
+    UpsertWriter() noexcept;
+    ~UpsertWriter() noexcept;
+
+    UpsertWriter(const UpsertWriter&) = delete;
+    UpsertWriter& operator=(const UpsertWriter&) = delete;
+    UpsertWriter(UpsertWriter&& other) noexcept;
+    UpsertWriter& operator=(UpsertWriter&& other) noexcept;
+
+    bool Available() const;
+
+    Result Upsert(const GenericRow& row);
+    Result Upsert(const GenericRow& row, WriteResult& out);
+    Result Delete(const GenericRow& row);
+    Result Delete(const GenericRow& row, WriteResult& out);
+    Result Flush();
+
+   private:
+    friend class Table;
+    UpsertWriter(ffi::UpsertWriter* writer) noexcept;
+    void Destroy() noexcept;
+    ffi::UpsertWriter* writer_{nullptr};
+};
+
+class Lookuper {
+   public:
+    Lookuper() noexcept;
+    ~Lookuper() noexcept;
+
+    Lookuper(const Lookuper&) = delete;
+    Lookuper& operator=(const Lookuper&) = delete;
+    Lookuper(Lookuper&& other) noexcept;
+    Lookuper& operator=(Lookuper&& other) noexcept;
+
+    bool Available() const;
+
+    Result Lookup(const GenericRow& pk_row, bool& found, GenericRow& out);
+
+   private:
+    friend class Table;
+    Lookuper(ffi::Lookuper* lookuper) noexcept;
+    void Destroy() noexcept;
+    ffi::Lookuper* lookuper_{nullptr};
+};
+
 class LogScanner {
    public:
     LogScanner() noexcept;
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 8fc8415543..40676e57df 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -290,8 +290,7 @@ inline LakeSnapshot from_ffi_lake_snapshot(const ffi::FfiLakeSnapshot& ffi_snaps
     return snapshot;
 }
 
-inline ffi::FfiDatabaseDescriptor to_ffi_database_descriptor(
-    const DatabaseDescriptor& desc) {
+inline ffi::FfiDatabaseDescriptor to_ffi_database_descriptor(const DatabaseDescriptor& desc) {
     ffi::FfiDatabaseDescriptor ffi_desc;
     ffi_desc.comment = rust::String(desc.comment);
     for (const auto& [k, v] : desc.properties) {
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 5f3e7e96dd..ee7f1d8fdb 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -182,6 +182,12 @@ mod ffi {
         bucket_offsets: Vec<FfiBucketOffsetPair>,
     }
 
+    struct FfiLookupResult {
+        result: FfiResult,
+        found: bool,
+        row: FfiGenericRow,
+    }
+
     struct FfiLakeSnapshotResult {
         result: FfiResult,
         lake_snapshot: FfiLakeSnapshot,
@@ -242,6 +248,8 @@ mod ffi {
         type AppendWriter;
         type WriteResult;
         type LogScanner;
+        type UpsertWriter;
+        type Lookuper;
 
         // Connection
         fn new_connection(bootstrap_server: &str) -> Result<*mut Connection>;
@@ -330,6 +338,16 @@ mod ffi {
         fn get_table_info_from_table(self: &Table) -> FfiTableInfo;
         fn get_table_path(self: &Table) -> FfiTablePath;
         fn has_primary_key(self: &Table) -> bool;
+        fn new_upsert_writer(self: &Table) -> Result<*mut UpsertWriter>;
+        fn new_upsert_writer_with_column_names(
+            self: &Table,
+            column_names: Vec<String>,
+        ) -> Result<*mut UpsertWriter>;
+        fn new_upsert_writer_with_column_indices(
+            self: &Table,
+            column_indices: Vec<usize>,
+        ) -> Result<*mut UpsertWriter>;
+        fn new_lookuper(self: &Table) -> Result<*mut Lookuper>;
 
         // AppendWriter
         unsafe fn delete_append_writer(writer: *mut AppendWriter);
@@ -339,6 +357,16 @@ mod ffi {
         // WriteResult — dropped automatically via rust::Box, or call wait() for ack
         fn wait(self: &mut WriteResult) -> FfiResult;
 
+        // UpsertWriter
+        unsafe fn delete_upsert_writer(writer: *mut UpsertWriter);
+        fn upsert(self: &mut UpsertWriter, row: &FfiGenericRow) -> Result<Box<WriteResult>>;
+        fn delete_row(self: &mut UpsertWriter, row: &FfiGenericRow) -> Result<Box<WriteResult>>;
+        fn upsert_flush(self: &mut UpsertWriter) -> FfiResult;
+
+        // Lookuper
+        unsafe fn delete_lookuper(lookuper: *mut Lookuper);
+        fn lookup(self: &mut Lookuper, pk_row: &FfiGenericRow) -> FfiLookupResult;
+
         // LogScanner
         unsafe fn delete_log_scanner(scanner: *mut LogScanner);
         fn subscribe(self: &LogScanner, bucket_id: i32, start_offset: i64) -> FfiResult;
@@ -399,6 +427,16 @@ pub struct LogScanner {
     projected_columns: Vec<fcore::metadata::Column>,
 }
 
+pub struct UpsertWriter {
+    inner: fcore::client::UpsertWriter,
+    table_info: fcore::metadata::TableInfo,
+}
+
+pub struct Lookuper {
+    inner: fcore::client::Lookuper,
+    table_info: fcore::metadata::TableInfo,
+}
+
 fn ok_result() -> ffi::FfiResult {
     ffi::FfiResult {
         error_code: 0,
@@ -1045,6 +1083,113 @@ impl Table {
     fn has_primary_key(&self) -> bool {
         self.has_pk
     }
+
+    fn new_upsert_writer(&self) -> Result<*mut UpsertWriter, String> {
+        let _enter = RUNTIME.enter();
+
+        let fluss_table = fcore::client::FlussTable::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        );
+
+        let table_upsert = fluss_table
+            .new_upsert()
+            .map_err(|e| format!("Failed to create upsert: {e}"))?;
+
+        let writer = table_upsert
+            .create_writer()
+            .map_err(|e| format!("Failed to create upsert writer: {e}"))?;
+
+        Ok(Box::into_raw(Box::new(UpsertWriter {
+            inner: writer,
+            table_info: self.table_info.clone(),
+        })))
+    }
+
+    fn new_upsert_writer_with_column_names(
+        &self,
+        column_names: Vec<String>,
+    ) -> Result<*mut UpsertWriter, String> {
+        let _enter = RUNTIME.enter();
+
+        let fluss_table = fcore::client::FlussTable::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        );
+
+        let table_upsert = fluss_table
+            .new_upsert()
+            .map_err(|e| format!("Failed to create upsert: {e}"))?;
+
+        let col_refs: Vec<&str> = column_names.iter().map(|s| s.as_str()).collect();
+        let table_upsert = table_upsert
+            .partial_update_with_column_names(&col_refs)
+            .map_err(|e| format!("Failed to set partial update columns: {e}"))?;
+
+        let writer = table_upsert
+            .create_writer()
+            .map_err(|e| format!("Failed to create upsert writer: {e}"))?;
+
+        Ok(Box::into_raw(Box::new(UpsertWriter {
+            inner: writer,
+            table_info: self.table_info.clone(),
+        })))
+    }
+
+    fn new_upsert_writer_with_column_indices(
+        &self,
+        column_indices: Vec<usize>,
+    ) -> Result<*mut UpsertWriter, String> {
+        let _enter = RUNTIME.enter();
+
+        let fluss_table = fcore::client::FlussTable::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        );
+
+        let table_upsert = fluss_table
+            .new_upsert()
+            .map_err(|e| format!("Failed to create upsert: {e}"))?;
+
+        let table_upsert = table_upsert
+            .partial_update(Some(column_indices))
+            .map_err(|e| format!("Failed to set partial update columns: {e}"))?;
+
+        let writer = table_upsert
+            .create_writer()
+            .map_err(|e| format!("Failed to create upsert writer: {e}"))?;
+
+        Ok(Box::into_raw(Box::new(UpsertWriter {
+            inner: writer,
+            table_info: self.table_info.clone(),
+        })))
+    }
+
+    fn new_lookuper(&self) -> Result<*mut Lookuper, String> {
+        let _enter = RUNTIME.enter();
+
+        let fluss_table = fcore::client::FlussTable::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        );
+
+        let table_lookup = fluss_table
+            .new_lookup()
+            .map_err(|e| format!("Failed to create lookup: {e}"))?;
+
+        let lookuper = table_lookup
+            .create_lookuper()
+            .map_err(|e| format!("Failed to create lookuper: {e}"))?;
+
+        Ok(Box::into_raw(Box::new(Lookuper {
+            inner: lookuper,
+            table_info: self.table_info.clone(),
+        })))
+    }
 }
 
 // AppendWriter implementation
@@ -1095,6 +1240,137 @@ impl WriteResult {
     }
 }
 
+// UpsertWriter implementation
+unsafe fn delete_upsert_writer(writer: *mut UpsertWriter) {
+    if !writer.is_null() {
+        unsafe {
+            drop(Box::from_raw(writer));
+        }
+    }
+}
+
+impl UpsertWriter {
+    /// Pads `row` with trailing `Datum::Null`s up to the schema's column count, so callers
+    /// only need to set the leading fields they care about; wider rows are returned unchanged.
+    fn pad_row<'a>(&self, mut row: fcore::row::GenericRow<'a>) -> fcore::row::GenericRow<'a> {
+        let num_columns = self.table_info.get_schema().columns().len();
+        if row.values.len() < num_columns {
+            row.values.resize(num_columns, fcore::row::Datum::Null);
+        }
+        row
+    }
+
+    fn upsert(&mut self, row: &ffi::FfiGenericRow) -> Result<Box<WriteResult>, String> {
+        let schema = self.table_info.get_schema();
+        let generic_row = types::ffi_row_to_core(row, Some(schema)).map_err(|e| e.to_string())?;
+        let generic_row = self.pad_row(generic_row);
+
+        let result_future = self
+            .inner
+            .upsert(&generic_row)
+            .map_err(|e| format!("Failed to upsert: {e}"))?;
+
+        Ok(Box::new(WriteResult {
+            inner: Some(result_future),
+        }))
+    }
+
+    fn delete_row(&mut self, row: &ffi::FfiGenericRow) -> Result<Box<WriteResult>, String> {
+        let schema = self.table_info.get_schema();
+        let generic_row = types::ffi_row_to_core(row, Some(schema)).map_err(|e| e.to_string())?;
+        let generic_row = self.pad_row(generic_row);
+
+        let result_future = self
+            .inner
+            .delete(&generic_row)
+            .map_err(|e| format!("Failed to delete: {e}"))?;
+
+        Ok(Box::new(WriteResult {
+            inner: Some(result_future),
+        }))
+    }
+
+    fn upsert_flush(&mut self) -> ffi::FfiResult {
+        let result = RUNTIME.block_on(async { self.inner.flush().await });
+
+        match result {
+            Ok(_) => ok_result(),
+            Err(e) => err_result(1, e.to_string()),
+        }
+    }
+}
+
+// Lookuper implementation
+unsafe fn delete_lookuper(lookuper: *mut Lookuper) {
+    if !lookuper.is_null() {
+        unsafe {
+            drop(Box::from_raw(lookuper));
+        }
+    }
+}
+
+impl Lookuper {
+    /// Pads `row` with trailing `Datum::Null`s up to the schema's column count (same logic as
+    /// `UpsertWriter::pad_row`); the PK row is never narrower than the schema, as in Python.
+    fn pad_row<'a>(&self, mut row: fcore::row::GenericRow<'a>) -> fcore::row::GenericRow<'a> {
+        let num_columns = self.table_info.get_schema().columns().len();
+        if row.values.len() < num_columns {
+            row.values.resize(num_columns, fcore::row::Datum::Null);
+        }
+        row
+    }
+
+    fn lookup(&mut self, pk_row: &ffi::FfiGenericRow) -> ffi::FfiLookupResult {
+        let schema = self.table_info.get_schema();
+        let generic_row = match types::ffi_row_to_core(pk_row, Some(schema)) {
+            Ok(r) => self.pad_row(r),
+            Err(e) => {
+                return ffi::FfiLookupResult {
+                    result: err_result(1, e.to_string()),
+                    found: false,
+                    row: ffi::FfiGenericRow { fields: vec![] },
+                };
+            }
+        };
+
+        let lookup_result = match RUNTIME.block_on(self.inner.lookup(&generic_row)) {
+            Ok(r) => r,
+            Err(e) => {
+                return ffi::FfiLookupResult {
+                    result: err_result(1, e.to_string()),
+                    found: false,
+                    row: ffi::FfiGenericRow { fields: vec![] },
+                };
+            }
+        };
+
+        match lookup_result.get_single_row() {
+            Ok(Some(row)) => match types::internal_row_to_ffi_row(&row, &self.table_info) {
+                Ok(ffi_row) => ffi::FfiLookupResult {
+                    result: ok_result(),
+                    found: true,
+                    row: ffi_row,
+                },
+                Err(e) => ffi::FfiLookupResult {
+                    result: err_result(1, e.to_string()),
+                    found: false,
+                    row: ffi::FfiGenericRow { fields: vec![] },
+                },
+            },
+            Ok(None) => ffi::FfiLookupResult {
+                result: ok_result(),
+                found: false,
+                row: ffi::FfiGenericRow { fields: vec![] },
+            },
+            Err(e) => ffi::FfiLookupResult {
+                result: err_result(1, e.to_string()),
+                found: false,
+                row: ffi::FfiGenericRow { fields: vec![] },
+            },
+        }
+    }
+}
+
 // LogScanner implementation
 unsafe fn delete_log_scanner(scanner: *mut LogScanner) {
     if !scanner.is_null() {
@@ -1258,13 +1534,18 @@ impl LogScanner {
             let result = RUNTIME.block_on(async { inner.poll(timeout).await });
 
             match result {
-                Ok(records) => ffi::FfiScanRecordsResult {
-                    result: ok_result(),
-                    scan_records: types::core_scan_records_to_ffi(
-                        &records,
-                        &self.projected_columns,
-                    ),
-                },
+                Ok(records) => {
+                    match types::core_scan_records_to_ffi(&records, &self.projected_columns) {
+                        Ok(scan_records) => ffi::FfiScanRecordsResult {
+                            result: ok_result(),
+                            scan_records,
+                        },
+                        Err(e) => ffi::FfiScanRecordsResult {
+                            result: err_result(1, e.to_string()),
+                            scan_records: ffi::FfiScanRecords { records: vec![] },
+                        },
+                    }
+                }
                 Err(e) => ffi::FfiScanRecordsResult {
                     result: err_result(1, e.to_string()),
                     scan_records: ffi::FfiScanRecords { records: vec![] },
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index 4425b5fbfa..5b2f66c805 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -92,12 +92,16 @@ void Table::Destroy() noexcept {
     }
 }
 
-Table::Table(Table&& other) noexcept : table_(other.table_) { other.table_ = nullptr; }
+Table::Table(Table&& other) noexcept
+    : table_(other.table_), column_map_(std::move(other.column_map_)) {
+    other.table_ = nullptr;
+}
 
 Table& Table::operator=(Table&& other) noexcept {
     if (this != &other) {
         Destroy();
         table_ = other.table_;
+        column_map_ = std::move(other.column_map_);
         other.table_ = nullptr;
     }
     return *this;
@@ -111,7 +115,7 @@ Result Table::NewAppendWriter(AppendWriter& out) {
     }
 
     try {
-        out.writer_ = table_->new_append_writer();
+        out = AppendWriter(table_->new_append_writer());
         return utils::make_ok();
     } catch (const rust::Error& e) {
         return utils::make_error(1, e.what());
@@ -177,6 +181,24 @@ Result TableScan::CreateRecordBatchScanner(LogScanner& out) {
     }
 }
 
+const std::shared_ptr<GenericRow::ColumnMap>& Table::GetColumnMap() const {
+    if (!column_map_ && Available()) {
+        auto info = GetTableInfo();
+        auto map = std::make_shared<GenericRow::ColumnMap>();
+        for (size_t i = 0; i < info.schema.columns.size(); ++i) {
+            (*map)[info.schema.columns[i].name] = {i, info.schema.columns[i].data_type.id()};
+        }
+        column_map_ = std::move(map);  // cache only a completely built map
+    }
+    return column_map_;
+}
+
+GenericRow Table::NewRow() const {
+    GenericRow row;
+    row.column_map_ = GetColumnMap();
+    return row;
+}
+
 TableInfo Table::GetTableInfo() const {
     if (!Available()) {
         return TableInfo{};
@@ -281,7 +303,7 @@ Result AppendWriter::Append(const GenericRow& row, WriteResult& out) {
     try {
         auto ffi_row = utils::to_ffi_generic_row(row);
         auto rust_box = writer_->append(ffi_row);
-        out.inner_ = rust_box.into_raw();
+        out = WriteResult(rust_box.into_raw());
         return utils::make_ok();
     } catch (const rust::Error& e) {
         return utils::make_error(1, e.what());
@@ -299,6 +321,213 @@ Result AppendWriter::Flush() {
     return utils::from_ffi_result(ffi_result);
 }
 
+// UpsertWriter implementation
+UpsertWriter::UpsertWriter() noexcept = default;
+
+UpsertWriter::UpsertWriter(ffi::UpsertWriter* writer) noexcept : writer_(writer) {}
+
+UpsertWriter::~UpsertWriter() noexcept { Destroy(); }
+
+void UpsertWriter::Destroy() noexcept {
+    if (writer_) {
+        ffi::delete_upsert_writer(writer_);
+        writer_ = nullptr;
+    }
+}
+
+UpsertWriter::UpsertWriter(UpsertWriter&& other) noexcept : writer_(other.writer_) {
+    other.writer_ = nullptr;
+}
+
+UpsertWriter& UpsertWriter::operator=(UpsertWriter&& other) noexcept {
+    if (this != &other) {
+        Destroy();
+        writer_ = other.writer_;
+        other.writer_ = nullptr;
+    }
+    return *this;
+}
+
+bool UpsertWriter::Available() const { return writer_ != nullptr; }
+
+Result UpsertWriter::Upsert(const GenericRow& row) {
+    WriteResult wr;
+    return Upsert(row, wr);
+}
+
+Result UpsertWriter::Upsert(const GenericRow& row, WriteResult& out) {
+    if (!Available()) {
+        return utils::make_error(1, "UpsertWriter not available");
+    }
+
+    try {
+        auto ffi_row = utils::to_ffi_generic_row(row);
+        auto rust_box = writer_->upsert(ffi_row);
+        out = WriteResult(rust_box.into_raw());
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
+Result UpsertWriter::Delete(const GenericRow& row) {
+    WriteResult wr;
+    return Delete(row, wr);
+}
+
+Result UpsertWriter::Delete(const GenericRow& row, WriteResult& out) {
+    if (!Available()) {
+        return utils::make_error(1, "UpsertWriter not available");
+    }
+
+    try {
+        auto ffi_row = utils::to_ffi_generic_row(row);
+        auto rust_box = writer_->delete_row(ffi_row);
+        out = WriteResult(rust_box.into_raw());
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
+Result UpsertWriter::Flush() {
+    if (!Available()) {
+        return utils::make_error(1, "UpsertWriter not available");
+    }
+
+    auto ffi_result = writer_->upsert_flush();
+    return utils::from_ffi_result(ffi_result);
+}
+
+// Lookuper implementation
+Lookuper::Lookuper() noexcept = default;
+
+Lookuper::Lookuper(ffi::Lookuper* lookuper) noexcept : lookuper_(lookuper) {}
+
+Lookuper::~Lookuper() noexcept { Destroy(); }
+
+void Lookuper::Destroy() noexcept {
+    if (lookuper_) {
+        ffi::delete_lookuper(lookuper_);
+        lookuper_ = nullptr;
+    }
+}
+
+Lookuper::Lookuper(Lookuper&& other) noexcept : lookuper_(other.lookuper_) {
+    other.lookuper_ = nullptr;
+}
+
+Lookuper& Lookuper::operator=(Lookuper&& other) noexcept {
+    if (this != &other) {
+        Destroy();
+        lookuper_ = other.lookuper_;
+        other.lookuper_ = nullptr;
+    }
+    return *this;
+}
+
+bool Lookuper::Available() const { return lookuper_ != nullptr; }
+
+// Looks up the row keyed by `pk_row`; `found` is true only when `out` was populated.
+Result Lookuper::Lookup(const GenericRow& pk_row, bool& found, GenericRow& out) {
+    // Reset the out-flag first so every failure path, including "not available", reports false.
+    found = false;
+    if (!Available()) {
+        return utils::make_error(1, "Lookuper not available");
+    }
+
+    try {
+        auto ffi_row = utils::to_ffi_generic_row(pk_row);
+        auto ffi_result = lookuper_->lookup(ffi_row);
+        auto result = utils::from_ffi_result(ffi_result.result);
+        if (!result.Ok()) {
+            return result;
+        }
+        if (ffi_result.found) {
+            out = utils::from_ffi_generic_row(ffi_result.row);
+            found = true;  // set only after the conversion succeeded
+        }
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
+// Table KV methods
+Result Table::NewUpsertWriter(UpsertWriter& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Table not available");
+    }
+
+    try {
+        out = UpsertWriter(table_->new_upsert_writer());
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
+Result Table::NewUpsertWriter(UpsertWriter& out, const std::vector<std::string>& column_names) {
+    if (!Available()) {
+        return utils::make_error(1, "Table not available");
+    }
+
+    try {
+        rust::Vec<rust::String> rust_names;
+        for (const auto& name : column_names) {
+            rust_names.push_back(rust::String(name));
+        }
+        out = UpsertWriter(table_->new_upsert_writer_with_column_names(std::move(rust_names)));
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
+Result Table::NewUpsertWriter(UpsertWriter& out, const std::vector<size_t>& column_indices) {
+    if (!Available()) {
+        return utils::make_error(1, "Table not available");
+    }
+
+    try {
+        rust::Vec<size_t> rust_indices;
+        for (size_t idx : column_indices) {
+            rust_indices.push_back(idx);
+        }
+        out = UpsertWriter(table_->new_upsert_writer_with_column_indices(std::move(rust_indices)));
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
+Result Table::NewLookuper(Lookuper& out) {
+    if (!Available()) {
+        return utils::make_error(1, "Table not available");
+    }
+
+    try {
+        out = Lookuper(table_->new_lookuper());
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
 // LogScanner implementation
 LogScanner::LogScanner() noexcept = default;
 
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 65b9b0409f..17aa872109 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -316,7 +316,22 @@ pub fn ffi_row_to_core<'a>(
         let datum = match field.datum_type {
             DATUM_TYPE_NULL => Datum::Null,
             DATUM_TYPE_BOOL => Datum::Bool(field.bool_val),
-            DATUM_TYPE_INT32 => Datum::Int32(field.i32_val),
+            DATUM_TYPE_INT32 => match schema
+                .and_then(|s| s.columns().get(idx))
+                .map(|c| c.data_type())
+            {
+                Some(fcore::metadata::DataType::TinyInt(_)) => {
+                    Datum::Int8(i8::try_from(field.i32_val).map_err(|_| {
+                        anyhow!("Column {idx}: {} overflows TinyInt", field.i32_val)
+                    })?)
+                }
+                Some(fcore::metadata::DataType::SmallInt(_)) => {
+                    Datum::Int16(i16::try_from(field.i32_val).map_err(|_| {
+                        anyhow!("Column {idx}: {} overflows SmallInt", field.i32_val)
+                    })?)
+                }
+                _ => Datum::Int32(field.i32_val),
+            },
             DATUM_TYPE_INT64 => Datum::Int64(field.i64_val),
             DATUM_TYPE_FLOAT32 => Datum::Float32(field.f32_val.into()),
             DATUM_TYPE_FLOAT64 => Datum::Float64(field.f64_val.into()),
@@ -360,11 +375,11 @@ pub fn ffi_row_to_core<'a>(
             DATUM_TYPE_TIME => Datum::Time(fcore::row::Time::new(field.i32_val)),
             DATUM_TYPE_TIMESTAMP_NTZ => Datum::TimestampNtz(
                 fcore::row::TimestampNtz::from_millis_nanos(field.i64_val, field.i32_val)
-                    .unwrap_or_else(|_| fcore::row::TimestampNtz::new(field.i64_val)),
+                    .map_err(|e| anyhow!("Column {idx}: {e}"))?,
             ),
             DATUM_TYPE_TIMESTAMP_LTZ => Datum::TimestampLtz(
                 fcore::row::TimestampLtz::from_millis_nanos(field.i64_val, field.i32_val)
-                    .unwrap_or_else(|_| fcore::row::TimestampLtz::new(field.i64_val)),
+                    .map_err(|e| anyhow!("Column {idx}: {e}"))?,
             ),
             other => return Err(anyhow!("Column {idx}: unknown datum type {other}")),
         };
@@ -377,7 +392,7 @@ pub fn ffi_row_to_core<'a>(
 pub fn core_scan_records_to_ffi(
     records: &fcore::record::ScanRecords,
     columns: &[fcore::metadata::Column],
-) -> ffi::FfiScanRecords {
+) -> Result<ffi::FfiScanRecords> {
     let mut ffi_records = Vec::new();
 
     // Iterate over all buckets and their records
@@ -385,7 +400,7 @@ pub fn core_scan_records_to_ffi(
         let bucket_id = table_bucket.bucket_id();
         for record in bucket_records {
             let row = record.row();
-            let fields = core_row_to_ffi_fields(row, columns);
+            let fields = core_row_to_ffi_fields(row, columns)?;
 
             ffi_records.push(ffi::FfiScanRecord {
                 bucket_id,
@@ -396,32 +411,15 @@ pub fn core_scan_records_to_ffi(
         }
     }
 
-    ffi::FfiScanRecords {
+    Ok(ffi::FfiScanRecords {
         records: ffi_records,
-    }
+    })
 }
 
 fn core_row_to_ffi_fields(
     row: &fcore::row::ColumnarRow,
     columns: &[fcore::metadata::Column],
-) -> Vec<ffi::FfiDatum> {
-    fn new_datum(datum_type: i32) -> ffi::FfiDatum {
-        ffi::FfiDatum {
-            datum_type,
-            bool_val: false,
-            i32_val: 0,
-            i64_val: 0,
-            f32_val: 0.0,
-            f64_val: 0.0,
-            string_val: String::new(),
-            bytes_val: vec![],
-            decimal_precision: 0,
-            decimal_scale: 0,
-            i128_hi: 0,
-            i128_lo: 0,
-        }
-    }
-
+) -> Result<Vec<ffi::FfiDatum>> {
     let record_batch = row.get_record_batch();
     let schema = record_batch.schema();
     let row_id = row.get_row_id();
@@ -430,124 +428,135 @@ fn core_row_to_ffi_fields(
 
     for (i, field) in schema.fields().iter().enumerate() {
         if row.is_null_at(i) {
-            fields.push(new_datum(DATUM_TYPE_NULL));
+            fields.push(ffi::FfiDatum::default());
             continue;
         }
 
         let datum = match field.data_type() {
-            ArrowDataType::Boolean => {
-                let mut datum = new_datum(DATUM_TYPE_BOOL);
-                datum.bool_val = row.get_boolean(i);
-                datum
-            }
-            ArrowDataType::Int8 => {
-                let mut datum = new_datum(DATUM_TYPE_INT32);
-                datum.i32_val = row.get_byte(i) as i32;
-                datum
-            }
-            ArrowDataType::Int16 => {
-                let mut datum = new_datum(DATUM_TYPE_INT32);
-                datum.i32_val = row.get_short(i) as i32;
-                datum
-            }
-            ArrowDataType::Int32 => {
-                let mut datum = new_datum(DATUM_TYPE_INT32);
-                datum.i32_val = row.get_int(i);
-                datum
-            }
-            ArrowDataType::Int64 => {
-                let mut datum = new_datum(DATUM_TYPE_INT64);
-                datum.i64_val = row.get_long(i);
-                datum
-            }
-            ArrowDataType::Float32 => {
-                let mut datum = new_datum(DATUM_TYPE_FLOAT32);
-                datum.f32_val = row.get_float(i);
-                datum
-            }
-            ArrowDataType::Float64 => {
-                let mut datum = new_datum(DATUM_TYPE_FLOAT64);
-                datum.f64_val = row.get_double(i);
-                datum
-            }
-            ArrowDataType::Utf8 => {
-                let mut datum = new_datum(DATUM_TYPE_STRING);
-                // todo: avoid copy string
-                datum.string_val = row.get_string(i).to_string();
-                datum
-            }
+            ArrowDataType::Boolean => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_BOOL,
+                bool_val: row.get_boolean(i),
+                ..Default::default()
+            },
+            ArrowDataType::Int8 => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_INT32,
+                i32_val: row.get_byte(i) as i32,
+                ..Default::default()
+            },
+            ArrowDataType::Int16 => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_INT32,
+                i32_val: row.get_short(i) as i32,
+                ..Default::default()
+            },
+            ArrowDataType::Int32 => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_INT32,
+                i32_val: row.get_int(i),
+                ..Default::default()
+            },
+            ArrowDataType::Int64 => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_INT64,
+                i64_val: row.get_long(i),
+                ..Default::default()
+            },
+            ArrowDataType::Float32 => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_FLOAT32,
+                f32_val: row.get_float(i),
+                ..Default::default()
+            },
+            ArrowDataType::Float64 => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_FLOAT64,
+                f64_val: row.get_double(i),
+                ..Default::default()
+            },
+            ArrowDataType::Utf8 => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_STRING,
+                string_val: row.get_string(i).to_string(),
+                ..Default::default()
+            },
             ArrowDataType::LargeUtf8 => {
                 let array = record_batch
                     .column(i)
                     .as_any()
                     .downcast_ref::<LargeStringArray>()
-                    .expect("LargeUtf8 column expected");
-                let mut datum = new_datum(DATUM_TYPE_STRING);
-                datum.string_val = array.value(row_id).to_string();
-                datum
-            }
-            ArrowDataType::Binary => {
-                let mut datum = new_datum(DATUM_TYPE_BYTES);
-                // todo: avoid copy bytes for blob
-                datum.bytes_val = row.get_bytes(i).to_vec();
-                datum
-            }
-            ArrowDataType::FixedSizeBinary(len) => {
-                let mut datum = new_datum(DATUM_TYPE_BYTES);
-                datum.bytes_val = row.get_binary(i, *len as usize).to_vec();
-                datum
+                    .ok_or_else(|| anyhow!("Column {i}: expected LargeUtf8 array"))?;
+                ffi::FfiDatum {
+                    datum_type: DATUM_TYPE_STRING,
+                    string_val: array.value(row_id).to_string(),
+                    ..Default::default()
+                }
             }
+            ArrowDataType::Binary => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_BYTES,
+                bytes_val: row.get_bytes(i).to_vec(),
+                ..Default::default()
+            },
+            ArrowDataType::FixedSizeBinary(len) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_BYTES,
+                bytes_val: row.get_binary(i, *len as usize).to_vec(),
+                ..Default::default()
+            },
             ArrowDataType::LargeBinary => {
                 let array = record_batch
                     .column(i)
                     .as_any()
                     .downcast_ref::<LargeBinaryArray>()
-                    .expect("LargeBinary column expected");
-                let mut datum = new_datum(DATUM_TYPE_BYTES);
-                datum.bytes_val = array.value(row_id).to_vec();
-                datum
+                    .ok_or_else(|| anyhow!("Column {i}: expected LargeBinary array"))?;
+                ffi::FfiDatum {
+                    datum_type: DATUM_TYPE_BYTES,
+                    bytes_val: array.value(row_id).to_vec(),
+                    ..Default::default()
+                }
             }
             ArrowDataType::Date32 => {
                 let array = record_batch
                     .column(i)
                     .as_any()
                     .downcast_ref::<Date32Array>()
-                    .expect("Date32 column expected");
-                let mut datum = new_datum(DATUM_TYPE_DATE);
-                datum.i32_val = array.value(row_id);
-                datum
+                    .ok_or_else(|| anyhow!("Column {i}: expected Date32 array"))?;
+                ffi::FfiDatum {
+                    datum_type: DATUM_TYPE_DATE,
+                    i32_val: array.value(row_id),
+                    ..Default::default()
+                }
             }
             ArrowDataType::Timestamp(unit, _tz) => {
                 let datum_type = match columns.get(i).map(|c| c.data_type()) {
                     Some(fcore::metadata::DataType::TimestampLTz(_)) => DATUM_TYPE_TIMESTAMP_LTZ,
                     _ => DATUM_TYPE_TIMESTAMP_NTZ,
                 };
-                let mut datum = new_datum(datum_type);
+                let mut datum = ffi::FfiDatum {
+                    datum_type,
+                    ..Default::default()
+                };
                 match unit {
                     TimeUnit::Second => {
                         let array = record_batch
                             .column(i)
                             .as_any()
                             .downcast_ref::<TimestampSecondArray>()
-                            .expect("Timestamp(second) column expected");
+                            .ok_or_else(|| {
+                                anyhow!("Column {i}: expected Timestamp(second) array")
+                            })?;
                         datum.i64_val = array.value(row_id) * MILLIS_PER_SECOND;
-                        datum.i32_val = 0;
                     }
                     TimeUnit::Millisecond => {
                         let array = record_batch
                             .column(i)
                             .as_any()
                             .downcast_ref::<TimestampMillisecondArray>()
-                            .expect("Timestamp(millisecond) column expected");
+                            .ok_or_else(|| {
+                                anyhow!("Column {i}: expected Timestamp(millisecond) array")
+                            })?;
                         datum.i64_val = array.value(row_id);
-                        datum.i32_val = 0;
                     }
                     TimeUnit::Microsecond => {
                         let array = record_batch
                             .column(i)
                             .as_any()
                             .downcast_ref::<TimestampMicrosecondArray>()
-                            .expect("Timestamp(microsecond) column expected");
+                            .ok_or_else(|| {
+                                anyhow!("Column {i}: expected Timestamp(microsecond) array")
+                            })?;
                         let micros = array.value(row_id);
                         datum.i64_val = micros.div_euclid(MICROS_PER_MILLI);
                         datum.i32_val =
@@ -558,7 +567,9 @@ fn core_row_to_ffi_fields(
                             .column(i)
                             .as_any()
                             .downcast_ref::<TimestampNanosecondArray>()
-                            .expect("Timestamp(nanosecond) column expected");
+                            .ok_or_else(|| {
+                                anyhow!("Column {i}: expected Timestamp(nanosecond) array")
+                            })?;
                         let nanos = array.value(row_id);
                         datum.i64_val = nanos.div_euclid(NANOS_PER_MILLI);
                         datum.i32_val = nanos.rem_euclid(NANOS_PER_MILLI) as i32;
@@ -572,22 +583,26 @@ fn core_row_to_ffi_fields(
                         .column(i)
                         .as_any()
                         .downcast_ref::<Time32SecondArray>()
-                        .expect("Time32(second) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_TIME);
-                    datum.i32_val = array.value(row_id) * MILLIS_PER_SECOND as i32;
-                    datum
+                        .ok_or_else(|| anyhow!("Column {i}: expected Time32(second) array"))?;
+                    ffi::FfiDatum {
+                        datum_type: DATUM_TYPE_TIME,
+                        i32_val: array.value(row_id) * MILLIS_PER_SECOND as i32,
+                        ..Default::default()
+                    }
                 }
                 TimeUnit::Millisecond => {
                     let array = record_batch
                         .column(i)
                         .as_any()
                         .downcast_ref::<Time32MillisecondArray>()
-                        .expect("Time32(millisecond) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_TIME);
-                    datum.i32_val = array.value(row_id);
-                    datum
+                        .ok_or_else(|| anyhow!("Column {i}: expected Time32(millisecond) array"))?;
+                    ffi::FfiDatum {
+                        datum_type: DATUM_TYPE_TIME,
+                        i32_val: array.value(row_id),
+                        ..Default::default()
+                    }
                 }
-                _ => panic!("Will never come here. Unsupported Time32 unit for column {i}"),
+                _ => return Err(anyhow!("Column {i}: unsupported Time32 unit")),
             },
             ArrowDataType::Time64(unit) => match unit {
                 TimeUnit::Microsecond => {
@@ -595,55 +610,210 @@ fn core_row_to_ffi_fields(
                         .column(i)
                         .as_any()
                         .downcast_ref::<Time64MicrosecondArray>()
-                        .expect("Time64(microsecond) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_TIME);
-                    datum.i32_val = (array.value(row_id) / MICROS_PER_MILLI) as i32;
-                    datum
+                        .ok_or_else(|| anyhow!("Column {i}: expected Time64(microsecond) array"))?;
+                    ffi::FfiDatum {
+                        datum_type: DATUM_TYPE_TIME,
+                        i32_val: (array.value(row_id) / MICROS_PER_MILLI) as i32,
+                        ..Default::default()
+                    }
                 }
                 TimeUnit::Nanosecond => {
                     let array = record_batch
                         .column(i)
                         .as_any()
                         .downcast_ref::<Time64NanosecondArray>()
-                        .expect("Time64(nanosecond) column expected");
-                    let mut datum = new_datum(DATUM_TYPE_TIME);
-                    datum.i32_val = (array.value(row_id) / NANOS_PER_MILLI) as i32;
-                    datum
+                        .ok_or_else(|| anyhow!("Column {i}: expected Time64(nanosecond) array"))?;
+                    ffi::FfiDatum {
+                        datum_type: DATUM_TYPE_TIME,
+                        i32_val: (array.value(row_id) / NANOS_PER_MILLI) as i32,
+                        ..Default::default()
+                    }
                 }
-                _ => panic!("Will never come here. Unsupported Time64 unit for column {i}"),
+                _ => return Err(anyhow!("Column {i}: unsupported Time64 unit")),
             },
             ArrowDataType::Decimal128(precision, scale) => {
                 let array = record_batch
                     .column(i)
                     .as_any()
                     .downcast_ref::<Decimal128Array>()
-                    .expect("Decimal128 column expected");
+                    .ok_or_else(|| anyhow!("Column {i}: expected Decimal128 array"))?;
                 let i128_val = array.value(row_id);
 
                 if fcore::row::Decimal::is_compact_precision(*precision as u32) {
-                    let mut datum = new_datum(DATUM_TYPE_DECIMAL_I64);
-                    datum.i64_val = i128_val as i64;
-                    datum.decimal_precision = *precision as i32;
-                    datum.decimal_scale = *scale as i32;
-                    datum
+                    ffi::FfiDatum {
+                        datum_type: DATUM_TYPE_DECIMAL_I64,
+                        i64_val: i128_val as i64,
+                        decimal_precision: *precision as i32,
+                        decimal_scale: *scale as i32,
+                        ..Default::default()
+                    }
                 } else {
-                    let mut datum = new_datum(DATUM_TYPE_DECIMAL_I128);
-                    datum.i128_hi = (i128_val >> 64) as i64;
-                    datum.i128_lo = i128_val as i64;
-                    datum.decimal_precision = *precision as i32;
-                    datum.decimal_scale = *scale as i32;
-                    datum
+                    ffi::FfiDatum {
+                        datum_type: DATUM_TYPE_DECIMAL_I128,
+                        i128_hi: (i128_val >> 64) as i64,
+                        i128_lo: i128_val as i64,
+                        decimal_precision: *precision as i32,
+                        decimal_scale: *scale as i32,
+                        ..Default::default()
+                    }
                 }
             }
-            other => panic!(
-                "Will never come here. Unsupported Arrow data type for column {i}: {other:?}"
-            ),
+            other => return Err(anyhow!("Column {i}: unsupported Arrow data type {other:?}")),
+        };
+
+        fields.push(datum);
+    }
+
+    Ok(fields)
+}
+
+impl Default for ffi::FfiDatum {
+    fn default() -> Self {
+        Self {
+            datum_type: DATUM_TYPE_NULL,
+            bool_val: false,
+            i32_val: 0,
+            i64_val: 0,
+            f32_val: 0.0,
+            f64_val: 0.0,
+            string_val: String::new(),
+            bytes_val: vec![],
+            decimal_precision: 0,
+            decimal_scale: 0,
+            i128_hi: 0,
+            i128_lo: 0,
+        }
+    }
+}
+
+/// Convert any InternalRow to FfiGenericRow using Fluss schema metadata.
+/// Used for lookup results (CompactedRow) where Arrow schema is unavailable.
+pub fn internal_row_to_ffi_row(
+    row: &dyn fcore::row::InternalRow,
+    table_info: &fcore::metadata::TableInfo,
+) -> Result<ffi::FfiGenericRow> {
+    let schema = table_info.get_schema();
+    let columns = schema.columns();
+    let mut fields = Vec::with_capacity(columns.len());
+
+    for (i, col) in columns.iter().enumerate() {
+        if row.is_null_at(i) {
+            fields.push(ffi::FfiDatum::default());
+            continue;
+        }
+
+        let datum = match col.data_type() {
+            fcore::metadata::DataType::Boolean(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_BOOL,
+                bool_val: row.get_boolean(i),
+                ..Default::default()
+            },
+            fcore::metadata::DataType::TinyInt(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_INT32,
+                i32_val: row.get_byte(i) as i32,
+                ..Default::default()
+            },
+            fcore::metadata::DataType::SmallInt(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_INT32,
+                i32_val: row.get_short(i) as i32,
+                ..Default::default()
+            },
+            fcore::metadata::DataType::Int(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_INT32,
+                i32_val: row.get_int(i),
+                ..Default::default()
+            },
+            fcore::metadata::DataType::BigInt(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_INT64,
+                i64_val: row.get_long(i),
+                ..Default::default()
+            },
+            fcore::metadata::DataType::Float(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_FLOAT32,
+                f32_val: row.get_float(i),
+                ..Default::default()
+            },
+            fcore::metadata::DataType::Double(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_FLOAT64,
+                f64_val: row.get_double(i),
+                ..Default::default()
+            },
+            fcore::metadata::DataType::String(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_STRING,
+                string_val: row.get_string(i).to_string(),
+                ..Default::default()
+            },
+            fcore::metadata::DataType::Bytes(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_BYTES,
+                bytes_val: row.get_bytes(i).to_vec(),
+                ..Default::default()
+            },
+            fcore::metadata::DataType::Date(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_DATE,
+                i32_val: row.get_date(i).get_inner(),
+                ..Default::default()
+            },
+            fcore::metadata::DataType::Time(_) => ffi::FfiDatum {
+                datum_type: DATUM_TYPE_TIME,
+                i32_val: row.get_time(i).get_inner(),
+                ..Default::default()
+            },
+            fcore::metadata::DataType::Timestamp(dt) => {
+                let ts = row.get_timestamp_ntz(i, dt.precision());
+                ffi::FfiDatum {
+                    datum_type: DATUM_TYPE_TIMESTAMP_NTZ,
+                    i64_val: ts.get_millisecond(),
+                    i32_val: ts.get_nano_of_millisecond(),
+                    ..Default::default()
+                }
+            }
+            fcore::metadata::DataType::TimestampLTz(dt) => {
+                let ts = row.get_timestamp_ltz(i, dt.precision());
+                ffi::FfiDatum {
+                    datum_type: DATUM_TYPE_TIMESTAMP_LTZ,
+                    i64_val: ts.get_epoch_millisecond(),
+                    i32_val: ts.get_nano_of_millisecond(),
+                    ..Default::default()
+                }
+            }
+            fcore::metadata::DataType::Decimal(dt) => {
+                let precision = dt.precision();
+                let scale = dt.scale();
+                let decimal = row.get_decimal(i, precision as usize, scale as usize);
+                if fcore::row::Decimal::is_compact_precision(precision) {
+                    ffi::FfiDatum {
+                        datum_type: DATUM_TYPE_DECIMAL_I64,
+                        i64_val: decimal.to_unscaled_long().map_err(|e| {
+                            anyhow!("Column {i}: compact decimal conversion failed: {e}")
+                        })?,
+                        decimal_precision: precision as i32,
+                        decimal_scale: scale as i32,
+                        ..Default::default()
+                    }
+                } else {
+                    let bd = decimal.to_big_decimal();
+                    let (unscaled, _) = bd.into_bigint_and_exponent();
+                    use bigdecimal::ToPrimitive;
+                    let i128_val = unscaled.to_i128().ok_or_else(|| {
+                        anyhow!("Column {i}: decimal unscaled value does not fit in i128")
+                    })?;
+                    ffi::FfiDatum {
+                        datum_type: DATUM_TYPE_DECIMAL_I128,
+                        i128_hi: (i128_val >> 64) as i64,
+                        i128_lo: i128_val as i64,
+                        decimal_precision: precision as i32,
+                        decimal_scale: scale as i32,
+                        ..Default::default()
+                    }
+                }
+            }
+            other => return Err(anyhow!("Unsupported data type for column {i}: {other:?}")),
         };
 
         fields.push(datum);
     }
 
-    fields
+    Ok(ffi::FfiGenericRow { fields })
 }
 
 pub fn core_lake_snapshot_to_ffi(snapshot: &fcore::metadata::LakeSnapshot) -> ffi::FfiLakeSnapshot {

From 02fc41171c3c4992917d6ca8daeecfc6a1d36faa Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 9 Feb 2026 14:51:13 +0000
Subject: [PATCH 133/287] feat: Partitioned KV tables python example (#290)

---
 fluss-rust/bindings/python/example/example.py | 106 ++++++++++++++++++
 1 file changed, 106 insertions(+)

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 9f8cafa33a..3d4235392d 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -802,6 +802,112 @@ async def main():
         print(f"Error with partitioned table: {e}")
         traceback.print_exc()
 
+    # =====================================================
+    # Demo: Partitioned KV Table (Upsert, Lookup, Delete)
+    # =====================================================
+    print("\n" + "=" * 60)
+    print("--- Testing Partitioned KV Table ---")
+    print("=" * 60)
+
+    partitioned_kv_fields = [
+        pa.field("region", pa.string()),   # partition key + part of PK
+        pa.field("user_id", pa.int32()),   # part of PK
+        pa.field("name", pa.string()),
+        pa.field("score", pa.int64()),
+    ]
+    partitioned_kv_schema = pa.schema(partitioned_kv_fields)
+    fluss_partitioned_kv_schema = fluss.Schema(
+        partitioned_kv_schema, primary_keys=["region", "user_id"]
+    )
+
+    partitioned_kv_descriptor = fluss.TableDescriptor(
+        fluss_partitioned_kv_schema,
+        partition_keys=["region"],
+    )
+
+    partitioned_kv_path = fluss.TablePath("fluss", "partitioned_kv_table_py")
+
+    try:
+        await admin.drop_table(partitioned_kv_path, ignore_if_not_exists=True)
+        await admin.create_table(partitioned_kv_path, partitioned_kv_descriptor, False)
+        print(f"Created partitioned KV table: {partitioned_kv_path}")
+
+        # Create partitions
+        await admin.create_partition(partitioned_kv_path, {"region": "US"})
+        await admin.create_partition(partitioned_kv_path, {"region": "EU"})
+        await admin.create_partition(partitioned_kv_path, {"region": "APAC"})
+        print("Created partitions: US, EU, APAC")
+
+        partitioned_kv_table = await conn.get_table(partitioned_kv_path)
+        upsert_writer = partitioned_kv_table.new_upsert()
+
+        # Upsert rows across partitions
+        test_data = [
+            ("US", 1, "Gustave", 100),
+            ("US", 2, "Lune", 200),
+            ("EU", 1, "Sciel", 150),
+            ("EU", 2, "Maelle", 250),
+            ("APAC", 1, "Noco", 300),
+        ]
+        for region, user_id, name, score in test_data:
+            upsert_writer.upsert({
+                "region": region, "user_id": user_id,
+                "name": name, "score": score,
+            })
+        await upsert_writer.flush()
+        print(f"Upserted {len(test_data)} rows across 3 partitions")
+
+        # Lookup all rows across partitions
+        print("\n--- Lookup across partitions ---")
+        lookuper = partitioned_kv_table.new_lookup()
+        for region, user_id, name, score in test_data:
+            result = await lookuper.lookup({"region": region, "user_id": user_id})
+            assert result is not None, f"Expected to find region={region} user_id={user_id}"
+            assert result["name"] == name, f"Name mismatch: {result['name']} != {name}"
+            assert result["score"] == score, f"Score mismatch: {result['score']} != {score}"
+        print(f"All {len(test_data)} rows verified across partitions")
+
+        # Update within a partition
+        print("\n--- Update within partition ---")
+        handle = upsert_writer.upsert({
+            "region": "US", "user_id": 1,
+            "name": "Gustave Updated", "score": 999,
+        })
+        await handle.wait()
+        result = await lookuper.lookup({"region": "US", "user_id": 1})
+        assert result is not None, "Expected to find region=US user_id=1 after update"
+        assert result["name"] == "Gustave Updated"
+        assert result["score"] == 999
+        print(f"Update verified: US/1 name={result['name']} score={result['score']}")
+
+        # Lookup in non-existent partition
+        print("\n--- Lookup in non-existent partition ---")
+        result = await lookuper.lookup({"region": "UNKNOWN", "user_id": 1})
+        assert result is None, "Expected UNKNOWN partition lookup to return None"
+        print("UNKNOWN partition lookup: not found (expected)")
+
+        # Delete within a partition
+        print("\n--- Delete within partition ---")
+        handle = upsert_writer.delete({"region": "EU", "user_id": 1})
+        await handle.wait()
+        result = await lookuper.lookup({"region": "EU", "user_id": 1})
+        assert result is None, "Expected EU/1 to be deleted"
+        print("Delete verified: EU/1 not found")
+
+        # Verify sibling record still exists
+        result = await lookuper.lookup({"region": "EU", "user_id": 2})
+        assert result is not None, "Expected EU/2 to still exist"
+        assert result["name"] == "Maelle"
+        print(f"EU/2 still exists: name={result['name']}")
+
+        # Cleanup
+        await admin.drop_table(partitioned_kv_path, ignore_if_not_exists=True)
+        print(f"\nDropped partitioned KV table: {partitioned_kv_path}")
+
+    except Exception as e:
+        print(f"Error with partitioned KV table: {e}")
+        traceback.print_exc()
+
     # Close connection
     conn.close()
     print("\nConnection closed")

From 219c016833c8574b7d402e09236aa7bbdf59a6eb Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Tue, 10 Feb 2026 01:29:40 +0000
Subject: [PATCH 134/287] doc: add python docs and API reference (#291)

---
 fluss-rust/bindings/python/API_REFERENCE.md   | 278 ++++++++++
 fluss-rust/bindings/python/DEVELOPMENT.md     | 114 ++++
 fluss-rust/bindings/python/README.md          | 494 ++++++++++++++----
 fluss-rust/bindings/python/fluss/__init__.pyi |   3 +-
 4 files changed, 790 insertions(+), 99 deletions(-)
 create mode 100644 fluss-rust/bindings/python/API_REFERENCE.md
 create mode 100644 fluss-rust/bindings/python/DEVELOPMENT.md

diff --git a/fluss-rust/bindings/python/API_REFERENCE.md b/fluss-rust/bindings/python/API_REFERENCE.md
new file mode 100644
index 0000000000..258b26e6e8
--- /dev/null
+++ b/fluss-rust/bindings/python/API_REFERENCE.md
@@ -0,0 +1,278 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# Python API Reference
+
+Complete API reference for the Fluss Python client. For a usage guide with examples, see the [Python Client Guide](README.md).
+
+## `Config`
+
+| Method / Property | Description |
+|---|---|
+| `Config(properties: dict = None)` | Create config from a dict of key-value pairs |
+| `.bootstrap_server` | Get/set coordinator server address |
+| `.request_max_size` | Get/set max request size in bytes |
+| `.writer_batch_size` | Get/set write batch size in bytes |
+
+## `FlussConnection`
+
+| Method | Description |
+|---|---|
+| `await FlussConnection.connect(config) -> FlussConnection` | Connect to a Fluss cluster |
+| `await conn.get_admin() -> FlussAdmin` | Get admin interface |
+| `await conn.get_table(table_path) -> FlussTable` | Get a table for read/write operations |
+| `conn.close()` | Close the connection |
+
+Supports the `with` statement (usable as a context manager).
+
+## `FlussAdmin`
+
+| Method | Description |
+|---|---|
+| `await create_database(name, ignore_if_exists=False, database_descriptor=None)` | Create a database |
+| `await drop_database(name, ignore_if_not_exists=False, cascade=True)` | Drop a database |
+| `await list_databases() -> list[str]` | List all databases |
+| `await database_exists(name) -> bool` | Check if a database exists |
+| `await get_database_info(name) -> DatabaseInfo` | Get database metadata |
+| `await create_table(table_path, table_descriptor, ignore_if_exists=False)` | Create a table |
+| `await drop_table(table_path, ignore_if_not_exists=False)` | Drop a table |
+| `await get_table(table_path) -> TableInfo` | Get table metadata |
+| `await list_tables(database_name) -> list[str]` | List tables in a database |
+| `await table_exists(table_path) -> bool` | Check if a table exists |
+| `await list_offsets(table_path, bucket_ids, offset_type, timestamp=None) -> dict[int, int]` | Get offsets for buckets |
+| `await list_partition_offsets(table_path, partition_name, bucket_ids, offset_type, timestamp=None) -> dict[int, int]` | Get offsets for a partition's buckets |
+| `await create_partition(table_path, partition_spec, ignore_if_exists=False)` | Create a partition |
+| `await drop_partition(table_path, partition_spec, ignore_if_not_exists=False)` | Drop a partition |
+| `await list_partition_infos(table_path) -> list[PartitionInfo]` | List partitions |
+| `await get_latest_lake_snapshot(table_path) -> LakeSnapshot` | Get latest lake snapshot |
+
+## `FlussTable`
+
+| Method | Description |
+|---|---|
+| `new_scan() -> TableScan` | Create a scan builder |
+| `await new_append_writer() -> AppendWriter` | Create writer for log tables |
+| `new_upsert(columns=None, column_indices=None) -> UpsertWriter` | Create writer for PK tables (optionally partial) |
+| `new_lookup() -> Lookuper` | Create lookuper for PK tables |
+| `get_table_info() -> TableInfo` | Get table metadata |
+| `get_table_path() -> TablePath` | Get table path |
+| `has_primary_key() -> bool` | Check if table has a primary key |
+
+## `TableScan`
+
+| Method | Description |
+|---|---|
+| `.project(indices) -> TableScan` | Project columns by index |
+| `.project_by_name(names) -> TableScan` | Project columns by name |
+| `await .create_log_scanner() -> LogScanner` | Create record-based scanner (for `poll()`) |
+| `await .create_batch_scanner() -> LogScanner` | Create batch-based scanner (for `poll_arrow()`, `to_arrow()`, etc.) |
+
+## `AppendWriter`
+
+| Method | Description |
+|---|---|
+| `.append(row) -> WriteResultHandle` | Append a row (dict, list, or tuple) |
+| `.write_arrow(table)` | Write a PyArrow Table |
+| `.write_arrow_batch(batch) -> WriteResultHandle` | Write a PyArrow RecordBatch |
+| `.write_pandas(df)` | Write a Pandas DataFrame |
+| `await .flush()` | Flush all pending writes |
+
+## `UpsertWriter`
+
+| Method | Description |
+|---|---|
+| `.upsert(row) -> WriteResultHandle` | Upsert a row (insert or update by PK) |
+| `.delete(pk) -> WriteResultHandle` | Delete a row by primary key |
+| `await .flush()` | Flush all pending operations |
+
+## `WriteResultHandle`
+
+| Method | Description |
+|---|---|
+| `await .wait()` | Wait for server acknowledgment of this write |
+
+## `Lookuper`
+
+| Method | Description |
+|---|---|
+| `await .lookup(pk) -> dict \| None` | Lookup a row by primary key |
+
+## `LogScanner`
+
+| Method | Description |
+|---|---|
+| `.subscribe(bucket_id, start_offset)` | Subscribe to a bucket |
+| `.subscribe_buckets(bucket_offsets)` | Subscribe to multiple buckets (`{bucket_id: offset}`) |
+| `.subscribe_partition(partition_id, bucket_id, start_offset)` | Subscribe to a partition bucket |
+| `.subscribe_partition_buckets(partition_bucket_offsets)` | Subscribe to multiple partition+bucket combos (`{(part_id, bucket_id): offset}`) |
+| `.unsubscribe_partition(partition_id, bucket_id)` | Unsubscribe from a partition bucket |
+| `.poll(timeout_ms) -> list[ScanRecord]` | Poll individual records (record scanner only) |
+| `.poll_arrow(timeout_ms) -> pa.Table` | Poll as Arrow Table (batch scanner only) |
+| `.poll_batches(timeout_ms) -> list[RecordBatch]` | Poll batches with metadata (batch scanner only) |
+| `.to_arrow() -> pa.Table` | Read all subscribed data as Arrow Table (batch scanner only) |
+| `.to_pandas() -> pd.DataFrame` | Read all subscribed data as DataFrame (batch scanner only) |
+
+## `ScanRecord`
+
+| Property | Description |
+|---|---|
+| `.bucket -> TableBucket` | Bucket this record belongs to |
+| `.offset -> int` | Record offset in the log |
+| `.timestamp -> int` | Record timestamp |
+| `.change_type -> ChangeType` | Change type (AppendOnly, Insert, UpdateBefore, UpdateAfter, Delete) |
+| `.row -> dict` | Row data as `{column_name: value}` |
+
+## `RecordBatch`
+
+| Property | Description |
+|---|---|
+| `.batch -> pa.RecordBatch` | Arrow RecordBatch data |
+| `.bucket -> TableBucket` | Bucket this batch belongs to |
+| `.base_offset -> int` | First record offset |
+| `.last_offset -> int` | Last record offset |
+
+## `Schema`
+
+| Method | Description |
+|---|---|
+| `Schema(schema: pa.Schema, primary_keys=None)` | Create from PyArrow schema |
+| `.get_column_names() -> list[str]` | Get column names |
+| `.get_column_types() -> list[str]` | Get column type names |
+
+## `TableDescriptor`
+
+| Method | Description |
+|---|---|
+| `TableDescriptor(schema, *, partition_keys=None, bucket_count=None, bucket_keys=None, comment=None, log_format=None, kv_format=None, properties=None, custom_properties=None)` | Create table descriptor |
+| `.get_schema() -> Schema` | Get the schema |
+
+## `TablePath`
+
+| Method / Property | Description |
+|---|---|
+| `TablePath(database, table)` | Create a table path |
+| `.database_name -> str` | Database name |
+| `.table_name -> str` | Table name |
+
+## `TableInfo`
+
+| Property / Method | Description |
+|---|---|
+| `.table_id -> int` | Table ID |
+| `.table_path -> TablePath` | Table path |
+| `.num_buckets -> int` | Number of buckets |
+| `.schema_id -> int` | Schema ID |
+| `.comment -> str \| None` | Table comment |
+| `.created_time -> int` | Creation timestamp |
+| `.modified_time -> int` | Last modification timestamp |
+| `.get_primary_keys() -> list[str]` | Primary key columns |
+| `.get_partition_keys() -> list[str]` | Partition columns |
+| `.get_bucket_keys() -> list[str]` | Bucket key columns |
+| `.has_primary_key() -> bool` | Has primary key? |
+| `.is_partitioned() -> bool` | Is partitioned? |
+| `.get_schema() -> Schema` | Get table schema |
+| `.get_column_names() -> list[str]` | Column names |
+| `.get_column_count() -> int` | Number of columns |
+| `.get_properties() -> dict` | All table properties |
+| `.get_custom_properties() -> dict` | Custom properties only |
+
+## `PartitionInfo`
+
+| Property | Description |
+|---|---|
+| `.partition_id -> int` | Partition ID |
+| `.partition_name -> str` | Partition name |
+
+## `DatabaseDescriptor`
+
+| Method / Property | Description |
+|---|---|
+| `DatabaseDescriptor(comment=None, custom_properties=None)` | Create descriptor |
+| `.comment -> str \| None` | Database comment |
+| `.get_custom_properties() -> dict` | Custom properties |
+
+## `DatabaseInfo`
+
+| Property / Method | Description |
+|---|---|
+| `.database_name -> str` | Database name |
+| `.created_time -> int` | Creation timestamp |
+| `.modified_time -> int` | Last modification timestamp |
+| `.get_database_descriptor() -> DatabaseDescriptor` | Get descriptor |
+
+## `LakeSnapshot`
+
+| Property / Method | Description |
+|---|---|
+| `.snapshot_id -> int` | Snapshot ID |
+| `.table_buckets_offset -> dict[TableBucket, int]` | All bucket offsets |
+| `.get_bucket_offset(bucket) -> int \| None` | Get offset for a bucket |
+| `.get_table_buckets() -> list[TableBucket]` | Get all buckets |
+
+## `TableBucket`
+
+| Method / Property | Description |
+|---|---|
+| `TableBucket(table_id, bucket)` | Create non-partitioned bucket |
+| `TableBucket.with_partition(table_id, partition_id, bucket)` | Create partitioned bucket |
+| `.table_id -> int` | Table ID |
+| `.bucket_id -> int` | Bucket ID |
+| `.partition_id -> int \| None` | Partition ID (None if non-partitioned) |
+
+## `FlussError`
+
+| Property | Description |
+|---|---|
+| `.message -> str` | Error message |
+
+Raised for all Fluss-specific errors (connection failures, table not found, schema mismatches, etc.). Inherits from `Exception`.
+
+## Constants
+
+| Constant | Value | Description |
+|---|---|---|
+| `fluss.EARLIEST_OFFSET` | `-2` | Start reading from earliest available offset |
+| `fluss.LATEST_OFFSET` | `-1` | Start reading from latest offset (only new records) |
+| `fluss.OffsetType.EARLIEST` | `"earliest"` | For `list_offsets()` |
+| `fluss.OffsetType.LATEST` | `"latest"` | For `list_offsets()` |
+| `fluss.OffsetType.TIMESTAMP` | `"timestamp"` | For `list_offsets()` with timestamp |
+
+## `ChangeType`
+
+| Value | Short String | Description |
+|---|---|---|
+| `ChangeType.AppendOnly` (0) | `+A` | Append-only |
+| `ChangeType.Insert` (1) | `+I` | Insert |
+| `ChangeType.UpdateBefore` (2) | `-U` | Previous value of updated row |
+| `ChangeType.UpdateAfter` (3) | `+U` | New value of updated row |
+| `ChangeType.Delete` (4) | `-D` | Delete |
+
+## Data Types
+
+| PyArrow Type | Fluss Type | Python Type |
+|---|---|---|
+| `pa.boolean()` | Boolean | `bool` |
+| `pa.int8()` / `int16()` / `int32()` / `int64()` | TinyInt / SmallInt / Int / BigInt | `int` |
+| `pa.float32()` / `float64()` | Float / Double | `float` |
+| `pa.string()` | String | `str` |
+| `pa.binary()` | Bytes | `bytes` |
+| `pa.date32()` | Date | `datetime.date` |
+| `pa.time32("ms")` | Time | `datetime.time` |
+| `pa.timestamp("us")` | Timestamp (NTZ) | `datetime.datetime` |
+| `pa.timestamp("us", tz="UTC")` | TimestampLTZ | `datetime.datetime` |
+| `pa.decimal128(precision, scale)` | Decimal | `decimal.Decimal` |
diff --git a/fluss-rust/bindings/python/DEVELOPMENT.md b/fluss-rust/bindings/python/DEVELOPMENT.md
new file mode 100644
index 0000000000..e316f5e8e6
--- /dev/null
+++ b/fluss-rust/bindings/python/DEVELOPMENT.md
@@ -0,0 +1,114 @@
+<!--
+  ~ Licensed to the Apache Software Foundation (ASF) under one
+  ~ or more contributor license agreements.  See the NOTICE file
+  ~ distributed with this work for additional information
+  ~ regarding copyright ownership.  The ASF licenses this file
+  ~ to you under the Apache License, Version 2.0 (the
+  ~ "License"); you may not use this file except in compliance
+  ~ with the License.  You may obtain a copy of the License at
+  ~
+  ~   http://www.apache.org/licenses/LICENSE-2.0
+  ~
+  ~ Unless required by applicable law or agreed to in writing,
+  ~ software distributed under the License is distributed on an
+  ~ "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+  ~ KIND, either express or implied.  See the License for the
+  ~ specific language governing permissions and limitations
+  ~ under the License.
+-->
+
+# Development
+
+## Requirements
+
+- Python 3.9+
+- Rust 1.70+
+- [uv](https://docs.astral.sh/uv/) package manager
+- Linux or macOS
+
+> **Before you start:**
+> Please make sure you can successfully build and run the [Fluss Rust client](../../crates/fluss/README.md) on your machine.
+> The Python bindings require a working Fluss Rust backend and compatible environment.
+
+## Install Development Dependencies
+
+```bash
+cd bindings/python
+uv sync --all-extras
+```
+
+## Build Development Version
+
+```bash
+source .venv/bin/activate
+uv run maturin develop
+```
+
+## Build Release Version
+
+```bash
+uv run maturin build --release
+```
+
+## Code Formatting and Linting
+
+```bash
+uv run ruff format python/
+uv run ruff check python/
+```
+
+## Type Checking
+
+```bash
+uv run mypy python/
+```
+
+## Run Examples
+
+```bash
+uv run python example/example.py
+```
+
+## Build API Docs
+
+```bash
+uv run pdoc fluss
+```
+
+## Release
+
+```bash
+# Build wheel
+uv run maturin build --release
+
+# Publish to PyPI
+uv run maturin publish
+```
+
+## Project Structure
+
+```
+bindings/python/
+├── Cargo.toml             # Rust dependency configuration
+├── pyproject.toml         # Python project configuration
+├── README.md              # User guide
+├── DEVELOPMENT.md         # This file
+├── API_REFERENCE.md       # API reference
+├── src/                   # Rust source code (PyO3 bindings)
+│   ├── lib.rs
+│   ├── config.rs
+│   ├── connection.rs
+│   ├── admin.rs
+│   ├── table.rs
+│   └── error.rs
+├── fluss/                 # Python package
+│   ├── __init__.py
+│   ├── __init__.pyi       # Type stubs
+│   └── py.typed
+└── example/
+    └── example.py
+```
+
+## License
+
+Apache 2.0 License
diff --git a/fluss-rust/bindings/python/README.md b/fluss-rust/bindings/python/README.md
index b0970397f5..a31c990ad3 100644
--- a/fluss-rust/bindings/python/README.md
+++ b/fluss-rust/bindings/python/README.md
@@ -1,155 +1,453 @@
 <!--
-  ~ Licensed to the Apache Software Foundation (ASF) under one
-  ~ or more contributor license agreements.  See the NOTICE file
-  ~ distributed with this work for additional information
-  ~ regarding copyright ownership.  The ASF licenses this file
-  ~ to you under the Apache License, Version 2.0 (the
-  ~ "License"); you may not use this file except in compliance
-  ~ with the License.  You may obtain a copy of the License at
-  ~
-  ~   http://www.apache.org/licenses/LICENSE-2.0
-  ~
-  ~ Unless required by applicable law or agreed to in writing,
-  ~ software distributed under the License is distributed on an
-  ~ "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-  ~ KIND, either express or implied.  See the License for the
-  ~ specific language governing permissions and limitations
-  ~ under the License.
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
 -->
 
-# Apache Fluss™ Python Bindings
+# Fluss Python Client
 
-Python bindings for Fluss using PyO3 and Maturin.
+This guide covers how to use the Fluss Python client to read from and write to log tables and primary key tables.
 
-## API Overview
+The Python client is async-first, built on top of the Rust core via [PyO3](https://pyo3.rs/), and uses [PyArrow](https://arrow.apache.org/docs/python/) for schema definitions and data interchange.
 
-### Basic Usage
+## Key Concepts
 
-TODO: Add basic usage examples here
+- **Log table** — an append-only table (no primary key). Records are immutable once written. Use for event streams, logs, and audit trails.
+- **Primary key (PK) table** — a table with a primary key. Supports upsert, delete, and point lookups.
+- **Bucket** — the unit of parallelism within a table (similar to Kafka partitions). Each table has one or more buckets. Readers subscribe to individual buckets.
+- **Partition** — a way to organize data by column values (e.g. by date or region). Each partition contains its own set of buckets. Partitions must be created explicitly before writing.
+- **Offset** — the position of a record within a bucket. Used to track reading progress. Start from `EARLIEST_OFFSET` to read all data, or `LATEST_OFFSET` to only read new records.
 
-### Core Classes
+## Prerequisites
 
-#### `Config`
+You need a running Fluss cluster to use the Python client. See the [Quick-Start guide](../../README.md#quick-start) for how to start a local cluster.
 
-Configuration for Fluss connection parameters
+## Installation
 
-#### `FlussConnection`
+```bash
+pip install pyfluss
+```
 
-Main interface for connecting to Fluss cluster
+To build from source instead, see the [Development Guide](DEVELOPMENT.md).
+
+## Quick Start
+
+A minimal end-to-end example: connect, create a table, write data, and read it back. Assumes a Fluss cluster is running on `localhost:9123`.
+
+```python
+import asyncio
+import pyarrow as pa
+import fluss
+
+async def main():
+    # Connect
+    config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
+    conn = await fluss.FlussConnection.connect(config)
+    admin = await conn.get_admin()
+
+    # Create a log table
+    schema = fluss.Schema(pa.schema([
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("score", pa.float32()),
+    ]))
+    table_path = fluss.TablePath("fluss", "quick_start")
+    await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
+
+    # Write
+    table = await conn.get_table(table_path)
+    writer = await table.new_append_writer()
+    writer.append({"id": 1, "name": "Alice", "score": 95.5})
+    writer.append({"id": 2, "name": "Bob", "score": 87.0})
+    await writer.flush()
+
+    # Read
+    num_buckets = (await admin.get_table(table_path)).num_buckets
+    scanner = await table.new_scan().create_batch_scanner()
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+    print(scanner.to_pandas())
+
+    # Cleanup
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+    conn.close()
+
+asyncio.run(main())
+```
 
-#### `FlussAdmin`
+## Connection Setup
+
+```python
+config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
+conn = await fluss.FlussConnection.connect(config)
+```
 
-Administrative operations for managing tables (create, delete, etc.)
+The connection can also be used as a context manager:
 
-#### `FlussTable`
+```python
+with await fluss.FlussConnection.connect(config) as conn:
+    ...
+```
 
-Represents a Fluss table, providing read and write operations
+### Configuration Options
 
-#### `TableWriter`
+| Key | Description | Default |
+|-----|-------------|---------|
+| `bootstrap.servers` | Coordinator server address | `127.0.0.1:9123` |
+| `request.max.size` | Maximum request size in bytes | `10485760` (10 MB) |
+| `writer.acks` | Acknowledgment setting (`all` waits for all replicas) | `all` |
+| `writer.retries` | Number of retries on failure | `2147483647` |
+| `writer.batch.size` | Batch size for writes in bytes | `2097152` (2 MB) |
 
-Used for writing data to tables, supports PyArrow and Pandas
+## Admin Operations
 
-#### `LogScanner`
+```python
+admin = await conn.get_admin()
+```
 
-Used for scanning table log data
+### Databases
 
+```python
+await admin.create_database("my_database", ignore_if_exists=True)
+databases = await admin.list_databases()
+exists = await admin.database_exists("my_database")
+await admin.drop_database("my_database", ignore_if_not_exists=True, cascade=True)
+```
 
-# todo: we may move the following part to DEVELOPMENT.md
-## Development
+### Tables
 
-## Requirements
+Schemas are defined using PyArrow and wrapped in `fluss.Schema`:
 
-- Python 3.9+
-- Rust 1.70+
-- [uv](https://docs.astral.sh/uv/) package manager
-- Linux or MacOS
+```python
+import pyarrow as pa
 
-> **⚠️ Before you start:**  
-> Please make sure you can successfully build and run the [Fluss Rust client](../../crates/fluss/README.md) on your machine.  
-> The Python bindings require a working Fluss Rust backend and compatible environment.
+schema = fluss.Schema(pa.schema([
+    pa.field("id", pa.int32()),
+    pa.field("name", pa.string()),
+    pa.field("amount", pa.int64()),
+]))
 
-### Install Development Dependencies
+table_path = fluss.TablePath("my_database", "my_table")
+await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
 
-```bash
-cd bindings/python
-uv sync --all-extras
+table_info = await admin.get_table(table_path)
+tables = await admin.list_tables("my_database")
+await admin.drop_table(table_path, ignore_if_not_exists=True)
 ```
 
-### Build Development Version
+`TableDescriptor` accepts these optional parameters:
 
-```bash
-source .venv/bin/activate
-uv run maturin develop
+| Parameter | Description |
+|---|---|
+| `partition_keys` | Column names to partition by (e.g. `["region"]`) |
+| `bucket_count` | Number of buckets (parallelism units) for the table |
+| `bucket_keys` | Columns used to determine bucket assignment |
+| `comment` | Table comment / description |
+| `log_format` | Log storage format: `"ARROW"` or `"INDEXED"` |
+| `kv_format` | KV storage format for primary key tables: `"INDEXED"` or `"COMPACTED"` |
+| `properties` | Table configuration properties as a dict (e.g. `{"table.replication.factor": "1"}`) |
+| `custom_properties` | User-defined properties as a dict |
+
+### Offsets
+
+```python
+# Latest offsets for buckets
+offsets = await admin.list_offsets(table_path, bucket_ids=[0, 1], offset_type="latest")
+
+# By timestamp
+offsets = await admin.list_offsets(table_path, bucket_ids=[0], offset_type="timestamp", timestamp=1704067200000)
+
+# Per-partition offsets
+offsets = await admin.list_partition_offsets(table_path, partition_name="US", bucket_ids=[0], offset_type="latest")
 ```
 
-### Build Release Version
+## Log Tables
 
-```bash
-uv run maturin build --release
+Log tables are append-only tables without primary keys, suitable for event streaming.
+
+### Writing
+
+Rows can be appended as dicts, lists, or tuples. For bulk writes, use `write_arrow()`, `write_arrow_batch()`, or `write_pandas()`.
+
+Write methods like `append()` and `write_arrow_batch()` return a `WriteResultHandle`. You can ignore it for fire-and-forget semantics (flush at the end), or `await handle.wait()` to block until the server acknowledges that specific write.
+
+```python
+table = await conn.get_table(table_path)
+writer = await table.new_append_writer()
+
+# Fire-and-forget: queue writes, flush at the end
+writer.append({"id": 1, "name": "Alice", "score": 95.5})
+writer.append([2, "Bob", 87.0])
+await writer.flush()
+
+# Per-record acknowledgment
+handle = writer.append({"id": 3, "name": "Charlie", "score": 91.0})
+await handle.wait()
+
+# Bulk writes
+writer.write_arrow(pa_table)          # PyArrow Table
+writer.write_arrow_batch(record_batch) # PyArrow RecordBatch
+writer.write_pandas(df)                # Pandas DataFrame
+await writer.flush()
 ```
 
-### Code Formatting and Linting
+### Reading
 
-```bash
-uv run ruff format python/
-uv run ruff check python/
+There are two scanner types:
+- **Batch scanner** (`create_batch_scanner()`) — returns Arrow Tables or DataFrames, best for analytics
+- **Record scanner** (`create_log_scanner()`) — returns individual records with metadata (offset, timestamp, change type), best for streaming
+
+And two reading modes:
+- **`to_arrow()` / `to_pandas()`** — reads all data from subscribed buckets up to the current latest offset, then returns. Best for one-shot batch reads.
+- **`poll_arrow()` / `poll()` / `poll_batches()`** — returns whatever data is available within the timeout. Call in a loop for continuous streaming.
+
+#### Batch Read (One-Shot)
+
+```python
+num_buckets = (await admin.get_table(table_path)).num_buckets
+
+scanner = await table.new_scan().create_batch_scanner()
+scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+# Reads everything up to current latest offset, then returns
+arrow_table = scanner.to_arrow()
+df = scanner.to_pandas()
 ```
 
-### Type Checking
+#### Continuous Polling
 
-```bash
-uv run mypy python/
+Use `poll_arrow()` or `poll()` in a loop for streaming consumption (the two loops below are independent alternatives, not one script):
+
+```python
+# Batch scanner: poll as Arrow Tables
+scanner = await table.new_scan().create_batch_scanner()
+scanner.subscribe(bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
+
+while True:
+    result = scanner.poll_arrow(timeout_ms=5000)
+    if result.num_rows > 0:
+        print(result.to_pandas())
+
+# Record scanner: poll individual records with metadata
+scanner = await table.new_scan().create_log_scanner()
+scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+while True:
+    for record in scanner.poll(timeout_ms=5000):
+        print(f"offset={record.offset}, change={record.change_type.short_string()}, row={record.row}")
 ```
 
-### Run Examples
+#### Subscribe from Latest Offset
 
-```bash
-uv run python example/example.py
+To only consume new records (skip existing data), use `LATEST_OFFSET`:
+
+```python
+scanner = await table.new_scan().create_batch_scanner()
+scanner.subscribe(bucket_id=0, start_offset=fluss.LATEST_OFFSET)
 ```
 
-### Build API docs:
+### Column Projection
 
-```bash
-uv run pdoc fluss
+```python
+scanner = await table.new_scan().project([0, 2]).create_batch_scanner()
+# or by name
+scanner = await table.new_scan().project_by_name(["id", "score"]).create_batch_scanner()
 ```
 
-### Release
+## Primary Key Tables
 
-```bash
-# Build wheel
-uv run maturin build --release
+Primary key tables support upsert, delete, and point lookup operations.
 
-# Publish to PyPI
-uv run maturin publish
+### Creating
+
+Pass `primary_keys` to `fluss.Schema`:
+
+```python
+schema = fluss.Schema(
+    pa.schema([
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("age", pa.int64()),
+    ]),
+    primary_keys=["id"],
+)
+table_path = fluss.TablePath("fluss", "users")
+await admin.create_table(table_path, fluss.TableDescriptor(schema, bucket_count=3), ignore_if_exists=True)
 ```
 
-## Project Structure
+### Upsert, Delete, Lookup
+
+```python
+table = await conn.get_table(table_path)
+
+# Upsert (fire-and-forget, flush at the end)
+writer = table.new_upsert()
+writer.upsert({"id": 1, "name": "Alice", "age": 25})
+writer.upsert({"id": 2, "name": "Bob", "age": 30})
+await writer.flush()
+
+# Per-record acknowledgment (for read-after-write)
+handle = writer.upsert({"id": 3, "name": "Charlie", "age": 35})
+await handle.wait()
+
+# Delete by primary key
+handle = writer.delete({"id": 2})
+await handle.wait()
+
+# Lookup
+lookuper = table.new_lookup()
+result = await lookuper.lookup({"id": 1})
+if result:
+    print(f"Found: name={result['name']}, age={result['age']}")
 ```
-bindings/python/
-├── Cargo.toml            # Rust dependency configuration
-├── pyproject.toml        # Python project configuration
-├── README.md             # This file
-├── src/                  # Rust source code
-│   ├── lib.rs            # Main entry module
-│   ├── config.rs         # Configuration related
-│   ├── connection.rs     # Connection management
-│   ├── admin.rs          # Admin operations
-│   ├── table.rs          # Table operations
-│   ├── types.rs          # Data types
-│   └── error.rs          # Error handling
-├── fluss/                # Python package source
-│   ├── __init__.py       # Python package entry
-│   ├── __init__.pyi      # Stub file
-│   └── py.typed          # Type declarations
-└── example/              # Example code
-    └── example.py
+
+### Partial Updates
+
+Update specific columns while preserving others:
+
+```python
+partial_writer = table.new_upsert(columns=["id", "age"])
+partial_writer.upsert({"id": 1, "age": 27})  # only updates age
+await partial_writer.flush()
 ```
 
-## TODO
+## Partitioned Tables
+
+Partitioned tables distribute data across partitions based on column values. Partitions must be created before writing.
+
+### Creating and Managing Partitions
+
+```python
+schema = fluss.Schema(pa.schema([
+    pa.field("id", pa.int32()),
+    pa.field("region", pa.string()),
+    pa.field("value", pa.int64()),
+]))
+
+table_path = fluss.TablePath("fluss", "partitioned_events")
+await admin.create_table(
+    table_path,
+    fluss.TableDescriptor(schema, partition_keys=["region"], bucket_count=1),
+    ignore_if_exists=True,
+)
+
+# Create partitions
+await admin.create_partition(table_path, {"region": "US"}, ignore_if_exists=True)
+await admin.create_partition(table_path, {"region": "EU"}, ignore_if_exists=True)
+
+# List partitions
+partition_infos = await admin.list_partition_infos(table_path)
+```
+
+### Writing
+
+Same as non-partitioned tables — include partition column values in each row:
+
+```python
+table = await conn.get_table(table_path)
+writer = await table.new_append_writer()
+writer.append({"id": 1, "region": "US", "value": 100})
+writer.append({"id": 2, "region": "EU", "value": 200})
+await writer.flush()
+```
+
+### Reading
+
+Use `subscribe_partition()` or `subscribe_partition_buckets()` instead of `subscribe()`:
+
+```python
+scanner = await table.new_scan().create_batch_scanner()
+
+# Subscribe to individual partitions
+for p in partition_infos:
+    scanner.subscribe_partition(partition_id=p.partition_id, bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
+
+# Or batch-subscribe
+scanner.subscribe_partition_buckets({
+    (p.partition_id, 0): fluss.EARLIEST_OFFSET for p in partition_infos
+})
+
+print(scanner.to_pandas())
+```
+
+### Partitioned Primary Key Tables
+
+Partition columns must be part of the primary key. Partitions must be created before upserting.
+
+```python
+schema = fluss.Schema(
+    pa.schema([
+        pa.field("user_id", pa.int32()),
+        pa.field("region", pa.string()),
+        pa.field("score", pa.int64()),
+    ]),
+    primary_keys=["user_id", "region"],
+)
+
+table_path = fluss.TablePath("fluss", "partitioned_users")
+await admin.create_table(
+    table_path,
+    fluss.TableDescriptor(schema, partition_keys=["region"]),
+    ignore_if_exists=True,
+)
+
+await admin.create_partition(table_path, {"region": "US"}, ignore_if_exists=True)
+
+table = await conn.get_table(table_path)
+writer = table.new_upsert()
+writer.upsert({"user_id": 1, "region": "US", "score": 1234})
+await writer.flush()
+
+# Lookup includes partition columns
+lookuper = table.new_lookup()
+result = await lookuper.lookup({"user_id": 1, "region": "US"})
+```
+
+## Error Handling
+
+The client raises `fluss.FlussError` for Fluss-specific errors (connection failures, table not found, invalid operations, etc.):
+
+```python
+try:
+    await admin.create_table(table_path, table_descriptor)
+except fluss.FlussError as e:
+    print(f"Fluss error: {e.message}")
+```
+
+Common error scenarios:
+- **Connection refused** — Fluss cluster is not running or wrong address in `bootstrap.servers`
+- **Table not found** — table doesn't exist or wrong database/table name
+- **Partition not found** — writing to a partitioned table before creating partitions
+- **Schema mismatch** — row data doesn't match the table schema
+
+## Data Types
+
+The Python client uses PyArrow types for schema definitions:
 
-- [ ] Add basic usage examples in API Overview (code snippets for Config, FlussConnection, FlussAdmin, FlussTable).
-- [ ] Add a "Verifying a release" subsection with install-from-TestPyPI/PyPI and smoke-test steps.
+| PyArrow Type | Fluss Type | Python Type |
+|---|---|---|
+| `pa.boolean()` | Boolean | `bool` |
+| `pa.int8()` / `int16()` / `int32()` / `int64()` | TinyInt / SmallInt / Int / BigInt | `int` |
+| `pa.float32()` / `float64()` | Float / Double | `float` |
+| `pa.string()` | String | `str` |
+| `pa.binary()` | Bytes | `bytes` |
+| `pa.date32()` | Date | `datetime.date` |
+| `pa.time32("ms")` | Time | `datetime.time` |
+| `pa.timestamp("us")` | Timestamp (NTZ) | `datetime.datetime` |
+| `pa.timestamp("us", tz="UTC")` | TimestampLTZ | `datetime.datetime` |
+| `pa.decimal128(precision, scale)` | Decimal | `decimal.Decimal` |
 
-## License
+All Python native types (`date`, `time`, `datetime`, `Decimal`) work when appending rows via dicts.
 
-Apache 2.0 License
+For a complete list of classes, methods, and properties, see the [API Reference](API_REFERENCE.md).
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index cc7053e4e2..adbfc2fe02 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -610,7 +610,8 @@ class TableDescriptor:
         comment: Optional[str] = None,
         log_format: Optional[str] = None,
         kv_format: Optional[str] = None,
-        **properties: str,
+        properties: Optional[Dict[str, str]] = None,
+        custom_properties: Optional[Dict[str, str]] = None,
     ) -> None: ...
     def get_schema(self) -> Schema: ...
 

From f51691194ea3b14689fe37a30c27db2ccc33d8d5 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Tue, 10 Feb 2026 01:57:56 +0000
Subject: [PATCH 135/287] doc: Add documentation for rust (#242)

---
 fluss-rust/docs/rust-client.md | 748 +++++++++++++++++++++++++++++++++
 1 file changed, 748 insertions(+)
 create mode 100644 fluss-rust/docs/rust-client.md

diff --git a/fluss-rust/docs/rust-client.md b/fluss-rust/docs/rust-client.md
new file mode 100644
index 0000000000..779b974c28
--- /dev/null
+++ b/fluss-rust/docs/rust-client.md
@@ -0,0 +1,748 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# Fluss Rust Client Guide
+
+This guide covers how to use the Fluss Rust client for reading and writing data to log tables and primary key tables.
+
+## Adding to Your Project
+
+The Fluss Rust client is published to [crates.io](https://crates.io/crates/fluss-rs) as `fluss-rs`. The crate's library name is `fluss`, so you import it with `use fluss::...`.
+
+```toml
+[dependencies]
+fluss-rs = "0.1"
+tokio = { version = "1", features = ["full"] }
+```
+
+### Feature Flags
+
+The Fluss crate supports optional storage backends:
+
+```toml
+[dependencies]
+# Default: memory and filesystem storage
+fluss-rs = "0.1"
+
+# With S3 storage support
+fluss-rs = { version = "0.1", features = ["storage-s3"] }
+
+# With OSS storage support
+fluss-rs = { version = "0.1", features = ["storage-oss"] }
+
+# All storage backends
+fluss-rs = { version = "0.1", features = ["storage-all"] }
+```
+
+Available features:
+- `storage-memory` (default) - In-memory storage
+- `storage-fs` (default) - Local filesystem storage
+- `storage-s3` - Amazon S3 storage
+- `storage-oss` - Alibaba OSS storage
+- `storage-all` - All storage backends
+
+### Alternative: Git or Path Dependency
+
+For development against unreleased changes, you can depend on the Git repository or a local checkout:
+
+```toml
+[dependencies]
+# From Git
+fluss = { git = "https://github.com/apache/fluss-rust.git", package = "fluss-rs" }
+
+# From local path
+fluss = { path = "/path/to/fluss-rust/crates/fluss", package = "fluss-rs" }
+```
+
+> **Note:** When using `git` or `path` dependencies, the `package = "fluss-rs"` field is required so that Cargo resolves the correct package while still allowing `use fluss::...` imports.
+
+## Building from Source
+
+### Prerequisites
+
+- Rust 1.85+
+- Protobuf compiler (`protoc`) - only required when building from source (see [Install Dependencies](#2-install-dependencies) below)
+
+
+### 1. Clone the Repository
+
+```bash
+git clone https://github.com/apache/fluss-rust.git
+cd fluss-rust
+```
+
+### 2. Install Dependencies
+
+The Protobuf compiler (`protoc`) is required to build from source.
+
+#### macOS
+
+```bash
+brew install protobuf
+```
+
+#### Ubuntu/Debian
+
+```bash
+sudo apt-get install protobuf-compiler
+```
+
+### 3. Build the Library
+
+```bash
+cargo build --workspace --all-targets
+```
+
+## Connection Setup
+
+```rust
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+use fluss::error::Result;
+
+#[tokio::main]
+async fn main() -> Result<()> {
+    let mut config = Config::default();
+    config.bootstrap_server = "127.0.0.1:9123".to_string();
+
+    let conn = FlussConnection::new(config).await?;
+
+    // Use the connection...
+
+    Ok(())
+}
+```
+
+### Configuration Options
+
+| Option | Description | Default |
+|--------|-------------|---------|
+| `bootstrap_server` | Coordinator server address | `127.0.0.1:9123` |
+| `request_max_size` | Maximum request size in bytes | 10 MB |
+| `writer_acks` | Acknowledgment setting (`all` waits for all replicas) | `all` |
+| `writer_retries` | Number of retries on failure | `i32::MAX` |
+| `writer_batch_size` | Batch size for writes | 2 MB |
+
+## Admin Operations
+
+### Get Admin Interface
+
+```rust
+let admin = conn.get_admin().await?;
+```
+
+### Database Operations
+
+```rust
+// Create database
+admin.create_database("my_database", true, None).await?;
+
+// List all databases
+let databases = admin.list_databases().await?;
+println!("Databases: {:?}", databases);
+
+// Check if database exists
+let exists = admin.database_exists("my_database").await?;
+
+// Get database information
+let db_info = admin.get_database_info("my_database").await?;
+
+// Drop database
+admin.drop_database("my_database", true, false).await?;
+```
+
+### Table Operations
+
+```rust
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+
+// Define table schema
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .column("amount", DataTypes::bigint())
+            .build()?,
+    )
+    .build()?;
+
+let table_path = TablePath::new("my_database", "my_table");
+
+// Create table
+admin.create_table(&table_path, &table_descriptor, true).await?;
+
+// Get table information
+let table_info = admin.get_table(&table_path).await?;
+println!("Table: {}", table_info);
+
+// List tables in database
+let tables = admin.list_tables("my_database").await?;
+
+// Check if table exists
+let exists = admin.table_exists(&table_path).await?;
+
+// Drop table
+admin.drop_table(&table_path, true).await?;
+```
+
+### Partition Operations
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+// List all partitions
+let partitions = admin.list_partition_infos(&table_path).await?;
+
+// List partitions matching a spec
+let mut filter = HashMap::new();
+filter.insert("year", "2024");
+let spec = PartitionSpec::new(filter);
+let partitions = admin.list_partition_infos_with_spec(&table_path, Some(&spec)).await?;
+
+// Create partition
+admin.create_partition(&table_path, &spec, true).await?;
+
+// Drop partition
+admin.drop_partition(&table_path, &spec, true).await?;
+```
+
+### Offset Operations
+
+```rust
+use fluss::rpc::message::OffsetSpec;
+
+let bucket_ids = vec![0, 1, 2];
+
+// Get earliest offsets
+let earliest = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Earliest).await?;
+
+// Get latest offsets
+let latest = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Latest).await?;
+
+// Get offsets for a specific timestamp
+let timestamp_ms = 1704067200000; // 2024-01-01 00:00:00 UTC
+let offsets = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Timestamp(timestamp_ms)).await?;
+
+// Get offsets for a specific partition
+let partition_offsets = admin.list_partition_offsets(
+    &table_path,
+    "partition_name",
+    &bucket_ids,
+    OffsetSpec::Latest,
+).await?;
+```
+
+### Lake Snapshot
+
+```rust
+// Get latest lake snapshot for lakehouse integration
+let snapshot = admin.get_latest_lake_snapshot(&table_path).await?;
+println!("Snapshot ID: {}", snapshot.snapshot_id);
+```
+
+## Log Table Operations
+
+Log tables are append-only tables without primary keys, suitable for event streaming.
+
+### Creating a Log Table
+
+```rust
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("event_id", DataTypes::int())
+            .column("event_type", DataTypes::string())
+            .column("timestamp", DataTypes::bigint())
+            .build()?,
+    )
+    .build()?;
+
+let table_path = TablePath::new("fluss", "events");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+### Writing to Log Tables
+
+```rust
+use fluss::row::{GenericRow, InternalRow};
+
+let table = conn.get_table(&table_path).await?;
+let append_writer = table.new_append()?.create_writer()?;
+
+// Write a single row
+let mut row = GenericRow::new(3);
+row.set_field(0, 1);                    // event_id (int)
+row.set_field(1, "user_login");         // event_type (string)
+row.set_field(2, 1704067200000i64);     // timestamp (bigint)
+
+append_writer.append(&row)?;
+
+// Write multiple rows
+let mut row2 = GenericRow::new(3);
+row2.set_field(0, 2);
+row2.set_field(1, "page_view");
+row2.set_field(2, 1704067201000i64);
+
+append_writer.append(&row2)?;
+
+// Flush to ensure data is persisted
+append_writer.flush().await?;
+```
+
+Write operations (`append`, `upsert`, `delete`) use a **fire-and-forget** pattern for efficient batching. Each call queues the write and returns a `WriteResultFuture` immediately. Call `flush()` to ensure all queued writes are sent to the server.
+
+If you need per-record acknowledgment, you can await the returned future:
+
+```rust
+// Per-record acknowledgment (waits until the server confirms the write)
+append_writer.append(&row)?.await?;
+```
+
+### Reading from Log Tables
+
+```rust
+use std::time::Duration;
+
+let table = conn.get_table(&table_path).await?;
+let log_scanner = table.new_scan().create_log_scanner()?;
+
+// Subscribe to bucket 0 starting from offset 0
+log_scanner.subscribe(0, 0).await?;
+
+// Poll for records
+let records = log_scanner.poll(Duration::from_secs(10)).await?;
+
+for record in records {
+    let row = record.row();
+    println!(
+        "event_id={}, event_type={}, timestamp={} @ offset={}",
+        row.get_int(0),
+        row.get_string(1),
+        row.get_long(2),
+        record.offset()
+    );
+}
+```
+
+### Column Projection
+
+```rust
+// Project specific columns by index
+let scanner = table.new_scan().project(&[0, 2])?.create_log_scanner()?;
+
+// Or project by column names
+let scanner = table.new_scan().project_by_name(&["event_id", "timestamp"])?.create_log_scanner()?;
+```
+
+### Subscribe from Specific Offsets
+
+```rust
+use fluss::client::{EARLIEST_OFFSET, LATEST_OFFSET};
+
+// Subscribe from earliest available offset
+log_scanner.subscribe(0, EARLIEST_OFFSET).await?;
+
+// Subscribe from latest offset (only new records)
+log_scanner.subscribe(0, LATEST_OFFSET).await?;
+
+// Subscribe from a specific offset
+log_scanner.subscribe(0, 42).await?;
+
+// Subscribe to all buckets
+let num_buckets = table.get_table_info().get_num_buckets();
+for bucket_id in 0..num_buckets {
+    log_scanner.subscribe(bucket_id, 0).await?;
+}
+```
+
+### Subscribe to Multiple Buckets
+
+```rust
+use std::collections::HashMap;
+
+// Subscribe to multiple buckets at once with specific offsets
+let mut bucket_offsets = HashMap::new();
+bucket_offsets.insert(0, 0i64);    // bucket 0 from offset 0
+bucket_offsets.insert(1, 100i64);  // bucket 1 from offset 100
+log_scanner.subscribe_buckets(&bucket_offsets).await?;
+```
+
+### Unsubscribe from a Partition
+
+```rust
+// Unsubscribe from a specific partition bucket
+log_scanner.unsubscribe_partition(partition_id, bucket_id).await?;
+```
+
+## Partitioned Log Tables
+
+Partitioned tables distribute data across partitions based on partition column values, enabling efficient data organization and querying.
+
+### Creating a Partitioned Log Table
+
+```rust
+use fluss::metadata::{DataTypes, LogFormat, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("event_id", DataTypes::int())
+            .column("event_type", DataTypes::string())
+            .column("dt", DataTypes::string())       // partition column
+            .column("region", DataTypes::string())   // partition column
+            .build()?,
+    )
+    .partitioned_by(vec!["dt", "region"])  // Define partition columns
+    .log_format(LogFormat::ARROW)
+    .build()?;
+
+let table_path = TablePath::new("fluss", "partitioned_events");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+### Writing to Partitioned Log Tables
+
+Writing works the same as for non-partitioned tables. Include partition column values in each row:
+
+```rust
+let table = conn.get_table(&table_path).await?;
+let append_writer = table.new_append()?.create_writer()?;
+
+// Partition column values determine which partition the record goes to
+let mut row = GenericRow::new(4);
+row.set_field(0, 1);                  // event_id
+row.set_field(1, "user_login");       // event_type
+row.set_field(2, "2024-01-15");       // dt (partition column)
+row.set_field(3, "US");               // region (partition column)
+
+append_writer.append(&row)?;
+append_writer.flush().await?;
+```
+
+### Reading from Partitioned Log Tables
+
+For partitioned tables, use `subscribe_partition()` instead of `subscribe()`:
+
+```rust
+use std::time::Duration;
+
+let table = conn.get_table(&table_path).await?;
+let admin = conn.get_admin().await?;
+
+// Get partition information
+let partitions = admin.list_partition_infos(&table_path).await?;
+
+let log_scanner = table.new_scan().create_log_scanner()?;
+
+// Subscribe to each partition's buckets
+for partition_info in &partitions {
+    let partition_id = partition_info.get_partition_id();
+    let num_buckets = table.get_table_info().get_num_buckets();
+
+    for bucket_id in 0..num_buckets {
+        log_scanner.subscribe_partition(partition_id, bucket_id, 0).await?;
+    }
+}
+
+// Poll for records
+let records = log_scanner.poll(Duration::from_secs(10)).await?;
+for record in records {
+    println!("Record from partition: {:?}", record.row());
+}
+```
+
+You can also subscribe to multiple partition-buckets at once:
+
+```rust
+use std::collections::HashMap;
+
+let mut partition_bucket_offsets = HashMap::new();
+partition_bucket_offsets.insert((partition_id, 0), 0i64);  // partition, bucket 0, offset 0
+partition_bucket_offsets.insert((partition_id, 1), 0i64);  // partition, bucket 1, offset 0
+log_scanner.subscribe_partition_buckets(&partition_bucket_offsets).await?;
+```
+
+### Managing Partitions
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+// Create a partition
+let mut partition_values = HashMap::new();
+partition_values.insert("dt", "2024-01-15");
+partition_values.insert("region", "EMEA");
+let spec = PartitionSpec::new(partition_values);
+admin.create_partition(&table_path, &spec, true).await?;
+
+// List all partitions
+let partitions = admin.list_partition_infos(&table_path).await?;
+for partition in &partitions {
+    println!(
+        "Partition: id={}, name={}",
+        partition.get_partition_id(),
+        partition.get_partition_name()  // Format: "value1$value2"
+    );
+}
+
+// List partitions with filter (partial spec)
+let mut partial_values = HashMap::new();
+partial_values.insert("dt", "2024-01-15");
+let partial_spec = PartitionSpec::new(partial_values);
+let filtered = admin.list_partition_infos_with_spec(&table_path, Some(&partial_spec)).await?;
+
+// Drop a partition
+admin.drop_partition(&table_path, &spec, true).await?;
+```
+
+## Primary Key Table Operations
+
+Primary key tables (KV tables) support upsert, delete, and lookup operations.
+
+### Creating a Primary Key Table
+
+```rust
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .column("age", DataTypes::bigint())
+            .primary_key(vec!["id"])  // Define primary key
+            .build()?,
+    )
+    .build()?;
+
+let table_path = TablePath::new("fluss", "users");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+### Upserting Records
+
+```rust
+let table = conn.get_table(&table_path).await?;
+let table_upsert = table.new_upsert()?;
+let upsert_writer = table_upsert.create_writer()?;
+
+// Insert or update records
+for (id, name, age) in [(1, "Alice", 25i64), (2, "Bob", 30), (3, "Charlie", 35)] {
+    let mut row = GenericRow::new(3);
+    row.set_field(0, id);
+    row.set_field(1, name);
+    row.set_field(2, age);
+    upsert_writer.upsert(&row)?;
+}
+upsert_writer.flush().await?;
+```
+
+### Updating Records
+
+```rust
+// Update existing record (same primary key)
+let mut row = GenericRow::new(3);
+row.set_field(0, 1);        // id (primary key)
+row.set_field(1, "Alice");  // name
+row.set_field(2, 26i64);    // Updated age
+
+upsert_writer.upsert(&row)?;
+upsert_writer.flush().await?;
+```
+
+### Deleting Records
+
+```rust
+// Delete by primary key (only primary key field needs to be set)
+let mut row = GenericRow::new(3);
+row.set_field(0, 2);  // id of record to delete
+
+upsert_writer.delete(&row)?;
+upsert_writer.flush().await?;
+```
+
+### Partial Updates
+
+Update only specific columns while preserving others:
+
+```rust
+// By column indices
+let partial_upsert = table_upsert.partial_update(Some(vec![0, 2]))?;
+let partial_writer = partial_upsert.create_writer()?;
+
+let mut row = GenericRow::new(3);
+row.set_field(0, 1);       // id (primary key, required)
+row.set_field(2, 27i64);   // age (will be updated)
+// name will remain unchanged
+
+partial_writer.upsert(&row)?;
+partial_writer.flush().await?;
+
+// By column names
+let partial_upsert = table_upsert.partial_update_with_column_names(&["id", "age"])?;
+let partial_writer = partial_upsert.create_writer()?;
+```
+
+### Looking Up Records
+
+```rust
+let mut lookuper = table.new_lookup()?.create_lookuper()?;
+
+// Create a key row (only primary key fields)
+let mut key = GenericRow::new(1);
+key.set_field(0, 1);  // id to lookup
+
+let result = lookuper.lookup(&key).await?;
+
+if let Some(row) = result.get_single_row()? {
+    println!(
+        "Found: id={}, name={}, age={}",
+        row.get_int(0),
+        row.get_string(1),
+        row.get_long(2)
+    );
+} else {
+    println!("Record not found");
+}
+```
+
+## Partitioned Primary Key Tables
+
+Partitioned KV tables combine partitioning with primary key operations. Partition columns must be part of the primary key.
+
+### Creating a Partitioned Primary Key Table
+
+```rust
+use fluss::metadata::{DataTypes, KvFormat, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("user_id", DataTypes::int())
+            .column("region", DataTypes::string())   // partition column
+            .column("zone", DataTypes::bigint())     // partition column
+            .column("score", DataTypes::bigint())
+            // Primary key must include partition columns
+            .primary_key(vec!["user_id", "region", "zone"])
+            .build()?,
+    )
+    .partitioned_by(vec!["region", "zone"])  // Define partition columns
+    .kv_format(KvFormat::COMPACTED)
+    .build()?;
+
+let table_path = TablePath::new("fluss", "partitioned_users");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+### Writing to Partitioned Primary Key Tables
+
+Upsert and delete operations work the same as for non-partitioned KV tables. **Partitions must be created before upserting data.**
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+let table = conn.get_table(&table_path).await?;
+
+// Ensure partitions exist before upserting
+for (region, zone) in [("APAC", "1"), ("EMEA", "2"), ("US", "3")] {
+    let mut partition_values = HashMap::new();
+    partition_values.insert("region", region);
+    partition_values.insert("zone", zone);
+    let spec = PartitionSpec::new(partition_values);
+    admin.create_partition(&table_path, &spec, true).await?;
+}
+
+let table_upsert = table.new_upsert()?;
+let upsert_writer = table_upsert.create_writer()?;
+
+// Upsert records - partition is determined by partition column values
+for (user_id, region, zone, score) in [
+    (1001, "APAC", 1i64, 1234i64),
+    (1002, "EMEA", 2, 2234),
+    (1003, "US", 3, 3234),
+] {
+    let mut row = GenericRow::new(4);
+    row.set_field(0, user_id);
+    row.set_field(1, region);
+    row.set_field(2, zone);
+    row.set_field(3, score);
+    upsert_writer.upsert(&row)?;
+}
+upsert_writer.flush().await?;
+
+// Update a record
+let mut row = GenericRow::new(4);
+row.set_field(0, 1001);
+row.set_field(1, "APAC");
+row.set_field(2, 1i64);
+row.set_field(3, 5000i64);  // Updated score
+upsert_writer.upsert(&row)?;
+upsert_writer.flush().await?;
+
+// Delete a record (primary key includes partition columns)
+let mut row = GenericRow::new(4);
+row.set_field(0, 1002);
+row.set_field(1, "EMEA");
+row.set_field(2, 2i64);
+upsert_writer.delete(&row)?;
+upsert_writer.flush().await?;
+```
+
+### Looking Up Records in Partitioned Tables
+
+Lookup requires all primary key columns, including partition columns:
+
+```rust
+let mut lookuper = table.new_lookup()?.create_lookuper()?;
+
+// Key must include all primary key columns (including partition columns)
+let mut key = GenericRow::new(3);
+key.set_field(0, 1001);    // user_id
+key.set_field(1, "APAC");  // region (partition column)
+key.set_field(2, 1i64);    // zone (partition column)
+
+let result = lookuper.lookup(&key).await?;
+if let Some(row) = result.get_single_row()? {
+    println!("Found: score={}", row.get_long(3));
+}
+```
+
+> **Note:** Scanning partitioned primary key tables is not supported. Use lookup operations instead.
+
+## Data Types
+
+| Fluss Type      | Rust Type      | Method                                                              |
+|-----------------|----------------|---------------------------------------------------------------------|
+| `BOOLEAN`       | `bool`         | `get_boolean()`, `set_field(idx, bool)`                             |
+| `TINYINT`       | `i8`           | `get_byte()`, `set_field(idx, i8)`                                  |
+| `SMALLINT`      | `i16`          | `get_short()`, `set_field(idx, i16)`                                |
+| `INT`           | `i32`          | `get_int()`, `set_field(idx, i32)`                                  |
+| `BIGINT`        | `i64`          | `get_long()`, `set_field(idx, i64)`                                 |
+| `FLOAT`         | `f32`          | `get_float()`, `set_field(idx, f32)`                                |
+| `DOUBLE`        | `f64`          | `get_double()`, `set_field(idx, f64)`                               |
+| `CHAR`          | `&str`         | `get_char(idx, length)`, `set_field(idx, &str)`                     |
+| `STRING`        | `&str`         | `get_string()`, `set_field(idx, &str)`                              |
+| `DECIMAL`       | `Decimal`      | `get_decimal(idx, precision, scale)`, `set_field(idx, Decimal)`     |
+| `DATE`          | `Date`         | `get_date()`, `set_field(idx, Date)`                                |
+| `TIME`          | `Time`         | `get_time()`, `set_field(idx, Time)`                                |
+| `TIMESTAMP`     | `TimestampNtz` | `get_timestamp_ntz(idx, precision)`, `set_field(idx, TimestampNtz)` |
+| `TIMESTAMP_LTZ` | `TimestampLtz` | `get_timestamp_ltz(idx, precision)`, `set_field(idx, TimestampLtz)` |
+| `BYTES`         | `&[u8]`        | `get_bytes()`, `set_field(idx, &[u8])`                              |
+| `BINARY(n)`     | `&[u8]`        | `get_binary(idx, length)`, `set_field(idx, &[u8])`                  |
+

From 9c0776919149fdc481445ff148cad4670cfeb7de Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Tue, 10 Feb 2026 11:43:37 +0000
Subject: [PATCH 136/287] feat: support projection by names in CPP (#294)

---
 fluss-rust/bindings/cpp/examples/example.cpp | 44 ++++++++++++++++--
 fluss-rust/bindings/cpp/include/fluss.hpp    |  6 ++-
 fluss-rust/bindings/cpp/src/table.cpp        | 48 ++++++++++++++++----
 3 files changed, 84 insertions(+), 14 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index f568422e6b..47087e5436 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -192,12 +192,12 @@ int main() {
         std::exit(1);
     }
 
-    // 7) Projected scan — project [id, updated_at(TimestampLtz)] to verify
-    //    NTZ/LTZ disambiguation works with column index remapping
+    // 7a) Projected scan by index — project [id, updated_at(TimestampLtz)] to verify
+    //     NTZ/LTZ disambiguation works with column index remapping
     std::vector<size_t> projected_columns = {0, 7};
     fluss::LogScanner projected_scanner;
     check("new_log_scanner_with_projection",
-          table.NewScan().Project(projected_columns).CreateLogScanner(projected_scanner));
+          table.NewScan().ProjectByIndex(projected_columns).CreateLogScanner(projected_scanner));
 
     for (int b = 0; b < buckets; ++b) {
         check("subscribe_projected", projected_scanner.Subscribe(b, 0));
@@ -229,6 +229,42 @@ int main() {
                   << ts.nano_of_millisecond << "ns" << std::endl;
     }
 
+    // 7b) Projected scan by column names — same columns as above but using names
+    fluss::LogScanner name_projected_scanner;
+    check("project_by_name_scanner", table.NewScan()
+                                         .ProjectByName({"id", "updated_at"})
+                                         .CreateLogScanner(name_projected_scanner));
+
+    for (int b = 0; b < buckets; ++b) {
+        check("subscribe_name_projected", name_projected_scanner.Subscribe(b, 0));
+    }
+
+    fluss::ScanRecords name_projected_records;
+    check("poll_name_projected", name_projected_scanner.Poll(5000, name_projected_records));
+
+    std::cout << "Name-projected records: " << name_projected_records.Size() << std::endl;
+    for (const auto& rec : name_projected_records.records) {
+        if (rec.row.FieldCount() != 2) {
+            std::cerr << "ERROR: expected 2 fields, got " << rec.row.FieldCount() << std::endl;
+            scan_ok = false;
+            continue;
+        }
+        if (rec.row.GetType(0) != fluss::DatumType::Int32) {
+            std::cerr << "ERROR: name-projected field 0 expected Int32, got "
+                      << static_cast<int>(rec.row.GetType(0)) << std::endl;
+            scan_ok = false;
+        }
+        if (rec.row.GetType(1) != fluss::DatumType::TimestampLtz) {
+            std::cerr << "ERROR: name-projected field 1 expected TimestampLtz, got "
+                      << static_cast<int>(rec.row.GetType(1)) << std::endl;
+            scan_ok = false;
+        }
+
+        auto ts = rec.row.GetTimestamp(1);
+        std::cout << "  id=" << rec.row.GetInt32(0) << " updated_at=" << ts.epoch_millis << "+"
+                  << ts.nano_of_millisecond << "ns" << std::endl;
+    }
+
     if (scan_ok) {
         std::cout << "Scan verification passed!" << std::endl;
     } else {
@@ -336,7 +372,7 @@ int main() {
     fluss::LogScanner projected_arrow_scanner;
     check("new_record_batch_log_scanner_with_projection",
           table.NewScan()
-              .Project(projected_columns)
+              .ProjectByIndex(projected_columns)
               .CreateRecordBatchScanner(projected_arrow_scanner));
 
     for (int b = 0; b < buckets; ++b) {
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index c635c81adf..41aae670bb 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -939,7 +939,8 @@ class TableScan {
     TableScan(TableScan&&) noexcept = default;
     TableScan& operator=(TableScan&&) noexcept = default;
 
-    TableScan& Project(std::vector<size_t> column_indices);
+    TableScan& ProjectByIndex(std::vector<size_t> column_indices);
+    TableScan& ProjectByName(std::vector<std::string> column_names);
 
     Result CreateLogScanner(LogScanner& out);
     Result CreateRecordBatchScanner(LogScanner& out);
@@ -948,8 +949,11 @@ class TableScan {
     friend class Table;
     explicit TableScan(ffi::Table* table) noexcept;
 
+    std::vector<size_t> ResolveNameProjection() const;
+
     ffi::Table* table_{nullptr};
     std::vector<size_t> projection_;
+    std::vector<std::string> name_projection_;
 };
 
 class WriteResult {
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index 5b2f66c805..a266363079 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -129,25 +129,54 @@ TableScan Table::NewScan() { return TableScan(table_); }
 // TableScan implementation
 TableScan::TableScan(ffi::Table* table) noexcept : table_(table) {}
 
-TableScan& TableScan::Project(std::vector<size_t> column_indices) {
+TableScan& TableScan::ProjectByIndex(std::vector<size_t> column_indices) {
     projection_ = std::move(column_indices);
+    name_projection_.clear();
     return *this;
 }
 
+TableScan& TableScan::ProjectByName(std::vector<std::string> column_names) {
+    name_projection_ = std::move(column_names);
+    projection_.clear();
+    return *this;
+}
+
+std::vector<size_t> TableScan::ResolveNameProjection() const {
+    auto ffi_info = table_->get_table_info_from_table();
+    const auto& columns = ffi_info.schema.columns;
+
+    std::vector<size_t> indices;
+    for (const auto& name : name_projection_) {
+        bool found = false;
+        for (size_t i = 0; i < columns.size(); ++i) {
+            if (std::string(columns[i].name) == name) {
+                indices.push_back(i);
+                found = true;
+                break;
+            }
+        }
+        if (!found) {
+            throw std::runtime_error("Column '" + name + "' not found");
+        }
+    }
+    return indices;
+}
+
 Result TableScan::CreateLogScanner(LogScanner& out) {
     if (table_ == nullptr) {
         return utils::make_error(1, "Table not available");
     }
 
     try {
-        if (projection_.empty()) {
-            out.scanner_ = table_->new_log_scanner();
-        } else {
+        auto resolved_indices = !name_projection_.empty() ? ResolveNameProjection() : projection_;
+        if (!resolved_indices.empty()) {
             rust::Vec<size_t> rust_indices;
-            for (size_t idx : projection_) {
+            for (size_t idx : resolved_indices) {
                 rust_indices.push_back(idx);
             }
             out.scanner_ = table_->new_log_scanner_with_projection(std::move(rust_indices));
+        } else {
+            out.scanner_ = table_->new_log_scanner();
         }
         return utils::make_ok();
     } catch (const rust::Error& e) {
@@ -163,15 +192,16 @@ Result TableScan::CreateRecordBatchScanner(LogScanner& out) {
     }
 
     try {
-        if (projection_.empty()) {
-            out.scanner_ = table_->new_record_batch_log_scanner();
-        } else {
+        auto resolved_indices = !name_projection_.empty() ? ResolveNameProjection() : projection_;
+        if (!resolved_indices.empty()) {
             rust::Vec<size_t> rust_indices;
-            for (size_t idx : projection_) {
+            for (size_t idx : resolved_indices) {
                 rust_indices.push_back(idx);
             }
             out.scanner_ =
                 table_->new_record_batch_log_scanner_with_projection(std::move(rust_indices));
+        } else {
+            out.scanner_ = table_->new_record_batch_log_scanner();
         }
         return utils::make_ok();
     } catch (const rust::Error& e) {

From de88bbf7e2a7c290a5f7e1d985b45b11cf45bd82 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Wed, 11 Feb 2026 04:03:10 +0000
Subject: [PATCH 137/287] chore: Builder pattern, cleanup, consistent API
 (#296)

---
 fluss-rust/bindings/cpp/examples/example.cpp  |   6 +-
 .../bindings/cpp/examples/kv_example.cpp      | 109 +++----
 fluss-rust/bindings/cpp/include/fluss.hpp     |  72 ++++-
 fluss-rust/bindings/cpp/src/admin.cpp         |  49 ++-
 fluss-rust/bindings/cpp/src/connection.cpp    |   6 +-
 fluss-rust/bindings/cpp/src/lib.rs            | 295 +++++-------------
 fluss-rust/bindings/cpp/src/table.cpp         | 190 +++++------
 7 files changed, 328 insertions(+), 399 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 47087e5436..59f1ed03dc 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -79,7 +79,7 @@ int main() {
 
     // 5) Write rows with scalar and temporal values
     fluss::AppendWriter writer;
-    check("new_append_writer", table.NewAppendWriter(writer));
+    check("new_append_writer", table.NewAppend().CreateWriter(writer));
 
     struct RowData {
         int id;
@@ -423,7 +423,7 @@ int main() {
     check("get_decimal_table", conn.GetTable(decimal_table_path, decimal_table));
 
     fluss::AppendWriter decimal_writer;
-    check("new_decimal_writer", decimal_table.NewAppendWriter(decimal_writer));
+    check("new_decimal_writer", decimal_table.NewAppend().CreateWriter(decimal_writer));
 
     // Just provide the value — Rust resolves (p,s) from schema
     {
@@ -512,7 +512,7 @@ int main() {
     check("get_partitioned_table", conn.GetTable(partitioned_table_path, partitioned_table));
 
     fluss::AppendWriter partitioned_writer;
-    check("new_partitioned_writer", partitioned_table.NewAppendWriter(partitioned_writer));
+    check("new_partitioned_writer", partitioned_table.NewAppend().CreateWriter(partitioned_writer));
 
     struct PartitionedRow {
         int id;
diff --git a/fluss-rust/bindings/cpp/examples/kv_example.cpp b/fluss-rust/bindings/cpp/examples/kv_example.cpp
index daebfb2655..2a40db3ec5 100644
--- a/fluss-rust/bindings/cpp/examples/kv_example.cpp
+++ b/fluss-rust/bindings/cpp/examples/kv_example.cpp
@@ -76,7 +76,7 @@ int main() {
     //    - Set("last_seen", ts) auto-routes to SetTimestampLtz (schema-aware)
     std::cout << "\n--- Upsert Rows ---" << std::endl;
     fluss::UpsertWriter upsert_writer;
-    check("new_upsert_writer", kv_table.NewUpsertWriter(upsert_writer));
+    check("new_upsert_writer", kv_table.NewUpsert().CreateWriter(upsert_writer));
 
     // Fire-and-forget upserts
     {
@@ -130,7 +130,7 @@ int main() {
     // 4) Lookup by primary key — verify all types round-trip
     std::cout << "\n--- Lookup by Primary Key ---" << std::endl;
     fluss::Lookuper lookuper;
-    check("new_lookuper", kv_table.NewLookuper(lookuper));
+    check("new_lookuper", kv_table.NewLookup().CreateLookuper(lookuper));
 
     // Lookup existing key
     {
@@ -242,9 +242,9 @@ int main() {
     // 7) Partial update by column names
     std::cout << "\n--- Partial Update by Column Names ---" << std::endl;
     fluss::UpsertWriter partial_writer;
-    check("new_partial_upsert_writer",
-          kv_table.NewUpsertWriter(partial_writer,
-                                   std::vector<std::string>{"user_id", "balance", "last_seen"}));
+    check("new_partial_upsert_writer", kv_table.NewUpsert()
+                                           .PartialUpdateByName({"user_id", "balance", "last_seen"})
+                                           .CreateWriter(partial_writer));
 
     {
         auto row = kv_table.NewRow();
@@ -282,7 +282,7 @@ int main() {
     fluss::UpsertWriter partial_writer_idx;
     // Columns: 0=user_id (PK), 1=name — update name only
     check("new_partial_upsert_writer_idx",
-          kv_table.NewUpsertWriter(partial_writer_idx, std::vector<size_t>{0, 1}));
+          kv_table.NewUpsert().PartialUpdateByIndex({0, 1}).CreateWriter(partial_writer_idx));
 
     {
         // Index-based setters: lighter than name-based, useful for hot paths
@@ -321,37 +321,39 @@ int main() {
 
     // 9) Partitioned KV table
     std::cout << "\n--- Partitioned KV Table ---" << std::endl;
-    fluss::TablePath part_kv_path("fluss", "partitioned_kv_cpp_v1");
-    admin.DropTable(part_kv_path, true);
-
-    auto part_kv_schema = fluss::Schema::NewBuilder()
-                              .AddColumn("region", fluss::DataType::String())
-                              .AddColumn("user_id", fluss::DataType::Int())
-                              .AddColumn("name", fluss::DataType::String())
-                              .AddColumn("score", fluss::DataType::BigInt())
-                              .SetPrimaryKeys({"region", "user_id"})
-                              .Build();
-
-    auto part_kv_descriptor = fluss::TableDescriptor::NewBuilder()
-                                  .SetSchema(part_kv_schema)
-                                  .SetPartitionKeys({"region"})
-                                  .SetComment("partitioned kv table example")
-                                  .Build();
-
-    check("create_part_kv", admin.CreateTable(part_kv_path, part_kv_descriptor, false));
+    fluss::TablePath partitioned_kv_path("fluss", "partitioned_kv_cpp_v1");
+    admin.DropTable(partitioned_kv_path, true);
+
+    auto partitioned_kv_schema = fluss::Schema::NewBuilder()
+                                     .AddColumn("region", fluss::DataType::String())
+                                     .AddColumn("user_id", fluss::DataType::Int())
+                                     .AddColumn("name", fluss::DataType::String())
+                                     .AddColumn("score", fluss::DataType::BigInt())
+                                     .SetPrimaryKeys({"region", "user_id"})
+                                     .Build();
+
+    auto partitioned_kv_descriptor = fluss::TableDescriptor::NewBuilder()
+                                         .SetSchema(partitioned_kv_schema)
+                                         .SetPartitionKeys({"region"})
+                                         .SetComment("partitioned kv table example")
+                                         .Build();
+
+    check("create_partitioned_kv",
+          admin.CreateTable(partitioned_kv_path, partitioned_kv_descriptor, false));
     std::cout << "Created partitioned KV table" << std::endl;
 
     // Create partitions
-    check("create_US", admin.CreatePartition(part_kv_path, {{"region", "US"}}));
-    check("create_EU", admin.CreatePartition(part_kv_path, {{"region", "EU"}}));
-    check("create_APAC", admin.CreatePartition(part_kv_path, {{"region", "APAC"}}));
+    check("create_US", admin.CreatePartition(partitioned_kv_path, {{"region", "US"}}));
+    check("create_EU", admin.CreatePartition(partitioned_kv_path, {{"region", "EU"}}));
+    check("create_APAC", admin.CreatePartition(partitioned_kv_path, {{"region", "APAC"}}));
     std::cout << "Created partitions: US, EU, APAC" << std::endl;
 
-    fluss::Table part_kv_table;
-    check("get_part_kv_table", conn.GetTable(part_kv_path, part_kv_table));
+    fluss::Table partitioned_kv_table;
+    check("get_partitioned_kv_table", conn.GetTable(partitioned_kv_path, partitioned_kv_table));
 
-    fluss::UpsertWriter part_writer;
-    check("new_part_writer", part_kv_table.NewUpsertWriter(part_writer));
+    fluss::UpsertWriter partitioned_writer;
+    check("new_partitioned_writer",
+          partitioned_kv_table.NewUpsert().CreateWriter(partitioned_writer));
 
     // Upsert rows across partitions
     struct TestRow {
@@ -366,28 +368,29 @@ int main() {
     };
 
     for (const auto& td : test_data) {
-        auto row = part_kv_table.NewRow();
+        auto row = partitioned_kv_table.NewRow();
         row.Set("region", td.region);
         row.Set("user_id", td.user_id);
         row.Set("name", td.name);
         row.Set("score", td.score);
-        check("part_upsert", part_writer.Upsert(row));
+        check("partitioned_upsert", partitioned_writer.Upsert(row));
     }
-    check("part_flush", part_writer.Flush());
+    check("partitioned_flush", partitioned_writer.Flush());
     std::cout << "Upserted 5 rows across 3 partitions" << std::endl;
 
     // Lookup all rows
-    fluss::Lookuper part_lookuper;
-    check("new_part_lookuper", part_kv_table.NewLookuper(part_lookuper));
+    fluss::Lookuper partitioned_lookuper;
+    check("new_partitioned_lookuper",
+          partitioned_kv_table.NewLookup().CreateLookuper(partitioned_lookuper));
 
     for (const auto& td : test_data) {
-        auto pk = part_kv_table.NewRow();
+        auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", td.region);
         pk.Set("user_id", td.user_id);
 
         bool found = false;
         fluss::GenericRow result;
-        check("part_lookup", part_lookuper.Lookup(pk, found, result));
+        check("partitioned_lookup", partitioned_lookuper.Lookup(pk, found, result));
         if (!found) {
             std::cerr << "ERROR: Expected to find region=" << td.region << " user_id=" << td.user_id
                       << std::endl;
@@ -403,22 +406,22 @@ int main() {
 
     // Update within a partition
     {
-        auto row = part_kv_table.NewRow();
+        auto row = partitioned_kv_table.NewRow();
         row.Set("region", "US");
         row.Set("user_id", 1);
         row.Set("name", "Gustave Updated");
         row.Set("score", static_cast<int64_t>(999));
         fluss::WriteResult wr;
-        check("part_update", part_writer.Upsert(row, wr));
-        check("part_update_wait", wr.Wait());
+        check("partitioned_update", partitioned_writer.Upsert(row, wr));
+        check("partitioned_update_wait", wr.Wait());
     }
     {
-        auto pk = part_kv_table.NewRow();
+        auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", "US");
         pk.Set("user_id", 1);
         bool found = false;
         fluss::GenericRow result;
-        check("part_lookup_updated", part_lookuper.Lookup(pk, found, result));
+        check("partitioned_lookup_updated", partitioned_lookuper.Lookup(pk, found, result));
         if (!found || result.GetString(2) != "Gustave Updated" || result.GetInt64(3) != 999) {
             std::cerr << "ERROR: Partition update verification failed" << std::endl;
             std::exit(1);
@@ -429,12 +432,12 @@ int main() {
 
     // Lookup in non-existent partition
     {
-        auto pk = part_kv_table.NewRow();
+        auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", "UNKNOWN");
         pk.Set("user_id", 1);
         bool found = false;
         fluss::GenericRow result;
-        check("part_lookup_unknown", part_lookuper.Lookup(pk, found, result));
+        check("partitioned_lookup_unknown", partitioned_lookuper.Lookup(pk, found, result));
         if (found) {
             std::cerr << "ERROR: Expected UNKNOWN partition lookup to return not found"
                       << std::endl;
@@ -445,20 +448,20 @@ int main() {
 
     // Delete within a partition
     {
-        auto pk = part_kv_table.NewRow();
+        auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", "EU");
         pk.Set("user_id", 1);
         fluss::WriteResult wr;
-        check("part_delete", part_writer.Delete(pk, wr));
-        check("part_delete_wait", wr.Wait());
+        check("partitioned_delete", partitioned_writer.Delete(pk, wr));
+        check("partitioned_delete_wait", wr.Wait());
     }
     {
-        auto pk = part_kv_table.NewRow();
+        auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", "EU");
         pk.Set("user_id", 1);
         bool found = false;
         fluss::GenericRow result;
-        check("part_lookup_deleted", part_lookuper.Lookup(pk, found, result));
+        check("partitioned_lookup_deleted", partitioned_lookuper.Lookup(pk, found, result));
         if (found) {
             std::cerr << "ERROR: Expected EU/1 to be deleted" << std::endl;
             std::exit(1);
@@ -468,12 +471,12 @@ int main() {
 
     // Verify other record in same partition still exists
     {
-        auto pk = part_kv_table.NewRow();
+        auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", "EU");
         pk.Set("user_id", 2);
         bool found = false;
         fluss::GenericRow result;
-        check("part_lookup_eu2", part_lookuper.Lookup(pk, found, result));
+        check("partitioned_lookup_eu2", partitioned_lookuper.Lookup(pk, found, result));
         if (!found || result.GetString(2) != "Maelle") {
             std::cerr << "ERROR: Expected EU/2 (Maelle) to still exist" << std::endl;
             std::exit(1);
@@ -481,7 +484,7 @@ int main() {
         std::cout << "EU/2 still exists: name=" << result.GetString(2) << std::endl;
     }
 
-    check("drop_part_kv", admin.DropTable(part_kv_path, true));
+    check("drop_partitioned_kv", admin.DropTable(partitioned_kv_path, true));
     std::cout << "\nKV table example completed successfully!" << std::endl;
 
     return 0;
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 41aae670bb..1806616906 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -804,6 +804,9 @@ class WriteResult;
 class LogScanner;
 class Admin;
 class Table;
+class TableAppend;
+class TableUpsert;
+class TableLookup;
 class TableScan;
 
 class Connection {
@@ -909,11 +912,9 @@ class Table {
 
     GenericRow NewRow() const;
 
-    Result NewAppendWriter(AppendWriter& out);
-    Result NewUpsertWriter(UpsertWriter& out);
-    Result NewUpsertWriter(UpsertWriter& out, const std::vector<std::string>& column_names);
-    Result NewUpsertWriter(UpsertWriter& out, const std::vector<size_t>& column_indices);
-    Result NewLookuper(Lookuper& out);
+    TableAppend NewAppend();
+    TableUpsert NewUpsert();
+    TableLookup NewLookup();
     TableScan NewScan();
 
     TableInfo GetTableInfo() const;
@@ -922,6 +923,9 @@ class Table {
 
    private:
     friend class Connection;
+    friend class TableAppend;
+    friend class TableUpsert;
+    friend class TableLookup;
     friend class TableScan;
     Table(ffi::Table* table) noexcept;
 
@@ -932,6 +936,61 @@ class Table {
     mutable std::shared_ptr<GenericRow::ColumnMap> column_map_;
 };
 
+class TableAppend {
+   public:
+    TableAppend(const TableAppend&) = delete;
+    TableAppend& operator=(const TableAppend&) = delete;
+    TableAppend(TableAppend&&) noexcept = default;
+    TableAppend& operator=(TableAppend&&) noexcept = default;
+
+    Result CreateWriter(AppendWriter& out);
+
+   private:
+    friend class Table;
+    explicit TableAppend(ffi::Table* table) noexcept;
+
+    ffi::Table* table_{nullptr};
+};
+
+class TableUpsert {
+   public:
+    TableUpsert(const TableUpsert&) = delete;
+    TableUpsert& operator=(const TableUpsert&) = delete;
+    TableUpsert(TableUpsert&&) noexcept = default;
+    TableUpsert& operator=(TableUpsert&&) noexcept = default;
+
+    TableUpsert& PartialUpdateByIndex(std::vector<size_t> column_indices);
+    TableUpsert& PartialUpdateByName(std::vector<std::string> column_names);
+
+    Result CreateWriter(UpsertWriter& out);
+
+   private:
+    friend class Table;
+    explicit TableUpsert(ffi::Table* table) noexcept;
+
+    std::vector<size_t> ResolveNameProjection() const;
+
+    ffi::Table* table_{nullptr};
+    std::vector<size_t> column_indices_;
+    std::vector<std::string> column_names_;
+};
+
+class TableLookup {
+   public:
+    TableLookup(const TableLookup&) = delete;
+    TableLookup& operator=(const TableLookup&) = delete;
+    TableLookup(TableLookup&&) noexcept = default;
+    TableLookup& operator=(TableLookup&&) noexcept = default;
+
+    Result CreateLookuper(Lookuper& out);
+
+   private:
+    friend class Table;
+    explicit TableLookup(ffi::Table* table) noexcept;
+
+    ffi::Table* table_{nullptr};
+};
+
 class TableScan {
    public:
     TableScan(const TableScan&) = delete;
@@ -999,6 +1058,7 @@ class AppendWriter {
 
    private:
     friend class Table;
+    friend class TableAppend;
     AppendWriter(ffi::AppendWriter* writer) noexcept;
 
     void Destroy() noexcept;
@@ -1025,6 +1085,7 @@ class UpsertWriter {
 
    private:
     friend class Table;
+    friend class TableUpsert;
     UpsertWriter(ffi::UpsertWriter* writer) noexcept;
     void Destroy() noexcept;
     ffi::UpsertWriter* writer_{nullptr};
@@ -1046,6 +1107,7 @@ class Lookuper {
 
    private:
     friend class Table;
+    friend class TableLookup;
     Lookuper(ffi::Lookuper* lookuper) noexcept;
     void Destroy() noexcept;
     ffi::Lookuper* lookuper_{nullptr};
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index 77c95d317c..7925256ef5 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -17,9 +17,9 @@
  * under the License.
  */
 
+#include "ffi_converter.hpp"
 #include "fluss.hpp"
 #include "lib.rs.h"
-#include "ffi_converter.hpp"
 #include "rust/cxx.h"
 
 namespace fluss {
@@ -37,9 +37,7 @@ void Admin::Destroy() noexcept {
     }
 }
 
-Admin::Admin(Admin&& other) noexcept : admin_(other.admin_) {
-    other.admin_ = nullptr;
-}
+Admin::Admin(Admin&& other) noexcept : admin_(other.admin_) { other.admin_ = nullptr; }
 
 Admin& Admin::operator=(Admin&& other) noexcept {
     if (this != &other) {
@@ -52,8 +50,7 @@ Admin& Admin::operator=(Admin&& other) noexcept {
 
 bool Admin::Available() const { return admin_ != nullptr; }
 
-Result Admin::CreateTable(const TablePath& table_path,
-                          const TableDescriptor& descriptor,
+Result Admin::CreateTable(const TablePath& table_path, const TableDescriptor& descriptor,
                           bool ignore_if_exists) {
     if (!Available()) {
         return utils::make_error(1, "Admin not available");
@@ -109,17 +106,16 @@ Result Admin::GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& o
 }
 
 // function for common list offsets functionality
-Result Admin::DoListOffsets(const TablePath& table_path,
-                         const std::vector<int32_t>& bucket_ids,
-                         const OffsetQuery& offset_query,
-                         std::unordered_map<int32_t, int64_t>& out,
-                         const std::string* partition_name) {
+Result Admin::DoListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
+                            const OffsetQuery& offset_query,
+                            std::unordered_map<int32_t, int64_t>& out,
+                            const std::string* partition_name) {
     if (!Available()) {
         return utils::make_error(1, "Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
-    
+
     rust::Vec<int32_t> rust_bucket_ids;
     for (int32_t id : bucket_ids) {
         rust_bucket_ids.push_back(id);
@@ -131,11 +127,12 @@ Result Admin::DoListOffsets(const TablePath& table_path,
 
     ffi::FfiListOffsetsResult ffi_result;
     if (partition_name != nullptr) {
-        ffi_result = admin_->list_partition_offsets(ffi_path, rust::String(*partition_name), std::move(rust_bucket_ids), ffi_query);
+        ffi_result = admin_->list_partition_offsets(ffi_path, rust::String(*partition_name),
+                                                    std::move(rust_bucket_ids), ffi_query);
     } else {
         ffi_result = admin_->list_offsets(ffi_path, std::move(rust_bucket_ids), ffi_query);
     }
-    
+
     auto result = utils::from_ffi_result(ffi_result.result);
     if (result.Ok()) {
         out.clear();
@@ -147,23 +144,20 @@ Result Admin::DoListOffsets(const TablePath& table_path,
     return result;
 }
 
-Result Admin::ListOffsets(const TablePath& table_path,
-                          const std::vector<int32_t>& bucket_ids,
+Result Admin::ListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
                           const OffsetQuery& offset_query,
                           std::unordered_map<int32_t, int64_t>& out) {
     return DoListOffsets(table_path, bucket_ids, offset_query, out);
 }
 
-Result Admin::ListPartitionOffsets(const TablePath& table_path,
-                                const std::string& partition_name,
-                                const std::vector<int32_t>& bucket_ids,
-                                const OffsetQuery& offset_query,
-                                std::unordered_map<int32_t, int64_t>& out) {
+Result Admin::ListPartitionOffsets(const TablePath& table_path, const std::string& partition_name,
+                                   const std::vector<int32_t>& bucket_ids,
+                                   const OffsetQuery& offset_query,
+                                   std::unordered_map<int32_t, int64_t>& out) {
     return DoListOffsets(table_path, bucket_ids, offset_query, out, &partition_name);
 }
 
-Result Admin::ListPartitionInfos(const TablePath& table_path,
-                                 std::vector<PartitionInfo>& out) {
+Result Admin::ListPartitionInfos(const TablePath& table_path, std::vector<PartitionInfo>& out) {
     if (!Available()) {
         return utils::make_error(1, "Admin not available");
     }
@@ -221,21 +215,18 @@ Result Admin::DropPartition(const TablePath& table_path,
         rust_spec.push_back(std::move(kv));
     }
 
-    auto ffi_result =
-        admin_->drop_partition(ffi_path, std::move(rust_spec), ignore_if_not_exists);
+    auto ffi_result = admin_->drop_partition(ffi_path, std::move(rust_spec), ignore_if_not_exists);
     return utils::from_ffi_result(ffi_result);
 }
 
-Result Admin::CreateDatabase(const std::string& database_name,
-                             const DatabaseDescriptor& descriptor,
+Result Admin::CreateDatabase(const std::string& database_name, const DatabaseDescriptor& descriptor,
                              bool ignore_if_exists) {
     if (!Available()) {
         return utils::make_error(1, "Admin not available");
     }
 
     auto ffi_desc = utils::to_ffi_database_descriptor(descriptor);
-    auto ffi_result =
-        admin_->create_database(rust::Str(database_name), ffi_desc, ignore_if_exists);
+    auto ffi_result = admin_->create_database(rust::Str(database_name), ffi_desc, ignore_if_exists);
     return utils::from_ffi_result(ffi_result);
 }
 
diff --git a/fluss-rust/bindings/cpp/src/connection.cpp b/fluss-rust/bindings/cpp/src/connection.cpp
index ea884cdb1f..4fbfafb126 100644
--- a/fluss-rust/bindings/cpp/src/connection.cpp
+++ b/fluss-rust/bindings/cpp/src/connection.cpp
@@ -17,9 +17,9 @@
  * under the License.
  */
 
+#include "ffi_converter.hpp"
 #include "fluss.hpp"
 #include "lib.rs.h"
-#include "ffi_converter.hpp"
 #include "rust/cxx.h"
 
 namespace fluss {
@@ -35,9 +35,7 @@ void Connection::Destroy() noexcept {
     }
 }
 
-Connection::Connection(Connection&& other) noexcept : conn_(other.conn_) {
-    other.conn_ = nullptr;
-}
+Connection::Connection(Connection&& other) noexcept : conn_(other.conn_) { other.conn_ = nullptr; }
 
 Connection& Connection::operator=(Connection&& other) noexcept {
     if (this != &other) {
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index ee7f1d8fdb..9b1b5ef83b 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -325,25 +325,15 @@ mod ffi {
         // Table
         unsafe fn delete_table(table: *mut Table);
         fn new_append_writer(self: &Table) -> Result<*mut AppendWriter>;
-        fn new_log_scanner(self: &Table) -> Result<*mut LogScanner>;
-        fn new_log_scanner_with_projection(
-            self: &Table,
-            column_indices: Vec<usize>,
-        ) -> Result<*mut LogScanner>;
-        fn new_record_batch_log_scanner(self: &Table) -> Result<*mut LogScanner>;
-        fn new_record_batch_log_scanner_with_projection(
+        fn create_scanner(
             self: &Table,
             column_indices: Vec<usize>,
+            batch: bool,
         ) -> Result<*mut LogScanner>;
         fn get_table_info_from_table(self: &Table) -> FfiTableInfo;
         fn get_table_path(self: &Table) -> FfiTablePath;
         fn has_primary_key(self: &Table) -> bool;
-        fn new_upsert_writer(self: &Table) -> Result<*mut UpsertWriter>;
-        fn new_upsert_writer_with_column_names(
-            self: &Table,
-            column_names: Vec<String>,
-        ) -> Result<*mut UpsertWriter>;
-        fn new_upsert_writer_with_column_indices(
+        fn create_upsert_writer(
             self: &Table,
             column_indices: Vec<usize>,
         ) -> Result<*mut UpsertWriter>;
@@ -919,153 +909,86 @@ unsafe fn delete_table(table: *mut Table) {
 }
 
 impl Table {
-    fn new_append_writer(&self) -> Result<*mut AppendWriter, String> {
-        let _enter = RUNTIME.enter();
-
-        let fluss_table = fcore::client::FlussTable::new(
+    fn fluss_table(&self) -> fcore::client::FlussTable<'_> {
+        fcore::client::FlussTable::new(
             &self.connection,
             self.metadata.clone(),
             self.table_info.clone(),
-        );
-
-        let table_append = match fluss_table.new_append() {
-            Ok(a) => a,
-            Err(e) => return Err(format!("Failed to create append: {e}")),
-        };
-
-        let writer = match table_append.create_writer() {
-            Ok(w) => w,
-            Err(e) => return Err(format!("Failed to create writer: {e}")),
-        };
-        let writer = Box::into_raw(Box::new(AppendWriter {
-            inner: writer,
-            table_info: self.table_info.clone(),
-        }));
-        Ok(writer)
+        )
     }
 
-    fn new_log_scanner(&self) -> Result<*mut LogScanner, String> {
-        RUNTIME.block_on(async {
-            let fluss_table = fcore::client::FlussTable::new(
-                &self.connection,
-                self.metadata.clone(),
-                self.table_info.clone(),
-            );
-
-            let scanner = fluss_table
-                .new_scan()
-                .create_log_scanner()
-                .map_err(|e| format!("Failed to create log scanner: {e}"))?;
-
-            let scanner_ptr = Box::into_raw(Box::new(LogScanner {
-                inner: Some(scanner),
-                inner_batch: None,
-                projected_columns: self.table_info.get_schema().columns().to_vec(),
-            }));
-
-            Ok(scanner_ptr)
-        })
-    }
-
-    fn new_log_scanner_with_projection(
+    fn resolve_projected_columns(
         &self,
-        column_indices: Vec<usize>,
-    ) -> Result<*mut LogScanner, String> {
-        RUNTIME.block_on(async {
-            let fluss_table = fcore::client::FlussTable::new(
-                &self.connection,
-                self.metadata.clone(),
-                self.table_info.clone(),
-            );
-
-            let all_columns = self.table_info.get_schema().columns();
-            let projected_columns: Vec<_> = column_indices
-                .iter()
-                .map(|&i| {
-                    all_columns.get(i).cloned().ok_or_else(|| {
-                        format!(
-                            "Invalid column index {i}: schema has {} columns",
-                            all_columns.len()
-                        )
-                    })
+        indices: &[usize],
+    ) -> Result<Vec<fcore::metadata::Column>, String> {
+        let all_columns = self.table_info.get_schema().columns();
+        indices
+            .iter()
+            .map(|&i| {
+                all_columns.get(i).cloned().ok_or_else(|| {
+                    format!(
+                        "Invalid column index {i}: schema has {} columns",
+                        all_columns.len()
+                    )
                 })
-                .collect::<Result<_, String>>()?;
-
-            let log_scanner = fluss_table
-                .new_scan()
-                .project(&column_indices)
-                .map_err(|e| format!("Failed to project columns: {e}"))?
-                .create_log_scanner()
-                .map_err(|e| format!("Failed to create log scanner: {e}"))?;
-
-            let scanner = Box::into_raw(Box::new(LogScanner {
-                inner: Some(log_scanner),
-                inner_batch: None,
-                projected_columns,
-            }));
-            Ok(scanner)
-        })
+            })
+            .collect()
     }
 
-    fn new_record_batch_log_scanner(&self) -> Result<*mut LogScanner, String> {
-        RUNTIME.block_on(async {
-            let fluss_table = fcore::client::FlussTable::new(
-                &self.connection,
-                self.metadata.clone(),
-                self.table_info.clone(),
-            );
-
-            let batch_scanner = fluss_table
-                .new_scan()
-                .create_record_batch_log_scanner()
-                .map_err(|e| format!("Failed to create record batch log scanner: {e}"))?;
-
-            let scanner = Box::into_raw(Box::new(LogScanner {
-                inner: None,
-                inner_batch: Some(batch_scanner),
-                projected_columns: self.table_info.get_schema().columns().to_vec(),
-            }));
-            Ok(scanner)
-        })
+    fn new_append_writer(&self) -> Result<*mut AppendWriter, String> {
+        let _enter = RUNTIME.enter();
+
+        let table_append = self
+            .fluss_table()
+            .new_append()
+            .map_err(|e| format!("Failed to create append: {e}"))?;
+
+        let writer = table_append
+            .create_writer()
+            .map_err(|e| format!("Failed to create writer: {e}"))?;
+
+        Ok(Box::into_raw(Box::new(AppendWriter {
+            inner: writer,
+            table_info: self.table_info.clone(),
+        })))
     }
 
-    fn new_record_batch_log_scanner_with_projection(
+    fn create_scanner(
         &self,
         column_indices: Vec<usize>,
+        batch: bool,
     ) -> Result<*mut LogScanner, String> {
         RUNTIME.block_on(async {
-            let fluss_table = fcore::client::FlussTable::new(
-                &self.connection,
-                self.metadata.clone(),
-                self.table_info.clone(),
-            );
-
-            let all_columns = self.table_info.get_schema().columns();
-            let projected_columns: Vec<_> = column_indices
-                .iter()
-                .map(|&i| {
-                    all_columns.get(i).cloned().ok_or_else(|| {
-                        format!(
-                            "Invalid column index {i}: schema has {} columns",
-                            all_columns.len()
-                        )
-                    })
-                })
-                .collect::<Result<_, String>>()?;
-
-            let batch_scanner = fluss_table
-                .new_scan()
-                .project(&column_indices)
-                .map_err(|e| format!("Failed to project columns: {e}"))?
-                .create_record_batch_log_scanner()
-                .map_err(|e| format!("Failed to create record batch log scanner: {e}"))?;
-
-            let scanner = Box::into_raw(Box::new(LogScanner {
-                inner: None,
-                inner_batch: Some(batch_scanner),
+            let fluss_table = self.fluss_table();
+            let scan = fluss_table.new_scan();
+
+            let (projected_columns, scan) = if column_indices.is_empty() {
+                (self.table_info.get_schema().columns().to_vec(), scan)
+            } else {
+                let cols = self.resolve_projected_columns(&column_indices)?;
+                let scan = scan
+                    .project(&column_indices)
+                    .map_err(|e| format!("Failed to project columns: {e}"))?;
+                (cols, scan)
+            };
+
+            let (inner, inner_batch) = if batch {
+                let batch_scanner = scan
+                    .create_record_batch_log_scanner()
+                    .map_err(|e| format!("Failed to create record batch log scanner: {e}"))?;
+                (None, Some(batch_scanner))
+            } else {
+                let log_scanner = scan
+                    .create_log_scanner()
+                    .map_err(|e| format!("Failed to create log scanner: {e}"))?;
+                (Some(log_scanner), None)
+            };
+
+            Ok(Box::into_raw(Box::new(LogScanner {
+                inner,
+                inner_batch,
                 projected_columns,
-            }));
-            Ok(scanner)
+            })))
         })
     }
 
@@ -1084,79 +1007,24 @@ impl Table {
         self.has_pk
     }
 
-    fn new_upsert_writer(&self) -> Result<*mut UpsertWriter, String> {
-        let _enter = RUNTIME.enter();
-
-        let fluss_table = fcore::client::FlussTable::new(
-            &self.connection,
-            self.metadata.clone(),
-            self.table_info.clone(),
-        );
-
-        let table_upsert = fluss_table
-            .new_upsert()
-            .map_err(|e| format!("Failed to create upsert: {e}"))?;
-
-        let writer = table_upsert
-            .create_writer()
-            .map_err(|e| format!("Failed to create upsert writer: {e}"))?;
-
-        Ok(Box::into_raw(Box::new(UpsertWriter {
-            inner: writer,
-            table_info: self.table_info.clone(),
-        })))
-    }
-
-    fn new_upsert_writer_with_column_names(
-        &self,
-        column_names: Vec<String>,
-    ) -> Result<*mut UpsertWriter, String> {
-        let _enter = RUNTIME.enter();
-
-        let fluss_table = fcore::client::FlussTable::new(
-            &self.connection,
-            self.metadata.clone(),
-            self.table_info.clone(),
-        );
-
-        let table_upsert = fluss_table
-            .new_upsert()
-            .map_err(|e| format!("Failed to create upsert: {e}"))?;
-
-        let col_refs: Vec<&str> = column_names.iter().map(|s| s.as_str()).collect();
-        let table_upsert = table_upsert
-            .partial_update_with_column_names(&col_refs)
-            .map_err(|e| format!("Failed to set partial update columns: {e}"))?;
-
-        let writer = table_upsert
-            .create_writer()
-            .map_err(|e| format!("Failed to create upsert writer: {e}"))?;
-
-        Ok(Box::into_raw(Box::new(UpsertWriter {
-            inner: writer,
-            table_info: self.table_info.clone(),
-        })))
-    }
-
-    fn new_upsert_writer_with_column_indices(
+    fn create_upsert_writer(
         &self,
         column_indices: Vec<usize>,
     ) -> Result<*mut UpsertWriter, String> {
         let _enter = RUNTIME.enter();
 
-        let fluss_table = fcore::client::FlussTable::new(
-            &self.connection,
-            self.metadata.clone(),
-            self.table_info.clone(),
-        );
-
-        let table_upsert = fluss_table
+        let table_upsert = self
+            .fluss_table()
             .new_upsert()
             .map_err(|e| format!("Failed to create upsert: {e}"))?;
 
-        let table_upsert = table_upsert
-            .partial_update(Some(column_indices))
-            .map_err(|e| format!("Failed to set partial update columns: {e}"))?;
+        let table_upsert = if column_indices.is_empty() {
+            table_upsert
+        } else {
+            table_upsert
+                .partial_update(Some(column_indices))
+                .map_err(|e| format!("Failed to set partial update columns: {e}"))?
+        };
 
         let writer = table_upsert
             .create_writer()
@@ -1171,13 +1039,8 @@ impl Table {
     fn new_lookuper(&self) -> Result<*mut Lookuper, String> {
         let _enter = RUNTIME.enter();
 
-        let fluss_table = fcore::client::FlussTable::new(
-            &self.connection,
-            self.metadata.clone(),
-            self.table_info.clone(),
-        );
-
-        let table_lookup = fluss_table
+        let table_lookup = self
+            .fluss_table()
             .new_lookup()
             .map_err(|e| format!("Failed to create lookup: {e}"))?;
 
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index a266363079..da4dc30688 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -109,8 +109,19 @@ Table& Table::operator=(Table&& other) noexcept {
 
 bool Table::Available() const { return table_ != nullptr; }
 
-Result Table::NewAppendWriter(AppendWriter& out) {
-    if (!Available()) {
+TableAppend Table::NewAppend() { return TableAppend(table_); }
+
+TableUpsert Table::NewUpsert() { return TableUpsert(table_); }
+
+TableLookup Table::NewLookup() { return TableLookup(table_); }
+
+TableScan Table::NewScan() { return TableScan(table_); }
+
+// TableAppend implementation
+TableAppend::TableAppend(ffi::Table* table) noexcept : table_(table) {}
+
+Result TableAppend::CreateWriter(AppendWriter& out) {
+    if (table_ == nullptr) {
         return utils::make_error(1, "Table not available");
     }
 
@@ -124,7 +135,86 @@ Result Table::NewAppendWriter(AppendWriter& out) {
     }
 }
 
-TableScan Table::NewScan() { return TableScan(table_); }
+// TableUpsert implementation
+TableUpsert::TableUpsert(ffi::Table* table) noexcept : table_(table) {}
+
+TableUpsert& TableUpsert::PartialUpdateByIndex(std::vector<size_t> column_indices) {
+    if (column_indices.empty()) {
+        throw std::invalid_argument("PartialUpdateByIndex requires at least one column");
+    }
+    column_indices_ = std::move(column_indices);
+    column_names_.clear();
+    return *this;
+}
+
+TableUpsert& TableUpsert::PartialUpdateByName(std::vector<std::string> column_names) {
+    if (column_names.empty()) {
+        throw std::invalid_argument("PartialUpdateByName requires at least one column");
+    }
+    column_names_ = std::move(column_names);
+    column_indices_.clear();
+    return *this;
+}
+
+std::vector<size_t> TableUpsert::ResolveNameProjection() const {
+    auto ffi_info = table_->get_table_info_from_table();
+    const auto& columns = ffi_info.schema.columns;
+
+    std::vector<size_t> indices;
+    for (const auto& name : column_names_) {
+        bool found = false;
+        for (size_t i = 0; i < columns.size(); ++i) {
+            if (std::string(columns[i].name) == name) {
+                indices.push_back(i);
+                found = true;
+                break;
+            }
+        }
+        if (!found) {
+            throw std::runtime_error("Column '" + name + "' not found");
+        }
+    }
+    return indices;
+}
+
+Result TableUpsert::CreateWriter(UpsertWriter& out) {
+    if (table_ == nullptr) {
+        return utils::make_error(1, "Table not available");
+    }
+
+    try {
+        auto resolved_indices = !column_names_.empty() ? ResolveNameProjection() : column_indices_;
+
+        rust::Vec<size_t> rust_indices;
+        for (size_t idx : resolved_indices) {
+            rust_indices.push_back(idx);
+        }
+        out = UpsertWriter(table_->create_upsert_writer(std::move(rust_indices)));
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
+
+// TableLookup implementation
+TableLookup::TableLookup(ffi::Table* table) noexcept : table_(table) {}
+
+Result TableLookup::CreateLookuper(Lookuper& out) {
+    if (table_ == nullptr) {
+        return utils::make_error(1, "Table not available");
+    }
+
+    try {
+        out = Lookuper(table_->new_lookuper());
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_error(1, e.what());
+    } catch (const std::exception& e) {
+        return utils::make_error(1, e.what());
+    }
+}
 
 // TableScan implementation
 TableScan::TableScan(ffi::Table* table) noexcept : table_(table) {}
@@ -169,15 +259,11 @@ Result TableScan::CreateLogScanner(LogScanner& out) {
 
     try {
         auto resolved_indices = !name_projection_.empty() ? ResolveNameProjection() : projection_;
-        if (!resolved_indices.empty()) {
-            rust::Vec<size_t> rust_indices;
-            for (size_t idx : resolved_indices) {
-                rust_indices.push_back(idx);
-            }
-            out.scanner_ = table_->new_log_scanner_with_projection(std::move(rust_indices));
-        } else {
-            out.scanner_ = table_->new_log_scanner();
+        rust::Vec<size_t> rust_indices;
+        for (size_t idx : resolved_indices) {
+            rust_indices.push_back(idx);
         }
+        out.scanner_ = table_->create_scanner(std::move(rust_indices), false);
         return utils::make_ok();
     } catch (const rust::Error& e) {
         return utils::make_error(1, e.what());
@@ -193,16 +279,11 @@ Result TableScan::CreateRecordBatchScanner(LogScanner& out) {
 
     try {
         auto resolved_indices = !name_projection_.empty() ? ResolveNameProjection() : projection_;
-        if (!resolved_indices.empty()) {
-            rust::Vec<size_t> rust_indices;
-            for (size_t idx : resolved_indices) {
-                rust_indices.push_back(idx);
-            }
-            out.scanner_ =
-                table_->new_record_batch_log_scanner_with_projection(std::move(rust_indices));
-        } else {
-            out.scanner_ = table_->new_record_batch_log_scanner();
+        rust::Vec<size_t> rust_indices;
+        for (size_t idx : resolved_indices) {
+            rust_indices.push_back(idx);
         }
+        out.scanner_ = table_->create_scanner(std::move(rust_indices), true);
         return utils::make_ok();
     } catch (const rust::Error& e) {
         return utils::make_error(1, e.what());
@@ -489,75 +570,6 @@ Result Lookuper::Lookup(const GenericRow& pk_row, bool& found, GenericRow& out)
     }
 }
 
-// Table KV methods
-Result Table::NewUpsertWriter(UpsertWriter& out) {
-    if (!Available()) {
-        return utils::make_error(1, "Table not available");
-    }
-
-    try {
-        out = UpsertWriter(table_->new_upsert_writer());
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
-    } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
-    }
-}
-
-Result Table::NewUpsertWriter(UpsertWriter& out, const std::vector<std::string>& column_names) {
-    if (!Available()) {
-        return utils::make_error(1, "Table not available");
-    }
-
-    try {
-        rust::Vec<rust::String> rust_names;
-        for (const auto& name : column_names) {
-            rust_names.push_back(rust::String(name));
-        }
-        out = UpsertWriter(table_->new_upsert_writer_with_column_names(std::move(rust_names)));
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
-    } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
-    }
-}
-
-Result Table::NewUpsertWriter(UpsertWriter& out, const std::vector<size_t>& column_indices) {
-    if (!Available()) {
-        return utils::make_error(1, "Table not available");
-    }
-
-    try {
-        rust::Vec<size_t> rust_indices;
-        for (size_t idx : column_indices) {
-            rust_indices.push_back(idx);
-        }
-        out = UpsertWriter(table_->new_upsert_writer_with_column_indices(std::move(rust_indices)));
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
-    } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
-    }
-}
-
-Result Table::NewLookuper(Lookuper& out) {
-    if (!Available()) {
-        return utils::make_error(1, "Table not available");
-    }
-
-    try {
-        out = Lookuper(table_->new_lookuper());
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
-    } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
-    }
-}
-
 // LogScanner implementation
 LogScanner::LogScanner() noexcept = default;
 

From ef5f60044825676d73cf2ae79604c32c74fe7127 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Wed, 11 Feb 2026 07:54:21 +0000
Subject: [PATCH 138/287] chore: refactor config for CPP and connect -> create
 in cpp binding (#298)

---
 .../bindings/cpp/examples/admin_example.cpp   |  6 +++--
 fluss-rust/bindings/cpp/examples/example.cpp  |  5 +++-
 .../bindings/cpp/examples/kv_example.cpp      |  7 +++---
 fluss-rust/bindings/cpp/include/fluss.hpp     | 20 +++++++++++++++-
 fluss-rust/bindings/cpp/src/connection.cpp    |  5 ++--
 fluss-rust/bindings/cpp/src/ffi_converter.hpp | 12 ++++++++++
 fluss-rust/bindings/cpp/src/lib.rs            | 23 +++++++++++++++----
 7 files changed, 65 insertions(+), 13 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/admin_example.cpp b/fluss-rust/bindings/cpp/examples/admin_example.cpp
index 196fe975d6..c51062c6c2 100644
--- a/fluss-rust/bindings/cpp/examples/admin_example.cpp
+++ b/fluss-rust/bindings/cpp/examples/admin_example.cpp
@@ -31,13 +31,15 @@ static void check(const char* step, const fluss::Result& r) {
 }
 
 int main() {
-    const std::string bootstrap = "127.0.0.1:9123";
     const std::string db_name = "admin_example_db";
     const std::string table_name = "admin_example_table";
 
     // 1) Connect and get Admin
+    fluss::Configuration config;
+    config.bootstrap_server = "127.0.0.1:9123";
+
     fluss::Connection conn;
-    check("connect", fluss::Connection::Connect(bootstrap, conn));
+    check("create", fluss::Connection::Create(config, conn));
 
     fluss::Admin admin;
     check("get_admin", conn.GetAdmin(admin));
diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 59f1ed03dc..14fbeb2df9 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -34,8 +34,11 @@ static void check(const char* step, const fluss::Result& r) {
 
 int main() {
     // 1) Connect
+    fluss::Configuration config;
+    config.bootstrap_server = "127.0.0.1:9123";
+
     fluss::Connection conn;
-    check("connect", fluss::Connection::Connect("127.0.0.1:9123", conn));
+    check("create", fluss::Connection::Create(config, conn));
 
     // 2) Admin
     fluss::Admin admin;
diff --git a/fluss-rust/bindings/cpp/examples/kv_example.cpp b/fluss-rust/bindings/cpp/examples/kv_example.cpp
index 2a40db3ec5..3839e0fcc6 100644
--- a/fluss-rust/bindings/cpp/examples/kv_example.cpp
+++ b/fluss-rust/bindings/cpp/examples/kv_example.cpp
@@ -30,11 +30,12 @@ static void check(const char* step, const fluss::Result& r) {
 }
 
 int main() {
-    const std::string bootstrap = "127.0.0.1:9123";
-
     // 1) Connect and get Admin
+    fluss::Configuration config;
+    config.bootstrap_server = "127.0.0.1:9123";
+
     fluss::Connection conn;
-    check("connect", fluss::Connection::Connect(bootstrap, conn));
+    check("create", fluss::Connection::Create(config, conn));
 
     fluss::Admin admin;
     check("get_admin", conn.GetAdmin(admin));
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 1806616906..6bd6c2f26c 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -21,6 +21,7 @@
 
 #include <chrono>
 #include <cstdint>
+#include <limits>
 #include <memory>
 #include <stdexcept>
 #include <string>
@@ -809,6 +810,23 @@ class TableUpsert;
 class TableLookup;
 class TableScan;
 
+struct Configuration {
+    // Coordinator server address
+    std::string bootstrap_server{"127.0.0.1:9123"};
+    // Max request size in bytes (10 MB)
+    int32_t request_max_size{10 * 1024 * 1024};
+    // Writer acknowledgment mode: "all", "0", "1", or "-1"
+    std::string writer_acks{"all"};
+    // Max number of writer retries
+    int32_t writer_retries{std::numeric_limits<int32_t>::max()};
+    // Writer batch size in bytes (2 MB)
+    int32_t writer_batch_size{2 * 1024 * 1024};
+    // Number of remote log batches to prefetch during scanning
+    size_t scanner_remote_log_prefetch_num{4};
+    // Number of threads for downloading remote log data
+    size_t scanner_remote_log_download_threads{3};
+};
+
 class Connection {
    public:
     Connection() noexcept;
@@ -819,7 +837,7 @@ class Connection {
     Connection(Connection&& other) noexcept;
     Connection& operator=(Connection&& other) noexcept;
 
-    static Result Connect(const std::string& bootstrap_server, Connection& out);
+    static Result Create(const Configuration& config, Connection& out);
 
     bool Available() const;
 
diff --git a/fluss-rust/bindings/cpp/src/connection.cpp b/fluss-rust/bindings/cpp/src/connection.cpp
index 4fbfafb126..bceb2644c2 100644
--- a/fluss-rust/bindings/cpp/src/connection.cpp
+++ b/fluss-rust/bindings/cpp/src/connection.cpp
@@ -46,9 +46,10 @@ Connection& Connection::operator=(Connection&& other) noexcept {
     return *this;
 }
 
-Result Connection::Connect(const std::string& bootstrap_server, Connection& out) {
+Result Connection::Create(const Configuration& config, Connection& out) {
     try {
-        out.conn_ = ffi::new_connection(bootstrap_server);
+        auto ffi_config = utils::to_ffi_config(config);
+        out.conn_ = ffi::new_connection(ffi_config);
         return utils::make_ok();
     } catch (const rust::Error& e) {
         return utils::make_error(1, e.what());
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 40676e57df..3e6cdcd32e 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -123,6 +123,18 @@ inline ffi::FfiTablePath to_ffi_table_path(const TablePath& path) {
     return ffi_path;
 }
 
+inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
+    ffi::FfiConfig ffi_config;
+    ffi_config.bootstrap_server = rust::String(config.bootstrap_server);
+    ffi_config.request_max_size = config.request_max_size;
+    ffi_config.writer_acks = rust::String(config.writer_acks);
+    ffi_config.writer_retries = config.writer_retries;
+    ffi_config.writer_batch_size = config.writer_batch_size;
+    ffi_config.scanner_remote_log_prefetch_num = config.scanner_remote_log_prefetch_num;
+    ffi_config.scanner_remote_log_download_threads = config.scanner_remote_log_download_threads;
+    return ffi_config;
+}
+
 inline ffi::FfiColumn to_ffi_column(const Column& col) {
     ffi::FfiColumn ffi_col;
     ffi_col.name = rust::String(col.name);
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 9b1b5ef83b..d99209fa90 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -37,6 +37,16 @@ mod ffi {
         value: String,
     }
 
+    struct FfiConfig {
+        bootstrap_server: String,
+        request_max_size: i32,
+        writer_acks: String,
+        writer_retries: i32,
+        writer_batch_size: i32,
+        scanner_remote_log_prefetch_num: usize,
+        scanner_remote_log_download_threads: usize,
+    }
+
     struct FfiResult {
         error_code: i32,
         error_message: String,
@@ -252,7 +262,7 @@ mod ffi {
         type Lookuper;
 
         // Connection
-        fn new_connection(bootstrap_server: &str) -> Result<*mut Connection>;
+        fn new_connection(config: &FfiConfig) -> Result<*mut Connection>;
         unsafe fn delete_connection(conn: *mut Connection);
         fn get_admin(self: &Connection) -> Result<*mut Admin>;
         fn get_table(self: &Connection, table_path: &FfiTablePath) -> Result<*mut Table>;
@@ -442,10 +452,15 @@ fn err_result(code: i32, msg: String) -> ffi::FfiResult {
 }
 
 // Connection implementation
-fn new_connection(bootstrap_server: &str) -> Result<*mut Connection, String> {
+fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
     let config = fluss::config::Config {
-        bootstrap_server: bootstrap_server.to_string(),
-        ..Default::default()
+        bootstrap_server: config.bootstrap_server.to_string(),
+        request_max_size: config.request_max_size,
+        writer_acks: config.writer_acks.to_string(),
+        writer_retries: config.writer_retries,
+        writer_batch_size: config.writer_batch_size,
+        scanner_remote_log_prefetch_num: config.scanner_remote_log_prefetch_num,
+        scanner_remote_log_download_threads: config.scanner_remote_log_download_threads,
     };
 
     let conn = RUNTIME.block_on(async { fcore::client::FlussConnection::new(config).await });

From 309d6ea8b830398f4dd18a9e1f313bff7e730e3b Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Thu, 12 Feb 2026 21:56:56 +0000
Subject: [PATCH 139/287] chore: Verify API consistent across clients (#302)

---
 fluss-rust/README.md                          |   4 +-
 .../bindings/cpp/examples/admin_example.cpp   |   2 +-
 fluss-rust/bindings/cpp/examples/example.cpp  |   7 +-
 .../bindings/cpp/examples/kv_example.cpp      |   4 +-
 fluss-rust/bindings/cpp/include/fluss.hpp     | 141 +++++++-
 fluss-rust/bindings/cpp/src/admin.cpp         |  32 +-
 fluss-rust/bindings/cpp/src/connection.cpp    |  16 +-
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |  10 +-
 fluss-rust/bindings/cpp/src/lib.rs            | 132 ++++----
 fluss-rust/bindings/cpp/src/table.cpp         |  92 +++---
 fluss-rust/bindings/python/API_REFERENCE.md   |  46 ++-
 fluss-rust/bindings/python/README.md          |  36 +-
 fluss-rust/bindings/python/example/example.py |  70 ++--
 fluss-rust/bindings/python/fluss/__init__.pyi | 187 +++++++++--
 fluss-rust/bindings/python/src/admin.rs       |  37 ++-
 fluss-rust/bindings/python/src/config.rs      |  90 ++++-
 fluss-rust/bindings/python/src/connection.rs  |  10 +-
 fluss-rust/bindings/python/src/error.rs       | 229 ++++++++++++-
 fluss-rust/bindings/python/src/lib.rs         |   6 +-
 fluss-rust/bindings/python/src/lookup.rs      |  10 +-
 fluss-rust/bindings/python/src/table.rs       | 307 ++++++++++++------
 fluss-rust/bindings/python/src/upsert.rs      | 120 ++-----
 .../bindings/python/src/write_handle.rs       |   4 +-
 .../crates/examples/src/example_kv_table.rs   |   4 +-
 .../src/example_partitioned_kv_table.rs       |   4 +-
 .../crates/examples/src/example_table.rs      |   4 +-
 fluss-rust/crates/fluss/src/client/admin.rs   |  28 +-
 .../crates/fluss/src/client/connection.rs     |   2 +-
 .../crates/fluss/src/client/table/lookup.rs   |  21 +-
 .../crates/fluss/src/client/table/mod.rs      |  14 +-
 .../fluss/src/client/table/remote_log.rs      |   2 +-
 .../crates/fluss/src/client/table/scanner.rs  |   8 +-
 .../crates/fluss/src/client/write/sender.rs   |  10 +-
 .../fluss/src/client/write/writer_client.rs   |   4 +-
 .../crates/fluss/src/cluster/cluster.rs       |  15 +-
 fluss-rust/crates/fluss/src/config.rs         |  12 +-
 fluss-rust/crates/fluss/src/error.rs          |  74 +++--
 .../crates/fluss/src/metadata/json_serde.rs   |  14 +-
 fluss-rust/crates/fluss/src/metadata/table.rs |  68 ++--
 .../fluss/src/rpc/message/create_database.rs  |   2 +-
 .../crates/fluss/tests/integration/admin.rs   | 212 ++++++++++--
 .../fluss/tests/integration/fluss_cluster.rs  |   8 +-
 .../fluss/tests/integration/log_table.rs      |   6 +-
 .../tests/integration/table_remote_scan.rs    |   2 +-
 fluss-rust/docs/rust-client.md                |  10 +-
 45 files changed, 1466 insertions(+), 650 deletions(-)

diff --git a/fluss-rust/README.md b/fluss-rust/README.md
index b1116f1751..a42c0f360e 100644
--- a/fluss-rust/README.md
+++ b/fluss-rust/README.md
@@ -68,7 +68,7 @@ The example code is as follows:
 pub async fn main() -> Result<()> {
     // 1: create the table;
     let mut args = Args::default();
-    args.bootstrap_server = "127.0.0.1:9123".to_string();
+    args.bootstrap_servers = "127.0.0.1:9123".to_string();
     let conn_config = ConnectionConfig::from_args(args);
     let conn = FlussConnection::new(conn_config).await;
 
@@ -91,7 +91,7 @@ pub async fn main() -> Result<()> {
         .unwrap();
 
     // 2: get the table
-    let table_info = admin.get_table(&table_path).await.unwrap();
+    let table_info = admin.get_table_info(&table_path).await.unwrap();
     print!("Get created table:\n {}\n", table_info);
 
     // let's sleep 2 seconds to wait leader ready
diff --git a/fluss-rust/bindings/cpp/examples/admin_example.cpp b/fluss-rust/bindings/cpp/examples/admin_example.cpp
index c51062c6c2..37683b9513 100644
--- a/fluss-rust/bindings/cpp/examples/admin_example.cpp
+++ b/fluss-rust/bindings/cpp/examples/admin_example.cpp
@@ -36,7 +36,7 @@ int main() {
 
     // 1) Connect and get Admin
     fluss::Configuration config;
-    config.bootstrap_server = "127.0.0.1:9123";
+    config.bootstrap_servers = "127.0.0.1:9123";
 
     fluss::Connection conn;
     check("create", fluss::Connection::Create(config, conn));
diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 14fbeb2df9..e1925bb43c 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -35,7 +35,7 @@ static void check(const char* step, const fluss::Result& r) {
 int main() {
     // 1) Connect
     fluss::Configuration config;
-    config.bootstrap_server = "127.0.0.1:9123";
+    config.bootstrap_servers = "127.0.0.1:9123";
 
     fluss::Connection conn;
     check("create", fluss::Connection::Create(config, conn));
@@ -349,7 +349,8 @@ int main() {
     std::cout << "\n=== Testing Arrow Record Batch Polling ===" << std::endl;
 
     fluss::LogScanner arrow_scanner;
-    check("new_record_batch_log_scanner", table.NewScan().CreateRecordBatchScanner(arrow_scanner));
+    check("new_record_batch_log_scanner",
+          table.NewScan().CreateRecordBatchLogScanner(arrow_scanner));
 
     for (int b = 0; b < buckets; ++b) {
         check("subscribe_arrow", arrow_scanner.Subscribe(b, 0));
@@ -376,7 +377,7 @@ int main() {
     check("new_record_batch_log_scanner_with_projection",
           table.NewScan()
               .ProjectByIndex(projected_columns)
-              .CreateRecordBatchScanner(projected_arrow_scanner));
+              .CreateRecordBatchLogScanner(projected_arrow_scanner));
 
     for (int b = 0; b < buckets; ++b) {
         check("subscribe_projected_arrow", projected_arrow_scanner.Subscribe(b, 0));
diff --git a/fluss-rust/bindings/cpp/examples/kv_example.cpp b/fluss-rust/bindings/cpp/examples/kv_example.cpp
index 3839e0fcc6..b24a459d77 100644
--- a/fluss-rust/bindings/cpp/examples/kv_example.cpp
+++ b/fluss-rust/bindings/cpp/examples/kv_example.cpp
@@ -32,7 +32,7 @@ static void check(const char* step, const fluss::Result& r) {
 int main() {
     // 1) Connect and get Admin
     fluss::Configuration config;
-    config.bootstrap_server = "127.0.0.1:9123";
+    config.bootstrap_servers = "127.0.0.1:9123";
 
     fluss::Connection conn;
     check("create", fluss::Connection::Create(config, conn));
@@ -79,7 +79,7 @@ int main() {
     fluss::UpsertWriter upsert_writer;
     check("new_upsert_writer", kv_table.NewUpsert().CreateWriter(upsert_writer));
 
-    // Fire-and-forget upserts
+    // Fire-and-forget upserts (flush at the end)
     {
         auto row = kv_table.NewRow();
         row.Set("user_id", 1);
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 6bd6c2f26c..2fce8eb944 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -46,6 +46,136 @@ struct UpsertWriter;
 struct Lookuper;
 }  // namespace ffi
 
+/// Named constants for Fluss API error codes.
+///
+/// Server API errors have error_code > 0 or == -1.
+/// Client-side errors have error_code == CLIENT_ERROR (-2).
+/// These constants match the Rust core FlussError enum and are stable across protocol versions.
+/// New server error codes work automatically (error_code is a raw int, not a closed enum) —
+/// these constants are convenience names, not an exhaustive list.
+struct ErrorCode {
+    /// Client-side error (not from server API protocol). Check error_message for details.
+    static constexpr int CLIENT_ERROR = -2;
+    /// No error.
+    static constexpr int NONE = 0;
+    /// The server experienced an unexpected error when processing the request.
+    static constexpr int UNKNOWN_SERVER_ERROR = -1;
+    /// The server disconnected before a response was received.
+    static constexpr int NETWORK_EXCEPTION = 1;
+    /// The version of API is not supported.
+    static constexpr int UNSUPPORTED_VERSION = 2;
+    /// This message has failed its CRC checksum, exceeds the valid size, or is otherwise corrupt.
+    static constexpr int CORRUPT_MESSAGE = 3;
+    /// The database does not exist.
+    static constexpr int DATABASE_NOT_EXIST = 4;
+    /// The database is not empty.
+    static constexpr int DATABASE_NOT_EMPTY = 5;
+    /// The database already exists.
+    static constexpr int DATABASE_ALREADY_EXIST = 6;
+    /// The table does not exist.
+    static constexpr int TABLE_NOT_EXIST = 7;
+    /// The table already exists.
+    static constexpr int TABLE_ALREADY_EXIST = 8;
+    /// The schema does not exist.
+    static constexpr int SCHEMA_NOT_EXIST = 9;
+    /// Exception occurred while storing data for log in server.
+    static constexpr int LOG_STORAGE_EXCEPTION = 10;
+    /// Exception occurred while storing data for kv in server.
+    static constexpr int KV_STORAGE_EXCEPTION = 11;
+    /// Not leader or follower.
+    static constexpr int NOT_LEADER_OR_FOLLOWER = 12;
+    /// The record is too large.
+    static constexpr int RECORD_TOO_LARGE_EXCEPTION = 13;
+    /// The record is corrupt.
+    static constexpr int CORRUPT_RECORD_EXCEPTION = 14;
+    /// The client has attempted to perform an operation on an invalid table.
+    static constexpr int INVALID_TABLE_EXCEPTION = 15;
+    /// The client has attempted to perform an operation on an invalid database.
+    static constexpr int INVALID_DATABASE_EXCEPTION = 16;
+    /// The replication factor is larger than the number of available tablet servers.
+    static constexpr int INVALID_REPLICATION_FACTOR = 17;
+    /// Produce request specified an invalid value for required acks.
+    static constexpr int INVALID_REQUIRED_ACKS = 18;
+    /// The log offset is out of range.
+    static constexpr int LOG_OFFSET_OUT_OF_RANGE_EXCEPTION = 19;
+    /// The table is not a primary key table.
+    static constexpr int NON_PRIMARY_KEY_TABLE_EXCEPTION = 20;
+    /// The table or bucket does not exist.
+    static constexpr int UNKNOWN_TABLE_OR_BUCKET_EXCEPTION = 21;
+    /// The update version is invalid.
+    static constexpr int INVALID_UPDATE_VERSION_EXCEPTION = 22;
+    /// The coordinator is invalid.
+    static constexpr int INVALID_COORDINATOR_EXCEPTION = 23;
+    /// The leader epoch is invalid.
+    static constexpr int FENCED_LEADER_EPOCH_EXCEPTION = 24;
+    /// The request timed out.
+    static constexpr int REQUEST_TIME_OUT = 25;
+    /// The general storage exception.
+    static constexpr int STORAGE_EXCEPTION = 26;
+    /// The server did not attempt to execute this operation.
+    static constexpr int OPERATION_NOT_ATTEMPTED_EXCEPTION = 27;
+    /// Records are written to the server already, but to fewer in-sync replicas than required.
+    static constexpr int NOT_ENOUGH_REPLICAS_AFTER_APPEND_EXCEPTION = 28;
+    /// Messages are rejected since there are fewer in-sync replicas than required.
+    static constexpr int NOT_ENOUGH_REPLICAS_EXCEPTION = 29;
+    /// Get file access security token exception.
+    static constexpr int SECURITY_TOKEN_EXCEPTION = 30;
+    /// The tablet server received an out of order sequence batch.
+    static constexpr int OUT_OF_ORDER_SEQUENCE_EXCEPTION = 31;
+    /// The tablet server received a duplicate sequence batch.
+    static constexpr int DUPLICATE_SEQUENCE_EXCEPTION = 32;
+    /// The tablet server could not locate the writer metadata.
+    static constexpr int UNKNOWN_WRITER_ID_EXCEPTION = 33;
+    /// The requested column projection is invalid.
+    static constexpr int INVALID_COLUMN_PROJECTION = 34;
+    /// The requested target column to write is invalid.
+    static constexpr int INVALID_TARGET_COLUMN = 35;
+    /// The partition does not exist.
+    static constexpr int PARTITION_NOT_EXISTS = 36;
+    /// The table is not partitioned.
+    static constexpr int TABLE_NOT_PARTITIONED_EXCEPTION = 37;
+    /// The timestamp is invalid.
+    static constexpr int INVALID_TIMESTAMP_EXCEPTION = 38;
+    /// The config is invalid.
+    static constexpr int INVALID_CONFIG_EXCEPTION = 39;
+    /// The lake storage is not configured.
+    static constexpr int LAKE_STORAGE_NOT_CONFIGURED_EXCEPTION = 40;
+    /// The kv snapshot does not exist.
+    static constexpr int KV_SNAPSHOT_NOT_EXIST = 41;
+    /// The partition already exists.
+    static constexpr int PARTITION_ALREADY_EXISTS = 42;
+    /// The partition spec is invalid.
+    static constexpr int PARTITION_SPEC_INVALID_EXCEPTION = 43;
+    /// There is no currently available leader for the given partition.
+    static constexpr int LEADER_NOT_AVAILABLE_EXCEPTION = 44;
+    /// Exceed the maximum number of partitions.
+    static constexpr int PARTITION_MAX_NUM_EXCEPTION = 45;
+    /// Authentication failed.
+    static constexpr int AUTHENTICATE_EXCEPTION = 46;
+    /// Security is disabled.
+    static constexpr int SECURITY_DISABLED_EXCEPTION = 47;
+    /// Authorization failed.
+    static constexpr int AUTHORIZATION_EXCEPTION = 48;
+    /// Exceed the maximum number of buckets.
+    static constexpr int BUCKET_MAX_NUM_EXCEPTION = 49;
+    /// The tiering epoch is invalid.
+    static constexpr int FENCED_TIERING_EPOCH_EXCEPTION = 50;
+    /// Authentication failed with retriable exception.
+    static constexpr int RETRIABLE_AUTHENTICATE_EXCEPTION = 51;
+    /// The server rack info is invalid.
+    static constexpr int INVALID_SERVER_RACK_INFO_EXCEPTION = 52;
+    /// The lake snapshot does not exist.
+    static constexpr int LAKE_SNAPSHOT_NOT_EXIST = 53;
+    /// The lake table already exists.
+    static constexpr int LAKE_TABLE_ALREADY_EXIST = 54;
+    /// The new ISR contains at least one ineligible replica.
+    static constexpr int INELIGIBLE_REPLICA_EXCEPTION = 55;
+    /// The alter table is invalid.
+    static constexpr int INVALID_ALTER_TABLE_EXCEPTION = 56;
+    /// Deletion operations are disabled on this table.
+    static constexpr int DELETION_DISABLED_EXCEPTION = 57;
+};
+
 struct Date {
     int32_t days_since_epoch{0};
 
@@ -812,9 +942,9 @@ class TableScan;
 
 struct Configuration {
     // Coordinator server address
-    std::string bootstrap_server{"127.0.0.1:9123"};
+    std::string bootstrap_servers{"127.0.0.1:9123"};
     // Max request size in bytes (10 MB)
-    int32_t request_max_size{10 * 1024 * 1024};
+    int32_t writer_request_max_size{10 * 1024 * 1024};
     // Writer acknowledgment mode: "all", "0", "1", or "-1"
     std::string writer_acks{"all"};
     // Max number of writer retries
@@ -824,7 +954,7 @@ struct Configuration {
     // Number of remote log batches to prefetch during scanning
     size_t scanner_remote_log_prefetch_num{4};
     // Number of threads for downloading remote log data
-    size_t scanner_remote_log_download_threads{3};
+    size_t remote_file_download_thread_num{3};
 };
 
 class Connection {
@@ -866,7 +996,7 @@ class Admin {
 
     Result DropTable(const TablePath& table_path, bool ignore_if_not_exists = false);
 
-    Result GetTable(const TablePath& table_path, TableInfo& out);
+    Result GetTableInfo(const TablePath& table_path, TableInfo& out);
 
     Result GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& out);
 
@@ -1020,13 +1150,14 @@ class TableScan {
     TableScan& ProjectByName(std::vector<std::string> column_names);
 
     Result CreateLogScanner(LogScanner& out);
-    Result CreateRecordBatchScanner(LogScanner& out);
+    Result CreateRecordBatchLogScanner(LogScanner& out);
 
    private:
     friend class Table;
     explicit TableScan(ffi::Table* table) noexcept;
 
     std::vector<size_t> ResolveNameProjection() const;
+    Result DoCreateScanner(LogScanner& out, bool is_record_batch);
 
     ffi::Table* table_{nullptr};
     std::vector<size_t> projection_;
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index 7925256ef5..0fb15b2746 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -53,7 +53,7 @@ bool Admin::Available() const { return admin_ != nullptr; }
 Result Admin::CreateTable(const TablePath& table_path, const TableDescriptor& descriptor,
                           bool ignore_if_exists) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
@@ -65,7 +65,7 @@ Result Admin::CreateTable(const TablePath& table_path, const TableDescriptor& de
 
 Result Admin::DropTable(const TablePath& table_path, bool ignore_if_not_exists) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
@@ -73,9 +73,9 @@ Result Admin::DropTable(const TablePath& table_path, bool ignore_if_not_exists)
     return utils::from_ffi_result(ffi_result);
 }
 
-Result Admin::GetTable(const TablePath& table_path, TableInfo& out) {
+Result Admin::GetTableInfo(const TablePath& table_path, TableInfo& out) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
@@ -91,7 +91,7 @@ Result Admin::GetTable(const TablePath& table_path, TableInfo& out) {
 
 Result Admin::GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& out) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
@@ -111,7 +111,7 @@ Result Admin::DoListOffsets(const TablePath& table_path, const std::vector<int32
                             std::unordered_map<int32_t, int64_t>& out,
                             const std::string* partition_name) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
@@ -159,7 +159,7 @@ Result Admin::ListPartitionOffsets(const TablePath& table_path, const std::strin
 
 Result Admin::ListPartitionInfos(const TablePath& table_path, std::vector<PartitionInfo>& out) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
@@ -181,7 +181,7 @@ Result Admin::CreatePartition(const TablePath& table_path,
                               const std::unordered_map<std::string, std::string>& partition_spec,
                               bool ignore_if_exists) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
@@ -202,7 +202,7 @@ Result Admin::DropPartition(const TablePath& table_path,
                             const std::unordered_map<std::string, std::string>& partition_spec,
                             bool ignore_if_not_exists) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
@@ -222,7 +222,7 @@ Result Admin::DropPartition(const TablePath& table_path,
 Result Admin::CreateDatabase(const std::string& database_name, const DatabaseDescriptor& descriptor,
                              bool ignore_if_exists) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_desc = utils::to_ffi_database_descriptor(descriptor);
@@ -233,7 +233,7 @@ Result Admin::CreateDatabase(const std::string& database_name, const DatabaseDes
 Result Admin::DropDatabase(const std::string& database_name, bool ignore_if_not_exists,
                            bool cascade) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_result =
@@ -243,7 +243,7 @@ Result Admin::DropDatabase(const std::string& database_name, bool ignore_if_not_
 
 Result Admin::ListDatabases(std::vector<std::string>& out) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_result = admin_->list_databases();
@@ -260,7 +260,7 @@ Result Admin::ListDatabases(std::vector<std::string>& out) {
 
 Result Admin::DatabaseExists(const std::string& database_name, bool& out) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_result = admin_->database_exists(rust::Str(database_name));
@@ -273,7 +273,7 @@ Result Admin::DatabaseExists(const std::string& database_name, bool& out) {
 
 Result Admin::GetDatabaseInfo(const std::string& database_name, DatabaseInfo& out) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_result = admin_->get_database_info(rust::Str(database_name));
@@ -286,7 +286,7 @@ Result Admin::GetDatabaseInfo(const std::string& database_name, DatabaseInfo& ou
 
 Result Admin::ListTables(const std::string& database_name, std::vector<std::string>& out) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_result = admin_->list_tables(rust::Str(database_name));
@@ -303,7 +303,7 @@ Result Admin::ListTables(const std::string& database_name, std::vector<std::stri
 
 Result Admin::TableExists(const TablePath& table_path, bool& out) {
     if (!Available()) {
-        return utils::make_error(1, "Admin not available");
+        return utils::make_client_error("Admin not available");
     }
 
     auto ffi_path = utils::to_ffi_table_path(table_path);
diff --git a/fluss-rust/bindings/cpp/src/connection.cpp b/fluss-rust/bindings/cpp/src/connection.cpp
index bceb2644c2..dcf85783d9 100644
--- a/fluss-rust/bindings/cpp/src/connection.cpp
+++ b/fluss-rust/bindings/cpp/src/connection.cpp
@@ -52,9 +52,9 @@ Result Connection::Create(const Configuration& config, Connection& out) {
         out.conn_ = ffi::new_connection(ffi_config);
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
@@ -62,22 +62,22 @@ bool Connection::Available() const { return conn_ != nullptr; }
 
 Result Connection::GetAdmin(Admin& out) {
     if (!Available()) {
-        return utils::make_error(1, "Connection not available");
+        return utils::make_client_error("Connection not available");
     }
 
     try {
         out.admin_ = conn_->get_admin();
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
 Result Connection::GetTable(const TablePath& table_path, Table& out) {
     if (!Available()) {
-        return utils::make_error(1, "Connection not available");
+        return utils::make_client_error("Connection not available");
     }
 
     try {
@@ -85,9 +85,9 @@ Result Connection::GetTable(const TablePath& table_path, Table& out) {
         out.table_ = conn_->get_table(ffi_path);
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 3e6cdcd32e..3c918e569a 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -110,6 +110,10 @@ namespace utils {
 
 inline Result make_error(int32_t code, std::string msg) { return Result{code, std::move(msg)}; }
 
+inline Result make_client_error(std::string msg) {
+    return Result{ErrorCode::CLIENT_ERROR, std::move(msg)};
+}
+
 inline Result make_ok() { return Result{0, {}}; }
 
 inline Result from_ffi_result(const ffi::FfiResult& ffi_result) {
@@ -125,13 +129,13 @@ inline ffi::FfiTablePath to_ffi_table_path(const TablePath& path) {
 
 inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi::FfiConfig ffi_config;
-    ffi_config.bootstrap_server = rust::String(config.bootstrap_server);
-    ffi_config.request_max_size = config.request_max_size;
+    ffi_config.bootstrap_servers = rust::String(config.bootstrap_servers);
+    ffi_config.writer_request_max_size = config.writer_request_max_size;
     ffi_config.writer_acks = rust::String(config.writer_acks);
     ffi_config.writer_retries = config.writer_retries;
     ffi_config.writer_batch_size = config.writer_batch_size;
     ffi_config.scanner_remote_log_prefetch_num = config.scanner_remote_log_prefetch_num;
-    ffi_config.scanner_remote_log_download_threads = config.scanner_remote_log_download_threads;
+    ffi_config.remote_file_download_thread_num = config.remote_file_download_thread_num;
     return ffi_config;
 }
 
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index d99209fa90..b5a5139cce 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -38,13 +38,13 @@ mod ffi {
     }
 
     struct FfiConfig {
-        bootstrap_server: String,
-        request_max_size: i32,
+        bootstrap_servers: String,
+        writer_request_max_size: i32,
         writer_acks: String,
         writer_retries: i32,
         writer_batch_size: i32,
         scanner_remote_log_prefetch_num: usize,
-        scanner_remote_log_download_threads: usize,
+        remote_file_download_thread_num: usize,
     }
 
     struct FfiResult {
@@ -437,6 +437,12 @@ pub struct Lookuper {
     table_info: fcore::metadata::TableInfo,
 }
 
+/// Error code for client-side errors that did not originate from the server API protocol.
+/// It must be non-zero so that the C++ `Result::Ok()` check (`error_code == 0`) correctly
+/// reports client-side errors as failures. The value -2 lies below the server API error
+/// code range (-1 upward, currently through 57), so it avoids current and future API codes.
+const CLIENT_ERROR_CODE: i32 = -2;
+
 fn ok_result() -> ffi::FfiResult {
     ffi::FfiResult {
         error_code: 0,
@@ -451,16 +457,32 @@ fn err_result(code: i32, msg: String) -> ffi::FfiResult {
     }
 }
 
+/// Create a client-side error result (not from server API).
+fn client_err(msg: String) -> ffi::FfiResult {
+    err_result(CLIENT_ERROR_CODE, msg)
+}
+
+/// Convert a core Error to FfiResult.
+/// `FlussAPIError` variants carry the server protocol error code directly.
+/// All other error kinds are client-side and use CLIENT_ERROR_CODE.
+fn err_from_core_error(e: &fcore::error::Error) -> ffi::FfiResult {
+    use fcore::error::Error;
+    match e {
+        Error::FlussAPIError { api_error } => err_result(api_error.code, api_error.message.clone()),
+        _ => client_err(e.to_string()),
+    }
+}
+
 // Connection implementation
 fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
     let config = fluss::config::Config {
-        bootstrap_server: config.bootstrap_server.to_string(),
-        request_max_size: config.request_max_size,
+        bootstrap_servers: config.bootstrap_servers.to_string(),
+        writer_request_max_size: config.writer_request_max_size,
         writer_acks: config.writer_acks.to_string(),
         writer_retries: config.writer_retries,
         writer_batch_size: config.writer_batch_size,
         scanner_remote_log_prefetch_num: config.scanner_remote_log_prefetch_num,
-        scanner_remote_log_download_threads: config.scanner_remote_log_download_threads,
+        remote_file_download_thread_num: config.remote_file_download_thread_num,
     };
 
     let conn = RUNTIME.block_on(async { fcore::client::FlussConnection::new(config).await });
@@ -511,7 +533,7 @@ impl Connection {
                 let table = Box::into_raw(Box::new(Table {
                     connection: self.inner.clone(),
                     metadata: t.metadata().clone(),
-                    table_info: t.table_info().clone(),
+                    table_info: t.get_table_info().clone(),
                     table_path: t.table_path().clone(),
                     has_pk: t.has_primary_key(),
                 }));
@@ -545,7 +567,7 @@ impl Admin {
 
         let core_descriptor = match types::ffi_descriptor_to_core(descriptor) {
             Ok(d) => d,
-            Err(e) => return err_result(1, e.to_string()),
+            Err(e) => return client_err(e.to_string()),
         };
 
         let result = RUNTIME.block_on(async {
@@ -556,7 +578,7 @@ impl Admin {
 
         match result {
             Ok(_) => ok_result(),
-            Err(e) => err_result(2, e.to_string()),
+            Err(e) => err_from_core_error(&e),
         }
     }
 
@@ -575,7 +597,7 @@ impl Admin {
 
         match result {
             Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
+            Err(e) => err_from_core_error(&e),
         }
     }
 
@@ -585,7 +607,7 @@ impl Admin {
             table_path.table_name.clone(),
         );
 
-        let result = RUNTIME.block_on(async { self.inner.get_table(&path).await });
+        let result = RUNTIME.block_on(async { self.inner.get_table_info(&path).await });
 
         match result {
             Ok(info) => ffi::FfiTableInfoResult {
@@ -593,7 +615,7 @@ impl Admin {
                 table_info: types::core_table_info_to_ffi(&info),
             },
             Err(e) => ffi::FfiTableInfoResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 table_info: types::empty_table_info(),
             },
         }
@@ -616,7 +638,7 @@ impl Admin {
                 lake_snapshot: types::core_lake_snapshot_to_ffi(&snapshot),
             },
             Err(e) => ffi::FfiLakeSnapshotResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 lake_snapshot: ffi::FfiLakeSnapshot {
                     snapshot_id: -1,
                     bucket_offsets: vec![],
@@ -646,10 +668,10 @@ impl Admin {
             2 => OffsetSpec::Timestamp(offset_query.timestamp),
             _ => {
                 return ffi::FfiListOffsetsResult {
-                    result: err_result(
-                        1,
-                        format!("Invalid offset_type: {}", offset_query.offset_type),
-                    ),
+                    result: client_err(format!(
+                        "Invalid offset_type: {}",
+                        offset_query.offset_type
+                    )),
                     bucket_offsets: vec![],
                 };
             }
@@ -679,7 +701,7 @@ impl Admin {
                 }
             }
             Err(e) => ffi::FfiListOffsetsResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 bucket_offsets: vec![],
             },
         }
@@ -728,7 +750,7 @@ impl Admin {
                 }
             }
             Err(e) => ffi::FfiListPartitionInfosResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 partition_infos: vec![],
             },
         }
@@ -757,7 +779,7 @@ impl Admin {
 
         match result {
             Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
+            Err(e) => err_from_core_error(&e),
         }
     }
 
@@ -785,7 +807,7 @@ impl Admin {
 
         match result {
             Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
+            Err(e) => err_from_core_error(&e),
         }
     }
 
@@ -799,13 +821,13 @@ impl Admin {
 
         let result = RUNTIME.block_on(async {
             self.inner
-                .create_database(database_name, ignore_if_exists, descriptor_opt.as_ref())
+                .create_database(database_name, descriptor_opt.as_ref(), ignore_if_exists)
                 .await
         });
 
         match result {
             Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
+            Err(e) => err_from_core_error(&e),
         }
     }
 
@@ -823,7 +845,7 @@ impl Admin {
 
         match result {
             Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
+            Err(e) => err_from_core_error(&e),
         }
     }
 
@@ -836,7 +858,7 @@ impl Admin {
                 database_names: names,
             },
             Err(e) => ffi::FfiListDatabasesResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 database_names: vec![],
             },
         }
@@ -851,7 +873,7 @@ impl Admin {
                 value: exists,
             },
             Err(e) => ffi::FfiBoolResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 value: false,
             },
         }
@@ -866,7 +888,7 @@ impl Admin {
                 database_info: types::core_database_info_to_ffi(&info),
             },
             Err(e) => ffi::FfiDatabaseInfoResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 database_info: ffi::FfiDatabaseInfo {
                     database_name: String::new(),
                     comment: String::new(),
@@ -887,7 +909,7 @@ impl Admin {
                 table_names: names,
             },
             Err(e) => ffi::FfiListTablesResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 table_names: vec![],
             },
         }
@@ -907,7 +929,7 @@ impl Admin {
                 value: exists,
             },
             Err(e) => ffi::FfiBoolResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 value: false,
             },
         }
@@ -1099,7 +1121,7 @@ impl AppendWriter {
 
         match result {
             Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
+            Err(e) => err_from_core_error(&e),
         }
     }
 }
@@ -1110,10 +1132,10 @@ impl WriteResult {
             let result = RUNTIME.block_on(future);
             match result {
                 Ok(_) => ok_result(),
-                Err(e) => err_result(1, e.to_string()),
+                Err(e) => err_from_core_error(&e),
             }
         } else {
-            err_result(1, "WriteResult already consumed".to_string())
+            client_err("WriteResult already consumed".to_string())
         }
     }
 }
@@ -1173,7 +1195,7 @@ impl UpsertWriter {
 
         match result {
             Ok(_) => ok_result(),
-            Err(e) => err_result(1, e.to_string()),
+            Err(e) => err_from_core_error(&e),
         }
     }
 }
@@ -1204,7 +1226,7 @@ impl Lookuper {
             Ok(r) => self.pad_row(r),
             Err(e) => {
                 return ffi::FfiLookupResult {
-                    result: err_result(1, e.to_string()),
+                    result: client_err(e.to_string()),
                     found: false,
                     row: ffi::FfiGenericRow { fields: vec![] },
                 };
@@ -1215,7 +1237,7 @@ impl Lookuper {
             Ok(r) => r,
             Err(e) => {
                 return ffi::FfiLookupResult {
-                    result: err_result(1, e.to_string()),
+                    result: err_from_core_error(&e),
                     found: false,
                     row: ffi::FfiGenericRow { fields: vec![] },
                 };
@@ -1230,7 +1252,7 @@ impl Lookuper {
                     row: ffi_row,
                 },
                 Err(e) => ffi::FfiLookupResult {
-                    result: err_result(1, e.to_string()),
+                    result: client_err(e.to_string()),
                     found: false,
                     row: ffi::FfiGenericRow { fields: vec![] },
                 },
@@ -1241,7 +1263,7 @@ impl Lookuper {
                 row: ffi::FfiGenericRow { fields: vec![] },
             },
             Err(e) => ffi::FfiLookupResult {
-                result: err_result(1, e.to_string()),
+                result: err_from_core_error(&e),
                 found: false,
                 row: ffi::FfiGenericRow { fields: vec![] },
             },
@@ -1292,7 +1314,7 @@ impl LogScanner {
             });
             match result {
                 Ok(_) => ok_result(),
-                Err(e) => err_result(1, e.to_string()),
+                Err(e) => err_from_core_error(&e),
             }
         } else if let Some(ref inner_batch) = self.inner_batch {
             let result = RUNTIME.block_on(async {
@@ -1306,10 +1328,10 @@ impl LogScanner {
             });
             match result {
                 Ok(_) => ok_result(),
-                Err(e) => err_result(1, e.to_string()),
+                Err(e) => err_from_core_error(&e),
             }
         } else {
-            err_result(1, "LogScanner not initialized".to_string())
+            client_err("LogScanner not initialized".to_string())
         }
     }
 
@@ -1325,7 +1347,7 @@ impl LogScanner {
 
             match result {
                 Ok(_) => ok_result(),
-                Err(e) => err_result(1, e.to_string()),
+                Err(e) => err_from_core_error(&e),
             }
         } else if let Some(ref inner_batch) = self.inner_batch {
             let result =
@@ -1333,10 +1355,10 @@ impl LogScanner {
 
             match result {
                 Ok(_) => ok_result(),
-                Err(e) => err_result(1, e.to_string()),
+                Err(e) => err_from_core_error(&e),
             }
         } else {
-            err_result(1, "LogScanner not initialized".to_string())
+            client_err("LogScanner not initialized".to_string())
         }
     }
 
@@ -1367,7 +1389,7 @@ impl LogScanner {
             });
             match result {
                 Ok(_) => ok_result(),
-                Err(e) => err_result(1, e.to_string()),
+                Err(e) => err_from_core_error(&e),
             }
         } else if let Some(ref inner_batch) = self.inner_batch {
             let result = RUNTIME.block_on(async {
@@ -1377,10 +1399,10 @@ impl LogScanner {
             });
             match result {
                 Ok(_) => ok_result(),
-                Err(e) => err_result(1, e.to_string()),
+                Err(e) => err_from_core_error(&e),
             }
         } else {
-            err_result(1, "LogScanner not initialized".to_string())
+            client_err("LogScanner not initialized".to_string())
         }
     }
 
@@ -1390,7 +1412,7 @@ impl LogScanner {
                 .block_on(async { inner.unsubscribe_partition(partition_id, bucket_id).await })
             {
                 Ok(_) => ok_result(),
-                Err(e) => err_result(1, e.to_string()),
+                Err(e) => err_from_core_error(&e),
             }
         } else if let Some(ref inner_batch) = self.inner_batch {
             match RUNTIME.block_on(async {
@@ -1399,10 +1421,10 @@ impl LogScanner {
                     .await
             }) {
                 Ok(_) => ok_result(),
-                Err(e) => err_result(1, e.to_string()),
+                Err(e) => err_from_core_error(&e),
             }
         } else {
-            err_result(1, "LogScanner not initialized".to_string())
+            client_err("LogScanner not initialized".to_string())
         }
     }
 
@@ -1419,19 +1441,19 @@ impl LogScanner {
                             scan_records,
                         },
                         Err(e) => ffi::FfiScanRecordsResult {
-                            result: err_result(1, e.to_string()),
+                            result: client_err(e.to_string()),
                             scan_records: ffi::FfiScanRecords { records: vec![] },
                         },
                     }
                 }
                 Err(e) => ffi::FfiScanRecordsResult {
-                    result: err_result(1, e.to_string()),
+                    result: err_from_core_error(&e),
                     scan_records: ffi::FfiScanRecords { records: vec![] },
                 },
             }
         } else {
             ffi::FfiScanRecordsResult {
-                result: err_result(1, "Record-based scanner not available".to_string()),
+                result: client_err("Record-based scanner not available".to_string()),
                 scan_records: ffi::FfiScanRecords { records: vec![] },
             }
         }
@@ -1449,18 +1471,18 @@ impl LogScanner {
                         arrow_batches,
                     },
                     Err(e) => ffi::FfiArrowRecordBatchesResult {
-                        result: err_result(1, e),
+                        result: client_err(e),
                         arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
                     },
                 },
                 Err(e) => ffi::FfiArrowRecordBatchesResult {
-                    result: err_result(1, e.to_string()),
+                    result: err_from_core_error(&e),
                     arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
                 },
             }
         } else {
             ffi::FfiArrowRecordBatchesResult {
-                result: err_result(1, "Batch-based scanner not available".to_string()),
+                result: client_err("Batch-based scanner not available".to_string()),
                 arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
             }
         }
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index da4dc30688..078b1bc2c8 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -122,16 +122,16 @@ TableAppend::TableAppend(ffi::Table* table) noexcept : table_(table) {}
 
 Result TableAppend::CreateWriter(AppendWriter& out) {
     if (table_ == nullptr) {
-        return utils::make_error(1, "Table not available");
+        return utils::make_client_error("Table not available");
     }
 
     try {
         out = AppendWriter(table_->new_append_writer());
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
@@ -179,7 +179,7 @@ std::vector<size_t> TableUpsert::ResolveNameProjection() const {
 
 Result TableUpsert::CreateWriter(UpsertWriter& out) {
     if (table_ == nullptr) {
-        return utils::make_error(1, "Table not available");
+        return utils::make_client_error("Table not available");
     }
 
     try {
@@ -192,9 +192,9 @@ Result TableUpsert::CreateWriter(UpsertWriter& out) {
         out = UpsertWriter(table_->create_upsert_writer(std::move(rust_indices)));
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
@@ -203,16 +203,16 @@ TableLookup::TableLookup(ffi::Table* table) noexcept : table_(table) {}
 
 Result TableLookup::CreateLookuper(Lookuper& out) {
     if (table_ == nullptr) {
-        return utils::make_error(1, "Table not available");
+        return utils::make_client_error("Table not available");
     }
 
     try {
         out = Lookuper(table_->new_lookuper());
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
@@ -252,29 +252,15 @@ std::vector<size_t> TableScan::ResolveNameProjection() const {
     return indices;
 }
 
-Result TableScan::CreateLogScanner(LogScanner& out) {
-    if (table_ == nullptr) {
-        return utils::make_error(1, "Table not available");
-    }
+Result TableScan::CreateLogScanner(LogScanner& out) { return DoCreateScanner(out, false); }
 
-    try {
-        auto resolved_indices = !name_projection_.empty() ? ResolveNameProjection() : projection_;
-        rust::Vec<size_t> rust_indices;
-        for (size_t idx : resolved_indices) {
-            rust_indices.push_back(idx);
-        }
-        out.scanner_ = table_->create_scanner(std::move(rust_indices), false);
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
-    } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
-    }
+Result TableScan::CreateRecordBatchLogScanner(LogScanner& out) {
+    return DoCreateScanner(out, true);
 }
 
-Result TableScan::CreateRecordBatchScanner(LogScanner& out) {
+Result TableScan::DoCreateScanner(LogScanner& out, bool is_record_batch) {
     if (table_ == nullptr) {
-        return utils::make_error(1, "Table not available");
+        return utils::make_client_error("Table not available");
     }
 
     try {
@@ -283,12 +269,12 @@ Result TableScan::CreateRecordBatchScanner(LogScanner& out) {
         for (size_t idx : resolved_indices) {
             rust_indices.push_back(idx);
         }
-        out.scanner_ = table_->create_scanner(std::move(rust_indices), true);
+        out.scanner_ = table_->create_scanner(std::move(rust_indices), is_record_batch);
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
@@ -408,7 +394,7 @@ Result AppendWriter::Append(const GenericRow& row) {
 
 Result AppendWriter::Append(const GenericRow& row, WriteResult& out) {
     if (!Available()) {
-        return utils::make_error(1, "AppendWriter not available");
+        return utils::make_client_error("AppendWriter not available");
     }
 
     try {
@@ -417,15 +403,15 @@ Result AppendWriter::Append(const GenericRow& row, WriteResult& out) {
         out = WriteResult(rust_box.into_raw());
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
 Result AppendWriter::Flush() {
     if (!Available()) {
-        return utils::make_error(1, "AppendWriter not available");
+        return utils::make_client_error("AppendWriter not available");
     }
 
     auto ffi_result = writer_->flush();
@@ -468,7 +454,7 @@ Result UpsertWriter::Upsert(const GenericRow& row) {
 
 Result UpsertWriter::Upsert(const GenericRow& row, WriteResult& out) {
     if (!Available()) {
-        return utils::make_error(1, "UpsertWriter not available");
+        return utils::make_client_error("UpsertWriter not available");
     }
 
     try {
@@ -477,9 +463,9 @@ Result UpsertWriter::Upsert(const GenericRow& row, WriteResult& out) {
         out = WriteResult(rust_box.into_raw());
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
@@ -490,7 +476,7 @@ Result UpsertWriter::Delete(const GenericRow& row) {
 
 Result UpsertWriter::Delete(const GenericRow& row, WriteResult& out) {
     if (!Available()) {
-        return utils::make_error(1, "UpsertWriter not available");
+        return utils::make_client_error("UpsertWriter not available");
     }
 
     try {
@@ -499,15 +485,15 @@ Result UpsertWriter::Delete(const GenericRow& row, WriteResult& out) {
         out = WriteResult(rust_box.into_raw());
         return utils::make_ok();
     } catch (const rust::Error& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
 Result UpsertWriter::Flush() {
     if (!Available()) {
-        return utils::make_error(1, "UpsertWriter not available");
+        return utils::make_client_error("UpsertWriter not available");
     }
 
     auto ffi_result = writer_->upsert_flush();
@@ -545,7 +531,7 @@ bool Lookuper::Available() const { return lookuper_ != nullptr; }
 
 Result Lookuper::Lookup(const GenericRow& pk_row, bool& found, GenericRow& out) {
     if (!Available()) {
-        return utils::make_error(1, "Lookuper not available");
+        return utils::make_client_error("Lookuper not available");
     }
 
     try {
@@ -563,10 +549,10 @@ Result Lookuper::Lookup(const GenericRow& pk_row, bool& found, GenericRow& out)
         return utils::make_ok();
     } catch (const rust::Error& e) {
         found = false;
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     } catch (const std::exception& e) {
         found = false;
-        return utils::make_error(1, e.what());
+        return utils::make_client_error(e.what());
     }
 }
 
@@ -601,7 +587,7 @@ bool LogScanner::Available() const { return scanner_ != nullptr; }
 
 Result LogScanner::Subscribe(int32_t bucket_id, int64_t start_offset) {
     if (!Available()) {
-        return utils::make_error(1, "LogScanner not available");
+        return utils::make_client_error("LogScanner not available");
     }
 
     auto ffi_result = scanner_->subscribe(bucket_id, start_offset);
@@ -610,7 +596,7 @@ Result LogScanner::Subscribe(int32_t bucket_id, int64_t start_offset) {
 
 Result LogScanner::Subscribe(const std::vector<BucketSubscription>& bucket_offsets) {
     if (!Available()) {
-        return utils::make_error(1, "LogScanner not available");
+        return utils::make_client_error("LogScanner not available");
     }
 
     rust::Vec<ffi::FfiBucketSubscription> rust_subs;
@@ -628,7 +614,7 @@ Result LogScanner::Subscribe(const std::vector<BucketSubscription>& bucket_offse
 Result LogScanner::SubscribePartitionBuckets(int64_t partition_id, int32_t bucket_id,
                                              int64_t start_offset) {
     if (!Available()) {
-        return utils::make_error(1, "LogScanner not available");
+        return utils::make_client_error("LogScanner not available");
     }
 
     auto ffi_result = scanner_->subscribe_partition(partition_id, bucket_id, start_offset);
@@ -638,7 +624,7 @@ Result LogScanner::SubscribePartitionBuckets(int64_t partition_id, int32_t bucke
 Result LogScanner::SubscribePartitionBuckets(
     const std::vector<PartitionBucketSubscription>& subscriptions) {
     if (!Available()) {
-        return utils::make_error(1, "LogScanner not available");
+        return utils::make_client_error("LogScanner not available");
     }
 
     rust::Vec<ffi::FfiPartitionBucketSubscription> rust_subs;
@@ -656,7 +642,7 @@ Result LogScanner::SubscribePartitionBuckets(
 
 Result LogScanner::UnsubscribePartition(int64_t partition_id, int32_t bucket_id) {
     if (!Available()) {
-        return utils::make_error(1, "LogScanner not available");
+        return utils::make_client_error("LogScanner not available");
     }
 
     auto ffi_result = scanner_->unsubscribe_partition(partition_id, bucket_id);
@@ -665,7 +651,7 @@ Result LogScanner::UnsubscribePartition(int64_t partition_id, int32_t bucket_id)
 
 Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
     if (!Available()) {
-        return utils::make_error(1, "LogScanner not available");
+        return utils::make_client_error("LogScanner not available");
     }
 
     auto ffi_result = scanner_->poll(timeout_ms);
@@ -721,7 +707,7 @@ int64_t ArrowRecordBatch::GetLastOffset() const {
 
 Result LogScanner::PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out) {
     if (!Available()) {
-        return utils::make_error(1, "LogScanner not available");
+        return utils::make_client_error("LogScanner not available");
     }
 
     auto ffi_result = scanner_->poll_record_batch(timeout_ms);
@@ -753,7 +739,7 @@ Result LogScanner::PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out)
             // Return an error indicating that the import failed
             std::string error_msg =
                 "Failed to import Arrow record batch: " + import_result.status().ToString();
-            return utils::make_error(1, error_msg);
+            return utils::make_client_error(error_msg);
         }
     }
 
diff --git a/fluss-rust/bindings/python/API_REFERENCE.md b/fluss-rust/bindings/python/API_REFERENCE.md
index 258b26e6e8..e16a82f87d 100644
--- a/fluss-rust/bindings/python/API_REFERENCE.md
+++ b/fluss-rust/bindings/python/API_REFERENCE.md
@@ -25,15 +25,15 @@ Complete API reference for the Fluss Python client. For a usage guide with examp
 | Method / Property | Description |
 |---|---|
 | `Config(properties: dict = None)` | Create config from a dict of key-value pairs |
-| `.bootstrap_server` | Get/set coordinator server address |
-| `.request_max_size` | Get/set max request size in bytes |
+| `.bootstrap_servers` | Get/set coordinator server address |
+| `.writer_request_max_size` | Get/set max request size in bytes |
 | `.writer_batch_size` | Get/set write batch size in bytes |
 
 ## `FlussConnection`
 
 | Method | Description |
 |---|---|
-| `await FlussConnection.connect(config) -> FlussConnection` | Connect to a Fluss cluster |
+| `await FlussConnection.create(config) -> FlussConnection` | Connect to a Fluss cluster |
 | `await conn.get_admin() -> FlussAdmin` | Get admin interface |
 | `await conn.get_table(table_path) -> FlussTable` | Get a table for read/write operations |
 | `conn.close()` | Close the connection |
@@ -44,14 +44,14 @@ Supports `with` statement (context manager).
 
 | Method | Description |
 |---|---|
-| `await create_database(name, ignore_if_exists=False, database_descriptor=None)` | Create a database |
+| `await create_database(name, database_descriptor=None, ignore_if_exists=False)` | Create a database |
 | `await drop_database(name, ignore_if_not_exists=False, cascade=True)` | Drop a database |
 | `await list_databases() -> list[str]` | List all databases |
 | `await database_exists(name) -> bool` | Check if a database exists |
 | `await get_database_info(name) -> DatabaseInfo` | Get database metadata |
 | `await create_table(table_path, table_descriptor, ignore_if_exists=False)` | Create a table |
 | `await drop_table(table_path, ignore_if_not_exists=False)` | Drop a table |
-| `await get_table(table_path) -> TableInfo` | Get table metadata |
+| `await get_table_info(table_path) -> TableInfo` | Get table metadata |
 | `await list_tables(database_name) -> list[str]` | List tables in a database |
 | `await table_exists(table_path) -> bool` | Check if a table exists |
 | `await list_offsets(table_path, bucket_ids, offset_type, timestamp=None) -> dict[int, int]` | Get offsets for buckets |
@@ -66,9 +66,9 @@ Supports `with` statement (context manager).
 | Method | Description |
 |---|---|
 | `new_scan() -> TableScan` | Create a scan builder |
-| `await new_append_writer() -> AppendWriter` | Create writer for log tables |
-| `new_upsert(columns=None, column_indices=None) -> UpsertWriter` | Create writer for PK tables (optionally partial) |
-| `new_lookup() -> Lookuper` | Create lookuper for PK tables |
+| `new_append() -> TableAppend` | Create an append builder for log tables |
+| `new_upsert() -> TableUpsert` | Create an upsert builder for PK tables |
+| `new_lookup() -> TableLookup` | Create a lookup builder for PK tables |
 | `get_table_info() -> TableInfo` | Get table metadata |
 | `get_table_path() -> TablePath` | Get table path |
 | `has_primary_key() -> bool` | Check if table has a primary key |
@@ -80,7 +80,33 @@ Supports `with` statement (context manager).
 | `.project(indices) -> TableScan` | Project columns by index |
 | `.project_by_name(names) -> TableScan` | Project columns by name |
 | `await .create_log_scanner() -> LogScanner` | Create record-based scanner (for `poll()`) |
-| `await .create_batch_scanner() -> LogScanner` | Create batch-based scanner (for `poll_arrow()`, `to_arrow()`, etc.) |
+| `await .create_record_batch_log_scanner() -> LogScanner` | Create batch-based scanner (for `poll_arrow()`, `to_arrow()`, etc.) |
+
+## `TableAppend`
+
+Builder for creating an `AppendWriter`. Obtain via `FlussTable.new_append()`.
+
+| Method | Description |
+|---|---|
+| `.create_writer() -> AppendWriter` | Create the append writer |
+
+## `TableUpsert`
+
+Builder for creating an `UpsertWriter`. Obtain via `FlussTable.new_upsert()`.
+
+| Method | Description |
+|---|---|
+| `.partial_update_by_name(columns) -> TableUpsert` | Configure partial update by column names |
+| `.partial_update_by_index(indices) -> TableUpsert` | Configure partial update by column indices |
+| `.create_writer() -> UpsertWriter` | Create the upsert writer |
+
+## `TableLookup`
+
+Builder for creating a `Lookuper`. Obtain via `FlussTable.new_lookup()`.
+
+| Method | Description |
+|---|---|
+| `.create_lookuper() -> Lookuper` | Create the lookuper |
 
 ## `AppendWriter`
 
@@ -123,7 +149,7 @@ Supports `with` statement (context manager).
 | `.unsubscribe_partition(partition_id, bucket_id)` | Unsubscribe from a partition bucket |
 | `.poll(timeout_ms) -> list[ScanRecord]` | Poll individual records (record scanner only) |
 | `.poll_arrow(timeout_ms) -> pa.Table` | Poll as Arrow Table (batch scanner only) |
-| `.poll_batches(timeout_ms) -> list[RecordBatch]` | Poll batches with metadata (batch scanner only) |
+| `.poll_record_batch(timeout_ms) -> list[RecordBatch]` | Poll batches with metadata (batch scanner only) |
 | `.to_arrow() -> pa.Table` | Read all subscribed data as Arrow Table (batch scanner only) |
 | `.to_pandas() -> pd.DataFrame` | Read all subscribed data as DataFrame (batch scanner only) |
 
diff --git a/fluss-rust/bindings/python/README.md b/fluss-rust/bindings/python/README.md
index a31c990ad3..20c5f5522a 100644
--- a/fluss-rust/bindings/python/README.md
+++ b/fluss-rust/bindings/python/README.md
@@ -54,7 +54,7 @@ import fluss
 async def main():
     # Connect
     config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
-    conn = await fluss.FlussConnection.connect(config)
+    conn = await fluss.FlussConnection.create(config)
     admin = await conn.get_admin()
 
     # Create a log table
@@ -68,14 +68,14 @@ async def main():
 
     # Write
     table = await conn.get_table(table_path)
-    writer = await table.new_append_writer()
+    writer = table.new_append().create_writer()
     writer.append({"id": 1, "name": "Alice", "score": 95.5})
     writer.append({"id": 2, "name": "Bob", "score": 87.0})
     await writer.flush()
 
     # Read
-    num_buckets = (await admin.get_table(table_path)).num_buckets
-    scanner = await table.new_scan().create_batch_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner = await table.new_scan().create_record_batch_log_scanner()
     scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
     print(scanner.to_pandas())
 
@@ -90,13 +90,13 @@ asyncio.run(main())
 
 ```python
 config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
-conn = await fluss.FlussConnection.connect(config)
+conn = await fluss.FlussConnection.create(config)
 ```
 
 The connection also supports context managers:
 
 ```python
-with await fluss.FlussConnection.connect(config) as conn:
+with await fluss.FlussConnection.create(config) as conn:
     ...
 ```
 
@@ -141,7 +141,7 @@ schema = fluss.Schema(pa.schema([
 table_path = fluss.TablePath("my_database", "my_table")
 await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
 
-table_info = await admin.get_table(table_path)
+table_info = await admin.get_table_info(table_path)
 tables = await admin.list_tables("my_database")
 await admin.drop_table(table_path, ignore_if_not_exists=True)
 ```
@@ -184,7 +184,7 @@ Write methods like `append()` and `write_arrow_batch()` return a `WriteResultHan
 
 ```python
 table = await conn.get_table(table_path)
-writer = await table.new_append_writer()
+writer = table.new_append().create_writer()
 
 # Fire-and-forget: queue writes, flush at the end
 writer.append({"id": 1, "name": "Alice", "score": 95.5})
@@ -205,19 +205,19 @@ await writer.flush()
 ### Reading
 
 There are two scanner types:
-- **Batch scanner** (`create_batch_scanner()`) — returns Arrow Tables or DataFrames, best for analytics
+- **Batch scanner** (`create_record_batch_log_scanner()`) — returns Arrow Tables or DataFrames, best for analytics
 - **Record scanner** (`create_log_scanner()`) — returns individual records with metadata (offset, timestamp, change type), best for streaming
 
 And two reading modes:
 - **`to_arrow()` / `to_pandas()`** — reads all data from subscribed buckets up to the current latest offset, then returns. Best for one-shot batch reads.
-- **`poll_arrow()` / `poll()` / `poll_batches()`** — returns whatever data is available within the timeout, then returns. Call in a loop for continuous streaming.
+- **`poll_arrow()` / `poll()` / `poll_record_batch()`** — returns whatever data is available within the timeout. Call in a loop for continuous streaming.
 
 #### Batch Read (One-Shot)
 
 ```python
-num_buckets = (await admin.get_table(table_path)).num_buckets
+num_buckets = (await admin.get_table_info(table_path)).num_buckets
 
-scanner = await table.new_scan().create_batch_scanner()
+scanner = await table.new_scan().create_record_batch_log_scanner()
 scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
 # Reads everything up to current latest offset, then returns
@@ -231,7 +231,7 @@ Use `poll_arrow()` or `poll()` in a loop for streaming consumption:
 
 ```python
 # Batch scanner: poll as Arrow Tables
-scanner = await table.new_scan().create_batch_scanner()
+scanner = await table.new_scan().create_record_batch_log_scanner()
 scanner.subscribe(bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
 
 while True:
@@ -253,16 +253,16 @@ while True:
 To only consume new records (skip existing data), use `LATEST_OFFSET`:
 
 ```python
-scanner = await table.new_scan().create_batch_scanner()
+scanner = await table.new_scan().create_record_batch_log_scanner()
 scanner.subscribe(bucket_id=0, start_offset=fluss.LATEST_OFFSET)
 ```
 
 ### Column Projection
 
 ```python
-scanner = await table.new_scan().project([0, 2]).create_batch_scanner()
+scanner = await table.new_scan().project([0, 2]).create_record_batch_log_scanner()
 # or by name
-scanner = await table.new_scan().project_by_name(["id", "score"]).create_batch_scanner()
+scanner = await table.new_scan().project_by_name(["id", "score"]).create_record_batch_log_scanner()
 ```
 
 ## Primary Key Tables
@@ -356,7 +356,7 @@ Same as non-partitioned tables — include partition column values in each row:
 
 ```python
 table = await conn.get_table(table_path)
-writer = await table.new_append_writer()
+writer = table.new_append().create_writer()
 writer.append({"id": 1, "region": "US", "value": 100})
 writer.append({"id": 2, "region": "EU", "value": 200})
 await writer.flush()
@@ -367,7 +367,7 @@ await writer.flush()
 Use `subscribe_partition()` or `subscribe_partition_buckets()` instead of `subscribe()`:
 
 ```python
-scanner = await table.new_scan().create_batch_scanner()
+scanner = await table.new_scan().create_record_batch_log_scanner()
 
 # Subscribe to individual partitions
 for p in partition_infos:
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 3d4235392d..8e68843266 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -32,15 +32,15 @@ async def main():
     config_spec = {
         "bootstrap.servers": "127.0.0.1:9123",
         # Add other configuration options as needed
-        "request.max.size": "10485760",  # 10 MB
+        "writer.request-max-size": "10485760",  # 10 MB
         "writer.acks": "all",  # Wait for all replicas to acknowledge
         "writer.retries": "3",  # Retry up to 3 times on failure
-        "writer.batch.size": "1000",  # Batch size for writes
+        "writer.batch-size": "1000",  # Batch size for writes
     }
     config = fluss.Config(config_spec)
 
-    # Create connection using the static connect method
-    conn = await fluss.FlussConnection.connect(config)
+    # Create connection using the static create method
+    conn = await fluss.FlussConnection.create(config)
 
     # Define fields for PyArrow
     fields = [
@@ -78,7 +78,7 @@ async def main():
 
     # Get table information via admin
     try:
-        table_info = await admin.get_table(table_path)
+        table_info = await admin.get_table_info(table_path)
         print(f"Table info: {table_info}")
         print(f"Table ID: {table_info.table_id}")
         print(f"Schema ID: {table_info.schema_id}")
@@ -105,7 +105,7 @@ async def main():
     print(f"Got table: {table}")
 
     # Create a writer for the table
-    append_writer = await table.new_append_writer()
+    append_writer = table.new_append().create_writer()
     print(f"Created append writer: {append_writer}")
 
     try:
@@ -264,13 +264,13 @@ async def main():
     # Now scan the table to verify data was written
     print("\n--- Scanning table (batch scanner) ---")
     try:
-        # Use new_scan().create_batch_scanner() for batch-based operations
-        batch_scanner = await table.new_scan().create_batch_scanner()
+        # Use new_scan().create_record_batch_log_scanner() for batch-based operations
+        batch_scanner = await table.new_scan().create_record_batch_log_scanner()
         print(f"Created batch scanner: {batch_scanner}")
 
         # Subscribe to buckets (required before to_arrow/to_pandas)
         # Use subscribe_buckets to subscribe all buckets from EARLIEST_OFFSET
-        num_buckets = (await admin.get_table(table_path)).num_buckets
+        num_buckets = (await admin.get_table_info(table_path)).num_buckets
         batch_scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
         print(f"Subscribed to {num_buckets} buckets from EARLIEST_OFFSET")
 
@@ -285,7 +285,7 @@ async def main():
             print(f"Could not convert to PyArrow: {e}")
 
         # Create a new batch scanner for to_pandas() test
-        batch_scanner2 = await table.new_scan().create_batch_scanner()
+        batch_scanner2 = await table.new_scan().create_record_batch_log_scanner()
         batch_scanner2.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
         # Try to get as Pandas DataFrame
@@ -302,7 +302,7 @@ async def main():
 
         # Test poll_arrow() method for incremental reading as Arrow Table
         print("\n--- Testing poll_arrow() method ---")
-        batch_scanner3 = await table.new_scan().create_batch_scanner()
+        batch_scanner3 = await table.new_scan().create_record_batch_log_scanner()
         batch_scanner3.subscribe(bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
         print(f"Subscribed to bucket 0 at EARLIEST_OFFSET ({fluss.EARLIEST_OFFSET})")
 
@@ -323,13 +323,13 @@ async def main():
         except Exception as e:
             print(f"Error during poll_arrow: {e}")
 
-        # Test poll_batches() method for batches with metadata
-        print("\n--- Testing poll_batches() method ---")
-        batch_scanner4 = await table.new_scan().create_batch_scanner()
+        # Test poll_record_batch() method for batches with metadata
+        print("\n--- Testing poll_record_batch() method ---")
+        batch_scanner4 = await table.new_scan().create_record_batch_log_scanner()
         batch_scanner4.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
         try:
-            batches = batch_scanner4.poll_batches(5000)
+            batches = batch_scanner4.poll_record_batch(5000)
             print(f"Number of batches: {len(batches)}")
 
             for i, batch in enumerate(batches):
@@ -338,7 +338,7 @@ async def main():
                       f"rows={batch.batch.num_rows}")
 
         except Exception as e:
-            print(f"Error during poll_batches: {e}")
+            print(f"Error during poll_record_batch: {e}")
 
     except Exception as e:
         print(f"Error during batch scanning: {e}")
@@ -419,7 +419,7 @@ async def main():
     # --- Test Upsert ---
     print("\n--- Testing Upsert (fire-and-forget) ---")
     try:
-        upsert_writer = pk_table.new_upsert()
+        upsert_writer = pk_table.new_upsert().create_writer()
         print(f"Created upsert writer: {upsert_writer}")
 
         # Fire-and-forget: queue writes synchronously, flush at end.
@@ -504,7 +504,7 @@ async def main():
     # --- Test Lookup ---
     print("\n--- Testing Lookup ---")
     try:
-        lookuper = pk_table.new_lookup()
+        lookuper = pk_table.new_lookup().create_lookuper()
         print(f"Created lookuper: {lookuper}")
 
         result = await lookuper.lookup({"user_id": 1})
@@ -552,13 +552,13 @@ async def main():
     # --- Test Delete ---
     print("\n--- Testing Delete ---")
     try:
-        upsert_writer = pk_table.new_upsert()
+        upsert_writer = pk_table.new_upsert().create_writer()
 
         handle = upsert_writer.delete({"user_id": 3})
         await handle.wait()
         print("Deleted user_id=3 — server acknowledged")
 
-        lookuper = pk_table.new_lookup()
+        lookuper = pk_table.new_lookup().create_lookuper()
         result = await lookuper.lookup({"user_id": 3})
         if result:
             print(f"Lookup user_id=3 after delete: Still found! -> {result}")
@@ -572,12 +572,12 @@ async def main():
     # --- Test Partial Update by column names ---
     print("\n--- Testing Partial Update (by column names) ---")
     try:
-        partial_writer = pk_table.new_upsert(columns=["user_id", "balance"])
+        partial_writer = pk_table.new_upsert().partial_update_by_name(["user_id", "balance"]).create_writer()
         handle = partial_writer.upsert({"user_id": 1, "balance": Decimal("9999.99")})
         await handle.wait()
         print("Partial update: set balance=9999.99 for user_id=1")
 
-        lookuper = pk_table.new_lookup()
+        lookuper = pk_table.new_lookup().create_lookuper()
         result = await lookuper.lookup({"user_id": 1})
         if result:
             print(f"Partial update verified:"
@@ -594,12 +594,12 @@ async def main():
     print("\n--- Testing Partial Update (by column indices) ---")
     try:
         # Columns: 0=user_id (PK), 1=name — update name only
-        partial_writer_idx = pk_table.new_upsert(column_indices=[0, 1])
+        partial_writer_idx = pk_table.new_upsert().partial_update_by_index([0, 1]).create_writer()
         handle = partial_writer_idx.upsert([1, "Alice Renamed"])
         await handle.wait()
         print("Partial update by indices: set name='Alice Renamed' for user_id=1")
 
-        lookuper = pk_table.new_lookup()
+        lookuper = pk_table.new_lookup().create_lookuper()
         result = await lookuper.lookup({"user_id": 1})
         if result:
             print(f"Partial update by indices verified:"
@@ -616,11 +616,11 @@ async def main():
     print("\n--- Testing Column Projection ---")
     try:
         # Get bucket count for subscriptions
-        num_buckets = (await admin.get_table(table_path)).num_buckets
+        num_buckets = (await admin.get_table_info(table_path)).num_buckets
 
         # Project specific columns by index (using batch scanner for to_pandas)
         print("\n1. Projection by index [0, 1] (id, name):")
-        scanner_index = await table.new_scan().project([0, 1]).create_batch_scanner()
+        scanner_index = await table.new_scan().project([0, 1]).create_record_batch_log_scanner()
         scanner_index.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
         df_projected = scanner_index.to_pandas()
         print(df_projected.head())
@@ -632,7 +632,7 @@ async def main():
         print("\n2. Projection by name ['name', 'score'] (Pythonic):")
         scanner_names = await table.new_scan() \
             .project_by_name(["name", "score"]) \
-            .create_batch_scanner()
+            .create_record_batch_log_scanner()
         scanner_names.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
         df_named = scanner_names.to_pandas()
         print(df_named.head())
@@ -640,7 +640,7 @@ async def main():
 
         # Test empty result schema with projection
         print("\n3. Testing empty result schema with projection:")
-        scanner_proj = await table.new_scan().project([0, 2]).create_batch_scanner()
+        scanner_proj = await table.new_scan().project([0, 2]).create_record_batch_log_scanner()
         scanner_proj.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
         # Quick poll that may return empty
         result = scanner_proj.poll_arrow(100)
@@ -709,7 +709,7 @@ async def main():
 
         # Get the table and write some data
         partitioned_table = await conn.get_table(partitioned_table_path)
-        partitioned_writer = await partitioned_table.new_append_writer()
+        partitioned_writer = partitioned_table.new_append().create_writer()
 
         # Append data to US partition
         partitioned_writer.append({"id": 1, "region": "US", "value": 100})
@@ -744,7 +744,7 @@ async def main():
 
         # Demo: subscribe_partition for reading partitioned data
         print("\n--- Testing subscribe_partition + to_arrow() ---")
-        partitioned_scanner = await partitioned_table.new_scan().create_batch_scanner()
+        partitioned_scanner = await partitioned_table.new_scan().create_record_batch_log_scanner()
 
         # Subscribe to each partition using partition_id
         for p in partition_infos:
@@ -762,7 +762,7 @@ async def main():
 
         # Demo: subscribe_partition_buckets for batch subscribing to multiple partitions at once
         print("\n--- Testing subscribe_partition_buckets + to_arrow() ---")
-        partitioned_scanner_batch = await partitioned_table.new_scan().create_batch_scanner()
+        partitioned_scanner_batch = await partitioned_table.new_scan().create_record_batch_log_scanner()
         partition_bucket_offsets = {
             (p.partition_id, 0): fluss.EARLIEST_OFFSET for p in partition_infos
         }
@@ -774,7 +774,7 @@ async def main():
 
         # Demo: unsubscribe_partition - unsubscribe from one partition, read remaining
         print("\n--- Testing unsubscribe_partition ---")
-        partitioned_scanner3 = await partitioned_table.new_scan().create_batch_scanner()
+        partitioned_scanner3 = await partitioned_table.new_scan().create_record_batch_log_scanner()
         for p in partition_infos:
             partitioned_scanner3.subscribe_partition(p.partition_id, 0, fluss.EARLIEST_OFFSET)
         # Unsubscribe from the first partition
@@ -787,7 +787,7 @@ async def main():
 
         # Demo: to_pandas() also works for partitioned tables
         print("\n--- Testing to_pandas() on partitioned table ---")
-        partitioned_scanner2 = await partitioned_table.new_scan().create_batch_scanner()
+        partitioned_scanner2 = await partitioned_table.new_scan().create_record_batch_log_scanner()
         for p in partition_infos:
             partitioned_scanner2.subscribe_partition(p.partition_id, 0, fluss.EARLIEST_OFFSET)
         partitioned_df = partitioned_scanner2.to_pandas()
@@ -839,7 +839,7 @@ async def main():
         print("Created partitions: US, EU, APAC")
 
         partitioned_kv_table = await conn.get_table(partitioned_kv_path)
-        upsert_writer = partitioned_kv_table.new_upsert()
+        upsert_writer = partitioned_kv_table.new_upsert().create_writer()
 
         # Upsert rows across partitions
         test_data = [
@@ -859,7 +859,7 @@ async def main():
 
         # Lookup all rows across partitions
         print("\n--- Lookup across partitions ---")
-        lookuper = partitioned_kv_table.new_lookup()
+        lookuper = partitioned_kv_table.new_lookup().create_lookuper()
         for region, user_id, name, score in test_data:
             result = await lookuper.lookup({"region": region, "user_id": user_id})
             assert result is not None, f"Expected to find region={region} user_id={user_id}"
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index adbfc2fe02..55837de536 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -93,21 +93,37 @@ class RecordBatch:
 class Config:
     def __init__(self, properties: Optional[Dict[str, str]] = None) -> None: ...
     @property
-    def bootstrap_server(self) -> Optional[str]: ...
-    @bootstrap_server.setter
-    def bootstrap_server(self, server: str) -> None: ...
+    def bootstrap_servers(self) -> str: ...
+    @bootstrap_servers.setter
+    def bootstrap_servers(self, server: str) -> None: ...
     @property
-    def request_max_size(self) -> int: ...
-    @request_max_size.setter
-    def request_max_size(self, size: int) -> None: ...
+    def writer_request_max_size(self) -> int: ...
+    @writer_request_max_size.setter
+    def writer_request_max_size(self, size: int) -> None: ...
+    @property
+    def writer_acks(self) -> str: ...
+    @writer_acks.setter
+    def writer_acks(self, acks: str) -> None: ...
+    @property
+    def writer_retries(self) -> int: ...
+    @writer_retries.setter
+    def writer_retries(self, retries: int) -> None: ...
     @property
     def writer_batch_size(self) -> int: ...
     @writer_batch_size.setter
     def writer_batch_size(self, size: int) -> None: ...
+    @property
+    def scanner_remote_log_prefetch_num(self) -> int: ...
+    @scanner_remote_log_prefetch_num.setter
+    def scanner_remote_log_prefetch_num(self, num: int) -> None: ...
+    @property
+    def remote_file_download_thread_num(self) -> int: ...
+    @remote_file_download_thread_num.setter
+    def remote_file_download_thread_num(self, num: int) -> None: ...
 
 class FlussConnection:
     @staticmethod
-    async def connect(config: Config) -> FlussConnection: ...
+    async def create(config: Config) -> FlussConnection: ...
     async def get_admin(self) -> FlussAdmin: ...
     async def get_table(self, table_path: TablePath) -> FlussTable: ...
     def close(self) -> None: ...
@@ -124,8 +140,8 @@ class FlussAdmin:
     async def create_database(
         self,
         database_name: str,
-        ignore_if_exists: bool = False,
         database_descriptor: Optional["DatabaseDescriptor"] = None,
+        ignore_if_exists: bool = False,
     ) -> None:
         """Create a database."""
         ...
@@ -166,7 +182,7 @@ class FlussAdmin:
         table_descriptor: TableDescriptor,
         ignore_if_exists: Optional[bool] = False,
     ) -> None: ...
-    async def get_table(self, table_path: TablePath) -> TableInfo: ...
+    async def get_table_info(self, table_path: TablePath) -> TableInfo: ...
     async def get_latest_lake_snapshot(self, table_path: TablePath) -> LakeSnapshot: ...
     async def drop_table(
         self,
@@ -285,7 +301,7 @@ class TableScan:
         # Batch-based scanning with column names
         scanner = await table.new_scan() \\
             .project_by_name(["id", "name"]) \\
-            .create_batch_scanner()
+            .create_record_batch_log_scanner()
         ```
     """
 
@@ -319,14 +335,14 @@ class TableScan:
             LogScanner for record-by-record scanning with `poll()`
         """
         ...
-    async def create_batch_scanner(self) -> LogScanner:
+    async def create_record_batch_log_scanner(self) -> LogScanner:
         """Create a batch-based log scanner.
 
         Use this scanner with `poll_arrow()` to get Arrow Tables, or with
-        `poll_batches()` to get individual batches with metadata.
+        `poll_record_batch()` to get individual batches with metadata.
 
         Returns:
-            LogScanner for batch-based scanning with `poll_arrow()` or `poll_batches()`
+            LogScanner for batch-based scanning with `poll_arrow()` or `poll_record_batch()`
         """
         ...
     def __repr__(self) -> str: ...
@@ -347,25 +363,68 @@ class FlussTable:
             # Batch-based scanning
             scanner = await table.new_scan() \\
                 .project_by_name(["id", "name"]) \\
-                .create_batch_scanner()
+                .create_record_batch_log_scanner()
             ```
 
         Returns:
             TableScan builder for configuring the scanner.
         """
         ...
-    async def new_append_writer(self) -> AppendWriter: ...
-    def new_upsert(
-        self,
-        columns: Optional[List[str]] = None,
-        column_indices: Optional[List[int]] = None,
-    ) -> UpsertWriter: ...
-    def new_lookup(self) -> Lookuper: ...
+    def new_append(self) -> TableAppend: ...
+    def new_upsert(self) -> TableUpsert: ...
+    def new_lookup(self) -> TableLookup: ...
     def get_table_info(self) -> TableInfo: ...
     def get_table_path(self) -> TablePath: ...
     def has_primary_key(self) -> bool: ...
     def __repr__(self) -> str: ...
 
+class TableAppend:
+    """Builder for creating an AppendWriter.
+
+    Obtain via `FlussTable.new_append()`, then call `create_writer()`.
+
+    Example:
+        writer = table.new_append().create_writer()
+    """
+
+    def create_writer(self) -> AppendWriter: ...
+    def __repr__(self) -> str: ...
+
+class TableUpsert:
+    """Builder for creating an UpsertWriter, with optional partial update.
+
+    Obtain via `FlussTable.new_upsert()`, then optionally call
+    `partial_update_by_name()` or `partial_update_by_index()`,
+    then call `create_writer()`.
+
+    Example:
+        # Full row upsert
+        writer = table.new_upsert().create_writer()
+
+        # Partial update by column names
+        writer = table.new_upsert().partial_update_by_name(["col1", "col2"]).create_writer()
+
+        # Partial update by column indices
+        writer = table.new_upsert().partial_update_by_index([0, 1]).create_writer()
+    """
+
+    def partial_update_by_name(self, columns: List[str]) -> "TableUpsert": ...
+    def partial_update_by_index(self, column_indices: List[int]) -> "TableUpsert": ...
+    def create_writer(self) -> UpsertWriter: ...
+    def __repr__(self) -> str: ...
+
+class TableLookup:
+    """Builder for creating a Lookuper.
+
+    Obtain via `FlussTable.new_lookup()`, then call `create_lookuper()`.
+
+    Example:
+        lookuper = table.new_lookup().create_lookuper()
+    """
+
+    def create_lookuper(self) -> Lookuper: ...
+    def __repr__(self) -> str: ...
+
 class AppendWriter:
     def append(self, row: dict | list | tuple) -> WriteResultHandle:
         """Append a single row to the table.
@@ -465,14 +524,14 @@ class LogScanner:
 
     This scanner supports two modes:
     - Record-based scanning via `poll()` - returns individual records with metadata
-    - Batch-based scanning via `poll_arrow()` / `poll_batches()` - returns Arrow batches
+    - Batch-based scanning via `poll_arrow()` / `poll_record_batch()` - returns Arrow batches
 
     Create scanners using the builder pattern:
         # Record-based scanning
         scanner = await table.new_scan().create_log_scanner()
 
         # Batch-based scanning
-        scanner = await table.new_scan().create_batch_scanner()
+        scanner = await table.new_scan().create_record_batch_log_scanner()
 
         # With projection
         scanner = await table.new_scan().project([0, 1]).create_log_scanner()
@@ -538,10 +597,10 @@ class LogScanner:
             Returns an empty list if no records are available or timeout expires.
         """
         ...
-    def poll_batches(self, timeout_ms: int) -> List[RecordBatch]:
+    def poll_record_batch(self, timeout_ms: int) -> List[RecordBatch]:
         """Poll for batches with metadata.
 
-        Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+        Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner()).
 
         Args:
             timeout_ms: Timeout in milliseconds to wait for batches.
@@ -557,7 +616,7 @@ class LogScanner:
     def poll_arrow(self, timeout_ms: int) -> pa.Table:
         """Poll for records as an Arrow Table.
 
-        Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+        Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner()).
 
         Args:
             timeout_ms: Timeout in milliseconds to wait for records.
@@ -573,7 +632,7 @@ class LogScanner:
     def to_pandas(self) -> pd.DataFrame:
         """Convert all data to Pandas DataFrame.
 
-        Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+        Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner()).
         Reads from currently subscribed buckets until reaching their latest offsets.
 
         You must call subscribe(), subscribe_buckets(), or subscribe_partition() first.
@@ -582,7 +641,7 @@ class LogScanner:
     def to_arrow(self) -> pa.Table:
         """Convert all data to Arrow Table.
 
-        Requires a batch-based scanner (created with new_scan().create_batch_scanner()).
+        Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner()).
         Reads from currently subscribed buckets until reaching their latest offsets.
 
         You must call subscribe(), subscribe_buckets(), or subscribe_partition() first.
@@ -655,7 +714,8 @@ class TableInfo:
 
 class FlussError(Exception):
     message: str
-    def __init__(self, message: str) -> None: ...
+    error_code: int
+    def __init__(self, message: str, error_code: int = -2) -> None: ...
     def __str__(self) -> str: ...
 
 class LakeSnapshot:
@@ -703,6 +763,76 @@ class PartitionInfo:
         ...
     def __repr__(self) -> str: ...
 
+class ErrorCode:
+    """Named constants for Fluss API error codes.
+
+    Server API errors have error_code > 0 or == -1.
+    Client-side errors have error_code == CLIENT_ERROR (-2).
+    These constants are convenience names — new server error codes work
+    automatically since error_code is a raw int, not a closed enum.
+    """
+
+    CLIENT_ERROR: int
+    NONE: int
+    UNKNOWN_SERVER_ERROR: int
+    NETWORK_EXCEPTION: int
+    UNSUPPORTED_VERSION: int
+    CORRUPT_MESSAGE: int
+    DATABASE_NOT_EXIST: int
+    DATABASE_NOT_EMPTY: int
+    DATABASE_ALREADY_EXIST: int
+    TABLE_NOT_EXIST: int
+    TABLE_ALREADY_EXIST: int
+    SCHEMA_NOT_EXIST: int
+    LOG_STORAGE_EXCEPTION: int
+    KV_STORAGE_EXCEPTION: int
+    NOT_LEADER_OR_FOLLOWER: int
+    RECORD_TOO_LARGE_EXCEPTION: int
+    CORRUPT_RECORD_EXCEPTION: int
+    INVALID_TABLE_EXCEPTION: int
+    INVALID_DATABASE_EXCEPTION: int
+    INVALID_REPLICATION_FACTOR: int
+    INVALID_REQUIRED_ACKS: int
+    LOG_OFFSET_OUT_OF_RANGE_EXCEPTION: int
+    NON_PRIMARY_KEY_TABLE_EXCEPTION: int
+    UNKNOWN_TABLE_OR_BUCKET_EXCEPTION: int
+    INVALID_UPDATE_VERSION_EXCEPTION: int
+    INVALID_COORDINATOR_EXCEPTION: int
+    FENCED_LEADER_EPOCH_EXCEPTION: int
+    REQUEST_TIME_OUT: int
+    STORAGE_EXCEPTION: int
+    OPERATION_NOT_ATTEMPTED_EXCEPTION: int
+    NOT_ENOUGH_REPLICAS_AFTER_APPEND_EXCEPTION: int
+    NOT_ENOUGH_REPLICAS_EXCEPTION: int
+    SECURITY_TOKEN_EXCEPTION: int
+    OUT_OF_ORDER_SEQUENCE_EXCEPTION: int
+    DUPLICATE_SEQUENCE_EXCEPTION: int
+    UNKNOWN_WRITER_ID_EXCEPTION: int
+    INVALID_COLUMN_PROJECTION: int
+    INVALID_TARGET_COLUMN: int
+    PARTITION_NOT_EXISTS: int
+    TABLE_NOT_PARTITIONED_EXCEPTION: int
+    INVALID_TIMESTAMP_EXCEPTION: int
+    INVALID_CONFIG_EXCEPTION: int
+    LAKE_STORAGE_NOT_CONFIGURED_EXCEPTION: int
+    KV_SNAPSHOT_NOT_EXIST: int
+    PARTITION_ALREADY_EXISTS: int
+    PARTITION_SPEC_INVALID_EXCEPTION: int
+    LEADER_NOT_AVAILABLE_EXCEPTION: int
+    PARTITION_MAX_NUM_EXCEPTION: int
+    AUTHENTICATE_EXCEPTION: int
+    SECURITY_DISABLED_EXCEPTION: int
+    AUTHORIZATION_EXCEPTION: int
+    BUCKET_MAX_NUM_EXCEPTION: int
+    FENCED_TIERING_EPOCH_EXCEPTION: int
+    RETRIABLE_AUTHENTICATE_EXCEPTION: int
+    INVALID_SERVER_RACK_INFO_EXCEPTION: int
+    LAKE_SNAPSHOT_NOT_EXIST: int
+    LAKE_TABLE_ALREADY_EXIST: int
+    INELIGIBLE_REPLICA_EXCEPTION: int
+    INVALID_ALTER_TABLE_EXCEPTION: int
+    DELETION_DISABLED_EXCEPTION: int
+
 class OffsetType:
     """Offset type constants for list_offsets()."""
 
diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
index 335aa248ad..d03ce7a21c 100644
--- a/fluss-rust/bindings/python/src/admin.rs
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -67,13 +67,13 @@ impl FlussAdmin {
     ///
     /// Returns:
     ///     None
-    #[pyo3(signature = (database_name, ignore_if_exists=false, database_descriptor=None))]
+    #[pyo3(signature = (database_name, database_descriptor=None, ignore_if_exists=false))]
     pub fn create_database<'py>(
         &self,
         py: Python<'py>,
         database_name: &str,
-        ignore_if_exists: bool,
         database_descriptor: Option<&DatabaseDescriptor>,
+        ignore_if_exists: bool,
     ) -> PyResult<Bound<'py, PyAny>> {
         let admin = self.__admin.clone();
         let name = database_name.to_string();
@@ -81,9 +81,9 @@ impl FlussAdmin {
 
         future_into_py(py, async move {
             admin
-                .create_database(&name, ignore_if_exists, descriptor.as_ref())
+                .create_database(&name, descriptor.as_ref(), ignore_if_exists)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to create database: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| Ok(py.None()))
         })
@@ -113,7 +113,7 @@ impl FlussAdmin {
             admin
                 .drop_database(&name, ignore_if_not_exists, cascade)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to drop database: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| Ok(py.None()))
         })
@@ -130,7 +130,7 @@ impl FlussAdmin {
             let names = admin
                 .list_databases()
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to list databases: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| {
                 let py_list = pyo3::types::PyList::empty(py);
@@ -158,9 +158,10 @@ impl FlussAdmin {
         let name = database_name.to_string();
 
         future_into_py(py, async move {
-            let exists = admin.database_exists(&name).await.map_err(|e| {
-                FlussError::new_err(format!("Failed to check database exists: {e}"))
-            })?;
+            let exists = admin
+                .database_exists(&name)
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| Ok(exists.into_pyobject(py)?.to_owned().into_any().unbind()))
         })
@@ -185,7 +186,7 @@ impl FlussAdmin {
             let info = admin
                 .get_database_info(&name)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to get database info: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| Py::new(py, DatabaseInfo::from_core(info)))
         })
@@ -210,7 +211,7 @@ impl FlussAdmin {
             let names = admin
                 .list_tables(&name)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to list tables: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| {
                 let py_list = pyo3::types::PyList::empty(py);
@@ -241,7 +242,7 @@ impl FlussAdmin {
             let exists = admin
                 .table_exists(&core_table_path)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to check table exists: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| Ok(exists.into_pyobject(py)?.to_owned().into_any().unbind()))
         })
@@ -272,7 +273,7 @@ impl FlussAdmin {
             admin
                 .drop_partition(&core_table_path, &core_partition_spec, ignore_if_not_exists)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to drop partition: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| Ok(py.None()))
         })
@@ -297,14 +298,14 @@ impl FlussAdmin {
             admin
                 .create_table(&core_table_path, &core_descriptor, ignore)
                 .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| Ok(py.None()))
         })
     }
 
     /// Get table information
-    pub fn get_table<'py>(
+    pub fn get_table_info<'py>(
         &self,
         py: Python<'py>,
         table_path: &TablePath,
@@ -314,9 +315,9 @@ impl FlussAdmin {
 
         future_into_py(py, async move {
             let core_table_info = admin
-                .get_table(&core_table_path)
+                .get_table_info(&core_table_path)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to get table: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| {
                 let table_info = TableInfo::from_core(core_table_info);
@@ -338,7 +339,7 @@ impl FlussAdmin {
             let core_lake_snapshot = admin
                 .get_latest_lake_snapshot(&core_table_path)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to get lake snapshot: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| {
                 let lake_snapshot = LakeSnapshot::from_core(core_lake_snapshot);
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index 1e80dbf3c9..237ab6fae0 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -40,11 +40,11 @@ impl Config {
 
                 match key.as_str() {
                     "bootstrap.servers" => {
-                        config.bootstrap_server = value;
+                        config.bootstrap_servers = value;
                     }
-                    "request.max.size" => {
+                    "writer.request-max-size" => {
                         if let Ok(size) = value.parse::<i32>() {
-                            config.request_max_size = size;
+                            config.writer_request_max_size = size;
                         }
                     }
                     "writer.acks" => {
@@ -55,11 +55,21 @@ impl Config {
                             config.writer_retries = retries;
                         }
                     }
-                    "writer.batch.size" => {
+                    "writer.batch-size" => {
                         if let Ok(size) = value.parse::<i32>() {
                             config.writer_batch_size = size;
                         }
                     }
+                    "scanner.remote-log.prefetch-num" => {
+                        config.scanner_remote_log_prefetch_num = value
+                            .parse::<usize>()
+                            .map_err(|e| FlussError::new_err(format!("Invalid {key}: {e}")))?;
+                    }
+                    "remote-file.download-thread-num" => {
+                        config.remote_file_download_thread_num = value
+                            .parse::<usize>()
+                            .map_err(|e| FlussError::new_err(format!("Invalid {key}: {e}")))?;
+                    }
                     _ => {
                         return Err(FlussError::new_err(format!("Unknown property: {key}")));
                     }
@@ -70,28 +80,52 @@ impl Config {
         Ok(Self { inner: config })
     }
 
-    /// Get the bootstrap server
+    /// Get the bootstrap servers
+    #[getter]
+    fn bootstrap_servers(&self) -> String {
+        self.inner.bootstrap_servers.clone()
+    }
+
+    /// Set the bootstrap servers
+    #[setter]
+    fn set_bootstrap_servers(&mut self, server: String) {
+        self.inner.bootstrap_servers = server;
+    }
+
+    /// Get the writer request max size
+    #[getter]
+    fn writer_request_max_size(&self) -> i32 {
+        self.inner.writer_request_max_size
+    }
+
+    /// Set the writer request max size
+    #[setter]
+    fn set_writer_request_max_size(&mut self, size: i32) {
+        self.inner.writer_request_max_size = size;
+    }
+
+    /// Get the writer acks
     #[getter]
-    fn bootstrap_server(&self) -> String {
-        self.inner.bootstrap_server.clone()
+    fn writer_acks(&self) -> String {
+        self.inner.writer_acks.clone()
     }
 
-    /// Set the bootstrap server
+    /// Set the writer acks
     #[setter]
-    fn set_bootstrap_server(&mut self, server: String) {
-        self.inner.bootstrap_server = server;
+    fn set_writer_acks(&mut self, acks: String) {
+        self.inner.writer_acks = acks;
     }
 
-    /// Get the request max size
+    /// Get the writer retries
     #[getter]
-    fn request_max_size(&self) -> i32 {
-        self.inner.request_max_size
+    fn writer_retries(&self) -> i32 {
+        self.inner.writer_retries
     }
 
-    /// Set the request max size
+    /// Set the writer retries
     #[setter]
-    fn set_request_max_size(&mut self, size: i32) {
-        self.inner.request_max_size = size;
+    fn set_writer_retries(&mut self, retries: i32) {
+        self.inner.writer_retries = retries;
     }
 
     /// Get the writer batch size
@@ -105,6 +139,30 @@ impl Config {
     fn set_writer_batch_size(&mut self, size: i32) {
         self.inner.writer_batch_size = size;
     }
+
+    /// Get the scanner remote log prefetch num
+    #[getter]
+    fn scanner_remote_log_prefetch_num(&self) -> usize {
+        self.inner.scanner_remote_log_prefetch_num
+    }
+
+    /// Set the scanner remote log prefetch num
+    #[setter]
+    fn set_scanner_remote_log_prefetch_num(&mut self, num: usize) {
+        self.inner.scanner_remote_log_prefetch_num = num;
+    }
+
+    /// Get the remote file download thread num
+    #[getter]
+    fn remote_file_download_thread_num(&self) -> usize {
+        self.inner.remote_file_download_thread_num
+    }
+
+    /// Set the remote file download thread num
+    #[setter]
+    fn set_remote_file_download_thread_num(&mut self, num: usize) {
+        self.inner.remote_file_download_thread_num = num;
+    }
 }
 
 impl Config {
diff --git a/fluss-rust/bindings/python/src/connection.rs b/fluss-rust/bindings/python/src/connection.rs
index a7559cec57..31a9505bba 100644
--- a/fluss-rust/bindings/python/src/connection.rs
+++ b/fluss-rust/bindings/python/src/connection.rs
@@ -29,13 +29,13 @@ pub struct FlussConnection {
 impl FlussConnection {
     /// Create a new FlussConnection (async)
     #[staticmethod]
-    fn connect<'py>(py: Python<'py>, config: &Config) -> PyResult<Bound<'py, PyAny>> {
+    fn create<'py>(py: Python<'py>, config: &Config) -> PyResult<Bound<'py, PyAny>> {
         let rust_config = config.get_core_config();
 
         future_into_py(py, async move {
             let connection = fcore::client::FlussConnection::new(rust_config)
                 .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             let py_connection = FlussConnection {
                 inner: Arc::new(connection),
@@ -53,7 +53,7 @@ impl FlussConnection {
             let admin = client
                 .get_admin()
                 .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             let py_admin = FlussAdmin::from_core(admin);
 
@@ -74,12 +74,12 @@ impl FlussConnection {
             let core_table = client
                 .get_table(&core_path)
                 .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             let py_table = FlussTable::new_table(
                 client.clone(),
                 core_table.metadata().clone(),
-                core_table.table_info().clone(),
+                core_table.get_table_info().clone(),
                 core_table.table_path().clone(),
                 core_table.has_primary_key(),
             );
diff --git a/fluss-rust/bindings/python/src/error.rs b/fluss-rust/bindings/python/src/error.rs
index 35d9d9149f..606b9f4fd3 100644
--- a/fluss-rust/bindings/python/src/error.rs
+++ b/fluss-rust/bindings/python/src/error.rs
@@ -18,28 +18,249 @@
 use pyo3::exceptions::PyException;
 use pyo3::prelude::*;
 
+/// Error code for client-side errors that did not originate from the server API protocol.
+/// The value -2 is outside the server API error code range (-1 .. 57+), so it will never
+/// collide with current or future API codes. Consistent with the CPP binding.
+const CLIENT_ERROR_CODE: i32 = -2;
+
 /// Fluss errors
 #[pyclass(extends=PyException)]
 #[derive(Debug, Clone)]
 pub struct FlussError {
     #[pyo3(get)]
     pub message: String,
+    #[pyo3(get)]
+    pub error_code: i32,
 }
 
 #[pymethods]
 impl FlussError {
     #[new]
-    fn new(message: String) -> Self {
-        Self { message }
+    #[pyo3(signature = (message, error_code=-2))]
+    fn new(message: String, error_code: i32) -> Self {
+        Self {
+            message,
+            error_code,
+        }
     }
 
     fn __str__(&self) -> String {
-        format!("FlussError: {}", self.message)
+        if self.error_code != CLIENT_ERROR_CODE {
+            format!("FlussError(code={}): {}", self.error_code, self.message)
+        } else {
+            format!("FlussError: {}", self.message)
+        }
     }
 }
 
 impl FlussError {
     pub fn new_err(message: impl ToString) -> PyErr {
-        PyErr::new::<FlussError, _>(message.to_string())
+        PyErr::new::<FlussError, _>((message.to_string(), CLIENT_ERROR_CODE))
+    }
+
+    /// Create a PyErr from a core Error.
+    /// `FlussAPIError` variants carry the server protocol error code directly.
+    /// All other error kinds are client-side and use CLIENT_ERROR_CODE.
+    pub fn from_core_error(error: &fluss::error::Error) -> PyErr {
+        use fluss::error::Error;
+        let (msg, code) = match error {
+            Error::FlussAPIError { api_error } => (api_error.message.clone(), api_error.code),
+            _ => (error.to_string(), CLIENT_ERROR_CODE),
+        };
+        PyErr::new::<FlussError, _>((msg, code))
     }
 }
+
+/// Named constants for Fluss API error codes.
+///
+/// Server API errors have error_code > 0 or == -1.
+/// Client-side errors have error_code == CLIENT_ERROR (-2).
+/// These constants match the Rust core FlussError enum and are stable across protocol versions.
+/// New server error codes work automatically (error_code is a raw int, not a closed enum) —
+/// these constants are convenience names, not an exhaustive list.
+#[pyclass]
+pub struct ErrorCode;
+
+#[pymethods]
+impl ErrorCode {
+    /// Client-side error (not from server API protocol). Check the error message for details.
+    #[classattr]
+    const CLIENT_ERROR: i32 = -2;
+    /// No error.
+    #[classattr]
+    const NONE: i32 = 0;
+    /// The server experienced an unexpected error when processing the request.
+    #[classattr]
+    const UNKNOWN_SERVER_ERROR: i32 = -1;
+    /// The server disconnected before a response was received.
+    #[classattr]
+    const NETWORK_EXCEPTION: i32 = 1;
+    /// The version of API is not supported.
+    #[classattr]
+    const UNSUPPORTED_VERSION: i32 = 2;
+    /// This message has failed its CRC checksum, exceeds the valid size, or is otherwise corrupt.
+    #[classattr]
+    const CORRUPT_MESSAGE: i32 = 3;
+    /// The database does not exist.
+    #[classattr]
+    const DATABASE_NOT_EXIST: i32 = 4;
+    /// The database is not empty.
+    #[classattr]
+    const DATABASE_NOT_EMPTY: i32 = 5;
+    /// The database already exists.
+    #[classattr]
+    const DATABASE_ALREADY_EXIST: i32 = 6;
+    /// The table does not exist.
+    #[classattr]
+    const TABLE_NOT_EXIST: i32 = 7;
+    /// The table already exists.
+    #[classattr]
+    const TABLE_ALREADY_EXIST: i32 = 8;
+    /// The schema does not exist.
+    #[classattr]
+    const SCHEMA_NOT_EXIST: i32 = 9;
+    /// Exception occurred while storing data for log in server.
+    #[classattr]
+    const LOG_STORAGE_EXCEPTION: i32 = 10;
+    /// Exception occurred while storing data for kv in server.
+    #[classattr]
+    const KV_STORAGE_EXCEPTION: i32 = 11;
+    /// Not leader or follower.
+    #[classattr]
+    const NOT_LEADER_OR_FOLLOWER: i32 = 12;
+    /// The record is too large.
+    #[classattr]
+    const RECORD_TOO_LARGE_EXCEPTION: i32 = 13;
+    /// The record is corrupt.
+    #[classattr]
+    const CORRUPT_RECORD_EXCEPTION: i32 = 14;
+    /// The client has attempted to perform an operation on an invalid table.
+    #[classattr]
+    const INVALID_TABLE_EXCEPTION: i32 = 15;
+    /// The client has attempted to perform an operation on an invalid database.
+    #[classattr]
+    const INVALID_DATABASE_EXCEPTION: i32 = 16;
+    /// The replication factor is larger than the number of available tablet servers.
+    #[classattr]
+    const INVALID_REPLICATION_FACTOR: i32 = 17;
+    /// Produce request specified an invalid value for required acks.
+    #[classattr]
+    const INVALID_REQUIRED_ACKS: i32 = 18;
+    /// The log offset is out of range.
+    #[classattr]
+    const LOG_OFFSET_OUT_OF_RANGE_EXCEPTION: i32 = 19;
+    /// The table is not a primary key table.
+    #[classattr]
+    const NON_PRIMARY_KEY_TABLE_EXCEPTION: i32 = 20;
+    /// The table or bucket does not exist.
+    #[classattr]
+    const UNKNOWN_TABLE_OR_BUCKET_EXCEPTION: i32 = 21;
+    /// The update version is invalid.
+    #[classattr]
+    const INVALID_UPDATE_VERSION_EXCEPTION: i32 = 22;
+    /// The coordinator is invalid.
+    #[classattr]
+    const INVALID_COORDINATOR_EXCEPTION: i32 = 23;
+    /// The leader epoch is invalid.
+    #[classattr]
+    const FENCED_LEADER_EPOCH_EXCEPTION: i32 = 24;
+    /// The request timed out.
+    #[classattr]
+    const REQUEST_TIME_OUT: i32 = 25;
+    /// The general storage exception.
+    #[classattr]
+    const STORAGE_EXCEPTION: i32 = 26;
+    /// The server did not attempt to execute this operation.
+    #[classattr]
+    const OPERATION_NOT_ATTEMPTED_EXCEPTION: i32 = 27;
+    /// Records are written to the server already, but to fewer in-sync replicas than required.
+    #[classattr]
+    const NOT_ENOUGH_REPLICAS_AFTER_APPEND_EXCEPTION: i32 = 28;
+    /// Messages are rejected since there are fewer in-sync replicas than required.
+    #[classattr]
+    const NOT_ENOUGH_REPLICAS_EXCEPTION: i32 = 29;
+    /// Get file access security token exception.
+    #[classattr]
+    const SECURITY_TOKEN_EXCEPTION: i32 = 30;
+    /// The tablet server received an out of order sequence batch.
+    #[classattr]
+    const OUT_OF_ORDER_SEQUENCE_EXCEPTION: i32 = 31;
+    /// The tablet server received a duplicate sequence batch.
+    #[classattr]
+    const DUPLICATE_SEQUENCE_EXCEPTION: i32 = 32;
+    /// The tablet server could not locate the writer metadata.
+    #[classattr]
+    const UNKNOWN_WRITER_ID_EXCEPTION: i32 = 33;
+    /// The requested column projection is invalid.
+    #[classattr]
+    const INVALID_COLUMN_PROJECTION: i32 = 34;
+    /// The requested target column to write is invalid.
+    #[classattr]
+    const INVALID_TARGET_COLUMN: i32 = 35;
+    /// The partition does not exist.
+    #[classattr]
+    const PARTITION_NOT_EXISTS: i32 = 36;
+    /// The table is not partitioned.
+    #[classattr]
+    const TABLE_NOT_PARTITIONED_EXCEPTION: i32 = 37;
+    /// The timestamp is invalid.
+    #[classattr]
+    const INVALID_TIMESTAMP_EXCEPTION: i32 = 38;
+    /// The config is invalid.
+    #[classattr]
+    const INVALID_CONFIG_EXCEPTION: i32 = 39;
+    /// The lake storage is not configured.
+    #[classattr]
+    const LAKE_STORAGE_NOT_CONFIGURED_EXCEPTION: i32 = 40;
+    /// The kv snapshot does not exist.
+    #[classattr]
+    const KV_SNAPSHOT_NOT_EXIST: i32 = 41;
+    /// The partition already exists.
+    #[classattr]
+    const PARTITION_ALREADY_EXISTS: i32 = 42;
+    /// The partition spec is invalid.
+    #[classattr]
+    const PARTITION_SPEC_INVALID_EXCEPTION: i32 = 43;
+    /// There is no currently available leader for the given partition.
+    #[classattr]
+    const LEADER_NOT_AVAILABLE_EXCEPTION: i32 = 44;
+    /// Exceed the maximum number of partitions.
+    #[classattr]
+    const PARTITION_MAX_NUM_EXCEPTION: i32 = 45;
+    /// Authentication failed.
+    #[classattr]
+    const AUTHENTICATE_EXCEPTION: i32 = 46;
+    /// Security is disabled.
+    #[classattr]
+    const SECURITY_DISABLED_EXCEPTION: i32 = 47;
+    /// Authorization failed.
+    #[classattr]
+    const AUTHORIZATION_EXCEPTION: i32 = 48;
+    /// Exceed the maximum number of buckets.
+    #[classattr]
+    const BUCKET_MAX_NUM_EXCEPTION: i32 = 49;
+    /// The tiering epoch is invalid.
+    #[classattr]
+    const FENCED_TIERING_EPOCH_EXCEPTION: i32 = 50;
+    /// Authentication failed with retriable exception.
+    #[classattr]
+    const RETRIABLE_AUTHENTICATE_EXCEPTION: i32 = 51;
+    /// The server rack info is invalid.
+    #[classattr]
+    const INVALID_SERVER_RACK_INFO_EXCEPTION: i32 = 52;
+    /// The lake snapshot does not exist.
+    #[classattr]
+    const LAKE_SNAPSHOT_NOT_EXIST: i32 = 53;
+    /// The lake table already exists.
+    #[classattr]
+    const LAKE_TABLE_ALREADY_EXIST: i32 = 54;
+    /// The new ISR contains at least one ineligible replica.
+    #[classattr]
+    const INELIGIBLE_REPLICA_EXCEPTION: i32 = 55;
+    /// The alter table is invalid.
+    #[classattr]
+    const INVALID_ALTER_TABLE_EXCEPTION: i32 = 56;
+    /// Deletion operations are disabled on this table.
+    #[classattr]
+    const DELETION_DISABLED_EXCEPTION: i32 = 57;
+}
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 094dc0062f..41d516e5b4 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -78,6 +78,9 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<FlussAdmin>()?;
     m.add_class::<FlussTable>()?;
     m.add_class::<TableScan>()?;
+    m.add_class::<TableAppend>()?;
+    m.add_class::<TableUpsert>()?;
+    m.add_class::<TableLookup>()?;
     m.add_class::<AppendWriter>()?;
     m.add_class::<UpsertWriter>()?;
     m.add_class::<Lookuper>()?;
@@ -98,8 +101,9 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add("EARLIEST_OFFSET", fcore::client::EARLIEST_OFFSET)?;
     m.add("LATEST_OFFSET", fcore::client::LATEST_OFFSET)?;
 
-    // Register exception types
+    // Register exception types and error codes
     m.add_class::<FlussError>()?;
+    m.add_class::<ErrorCode>()?;
 
     Ok(())
 }
diff --git a/fluss-rust/bindings/python/src/lookup.rs b/fluss-rust/bindings/python/src/lookup.rs
index e5c1f62313..718f8e5038 100644
--- a/fluss-rust/bindings/python/src/lookup.rs
+++ b/fluss-rust/bindings/python/src/lookup.rs
@@ -27,7 +27,7 @@ use tokio::sync::Mutex;
 /// repeated lookups efficient. Create once and reuse for multiple lookups.
 ///
 /// # Example:
-///     lookuper = table.new_lookup()
+///     lookuper = table.new_lookup().create_lookuper()
 ///     result = await lookuper.lookup({"user_id": 1})
 ///     result2 = await lookuper.lookup({"user_id": 2})  # Reuses cached encoders
 #[pyclass]
@@ -64,13 +64,13 @@ impl Lookuper {
                 lookuper
                     .lookup(&generic_row)
                     .await
-                    .map_err(|e| FlussError::new_err(e.to_string()))?
+                    .map_err(|e| FlussError::from_core_error(&e))?
             };
 
             // Extract row data
             let row_opt = result
                 .get_single_row()
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             // Convert to Python with GIL
             Python::attach(|py| match row_opt {
@@ -98,11 +98,11 @@ impl Lookuper {
 
         let table_lookup = fluss_table
             .new_lookup()
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
         let lookuper = table_lookup
             .create_lookuper()
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
         Ok(Self {
             inner: Arc::new(Mutex::new(lookuper)),
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 81acf0083d..6ec2d257cb 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -223,11 +223,14 @@ impl TableScan {
     /// Create a batch-based log scanner.
     ///
     /// Use this scanner with `poll_arrow()` to get Arrow Tables, or with
-    /// `poll_batches()` to get individual batches with metadata.
+    /// `poll_record_batch()` to get individual batches with metadata.
     ///
     /// Returns:
-    ///     LogScanner for batch-based scanning with `poll_arrow()` or `poll_batches()`
-    pub fn create_batch_scanner<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+    ///     LogScanner for batch-based scanning with `poll_arrow()` or `poll_record_batch()`
+    pub fn create_record_batch_log_scanner<'py>(
+        &self,
+        py: Python<'py>,
+    ) -> PyResult<Bound<'py, PyAny>> {
         self.create_scanner_internal(py, ScannerType::Batch)
     }
 
@@ -260,22 +263,22 @@ impl TableScan {
             let admin = conn
                 .get_admin()
                 .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             let (projected_schema, projected_row_type) =
                 calculate_projected_types(&table_info, projection_indices)?;
 
             let scanner_kind = match scanner_type {
                 ScannerType::Record => {
-                    let s = table_scan.create_log_scanner().map_err(|e| {
-                        FlussError::new_err(format!("Failed to create log scanner: {e}"))
-                    })?;
+                    let s = table_scan
+                        .create_log_scanner()
+                        .map_err(|e| FlussError::from_core_error(&e))?;
                     ScannerKind::Record(s)
                 }
                 ScannerType::Batch => {
-                    let s = table_scan.create_record_batch_log_scanner().map_err(|e| {
-                        FlussError::new_err(format!("Failed to create batch scanner: {e}"))
-                    })?;
+                    let s = table_scan
+                        .create_record_batch_log_scanner()
+                        .map_err(|e| FlussError::from_core_error(&e))?;
                     ScannerKind::Batch(s)
                 }
             };
@@ -332,12 +335,12 @@ fn apply_projection(
     match projection {
         Some(ProjectionType::Indices(indices)) => table_scan
             .project(&indices)
-            .map_err(|e| FlussError::new_err(format!("Failed to project columns: {e}"))),
+            .map_err(|e| FlussError::from_core_error(&e)),
         Some(ProjectionType::Names(names)) => {
             let column_name_refs: Vec<&str> = names.iter().map(|s| s.as_str()).collect();
             table_scan
                 .project_by_name(&column_name_refs)
-                .map_err(|e| FlussError::new_err(format!("Failed to project columns: {e}")))
+                .map_err(|e| FlussError::from_core_error(&e))
         }
         None => Ok(table_scan),
     }
@@ -348,8 +351,8 @@ fn calculate_projected_types(
     table_info: &fcore::metadata::TableInfo,
     projection_indices: Option<Vec<usize>>,
 ) -> PyResult<(SchemaRef, fcore::metadata::RowType)> {
-    let full_schema = to_arrow_schema(table_info.get_row_type())
-        .map_err(|e| FlussError::new_err(format!("Failed to get arrow schema: {e}")))?;
+    let full_schema =
+        to_arrow_schema(table_info.get_row_type()).map_err(|e| FlussError::from_core_error(&e))?;
     let full_row_type = table_info.get_row_type();
 
     match projection_indices {
@@ -387,26 +390,25 @@ impl FlussTable {
         }
     }
 
-    /// Create a new append writer for the table
-    fn new_append_writer<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        let conn = self.connection.clone();
-        let metadata = self.metadata.clone();
-        let table_info = self.table_info.clone();
-
-        future_into_py(py, async move {
-            let fluss_table = fcore::client::FlussTable::new(&conn, metadata, table_info.clone());
-
-            let table_append = fluss_table
-                .new_append()
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
-
-            let rust_writer = table_append
-                .create_writer()
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
+    /// Create a new TableAppend builder for the table.
+    ///
+    /// Returns:
+    ///     TableAppend builder. Call `create_writer()` to get an AppendWriter.
+    fn new_append(&self) -> PyResult<TableAppend> {
+        let _guard = TOKIO_RUNTIME.enter();
+        let fluss_table = fcore::client::FlussTable::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        );
 
-            let py_writer = AppendWriter::from_core(rust_writer, table_info);
+        let table_append = fluss_table
+            .new_append()
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
-            Python::attach(|py| Py::new(py, py_writer))
+        Ok(TableAppend {
+            inner: table_append,
+            table_info: self.table_info.clone(),
         })
     }
 
@@ -425,52 +427,41 @@ impl FlussTable {
         self.has_primary_key
     }
 
-    /// Create a new lookuper for primary key lookups.
+    /// Create a new TableLookup builder for primary key lookups.
     ///
     /// This is only available for tables with a primary key.
-    pub fn new_lookup(&self, _py: Python) -> PyResult<crate::Lookuper> {
+    ///
+    /// Returns:
+    ///     TableLookup builder. Call `create_lookuper()` to get a Lookuper.
+    pub fn new_lookup(&self) -> PyResult<TableLookup> {
         if !self.has_primary_key {
             return Err(FlussError::new_err(
                 "Lookup is only supported for primary key tables",
             ));
         }
 
-        crate::Lookuper::new(
-            &self.connection,
-            self.metadata.clone(),
-            self.table_info.clone(),
-        )
+        Ok(TableLookup {
+            connection: self.connection.clone(),
+            metadata: self.metadata.clone(),
+            table_info: self.table_info.clone(),
+        })
     }
 
-    /// Create a new upsert writer for the table.
+    /// Create a new TableUpsert builder for the table.
     ///
     /// This is only available for tables with a primary key.
     ///
-    /// Args:
-    ///     columns: Optional list of column names for partial update.
-    ///              Only the specified columns will be updated.
-    ///     column_indices: Optional list of column indices (0-based) for partial update.
-    ///                     Alternative to `columns` parameter.
-    #[pyo3(signature = (columns=None, column_indices=None))]
-    pub fn new_upsert(
-        &self,
-        _py: Python,
-        columns: Option<Vec<String>>,
-        column_indices: Option<Vec<usize>>,
-    ) -> PyResult<crate::UpsertWriter> {
+    /// Returns:
+    ///     TableUpsert builder. Call `create_writer()` to get an UpsertWriter,
+    ///     or use `partial_update_by_name()` / `partial_update_by_index()` first.
+    pub fn new_upsert(&self) -> PyResult<TableUpsert> {
         if !self.has_primary_key {
             return Err(FlussError::new_err(
                 "Upsert is only supported for primary key tables",
             ));
         }
 
-        // Validate that at most one parameter is specified
-        if columns.is_some() && column_indices.is_some() {
-            return Err(FlussError::new_err(
-                "Specify only one of 'columns' or 'column_indices', not both",
-            ));
-        }
-
+        let _guard = TOKIO_RUNTIME.enter();
         let fluss_table = fcore::client::FlussTable::new(
             &self.connection,
             self.metadata.clone(),
@@ -479,14 +470,13 @@ impl FlussTable {
 
         let table_upsert = fluss_table
             .new_upsert()
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
-        crate::UpsertWriter::new(
-            table_upsert,
-            self.table_info.clone(),
-            columns,
-            column_indices,
-        )
+        Ok(TableUpsert {
+            inner: table_upsert,
+            table_info: self.table_info.clone(),
+            target_columns: None,
+        })
     }
 
     fn __repr__(&self) -> String {
@@ -517,6 +507,145 @@ impl FlussTable {
     }
 }
 
+/// Python-facing builder that wraps the core `TableAppend` and creates `AppendWriter`s.
+///
+/// Obtain via `FlussTable.new_append()`, then call `create_writer()` (it only borrows the builder).
+#[pyclass]
+pub struct TableAppend {
+    inner: fcore::client::TableAppend,
+    table_info: fcore::metadata::TableInfo,
+}
+
+#[pymethods]
+impl TableAppend {
+    /// Create an AppendWriter from this builder; a core failure is converted to `FlussError`.
+    pub fn create_writer(&self) -> PyResult<AppendWriter> {
+        let rust_writer = self
+            .inner
+            .create_writer()
+            .map_err(|e| FlussError::from_core_error(&e))?;
+        Ok(AppendWriter::from_core(
+            rust_writer,
+            self.table_info.clone(),
+        ))
+    }
+
+    fn __repr__(&self) -> String {
+        "TableAppend()".to_string()
+    }
+}
+
+/// Builder for creating an UpsertWriter, with optional partial update configuration.
+///
+/// Obtain via `FlussTable.new_upsert()`, then optionally call
+/// `partial_update_by_name()` or `partial_update_by_index()` (each returns a new builder),
+/// then call `create_writer()`.
+#[pyclass]
+pub struct TableUpsert {
+    inner: fcore::client::TableUpsert,
+    table_info: fcore::metadata::TableInfo,
+    /// Column indices for partial updates, handed to the UpsertWriter for Python row conversion.
+    target_columns: Option<Vec<usize>>,
+}
+
+#[pymethods]
+impl TableUpsert {
+    /// Configure partial update by column names.
+    ///
+    /// Only the specified columns will be updated on upsert.
+    ///
+    /// Args:
+    ///     columns: List of column names to update; an unknown name yields a `FlussError`.
+    ///
+    /// Returns:
+    ///     A new TableUpsert configured for partial update; `self` is only borrowed.
+    pub fn partial_update_by_name(&self, columns: Vec<String>) -> PyResult<TableUpsert> {
+        let col_refs: Vec<&str> = columns.iter().map(|s| s.as_str()).collect();
+        // Core validates and resolves names to indices internally; its error becomes a FlussError
+        let updated = self
+            .inner
+            .partial_update_with_column_names(&col_refs)
+            .map_err(|e| FlussError::from_core_error(&e))?;
+        // Resolve the same names to indices again, this time for the Python row conversion layer
+        let row_type = self.table_info.row_type();
+        let indices: Vec<usize> = columns
+            .iter()
+            .map(|name| {
+                row_type.get_field_index(name).ok_or_else(|| {
+                    FlussError::new_err(format!("Unknown column name '{name}' for partial update"))
+                })
+            })
+            .collect::<PyResult<Vec<usize>>>()?;
+        Ok(TableUpsert {
+            inner: updated,
+            table_info: self.table_info.clone(),
+            target_columns: Some(indices),
+        })
+    }
+
+    /// Configure partial update by column indices.
+    ///
+    /// Only the specified columns will be updated on upsert.
+    ///
+    /// Args:
+    ///     column_indices: List of column indices (0-based) to update.
+    ///
+    /// Returns:
+    ///     A new TableUpsert configured for partial update; `self` is only borrowed.
+    pub fn partial_update_by_index(&self, column_indices: Vec<usize>) -> PyResult<TableUpsert> {
+        let target = column_indices.clone();
+        // Core validates indices internally; the Vec is moved here, hence the `target` copy above
+        let updated = self
+            .inner
+            .partial_update(Some(column_indices))
+            .map_err(|e| FlussError::from_core_error(&e))?;
+        Ok(TableUpsert {
+            inner: updated,
+            table_info: self.table_info.clone(),
+            target_columns: Some(target),
+        })
+    }
+
+    /// Create an UpsertWriter from this builder, forwarding any partial-update column indices.
+    pub fn create_writer(&self) -> PyResult<crate::UpsertWriter> {
+        crate::UpsertWriter::new(
+            &self.inner,
+            self.table_info.clone(),
+            self.target_columns.clone(),
+        )
+    }
+
+    fn __repr__(&self) -> String {
+        "TableUpsert()".to_string()
+    }
+}
+
+/// Builder for creating a Lookuper; it only stores the connection, metadata and table info.
+///
+/// Obtain via `FlussTable.new_lookup()`, then call `create_lookuper()`.
+#[pyclass]
+pub struct TableLookup {
+    connection: Arc<fcore::client::FlussConnection>,
+    metadata: Arc<fcore::client::Metadata>,
+    table_info: fcore::metadata::TableInfo,
+}
+
+#[pymethods]
+impl TableLookup {
+    /// Create a Lookuper by passing the stored connection, metadata and table info to `Lookuper::new`.
+    pub fn create_lookuper(&self) -> PyResult<crate::Lookuper> {
+        crate::Lookuper::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+        )
+    }
+
+    fn __repr__(&self) -> String {
+        "TableLookup()".to_string()
+    }
+}
+
 /// Writer for appending data to a Fluss table
 #[pyclass]
 pub struct AppendWriter {
@@ -553,7 +682,7 @@ impl AppendWriter {
         let result_future = self
             .inner
             .append_arrow_batch(rust_batch)
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
         Ok(WriteResultHandle::new(result_future))
     }
 
@@ -568,7 +697,7 @@ impl AppendWriter {
         let result_future = self
             .inner
             .append(&generic_row)
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
         Ok(WriteResultHandle::new(result_future))
     }
 
@@ -577,7 +706,7 @@ impl AppendWriter {
         // Get the expected Arrow schema from the Fluss table
         let row_type = self.table_info.get_row_type();
         let expected_schema = fcore::record::to_arrow_schema(row_type)
-            .map_err(|e| FlussError::new_err(format!("Failed to get table schema: {e}")))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
         // Convert Arrow schema to PyArrow schema
         let py_schema = expected_schema
@@ -609,7 +738,7 @@ impl AppendWriter {
             inner
                 .flush()
                 .await
-                .map_err(|e| FlussError::new_err(e.to_string()))
+                .map_err(|e| FlussError::from_core_error(&e))
         })
     }
 
@@ -1466,7 +1595,7 @@ impl ScannerKind {
         match self {
             Self::Batch(s) => Ok(s),
             Self::Record(_) => Err(FlussError::new_err(
-                "This method requires a batch-based scanner. Use new_scan().create_batch_scanner().",
+                "This method requires a batch-based scanner. Use new_scan().create_record_batch_log_scanner().",
             )),
         }
     }
@@ -1487,7 +1616,7 @@ macro_rules! with_scanner {
 ///
 /// This scanner supports two modes:
 /// - Record-based scanning via `poll()` - returns individual records with metadata
-/// - Batch-based scanning via `poll_arrow()` / `poll_batches()` - returns Arrow batches
+/// - Batch-based scanning via `poll_arrow()` / `poll_record_batch()` - returns Arrow batches
 #[pyclass]
 pub struct LogScanner {
     scanner: ScannerKind,
@@ -1512,7 +1641,7 @@ impl LogScanner {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
                 with_scanner!(&self.scanner, subscribe(bucket_id, start_offset))
-                    .map_err(|e| FlussError::new_err(e.to_string()))
+                    .map_err(|e| FlussError::from_core_error(&e))
             })
         })
     }
@@ -1525,7 +1654,7 @@ impl LogScanner {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
                 with_scanner!(&self.scanner, subscribe_buckets(&bucket_offsets))
-                    .map_err(|e| FlussError::new_err(e.to_string()))
+                    .map_err(|e| FlussError::from_core_error(&e))
             })
         })
     }
@@ -1549,7 +1678,7 @@ impl LogScanner {
                     &self.scanner,
                     subscribe_partition(partition_id, bucket_id, start_offset)
                 )
-                .map_err(|e| FlussError::new_err(e.to_string()))
+                .map_err(|e| FlussError::from_core_error(&e))
             })
         })
     }
@@ -1569,7 +1698,7 @@ impl LogScanner {
                     &self.scanner,
                     subscribe_partition_buckets(&partition_bucket_offsets)
                 )
-                .map_err(|e| FlussError::new_err(e.to_string()))
+                .map_err(|e| FlussError::from_core_error(&e))
             })
         })
     }
@@ -1586,7 +1715,7 @@ impl LogScanner {
                     &self.scanner,
                     unsubscribe_partition(partition_id, bucket_id)
                 )
-                .map_err(|e| FlussError::new_err(e.to_string()))
+                .map_err(|e| FlussError::from_core_error(&e))
             })
         })
     }
@@ -1616,7 +1745,7 @@ impl LogScanner {
         let timeout = Duration::from_millis(timeout_ms as u64);
         let scan_records = py
             .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
         // Convert ScanRecords to Python ScanRecord list
         // Use projected_row_type to handle column projection correctly
@@ -1643,10 +1772,10 @@ impl LogScanner {
     ///     bucket, base_offset, and last_offset metadata.
     ///
     /// Note:
-    ///     - Requires a batch-based scanner (created with new_scan().create_batch_scanner())
+    ///     - Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner())
     ///     - Returns an empty list if no batches are available
     ///     - When timeout expires, returns an empty list (NOT an error)
-    fn poll_batches(&self, py: Python, timeout_ms: i64) -> PyResult<Vec<RecordBatch>> {
+    fn poll_record_batch(&self, py: Python, timeout_ms: i64) -> PyResult<Vec<RecordBatch>> {
         let scanner = self.scanner.as_batch()?;
 
         if timeout_ms < 0 {
@@ -1658,7 +1787,7 @@ impl LogScanner {
         let timeout = Duration::from_millis(timeout_ms as u64);
         let scan_batches = py
             .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
         // Convert ScanBatch to RecordBatch with metadata
         let result = scan_batches
@@ -1678,7 +1807,7 @@ impl LogScanner {
     ///     PyArrow Table containing the polled records (batches merged)
     ///
     /// Note:
-    ///     - Requires a batch-based scanner (created with new_scan().create_batch_scanner())
+    ///     - Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner())
     ///     - Returns an empty table (with correct schema) if no records are available
     ///     - When timeout expires, returns an empty table (NOT an error)
     fn poll_arrow(&self, py: Python, timeout_ms: i64) -> PyResult<Py<PyAny>> {
@@ -1693,7 +1822,7 @@ impl LogScanner {
         let timeout = Duration::from_millis(timeout_ms as u64);
         let scan_batches = py
             .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
         // Convert ScanBatch to Arrow batches
         if scan_batches.is_empty() {
@@ -1809,7 +1938,7 @@ impl LogScanner {
             .detach(|| {
                 TOKIO_RUNTIME.block_on(async { self.admin.list_partition_infos(table_path).await })
             })
-            .map_err(|e| FlussError::new_err(format!("Failed to list partition infos: {e}")))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
         // Build and cache the mapping
         let map: HashMap<i64, String> = partition_infos
@@ -1848,7 +1977,7 @@ impl LogScanner {
                             .await
                     })
                 })
-                .map_err(|e| FlussError::new_err(format!("Failed to list offsets: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             // Convert to TableBucket-keyed map
             let table_id = self.table_info.table_id;
@@ -1912,11 +2041,7 @@ impl LogScanner {
                             .await
                     })
                 })
-                .map_err(|e| {
-                    FlussError::new_err(format!(
-                        "Failed to list offsets for partition {partition_name}: {e}"
-                    ))
-                })?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             for (bucket_id, offset) in offsets {
                 if offset > 0 {
@@ -1947,7 +2072,7 @@ impl LogScanner {
                 .detach(|| {
                     TOKIO_RUNTIME.block_on(async { scanner.poll(Duration::from_millis(500)).await })
                 })
-                .map_err(|e| FlussError::new_err(format!("Failed to poll: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             if scan_batches.is_empty() {
                 continue;
diff --git a/fluss-rust/bindings/python/src/upsert.rs b/fluss-rust/bindings/python/src/upsert.rs
index 745163e3dd..02ad7fa4bb 100644
--- a/fluss-rust/bindings/python/src/upsert.rs
+++ b/fluss-rust/bindings/python/src/upsert.rs
@@ -18,7 +18,7 @@
 use crate::table::{python_to_generic_row, python_to_sparse_generic_row};
 use crate::*;
 use pyo3_async_runtimes::tokio::future_into_py;
-use std::sync::{Arc, Mutex};
+use std::sync::Arc;
 
 /// Writer for upserting and deleting data in a Fluss primary key table.
 ///
@@ -26,7 +26,7 @@ use std::sync::{Arc, Mutex};
 /// to ensure all queued writes are delivered to the server.
 ///
 /// # Example:
-///     writer = table.new_upsert()
+///     writer = table.new_upsert().create_writer()
 ///
 ///     # Fire-and-forget — ignore the returned handle
 ///     writer.upsert(row1)
@@ -38,13 +38,7 @@ use std::sync::{Arc, Mutex};
 ///     await handle.wait()
 #[pyclass]
 pub struct UpsertWriter {
-    inner: Arc<UpsertWriterInner>,
-}
-
-struct UpsertWriterInner {
-    table_upsert: fcore::client::TableUpsert,
-    /// Lazily initialized writer - created on first write operation
-    writer: Mutex<Option<Arc<fcore::client::UpsertWriter>>>,
+    writer: Arc<fcore::client::UpsertWriter>,
     table_info: fcore::metadata::TableInfo,
     /// Column indices for partial updates (None = full row)
     target_columns: Option<Vec<usize>>,
@@ -64,16 +58,16 @@ impl UpsertWriter {
     ///          For dict: keys are column names, values are column values.
     ///          For list/tuple: values must be in schema order.
     pub fn upsert(&self, row: &Bound<'_, PyAny>) -> PyResult<WriteResultHandle> {
-        let generic_row = if let Some(target_cols) = &self.inner.target_columns {
-            python_to_sparse_generic_row(row, &self.inner.table_info, target_cols)?
+        let generic_row = if let Some(target_cols) = &self.target_columns {
+            python_to_sparse_generic_row(row, &self.table_info, target_cols)?
         } else {
-            python_to_generic_row(row, &self.inner.table_info)?
+            python_to_generic_row(row, &self.table_info)?
         };
 
-        let writer = self.inner.get_or_create_writer()?;
-        let result_future = writer
+        let result_future = self
+            .writer
             .upsert(&generic_row)
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
         Ok(WriteResultHandle::new(result_future))
     }
 
@@ -86,13 +80,13 @@ impl UpsertWriter {
     ///         For dict: keys are PK column names.
     ///         For list/tuple: values in PK column order.
     pub fn delete(&self, pk: &Bound<'_, PyAny>) -> PyResult<WriteResultHandle> {
-        let pk_indices = self.inner.table_info.get_schema().primary_key_indexes();
-        let generic_row = python_to_sparse_generic_row(pk, &self.inner.table_info, &pk_indices)?;
+        let pk_indices = self.table_info.get_schema().primary_key_indexes();
+        let generic_row = python_to_sparse_generic_row(pk, &self.table_info, &pk_indices)?;
 
-        let writer = self.inner.get_or_create_writer()?;
-        let result_future = writer
+        let result_future = self
+            .writer
             .delete(&generic_row)
-            .map_err(|e| FlussError::new_err(e.to_string()))?;
+            .map_err(|e| FlussError::from_core_error(&e))?;
         Ok(WriteResultHandle::new(result_future))
     }
 
@@ -104,25 +98,13 @@ impl UpsertWriter {
     /// Returns:
     ///     None on success
     pub fn flush<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        // Clone the Arc<UpsertWriter> out of the lock so we don't hold the guard across await
-        let writer = {
-            let guard = self
-                .inner
-                .writer
-                .lock()
-                .map_err(|e| FlussError::new_err(format!("Lock poisoned: {e}")))?;
-            guard.as_ref().cloned()
-        };
+        let writer = self.writer.clone();
 
         future_into_py(py, async move {
-            if let Some(writer) = writer {
-                writer
-                    .flush()
-                    .await
-                    .map_err(|e| FlussError::new_err(e.to_string()))
-            } else {
-                Ok(())
-            }
+            writer
+                .flush()
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))
         })
     }
 
@@ -132,65 +114,19 @@ impl UpsertWriter {
 }
 
 impl UpsertWriter {
-    /// Create an UpsertWriter from a TableUpsert.
-    ///
-    /// Optionally supports partial updates via column names or indices.
+    /// Create an UpsertWriter by eagerly creating the core writer from a TableUpsert.
     pub fn new(
-        table_upsert: fcore::client::TableUpsert,
+        table_upsert: &fcore::client::TableUpsert,
         table_info: fcore::metadata::TableInfo,
-        columns: Option<Vec<String>>,
-        column_indices: Option<Vec<usize>>,
+        target_columns: Option<Vec<usize>>,
     ) -> PyResult<Self> {
-        // Resolve target column indices (names → indices, or use provided indices directly)
-        let target_columns = if let Some(cols) = columns {
-            let row_type = table_info.row_type();
-            Some(
-                cols.iter()
-                    .map(|name| {
-                        row_type
-                            .get_field_index(name)
-                            .ok_or_else(|| FlussError::new_err(format!("Unknown column: {name}")))
-                    })
-                    .collect::<PyResult<Vec<usize>>>()?,
-            )
-        } else {
-            column_indices
-        };
-
-        // Apply partial update to the Rust core using resolved indices
-        let table_upsert = if let Some(ref indices) = target_columns {
-            table_upsert
-                .partial_update(Some(indices.clone()))
-                .map_err(|e| FlussError::new_err(e.to_string()))?
-        } else {
-            table_upsert
-        };
-
+        let writer = table_upsert
+            .create_writer()
+            .map_err(|e| FlussError::from_core_error(&e))?;
         Ok(Self {
-            inner: Arc::new(UpsertWriterInner {
-                table_upsert,
-                writer: Mutex::new(None),
-                table_info,
-                target_columns,
-            }),
+            writer: Arc::new(writer),
+            table_info,
+            target_columns,
         })
     }
 }
-
-impl UpsertWriterInner {
-    /// Get the cached writer or create one on first use.
-    fn get_or_create_writer(&self) -> PyResult<Arc<fcore::client::UpsertWriter>> {
-        let mut guard = self
-            .writer
-            .lock()
-            .map_err(|e| FlussError::new_err(format!("Lock poisoned: {e}")))?;
-        if guard.is_none() {
-            let writer = self
-                .table_upsert
-                .create_writer()
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
-            *guard = Some(Arc::new(writer));
-        }
-        Ok(guard.as_ref().unwrap().clone())
-    }
-}
diff --git a/fluss-rust/bindings/python/src/write_handle.rs b/fluss-rust/bindings/python/src/write_handle.rs
index 4f3ce99739..83cbeccadc 100644
--- a/fluss-rust/bindings/python/src/write_handle.rs
+++ b/fluss-rust/bindings/python/src/write_handle.rs
@@ -62,9 +62,7 @@ impl WriteResultHandle {
             .ok_or_else(|| FlussError::new_err("WriteResultHandle already consumed"))?;
 
         future_into_py(py, async move {
-            future
-                .await
-                .map_err(|e| FlussError::new_err(e.to_string()))?;
+            future.await.map_err(|e| FlussError::from_core_error(&e))?;
             Ok(())
         })
     }
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 3acf73f2bf..90788b1401 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -26,7 +26,7 @@ use fluss::row::{GenericRow, InternalRow};
 #[allow(dead_code)]
 pub async fn main() -> Result<()> {
     let mut config = Config::parse();
-    config.bootstrap_server = "127.0.0.1:9123".to_string();
+    config.bootstrap_servers = "127.0.0.1:9123".to_string();
 
     let conn = FlussConnection::new(config).await?;
 
@@ -49,7 +49,7 @@ pub async fn main() -> Result<()> {
         .await?;
     println!(
         "Created KV Table:\n {}\n",
-        admin.get_table(&table_path).await?
+        admin.get_table_info(&table_path).await?
     );
 
     let table = conn.get_table(&table_path).await?;
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index ee1f541fb7..e0471785d2 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -27,7 +27,7 @@ use std::collections::HashMap;
 #[allow(dead_code)]
 pub async fn main() -> Result<()> {
     let mut config = Config::parse();
-    config.bootstrap_server = "127.0.0.1:9123".to_string();
+    config.bootstrap_servers = "127.0.0.1:9123".to_string();
 
     let conn = FlussConnection::new(config).await?;
 
@@ -52,7 +52,7 @@ pub async fn main() -> Result<()> {
         .await?;
     println!(
         "Created KV Table:\n {}\n",
-        admin.get_table(&table_path).await?
+        admin.get_table_info(&table_path).await?
     );
 
     create_partition(&table_path, &mut admin, "APAC", 1).await;
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index 199fce2347..cfe1627b24 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -29,7 +29,7 @@ use std::time::Duration;
 #[tokio::main]
 pub async fn main() -> Result<()> {
     let mut config = Config::parse();
-    config.bootstrap_server = "127.0.0.1:9123".to_string();
+    config.bootstrap_servers = "127.0.0.1:9123".to_string();
 
     let conn = FlussConnection::new(config).await?;
 
@@ -52,7 +52,7 @@ pub async fn main() -> Result<()> {
         .await?;
 
     // 2: get the table
-    let table_info = admin.get_table(&table_path).await?;
+    let table_info = admin.get_table_info(&table_path).await?;
     print!("Get created table:\n {table_info}\n");
 
     // write row
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 737ead3d55..3012f85c9a 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -66,15 +66,15 @@ impl FlussAdmin {
     pub async fn create_database(
         &self,
         database_name: &str,
-        ignore_if_exists: bool,
         database_descriptor: Option<&DatabaseDescriptor>,
+        ignore_if_exists: bool,
     ) -> Result<()> {
         let _response = self
             .admin_gateway
             .request(CreateDatabaseRequest::new(
                 database_name,
-                ignore_if_exists,
                 database_descriptor,
+                ignore_if_exists,
             )?)
             .await?;
         Ok(())
@@ -97,15 +97,19 @@ impl FlussAdmin {
         Ok(())
     }
 
-    pub async fn drop_table(&self, table_path: &TablePath, ignore_if_exists: bool) -> Result<()> {
+    pub async fn drop_table(
+        &self,
+        table_path: &TablePath,
+        ignore_if_not_exists: bool,
+    ) -> Result<()> {
         let _response = self
             .admin_gateway
-            .request(DropTableRequest::new(table_path, ignore_if_exists))
+            .request(DropTableRequest::new(table_path, ignore_if_not_exists))
             .await?;
         Ok(())
     }
 
-    pub async fn get_table(&self, table_path: &TablePath) -> Result<TableInfo> {
+    pub async fn get_table_info(&self, table_path: &TablePath) -> Result<TableInfo> {
         let response = self
             .admin_gateway
             .request(GetTableRequest::new(table_path))
@@ -349,8 +353,10 @@ impl FlussAdmin {
             Some(
                 cluster
                     .get_partition_id(&physical_table_path)
-                    .ok_or_else(|| Error::PartitionNotExist {
-                        message: format!("Partition '{name}' not found for table '{table_path}'"),
+                    .ok_or_else(|| {
+                        Error::partition_not_exist(format!(
+                            "Partition '{name}' not found for table '{table_path}'"
+                        ))
                     })?,
             )
         } else {
@@ -424,11 +430,9 @@ impl FlussAdmin {
             let task = tokio::spawn(async move {
                 let cluster = metadata.get_cluster();
                 let tablet_server = cluster.get_tablet_server(leader_id).ok_or_else(|| {
-                    Error::LeaderNotAvailable {
-                        message: format!(
-                            "Tablet server {leader_id} is not found in metadata cache."
-                        ),
-                    }
+                    Error::leader_not_available(format!(
+                        "Tablet server {leader_id} is not found in metadata cache."
+                    ))
                 })?;
                 let connection = rpc_client.get_connection(tablet_server).await?;
                 let list_offsets_response = connection.request(request).await?;
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 4dcefbb012..b370682afd 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -37,7 +37,7 @@ pub struct FlussConnection {
 impl FlussConnection {
     pub async fn new(arg: Config) -> Result<Self> {
         let connections = Arc::new(RpcClient::new());
-        let metadata = Metadata::new(arg.bootstrap_server.as_str(), connections.clone()).await?;
+        let metadata = Metadata::new(arg.bootstrap_servers.as_str(), connections.clone()).await?;
 
         Ok(FlussConnection {
             metadata: Arc::new(metadata),
diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index 5410002e7c..ce154912e4 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -254,20 +254,19 @@ impl Lookuper {
             .metadata
             .leader_for(self.table_path.as_ref(), &table_bucket)
             .await?
-            .ok_or_else(|| Error::LeaderNotAvailable {
-                message: format!("No leader found for table bucket: {table_bucket}"),
+            .ok_or_else(|| {
+                Error::leader_not_available(format!(
+                    "No leader found for table bucket: {table_bucket}"
+                ))
             })?;
 
         // Get connection to the tablet server
-        let tablet_server =
-            cluster
-                .get_tablet_server(leader.id())
-                .ok_or_else(|| Error::LeaderNotAvailable {
-                    message: format!(
-                        "Tablet server {} is not found in metadata cache",
-                        leader.id()
-                    ),
-                })?;
+        let tablet_server = cluster.get_tablet_server(leader.id()).ok_or_else(|| {
+            Error::leader_not_available(format!(
+                "Tablet server {} is not found in metadata cache",
+                leader.id()
+            ))
+        })?;
 
         let connection = self.rpc_client.get_connection(tablet_server).await?;
 
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 62f51b476d..4e5b5d1359 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -36,7 +36,7 @@ mod upsert;
 pub use append::{AppendWriter, TableAppend};
 pub use lookup::{LookupResult, Lookuper, TableLookup};
 pub use remote_log::{
-    DEFAULT_SCANNER_REMOTE_LOG_DOWNLOAD_THREADS, DEFAULT_SCANNER_REMOTE_LOG_PREFETCH_NUM,
+    DEFAULT_REMOTE_FILE_DOWNLOAD_THREAD_NUM, DEFAULT_SCANNER_REMOTE_LOG_PREFETCH_NUM,
 };
 pub use scanner::{LogScanner, RecordBatchLogScanner, TableScan};
 pub use upsert::{TableUpsert, UpsertWriter};
@@ -61,11 +61,13 @@ impl<'a> FlussTable<'a> {
         }
     }
 
-    pub fn get_table_info(&self) -> &TableInfo {
-        &self.table_info
-    }
-
     pub fn new_append(&self) -> Result<TableAppend> {
+        if self.has_primary_key {
+            return Err(Error::UnsupportedOperation {
+                message: "Append is only supported for log tables (without primary key)"
+                    .to_string(),
+            });
+        }
         Ok(TableAppend::new(
             self.table_path.clone(),
             Arc::new(self.table_info.clone()),
@@ -81,7 +83,7 @@ impl<'a> FlussTable<'a> {
         &self.metadata
     }
 
-    pub fn table_info(&self) -> &TableInfo {
+    pub fn get_table_info(&self) -> &TableInfo {
         &self.table_info
     }
 
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index 5583f89d5a..02820d93c3 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -47,7 +47,7 @@ pub const DEFAULT_SCANNER_REMOTE_LOG_PREFETCH_NUM: usize = 4;
 
 /// Default maximum concurrent remote log downloads
 /// Matches Java's REMOTE_FILE_DOWNLOAD_THREAD_NUM (default: 3)
-pub const DEFAULT_SCANNER_REMOTE_LOG_DOWNLOAD_THREADS: usize = 3;
+pub const DEFAULT_REMOTE_FILE_DOWNLOAD_THREAD_NUM: usize = 3;
 
 /// Initial retry backoff delay (milliseconds)
 /// Prevents hot-spin retry loops on persistent failures
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 57f90a1e5a..86f4aec9f2 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -88,7 +88,7 @@ impl<'a> TableScan<'a> {
     ///
     /// # pub async fn example() -> Result<()> {
     ///     let mut config = Config::default();
-    ///     config.bootstrap_server = "127.0.0.1:9123".to_string();
+    ///     config.bootstrap_servers = "127.0.0.1:9123".to_string();
     ///     let conn = FlussConnection::new(config).await?;
     ///
     ///     let table_descriptor = TableDescriptor::builder()
@@ -104,7 +104,7 @@ impl<'a> TableScan<'a> {
     ///     let admin = conn.get_admin().await?;
     ///     admin.create_table(&table_path, &table_descriptor, true)
     ///         .await?;
-    ///     let table_info = admin.get_table(&table_path).await?;
+    ///     let table_info = admin.get_table_info(&table_path).await?;
     ///     let table = conn.get_table(&table_path).await?;
     ///
     ///     // Project columns by indices
@@ -164,7 +164,7 @@ impl<'a> TableScan<'a> {
     ///
     /// # pub async fn example() -> Result<()> {
     ///     let mut config = Config::default();
-    ///     config.bootstrap_server = "127.0.0.1:9123".to_string();
+    ///     config.bootstrap_servers = "127.0.0.1:9123".to_string();
     ///     let conn = FlussConnection::new(config).await?;
     ///
     ///     let table_descriptor = TableDescriptor::builder()
@@ -652,7 +652,7 @@ impl LogFetcher {
         let remote_log_downloader = Arc::new(RemoteLogDownloader::new(
             tmp_dir,
             config.scanner_remote_log_prefetch_num,
-            config.scanner_remote_log_download_threads,
+            config.remote_file_download_thread_num,
             credentials_rx,
         )?);
 
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index 069f2d2ba1..ac3836aa38 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -98,13 +98,9 @@ impl Sender {
                 .update_tables_metadata(&table_paths, &physical_table_paths, vec![])
                 .await
             {
-                match &e {
-                    crate::error::Error::FlussAPIError { api_error }
-                        if api_error.code == FlussError::PartitionNotExists.code() =>
-                    {
-                        warn!(
-                            "Partition does not exist during metadata update, continuing: {api_error}"
-                        );
+                match e.api_error() {
+                    Some(FlussError::PartitionNotExists) => {
+                        warn!("Partition does not exist during metadata update, continuing: {e}");
                     }
                     _ => return Err(e),
                 }
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index 330affaaaa..41ef4bbb42 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -52,7 +52,7 @@ impl WriterClient {
         let mut sender = Sender::new(
             metadata.clone(),
             accumulator.clone(),
-            config.request_max_size,
+            config.writer_request_max_size,
             30_000,
             Self::get_ack(&config)?,
             config.writer_retries,
@@ -70,7 +70,7 @@ impl WriterClient {
         });
 
         Ok(Self {
-            max_request_size: config.request_max_size,
+            max_request_size: config.writer_request_max_size,
             config,
             shutdown_tx,
             sender_join_handle: join_handle,
diff --git a/fluss-rust/crates/fluss/src/cluster/cluster.rs b/fluss-rust/crates/fluss/src/cluster/cluster.rs
index 1f950ad6b9..5b1e08365c 100644
--- a/fluss-rust/crates/fluss/src/cluster/cluster.rs
+++ b/fluss-rust/crates/fluss/src/cluster/cluster.rs
@@ -16,7 +16,6 @@
 // under the License.
 
 use crate::cluster::{BucketLocation, ServerNode, ServerType};
-use crate::error::Error::PartitionNotExist;
 use crate::error::{Error, Result};
 use crate::metadata::{
     JsonSerde, PhysicalTablePath, TableBucket, TableDescriptor, TableInfo, TablePath,
@@ -318,12 +317,10 @@ impl Cluster {
         let partition_id = self.get_partition_id(physical_table_path);
 
         if physical_table_path.get_partition_name().is_some() && partition_id.is_none() {
-            return Err(PartitionNotExist {
-                message: format!(
-                    "The partition {} is not found in cluster",
-                    physical_table_path.get_partition_name().unwrap()
-                ),
-            });
+            return Err(Error::partition_not_exist(format!(
+                "The partition {} is not found in cluster",
+                physical_table_path.get_partition_name().unwrap()
+            )));
         }
 
         Ok(TableBucket::new_with_partition(
@@ -390,9 +387,7 @@ impl Cluster {
     pub fn get_table(&self, table_path: &TablePath) -> Result<&TableInfo> {
         self.table_info_by_path
             .get(table_path)
-            .ok_or_else(|| Error::InvalidTableError {
-                message: format!("Table info not found for {table_path}"),
-            })
+            .ok_or_else(|| Error::invalid_table(format!("Table info not found for {table_path}")))
     }
 
     pub fn opt_get_table(&self, table_path: &TablePath) -> Option<&TableInfo> {
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 972d15c622..92f0b0d95c 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -31,10 +31,10 @@ const DEFAULT_ACKS: &str = "all";
 #[command(author, version, about, long_about = None)]
 pub struct Config {
     #[arg(long, default_value_t = String::from(DEFAULT_BOOTSTRAP_SERVER))]
-    pub bootstrap_server: String,
+    pub bootstrap_servers: String,
 
     #[arg(long, default_value_t = DEFAULT_REQUEST_MAX_SIZE)]
-    pub request_max_size: i32,
+    pub writer_request_max_size: i32,
 
     #[arg(long, default_value_t = String::from(DEFAULT_ACKS))]
     pub writer_acks: String,
@@ -53,19 +53,19 @@ pub struct Config {
     /// Maximum concurrent remote log downloads
     /// Default: 3 (matching Java REMOTE_FILE_DOWNLOAD_THREAD_NUM)
     #[arg(long, default_value_t = DEFAULT_DOWNLOAD_THREADS)]
-    pub scanner_remote_log_download_threads: usize,
+    pub remote_file_download_thread_num: usize,
 }
 
 impl Default for Config {
     fn default() -> Self {
         Self {
-            bootstrap_server: String::from(DEFAULT_BOOTSTRAP_SERVER),
-            request_max_size: DEFAULT_REQUEST_MAX_SIZE,
+            bootstrap_servers: String::from(DEFAULT_BOOTSTRAP_SERVER),
+            writer_request_max_size: DEFAULT_REQUEST_MAX_SIZE,
             writer_acks: String::from(DEFAULT_ACKS),
             writer_retries: i32::MAX,
             writer_batch_size: DEFAULT_WRITER_BATCH_SIZE,
             scanner_remote_log_prefetch_num: DEFAULT_PREFETCH_NUM,
-            scanner_remote_log_download_threads: DEFAULT_DOWNLOAD_THREADS,
+            remote_file_download_thread_num: DEFAULT_DOWNLOAD_THREADS,
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index ef86530833..af9f274c77 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -57,12 +57,6 @@ pub enum Error {
         source: opendal::Error,
     },
 
-    #[snafu(
-        visibility(pub(crate)),
-        display("Fluss hitting invalid table error {}.", message)
-    )]
-    InvalidTableError { message: String },
-
     #[snafu(
         visibility(pub(crate)),
         display("Fluss hitting json serde error {}.", message)
@@ -93,18 +87,6 @@ pub enum Error {
     )]
     IllegalArgument { message: String },
 
-    #[snafu(
-        visibility(pub(crate)),
-        display("Fluss hitting invalid partition error {}.", message)
-    )]
-    InvalidPartition { message: String },
-
-    #[snafu(
-        visibility(pub(crate)),
-        display("Fluss hitting partition not exist error {}.", message)
-    )]
-    PartitionNotExist { message: String },
-
     #[snafu(
         visibility(pub(crate)),
         display("Fluss hitting IO not supported error {}.", message)
@@ -122,16 +104,60 @@ pub enum Error {
     )]
     UnsupportedOperation { message: String },
 
-    #[snafu(
-        visibility(pub(crate)),
-        display("Fluss hitting leader not available error {}.", message)
-    )]
-    LeaderNotAvailable { message: String },
-
     #[snafu(visibility(pub(crate)), display("Fluss API Error: {}.", api_error))]
     FlussAPIError { api_error: ApiError },
 }
 
+/// Client-side constructors for errors that mirror server-defined API errors.
+/// Each one wraps the message in `FlussAPIError` tagged with the matching protocol code,
+/// consistent with Java where e.g. `InvalidTableException` always carries code 15.
+impl Error {
+    /// Builds an API error tagged with the `InvalidTableException` code.
+    pub fn invalid_table(message: impl Into<String>) -> Self {
+        let api_error = ApiError {
+            code: FlussError::InvalidTableException.code(),
+            message: message.into(),
+        };
+        Self::FlussAPIError { api_error }
+    }
+
+    /// Builds an API error tagged with the `PartitionNotExists` code.
+    pub fn partition_not_exist(message: impl Into<String>) -> Self {
+        let api_error = ApiError {
+            code: FlussError::PartitionNotExists.code(),
+            message: message.into(),
+        };
+        Self::FlussAPIError { api_error }
+    }
+
+    /// Builds an API error tagged with the `PartitionSpecInvalidException` code.
+    pub fn invalid_partition(message: impl Into<String>) -> Self {
+        let api_error = ApiError {
+            code: FlussError::PartitionSpecInvalidException.code(),
+            message: message.into(),
+        };
+        Self::FlussAPIError { api_error }
+    }
+
+    /// Builds an API error tagged with the `LeaderNotAvailableException` code.
+    pub fn leader_not_available(message: impl Into<String>) -> Self {
+        let api_error = ApiError {
+            code: FlussError::LeaderNotAvailableException.code(),
+            message: message.into(),
+        };
+        Self::FlussAPIError { api_error }
+    }
+
+    /// Returns the API error kind when this is a `FlussAPIError`, so callers can
+    /// pattern-match on `FlussError` directly; returns `None` for every other variant.
+    pub fn api_error(&self) -> Option<FlussError> {
+        match self {
+            Self::FlussAPIError { api_error } => Some(FlussError::for_code(api_error.code)),
+            _ => None,
+        }
+    }
+}
+
 impl From<ArrowError> for Error {
     fn from(value: ArrowError) -> Self {
         Error::ArrowError {
diff --git a/fluss-rust/crates/fluss/src/metadata/json_serde.rs b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
index d58fb7ee8e..20f5d09757 100644
--- a/fluss-rust/crates/fluss/src/metadata/json_serde.rs
+++ b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
@@ -476,15 +476,17 @@ impl JsonSerde for Schema {
         let mut schema_builder = Schema::builder().with_columns(columns);
 
         if let Some(pk_node) = node.get(Self::PRIMARY_KEY_NAME) {
-            let pk_array = pk_node.as_array().ok_or_else(|| Error::InvalidTableError {
-                message: "Primary key must be an array".to_string(),
-            })?;
+            let pk_array = pk_node
+                .as_array()
+                .ok_or_else(|| Error::invalid_table("Primary key must be an array"))?;
 
             let mut primary_keys = Vec::with_capacity(pk_array.len());
             for name_node in pk_array {
-                primary_keys.push(name_node.as_str().ok_or_else(|| Error::InvalidTableError {
-                    message: "Primary key element must be a string".to_string(),
-                })?);
+                primary_keys.push(
+                    name_node.as_str().ok_or_else(|| {
+                        Error::invalid_table("Primary key element must be a string")
+                    })?,
+                );
             }
 
             schema_builder = schema_builder.primary_key(primary_keys);
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 66de2a9488..7f0d2e2a27 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -16,7 +16,7 @@
 // under the License.
 
 use crate::compression::ArrowCompressionInfo;
-use crate::error::Error::{IllegalArgument, InvalidTableError};
+use crate::error::Error::IllegalArgument;
 use crate::error::{Error, Result};
 use crate::metadata::DataLakeFormat;
 use crate::metadata::datatype::{DataField, DataType, RowType};
@@ -271,9 +271,9 @@ impl SchemaBuilder {
     ) -> Result<Vec<Column>> {
         let names: Vec<_> = columns.iter().map(|c| &c.name).collect();
         if let Some(duplicates) = Self::find_duplicates(&names) {
-            return Err(InvalidTableError {
-                message: format!("Duplicate column names found: {duplicates:?}"),
-            });
+            return Err(Error::invalid_table(format!(
+                "Duplicate column names found: {duplicates:?}"
+            )));
         }
 
         let Some(pk) = primary_key else {
@@ -283,9 +283,9 @@ impl SchemaBuilder {
         let pk_set: HashSet<_> = pk.column_names.iter().collect();
         let all_columns: HashSet<_> = columns.iter().map(|c| &c.name).collect();
         if !pk_set.is_subset(&all_columns) {
-            return Err(InvalidTableError {
-                message: format!("Primary key columns {pk_set:?} not found in schema"),
-            });
+            return Err(Error::invalid_table(format!(
+                "Primary key columns {pk_set:?} not found in schema"
+            )));
         }
 
         Ok(columns
@@ -506,13 +506,9 @@ impl TableDescriptor {
     pub fn replication_factor(&self) -> Result<i32> {
         self.properties
             .get("table.replication.factor")
-            .ok_or_else(|| InvalidTableError {
-                message: "Replication factor is not set".to_string(),
-            })?
+            .ok_or_else(|| Error::invalid_table("Replication factor is not set"))?
             .parse()
-            .map_err(|_e| InvalidTableError {
-                message: "Replication factor can't be convert into int".to_string(),
-            })
+            .map_err(|_e| Error::invalid_table("Replication factor can't be converted to int"))
     }
 
     pub fn with_properties<K: Into<String>, V: Into<String>>(
@@ -569,13 +565,11 @@ impl TableDescriptor {
         bucket_keys.retain(|k| !partition_keys.contains(k));
 
         if bucket_keys.is_empty() {
-            return Err(InvalidTableError {
-                message: format!(
-                    "Primary Key constraint {:?} should not be same with partition fields {:?}.",
-                    schema.primary_key().unwrap().column_names(),
-                    partition_keys
-                ),
-            });
+            return Err(Error::invalid_table(format!(
+                "Primary Key constraint {:?} should not be same with partition fields {:?}.",
+                schema.primary_key().unwrap().column_names(),
+                partition_keys
+            )));
         }
 
         Ok(bucket_keys)
@@ -592,12 +586,10 @@ impl TableDescriptor {
                 .iter()
                 .any(|k| partition_keys.contains(k))
             {
-                return Err(InvalidTableError {
-                    message: format!(
-                        "Bucket key {:?} shouldn't include any column in partition keys {:?}.",
-                        distribution.bucket_keys, partition_keys
-                    ),
-                });
+                return Err(Error::invalid_table(format!(
+                    "Bucket key {:?} shouldn't include any column in partition keys {:?}.",
+                    distribution.bucket_keys, partition_keys
+                )));
             }
 
             return if let Some(pk) = schema.primary_key() {
@@ -616,15 +608,13 @@ impl TableDescriptor {
                         .iter()
                         .all(|k| pk_columns.contains(k))
                     {
-                        return Err(InvalidTableError {
-                            message: format!(
-                                "Bucket keys must be a subset of primary keys excluding partition keys for primary-key tables. \
-                                The primary keys are {:?}, the partition keys are {:?}, but the user-defined bucket keys are {:?}.",
-                                pk.column_names(),
-                                partition_keys,
-                                distribution.bucket_keys
-                            ),
-                        });
+                        return Err(Error::invalid_table(format!(
+                            "Bucket keys must be a subset of primary keys excluding partition keys for primary-key tables. \
+                            The primary keys are {:?}, the partition keys are {:?}, but the user-defined bucket keys are {:?}.",
+                            pk.column_names(),
+                            partition_keys,
+                            distribution.bucket_keys
+                        )));
                     }
                     Ok(Some(distribution))
                 }
@@ -667,9 +657,7 @@ impl LogFormat {
         match s.to_uppercase().as_str() {
             "ARROW" => Ok(LogFormat::ARROW),
             "INDEXED" => Ok(LogFormat::INDEXED),
-            _ => Err(InvalidTableError {
-                message: format!("Unknown log format: {s}"),
-            }),
+            _ => Err(Error::invalid_table(format!("Unknown log format: {s}"))),
         }
     }
 }
@@ -695,9 +683,7 @@ impl KvFormat {
         match s.to_uppercase().as_str() {
             "INDEXED" => Ok(KvFormat::INDEXED),
             "COMPACTED" => Ok(KvFormat::COMPACTED),
-            _ => Err(InvalidTableError {
-                message: format!("Unknown kv format: {s}"),
-            }),
+            _ => Err(Error::invalid_table(format!("Unknown kv format: {s}"))),
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_database.rs b/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
index 7d24235a57..e03cd1ffa4 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
@@ -37,8 +37,8 @@ pub struct CreateDatabaseRequest {
 impl CreateDatabaseRequest {
     pub fn new(
         database_name: &str,
-        ignore_if_exists: bool,
         database_descriptor: Option<&DatabaseDescriptor>,
+        ignore_if_exists: bool,
     ) -> FlussResult<Self> {
         let database_json = if let Some(descriptor) = database_descriptor {
             Some(descriptor.to_json_bytes()?)
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index c6c98b85d4..121158c1d5 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -69,16 +69,16 @@ mod admin_test {
 
         let db_name = "test_create_database";
 
-        assert_eq!(admin.database_exists(db_name).await.unwrap(), false);
+        assert!(!admin.database_exists(db_name).await.unwrap());
 
         // create database
         admin
-            .create_database(db_name, false, Some(&db_descriptor))
+            .create_database(db_name, Some(&db_descriptor), false)
             .await
             .expect("should create database");
 
         // database should exist
-        assert_eq!(admin.database_exists(db_name).await.unwrap(), true);
+        assert!(admin.database_exists(db_name).await.unwrap());
 
         // get database
         let db_info = admin
@@ -96,7 +96,7 @@ mod admin_test {
             .expect("should drop_database");
 
         // database shouldn't exist now
-        assert_eq!(admin.database_exists(db_name).await.unwrap(), false);
+        assert!(!admin.database_exists(db_name).await.unwrap());
 
         // Note: We don't stop the shared cluster here as it's used by other tests
     }
@@ -115,9 +115,9 @@ mod admin_test {
             .comment("Database for test_create_table")
             .build();
 
-        assert_eq!(admin.database_exists(test_db_name).await.unwrap(), false);
+        assert!(!admin.database_exists(test_db_name).await.unwrap());
         admin
-            .create_database(test_db_name, false, Some(&db_descriptor))
+            .create_database(test_db_name, Some(&db_descriptor), false)
             .await
             .expect("Failed to create test database");
 
@@ -170,7 +170,7 @@ mod admin_test {
         );
 
         let table_info = admin
-            .get_table(&table_path)
+            .get_table_info(&table_path)
             .await
             .expect("Failed to get table info");
 
@@ -212,7 +212,7 @@ mod admin_test {
             .await
             .expect("Failed to drop table");
         // table shouldn't exist now
-        assert_eq!(admin.table_exists(&table_path).await.unwrap(), false);
+        assert!(!admin.table_exists(&table_path).await.unwrap());
 
         // drop database
         admin
@@ -221,7 +221,7 @@ mod admin_test {
             .expect("Should drop database");
 
         // database shouldn't exist now
-        assert_eq!(admin.database_exists(test_db_name).await.unwrap(), false);
+        assert!(!admin.database_exists(test_db_name).await.unwrap());
     }
 
     #[tokio::test]
@@ -239,7 +239,7 @@ mod admin_test {
             .build();
 
         admin
-            .create_database(test_db_name, true, Some(&db_descriptor))
+            .create_database(test_db_name, Some(&db_descriptor), true)
             .await
             .expect("Failed to create test database");
 
@@ -374,23 +374,185 @@ mod admin_test {
 
         let table_path = TablePath::new("fluss", "not_exist");
 
-        let result = admin.get_table(&table_path).await;
+        let result = admin.get_table_info(&table_path).await;
         assert!(result.is_err(), "Expected error but got Ok");
 
         let error = result.unwrap_err();
-        match error {
-            fluss::error::Error::FlussAPIError { api_error } => {
-                assert_eq!(
-                    api_error.code,
-                    FlussError::TableNotExist.code(),
-                    "Expected error code 7 (TableNotExist)"
-                );
-                assert_eq!(
-                    api_error.message, "Table 'fluss.not_exist' does not exist.",
-                    "Expected specific error message"
-                );
-            }
-            other => panic!("Expected FlussAPIError, got {:?}", other),
-        }
+        assert_eq!(
+            error.api_error(),
+            Some(FlussError::TableNotExist),
+            "Expected TableNotExist error, got {:?}",
+            error
+        );
+    }
+
+    /// Helper to assert that an error is a FlussAPIError with the expected code.
+    fn assert_api_error(error: fluss::error::Error, expected: FlussError) {
+        assert_eq!(
+            error.api_error(),
+            Some(expected),
+            "Expected {:?}, got {:?}",
+            expected,
+            error
+        );
+    }
+
+    #[tokio::test]
+    async fn test_error_database_not_exist() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().await.unwrap();
+
+        // get_database_info for non-existent database
+        let result = admin.get_database_info("no_such_db").await;
+        assert_api_error(result.unwrap_err(), FlussError::DatabaseNotExist);
+
+        // drop_database without ignore flag
+        let result = admin.drop_database("no_such_db", false, false).await;
+        assert_api_error(result.unwrap_err(), FlussError::DatabaseNotExist);
+
+        // list_tables for non-existent database
+        let result = admin.list_tables("no_such_db").await;
+        assert_api_error(result.unwrap_err(), FlussError::DatabaseNotExist);
+    }
+
+    #[tokio::test]
+    async fn test_error_database_already_exist() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().await.unwrap();
+
+        let db_name = "test_error_db_already_exist";
+        let descriptor = DatabaseDescriptorBuilder::default().build();
+
+        admin
+            .create_database(db_name, Some(&descriptor), false)
+            .await
+            .unwrap();
+
+        // create same database again without ignore flag
+        let result = admin
+            .create_database(db_name, Some(&descriptor), false)
+            .await;
+        assert_api_error(result.unwrap_err(), FlussError::DatabaseAlreadyExist);
+
+        // with ignore flag should succeed
+        admin
+            .create_database(db_name, Some(&descriptor), true)
+            .await
+            .expect("create_database with ignore_if_exists should succeed");
+
+        // cleanup
+        admin.drop_database(db_name, true, true).await.unwrap();
+    }
+
+    #[tokio::test]
+    async fn test_error_table_already_exist() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().await.unwrap();
+
+        let db_name = "test_error_tbl_already_exist_db";
+        let descriptor = DatabaseDescriptorBuilder::default().build();
+        admin
+            .create_database(db_name, Some(&descriptor), true)
+            .await
+            .unwrap();
+
+        let table_path = TablePath::new(db_name, "my_table");
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .build()
+            .unwrap();
+        let table_descriptor = TableDescriptor::builder()
+            .schema(schema)
+            .distributed_by(Some(1), vec![])
+            .property("table.replication.factor", "1")
+            .build()
+            .unwrap();
+
+        admin
+            .create_table(&table_path, &table_descriptor, false)
+            .await
+            .unwrap();
+
+        // create same table again without ignore flag
+        let result = admin
+            .create_table(&table_path, &table_descriptor, false)
+            .await;
+        assert_api_error(result.unwrap_err(), FlussError::TableAlreadyExist);
+
+        // with ignore flag should succeed
+        admin
+            .create_table(&table_path, &table_descriptor, true)
+            .await
+            .expect("create_table with ignore_if_exists should succeed");
+
+        // cleanup
+        admin.drop_table(&table_path, true).await.unwrap();
+        admin.drop_database(db_name, true, true).await.unwrap();
+    }
+
+    #[tokio::test]
+    async fn test_error_table_not_exist() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().await.unwrap();
+
+        let table_path = TablePath::new("fluss", "no_such_table");
+
+        // drop without ignore flag
+        let result = admin.drop_table(&table_path, false).await;
+        assert_api_error(result.unwrap_err(), FlussError::TableNotExist);
+
+        // drop with ignore flag should succeed
+        admin
+            .drop_table(&table_path, true)
+            .await
+            .expect("drop_table with ignore_if_not_exists should succeed");
+    }
+
+    #[tokio::test]
+    async fn test_error_table_not_partitioned() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().await.unwrap();
+
+        let db_name = "test_error_not_partitioned_db";
+        let descriptor = DatabaseDescriptorBuilder::default().build();
+        admin
+            .create_database(db_name, Some(&descriptor), true)
+            .await
+            .unwrap();
+
+        let table_path = TablePath::new(db_name, "non_partitioned_table");
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .build()
+            .unwrap();
+        let table_descriptor = TableDescriptor::builder()
+            .schema(schema)
+            .distributed_by(Some(1), vec![])
+            .property("table.replication.factor", "1")
+            .build()
+            .unwrap();
+
+        admin
+            .create_table(&table_path, &table_descriptor, false)
+            .await
+            .unwrap();
+
+        // list_partition_infos on non-partitioned table
+        let result = admin.list_partition_infos(&table_path).await;
+        assert_api_error(
+            result.unwrap_err(),
+            FlussError::TableNotPartitionedException,
+        );
+
+        // cleanup
+        admin.drop_table(&table_path, true).await.unwrap();
+        admin.drop_database(db_name, true, true).await.unwrap();
     }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
index a579303cf0..e4dcad9fd9 100644
--- a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
+++ b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
@@ -240,9 +240,11 @@ impl FlussTestingCluster {
     }
 
     pub async fn get_fluss_connection(&self) -> FlussConnection {
-        let mut config = Config::default();
-        config.writer_acks = "all".to_string();
-        config.bootstrap_server = self.bootstrap_servers.clone();
+        let config = Config {
+            writer_acks: "all".to_string(),
+            bootstrap_servers: self.bootstrap_servers.clone(),
+            ..Default::default()
+        };
 
         // Retry mechanism: retry for up to 1 minute
         let max_retries = 60; // 60 retry attempts
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index d80ce791a6..d837631ac7 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -115,7 +115,7 @@ mod table_test {
             .get_table(&table_path)
             .await
             .expect("Failed to get table");
-        let num_buckets = table.table_info().get_num_buckets();
+        let num_buckets = table.get_table_info().get_num_buckets();
         let log_scanner = table
             .new_scan()
             .create_log_scanner()
@@ -134,7 +134,7 @@ mod table_test {
             .expect("Failed to poll records");
 
         // Verify the scanned records
-        let table_bucket = TableBucket::new(table.table_info().table_id, 0);
+        let table_bucket = TableBucket::new(table.get_table_info().table_id, 0);
         let records = scan_records.records(&table_bucket);
 
         assert_eq!(records.len(), 6, "Expected 6 records");
@@ -664,7 +664,7 @@ mod table_test {
             .await
             .expect("Failed to get table");
 
-        let field_count = table.table_info().schema.columns().len();
+        let field_count = table.get_table_info().schema.columns().len();
 
         let append_writer = table
             .new_append()
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index baac77298a..210dfc4e5f 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -154,7 +154,7 @@ mod table_remote_scan_test {
         append_writer.flush().await.expect("Failed to flush");
 
         // Create a log scanner and subscribe to all buckets to read appended records
-        let num_buckets = table.table_info().get_num_buckets();
+        let num_buckets = table.get_table_info().get_num_buckets();
         let log_scanner = table
             .new_scan()
             .project(&[1, 0])
diff --git a/fluss-rust/docs/rust-client.md b/fluss-rust/docs/rust-client.md
index 779b974c28..2221658b49 100644
--- a/fluss-rust/docs/rust-client.md
+++ b/fluss-rust/docs/rust-client.md
@@ -118,7 +118,7 @@ use fluss::error::Result;
 #[tokio::main]
 async fn main() -> Result<()> {
     let mut config = Config::default();
-    config.bootstrap_server = "127.0.0.1:9123".to_string();
+    config.bootstrap_servers = "127.0.0.1:9123".to_string();
 
     let conn = FlussConnection::new(config).await?;
 
@@ -132,8 +132,8 @@ async fn main() -> Result<()> {
 
 | Option | Description | Default |
 |--------|-------------|---------|
-| `bootstrap_server` | Coordinator server address | `127.0.0.1:9123` |
-| `request_max_size` | Maximum request size in bytes | 10 MB |
+| `bootstrap_servers` | Coordinator server address | `127.0.0.1:9123` |
+| `writer_request_max_size` | Maximum request size in bytes | 10 MB |
 | `writer_acks` | Acknowledgment setting (`all` waits for all replicas) | `all` |
 | `writer_retries` | Number of retries on failure | `i32::MAX` |
 | `writer_batch_size` | Batch size for writes | 2 MB |
@@ -150,7 +150,7 @@ let admin = conn.get_admin().await?;
 
 ```rust
 // Create database
-admin.create_database("my_database", true, None).await?;
+admin.create_database("my_database", None, true).await?;
 
 // List all databases
 let databases = admin.list_databases().await?;
@@ -188,7 +188,7 @@ let table_path = TablePath::new("my_database", "my_table");
 admin.create_table(&table_path, &table_descriptor, true).await?;
 
 // Get table information
-let table_info = admin.get_table(&table_path).await?;
+let table_info = admin.get_table_info(&table_path).await?;
 println!("Table: {}", table_info);
 
 // List tables in database

From 2865891c0f3cb76c2e4c3dd3860f731cf19318e3 Mon Sep 17 00:00:00 2001
From: Junfan Zhang <junfan.zhang@outlook.com>
Date: Fri, 13 Feb 2026 11:50:59 +0800
Subject: [PATCH 140/287] chore: align DataLakeFormat parsing with lake format
 config option (#306)

---
 .../fluss/src/metadata/data_lake_format.rs    | 37 +++++++++++++++++--
 1 file changed, 34 insertions(+), 3 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs b/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
index c1861098c3..b0c3b0d7b3 100644
--- a/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
+++ b/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
@@ -23,11 +23,42 @@ use strum_macros::{Display, EnumString};
 /// between different table formats so that the appropriate integration and
 /// semantics can be applied.
 #[derive(Debug, EnumString, Display, PartialEq)]
+#[strum(ascii_case_insensitive)]
 pub enum DataLakeFormat {
-    /// Apache Paimon data lake table format.
+    #[strum(serialize = "paimon")]
     Paimon,
-    /// Lance columnar data format / lakehouse table format.
+
+    #[strum(serialize = "lance")]
     Lance,
-    /// Apache Iceberg data lake table format.
+
+    #[strum(serialize = "iceberg")]
     Iceberg,
 }
+
+#[cfg(test)]
+mod tests {
+    use crate::metadata::DataLakeFormat;
+    use crate::metadata::DataLakeFormat::{Iceberg, Lance, Paimon};
+
+    #[test]
+    fn test_parse() {
+        let cases = vec![
+            ("paimon", Paimon),
+            ("Paimon", Paimon),
+            ("PAIMON", Paimon),
+            ("lance", Lance),
+            ("LANCE", Lance),
+            ("iceberg", Iceberg),
+            ("ICEBERG", Iceberg),
+        ];
+
+        for (raw, expected) in cases {
+            let parsed = raw.parse::<DataLakeFormat>().unwrap();
+            assert_eq!(parsed, expected, "failed to parse: {}", raw);
+        }
+
+        // negative cases
+        assert!("unknown".parse::<DataLakeFormat>().is_err());
+        assert!("".parse::<DataLakeFormat>().is_err());
+    }
+}

From 7ec82a549d0571b4b0d61a6a0382c51ebe54f89d Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Fri, 13 Feb 2026 09:21:24 +0000
Subject: [PATCH 141/287] feat: add unsubscribe to all clients (#305)

---
 fluss-rust/bindings/cpp/examples/example.cpp  |  30 +++
 fluss-rust/bindings/cpp/include/fluss.hpp     |   1 +
 fluss-rust/bindings/cpp/src/lib.rs            | 251 +++++++-----------
 fluss-rust/bindings/cpp/src/table.cpp         |   9 +
 fluss-rust/bindings/python/API_REFERENCE.md   |   1 +
 fluss-rust/bindings/python/example/example.py |  14 +
 fluss-rust/bindings/python/fluss/__init__.pyi |   7 +
 fluss-rust/bindings/python/src/table.rs       |  13 +
 .../crates/fluss/src/client/table/scanner.rs  |  23 ++
 .../fluss/tests/integration/log_table.rs      |  12 +
 fluss-rust/docs/rust-client.md                |   7 +
 11 files changed, 207 insertions(+), 161 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index e1925bb43c..2c7f55452d 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -345,6 +345,11 @@ int main() {
         std::cout << "  ... and " << (batch_records.Size() - 5) << " more records" << std::endl;
     }
 
+    // 9.1) Unsubscribe from a bucket
+    std::cout << "\n=== Unsubscribe Example ===" << std::endl;
+    check("unsubscribe", batch_scanner.Unsubscribe(subscriptions[0].bucket_id));
+    std::cout << "Unsubscribed from bucket " << subscriptions[0].bucket_id << std::endl;
+
     // 10) Arrow record batch polling
     std::cout << "\n=== Testing Arrow Record Batch Polling ===" << std::endl;
 
@@ -589,6 +594,31 @@ int main() {
                   << std::endl;
     }
 
+    // 13.3) UnsubscribePartition: unsubscribe from one partition, verify remaining
+    std::cout << "\n--- Testing UnsubscribePartition ---" << std::endl;
+    fluss::LogScanner unsub_partition_scanner;
+    check("new_unsub_partition_scanner",
+          partitioned_table.NewScan().CreateLogScanner(unsub_partition_scanner));
+
+    for (const auto& pi : partition_infos) {
+        check("subscribe_for_unsub",
+              unsub_partition_scanner.SubscribePartitionBuckets(pi.partition_id, 0, 0));
+    }
+    // Unsubscribe from the first partition
+    check("unsubscribe_partition",
+          unsub_partition_scanner.UnsubscribePartition(partition_infos[0].partition_id, 0));
+    std::cout << "Unsubscribed from partition " << partition_infos[0].partition_name << std::endl;
+
+    fluss::ScanRecords unsub_records;
+    check("poll_after_unsub", unsub_partition_scanner.Poll(5000, unsub_records));
+    std::cout << "After unsubscribe, scanned " << unsub_records.Size() << " records" << std::endl;
+    for (size_t i = 0; i < unsub_records.Size(); ++i) {
+        const auto& rec = unsub_records[i];
+        std::cout << "  Record " << i << ": id=" << rec.row.GetInt32(0)
+                  << ", region=" << rec.row.GetString(1) << ", value=" << rec.row.GetInt64(2)
+                  << std::endl;
+    }
+
     // Cleanup
     check("drop_partitioned_table", admin.DropTable(partitioned_table_path, true));
     std::cout << "Dropped partitioned table" << std::endl;
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 2fce8eb944..926fbc66a2 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -1278,6 +1278,7 @@ class LogScanner {
     Result Subscribe(const std::vector<BucketSubscription>& bucket_offsets);
     Result SubscribePartitionBuckets(int64_t partition_id, int32_t bucket_id, int64_t start_offset);
     Result SubscribePartitionBuckets(const std::vector<PartitionBucketSubscription>& subscriptions);
+    Result Unsubscribe(int32_t bucket_id);
     Result UnsubscribePartition(int64_t partition_id, int32_t bucket_id);
     Result Poll(int64_t timeout_ms, ScanRecords& out);
     Result PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out);
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index b5a5139cce..8a5bdfdd66 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -384,6 +384,7 @@ mod ffi {
             self: &LogScanner,
             subscriptions: Vec<FfiPartitionBucketSubscription>,
         ) -> FfiResult;
+        fn unsubscribe(self: &LogScanner, bucket_id: i32) -> FfiResult;
         fn unsubscribe_partition(self: &LogScanner, partition_id: i64, bucket_id: i32)
         -> FfiResult;
         fn poll(self: &LogScanner, timeout_ms: i64) -> FfiScanRecordsResult;
@@ -419,9 +420,13 @@ pub struct WriteResult {
     inner: Option<fcore::client::WriteResultFuture>,
 }
 
+enum ScannerKind {
+    Record(fcore::client::LogScanner),
+    Batch(fcore::client::RecordBatchLogScanner),
+}
+
 pub struct LogScanner {
-    inner: Option<fcore::client::LogScanner>,
-    inner_batch: Option<fcore::client::RecordBatchLogScanner>,
+    scanner: ScannerKind,
     /// Fluss columns matching the projected Arrow fields (1:1 by index).
     /// For non-projected scanners this is the full table schema columns.
     projected_columns: Vec<fcore::metadata::Column>,
@@ -1009,21 +1014,20 @@ impl Table {
                 (cols, scan)
             };
 
-            let (inner, inner_batch) = if batch {
-                let batch_scanner = scan
+            let scanner = if batch {
+                let s = scan
                     .create_record_batch_log_scanner()
                     .map_err(|e| format!("Failed to create record batch log scanner: {e}"))?;
-                (None, Some(batch_scanner))
+                ScannerKind::Batch(s)
             } else {
-                let log_scanner = scan
+                let s = scan
                     .create_log_scanner()
                     .map_err(|e| format!("Failed to create log scanner: {e}"))?;
-                (Some(log_scanner), None)
+                ScannerKind::Record(s)
             };
 
             Ok(Box::into_raw(Box::new(LogScanner {
-                inner,
-                inner_batch,
+                scanner,
                 projected_columns,
             })))
         })
@@ -1291,75 +1295,34 @@ pub extern "C" fn free_arrow_ffi_structures(array_ptr: usize, schema_ptr: usize)
     }
 }
 
-impl LogScanner {
-    fn subscribe(&self, bucket_id: i32, start_offset: i64) -> ffi::FfiResult {
-        self.do_subscribe(None, bucket_id, start_offset)
-    }
-
-    fn do_subscribe(
-        &self,
-        partition_id: Option<PartitionId>,
-        bucket_id: i32,
-        start_offset: i64,
-    ) -> ffi::FfiResult {
-        if let Some(ref inner) = self.inner {
-            let result = RUNTIME.block_on(async {
-                if let Some(partition_id) = partition_id {
-                    inner
-                        .subscribe_partition(partition_id, bucket_id, start_offset)
-                        .await
-                } else {
-                    inner.subscribe(bucket_id, start_offset).await
-                }
-            });
-            match result {
-                Ok(_) => ok_result(),
-                Err(e) => err_from_core_error(&e),
+/// Dispatch a method call to whichever scanner variant is active.
+/// Both LogScanner and RecordBatchLogScanner share the same subscribe/unsubscribe interface.
+macro_rules! dispatch_scanner {
+    ($self:expr, $method:ident($($arg:expr),*)) => {
+        match RUNTIME.block_on(async {
+            match &$self.scanner {
+                ScannerKind::Record(s) => s.$method($($arg),*).await,
+                ScannerKind::Batch(s) => s.$method($($arg),*).await,
             }
-        } else if let Some(ref inner_batch) = self.inner_batch {
-            let result = RUNTIME.block_on(async {
-                if let Some(partition_id) = partition_id {
-                    inner_batch
-                        .subscribe_partition(partition_id, bucket_id, start_offset)
-                        .await
-                } else {
-                    inner_batch.subscribe(bucket_id, start_offset).await
-                }
-            });
-            match result {
-                Ok(_) => ok_result(),
-                Err(e) => err_from_core_error(&e),
-            }
-        } else {
-            client_err("LogScanner not initialized".to_string())
+        }) {
+            Ok(_) => ok_result(),
+            Err(e) => err_from_core_error(&e),
         }
+    };
+}
+
+impl LogScanner {
+    fn subscribe(&self, bucket_id: i32, start_offset: i64) -> ffi::FfiResult {
+        dispatch_scanner!(self, subscribe(bucket_id, start_offset))
     }
 
     fn subscribe_buckets(&self, subscriptions: Vec<ffi::FfiBucketSubscription>) -> ffi::FfiResult {
         use std::collections::HashMap;
-        let mut bucket_offsets = HashMap::new();
-        for sub in subscriptions {
-            bucket_offsets.insert(sub.bucket_id, sub.offset);
-        }
-
-        if let Some(ref inner) = self.inner {
-            let result = RUNTIME.block_on(async { inner.subscribe_buckets(&bucket_offsets).await });
-
-            match result {
-                Ok(_) => ok_result(),
-                Err(e) => err_from_core_error(&e),
-            }
-        } else if let Some(ref inner_batch) = self.inner_batch {
-            let result =
-                RUNTIME.block_on(async { inner_batch.subscribe_buckets(&bucket_offsets).await });
-
-            match result {
-                Ok(_) => ok_result(),
-                Err(e) => err_from_core_error(&e),
-            }
-        } else {
-            client_err("LogScanner not initialized".to_string())
-        }
+        let bucket_offsets: HashMap<i32, i64> = subscriptions
+            .into_iter()
+            .map(|s| (s.bucket_id, s.offset))
+            .collect();
+        dispatch_scanner!(self, subscribe_buckets(&bucket_offsets))
     }
 
     fn subscribe_partition(
@@ -1368,7 +1331,10 @@ impl LogScanner {
         bucket_id: i32,
         start_offset: i64,
     ) -> ffi::FfiResult {
-        self.do_subscribe(Some(partition_id), bucket_id, start_offset)
+        dispatch_scanner!(
+            self,
+            subscribe_partition(partition_id, bucket_id, start_offset)
+        )
     }
 
     fn subscribe_partition_buckets(
@@ -1376,115 +1342,78 @@ impl LogScanner {
         subscriptions: Vec<ffi::FfiPartitionBucketSubscription>,
     ) -> ffi::FfiResult {
         use std::collections::HashMap;
-        let mut partition_bucket_offsets: HashMap<(PartitionId, i32), i64> = HashMap::new();
-        for sub in subscriptions {
-            partition_bucket_offsets.insert((sub.partition_id, sub.bucket_id), sub.offset);
-        }
+        let offsets: HashMap<(PartitionId, i32), i64> = subscriptions
+            .into_iter()
+            .map(|s| ((s.partition_id, s.bucket_id), s.offset))
+            .collect();
+        dispatch_scanner!(self, subscribe_partition_buckets(&offsets))
+    }
 
-        if let Some(ref inner) = self.inner {
-            let result = RUNTIME.block_on(async {
-                inner
-                    .subscribe_partition_buckets(&partition_bucket_offsets)
-                    .await
-            });
-            match result {
-                Ok(_) => ok_result(),
-                Err(e) => err_from_core_error(&e),
-            }
-        } else if let Some(ref inner_batch) = self.inner_batch {
-            let result = RUNTIME.block_on(async {
-                inner_batch
-                    .subscribe_partition_buckets(&partition_bucket_offsets)
-                    .await
-            });
-            match result {
-                Ok(_) => ok_result(),
-                Err(e) => err_from_core_error(&e),
-            }
-        } else {
-            client_err("LogScanner not initialized".to_string())
-        }
+    fn unsubscribe(&self, bucket_id: i32) -> ffi::FfiResult {
+        dispatch_scanner!(self, unsubscribe(bucket_id))
     }
 
     fn unsubscribe_partition(&self, partition_id: PartitionId, bucket_id: i32) -> ffi::FfiResult {
-        if let Some(ref inner) = self.inner {
-            match RUNTIME
-                .block_on(async { inner.unsubscribe_partition(partition_id, bucket_id).await })
-            {
-                Ok(_) => ok_result(),
-                Err(e) => err_from_core_error(&e),
-            }
-        } else if let Some(ref inner_batch) = self.inner_batch {
-            match RUNTIME.block_on(async {
-                inner_batch
-                    .unsubscribe_partition(partition_id, bucket_id)
-                    .await
-            }) {
-                Ok(_) => ok_result(),
-                Err(e) => err_from_core_error(&e),
-            }
-        } else {
-            client_err("LogScanner not initialized".to_string())
-        }
+        dispatch_scanner!(self, unsubscribe_partition(partition_id, bucket_id))
     }
 
     fn poll(&self, timeout_ms: i64) -> ffi::FfiScanRecordsResult {
-        if let Some(ref inner) = self.inner {
-            let timeout = Duration::from_millis(timeout_ms as u64);
-            let result = RUNTIME.block_on(async { inner.poll(timeout).await });
+        let ScannerKind::Record(ref inner) = self.scanner else {
+            return ffi::FfiScanRecordsResult {
+                result: client_err("Record-based scanner not available".to_string()),
+                scan_records: ffi::FfiScanRecords { records: vec![] },
+            };
+        };
 
-            match result {
-                Ok(records) => {
-                    match types::core_scan_records_to_ffi(&records, &self.projected_columns) {
-                        Ok(scan_records) => ffi::FfiScanRecordsResult {
-                            result: ok_result(),
-                            scan_records,
-                        },
-                        Err(e) => ffi::FfiScanRecordsResult {
-                            result: client_err(e.to_string()),
-                            scan_records: ffi::FfiScanRecords { records: vec![] },
-                        },
-                    }
+        let timeout = Duration::from_millis(timeout_ms as u64);
+        let result = RUNTIME.block_on(async { inner.poll(timeout).await });
+
+        match result {
+            Ok(records) => {
+                match types::core_scan_records_to_ffi(&records, &self.projected_columns) {
+                    Ok(scan_records) => ffi::FfiScanRecordsResult {
+                        result: ok_result(),
+                        scan_records,
+                    },
+                    Err(e) => ffi::FfiScanRecordsResult {
+                        result: client_err(e.to_string()),
+                        scan_records: ffi::FfiScanRecords { records: vec![] },
+                    },
                 }
-                Err(e) => ffi::FfiScanRecordsResult {
-                    result: err_from_core_error(&e),
-                    scan_records: ffi::FfiScanRecords { records: vec![] },
-                },
             }
-        } else {
-            ffi::FfiScanRecordsResult {
-                result: client_err("Record-based scanner not available".to_string()),
+            Err(e) => ffi::FfiScanRecordsResult {
+                result: err_from_core_error(&e),
                 scan_records: ffi::FfiScanRecords { records: vec![] },
-            }
+            },
         }
     }
 
     fn poll_record_batch(&self, timeout_ms: i64) -> ffi::FfiArrowRecordBatchesResult {
-        if let Some(ref inner_batch) = self.inner_batch {
-            let timeout = Duration::from_millis(timeout_ms as u64);
-            let result = RUNTIME.block_on(async { inner_batch.poll(timeout).await });
+        let ScannerKind::Batch(ref inner_batch) = self.scanner else {
+            return ffi::FfiArrowRecordBatchesResult {
+                result: client_err("Batch-based scanner not available".to_string()),
+                arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
+            };
+        };
 
-            match result {
-                Ok(batches) => match types::core_scan_batches_to_ffi(&batches) {
-                    Ok(arrow_batches) => ffi::FfiArrowRecordBatchesResult {
-                        result: ok_result(),
-                        arrow_batches,
-                    },
-                    Err(e) => ffi::FfiArrowRecordBatchesResult {
-                        result: client_err(e),
-                        arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
-                    },
+        let timeout = Duration::from_millis(timeout_ms as u64);
+        let result = RUNTIME.block_on(async { inner_batch.poll(timeout).await });
+
+        match result {
+            Ok(batches) => match types::core_scan_batches_to_ffi(&batches) {
+                Ok(arrow_batches) => ffi::FfiArrowRecordBatchesResult {
+                    result: ok_result(),
+                    arrow_batches,
                 },
                 Err(e) => ffi::FfiArrowRecordBatchesResult {
-                    result: err_from_core_error(&e),
+                    result: client_err(e),
                     arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
                 },
-            }
-        } else {
-            ffi::FfiArrowRecordBatchesResult {
-                result: client_err("Batch-based scanner not available".to_string()),
+            },
+            Err(e) => ffi::FfiArrowRecordBatchesResult {
+                result: err_from_core_error(&e),
                 arrow_batches: ffi::FfiArrowRecordBatches { batches: vec![] },
-            }
+            },
         }
     }
 }
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index 078b1bc2c8..19fd72dd5f 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -640,6 +640,15 @@ Result LogScanner::SubscribePartitionBuckets(
     return utils::from_ffi_result(ffi_result);
 }
 
+Result LogScanner::Unsubscribe(int32_t bucket_id) {
+    if (!Available()) {
+        return utils::make_client_error("LogScanner not available");
+    }
+
+    auto ffi_result = scanner_->unsubscribe(bucket_id);
+    return utils::from_ffi_result(ffi_result);
+}
+
 Result LogScanner::UnsubscribePartition(int64_t partition_id, int32_t bucket_id) {
     if (!Available()) {
         return utils::make_client_error("LogScanner not available");
diff --git a/fluss-rust/bindings/python/API_REFERENCE.md b/fluss-rust/bindings/python/API_REFERENCE.md
index e16a82f87d..3749ee1d87 100644
--- a/fluss-rust/bindings/python/API_REFERENCE.md
+++ b/fluss-rust/bindings/python/API_REFERENCE.md
@@ -146,6 +146,7 @@ Builder for creating a `Lookuper`. Obtain via `FlussTable.new_lookup()`.
 | `.subscribe_buckets(bucket_offsets)` | Subscribe to multiple buckets (`{bucket_id: offset}`) |
 | `.subscribe_partition(partition_id, bucket_id, start_offset)` | Subscribe to a partition bucket |
 | `.subscribe_partition_buckets(partition_bucket_offsets)` | Subscribe to multiple partition+bucket combos (`{(part_id, bucket_id): offset}`) |
+| `.unsubscribe(bucket_id)` | Unsubscribe from a bucket (non-partitioned tables) |
 | `.unsubscribe_partition(partition_id, bucket_id)` | Unsubscribe from a partition bucket |
 | `.poll(timeout_ms) -> list[ScanRecord]` | Poll individual records (record scanner only) |
 | `.poll_arrow(timeout_ms) -> pa.Table` | Poll as Arrow Table (batch scanner only) |
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 8e68843266..4ea3bd6a47 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -374,6 +374,20 @@ async def main():
     except Exception as e:
         print(f"Error during record scanning: {e}")
 
+    # Demo: unsubscribe — unsubscribe from a bucket (non-partitioned tables)
+    print("\n--- Testing unsubscribe ---")
+    try:
+        unsub_scanner = await table.new_scan().create_record_batch_log_scanner()
+        unsub_scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+        print(f"Subscribed to {num_buckets} buckets")
+        # Unsubscribe from bucket 0 — future polls will skip this bucket
+        unsub_scanner.unsubscribe(bucket_id=0)
+        print("Unsubscribed from bucket 0")
+        remaining = unsub_scanner.poll_arrow(5000)
+        print(f"After unsubscribe, got {remaining.num_rows} records (from remaining buckets)")
+    except Exception as e:
+        print(f"Error during unsubscribe test: {e}")
+
     # =====================================================
     # Demo: Primary Key Table with Lookup and Upsert
     # =====================================================
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 55837de536..dff90c38f8 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -573,6 +573,13 @@ class LogScanner:
                 Example: {(partition_id_1, 0): EARLIEST_OFFSET, (partition_id_2, 1): 100}
         """
         ...
+    def unsubscribe(self, bucket_id: int) -> None:
+        """Unsubscribe from a specific bucket (non-partitioned tables only).
+
+        Args:
+            bucket_id: The bucket ID to unsubscribe from
+        """
+        ...
     def unsubscribe_partition(self, partition_id: int, bucket_id: int) -> None:
         """Unsubscribe from a specific partition bucket (partitioned tables only).
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 6ec2d257cb..80852152e1 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -1703,6 +1703,19 @@ impl LogScanner {
         })
     }
 
+    /// Unsubscribe from a specific bucket (non-partitioned tables only).
+    ///
+    /// Args:
+    ///     bucket_id: The bucket ID to unsubscribe from
+    fn unsubscribe(&self, py: Python, bucket_id: i32) -> PyResult<()> {
+        py.detach(|| {
+            TOKIO_RUNTIME.block_on(async {
+                with_scanner!(&self.scanner, unsubscribe(bucket_id))
+                    .map_err(|e| FlussError::from_core_error(&e))
+            })
+        })
+    }
+
     /// Unsubscribe from a specific partition bucket (partitioned tables only).
     ///
     /// Args:
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 86f4aec9f2..0900267b80 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -434,6 +434,21 @@ impl LogScannerInner {
         Ok(())
     }
 
+    async fn unsubscribe(&self, bucket: i32) -> Result<()> {
+        if self.is_partitioned_table {
+            return Err(Error::UnsupportedOperation {
+                message:
+                    "The table is a partitioned table, please use \"unsubscribe_partition\" to \
+                    unsubscribe a partitioned bucket instead."
+                        .to_string(),
+            });
+        }
+        let table_bucket = TableBucket::new(self.table_id, bucket);
+        self.log_scanner_status
+            .unassign_scan_buckets(from_ref(&table_bucket));
+        Ok(())
+    }
+
     async fn unsubscribe_partition(&self, partition_id: PartitionId, bucket: i32) -> Result<()> {
         if !self.is_partitioned_table {
             return Err(Error::UnsupportedOperation {
@@ -535,6 +550,10 @@ impl LogScanner {
             .await
     }
 
+    pub async fn unsubscribe(&self, bucket: i32) -> Result<()> {
+        self.inner.unsubscribe(bucket).await
+    }
+
     pub async fn unsubscribe_partition(
         &self,
         partition_id: PartitionId,
@@ -589,6 +608,10 @@ impl RecordBatchLogScanner {
             .await
     }
 
+    pub async fn unsubscribe(&self, bucket: i32) -> Result<()> {
+        self.inner.unsubscribe(bucket).await
+    }
+
     pub async fn unsubscribe_partition(
         &self,
         partition_id: PartitionId,
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index d837631ac7..22e893cb5d 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -158,6 +158,18 @@ mod table_test {
                 i
             );
         }
+
+        // Test unsubscribe: unsubscribe from bucket 0, verify no error
+        log_scanner
+            .unsubscribe(0)
+            .await
+            .expect("Failed to unsubscribe from bucket 0");
+
+        // Verify unsubscribe_partition fails on a non-partitioned table
+        assert!(
+            log_scanner.unsubscribe_partition(0, 0).await.is_err(),
+            "unsubscribe_partition should fail on a non-partitioned table"
+        );
     }
 
     #[tokio::test]
diff --git a/fluss-rust/docs/rust-client.md b/fluss-rust/docs/rust-client.md
index 2221658b49..0396882904 100644
--- a/fluss-rust/docs/rust-client.md
+++ b/fluss-rust/docs/rust-client.md
@@ -384,6 +384,13 @@ bucket_offsets.insert(1, 100i64);  // bucket 1 from offset 100
 log_scanner.subscribe_buckets(&bucket_offsets).await?;
 ```
 
+### Unsubscribe from a Bucket
+
+```rust
+// Unsubscribe from a specific bucket (non-partitioned tables)
+log_scanner.unsubscribe(bucket_id).await?;
+```
+
 ### Unsubscribe from a Partition
 
 ```rust

From 110690c60e3eb3d3d61b633b266508469fb4035b Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Fri, 13 Feb 2026 14:46:58 +0000
Subject: [PATCH 142/287] chore: Fix issue where FixedSizeBinary type cannot
 be built in arrow (#304)

---
 fluss-rust/crates/fluss/src/record/arrow.rs   | 13 +++--
 fluss-rust/crates/fluss/src/row/datum.rs      | 48 ++++++++++++++++---
 .../fluss/tests/integration/log_table.rs      | 25 ++++++----
 3 files changed, 66 insertions(+), 20 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index fe2f2f4463..7fb9d34a0e 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -24,11 +24,11 @@ use crate::row::field_getter::FieldGetter;
 use crate::row::{ColumnarRow, InternalRow};
 use arrow::array::{
     ArrayBuilder, ArrayRef, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
-    Float32Builder, Float64Builder, Int8Builder, Int16Builder, Int32Builder, Int64Builder,
-    StringBuilder, Time32MillisecondBuilder, Time32SecondBuilder, Time64MicrosecondBuilder,
-    Time64NanosecondBuilder, TimestampMicrosecondBuilder, TimestampMillisecondBuilder,
-    TimestampNanosecondBuilder, TimestampSecondBuilder, UInt8Builder, UInt16Builder, UInt32Builder,
-    UInt64Builder,
+    FixedSizeBinaryBuilder, Float32Builder, Float64Builder, Int8Builder, Int16Builder,
+    Int32Builder, Int64Builder, StringBuilder, Time32MillisecondBuilder, Time32SecondBuilder,
+    Time64MicrosecondBuilder, Time64NanosecondBuilder, TimestampMicrosecondBuilder,
+    TimestampMillisecondBuilder, TimestampNanosecondBuilder, TimestampSecondBuilder, UInt8Builder,
+    UInt16Builder, UInt32Builder, UInt64Builder,
 };
 use arrow::{
     array::RecordBatch,
@@ -266,6 +266,9 @@ impl RowAppendRecordBatchBuilder {
             arrow_schema::DataType::Boolean => Ok(Box::new(BooleanBuilder::new())),
             arrow_schema::DataType::Utf8 => Ok(Box::new(StringBuilder::new())),
             arrow_schema::DataType::Binary => Ok(Box::new(BinaryBuilder::new())),
+            arrow_schema::DataType::FixedSizeBinary(size) => {
+                Ok(Box::new(FixedSizeBinaryBuilder::new(*size)))
+            }
             arrow_schema::DataType::Decimal128(precision, scale) => {
                 let builder = Decimal128Builder::new()
                     .with_precision_and_scale(*precision, *scale)
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index e1b70adca2..b370fb1d89 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -19,13 +19,14 @@ use crate::error::Error::RowConvertError;
 use crate::error::Result;
 use crate::row::Decimal;
 use arrow::array::{
-    ArrayBuilder, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder, Float32Builder,
-    Float64Builder, Int8Builder, Int16Builder, Int32Builder, Int64Builder, StringBuilder,
-    Time32MillisecondBuilder, Time32SecondBuilder, Time64MicrosecondBuilder,
-    Time64NanosecondBuilder, TimestampMicrosecondBuilder, TimestampMillisecondBuilder,
-    TimestampNanosecondBuilder, TimestampSecondBuilder,
+    ArrayBuilder, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
+    FixedSizeBinaryBuilder, Float32Builder, Float64Builder, Int8Builder, Int16Builder,
+    Int32Builder, Int64Builder, StringBuilder, Time32MillisecondBuilder, Time32SecondBuilder,
+    Time64MicrosecondBuilder, Time64NanosecondBuilder, TimestampMicrosecondBuilder,
+    TimestampMillisecondBuilder, TimestampNanosecondBuilder, TimestampSecondBuilder,
 };
 use arrow::datatypes as arrow_schema;
+use arrow::error::ArrowError;
 use jiff::ToSpan;
 use ordered_float::OrderedFloat;
 use parse_display::Display;
@@ -439,6 +440,24 @@ fn millis_nanos_to_nanos(millis: i64, nanos: i32) -> Result<i64> {
         })
 }
 
+trait AppendResult {
+    fn into_append_result(self) -> Result<()>;
+}
+
+impl AppendResult for () {
+    fn into_append_result(self) -> Result<()> {
+        Ok(())
+    }
+}
+
+impl AppendResult for std::result::Result<(), ArrowError> {
+    fn into_append_result(self) -> Result<()> {
+        self.map_err(|e| RowConvertError {
+            message: format!("Failed to append value: {e}"),
+        })
+    }
+}
+
 impl Datum<'_> {
     pub fn append_to(
         &self,
@@ -457,7 +476,7 @@ impl Datum<'_> {
         macro_rules! append_value_to_arrow {
             ($builder_type:ty, $value:expr) => {
                 if let Some(b) = builder.as_any_mut().downcast_mut::<$builder_type>() {
-                    b.append_value($value);
+                    b.append_value($value).into_append_result()?;
                     return Ok(());
                 }
             };
@@ -474,6 +493,7 @@ impl Datum<'_> {
                 append_null_to_arrow!(Float64Builder);
                 append_null_to_arrow!(StringBuilder);
                 append_null_to_arrow!(BinaryBuilder);
+                append_null_to_arrow!(FixedSizeBinaryBuilder);
                 append_null_to_arrow!(Decimal128Builder);
                 append_null_to_arrow!(Date32Builder);
                 append_null_to_arrow!(Time32SecondBuilder);
@@ -493,7 +513,21 @@ impl Datum<'_> {
             Datum::Float32(v) => append_value_to_arrow!(Float32Builder, v.into_inner()),
             Datum::Float64(v) => append_value_to_arrow!(Float64Builder, v.into_inner()),
             Datum::String(v) => append_value_to_arrow!(StringBuilder, v.as_ref()),
-            Datum::Blob(v) => append_value_to_arrow!(BinaryBuilder, v.as_ref()),
+            Datum::Blob(v) => match data_type {
+                arrow_schema::DataType::Binary => {
+                    append_value_to_arrow!(BinaryBuilder, v.as_ref());
+                }
+                arrow_schema::DataType::FixedSizeBinary(_) => {
+                    append_value_to_arrow!(FixedSizeBinaryBuilder, v.as_ref());
+                }
+                _ => {
+                    return Err(RowConvertError {
+                        message: format!(
+                            "Expected Binary or FixedSizeBinary Arrow type, got: {data_type:?}"
+                        ),
+                    });
+                }
+            },
             Datum::Decimal(decimal) => {
                 // Extract target precision and scale from Arrow schema
                 let (p, s) = match data_type {
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 22e893cb5d..efb445f3f4 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -646,6 +646,8 @@ mod table_test {
                     )
                     // Bytes type
                     .column("col_bytes", DataTypes::bytes())
+                    // Fixed-size binary type
+                    .column("col_binary", DataTypes::binary(4))
                     // Timestamp types with negative values (before Unix epoch)
                     .column(
                         "col_timestamp_us_neg",
@@ -713,6 +715,7 @@ mod table_test {
         let col_timestamp_ltz_us = TimestampLtz::from_millis_nanos(1769163227123, 456000).unwrap();
         let col_timestamp_ltz_ns = TimestampLtz::from_millis_nanos(1769163227123, 999_999).unwrap();
         let col_bytes: Vec<u8> = b"binary data".to_vec();
+        let col_binary: Vec<u8> = vec![0xDE, 0xAD, 0xBE, 0xEF];
 
         // 1960-06-15 08:30:45.123456 UTC (before 1970)
         let col_timestamp_us_neg = TimestampNtz::from_millis_nanos(-301234154877, 456000).unwrap();
@@ -749,10 +752,11 @@ mod table_test {
         row.set_field(21, col_timestamp_ltz_us.clone());
         row.set_field(22, col_timestamp_ltz_ns.clone());
         row.set_field(23, col_bytes.as_slice());
-        row.set_field(24, col_timestamp_us_neg.clone());
-        row.set_field(25, col_timestamp_ns_neg.clone());
-        row.set_field(26, col_timestamp_ltz_us_neg.clone());
-        row.set_field(27, col_timestamp_ltz_ns_neg.clone());
+        row.set_field(24, col_binary.as_slice());
+        row.set_field(25, col_timestamp_us_neg.clone());
+        row.set_field(26, col_timestamp_ns_neg.clone());
+        row.set_field(27, col_timestamp_ltz_us_neg.clone());
+        row.set_field(28, col_timestamp_ltz_ns_neg.clone());
 
         append_writer
             .append(&row)
@@ -910,9 +914,14 @@ mod table_test {
             "col_timestamp_ltz_ns nanos mismatch"
         );
         assert_eq!(found_row.get_bytes(23), col_bytes, "col_bytes mismatch");
+        assert_eq!(
+            found_row.get_binary(24, 4),
+            col_binary,
+            "col_binary mismatch"
+        );
 
         // Verify timestamps before Unix epoch (negative timestamps)
-        let read_ts_us_neg = found_row.get_timestamp_ntz(24, 6);
+        let read_ts_us_neg = found_row.get_timestamp_ntz(25, 6);
         assert_eq!(
             read_ts_us_neg.get_millisecond(),
             col_timestamp_us_neg.get_millisecond(),
@@ -924,7 +933,7 @@ mod table_test {
             "col_timestamp_us_neg nanos mismatch"
         );
 
-        let read_ts_ns_neg = found_row.get_timestamp_ntz(25, 9);
+        let read_ts_ns_neg = found_row.get_timestamp_ntz(26, 9);
         assert_eq!(
             read_ts_ns_neg.get_millisecond(),
             col_timestamp_ns_neg.get_millisecond(),
@@ -936,7 +945,7 @@ mod table_test {
             "col_timestamp_ns_neg nanos mismatch"
         );
 
-        let read_ts_ltz_us_neg = found_row.get_timestamp_ltz(26, 6);
+        let read_ts_ltz_us_neg = found_row.get_timestamp_ltz(27, 6);
         assert_eq!(
             read_ts_ltz_us_neg.get_epoch_millisecond(),
             col_timestamp_ltz_us_neg.get_epoch_millisecond(),
@@ -948,7 +957,7 @@ mod table_test {
             "col_timestamp_ltz_us_neg nanos mismatch"
         );
 
-        let read_ts_ltz_ns_neg = found_row.get_timestamp_ltz(27, 9);
+        let read_ts_ltz_ns_neg = found_row.get_timestamp_ltz(28, 9);
         assert_eq!(
             read_ts_ltz_ns_neg.get_epoch_millisecond(),
             col_timestamp_ltz_ns_neg.get_epoch_millisecond(),

From 80d903f0b6c99ec86692555ea30de0cb47803d56 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sat, 14 Feb 2026 00:09:06 +0000
Subject: [PATCH 143/287] chore: remove LATEST_OFFSET which isn't handled by
 server (#312)

---
 fluss-rust/bindings/cpp/include/fluss.hpp              | 1 -
 fluss-rust/bindings/python/fluss/__init__.pyi          | 2 --
 fluss-rust/bindings/python/src/lib.rs                  | 1 -
 fluss-rust/crates/fluss/src/client/table/mod.rs        | 1 -
 fluss-rust/crates/fluss/tests/integration/log_table.rs | 6 +++---
 5 files changed, 3 insertions(+), 8 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 926fbc66a2..dd298823a4 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -304,7 +304,6 @@ enum class DatumType {
 };
 
 constexpr int64_t EARLIEST_OFFSET = -2;
-constexpr int64_t LATEST_OFFSET = -1;
 
 enum class OffsetSpec {
     Earliest = 0,
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index dff90c38f8..daccca8512 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -848,7 +848,5 @@ class OffsetType:
 
 # Constant for earliest offset (-2)
 EARLIEST_OFFSET: int
-# Constant for latest offset (-1)
-LATEST_OFFSET: int
 
 __version__: str
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 41d516e5b4..801db2c87b 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -99,7 +99,6 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
 
     // Register constants
     m.add("EARLIEST_OFFSET", fcore::client::EARLIEST_OFFSET)?;
-    m.add("LATEST_OFFSET", fcore::client::LATEST_OFFSET)?;
 
     // Register exception types and error codes
     m.add_class::<FlussError>()?;
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 4e5b5d1359..4c3dfe2ddc 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -22,7 +22,6 @@ use crate::metadata::{TableInfo, TablePath};
 use std::sync::Arc;
 
 pub const EARLIEST_OFFSET: i64 = -2;
-pub const LATEST_OFFSET: i64 = -1;
 
 mod append;
 mod lookup;
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index efb445f3f4..76420676c0 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -38,7 +38,7 @@ mod table_test {
         create_partitions, create_table, get_cluster, start_cluster, stop_cluster,
     };
     use arrow::array::record_batch;
-    use fluss::client::{FlussTable, TableScan};
+    use fluss::client::{EARLIEST_OFFSET, FlussTable, TableScan};
     use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
     use fluss::record::ScanRecord;
     use fluss::row::InternalRow;
@@ -122,9 +122,9 @@ mod table_test {
             .expect("Failed to create log scanner");
         for bucket_id in 0..num_buckets {
             log_scanner
-                .subscribe(bucket_id, 0)
+                .subscribe(bucket_id, EARLIEST_OFFSET)
                 .await
-                .expect("Failed to subscribe");
+                .expect("Failed to subscribe with EARLIEST_OFFSET");
         }
 
         // Poll for records

From 815596db9b511e031bf2e4bfb67adeafaf883a9a Mon Sep 17 00:00:00 2001
From: Junfan Zhang <junfan.zhang@outlook.com>
Date: Sat, 14 Feb 2026 08:09:30 +0800
Subject: [PATCH 144/287] chore: allow propagating hostname as raw bootstrap
 address (#307)

---
 .../crates/fluss/src/client/metadata.rs       | 61 ++++++++++++++++---
 1 file changed, 54 insertions(+), 7 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index ce00ced2b5..3d8e77b2eb 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -24,7 +24,7 @@ use crate::rpc::{RpcClient, ServerConnection};
 use log::info;
 use parking_lot::RwLock;
 use std::collections::HashSet;
-use std::net::SocketAddr;
+use std::net::{SocketAddr, ToSocketAddrs};
 use std::sync::Arc;
 
 #[derive(Default)]
@@ -44,13 +44,33 @@ impl Metadata {
         })
     }
 
+    fn parse_bootstrap(boot_strap: &str) -> Result<SocketAddr> {
+        // Resolve all socket addresses and deterministically choose one.
+        let addrs = boot_strap
+            .to_socket_addrs()
+            .map_err(|e| Error::IllegalArgument {
+                message: format!("Invalid bootstrap address '{boot_strap}': {e}"),
+            })?;
+
+        // Prefer IPv4 addresses; if none are available, fall back to the first IPv6.
+        let mut ipv6_candidate: Option<SocketAddr> = None;
+        for addr in addrs {
+            if addr.is_ipv4() {
+                return Ok(addr);
+            }
+            if ipv6_candidate.is_none() {
+                ipv6_candidate = Some(addr);
+            }
+        }
+
+        let addr = ipv6_candidate.ok_or_else(|| Error::IllegalArgument {
+            message: format!("Unable to resolve bootstrap address '{boot_strap}'"),
+        })?;
+        Ok(addr)
+    }
+
     async fn init_cluster(boot_strap: &str, connections: Arc<RpcClient>) -> Result<Cluster> {
-        let socket_address =
-            boot_strap
-                .parse::<SocketAddr>()
-                .map_err(|e| Error::IllegalArgument {
-                    message: format!("Invalid bootstrap address '{boot_strap}': {e}"),
-                })?;
+        let socket_address = Self::parse_bootstrap(boot_strap)?;
         let server_node = ServerNode::new(
             -1,
             socket_address.ip().to_string(),
@@ -273,4 +293,31 @@ mod tests {
         let cluster = metadata.get_cluster();
         assert!(cluster.get_tablet_server(1).is_none());
     }
+
+    #[test]
+    fn parse_bootstrap_variants() {
+        // valid IP
+        let addr = Metadata::parse_bootstrap("127.0.0.1:8080").unwrap();
+        assert_eq!(addr.port(), 8080);
+
+        // valid hostname
+        let addr = Metadata::parse_bootstrap("localhost:9090").unwrap();
+        assert_eq!(addr.port(), 9090);
+
+        // valid IPv6 address
+        let addr = Metadata::parse_bootstrap("[::1]:8080").unwrap();
+        assert_eq!(addr.port(), 8080);
+
+        // invalid input: missing port
+        assert!(Metadata::parse_bootstrap("localhost").is_err());
+
+        // invalid input: out-of-range port
+        assert!(Metadata::parse_bootstrap("localhost:99999").is_err());
+
+        // invalid input: empty string
+        assert!(Metadata::parse_bootstrap("").is_err());
+
+        // invalid input: nonsensical address
+        assert!(Metadata::parse_bootstrap("invalid_address").is_err());
+    }
 }

From bf20af924c2613b04edc5e57563b2e97ee4bfe8d Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sun, 15 Feb 2026 01:01:44 +0000
Subject: [PATCH 145/287] [docs] introduce client doc website (#300)

---
 .../.github/workflows/release_python.yml      |   6 +
 fluss-rust/.gitignore                         |  21 +-
 fluss-rust/.licenserc.yaml                    |   3 +-
 fluss-rust/DEVELOPMENT.md                     |  18 -
 fluss-rust/README.md                          |  18 -
 fluss-rust/bindings/cpp/README.md             |  18 -
 fluss-rust/bindings/python/API_REFERENCE.md   | 305 -------
 fluss-rust/bindings/python/DEVELOPMENT.md     |  19 -
 fluss-rust/bindings/python/README.md          | 434 +---------
 fluss-rust/bindings/python/generate_readme.py | 104 +++
 fluss-rust/bindings/python/pyproject.toml     |   2 +-
 fluss-rust/crates/fluss/README.md             |  18 -
 fluss-rust/docs/creating-a-release.md         |  18 -
 fluss-rust/docs/generate-release-note.md      |  18 -
 fluss-rust/docs/rust-client.md                | 755 ------------------
 .../docs/verifying-a-release-candidate.md     |  18 -
 fluss-rust/justfile                           |   4 +
 fluss-rust/website/babel.config.js            |   3 +
 .../docs/developer-guide/_category_.json      |   4 +
 .../docs/developer-guide/contributing.md      | 126 +++
 fluss-rust/website/docs/index.md              |  45 ++
 .../website/docs/user-guide/_category_.json   |   4 +
 .../docs/user-guide/cpp/_category_.json       |   4 +
 .../docs/user-guide/cpp/api-reference.md      | 495 ++++++++++++
 .../website/docs/user-guide/cpp/data-types.md | 110 +++
 .../docs/user-guide/cpp/error-handling.md     | 170 ++++
 .../user-guide/cpp/example/_category_.json    |   4 +
 .../cpp/example/admin-operations.md           | 154 ++++
 .../user-guide/cpp/example/configuration.md   |  35 +
 .../docs/user-guide/cpp/example/index.md      |  63 ++
 .../docs/user-guide/cpp/example/log-tables.md | 121 +++
 .../cpp/example/partitioned-tables.md         | 180 +++++
 .../cpp/example/primary-key-tables.md         | 133 +++
 .../docs/user-guide/cpp/installation.md       | 107 +++
 .../docs/user-guide/python/_category_.json    |   4 +
 .../docs/user-guide/python/api-reference.md   | 286 +++++++
 .../docs/user-guide/python/data-types.md      |  66 ++
 .../docs/user-guide/python/error-handling.md  | 109 +++
 .../user-guide/python/example/_category_.json |   4 +
 .../python/example/admin-operations.md        |  77 ++
 .../python/example/configuration.md           |  36 +
 .../docs/user-guide/python/example/index.md   |  46 ++
 .../user-guide/python/example/log-tables.md   | 122 +++
 .../python/example/partitioned-tables.md      | 104 +++
 .../python/example/primary-key-tables.md      |  61 ++
 .../docs/user-guide/python/installation.md    |  41 +
 .../docs/user-guide/rust/_category_.json      |   4 +
 .../docs/user-guide/rust/api-reference.md     | 443 ++++++++++
 .../docs/user-guide/rust/data-types.md        |  80 ++
 .../docs/user-guide/rust/error-handling.md    | 180 +++++
 .../user-guide/rust/example/_category_.json   |   4 +
 .../rust/example/admin-operations.md          | 118 +++
 .../user-guide/rust/example/configuration.md  |  26 +
 .../docs/user-guide/rust/example/index.md     |  56 ++
 .../user-guide/rust/example/log-tables.md     | 140 ++++
 .../rust/example/partitioned-tables.md        | 215 +++++
 .../rust/example/primary-key-tables.md        | 114 +++
 .../docs/user-guide/rust/installation.md      |  76 ++
 fluss-rust/website/docusaurus.config.ts       |  84 ++
 fluss-rust/website/package.json               |  43 +
 fluss-rust/website/sidebars.ts                |  24 +
 fluss-rust/website/src/css/custom.css         | 209 +++++
 .../website/static/img/logo/fluss_favicon.svg |  19 +
 .../static/img/logo/png/colored_logo.png      | Bin 0 -> 45184 bytes
 .../static/img/logo/svg/colored_logo.svg      |  19 +
 fluss-rust/website/tsconfig.json              |   6 +
 66 files changed, 4712 insertions(+), 1641 deletions(-)
 delete mode 100644 fluss-rust/bindings/python/API_REFERENCE.md
 create mode 100644 fluss-rust/bindings/python/generate_readme.py
 create mode 100644 fluss-rust/website/babel.config.js
 create mode 100644 fluss-rust/website/docs/developer-guide/_category_.json
 create mode 100644 fluss-rust/website/docs/developer-guide/contributing.md
 create mode 100644 fluss-rust/website/docs/index.md
 create mode 100644 fluss-rust/website/docs/user-guide/_category_.json
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/_category_.json
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/api-reference.md
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/data-types.md
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/error-handling.md
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/example/_category_.json
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/example/configuration.md
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/example/index.md
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/example/log-tables.md
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/example/primary-key-tables.md
 create mode 100644 fluss-rust/website/docs/user-guide/cpp/installation.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/_category_.json
 create mode 100644 fluss-rust/website/docs/user-guide/python/api-reference.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/data-types.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/error-handling.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/example/_category_.json
 create mode 100644 fluss-rust/website/docs/user-guide/python/example/admin-operations.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/example/configuration.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/example/index.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/example/log-tables.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/example/partitioned-tables.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/example/primary-key-tables.md
 create mode 100644 fluss-rust/website/docs/user-guide/python/installation.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/_category_.json
 create mode 100644 fluss-rust/website/docs/user-guide/rust/api-reference.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/data-types.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/error-handling.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/example/_category_.json
 create mode 100644 fluss-rust/website/docs/user-guide/rust/example/admin-operations.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/example/configuration.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/example/index.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/example/log-tables.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
 create mode 100644 fluss-rust/website/docs/user-guide/rust/installation.md
 create mode 100644 fluss-rust/website/docusaurus.config.ts
 create mode 100644 fluss-rust/website/package.json
 create mode 100644 fluss-rust/website/sidebars.ts
 create mode 100644 fluss-rust/website/src/css/custom.css
 create mode 100644 fluss-rust/website/static/img/logo/fluss_favicon.svg
 create mode 100644 fluss-rust/website/static/img/logo/png/colored_logo.png
 create mode 100644 fluss-rust/website/static/img/logo/svg/colored_logo.svg
 create mode 100644 fluss-rust/website/tsconfig.json

diff --git a/fluss-rust/.github/workflows/release_python.yml b/fluss-rust/.github/workflows/release_python.yml
index 59c8f8c91e..d7bd04ccb7 100644
--- a/fluss-rust/.github/workflows/release_python.yml
+++ b/fluss-rust/.github/workflows/release_python.yml
@@ -49,6 +49,9 @@ jobs:
     steps:
       - uses: actions/checkout@v4
 
+      - name: Generate Python README
+        run: python3 bindings/python/generate_readme.py
+
       - name: Install protoc
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
 
@@ -78,6 +81,9 @@ jobs:
     steps:
       - uses: actions/checkout@v4
 
+      - name: Generate Python README
+        run: python3 bindings/python/generate_readme.py
+
       - name: Install protoc (Linux)
         if: runner.os == 'Linux'
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
diff --git a/fluss-rust/.gitignore b/fluss-rust/.gitignore
index 9c585d8632..476f84e979 100644
--- a/fluss-rust/.gitignore
+++ b/fluss-rust/.gitignore
@@ -20,6 +20,7 @@ Cargo.lock
 .vscode/
 
 # Python
+bindings/python/GENERATED_README.md
 __pycache__/
 *.py[cod]
 *$py.class
@@ -29,4 +30,22 @@ dist/
 build/
 
 # CPP
-*CMakeFiles/
\ No newline at end of file
+*CMakeFiles/
+
+# Website (Docusaurus)
+website/node_modules
+website/build
+website/.docusaurus
+website/.cache-loader
+website/.env.local
+website/.env.development.local
+website/.env.test.local
+website/.env.production.local
+website/npm-debug.log*
+website/yarn-debug.log*
+website/yarn-error.log*
+website/package-lock.json
+website/versioned_docs
+website/versioned_sidebars
+website/versions.json
+website/pnpm-lock.yaml
diff --git a/fluss-rust/.licenserc.yaml b/fluss-rust/.licenserc.yaml
index a3cfcd146b..d323856373 100644
--- a/fluss-rust/.licenserc.yaml
+++ b/fluss-rust/.licenserc.yaml
@@ -21,10 +21,11 @@ header:
     copyright-owner: Apache Software Foundation
 
   paths-ignore:
-    - '.github/PULL_REQUEST_TEMPLATE.md'
     - '.gitignore'
     - 'LICENSE'
     - 'NOTICE'
     - 'DISCLAIMER'
     - 'bindings/python/fluss/py.typed'
+    - 'website/**'
+    - '**/*.md'
   comment: on-failure
diff --git a/fluss-rust/DEVELOPMENT.md b/fluss-rust/DEVELOPMENT.md
index a0669a755e..a1180d6f6c 100644
--- a/fluss-rust/DEVELOPMENT.md
+++ b/fluss-rust/DEVELOPMENT.md
@@ -1,21 +1,3 @@
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-
 # Development Guide
 
 Welcome to the development guide of `fluss-rust`! This project builds `fluss-rust` client and language specific bindings.  
diff --git a/fluss-rust/README.md b/fluss-rust/README.md
index a42c0f360e..dafe19c880 100644
--- a/fluss-rust/README.md
+++ b/fluss-rust/README.md
@@ -1,21 +1,3 @@
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-
 # Apache Fluss™ Rust (Incubating)
 
 ![Experimental](https://img.shields.io/badge/status-experimental-orange)
diff --git a/fluss-rust/bindings/cpp/README.md b/fluss-rust/bindings/cpp/README.md
index 2556a4b6c8..539e313024 100644
--- a/fluss-rust/bindings/cpp/README.md
+++ b/fluss-rust/bindings/cpp/README.md
@@ -1,21 +1,3 @@
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-
 # Apache Fluss™ C++ Bindings (Incubating)
 
 C++ bindings for Fluss, built on top of the [fluss-rust](../../crates/fluss) client. The API is exposed via a C++ header ([include/fluss.hpp](include/fluss.hpp)) and implemented with Rust FFI.
diff --git a/fluss-rust/bindings/python/API_REFERENCE.md b/fluss-rust/bindings/python/API_REFERENCE.md
deleted file mode 100644
index 3749ee1d87..0000000000
--- a/fluss-rust/bindings/python/API_REFERENCE.md
+++ /dev/null
@@ -1,305 +0,0 @@
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-
-# Python API Reference
-
-Complete API reference for the Fluss Python client. For a usage guide with examples, see the [Python Client Guide](README.md).
-
-## `Config`
-
-| Method / Property | Description |
-|---|---|
-| `Config(properties: dict = None)` | Create config from a dict of key-value pairs |
-| `.bootstrap_servers` | Get/set coordinator server address |
-| `.writer_request_max_size` | Get/set max request size in bytes |
-| `.writer_batch_size` | Get/set write batch size in bytes |
-
-## `FlussConnection`
-
-| Method | Description |
-|---|---|
-| `await FlussConnection.create(config) -> FlussConnection` | Connect to a Fluss cluster |
-| `await conn.get_admin() -> FlussAdmin` | Get admin interface |
-| `await conn.get_table(table_path) -> FlussTable` | Get a table for read/write operations |
-| `conn.close()` | Close the connection |
-
-Supports `with` statement (context manager).
-
-## `FlussAdmin`
-
-| Method | Description |
-|---|---|
-| `await create_database(name, database_descriptor=None, ignore_if_exists=False)` | Create a database |
-| `await drop_database(name, ignore_if_not_exists=False, cascade=True)` | Drop a database |
-| `await list_databases() -> list[str]` | List all databases |
-| `await database_exists(name) -> bool` | Check if a database exists |
-| `await get_database_info(name) -> DatabaseInfo` | Get database metadata |
-| `await create_table(table_path, table_descriptor, ignore_if_exists=False)` | Create a table |
-| `await drop_table(table_path, ignore_if_not_exists=False)` | Drop a table |
-| `await get_table_info(table_path) -> TableInfo` | Get table metadata |
-| `await list_tables(database_name) -> list[str]` | List tables in a database |
-| `await table_exists(table_path) -> bool` | Check if a table exists |
-| `await list_offsets(table_path, bucket_ids, offset_type, timestamp=None) -> dict[int, int]` | Get offsets for buckets |
-| `await list_partition_offsets(table_path, partition_name, bucket_ids, offset_type, timestamp=None) -> dict[int, int]` | Get offsets for a partition's buckets |
-| `await create_partition(table_path, partition_spec, ignore_if_exists=False)` | Create a partition |
-| `await drop_partition(table_path, partition_spec, ignore_if_not_exists=False)` | Drop a partition |
-| `await list_partition_infos(table_path) -> list[PartitionInfo]` | List partitions |
-| `await get_latest_lake_snapshot(table_path) -> LakeSnapshot` | Get latest lake snapshot |
-
-## `FlussTable`
-
-| Method | Description |
-|---|---|
-| `new_scan() -> TableScan` | Create a scan builder |
-| `new_append() -> TableAppend` | Create an append builder for log tables |
-| `new_upsert() -> TableUpsert` | Create an upsert builder for PK tables |
-| `new_lookup() -> TableLookup` | Create a lookup builder for PK tables |
-| `get_table_info() -> TableInfo` | Get table metadata |
-| `get_table_path() -> TablePath` | Get table path |
-| `has_primary_key() -> bool` | Check if table has a primary key |
-
-## `TableScan`
-
-| Method | Description |
-|---|---|
-| `.project(indices) -> TableScan` | Project columns by index |
-| `.project_by_name(names) -> TableScan` | Project columns by name |
-| `await .create_log_scanner() -> LogScanner` | Create record-based scanner (for `poll()`) |
-| `await .create_record_batch_log_scanner() -> LogScanner` | Create batch-based scanner (for `poll_arrow()`, `to_arrow()`, etc.) |
-
-## `TableAppend`
-
-Builder for creating an `AppendWriter`. Obtain via `FlussTable.new_append()`.
-
-| Method | Description |
-|---|---|
-| `.create_writer() -> AppendWriter` | Create the append writer |
-
-## `TableUpsert`
-
-Builder for creating an `UpsertWriter`. Obtain via `FlussTable.new_upsert()`.
-
-| Method | Description |
-|---|---|
-| `.partial_update_by_name(columns) -> TableUpsert` | Configure partial update by column names |
-| `.partial_update_by_index(indices) -> TableUpsert` | Configure partial update by column indices |
-| `.create_writer() -> UpsertWriter` | Create the upsert writer |
-
-## `TableLookup`
-
-Builder for creating a `Lookuper`. Obtain via `FlussTable.new_lookup()`.
-
-| Method | Description |
-|---|---|
-| `.create_lookuper() -> Lookuper` | Create the lookuper |
-
-## `AppendWriter`
-
-| Method | Description |
-|---|---|
-| `.append(row) -> WriteResultHandle` | Append a row (dict, list, or tuple) |
-| `.write_arrow(table)` | Write a PyArrow Table |
-| `.write_arrow_batch(batch) -> WriteResultHandle` | Write a PyArrow RecordBatch |
-| `.write_pandas(df)` | Write a Pandas DataFrame |
-| `await .flush()` | Flush all pending writes |
-
-## `UpsertWriter`
-
-| Method | Description |
-|---|---|
-| `.upsert(row) -> WriteResultHandle` | Upsert a row (insert or update by PK) |
-| `.delete(pk) -> WriteResultHandle` | Delete a row by primary key |
-| `await .flush()` | Flush all pending operations |
-
-## `WriteResultHandle`
-
-| Method | Description |
-|---|---|
-| `await .wait()` | Wait for server acknowledgment of this write |
-
-## `Lookuper`
-
-| Method | Description |
-|---|---|
-| `await .lookup(pk) -> dict \| None` | Lookup a row by primary key |
-
-## `LogScanner`
-
-| Method | Description |
-|---|---|
-| `.subscribe(bucket_id, start_offset)` | Subscribe to a bucket |
-| `.subscribe_buckets(bucket_offsets)` | Subscribe to multiple buckets (`{bucket_id: offset}`) |
-| `.subscribe_partition(partition_id, bucket_id, start_offset)` | Subscribe to a partition bucket |
-| `.subscribe_partition_buckets(partition_bucket_offsets)` | Subscribe to multiple partition+bucket combos (`{(part_id, bucket_id): offset}`) |
-| `.unsubscribe(bucket_id)` | Unsubscribe from a bucket (non-partitioned tables) |
-| `.unsubscribe_partition(partition_id, bucket_id)` | Unsubscribe from a partition bucket |
-| `.poll(timeout_ms) -> list[ScanRecord]` | Poll individual records (record scanner only) |
-| `.poll_arrow(timeout_ms) -> pa.Table` | Poll as Arrow Table (batch scanner only) |
-| `.poll_record_batch(timeout_ms) -> list[RecordBatch]` | Poll batches with metadata (batch scanner only) |
-| `.to_arrow() -> pa.Table` | Read all subscribed data as Arrow Table (batch scanner only) |
-| `.to_pandas() -> pd.DataFrame` | Read all subscribed data as DataFrame (batch scanner only) |
-
-## `ScanRecord`
-
-| Property | Description |
-|---|---|
-| `.bucket -> TableBucket` | Bucket this record belongs to |
-| `.offset -> int` | Record offset in the log |
-| `.timestamp -> int` | Record timestamp |
-| `.change_type -> ChangeType` | Change type (AppendOnly, Insert, UpdateBefore, UpdateAfter, Delete) |
-| `.row -> dict` | Row data as `{column_name: value}` |
-
-## `RecordBatch`
-
-| Property | Description |
-|---|---|
-| `.batch -> pa.RecordBatch` | Arrow RecordBatch data |
-| `.bucket -> TableBucket` | Bucket this batch belongs to |
-| `.base_offset -> int` | First record offset |
-| `.last_offset -> int` | Last record offset |
-
-## `Schema`
-
-| Method | Description |
-|---|---|
-| `Schema(schema: pa.Schema, primary_keys=None)` | Create from PyArrow schema |
-| `.get_column_names() -> list[str]` | Get column names |
-| `.get_column_types() -> list[str]` | Get column type names |
-
-## `TableDescriptor`
-
-| Method | Description |
-|---|---|
-| `TableDescriptor(schema, *, partition_keys=None, bucket_count=None, bucket_keys=None, comment=None, log_format=None, kv_format=None, properties=None, custom_properties=None)` | Create table descriptor |
-| `.get_schema() -> Schema` | Get the schema |
-
-## `TablePath`
-
-| Method / Property | Description |
-|---|---|
-| `TablePath(database, table)` | Create a table path |
-| `.database_name -> str` | Database name |
-| `.table_name -> str` | Table name |
-
-## `TableInfo`
-
-| Property / Method | Description |
-|---|---|
-| `.table_id -> int` | Table ID |
-| `.table_path -> TablePath` | Table path |
-| `.num_buckets -> int` | Number of buckets |
-| `.schema_id -> int` | Schema ID |
-| `.comment -> str \| None` | Table comment |
-| `.created_time -> int` | Creation timestamp |
-| `.modified_time -> int` | Last modification timestamp |
-| `.get_primary_keys() -> list[str]` | Primary key columns |
-| `.get_partition_keys() -> list[str]` | Partition columns |
-| `.get_bucket_keys() -> list[str]` | Bucket key columns |
-| `.has_primary_key() -> bool` | Has primary key? |
-| `.is_partitioned() -> bool` | Is partitioned? |
-| `.get_schema() -> Schema` | Get table schema |
-| `.get_column_names() -> list[str]` | Column names |
-| `.get_column_count() -> int` | Number of columns |
-| `.get_properties() -> dict` | All table properties |
-| `.get_custom_properties() -> dict` | Custom properties only |
-
-## `PartitionInfo`
-
-| Property | Description |
-|---|---|
-| `.partition_id -> int` | Partition ID |
-| `.partition_name -> str` | Partition name |
-
-## `DatabaseDescriptor`
-
-| Method / Property | Description |
-|---|---|
-| `DatabaseDescriptor(comment=None, custom_properties=None)` | Create descriptor |
-| `.comment -> str \| None` | Database comment |
-| `.get_custom_properties() -> dict` | Custom properties |
-
-## `DatabaseInfo`
-
-| Property / Method | Description |
-|---|---|
-| `.database_name -> str` | Database name |
-| `.created_time -> int` | Creation timestamp |
-| `.modified_time -> int` | Last modification timestamp |
-| `.get_database_descriptor() -> DatabaseDescriptor` | Get descriptor |
-
-## `LakeSnapshot`
-
-| Property / Method | Description |
-|---|---|
-| `.snapshot_id -> int` | Snapshot ID |
-| `.table_buckets_offset -> dict[TableBucket, int]` | All bucket offsets |
-| `.get_bucket_offset(bucket) -> int \| None` | Get offset for a bucket |
-| `.get_table_buckets() -> list[TableBucket]` | Get all buckets |
-
-## `TableBucket`
-
-| Method / Property | Description |
-|---|---|
-| `TableBucket(table_id, bucket)` | Create non-partitioned bucket |
-| `TableBucket.with_partition(table_id, partition_id, bucket)` | Create partitioned bucket |
-| `.table_id -> int` | Table ID |
-| `.bucket_id -> int` | Bucket ID |
-| `.partition_id -> int \| None` | Partition ID (None if non-partitioned) |
-
-## `FlussError`
-
-| Property | Description |
-|---|---|
-| `.message -> str` | Error message |
-
-Raised for all Fluss-specific errors (connection failures, table not found, schema mismatches, etc.). Inherits from `Exception`.
-
-## Constants
-
-| Constant | Value | Description |
-|---|---|---|
-| `fluss.EARLIEST_OFFSET` | `-2` | Start reading from earliest available offset |
-| `fluss.LATEST_OFFSET` | `-1` | Start reading from latest offset (only new records) |
-| `fluss.OffsetType.EARLIEST` | `"earliest"` | For `list_offsets()` |
-| `fluss.OffsetType.LATEST` | `"latest"` | For `list_offsets()` |
-| `fluss.OffsetType.TIMESTAMP` | `"timestamp"` | For `list_offsets()` with timestamp |
-
-## `ChangeType`
-
-| Value | Short String | Description |
-|---|---|---|
-| `ChangeType.AppendOnly` (0) | `+A` | Append-only |
-| `ChangeType.Insert` (1) | `+I` | Insert |
-| `ChangeType.UpdateBefore` (2) | `-U` | Previous value of updated row |
-| `ChangeType.UpdateAfter` (3) | `+U` | New value of updated row |
-| `ChangeType.Delete` (4) | `-D` | Delete |
-
-## Data Types
-
-| PyArrow Type | Fluss Type | Python Type |
-|---|---|---|
-| `pa.boolean()` | Boolean | `bool` |
-| `pa.int8()` / `int16()` / `int32()` / `int64()` | TinyInt / SmallInt / Int / BigInt | `int` |
-| `pa.float32()` / `float64()` | Float / Double | `float` |
-| `pa.string()` | String | `str` |
-| `pa.binary()` | Bytes | `bytes` |
-| `pa.date32()` | Date | `datetime.date` |
-| `pa.time32("ms")` | Time | `datetime.time` |
-| `pa.timestamp("us")` | Timestamp (NTZ) | `datetime.datetime` |
-| `pa.timestamp("us", tz="UTC")` | TimestampLTZ | `datetime.datetime` |
-| `pa.decimal128(precision, scale)` | Decimal | `decimal.Decimal` |
diff --git a/fluss-rust/bindings/python/DEVELOPMENT.md b/fluss-rust/bindings/python/DEVELOPMENT.md
index e316f5e8e6..cccd0d1ee6 100644
--- a/fluss-rust/bindings/python/DEVELOPMENT.md
+++ b/fluss-rust/bindings/python/DEVELOPMENT.md
@@ -1,22 +1,3 @@
-<!--
-  ~ Licensed to the Apache Software Foundation (ASF) under one
-  ~ or more contributor license agreements.  See the NOTICE file
-  ~ distributed with this work for additional information
-  ~ regarding copyright ownership.  The ASF licenses this file
-  ~ to you under the Apache License, Version 2.0 (the
-  ~ "License"); you may not use this file except in compliance
-  ~ with the License.  You may obtain a copy of the License at
-  ~
-  ~   http://www.apache.org/licenses/LICENSE-2.0
-  ~
-  ~ Unless required by applicable law or agreed to in writing,
-  ~ software distributed under the License is distributed on an
-  ~ "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-  ~ KIND, either express or implied.  See the License for the
-  ~ specific language governing permissions and limitations
-  ~ under the License.
--->
-
 # Development
 
 ## Requirements
diff --git a/fluss-rust/bindings/python/README.md b/fluss-rust/bindings/python/README.md
index 20c5f5522a..54a167bc56 100644
--- a/fluss-rust/bindings/python/README.md
+++ b/fluss-rust/bindings/python/README.md
@@ -18,436 +18,4 @@
 
 # Fluss Python Client
 
-This guide covers how to use the Fluss Python client for reading and writing data to log tables and primary key tables.
-
-The Python client is async-first, built on top of the Rust core via [PyO3](https://pyo3.rs/), and uses [PyArrow](https://arrow.apache.org/docs/python/) for schema definitions and data interchange.
-
-## Key Concepts
-
-- **Log table** — an append-only table (no primary key). Records are immutable once written. Use for event streams, logs, and audit trails.
-- **Primary key (PK) table** — a table with a primary key. Supports upsert, delete, and point lookups.
-- **Bucket** — the unit of parallelism within a table (similar to Kafka partitions). Each table has one or more buckets. Readers subscribe to individual buckets.
-- **Partition** — a way to organize data by column values (e.g. by date or region). Each partition contains its own set of buckets. Partitions must be created explicitly before writing.
-- **Offset** — the position of a record within a bucket. Used to track reading progress. Start from `EARLIEST_OFFSET` to read all data, or `LATEST_OFFSET` to only read new records.
-
-## Prerequisites
-
-You need a running Fluss cluster to use the Python client. See the [Quick-Start guide](../../README.md#quick-start) for how to start a local cluster.
-
-## Installation
-
-```bash
-pip install pyfluss
-```
-
-To build from source instead, see the [Development Guide](DEVELOPMENT.md).
-
-## Quick Start
-
-A minimal end-to-end example: connect, create a table, write data, and read it back. Assumes a Fluss cluster is running on `localhost:9123`.
-
-```python
-import asyncio
-import pyarrow as pa
-import fluss
-
-async def main():
-    # Connect
-    config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
-    conn = await fluss.FlussConnection.create(config)
-    admin = await conn.get_admin()
-
-    # Create a log table
-    schema = fluss.Schema(pa.schema([
-        pa.field("id", pa.int32()),
-        pa.field("name", pa.string()),
-        pa.field("score", pa.float32()),
-    ]))
-    table_path = fluss.TablePath("fluss", "quick_start")
-    await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
-
-    # Write
-    table = await conn.get_table(table_path)
-    writer = table.new_append().create_writer()
-    writer.append({"id": 1, "name": "Alice", "score": 95.5})
-    writer.append({"id": 2, "name": "Bob", "score": 87.0})
-    await writer.flush()
-
-    # Read
-    num_buckets = (await admin.get_table_info(table_path)).num_buckets
-    scanner = await table.new_scan().create_record_batch_log_scanner()
-    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
-    print(scanner.to_pandas())
-
-    # Cleanup
-    await admin.drop_table(table_path, ignore_if_not_exists=True)
-    conn.close()
-
-asyncio.run(main())
-```
-
-## Connection Setup
-
-```python
-config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
-conn = await fluss.FlussConnection.create(config)
-```
-
-The connection also supports context managers:
-
-```python
-with await fluss.FlussConnection.create(config) as conn:
-    ...
-```
-
-### Configuration Options
-
-| Key | Description | Default |
-|-----|-------------|---------|
-| `bootstrap.servers` | Coordinator server address | `127.0.0.1:9123` |
-| `request.max.size` | Maximum request size in bytes | `10485760` (10 MB) |
-| `writer.acks` | Acknowledgment setting (`all` waits for all replicas) | `all` |
-| `writer.retries` | Number of retries on failure | `2147483647` |
-| `writer.batch.size` | Batch size for writes in bytes | `2097152` (2 MB) |
-
-## Admin Operations
-
-```python
-admin = await conn.get_admin()
-```
-
-### Databases
-
-```python
-await admin.create_database("my_database", ignore_if_exists=True)
-databases = await admin.list_databases()
-exists = await admin.database_exists("my_database")
-await admin.drop_database("my_database", ignore_if_not_exists=True, cascade=True)
-```
-
-### Tables
-
-Schemas are defined using PyArrow and wrapped in `fluss.Schema`:
-
-```python
-import pyarrow as pa
-
-schema = fluss.Schema(pa.schema([
-    pa.field("id", pa.int32()),
-    pa.field("name", pa.string()),
-    pa.field("amount", pa.int64()),
-]))
-
-table_path = fluss.TablePath("my_database", "my_table")
-await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
-
-table_info = await admin.get_table_info(table_path)
-tables = await admin.list_tables("my_database")
-await admin.drop_table(table_path, ignore_if_not_exists=True)
-```
-
-`TableDescriptor` accepts these optional parameters:
-
-| Parameter | Description |
-|---|---|
-| `partition_keys` | Column names to partition by (e.g. `["region"]`) |
-| `bucket_count` | Number of buckets (parallelism units) for the table |
-| `bucket_keys` | Columns used to determine bucket assignment |
-| `comment` | Table comment / description |
-| `log_format` | Log storage format: `"ARROW"` or `"INDEXED"` |
-| `kv_format` | KV storage format for primary key tables: `"INDEXED"` or `"COMPACTED"` |
-| `properties` | Table configuration properties as a dict (e.g. `{"table.replication.factor": "1"}`) |
-| `custom_properties` | User-defined properties as a dict |
-
-### Offsets
-
-```python
-# Latest offsets for buckets
-offsets = await admin.list_offsets(table_path, bucket_ids=[0, 1], offset_type="latest")
-
-# By timestamp
-offsets = await admin.list_offsets(table_path, bucket_ids=[0], offset_type="timestamp", timestamp=1704067200000)
-
-# Per-partition offsets
-offsets = await admin.list_partition_offsets(table_path, partition_name="US", bucket_ids=[0], offset_type="latest")
-```
-
-## Log Tables
-
-Log tables are append-only tables without primary keys, suitable for event streaming.
-
-### Writing
-
-Rows can be appended as dicts, lists, or tuples. For bulk writes, use `write_arrow()`, `write_arrow_batch()`, or `write_pandas()`.
-
-Write methods like `append()` and `write_arrow_batch()` return a `WriteResultHandle`. You can ignore it for fire-and-forget semantics (flush at the end), or `await handle.wait()` to block until the server acknowledges that specific write.
-
-```python
-table = await conn.get_table(table_path)
-writer = table.new_append().create_writer()
-
-# Fire-and-forget: queue writes, flush at the end
-writer.append({"id": 1, "name": "Alice", "score": 95.5})
-writer.append([2, "Bob", 87.0])
-await writer.flush()
-
-# Per-record acknowledgment
-handle = writer.append({"id": 3, "name": "Charlie", "score": 91.0})
-await handle.wait()
-
-# Bulk writes
-writer.write_arrow(pa_table)          # PyArrow Table
-writer.write_arrow_batch(record_batch) # PyArrow RecordBatch
-writer.write_pandas(df)                # Pandas DataFrame
-await writer.flush()
-```
-
-### Reading
-
-There are two scanner types:
-- **Batch scanner** (`create_record_batch_log_scanner()`) — returns Arrow Tables or DataFrames, best for analytics
-- **Record scanner** (`create_log_scanner()`) — returns individual records with metadata (offset, timestamp, change type), best for streaming
-
-And two reading modes:
-- **`to_arrow()` / `to_pandas()`** — reads all data from subscribed buckets up to the current latest offset, then returns. Best for one-shot batch reads.
-- **`poll_arrow()` / `poll()` / `poll_record_batch()`** — returns whatever data is available within the timeout, then returns. Call in a loop for continuous streaming.
-
-#### Batch Read (One-Shot)
-
-```python
-num_buckets = (await admin.get_table_info(table_path)).num_buckets
-
-scanner = await table.new_scan().create_record_batch_log_scanner()
-scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
-
-# Reads everything up to current latest offset, then returns
-arrow_table = scanner.to_arrow()
-df = scanner.to_pandas()
-```
-
-#### Continuous Polling
-
-Use `poll_arrow()` or `poll()` in a loop for streaming consumption:
-
-```python
-# Batch scanner: poll as Arrow Tables
-scanner = await table.new_scan().create_record_batch_log_scanner()
-scanner.subscribe(bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
-
-while True:
-    result = scanner.poll_arrow(timeout_ms=5000)
-    if result.num_rows > 0:
-        print(result.to_pandas())
-
-# Record scanner: poll individual records with metadata
-scanner = await table.new_scan().create_log_scanner()
-scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
-
-while True:
-    for record in scanner.poll(timeout_ms=5000):
-        print(f"offset={record.offset}, change={record.change_type.short_string()}, row={record.row}")
-```
-
-#### Subscribe from Latest Offset
-
-To only consume new records (skip existing data), use `LATEST_OFFSET`:
-
-```python
-scanner = await table.new_scan().create_record_batch_log_scanner()
-scanner.subscribe(bucket_id=0, start_offset=fluss.LATEST_OFFSET)
-```
-
-### Column Projection
-
-```python
-scanner = await table.new_scan().project([0, 2]).create_record_batch_log_scanner()
-# or by name
-scanner = await table.new_scan().project_by_name(["id", "score"]).create_record_batch_log_scanner()
-```
-
-## Primary Key Tables
-
-Primary key tables support upsert, delete, and point lookup operations.
-
-### Creating
-
-Pass `primary_keys` to `fluss.Schema`:
-
-```python
-schema = fluss.Schema(
-    pa.schema([
-        pa.field("id", pa.int32()),
-        pa.field("name", pa.string()),
-        pa.field("age", pa.int64()),
-    ]),
-    primary_keys=["id"],
-)
-table_path = fluss.TablePath("fluss", "users")
-await admin.create_table(table_path, fluss.TableDescriptor(schema, bucket_count=3), ignore_if_exists=True)
-```
-
-### Upsert, Delete, Lookup
-
-```python
-table = await conn.get_table(table_path)
-
-# Upsert (fire-and-forget, flush at the end)
-writer = table.new_upsert()
-writer.upsert({"id": 1, "name": "Alice", "age": 25})
-writer.upsert({"id": 2, "name": "Bob", "age": 30})
-await writer.flush()
-
-# Per-record acknowledgment (for read-after-write)
-handle = writer.upsert({"id": 3, "name": "Charlie", "age": 35})
-await handle.wait()
-
-# Delete by primary key
-handle = writer.delete({"id": 2})
-await handle.wait()
-
-# Lookup
-lookuper = table.new_lookup()
-result = await lookuper.lookup({"id": 1})
-if result:
-    print(f"Found: name={result['name']}, age={result['age']}")
-```
-
-### Partial Updates
-
-Update specific columns while preserving others:
-
-```python
-partial_writer = table.new_upsert(columns=["id", "age"])
-partial_writer.upsert({"id": 1, "age": 27})  # only updates age
-await partial_writer.flush()
-```
-
-## Partitioned Tables
-
-Partitioned tables distribute data across partitions based on column values. Partitions must be created before writing.
-
-### Creating and Managing Partitions
-
-```python
-schema = fluss.Schema(pa.schema([
-    pa.field("id", pa.int32()),
-    pa.field("region", pa.string()),
-    pa.field("value", pa.int64()),
-]))
-
-table_path = fluss.TablePath("fluss", "partitioned_events")
-await admin.create_table(
-    table_path,
-    fluss.TableDescriptor(schema, partition_keys=["region"], bucket_count=1),
-    ignore_if_exists=True,
-)
-
-# Create partitions
-await admin.create_partition(table_path, {"region": "US"}, ignore_if_exists=True)
-await admin.create_partition(table_path, {"region": "EU"}, ignore_if_exists=True)
-
-# List partitions
-partition_infos = await admin.list_partition_infos(table_path)
-```
-
-### Writing
-
-Same as non-partitioned tables — include partition column values in each row:
-
-```python
-table = await conn.get_table(table_path)
-writer = table.new_append().create_writer()
-writer.append({"id": 1, "region": "US", "value": 100})
-writer.append({"id": 2, "region": "EU", "value": 200})
-await writer.flush()
-```
-
-### Reading
-
-Use `subscribe_partition()` or `subscribe_partition_buckets()` instead of `subscribe()`:
-
-```python
-scanner = await table.new_scan().create_record_batch_log_scanner()
-
-# Subscribe to individual partitions
-for p in partition_infos:
-    scanner.subscribe_partition(partition_id=p.partition_id, bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
-
-# Or batch-subscribe
-scanner.subscribe_partition_buckets({
-    (p.partition_id, 0): fluss.EARLIEST_OFFSET for p in partition_infos
-})
-
-print(scanner.to_pandas())
-```
-
-### Partitioned Primary Key Tables
-
-Partition columns must be part of the primary key. Partitions must be created before upserting.
-
-```python
-schema = fluss.Schema(
-    pa.schema([
-        pa.field("user_id", pa.int32()),
-        pa.field("region", pa.string()),
-        pa.field("score", pa.int64()),
-    ]),
-    primary_keys=["user_id", "region"],
-)
-
-table_path = fluss.TablePath("fluss", "partitioned_users")
-await admin.create_table(
-    table_path,
-    fluss.TableDescriptor(schema, partition_keys=["region"]),
-    ignore_if_exists=True,
-)
-
-await admin.create_partition(table_path, {"region": "US"}, ignore_if_exists=True)
-
-table = await conn.get_table(table_path)
-writer = table.new_upsert()
-writer.upsert({"user_id": 1, "region": "US", "score": 1234})
-await writer.flush()
-
-# Lookup includes partition columns
-lookuper = table.new_lookup()
-result = await lookuper.lookup({"user_id": 1, "region": "US"})
-```
-
-## Error Handling
-
-The client raises `fluss.FlussError` for Fluss-specific errors (connection failures, table not found, invalid operations, etc.):
-
-```python
-try:
-    await admin.create_table(table_path, table_descriptor)
-except fluss.FlussError as e:
-    print(f"Fluss error: {e.message}")
-```
-
-Common error scenarios:
-- **Connection refused** — Fluss cluster is not running or wrong address in `bootstrap.servers`
-- **Table not found** — table doesn't exist or wrong database/table name
-- **Partition not found** — writing to a partitioned table before creating partitions
-- **Schema mismatch** — row data doesn't match the table schema
-
-## Data Types
-
-The Python client uses PyArrow types for schema definitions:
-
-| PyArrow Type | Fluss Type | Python Type |
-|---|---|---|
-| `pa.boolean()` | Boolean | `bool` |
-| `pa.int8()` / `int16()` / `int32()` / `int64()` | TinyInt / SmallInt / Int / BigInt | `int` |
-| `pa.float32()` / `float64()` | Float / Double | `float` |
-| `pa.string()` | String | `str` |
-| `pa.binary()` | Bytes | `bytes` |
-| `pa.date32()` | Date | `datetime.date` |
-| `pa.time32("ms")` | Time | `datetime.time` |
-| `pa.timestamp("us")` | Timestamp (NTZ) | `datetime.datetime` |
-| `pa.timestamp("us", tz="UTC")` | TimestampLTZ | `datetime.datetime` |
-| `pa.decimal128(precision, scale)` | Decimal | `decimal.Decimal` |
-
-All Python native types (`date`, `time`, `datetime`, `Decimal`) work when appending rows via dicts.
-
-For a complete list of classes, methods, and properties, see the [API Reference](API_REFERENCE.md).
+For full documentation, see the [Python user guide](../../website/docs/user-guide/python/).
diff --git a/fluss-rust/bindings/python/generate_readme.py b/fluss-rust/bindings/python/generate_readme.py
new file mode 100644
index 0000000000..206f9e2ab0
--- /dev/null
+++ b/fluss-rust/bindings/python/generate_readme.py
@@ -0,0 +1,104 @@
+#!/usr/bin/env python3
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to you under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Generate bindings/python/GENERATED_README.md from the website docs.
+
+Usage:
+    python generate_readme.py          # writes GENERATED_README.md
+    python generate_readme.py --check  # exits non-zero if GENERATED_README.md is stale
+"""
+
+from __future__ import annotations
+
+import re
+import sys
+from pathlib import Path
+
+SCRIPT_DIR = Path(__file__).resolve().parent
+DOCS_DIR = SCRIPT_DIR / "../../website/docs/user-guide/python"
+
+LICENSE_HEADER = """\
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+"""
+
+# Files in the order they should appear in the README.
+SECTIONS: list[str] = [
+    "installation.md",
+    "example/index.md",
+    "example/configuration.md",
+    "example/admin-operations.md",
+    "example/log-tables.md",
+    "example/primary-key-tables.md",
+    "example/partitioned-tables.md",
+    "error-handling.md",
+    "data-types.md",
+    "api-reference.md",
+]
+# Leading YAML frontmatter only: \A stops a later `---` rule from matching.
+FRONTMATTER_RE = re.compile(r"\A---\n.*?^---\n", re.MULTILINE | re.DOTALL)
+
+
+def strip_frontmatter(text: str) -> str:
+    return FRONTMATTER_RE.sub("", text, count=1)
+
+
+def build_readme() -> str:
+    """Join the license header, title and doc sections (frontmatter stripped)."""
+    parts = [LICENSE_HEADER, "# Fluss Python Client\n"]
+
+    for section in SECTIONS:
+        path = DOCS_DIR / section
+        if not path.exists():
+            print(f"warning: {path} not found, skipping", file=sys.stderr)
+            continue
+        # The docs contain non-ASCII text; never rely on the locale's encoding.
+        parts.append(strip_frontmatter(path.read_text(encoding="utf-8")).strip())
+    return "\n\n".join(parts) + "\n"
+
+
+def main() -> None:
+    """Write GENERATED_README.md, or with --check only verify it is current."""
+    readme = build_readme()
+    dest = SCRIPT_DIR / "GENERATED_README.md"
+    if "--check" in sys.argv:
+        if not dest.exists() or dest.read_text(encoding="utf-8") != readme:
+            print("GENERATED_README.md is out of date. Run: python generate_readme.py")
+            sys.exit(1)
+        print("GENERATED_README.md is up to date.")
+        return
+
+    dest.write_text(readme, encoding="utf-8")
+    print(f"Wrote {dest}")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index 0e61b23484..0be25a03db 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -24,7 +24,7 @@ name = "pyfluss"
 description = "Apache Fluss (incubating) Python Binding"
 authors = [{name = "Apache Fluss", email = "dev@fluss.apache.org"}]
 license = {text = "Apache-2.0"}
-readme = "README.md"
+readme = "GENERATED_README.md"
 requires-python = ">=3.9"
 classifiers = [
     "License :: OSI Approved :: Apache Software License",
diff --git a/fluss-rust/crates/fluss/README.md b/fluss-rust/crates/fluss/README.md
index bee8ce8450..aad8de96c1 100644
--- a/fluss-rust/crates/fluss/README.md
+++ b/fluss-rust/crates/fluss/README.md
@@ -1,21 +1,3 @@
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-
 # Apache Fluss™ Rust Client (Incubating)
 
 Rust client library for [Apache Fluss™](https://fluss.apache.org/). This crate provides the core client used by the fluss-rust workspace and by the Python and C++ bindings.
diff --git a/fluss-rust/docs/creating-a-release.md b/fluss-rust/docs/creating-a-release.md
index 164b64b770..8b4c868fbf 100644
--- a/fluss-rust/docs/creating-a-release.md
+++ b/fluss-rust/docs/creating-a-release.md
@@ -1,21 +1,3 @@
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-
 # Creating a Fluss Rust Client Release
 
 This document describes in detail how to create a release of the **Fluss clients** (fluss-rust, fluss-python, fluss-cpp) from the [fluss-rust](https://github.com/apache/fluss-rust) repository. It is based on the [Creating a Fluss Release](https://fluss.apache.org/community/how-to-release/creating-a-fluss-release/) guide of the Apache Fluss project and the [release guide of Apache OpenDAL](https://nightlies.apache.org/opendal/opendal-docs-stable/community/release/); releases are source archives plus CI-published crates.io and PyPI.
diff --git a/fluss-rust/docs/generate-release-note.md b/fluss-rust/docs/generate-release-note.md
index 1167f4cdb7..edbc43bdbd 100644
--- a/fluss-rust/docs/generate-release-note.md
+++ b/fluss-rust/docs/generate-release-note.md
@@ -1,21 +1,3 @@
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-
 # Generate Release Note
 
 Use GitHub's **Generate release notes** to produce a draft from merged PRs between tags. Categories (Added, Fixed, Docs, etc.) are configured in [.github/release.yml](../.github/release.yml).
diff --git a/fluss-rust/docs/rust-client.md b/fluss-rust/docs/rust-client.md
index 0396882904..e69de29bb2 100644
--- a/fluss-rust/docs/rust-client.md
+++ b/fluss-rust/docs/rust-client.md
@@ -1,755 +0,0 @@
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-
-# Fluss Rust Client Guide
-
-This guide covers how to use the Fluss Rust client for reading and writing data to log tables and primary key tables.
-
-## Adding to Your Project
-
-The Fluss Rust client is published to [crates.io](https://crates.io/crates/fluss-rs) as `fluss-rs`. The crate's library name is `fluss`, so you import it with `use fluss::...`.
-
-```toml
-[dependencies]
-fluss-rs = "0.1"
-tokio = { version = "1", features = ["full"] }
-```
-
-### Feature Flags
-
-The Fluss crate supports optional storage backends:
-
-```toml
-[dependencies]
-# Default: memory and filesystem storage
-fluss-rs = "0.1"
-
-# With S3 storage support
-fluss-rs = { version = "0.1", features = ["storage-s3"] }
-
-# With OSS storage support
-fluss-rs = { version = "0.1", features = ["storage-oss"] }
-
-# All storage backends
-fluss-rs = { version = "0.1", features = ["storage-all"] }
-```
-
-Available features:
-- `storage-memory` (default) - In-memory storage
-- `storage-fs` (default) - Local filesystem storage
-- `storage-s3` - Amazon S3 storage
-- `storage-oss` - Alibaba OSS storage
-- `storage-all` - All storage backends
-
-### Alternative: Git or Path Dependency
-
-For development against unreleased changes, you can depend on the Git repository or a local checkout:
-
-```toml
-[dependencies]
-# From Git
-fluss = { git = "https://github.com/apache/fluss-rust.git", package = "fluss-rs" }
-
-# From local path
-fluss = { path = "/path/to/fluss-rust/crates/fluss", package = "fluss-rs" }
-```
-
-> **Note:** When using `git` or `path` dependencies, the `package = "fluss-rs"` field is required so that Cargo resolves the correct package while still allowing `use fluss::...` imports.
-
-## Building from Source
-
-### Prerequisites
-
-- Rust 1.85+
-- Protobuf compiler (`protoc`) - only required when [building from source](#building-from-source)
-
-
-### 1. Clone the Repository
-
-```bash
-git clone https://github.com/apache/fluss-rust.git
-cd fluss-rust
-```
-
-### 2. Install Dependencies
-
-The Protobuf compiler (`protoc`) is required to build from source.
-
-#### macOS
-
-```bash
-brew install protobuf
-```
-
-#### Ubuntu/Debian
-
-```bash
-sudo apt-get install protobuf-compiler
-```
-
-### 3. Build the Library
-
-```bash
-cargo build --workspace --all-targets
-```
-
-## Connection Setup
-
-```rust
-use fluss::client::FlussConnection;
-use fluss::config::Config;
-use fluss::error::Result;
-
-#[tokio::main]
-async fn main() -> Result<()> {
-    let mut config = Config::default();
-    config.bootstrap_servers = "127.0.0.1:9123".to_string();
-
-    let conn = FlussConnection::new(config).await?;
-
-    // Use the connection...
-
-    Ok(())
-}
-```
-
-### Configuration Options
-
-| Option | Description | Default |
-|--------|-------------|---------|
-| `bootstrap_servers` | Coordinator server address | `127.0.0.1:9123` |
-| `writer_request_max_size` | Maximum request size in bytes | 10 MB |
-| `writer_acks` | Acknowledgment setting (`all` waits for all replicas) | `all` |
-| `writer_retries` | Number of retries on failure | `i32::MAX` |
-| `writer_batch_size` | Batch size for writes | 2 MB |
-
-## Admin Operations
-
-### Get Admin Interface
-
-```rust
-let admin = conn.get_admin().await?;
-```
-
-### Database Operations
-
-```rust
-// Create database
-admin.create_database("my_database", None, true).await?;
-
-// List all databases
-let databases = admin.list_databases().await?;
-println!("Databases: {:?}", databases);
-
-// Check if database exists
-let exists = admin.database_exists("my_database").await?;
-
-// Get database information
-let db_info = admin.get_database_info("my_database").await?;
-
-// Drop database
-admin.drop_database("my_database", true, false).await?;
-```
-
-### Table Operations
-
-```rust
-use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
-
-// Define table schema
-let table_descriptor = TableDescriptor::builder()
-    .schema(
-        Schema::builder()
-            .column("id", DataTypes::int())
-            .column("name", DataTypes::string())
-            .column("amount", DataTypes::bigint())
-            .build()?,
-    )
-    .build()?;
-
-let table_path = TablePath::new("my_database", "my_table");
-
-// Create table
-admin.create_table(&table_path, &table_descriptor, true).await?;
-
-// Get table information
-let table_info = admin.get_table_info(&table_path).await?;
-println!("Table: {}", table_info);
-
-// List tables in database
-let tables = admin.list_tables("my_database").await?;
-
-// Check if table exists
-let exists = admin.table_exists(&table_path).await?;
-
-// Drop table
-admin.drop_table(&table_path, true).await?;
-```
-
-### Partition Operations
-
-```rust
-use fluss::metadata::PartitionSpec;
-use std::collections::HashMap;
-
-// List all partitions
-let partitions = admin.list_partition_infos(&table_path).await?;
-
-// List partitions matching a spec
-let mut filter = HashMap::new();
-filter.insert("year", "2024");
-let spec = PartitionSpec::new(filter);
-let partitions = admin.list_partition_infos_with_spec(&table_path, Some(&spec)).await?;
-
-// Create partition
-admin.create_partition(&table_path, &spec, true).await?;
-
-// Drop partition
-admin.drop_partition(&table_path, &spec, true).await?;
-```
-
-### Offset Operations
-
-```rust
-use fluss::rpc::message::OffsetSpec;
-
-let bucket_ids = vec![0, 1, 2];
-
-// Get earliest offsets
-let earliest = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Earliest).await?;
-
-// Get latest offsets
-let latest = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Latest).await?;
-
-// Get offsets for a specific timestamp
-let timestamp_ms = 1704067200000; // 2024-01-01 00:00:00 UTC
-let offsets = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Timestamp(timestamp_ms)).await?;
-
-// Get offsets for a specific partition
-let partition_offsets = admin.list_partition_offsets(
-    &table_path,
-    "partition_name",
-    &bucket_ids,
-    OffsetSpec::Latest,
-).await?;
-```
-
-### Lake Snapshot
-
-```rust
-// Get latest lake snapshot for lakehouse integration
-let snapshot = admin.get_latest_lake_snapshot(&table_path).await?;
-println!("Snapshot ID: {}", snapshot.snapshot_id);
-```
-
-## Log Table Operations
-
-Log tables are append-only tables without primary keys, suitable for event streaming.
-
-### Creating a Log Table
-
-```rust
-let table_descriptor = TableDescriptor::builder()
-    .schema(
-        Schema::builder()
-            .column("event_id", DataTypes::int())
-            .column("event_type", DataTypes::string())
-            .column("timestamp", DataTypes::bigint())
-            .build()?,
-    )
-    .build()?;
-
-let table_path = TablePath::new("fluss", "events");
-admin.create_table(&table_path, &table_descriptor, true).await?;
-```
-
-### Writing to Log Tables
-
-```rust
-use fluss::row::{GenericRow, InternalRow};
-
-let table = conn.get_table(&table_path).await?;
-let append_writer = table.new_append()?.create_writer()?;
-
-// Write a single row
-let mut row = GenericRow::new(3);
-row.set_field(0, 1);                    // event_id (int)
-row.set_field(1, "user_login");         // event_type (string)
-row.set_field(2, 1704067200000i64);     // timestamp (bigint)
-
-append_writer.append(&row)?;
-
-// Write multiple rows
-let mut row2 = GenericRow::new(3);
-row2.set_field(0, 2);
-row2.set_field(1, "page_view");
-row2.set_field(2, 1704067201000i64);
-
-append_writer.append(&row2)?;
-
-// Flush to ensure data is persisted
-append_writer.flush().await?;
-```
-
-Write operations (`append`, `upsert`, `delete`) use a **fire-and-forget** pattern for efficient batching. Each call queues the write and returns a `WriteResultFuture` immediately. Call `flush()` to ensure all queued writes are sent to the server.
-
-If you need per-record acknowledgment, you can await the returned future:
-
-```rust
-// Per-record acknowledgment (blocks until server confirms)
-append_writer.append(&row)?.await?;
-```
-
-### Reading from Log Tables
-
-```rust
-use std::time::Duration;
-
-let table = conn.get_table(&table_path).await?;
-let log_scanner = table.new_scan().create_log_scanner()?;
-
-// Subscribe to bucket 0 starting from offset 0
-log_scanner.subscribe(0, 0).await?;
-
-// Poll for records
-let records = log_scanner.poll(Duration::from_secs(10)).await?;
-
-for record in records {
-    let row = record.row();
-    println!(
-        "event_id={}, event_type={}, timestamp={} @ offset={}",
-        row.get_int(0),
-        row.get_string(1),
-        row.get_long(2),
-        record.offset()
-    );
-}
-```
-
-### Column Projection
-
-```rust
-// Project specific columns by index
-let scanner = table.new_scan().project(&[0, 2])?.create_log_scanner()?;
-
-// Or project by column names
-let scanner = table.new_scan().project_by_name(&["event_id", "timestamp"])?.create_log_scanner()?;
-```
-
-### Subscribe from Specific Offsets
-
-```rust
-use fluss::client::{EARLIEST_OFFSET, LATEST_OFFSET};
-
-// Subscribe from earliest available offset
-log_scanner.subscribe(0, EARLIEST_OFFSET).await?;
-
-// Subscribe from latest offset (only new records)
-log_scanner.subscribe(0, LATEST_OFFSET).await?;
-
-// Subscribe from a specific offset
-log_scanner.subscribe(0, 42).await?;
-
-// Subscribe to all buckets
-let num_buckets = table.get_table_info().get_num_buckets();
-for bucket_id in 0..num_buckets {
-    log_scanner.subscribe(bucket_id, 0).await?;
-}
-```
-
-### Subscribe to Multiple Buckets
-
-```rust
-use std::collections::HashMap;
-
-// Subscribe to multiple buckets at once with specific offsets
-let mut bucket_offsets = HashMap::new();
-bucket_offsets.insert(0, 0i64);    // bucket 0 from offset 0
-bucket_offsets.insert(1, 100i64);  // bucket 1 from offset 100
-log_scanner.subscribe_buckets(&bucket_offsets).await?;
-```
-
-### Unsubscribe from a Bucket
-
-```rust
-// Unsubscribe from a specific bucket (non-partitioned tables)
-log_scanner.unsubscribe(bucket_id).await?;
-```
-
-### Unsubscribe from a Partition
-
-```rust
-// Unsubscribe from a specific partition bucket
-log_scanner.unsubscribe_partition(partition_id, bucket_id).await?;
-```
-
-## Partitioned Log Tables
-
-Partitioned tables distribute data across partitions based on partition column values, enabling efficient data organization and querying.
-
-### Creating a Partitioned Log Table
-
-```rust
-use fluss::metadata::{DataTypes, LogFormat, Schema, TableDescriptor, TablePath};
-
-let table_descriptor = TableDescriptor::builder()
-    .schema(
-        Schema::builder()
-            .column("event_id", DataTypes::int())
-            .column("event_type", DataTypes::string())
-            .column("dt", DataTypes::string())       // partition column
-            .column("region", DataTypes::string())   // partition column
-            .build()?,
-    )
-    .partitioned_by(vec!["dt", "region"])  // Define partition columns
-    .log_format(LogFormat::ARROW)
-    .build()?;
-
-let table_path = TablePath::new("fluss", "partitioned_events");
-admin.create_table(&table_path, &table_descriptor, true).await?;
-```
-
-### Writing to Partitioned Log Tables
-
-Writing works the same as non-partitioned tables. Include partition column values in each row:
-
-```rust
-let table = conn.get_table(&table_path).await?;
-let append_writer = table.new_append()?.create_writer()?;
-
-// Partition column values determine which partition the record goes to
-let mut row = GenericRow::new(4);
-row.set_field(0, 1);                  // event_id
-row.set_field(1, "user_login");       // event_type
-row.set_field(2, "2024-01-15");       // dt (partition column)
-row.set_field(3, "US");               // region (partition column)
-
-append_writer.append(&row)?;
-append_writer.flush().await?;
-```
-
-### Reading from Partitioned Log Tables
-
-For partitioned tables, use `subscribe_partition()` instead of `subscribe()`:
-
-```rust
-use std::time::Duration;
-
-let table = conn.get_table(&table_path).await?;
-let admin = conn.get_admin().await?;
-
-// Get partition information
-let partitions = admin.list_partition_infos(&table_path).await?;
-
-let log_scanner = table.new_scan().create_log_scanner()?;
-
-// Subscribe to each partition's buckets
-for partition_info in &partitions {
-    let partition_id = partition_info.get_partition_id();
-    let num_buckets = table.get_table_info().get_num_buckets();
-
-    for bucket_id in 0..num_buckets {
-        log_scanner.subscribe_partition(partition_id, bucket_id, 0).await?;
-    }
-}
-
-// Poll for records
-let records = log_scanner.poll(Duration::from_secs(10)).await?;
-for record in records {
-    println!("Record from partition: {:?}", record.row());
-}
-```
-
-You can also subscribe to multiple partition-buckets at once:
-
-```rust
-use std::collections::HashMap;
-
-let mut partition_bucket_offsets = HashMap::new();
-partition_bucket_offsets.insert((partition_id, 0), 0i64);  // partition, bucket 0, offset 0
-partition_bucket_offsets.insert((partition_id, 1), 0i64);  // partition, bucket 1, offset 0
-log_scanner.subscribe_partition_buckets(&partition_bucket_offsets).await?;
-```
-
-### Managing Partitions
-
-```rust
-use fluss::metadata::PartitionSpec;
-use std::collections::HashMap;
-
-// Create a partition
-let mut partition_values = HashMap::new();
-partition_values.insert("dt", "2024-01-15");
-partition_values.insert("region", "EMEA");
-let spec = PartitionSpec::new(partition_values);
-admin.create_partition(&table_path, &spec, true).await?;
-
-// List all partitions
-let partitions = admin.list_partition_infos(&table_path).await?;
-for partition in &partitions {
-    println!(
-        "Partition: id={}, name={}",
-        partition.get_partition_id(),
-        partition.get_partition_name()  // Format: "value1$value2"
-    );
-}
-
-// List partitions with filter (partial spec)
-let mut partial_values = HashMap::new();
-partial_values.insert("dt", "2024-01-15");
-let partial_spec = PartitionSpec::new(partial_values);
-let filtered = admin.list_partition_infos_with_spec(&table_path, Some(&partial_spec)).await?;
-
-// Drop a partition
-admin.drop_partition(&table_path, &spec, true).await?;
-```
-
-## Primary Key Table Operations
-
-Primary key tables (KV tables) support upsert, delete, and lookup operations.
-
-### Creating a Primary Key Table
-
-```rust
-let table_descriptor = TableDescriptor::builder()
-    .schema(
-        Schema::builder()
-            .column("id", DataTypes::int())
-            .column("name", DataTypes::string())
-            .column("age", DataTypes::bigint())
-            .primary_key(vec!["id"])  // Define primary key
-            .build()?,
-    )
-    .build()?;
-
-let table_path = TablePath::new("fluss", "users");
-admin.create_table(&table_path, &table_descriptor, true).await?;
-```
-
-### Upserting Records
-
-```rust
-let table = conn.get_table(&table_path).await?;
-let table_upsert = table.new_upsert()?;
-let upsert_writer = table_upsert.create_writer()?;
-
-// Insert or update records
-for (id, name, age) in [(1, "Alice", 25i64), (2, "Bob", 30), (3, "Charlie", 35)] {
-    let mut row = GenericRow::new(3);
-    row.set_field(0, id);
-    row.set_field(1, name);
-    row.set_field(2, age);
-    upsert_writer.upsert(&row)?;
-}
-upsert_writer.flush().await?;
-```
-
-### Updating Records
-
-```rust
-// Update existing record (same primary key)
-let mut row = GenericRow::new(3);
-row.set_field(0, 1);        // id (primary key)
-row.set_field(1, "Alice");  // name
-row.set_field(2, 26i64);    // Updated age
-
-upsert_writer.upsert(&row)?;
-upsert_writer.flush().await?;
-```
-
-### Deleting Records
-
-```rust
-// Delete by primary key (only primary key field needs to be set)
-let mut row = GenericRow::new(3);
-row.set_field(0, 2);  // id of record to delete
-
-upsert_writer.delete(&row)?;
-upsert_writer.flush().await?;
-```
-
-### Partial Updates
-
-Update only specific columns while preserving others:
-
-```rust
-// By column indices
-let partial_upsert = table_upsert.partial_update(Some(vec![0, 2]))?;
-let partial_writer = partial_upsert.create_writer()?;
-
-let mut row = GenericRow::new(3);
-row.set_field(0, 1);       // id (primary key, required)
-row.set_field(2, 27i64);   // age (will be updated)
-// name will remain unchanged
-
-partial_writer.upsert(&row)?;
-partial_writer.flush().await?;
-
-// By column names
-let partial_upsert = table_upsert.partial_update_with_column_names(&["id", "age"])?;
-let partial_writer = partial_upsert.create_writer()?;
-```
-
-### Looking Up Records
-
-```rust
-let mut lookuper = table.new_lookup()?.create_lookuper()?;
-
-// Create a key row (only primary key fields)
-let mut key = GenericRow::new(1);
-key.set_field(0, 1);  // id to lookup
-
-let result = lookuper.lookup(&key).await?;
-
-if let Some(row) = result.get_single_row()? {
-    println!(
-        "Found: id={}, name={}, age={}",
-        row.get_int(0),
-        row.get_string(1),
-        row.get_long(2)
-    );
-} else {
-    println!("Record not found");
-}
-```
-
-## Partitioned Primary Key Tables
-
-Partitioned KV tables combine partitioning with primary key operations. Partition columns must be part of the primary key.
-
-### Creating a Partitioned Primary Key Table
-
-```rust
-use fluss::metadata::{DataTypes, KvFormat, Schema, TableDescriptor, TablePath};
-
-let table_descriptor = TableDescriptor::builder()
-    .schema(
-        Schema::builder()
-            .column("user_id", DataTypes::int())
-            .column("region", DataTypes::string())   // partition column
-            .column("zone", DataTypes::bigint())     // partition column
-            .column("score", DataTypes::bigint())
-            // Primary key must include partition columns
-            .primary_key(vec!["user_id", "region", "zone"])
-            .build()?,
-    )
-    .partitioned_by(vec!["region", "zone"])  // Define partition columns
-    .kv_format(KvFormat::COMPACTED)
-    .build()?;
-
-let table_path = TablePath::new("fluss", "partitioned_users");
-admin.create_table(&table_path, &table_descriptor, true).await?;
-```
-
-### Writing to Partitioned Primary Key Tables
-
-Upsert and delete operations work the same as non-partitioned KV tables. **Partitions must be created before upserting data.**
-
-```rust
-use fluss::metadata::PartitionSpec;
-use std::collections::HashMap;
-
-let table = conn.get_table(&table_path).await?;
-
-// Ensure partitions exist before upserting
-for (region, zone) in [("APAC", "1"), ("EMEA", "2"), ("US", "3")] {
-    let mut partition_values = HashMap::new();
-    partition_values.insert("region", region);
-    partition_values.insert("zone", zone);
-    let spec = PartitionSpec::new(partition_values);
-    admin.create_partition(&table_path, &spec, true).await?;
-}
-
-let table_upsert = table.new_upsert()?;
-let upsert_writer = table_upsert.create_writer()?;
-
-// Upsert records - partition is determined by partition column values
-for (user_id, region, zone, score) in [
-    (1001, "APAC", 1i64, 1234i64),
-    (1002, "EMEA", 2, 2234),
-    (1003, "US", 3, 3234),
-] {
-    let mut row = GenericRow::new(4);
-    row.set_field(0, user_id);
-    row.set_field(1, region);
-    row.set_field(2, zone);
-    row.set_field(3, score);
-    upsert_writer.upsert(&row)?;
-}
-upsert_writer.flush().await?;
-
-// Update a record
-let mut row = GenericRow::new(4);
-row.set_field(0, 1001);
-row.set_field(1, "APAC");
-row.set_field(2, 1i64);
-row.set_field(3, 5000i64);  // Updated score
-upsert_writer.upsert(&row)?;
-upsert_writer.flush().await?;
-
-// Delete a record (primary key includes partition columns)
-let mut row = GenericRow::new(4);
-row.set_field(0, 1002);
-row.set_field(1, "EMEA");
-row.set_field(2, 2i64);
-upsert_writer.delete(&row)?;
-upsert_writer.flush().await?;
-```
-
-### Looking Up Records in Partitioned Tables
-
-Lookup requires all primary key columns including partition columns:
-
-```rust
-let mut lookuper = table.new_lookup()?.create_lookuper()?;
-
-// Key must include all primary key columns (including partition columns)
-let mut key = GenericRow::new(3);
-key.set_field(0, 1001);    // user_id
-key.set_field(1, "APAC");  // region (partition column)
-key.set_field(2, 1i64);    // zone (partition column)
-
-let result = lookuper.lookup(&key).await?;
-if let Some(row) = result.get_single_row()? {
-    println!("Found: score={}", row.get_long(3));
-}
-```
-
-> **Note:** Scanning partitioned primary key tables is not supported. Use lookup operations instead.
-
-## Data Types
-
-| Fluss Type      | Rust Type      | Method                                                              |
-|-----------------|----------------|---------------------------------------------------------------------|
-| `BOOLEAN`       | `bool`         | `get_boolean()`, `set_field(idx, bool)`                             |
-| `TINYINT`       | `i8`           | `get_byte()`, `set_field(idx, i8)`                                  |
-| `SMALLINT`      | `i16`          | `get_short()`, `set_field(idx, i16)`                                |
-| `INT`           | `i32`          | `get_int()`, `set_field(idx, i32)`                                  |
-| `BIGINT`        | `i64`          | `get_long()`, `set_field(idx, i64)`                                 |
-| `FLOAT`         | `f32`          | `get_float()`, `set_field(idx, f32)`                                |
-| `DOUBLE`        | `f64`          | `get_double()`, `set_field(idx, f64)`                               |
-| `CHAR`          | `&str`         | `get_char(idx, length)`, `set_field(idx, &str)`                     |
-| `STRING`        | `&str`         | `get_string()`, `set_field(idx, &str)`                              |
-| `DECIMAL`       | `Decimal`      | `get_decimal(idx, precision, scale)`, `set_field(idx, Decimal)`     |
-| `DATE`          | `Date`         | `get_date()`, `set_field(idx, Date)`                                |
-| `TIME`          | `Time`         | `get_time()`, `set_field(idx, Time)`                                |
-| `TIMESTAMP`     | `TimestampNtz` | `get_timestamp_ntz(idx, precision)`, `set_field(idx, TimestampNtz)` |
-| `TIMESTAMP_LTZ` | `TimestampLtz` | `get_timestamp_ltz(idx, precision)`, `set_field(idx, TimestampLtz)` |
-| `BYTES`         | `&[u8]`        | `get_bytes()`, `set_field(idx, &[u8])`                              |
-| `BINARY(n)`     | `&[u8]`        | `get_binary(idx, length)`, `set_field(idx, &[u8])`                  |
-
diff --git a/fluss-rust/docs/verifying-a-release-candidate.md b/fluss-rust/docs/verifying-a-release-candidate.md
index e67d4efc7b..dc70f723bd 100644
--- a/fluss-rust/docs/verifying-a-release-candidate.md
+++ b/fluss-rust/docs/verifying-a-release-candidate.md
@@ -1,21 +1,3 @@
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-
 # How to Verify a Release Candidate
 
 This document describes how to verify a release candidate (RC) of the **Fluss clients** (fluss-rust, fluss-python, fluss-cpp) from the [fluss-rust](https://github.com/apache/fluss-rust) repository. It is intended for anyone participating in the release vote (binding or non-binding) and is based on [Verifying a Fluss Release](https://fluss.apache.org/community/how-to-release/verifying-a-fluss-release/) of the Apache Fluss project, adapted for the fluss-rust source distribution and tooling (Rust, Python, C++).
diff --git a/fluss-rust/justfile b/fluss-rust/justfile
index c4e1a763ac..c2a611688b 100644
--- a/fluss-rust/justfile
+++ b/fluss-rust/justfile
@@ -26,3 +26,7 @@ release [version]:
 # Usage: just bump-version <current> <next>   e.g. just bump-version 0.1.0 0.1.1
 bump-version from to:
     ./scripts/bump-version.sh {{from}} {{to}}
+
+# Regenerate bindings/python/GENERATED_README.md from website docs.
+generate-python-readme:
+    python bindings/python/generate_readme.py
diff --git a/fluss-rust/website/babel.config.js b/fluss-rust/website/babel.config.js
new file mode 100644
index 0000000000..e00595dae7
--- /dev/null
+++ b/fluss-rust/website/babel.config.js
@@ -0,0 +1,3 @@
+module.exports = {
+  presets: [require.resolve('@docusaurus/core/lib/babel/preset')],
+};
diff --git a/fluss-rust/website/docs/developer-guide/_category_.json b/fluss-rust/website/docs/developer-guide/_category_.json
new file mode 100644
index 0000000000..cc7b01abbc
--- /dev/null
+++ b/fluss-rust/website/docs/developer-guide/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Developer Guide",
+  "position": 3
+}
diff --git a/fluss-rust/website/docs/developer-guide/contributing.md b/fluss-rust/website/docs/developer-guide/contributing.md
new file mode 100644
index 0000000000..eced106aad
--- /dev/null
+++ b/fluss-rust/website/docs/developer-guide/contributing.md
@@ -0,0 +1,126 @@
+# Contributing
+
+Welcome to the development guide for `fluss-rust`! This project builds the Fluss Rust client and language-specific bindings (Python, C++).
+
+## Prerequisites
+
+- Rust 1.85+ (see [rust-toolchain.toml](https://github.com/apache/fluss-rust/blob/main/rust-toolchain.toml))
+- Protobuf compiler (`protoc`)
+
+Install using your preferred package/version manager:
+
+```bash
+# Using mise
+mise install protobuf
+mise install rust
+
+# Using Homebrew (macOS)
+brew install protobuf
+
+# Using apt (Ubuntu/Debian)
+sudo apt-get install protobuf-compiler
+```
+
+## IDE Setup
+
+We recommend [RustRover](https://www.jetbrains.com/rust/) IDE.
+
+### Importing the Project
+
+1. Clone the repository:
+   ```bash
+   git clone https://github.com/apache/fluss-rust.git
+   ```
+2. Open RustRover, go to the `Projects` tab, click `Open`, and navigate to the root directory of the cloned repository.
+3. Click `Open`.
+
+### Copyright Profile
+
+Fluss is an Apache project, so every file needs an Apache license header. To automate this in RustRover:
+
+1. Go to `Settings` > `Editor` > `Copyright` > `Copyright Profiles`.
+2. Add a new profile named `Apache` with this text:
+   ```
+   Licensed to the Apache Software Foundation (ASF) under one
+   or more contributor license agreements.  See the NOTICE file
+   distributed with this work for additional information
+   regarding copyright ownership.  The ASF licenses this file
+   to you under the Apache License, Version 2.0 (the
+   "License"); you may not use this file except in compliance
+   with the License.  You may obtain a copy of the License at
+
+     http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing,
+   software distributed under the License is distributed on an
+   "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+   KIND, either express or implied.  See the License for the
+   specific language governing permissions and limitations
+   under the License.
+   ```
+3. Go to `Editor` > `Copyright` and set `Apache` as the default profile.
+4. Go to `Editor` > `Copyright` > `Formatting` > `Rust`, choose `Use custom formatting`, then `Use line comment`.
+5. Click `Apply`.
+
+## Project Structure
+
+```
+crates/fluss        (Fluss Rust client crate)
+crates/examples     (Rust client examples)
+bindings/cpp        (C++ bindings)
+bindings/python     (Python bindings - PyO3)
+```
+
+## Building and Testing
+
+### Rust Client
+
+```bash
+# Build everything
+cargo build --workspace --all-targets
+
+# Run unit tests
+cargo test --workspace
+
+# Run integration tests (requires a running Fluss cluster)
+RUST_TEST_THREADS=1 cargo test --features integration_tests --workspace
+
+# Run a single test
+cargo test test_name
+```
+
+### Python Bindings
+
+```bash
+cd bindings/python
+pip install maturin
+pip install -e ".[dev]"
+maturin develop
+```
+
+### C++ Bindings
+
+```bash
+cd bindings/cpp
+mkdir -p build && cd build
+cmake ..
+cmake --build .
+```
+
+## License Check (cargo-deny)
+
+We use [cargo-deny](https://embarkstudios.github.io/cargo-deny/) to ensure all dependency licenses are Apache-compatible:
+
+```bash
+cargo install cargo-deny --locked
+cargo deny check licenses
+```
+
+## Formatting and Clippy
+
+CI runs formatting and clippy checks. Run these before submitting a PR:
+
+```bash
+cargo fmt --all
+cargo clippy --all-targets --fix --allow-dirty --allow-staged
+```
diff --git a/fluss-rust/website/docs/index.md b/fluss-rust/website/docs/index.md
new file mode 100644
index 0000000000..4153813877
--- /dev/null
+++ b/fluss-rust/website/docs/index.md
@@ -0,0 +1,45 @@
+---
+slug: /
+sidebar_position: 1
+title: Introduction
+---
+
+# Introduction
+
+[Apache Fluss](https://fluss.apache.org/) (incubating) is a streaming storage system built for real-time analytics, serving as the real-time data layer for Lakehouse architectures.
+
+This documentation covers the **Fluss client libraries** for Rust, Python, and C++, which are developed in the [fluss-rust](https://github.com/apache/fluss-rust) repository. These clients allow you to:
+
+- **Create and manage** databases, tables, and partitions
+- **Write** data to log tables (append-only) and primary key tables (upsert/delete)
+- **Read** data via log scanning and key lookups
+- **Integrate** with the broader Fluss ecosystem including lakehouse snapshots
+
+## Prerequisites
+
+You need a running Fluss cluster to use any of the client libraries. See the [Deploying a Local Cluster](https://fluss.apache.org/docs/install-deploy/deploying-local-cluster/) guide to get started.
+
+## Key Concepts
+
+- **Log table** — an append-only table (no primary key). Records are immutable once written. Use for event streams, logs, and audit trails.
+  - **Offset** — the position of a record within a log table's bucket. Used to track reading progress. Start from `EARLIEST_OFFSET` to read all data, or resolve the current latest offset via `list_offsets` to only read new records.
+- **Primary key (PK) table** — a table with a primary key. Supports upsert, delete, and point lookups.
+- **Bucket** — the unit of parallelism within a table (similar to Kafka partitions). Each table has one or more buckets. Readers subscribe to individual buckets.
+- **Partition** — a way to organize data by column values (e.g. by date or region). Each partition contains its own set of buckets. Partitions must be created explicitly before writing.
+
+## Client Overview
+
+|                        | Rust                                                       | Python                   | C++                                            |
+|------------------------|------------------------------------------------------------|--------------------------|------------------------------------------------|
+| **Package**            | [fluss-rs](https://crates.io/crates/fluss-rs) on crates.io | Build from source (PyO3) | Build from source (CMake)                      |
+| **Async runtime**      | Tokio                                                      | asyncio                  | Synchronous (Tokio runtime managed internally) |
+| **Data format**        | Arrow RecordBatch / GenericRow                             | PyArrow / Pandas / dict  | Arrow RecordBatch / GenericRow                 |
+| **Log tables**         | Read + Write                                               | Read + Write             | Read + Write                                   |
+| **Primary key tables** | Upsert + Delete + Lookup                                   | Upsert + Delete + Lookup | Upsert + Delete + Lookup                       |
+| **Partitioned tables** | Read + Write                                               | Read + Write             | Read + Write                                   |
+
+## How This Guide Is Organised
+
+The **User Guide** walks through installation, configuration, and working with each table type across all three languages. Code examples are shown side by side under **Rust**, **Python**, and **C++** headings.
+
+The **Developer Guide** covers building from source, running tests, and the release process for contributors.
diff --git a/fluss-rust/website/docs/user-guide/_category_.json b/fluss-rust/website/docs/user-guide/_category_.json
new file mode 100644
index 0000000000..68ea78e784
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "User Guide",
+  "position": 2
+}
diff --git a/fluss-rust/website/docs/user-guide/cpp/_category_.json b/fluss-rust/website/docs/user-guide/cpp/_category_.json
new file mode 100644
index 0000000000..fbdf7a264d
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "C++",
+  "position": 3
+}
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
new file mode 100644
index 0000000000..00ff8086d8
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -0,0 +1,495 @@
+---
+sidebar_position: 2
+---
+# API Reference
+
+Complete API reference for the Fluss C++ client.
+
+## `Result`
+
+| Field / Method  | Type          | Description                                                    |
+|-----------------|---------------|----------------------------------------------------------------|
+| `error_code`    | `int32_t`     | 0 for success, non-zero for errors                             |
+| `error_message` | `std::string` | Human-readable error description                               |
+| `Ok()`          | `bool`        | Returns `true` if operation succeeded (`error_code == 0`)      |
+
+## `Configuration`
+
+| Field                             | Type          | Default              | Description                                                     |
+|-----------------------------------|---------------|----------------------|-----------------------------------------------------------------|
+| `bootstrap_servers`               | `std::string` | `"127.0.0.1:9123"`   | Coordinator server address                                      |
+| `writer_request_max_size`         | `int32_t`     | `10485760` (10 MB)   | Maximum request size in bytes                                   |
+| `writer_acks`                     | `std::string` | `"all"`              | Acknowledgment setting (`"all"`, `"0"`, `"1"`, or `"-1"`)       |
+| `writer_retries`                  | `int32_t`     | `INT32_MAX`          | Number of retries on failure                                    |
+| `writer_batch_size`               | `int32_t`     | `2097152` (2 MB)     | Batch size for writes in bytes                                  |
+| `scanner_remote_log_prefetch_num` | `size_t`      | `4`                  | Number of remote log segments to prefetch                       |
+| `remote_file_download_thread_num` | `size_t`      | `3`                  | Number of threads for remote log downloads                      |
+
+## `Connection`
+
+| Method                                                                  | Description                                       |
+|-------------------------------------------------------------------------|---------------------------------------------------|
+| `static Create(const Configuration& config, Connection& out) -> Result` | Create a connection to a Fluss cluster            |
+| `GetAdmin(Admin& out) -> Result`                                        | Get the admin interface                           |
+| `GetTable(const TablePath& table_path, Table& out) -> Result`           | Get a table for read/write operations             |
+| `Available() -> bool`                                                   | Check if the connection is valid and initialized  |
+
+## `Admin`
+
+### Database Operations
+
+| Method                                                                                                                    | Description              |
+|---------------------------------------------------------------------------------------------------------------------------|--------------------------|
+| `CreateDatabase(const std::string& database_name, const DatabaseDescriptor& descriptor, bool ignore_if_exists) -> Result` | Create a database        |
+| `DropDatabase(const std::string& name, bool ignore_if_not_exists, bool cascade) -> Result`                                | Drop a database          |
+| `ListDatabases(std::vector<std::string>& out) -> Result`                                                                  | List all databases       |
+| `DatabaseExists(const std::string& name, bool& out) -> Result`                                                            | Check if a database exists |
+| `GetDatabaseInfo(const std::string& name, DatabaseInfo& out) -> Result`                                                   | Get database metadata    |
+
+### Table Operations
+
+| Method                                                                                                     | Description                 |
+|------------------------------------------------------------------------------------------------------------|-----------------------------|
+| `CreateTable(const TablePath& path, const TableDescriptor& descriptor, bool ignore_if_exists) -> Result`   | Create a table              |
+| `DropTable(const TablePath& path, bool ignore_if_not_exists) -> Result`                                    | Drop a table                |
+| `GetTableInfo(const TablePath& path, TableInfo& out) -> Result`                                            | Get table metadata          |
+| `ListTables(const std::string& database_name, std::vector<std::string>& out) -> Result`                    | List tables in a database   |
+| `TableExists(const TablePath& path, bool& out) -> Result`                                                  | Check if a table exists     |
+
+### Partition Operations
+
+| Method                                                                                                                                          | Description              |
+|-------------------------------------------------------------------------------------------------------------------------------------------------|--------------------------|
+| `CreatePartition(const TablePath& path, const std::unordered_map<std::string, std::string>& partition_spec, bool ignore_if_exists) -> Result`   | Create a partition       |
+| `DropPartition(const TablePath& path, const std::unordered_map<std::string, std::string>& partition_spec, bool ignore_if_not_exists) -> Result` | Drop a partition         |
+| `ListPartitionInfos(const TablePath& path, std::vector<PartitionInfo>& out) -> Result`                                                          | List partition metadata  |
+
+### Offset Operations
+
+| Method                                                                                                                                                                                                  | Description                             |
+|---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|-----------------------------------------|
+| `ListOffsets(const TablePath& path, const std::vector<int32_t>& bucket_ids, const OffsetQuery& query, std::unordered_map<int32_t, int64_t>& out) -> Result`                                             | Get offsets for buckets                 |
+| `ListPartitionOffsets(const TablePath& path, const std::string& partition_name, const std::vector<int32_t>& bucket_ids, const OffsetQuery& query, std::unordered_map<int32_t, int64_t>& out) -> Result` | Get offsets for a partition's buckets   |
+
+### Lake Operations
+
+| Method                                                                      | Description                  |
+|-----------------------------------------------------------------------------|------------------------------|
+| `GetLatestLakeSnapshot(const TablePath& path, LakeSnapshot& out) -> Result` | Get the latest lake snapshot |
+
+## `Table`
+
+| Method                        | Description                              |
+|-------------------------------|------------------------------------------|
+| `NewRow() -> GenericRow`      | Create a schema-aware row for this table |
+| `NewAppend() -> TableAppend`  | Create an append builder for log tables  |
+| `NewUpsert() -> TableUpsert`  | Create an upsert builder for PK tables   |
+| `NewLookup() -> TableLookup`  | Create a lookup builder for PK tables    |
+| `NewScan() -> TableScan`      | Create a scan builder                    |
+| `GetTableInfo() -> TableInfo` | Get table metadata                       |
+| `GetTablePath() -> TablePath` | Get the table path                       |
+| `HasPrimaryKey() -> bool`     | Check if the table has a primary key     |
+
+## `TableAppend`
+
+| Method                                       | Description             |
+|----------------------------------------------|-------------------------|
+| `CreateWriter(AppendWriter& out) -> Result`  | Create an append writer |
+
+## `TableUpsert`
+
+| Method                                                                       | Description                                |
+|------------------------------------------------------------------------------|--------------------------------------------|
+| `PartialUpdateByIndex(std::vector<size_t> column_indices) -> TableUpsert&`   | Configure partial update by column indices |
+| `PartialUpdateByName(std::vector<std::string> column_names) -> TableUpsert&` | Configure partial update by column names   |
+| `CreateWriter(UpsertWriter& out) -> Result`                                  | Create an upsert writer                    |
+
+## `TableLookup`
+
+| Method                                    | Description                         |
+|-------------------------------------------|-------------------------------------|
+| `CreateLookuper(Lookuper& out) -> Result` | Create a lookuper for point lookups |
+
+## `TableScan`
+
+| Method                                                               | Description                                   |
+|----------------------------------------------------------------------|-----------------------------------------------|
+| `ProjectByIndex(std::vector<size_t> column_indices) -> TableScan&`   | Project columns by index                      |
+| `ProjectByName(std::vector<std::string> column_names) -> TableScan&` | Project columns by name                       |
+| `CreateLogScanner(LogScanner& out) -> Result`                        | Create a record-based log scanner             |
+| `CreateRecordBatchLogScanner(LogScanner& out) -> Result`             | Create an Arrow RecordBatch-based log scanner |
+
+## `AppendWriter`
+
+| Method                                                      | Description                            |
+|-------------------------------------------------------------|----------------------------------------|
+| `Append(const GenericRow& row) -> Result`                   | Append a row (fire-and-forget)         |
+| `Append(const GenericRow& row, WriteResult& out) -> Result` | Append a row with write acknowledgment |
+| `Flush() -> Result`                                         | Flush all pending writes               |
+
+## `UpsertWriter`
+
+| Method                                                      | Description                                   |
+|-------------------------------------------------------------|-----------------------------------------------|
+| `Upsert(const GenericRow& row) -> Result`                   | Upsert a row (fire-and-forget)                |
+| `Upsert(const GenericRow& row, WriteResult& out) -> Result` | Upsert a row with write acknowledgment        |
+| `Delete(const GenericRow& row) -> Result`                   | Delete a row by primary key (fire-and-forget) |
+| `Delete(const GenericRow& row, WriteResult& out) -> Result` | Delete a row with write acknowledgment        |
+| `Flush() -> Result`                                         | Flush all pending operations                  |
+
+## `WriteResult`
+
+| Method             | Description                                 |
+|--------------------|---------------------------------------------|
+| `Wait() -> Result` | Wait for server acknowledgment of the write |
+
+## `Lookuper`
+
+| Method                                                                     |  Description                |
+|----------------------------------------------------------------------------|-----------------------------|
+| `Lookup(const GenericRow& pk_row, bool& found, GenericRow& out) -> Result` | Lookup a row by primary key |
+
+## `LogScanner`
+
+| Method                                                                                               |  Description                              |
+|------------------------------------------------------------------------------------------------------|-------------------------------------------|
+| `Subscribe(int32_t bucket_id, int64_t offset) -> Result`                                             | Subscribe to a single bucket at an offset |
+| `Subscribe(const std::vector<BucketSubscription>& bucket_offsets) -> Result`                         | Subscribe to multiple buckets             |
+| `SubscribePartitionBuckets(int64_t partition_id, int32_t bucket_id, int64_t start_offset) -> Result` | Subscribe to a single partition bucket    |
+| `SubscribePartitionBuckets(const std::vector<PartitionBucketSubscription>& subscriptions) -> Result` | Subscribe to multiple partition buckets   |
+| `Unsubscribe(int32_t bucket_id) -> Result`                                                           | Unsubscribe from a non-partitioned bucket |
+| `UnsubscribePartition(int64_t partition_id, int32_t bucket_id) -> Result`                            | Unsubscribe from a partition bucket       |
+| `Poll(int64_t timeout_ms, ScanRecords& out) -> Result`                                               | Poll individual records                   |
+| `PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out) -> Result`                             | Poll Arrow RecordBatches                  |
+
+## `GenericRow`
+
+### Index-Based Getters
+
+| Method                                         |  Description                   |
+|------------------------------------------------|--------------------------------|
+| `GetBool(size_t idx) -> bool`                  | Get boolean value at index     |
+| `GetInt32(size_t idx) -> int32_t`              | Get 32-bit integer at index    |
+| `GetInt64(size_t idx) -> int64_t`              | Get 64-bit integer at index    |
+| `GetFloat32(size_t idx) -> float`              | Get 32-bit float at index      |
+| `GetFloat64(size_t idx) -> double`             | Get 64-bit float at index      |
+| `GetString(size_t idx) -> std::string`         | Get string at index            |
+| `GetBytes(size_t idx) -> std::vector<uint8_t>` | Get binary data at index       |
+| `GetDate(size_t idx) -> Date`                  | Get date at index              |
+| `GetTime(size_t idx) -> Time`                  | Get time at index              |
+| `GetTimestamp(size_t idx) -> Timestamp`        | Get timestamp at index         |
+| `DecimalToString(size_t idx) -> std::string`   | Get decimal as string at index |
+
+### Index-Based Setters
+
+| Method                                                    |  Description                   |
+|-----------------------------------------------------------|--------------------------------|
+| `SetNull(size_t idx)`                                     | Set field to null              |
+| `SetBool(size_t idx, bool value)`                         | Set boolean value              |
+| `SetInt32(size_t idx, int32_t value)`                     | Set 32-bit integer             |
+| `SetInt64(size_t idx, int64_t value)`                     | Set 64-bit integer             |
+| `SetFloat32(size_t idx, float value)`                     | Set 32-bit float               |
+| `SetFloat64(size_t idx, double value)`                    | Set 64-bit float               |
+| `SetString(size_t idx, const std::string& value)`         | Set string value               |
+| `SetBytes(size_t idx, const std::vector<uint8_t>& value)` | Set binary data                |
+| `SetDate(size_t idx, const Date& value)`                  | Set date value                 |
+| `SetTime(size_t idx, const Time& value)`                  | Set time value                 |
+| `SetTimestampNtz(size_t idx, const Timestamp& value)`     | Set timestamp without timezone |
+| `SetTimestampLtz(size_t idx, const Timestamp& value)`     | Set timestamp with timezone    |
+| `SetDecimal(size_t idx, const std::string& value)`        | Set decimal from string        |
+
+### Name-Based Setters
+
+When using `table.NewRow()`, the `Set()` method auto-routes to the correct type based on the schema:
+
+| Method                                                   |  Description                      |
+|----------------------------------------------------------|-----------------------------------|
+| `Set(const std::string& name, bool value)`               | Set boolean by column name        |
+| `Set(const std::string& name, int32_t value)`            | Set integer by column name        |
+| `Set(const std::string& name, int64_t value)`            | Set big integer by column name    |
+| `Set(const std::string& name, float value)`              | Set float by column name          |
+| `Set(const std::string& name, double value)`             | Set double by column name         |
+| `Set(const std::string& name, const std::string& value)` | Set string/decimal by column name |
+| `Set(const std::string& name, const Date& value)`        | Set date by column name           |
+| `Set(const std::string& name, const Time& value)`        | Set time by column name           |
+| `Set(const std::string& name, const Timestamp& value)`   | Set timestamp by column name      |
+
+### Row Inspection
+
+| Method                             |  Description                     |
+|------------------------------------|----------------------------------|
+| `FieldCount() -> size_t`           | Get the number of fields         |
+| `GetType(size_t idx) -> DatumType` | Get the datum type at index      |
+| `IsNull(size_t idx) -> bool`       | Check if field is null           |
+| `IsDecimal(size_t idx) -> bool`    | Check if field is a decimal type |
+
+## `ScanRecord`
+
+| Field       | Type         |  Description                  |
+|-------------|--------------|-------------------------------|
+| `bucket_id` | `int32_t`    | Bucket this record belongs to |
+| `offset`    | `int64_t`    | Record offset in the log      |
+| `timestamp` | `int64_t`    | Record timestamp              |
+| `row`       | `GenericRow` | Row data                      |
+
+## `ScanRecords`
+
+| Method                                        |  Description                               |
+|-----------------------------------------------|--------------------------------------------|
+| `Size() -> size_t`                            | Number of records                          |
+| `Empty() -> bool`                             | Check if empty                             |
+| `operator[](size_t idx) -> const ScanRecord&` | Access record by index                     |
+| `begin() / end()`                             | Iterator support for range-based for loops |
+
+## `ArrowRecordBatch`
+
+| Method                                                         | Description                          |
+|----------------------------------------------------------------|--------------------------------------|
+| `GetArrowRecordBatch() -> std::shared_ptr<arrow::RecordBatch>` | Get the underlying Arrow RecordBatch |
+| `Available() -> bool`                                          | Check if the batch is valid          |
+| `NumRows() -> int64_t`                                         | Number of rows in the batch          |
+| `GetTableId() -> int64_t`                                      | Table ID                             |
+| `GetPartitionId() -> int64_t`                                  | Partition ID                         |
+| `GetBucketId() -> int32_t`                                     | Bucket ID                            |
+| `GetBaseOffset() -> int64_t`                                   | First record offset                  |
+| `GetLastOffset() -> int64_t`                                   | Last record offset                   |
+
+## `ArrowRecordBatches`
+
+| Method                   |  Description                               |
+|--------------------------|--------------------------------------------|
+| `Size() -> size_t`       | Number of batches                          |
+| `Empty() -> bool`        | Check if empty                             |
+| `operator[](size_t idx)` | Access batch by index                      |
+| `begin() / end()`        | Iterator support for range-based for loops |
+
+## `Schema`
+
+| Method                            |  Description                |
+|-----------------------------------|-----------------------------|
+| `NewBuilder() -> Schema::Builder` | Create a new schema builder |
+
+## `Schema::Builder`
+
+| Method                                                                 |  Description            |
+|------------------------------------------------------------------------|-------------------------|
+| `AddColumn(const std::string& name, const DataType& type) -> Builder&` | Add a column            |
+| `SetPrimaryKeys(const std::vector<std::string>& keys) -> Builder&`     | Set primary key columns |
+| `Build() -> Schema`                                                    | Build the schema        |
+
+## `TableDescriptor`
+
+| Method                                     |  Description                          |
+|--------------------------------------------|---------------------------------------|
+| `NewBuilder() -> TableDescriptor::Builder` | Create a new table descriptor builder |
+
+## `TableDescriptor::Builder`
+
+| Method                                                                      |  Description               |
+|-----------------------------------------------------------------------------|----------------------------|
+| `SetSchema(const Schema& schema) -> Builder&`                               | Set the table schema       |
+| `SetPartitionKeys(const std::vector<std::string>& keys) -> Builder&`        | Set partition key columns  |
+| `SetBucketCount(int32_t count) -> Builder&`                                 | Set the number of buckets  |
+| `SetBucketKeys(const std::vector<std::string>& keys) -> Builder&`           | Set bucket key columns     |
+| `SetProperty(const std::string& key, const std::string& value) -> Builder&` | Set a table property       |
+| `SetComment(const std::string& comment) -> Builder&`                        | Set a table comment        |
+| `Build() -> TableDescriptor`                                                | Build the table descriptor |
+
+## `DataType`
+
+### Factory Methods
+
+| Method                                        |  Description                       |
+|-----------------------------------------------|------------------------------------|
+| `DataType::Boolean()`                         | Boolean type                       |
+| `DataType::TinyInt()`                         | 8-bit signed integer               |
+| `DataType::SmallInt()`                        | 16-bit signed integer              |
+| `DataType::Int()`                             | 32-bit signed integer              |
+| `DataType::BigInt()`                          | 64-bit signed integer              |
+| `DataType::Float()`                           | 32-bit floating point              |
+| `DataType::Double()`                          | 64-bit floating point              |
+| `DataType::String()`                          | UTF-8 string                       |
+| `DataType::Bytes()`                           | Binary data                        |
+| `DataType::Date()`                            | Date (days since epoch)            |
+| `DataType::Time()`                            | Time (milliseconds since midnight) |
+| `DataType::Timestamp(int precision)`          | Timestamp without timezone         |
+| `DataType::TimestampLtz(int precision)`       | Timestamp with local time zone     |
+| `DataType::Decimal(int precision, int scale)` | Decimal with precision and scale   |
+
+### Accessors
+
+| Method               |  Description                                |
+|----------------------|---------------------------------------------|
+| `id() -> TypeId`     | Get the type ID                             |
+| `precision() -> int` | Get precision (for Decimal/Timestamp types) |
+| `scale() -> int`     | Get scale (for Decimal type)                |
+
+## `TablePath`
+
+| Method / Field                                                     |  Description          |
+|--------------------------------------------------------------------|-----------------------|
+| `TablePath(const std::string& database, const std::string& table)` | Create a table path   |
+| `database_name -> std::string`                                     | Database name         |
+| `table_name -> std::string`                                        | Table name            |
+| `ToString() -> std::string`                                        | String representation |
+
+## `TableInfo`
+
+| Field             | Type                                           |  Description                        |
+|-------------------|------------------------------------------------|-------------------------------------|
+| `table_id`        | `int64_t`                                      | Table ID                            |
+| `schema_id`       | `int32_t`                                      | Schema ID                           |
+| `table_path`      | `TablePath`                                    | Table path                          |
+| `created_time`    | `int64_t`                                      | Creation timestamp                  |
+| `modified_time`   | `int64_t`                                      | Last modification timestamp         |
+| `primary_keys`    | `std::vector<std::string>`                     | Primary key columns                 |
+| `bucket_keys`     | `std::vector<std::string>`                     | Bucket key columns                  |
+| `partition_keys`  | `std::vector<std::string>`                     | Partition key columns               |
+| `num_buckets`     | `int32_t`                                      | Number of buckets                   |
+| `has_primary_key` | `bool`                                         | Whether the table has a primary key |
+| `is_partitioned`  | `bool`                                         | Whether the table is partitioned    |
+| `properties`      | `std::unordered_map<std::string, std::string>` | Table properties                    |
+| `comment`         | `std::string`                                  | Table comment                       |
+| `schema`          | `Schema`                                       | Table schema                        |
+
+## Temporal Types
+
+### `Date`
+
+| Method                                        |  Description                 |
+|-----------------------------------------------|------------------------------|
+| `Date::FromDays(int32_t days)`                | Create from days since epoch |
+| `Date::FromYMD(int year, int month, int day)` | Create from year, month, day |
+| `Year() -> int`                               | Get year                     |
+| `Month() -> int`                              | Get month                    |
+| `Day() -> int`                                | Get day                      |
+
+### `Time`
+
+| Method                                            |  Description                                 |
+|---------------------------------------------------|----------------------------------------------|
+| `Time::FromMillis(int32_t millis)`                | Create from milliseconds since midnight      |
+| `Time::FromHMS(int hour, int minute, int second)` | Create from hour, minute, second             |
+| `Hour() -> int`                                   | Get hour                                     |
+| `Minute() -> int`                                 | Get minute                                   |
+| `Second() -> int`                                 | Get second                                   |
+| `Millis() -> int64_t`                             | Get sub-second millisecond component (0-999) |
+
+### `Timestamp`
+
+| Method                                                               |  Description                             |
+|----------------------------------------------------------------------|------------------------------------------|
+| `Timestamp::FromMillis(int64_t millis)`                              | Create from milliseconds since epoch     |
+| `Timestamp::FromMillisNanos(int64_t millis, int32_t nanos)`          | Create from milliseconds and nanoseconds |
+| `Timestamp::FromTimePoint(std::chrono::system_clock::time_point tp)` | Create from a time point                 |
+
+## `PartitionInfo`
+
+| Field            | Type          |  Description   |
+|------------------|---------------|----------------|
+| `partition_id`   | `int64_t`     | Partition ID   |
+| `partition_name` | `std::string` | Partition name |
+
+## `DatabaseDescriptor`
+
+| Field        | Type                                           | Description       |
+|--------------|------------------------------------------------|-------------------|
+| `comment`    | `std::string`                                  | Database comment  |
+| `properties` | `std::unordered_map<std::string, std::string>` | Custom properties |
+
+## `DatabaseInfo`
+
+| Field           | Type                                           |  Description                |
+|-----------------|------------------------------------------------|-----------------------------|
+| `database_name` | `std::string`                                  | Database name               |
+| `comment`       | `std::string`                                  | Database comment            |
+| `properties`    | `std::unordered_map<std::string, std::string>` | Custom properties           |
+| `created_time`  | `int64_t`                                      | Creation timestamp          |
+| `modified_time` | `int64_t`                                      | Last modification timestamp |
+
+## `LakeSnapshot`
+
+| Field            | Type                        |  Description       |
+|------------------|-----------------------------|--------------------|
+| `snapshot_id`    | `int64_t`                   | Snapshot ID        |
+| `bucket_offsets` | `std::vector<BucketOffset>` | All bucket offsets |
+
+## `BucketOffset`
+
+| Field          | Type      | Description  |
+|----------------|-----------|--------------|
+| `table_id`     | `int64_t` | Table ID     |
+| `partition_id` | `int64_t` | Partition ID |
+| `bucket_id`    | `int32_t` | Bucket ID    |
+| `offset`       | `int64_t` | Offset value |
+
+## `OffsetQuery`
+
+| Method                                             | Description                             |
+|----------------------------------------------------|-----------------------------------------|
+| `OffsetQuery::Earliest()`                          | Query for the earliest available offset |
+| `OffsetQuery::Latest()`                            | Query for the latest offset             |
+| `OffsetQuery::FromTimestamp(int64_t timestamp_ms)` | Query offset at a specific timestamp    |
+
+## Constants
+
+| Constant                 |  Value |  Description                                            |
+|--------------------------|--------|---------------------------------------------------------|
+| `fluss::EARLIEST_OFFSET` | `-2`   | Start reading from the earliest available offset        |
+
+To start reading from the latest offset (only new records), resolve the current offset via `ListOffsets` before subscribing:
+
+```cpp
+std::unordered_map<int32_t, int64_t> offsets;
+admin.ListOffsets(table_path, {0}, fluss::OffsetQuery::Latest(), offsets);
+scanner.Subscribe(0, offsets[0]);
+```
+
+## Enums
+
+### `TypeId`
+
+| Value          |  Description               |
+|----------------|----------------------------|
+| `Boolean`      | Boolean type               |
+| `TinyInt`      | 8-bit signed integer       |
+| `SmallInt`     | 16-bit signed integer      |
+| `Int`          | 32-bit signed integer      |
+| `BigInt`       | 64-bit signed integer      |
+| `Float`        | 32-bit floating point      |
+| `Double`       | 64-bit floating point      |
+| `String`       | UTF-8 string               |
+| `Bytes`        | Binary data                |
+| `Date`         | Date                       |
+| `Time`         | Time                       |
+| `Timestamp`    | Timestamp without timezone |
+| `TimestampLtz` | Timestamp with local time zone |
+| `Decimal`      | Decimal                    |
+
+### `DatumType`
+
+| Value           | C++ Type               |  Description                    |
+|-----------------|------------------------|---------------------------------|
+| `Null`          | --                     | Null value                      |
+| `Bool`          | `bool`                 | Boolean                         |
+| `Int32`         | `int32_t`              | 32-bit integer                  |
+| `Int64`         | `int64_t`              | 64-bit integer                  |
+| `Float32`       | `float`                | 32-bit float                    |
+| `Float64`       | `double`               | 64-bit float                    |
+| `String`        | `std::string`          | String                          |
+| `Bytes`         | `std::vector<uint8_t>` | Binary data                     |
+| `DecimalI64`    | `int64_t`              | Decimal (64-bit internal)       |
+| `DecimalI128`   | `__int128`             | Decimal (128-bit internal)      |
+| `DecimalString` | `std::string`          | Decimal (string representation) |
+| `Date`          | `Date`                 | Date                            |
+| `Time`          | `Time`                 | Time                            |
+| `TimestampNtz`  | `Timestamp`            | Timestamp without timezone      |
+| `TimestampLtz`  | `Timestamp`            | Timestamp with local time zone  |
+
+### `OffsetSpec`
+
+| Value       |  Description                   |
+|-------------|--------------------------------|
+| `Earliest`  | Earliest available offset      |
+| `Latest`    | Latest offset                  |
+| `Timestamp` | Offset at a specific timestamp |
diff --git a/fluss-rust/website/docs/user-guide/cpp/data-types.md b/fluss-rust/website/docs/user-guide/cpp/data-types.md
new file mode 100644
index 0000000000..11712fac55
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/data-types.md
@@ -0,0 +1,110 @@
+---
+sidebar_position: 3
+---
+# Data Types
+
+## Schema DataTypes
+
+| DataType                   | Description                                                    |
+|----------------------------|----------------------------------------------------------------|
+| `DataType::Boolean()`      | Boolean value                                                  |
+| `DataType::TinyInt()`      | 8-bit signed integer                                           |
+| `DataType::SmallInt()`     | 16-bit signed integer                                          |
+| `DataType::Int()`          | 32-bit signed integer                                          |
+| `DataType::BigInt()`       | 64-bit signed integer                                          |
+| `DataType::Float()`        | 32-bit floating point                                          |
+| `DataType::Double()`       | 64-bit floating point                                          |
+| `DataType::String()`       | UTF-8 string                                                   |
+| `DataType::Bytes()`        | Binary data                                                    |
+| `DataType::Date()`         | Date (days since epoch)                                        |
+| `DataType::Time()`         | Time (milliseconds since midnight)                             |
+| `DataType::Timestamp()`    | Timestamp without timezone (default precision 6, microseconds) |
+| `DataType::TimestampLtz()` | Timestamp with local time zone (default precision 6, microseconds) |
+| `DataType::Decimal(p, s)`  | Decimal with precision and scale                               |
+
+## GenericRow Setters
+
+```cpp
+fluss::GenericRow row;
+row.SetNull(0);
+row.SetBool(1, true);
+row.SetInt32(2, 42);
+row.SetInt64(3, 1234567890L);
+row.SetFloat32(4, 3.14f);
+row.SetFloat64(5, 2.71828);
+row.SetString(6, "hello");
+row.SetBytes(7, {0x01, 0x02, 0x03});
+```
+
+## Name-Based Setters
+
+When using `table.NewRow()`, you can set fields by column name. The setter automatically routes to the correct type based on the schema:
+
+```cpp
+auto row = table.NewRow();
+row.Set("user_id", 1);
+row.Set("name", "Alice");
+row.Set("score", 95.5f);
+row.Set("balance", "1234.56");   // decimal as string
+row.Set("birth_date", fluss::Date::FromYMD(1990, 3, 15));
+row.Set("login_time", fluss::Time::FromHMS(9, 30, 0));
+row.Set("created_at", fluss::Timestamp::FromMillis(1700000000000));
+row.Set("nickname", nullptr);    // set to null
+```
+
+## GenericRow Getters
+
+```cpp
+std::string name = result_row.GetString(1);
+float score = result_row.GetFloat32(3);
+std::string balance = result_row.DecimalToString(4);
+fluss::Date date = result_row.GetDate(5);
+fluss::Time time = result_row.GetTime(6);
+fluss::Timestamp ts = result_row.GetTimestamp(7);
+```
+
+## DatumType Enum
+
+| DatumType       | C++ Type               | Getter                 |
+|-----------------|------------------------|------------------------|
+| `Null`          | --                     | `IsNull(idx)`          |
+| `Bool`          | `bool`                 | `GetBool(idx)`         |
+| `Int32`         | `int32_t`              | `GetInt32(idx)`        |
+| `Int64`         | `int64_t`              | `GetInt64(idx)`        |
+| `Float32`       | `float`                | `GetFloat32(idx)`      |
+| `Float64`       | `double`               | `GetFloat64(idx)`      |
+| `String`        | `std::string`          | `GetString(idx)`       |
+| `Bytes`         | `std::vector<uint8_t>` | `GetBytes(idx)`        |
+| `Date`          | `Date`                 | `GetDate(idx)`         |
+| `Time`          | `Time`                 | `GetTime(idx)`         |
+| `TimestampNtz`  | `Timestamp`            | `GetTimestamp(idx)`    |
+| `TimestampLtz`  | `Timestamp`            | `GetTimestamp(idx)`    |
+| `DecimalString` | `std::string`          | `DecimalToString(idx)` |
+
+## Type Checking
+
+```cpp
+if (rec.row.GetType(0) == fluss::DatumType::Int32) {
+    int32_t value = rec.row.GetInt32(0);
+}
+if (rec.row.IsNull(1)) {
+    // field is null
+}
+if (rec.row.IsDecimal(2)) {
+    std::string decimal_str = rec.row.DecimalToString(2);
+}
+```
+
+## Constants
+
+```cpp
+constexpr int64_t fluss::EARLIEST_OFFSET = -2;  // Start from earliest
+```
+
+To start reading from the latest offset, resolve the current offset via `ListOffsets` before subscribing:
+
+```cpp
+std::unordered_map<int32_t, int64_t> offsets;
+admin.ListOffsets(table_path, {0}, fluss::OffsetQuery::Latest(), offsets);
+scanner.Subscribe(0, offsets[0]);
+```
diff --git a/fluss-rust/website/docs/user-guide/cpp/error-handling.md b/fluss-rust/website/docs/user-guide/cpp/error-handling.md
new file mode 100644
index 0000000000..76b03e3e97
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/error-handling.md
@@ -0,0 +1,170 @@
+---
+sidebar_position: 4
+---
+# Error Handling
+
+C++ client operations that can fail return a `fluss::Result` struct instead of throwing exceptions. This gives you explicit control over error handling.
+
+## The `Result` Struct
+
+```cpp
+#include "fluss.hpp"
+
+// All operations return fluss::Result
+fluss::Result result = admin.CreateTable(path, descriptor);
+if (!result.Ok()) {
+    std::cerr << "Error code: " << result.error_code << std::endl;
+    std::cerr << "Error message: " << result.error_message << std::endl;
+}
+```
+
+| Field / Method   | Type          | Description                               |
+|------------------|---------------|-------------------------------------------|
+| `error_code`     | `int32_t`     | 0 for success, non-zero for errors        |
+| `error_message`  | `std::string` | Human-readable error description          |
+| `Ok()`           | `bool`        | Returns `true` if the operation succeeded |
+
+## Handling Errors
+
+Check the `Result` after each operation and decide how to respond, e.g. log and continue, retry, or abort:
+
+```cpp
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
+if (!result.Ok()) {
+    // Log, retry, or propagate the error as appropriate
+    std::cerr << "Connection failed (code " << result.error_code
+              << "): " << result.error_message << std::endl;
+    return 1;
+}
+```
+
+## Connection State Checking
+
+Use `Available()` to verify that a connection or object is valid before using it:
+
+```cpp
+fluss::Connection conn;
+if (!conn.Available()) {
+    // Connection not initialized or already moved
+}
+
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+fluss::Result result = fluss::Connection::Create(config, conn);
+if (result.Ok() && conn.Available()) {
+    // Connection is ready to use
+}
+```
+
+## Error Codes
+
+Server-side errors carry a specific error code: a positive value, or -1 (`ErrorCode::UNKNOWN_SERVER_ERROR`) for unexpected server errors. Client-side errors (connection failures, type mismatches, etc.) use `ErrorCode::CLIENT_ERROR` (-2). Use `fluss::ErrorCode` to match on specific codes:
+
+```cpp
+fluss::Result result = admin.DropTable(table_path);
+if (!result.Ok()) {
+    if (result.error_code == fluss::ErrorCode::TABLE_NOT_EXIST) {
+        std::cerr << "Table does not exist" << std::endl;
+    } else if (result.error_code == fluss::ErrorCode::PARTITION_NOT_EXISTS) {
+        std::cerr << "Partition does not exist" << std::endl;
+    } else if (result.error_code == fluss::ErrorCode::CLIENT_ERROR) {
+        std::cerr << "Client-side error: " << result.error_message << std::endl;
+    } else {
+        std::cerr << "Server error (code " << result.error_code
+                  << "): " << result.error_message << std::endl;
+    }
+}
+```
+
+### Common Error Codes
+
+| Constant                                      | Code | Description                         |
+|-----------------------------------------------|------|-------------------------------------|
+| `ErrorCode::CLIENT_ERROR`                     | -2   | Client-side error (not from server) |
+| `ErrorCode::UNKNOWN_SERVER_ERROR`             | -1   | Unexpected server error             |
+| `ErrorCode::NETWORK_EXCEPTION`                | 1    | Server disconnected before response |
+| `ErrorCode::DATABASE_NOT_EXIST`               | 4    | Database does not exist             |
+| `ErrorCode::DATABASE_ALREADY_EXIST`           | 6    | Database already exists             |
+| `ErrorCode::TABLE_NOT_EXIST`                  | 7    | Table does not exist                |
+| `ErrorCode::TABLE_ALREADY_EXIST`              | 8    | Table already exists                |
+| `ErrorCode::INVALID_TABLE_EXCEPTION`          | 15   | Invalid table operation             |
+| `ErrorCode::REQUEST_TIME_OUT`                 | 25   | Request timed out                   |
+| `ErrorCode::PARTITION_NOT_EXISTS`             | 36   | Partition does not exist            |
+| `ErrorCode::PARTITION_ALREADY_EXISTS`         | 42   | Partition already exists            |
+| `ErrorCode::PARTITION_SPEC_INVALID_EXCEPTION` | 43   | Invalid partition spec              |
+| `ErrorCode::LEADER_NOT_AVAILABLE_EXCEPTION`   | 44   | No leader available for partition   |
+
+See `fluss::ErrorCode` in `fluss.hpp` for the full list of named constants.
+
+## Common Error Scenarios
+
+### Connection Refused
+
+The cluster is not running or the address is incorrect:
+
+```cpp
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
+if (!result.Ok()) {
+    // "Connection refused" or timeout error
+    std::cerr << "Cannot connect to cluster: " << result.error_message << std::endl;
+}
+```
+
+### Table Not Found
+
+Attempting to access a table that does not exist:
+
+```cpp
+fluss::Table table;
+fluss::Result result = conn.GetTable(fluss::TablePath("fluss", "nonexistent"), table);
+if (!result.Ok()) {
+    if (result.error_code == fluss::ErrorCode::TABLE_NOT_EXIST) {
+        std::cerr << "Table not found" << std::endl;
+    }
+}
+```
+
+### Partition Not Found
+
+Writing to a partitioned primary key table before creating partitions:
+
+```cpp
+// This will fail if partitions are not created first
+auto row = table.NewRow();
+row.Set("user_id", 1);
+row.Set("region", "US");
+row.Set("score", static_cast<int64_t>(100));
+fluss::WriteResult wr;
+fluss::Result result = writer.Upsert(row, wr);
+if (!result.Ok()) {
+    if (result.error_code == fluss::ErrorCode::PARTITION_NOT_EXISTS) {
+        std::cerr << "Partition not found, create partitions before writing" << std::endl;
+    }
+}
+```
+
+### Schema Mismatch
+
+Using incorrect types or column indices when writing:
+
+```cpp
+fluss::GenericRow row;
+// Setting wrong type for a column will result in an error
+// when the row is sent to the server
+row.SetString(0, "not_an_integer");  // Column 0 expects Int
+fluss::Result result = writer.Append(row);
+if (!result.Ok()) {
+    std::cerr << "Schema mismatch: " << result.error_message << std::endl;
+}
+```
+
+## Best Practices
+
+1. **Always check `Result`**: Never ignore the return value of operations that return `Result`.
+2. **Handle errors gracefully**: Log errors and retry or fail gracefully rather than crashing.
+3. **Verify connection state**: Use `Available()` to check connection validity before operations.
+4. **Create partitions before writing**: For partitioned primary key tables, always create partitions before attempting upserts.
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/_category_.json b/fluss-rust/website/docs/user-guide/cpp/example/_category_.json
new file mode 100644
index 0000000000..dd2229499b
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/example/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Example",
+  "position": 5
+}
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md b/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md
new file mode 100644
index 0000000000..1a33012616
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md
@@ -0,0 +1,154 @@
+---
+sidebar_position: 3
+---
+# Admin Operations
+
+## Get Admin Interface
+
+```cpp
+fluss::Admin admin;
+conn.GetAdmin(admin);
+```
+
+## Database Operations
+
+```cpp
+// Create database
+fluss::DatabaseDescriptor db_descriptor;
+db_descriptor.comment = "My database";
+admin.CreateDatabase("my_database", db_descriptor, true);
+
+// List all databases
+std::vector<std::string> databases;
+admin.ListDatabases(databases);
+for (const auto& db : databases) {
+    std::cout << "Database: " << db << std::endl;
+}
+
+// Check if database exists
+bool exists = false;
+admin.DatabaseExists("my_database", exists);
+
+// Get database information
+fluss::DatabaseInfo db_info;
+admin.GetDatabaseInfo("my_database", db_info);
+std::cout << "Database: " << db_info.database_name << std::endl;
+
+// Drop database
+admin.DropDatabase("my_database", true, false);
+```
+
+## Table Operations
+
+```cpp
+fluss::TablePath table_path("fluss", "my_table");
+
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("id", fluss::DataType::Int())
+    .AddColumn("name", fluss::DataType::String())
+    .AddColumn("score", fluss::DataType::Float())
+    .AddColumn("age", fluss::DataType::Int())
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetBucketCount(3)
+    .SetComment("Example table")
+    .Build();
+
+// Create table
+admin.CreateTable(table_path, descriptor, true);
+
+// Get table information
+fluss::TableInfo table_info;
+admin.GetTableInfo(table_path, table_info);
+std::cout << "Table ID: " << table_info.table_id << std::endl;
+std::cout << "Number of buckets: " << table_info.num_buckets << std::endl;
+std::cout << "Has primary key: " << table_info.has_primary_key << std::endl;
+std::cout << "Is partitioned: " << table_info.is_partitioned << std::endl;
+
+// Drop table
+admin.DropTable(table_path, true);
+```
+
+## Schema Builder Options
+
+```cpp
+// Schema with primary key
+auto pk_schema = fluss::Schema::NewBuilder()
+    .AddColumn("id", fluss::DataType::Int())
+    .AddColumn("name", fluss::DataType::String())
+    .AddColumn("value", fluss::DataType::Double())
+    .SetPrimaryKeys({"id"})
+    .Build();
+
+// Table descriptor with partitioning (assumes schema defines the "date" and "user_id" columns)
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetPartitionKeys({"date"})
+    .SetBucketCount(3)
+    .SetBucketKeys({"user_id"})
+    .SetProperty("retention_days", "7")
+    .SetComment("Sample table")
+    .Build();
+```
+
+## Partition Operations
+
+```cpp
+// Create a partition
+std::unordered_map<std::string, std::string> partition_spec = {{"region", "US"}};
+admin.CreatePartition(table_path, partition_spec, true);
+
+// List all partitions
+std::vector<fluss::PartitionInfo> partitions;
+admin.ListPartitionInfos(table_path, partitions);
+for (const auto& p : partitions) {
+    std::cout << "Partition: id=" << p.partition_id
+              << ", name=" << p.partition_name << std::endl;
+}
+
+// Drop a partition
+admin.DropPartition(table_path, partition_spec, true);
+```
+
+## Offset Operations
+
+```cpp
+std::vector<int32_t> bucket_ids = {0, 1, 2};
+
+// Query earliest offsets
+std::unordered_map<int32_t, int64_t> earliest_offsets;
+admin.ListOffsets(table_path, bucket_ids,
+                  fluss::OffsetQuery::Earliest(), earliest_offsets);
+
+// Query latest offsets
+std::unordered_map<int32_t, int64_t> latest_offsets;
+admin.ListOffsets(table_path, bucket_ids,
+                  fluss::OffsetQuery::Latest(), latest_offsets);
+
+// Query offsets for a specific timestamp (timestamp_ms is an int64_t in milliseconds)
+std::unordered_map<int32_t, int64_t> timestamp_offsets;
+admin.ListOffsets(table_path, bucket_ids,
+                  fluss::OffsetQuery::FromTimestamp(timestamp_ms),
+                  timestamp_offsets);
+
+// Query partition offsets
+std::unordered_map<int32_t, int64_t> partition_offsets;
+admin.ListPartitionOffsets(table_path, "partition_name",
+                           bucket_ids, fluss::OffsetQuery::Latest(),
+                           partition_offsets);
+```
+
+## Lake Snapshot
+
+```cpp
+fluss::LakeSnapshot snapshot;
+admin.GetLatestLakeSnapshot(table_path, snapshot);
+std::cout << "Snapshot ID: " << snapshot.snapshot_id << std::endl;
+for (const auto& bucket_offset : snapshot.bucket_offsets) {
+    std::cout << "  Table " << bucket_offset.table_id
+              << ", Bucket " << bucket_offset.bucket_id
+              << ": offset=" << bucket_offset.offset << std::endl;
+}
+```
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
new file mode 100644
index 0000000000..518a5845ff
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
@@ -0,0 +1,35 @@
+---
+sidebar_position: 2
+---
+# Configuration
+
+## Connection Setup
+
+```cpp
+#include "fluss.hpp"
+
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
+
+if (!result.Ok()) {
+    std::cerr << "Connection failed: " << result.error_message << std::endl;
+}
+```
+
+## Connection Configurations
+
+All fields have sensible defaults. Only `bootstrap_servers` typically needs to be set.
+
+```cpp
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";    // Coordinator address
+config.writer_request_max_size = 10 * 1024 * 1024;     // Max request size (10 MB)
+config.writer_acks = "all";                      // Wait for all replicas
+config.writer_retries = std::numeric_limits<int32_t>::max();  // Retry on failure
+config.writer_batch_size = 2 * 1024 * 1024;     // Batch size (2 MB)
+config.scanner_remote_log_prefetch_num = 4;      // Remote log prefetch count
+config.remote_file_download_thread_num = 3;  // Download threads
+```
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/index.md b/fluss-rust/website/docs/user-guide/cpp/example/index.md
new file mode 100644
index 0000000000..51f60e4175
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/example/index.md
@@ -0,0 +1,63 @@
+---
+sidebar_position: 1
+---
+# Example
+
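+Minimal working example: connect to Fluss, create a table, write data, and read it back. Error handling is omitted for brevity; in real code, check the returned `fluss::Result` as shown in [Configuration](./configuration.md).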
+
+```cpp
+#include <iostream>
+#include "fluss.hpp"
+
+int main() {
+    // Connect
+    fluss::Configuration config;
+    config.bootstrap_servers = "127.0.0.1:9123";
+
+    fluss::Connection conn;
+    fluss::Connection::Create(config, conn);
+
+    fluss::Admin admin;
+    conn.GetAdmin(admin);
+
+    // Create a log table
+    fluss::TablePath table_path("fluss", "quickstart_cpp");
+    auto schema = fluss::Schema::NewBuilder()
+        .AddColumn("id", fluss::DataType::Int())
+        .AddColumn("name", fluss::DataType::String())
+        .Build();
+    auto descriptor = fluss::TableDescriptor::NewBuilder()
+        .SetSchema(schema)
+        .Build();
+    admin.CreateTable(table_path, descriptor, true);
+
+    // Write
+    fluss::Table table;
+    conn.GetTable(table_path, table);
+
+    fluss::AppendWriter writer;
+    table.NewAppend().CreateWriter(writer);
+
+    fluss::GenericRow row;
+    row.SetInt32(0, 1);
+    row.SetString(1, "hello");
+    writer.Append(row);
+    writer.Flush();
+
+    // Read
+    fluss::LogScanner scanner;
+    table.NewScan().CreateLogScanner(scanner);
+    auto info = table.GetTableInfo();
+    for (int b = 0; b < info.num_buckets; ++b) {
+        scanner.Subscribe(b, 0);
+    }
+    fluss::ScanRecords records;
+    scanner.Poll(5000, records);
+    for (const auto& rec : records) {
+        std::cout << "id=" << rec.row.GetInt32(0)
+                  << ", name=" << rec.row.GetString(1) << std::endl;
+    }
+
+    return 0;
+}
+```
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md b/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md
new file mode 100644
index 0000000000..c94bb84572
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md
@@ -0,0 +1,121 @@
+---
+sidebar_position: 4
+---
+# Log Tables
+
+Log tables are append-only tables without primary keys, suitable for event streaming.
+
+## Creating a Log Table
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("event_id", fluss::DataType::Int())
+    .AddColumn("event_type", fluss::DataType::String())
+    .AddColumn("timestamp", fluss::DataType::BigInt())
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .Build();
+
+fluss::TablePath table_path("fluss", "events");
+admin.CreateTable(table_path, descriptor, true);
+```
+
+## Writing to Log Tables
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+fluss::AppendWriter writer;
+table.NewAppend().CreateWriter(writer);
+
+fluss::GenericRow row;
+row.SetInt32(0, 1);           // event_id
+row.SetString(1, "user_login");  // event_type
+row.SetInt64(2, 1704067200000L); // timestamp
+writer.Append(row);
+
+writer.Flush();
+```
+
+## Reading from Log Tables
+
+```cpp
+fluss::LogScanner scanner;
+table.NewScan().CreateLogScanner(scanner);
+
+auto info = table.GetTableInfo();
+for (int b = 0; b < info.num_buckets; ++b) {
+    scanner.Subscribe(b, 0);
+}
+
+fluss::ScanRecords records;
+scanner.Poll(5000, records);  // timeout in ms
+
+for (const auto& rec : records) {
+    std::cout << "event_id=" << rec.row.GetInt32(0)
+              << " event_type=" << rec.row.GetString(1)
+              << " timestamp=" << rec.row.GetInt64(2)
+              << " @ offset=" << rec.offset << std::endl;
+}
+```
+
+**Batch subscribe:**
+
+```cpp
+std::vector<fluss::BucketSubscription> subscriptions;
+subscriptions.push_back({0, 0});    // bucket 0, offset 0
+subscriptions.push_back({1, 100});  // bucket 1, offset 100
+scanner.Subscribe(subscriptions);
+```
+
+**Unsubscribe from a bucket:**
+
+```cpp
+// Stop receiving records from bucket 1
+scanner.Unsubscribe(1);
+```
+
+**Arrow RecordBatch polling (high performance):**
+
+```cpp
+#include <arrow/record_batch.h>
+
+fluss::LogScanner arrow_scanner;
+table.NewScan().CreateRecordBatchLogScanner(arrow_scanner);
+
+for (int b = 0; b < info.num_buckets; ++b) {
+    arrow_scanner.Subscribe(b, 0);
+}
+
+fluss::ArrowRecordBatches batches;
+arrow_scanner.PollRecordBatch(5000, batches);
+
+for (size_t i = 0; i < batches.Size(); ++i) {
+    const auto& batch = batches[i];
+    if (batch->Available()) {
+        auto arrow_batch = batch->GetArrowRecordBatch();
+        std::cout << "Batch " << i << ": " << arrow_batch->num_rows() << " rows"
+                  << ", partition_id=" << batch->GetPartitionId()
+                  << ", bucket_id=" << batch->GetBucketId() << std::endl;
+    }
+}
+```
+
+## Column Projection
+
+```cpp
+// Project by column index
+fluss::LogScanner projected_scanner;
+table.NewScan().ProjectByIndex({0, 2}).CreateLogScanner(projected_scanner);
+
+// Project by column name
+fluss::LogScanner name_projected_scanner;
+table.NewScan().ProjectByName({"event_id", "timestamp"}).CreateLogScanner(name_projected_scanner);
+
+// Arrow RecordBatch with projection
+fluss::LogScanner projected_arrow_scanner;
+table.NewScan().ProjectByIndex({0, 2}).CreateRecordBatchLogScanner(projected_arrow_scanner);
+```
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md b/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md
new file mode 100644
index 0000000000..6a6927f561
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md
@@ -0,0 +1,180 @@
+---
+sidebar_position: 6
+---
+# Partitioned Tables
+
+Partitioned tables distribute data across partitions based on partition column values, enabling efficient data organization and querying. Both log tables and primary key tables support partitioning.
+
+## Partitioned Log Tables
+
+### Creating a Partitioned Log Table
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("event_id", fluss::DataType::Int())
+    .AddColumn("event_type", fluss::DataType::String())
+    .AddColumn("dt", fluss::DataType::String())
+    .AddColumn("region", fluss::DataType::String())
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetPartitionKeys({"dt", "region"})
+    .SetBucketCount(3)
+    .Build();
+
+fluss::TablePath table_path("fluss", "partitioned_events");
+admin.CreateTable(table_path, descriptor, true);
+```
+
+### Writing to Partitioned Log Tables
+
+**Partitions must exist before writing data; otherwise, the client will by default retry indefinitely.** Include the partition column values in each row; the client routes records to the correct partition automatically.
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+fluss::AppendWriter writer;
+table.NewAppend().CreateWriter(writer);
+
+fluss::GenericRow row;
+row.SetInt32(0, 1);
+row.SetString(1, "user_login");
+row.SetString(2, "2024-01-15");
+row.SetString(3, "US");
+writer.Append(row);
+writer.Flush();
+```
+
+### Reading from Partitioned Log Tables
+
+For partitioned tables, use partition-aware subscribe methods.
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+fluss::LogScanner scanner;
+table.NewScan().CreateLogScanner(scanner);
+
+// Subscribe to individual partitions (partition_infos is obtained via admin.ListPartitionInfos; see "Managing Partitions")
+for (const auto& pi : partition_infos) {
+    scanner.SubscribePartitionBuckets(pi.partition_id, 0, 0);
+}
+
+fluss::ScanRecords records;
+scanner.Poll(5000, records);
+
+for (const auto& rec : records) {
+    std::cout << "bucket_id=" << rec.bucket_id
+              << " offset=" << rec.offset << std::endl;
+}
+
+// Or batch-subscribe to all partitions at once
+fluss::LogScanner batch_scanner;
+table.NewScan().CreateLogScanner(batch_scanner);
+
+std::vector<fluss::PartitionBucketSubscription> subs;
+for (const auto& pi : partition_infos) {
+    subs.push_back({pi.partition_id, 0, 0});
+}
+batch_scanner.SubscribePartitionBuckets(subs);
+```
+
+**Unsubscribe from a partition bucket:**
+
+```cpp
+// Stop receiving records from a specific partition bucket
+scanner.UnsubscribePartition(partition_infos[0].partition_id, 0);
+```
+
+### Managing Partitions
+
+```cpp
+// Create a partition
+admin.CreatePartition(table_path, {{"dt", "2024-01-15"}, {"region", "US"}}, true);
+
+// List partitions
+std::vector<fluss::PartitionInfo> partition_infos;
+admin.ListPartitionInfos(table_path, partition_infos);
+
+// Query partition offsets
+std::vector<int32_t> bucket_ids = {0, 1, 2};
+std::unordered_map<int32_t, int64_t> offsets;
+admin.ListPartitionOffsets(table_path, "2024-01-15$US",
+                           bucket_ids, fluss::OffsetQuery::Latest(), offsets);
+```
+
+## Partitioned Primary Key Tables
+
+Partitioned KV tables combine partitioning with primary key operations. Partition columns must be part of the primary key.
+
+### Creating a Partitioned Primary Key Table
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("user_id", fluss::DataType::Int())
+    .AddColumn("region", fluss::DataType::String())
+    .AddColumn("zone", fluss::DataType::BigInt())
+    .AddColumn("score", fluss::DataType::BigInt())
+    .SetPrimaryKeys({"user_id", "region", "zone"})
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetPartitionKeys({"region", "zone"})
+    .SetBucketCount(3)
+    .Build();
+
+fluss::TablePath table_path("fluss", "partitioned_users");
+admin.CreateTable(table_path, descriptor, true);
+```
+
+### Writing to Partitioned Primary Key Tables
+
+**Partitions must exist before upserting data, otherwise the client will by default retry indefinitely.**
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+// Create partitions first
+admin.CreatePartition(table_path, {{"region", "APAC"}, {"zone", "1"}}, true);
+admin.CreatePartition(table_path, {{"region", "EMEA"}, {"zone", "2"}}, true);
+admin.CreatePartition(table_path, {{"region", "US"}, {"zone", "3"}}, true);
+
+fluss::UpsertWriter writer;
+table.NewUpsert().CreateWriter(writer);
+
+auto row = table.NewRow();
+row.Set("user_id", 1001);
+row.Set("region", "APAC");
+row.Set("zone", static_cast<int64_t>(1));
+row.Set("score", static_cast<int64_t>(1234));
+writer.Upsert(row);
+writer.Flush();
+```
+
+### Looking Up Records in Partitioned Tables
+
+Lookup requires all primary key columns including partition columns.
+
+> **Note:** Scanning partitioned primary key tables is not supported. Use lookup operations instead.
+
+```cpp
+fluss::Lookuper lookuper;
+table.NewLookup().CreateLookuper(lookuper);
+
+auto pk = table.NewRow();
+pk.Set("user_id", 1001);
+pk.Set("region", "APAC");
+pk.Set("zone", static_cast<int64_t>(1));
+
+bool found = false;
+fluss::GenericRow result;
+lookuper.Lookup(pk, found, result);
+if (found) {
+    std::cout << "score=" << result.GetInt64(3) << std::endl;
+}
+```
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/primary-key-tables.md b/fluss-rust/website/docs/user-guide/cpp/example/primary-key-tables.md
new file mode 100644
index 0000000000..7aa87e31a7
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/example/primary-key-tables.md
@@ -0,0 +1,133 @@
+---
+sidebar_position: 5
+---
+# Primary Key Tables
+
+Primary key tables (KV tables) support upsert, delete, and lookup operations.
+
+## Creating a Primary Key Table
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("id", fluss::DataType::Int())
+    .AddColumn("name", fluss::DataType::String())
+    .AddColumn("age", fluss::DataType::BigInt())
+    .SetPrimaryKeys({"id"})
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetBucketCount(3)
+    .Build();
+
+fluss::TablePath table_path("fluss", "users");
+admin.CreateTable(table_path, descriptor, true);
+```
+
+## Upserting Records
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+fluss::UpsertWriter upsert_writer;
+table.NewUpsert().CreateWriter(upsert_writer);
+
+// Fire-and-forget upserts
+{
+    auto row = table.NewRow();
+    row.Set("id", 1);
+    row.Set("name", "Alice");
+    row.Set("age", static_cast<int64_t>(25));
+    upsert_writer.Upsert(row);
+}
+{
+    auto row = table.NewRow();
+    row.Set("id", 2);
+    row.Set("name", "Bob");
+    row.Set("age", static_cast<int64_t>(30));
+    upsert_writer.Upsert(row);
+}
+upsert_writer.Flush();
+
+// Per-record acknowledgment
+{
+    auto row = table.NewRow();
+    row.Set("id", 3);
+    row.Set("name", "Charlie");
+    row.Set("age", static_cast<int64_t>(35));
+    fluss::WriteResult wr;
+    upsert_writer.Upsert(row, wr);
+    wr.Wait();
+}
+```
+
+## Updating Records
+
+Upsert with the same primary key to update an existing record.
+
+```cpp
+auto row = table.NewRow();
+row.Set("id", 1);
+row.Set("name", "Alice Updated");
+row.Set("age", static_cast<int64_t>(26));
+fluss::WriteResult wr;
+upsert_writer.Upsert(row, wr);
+wr.Wait();
+```
+
+## Deleting Records
+
+```cpp
+auto pk_row = table.NewRow();
+pk_row.Set("id", 2);
+fluss::WriteResult wr;
+upsert_writer.Delete(pk_row, wr);
+wr.Wait();
+```
+
+## Partial Updates
+
+Update only specific columns while preserving others.
+
+```cpp
+// By column names
+fluss::UpsertWriter partial_writer;
+table.NewUpsert()
+    .PartialUpdateByName({"id", "age"})
+    .CreateWriter(partial_writer);
+
+auto row = table.NewRow();
+row.Set("id", 1);
+row.Set("age", static_cast<int64_t>(27));
+fluss::WriteResult wr;
+partial_writer.Upsert(row, wr);
+wr.Wait();
+
+// By column indices
+fluss::UpsertWriter partial_writer_idx;
+table.NewUpsert()
+    .PartialUpdateByIndex({0, 2})
+    .CreateWriter(partial_writer_idx);
+```
+
+## Looking Up Records
+
+```cpp
+fluss::Lookuper lookuper;
+table.NewLookup().CreateLookuper(lookuper);
+
+auto pk_row = table.NewRow();
+pk_row.Set("id", 1);
+
+bool found = false;
+fluss::GenericRow result_row;
+lookuper.Lookup(pk_row, found, result_row);
+
+if (found) {
+    std::cout << "Found: name=" << result_row.GetString(1)
+              << ", age=" << result_row.GetInt64(2) << std::endl;
+} else {
+    std::cout << "Not found" << std::endl;
+}
+```
diff --git a/fluss-rust/website/docs/user-guide/cpp/installation.md b/fluss-rust/website/docs/user-guide/cpp/installation.md
new file mode 100644
index 0000000000..6360da4369
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/cpp/installation.md
@@ -0,0 +1,107 @@
+---
+sidebar_position: 1
+---
+# Installation
+
+The C++ bindings are not yet published as a package. You need to build from source.
+
+**Prerequisites:** CMake 3.22+, C++17 compiler, Rust 1.85+, Apache Arrow C++ library
+
+```bash
+git clone https://github.com/apache/fluss-rust.git
+cd fluss-rust
+```
+
+Install dependencies:
+
+```bash
+# macOS
+brew install cmake arrow
+
+# Ubuntu/Debian
+sudo apt-get install cmake libarrow-dev
+```
+
+If Arrow is not available via your package manager, build it from source:
+
+```bash
+git clone https://github.com/apache/arrow.git
+cd arrow/cpp
+cmake -B build -DARROW_BUILD_SHARED=ON
+cmake --build build
+sudo cmake --install build
+```
+
+Build the C++ bindings:
+
+```bash
+cd bindings/cpp
+mkdir -p build && cd build
+
+# Debug mode
+cmake ..
+
+# Or Release mode
+cmake -DCMAKE_BUILD_TYPE=Release ..
+
+# Build
+cmake --build .
+```
+
+This produces:
+- `libfluss_cpp.a` (Static library)
+- `fluss_cpp_example` (Example executable)
+- Header files in `include/`
+
+## Integrating into Your Project
+
+**Option 1: CMake FetchContent**
+
+```cmake
+include(FetchContent)
+FetchContent_Declare(
+    fluss-cpp
+    GIT_REPOSITORY https://github.com/apache/fluss-rust.git
+    SOURCE_SUBDIR bindings/cpp
+)
+FetchContent_MakeAvailable(fluss-cpp)
+
+target_link_libraries(your_target PRIVATE fluss_cpp)
+```
+
+**Option 2: Manual Integration**
+
+Copy the build artifacts and configure CMake:
+
+```cmake
+find_package(Arrow REQUIRED)
+
+add_library(fluss_cpp STATIC IMPORTED)
+set_target_properties(fluss_cpp PROPERTIES
+    IMPORTED_LOCATION ${CMAKE_SOURCE_DIR}/lib/libfluss_cpp.a
+    INTERFACE_INCLUDE_DIRECTORIES ${CMAKE_SOURCE_DIR}/include
+)
+
+target_link_libraries(your_target
+    PRIVATE
+    fluss_cpp
+    Arrow::arrow_shared
+    ${CMAKE_DL_LIBS}
+    Threads::Threads
+)
+
+# On macOS, also link these frameworks
+if(APPLE)
+    target_link_libraries(your_target PRIVATE
+        "-framework CoreFoundation"
+        "-framework Security"
+    )
+endif()
+```
+
+**Option 3: Subdirectory**
+
+```cmake
+add_subdirectory(vendor/fluss-rust/bindings/cpp)
+target_link_libraries(your_target PRIVATE fluss_cpp)
+```
diff --git a/fluss-rust/website/docs/user-guide/python/_category_.json b/fluss-rust/website/docs/user-guide/python/_category_.json
new file mode 100644
index 0000000000..a9f34b477f
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Python",
+  "position": 2
+}
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
new file mode 100644
index 0000000000..321e25e6b7
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -0,0 +1,286 @@
+---
+sidebar_position: 2
+---
+# API Reference
+
+Complete API reference for the Fluss Python client.
+
+## `Config`
+
+| Method / Property                  | Description                                               |
+|------------------------------------|-----------------------------------------------------------|
+| `Config(properties: dict = None)`  | Create config from a dict of key-value pairs              |
+| `.bootstrap_servers`               | Get/set coordinator server address                        |
+| `.writer_request_max_size`         | Get/set max request size in bytes                         |
+| `.writer_acks`                     | Get/set acknowledgment setting (`"all"` for all replicas) |
+| `.writer_retries`                  | Get/set number of retries on failure                      |
+| `.writer_batch_size`               | Get/set write batch size in bytes                         |
+| `.scanner_remote_log_prefetch_num` | Get/set number of remote log segments to prefetch         |
+| `.remote_file_download_thread_num` | Get/set number of threads for remote log downloads        |
+
+## `FlussConnection`
+
+| Method                                                    |  Description                          |
+|-----------------------------------------------------------|---------------------------------------|
+| `await FlussConnection.create(config) -> FlussConnection` | Connect to a Fluss cluster            |
+| `await conn.get_admin() -> FlussAdmin`                    | Get admin interface                   |
+| `await conn.get_table(table_path) -> FlussTable`          | Get a table for read/write operations |
+| `conn.close()`                                            | Close the connection                  |
+
+Supports the `with` statement (context manager).
+
+## `FlussAdmin`
+
+| Method                                                                                                                |  Description                          |
+|-----------------------------------------------------------------------------------------------------------------------|---------------------------------------|
+| `await create_database(name, database_descriptor=None, ignore_if_exists=False)`                                       | Create a database                     |
+| `await drop_database(name, ignore_if_not_exists=False, cascade=True)`                                                 | Drop a database                       |
+| `await list_databases() -> list[str]`                                                                                 | List all databases                    |
+| `await database_exists(name) -> bool`                                                                                 | Check if a database exists            |
+| `await get_database_info(name) -> DatabaseInfo`                                                                       | Get database metadata                 |
+| `await create_table(table_path, table_descriptor, ignore_if_exists=False)`                                            | Create a table                        |
+| `await drop_table(table_path, ignore_if_not_exists=False)`                                                            | Drop a table                          |
+| `await get_table_info(table_path) -> TableInfo`                                                                       | Get table metadata                    |
+| `await list_tables(database_name) -> list[str]`                                                                       | List tables in a database             |
+| `await table_exists(table_path) -> bool`                                                                              | Check if a table exists               |
+| `await list_offsets(table_path, bucket_ids, offset_type, timestamp=None) -> dict[int, int]`                           | Get offsets for buckets               |
+| `await list_partition_offsets(table_path, partition_name, bucket_ids, offset_type, timestamp=None) -> dict[int, int]` | Get offsets for a partition's buckets |
+| `await create_partition(table_path, partition_spec, ignore_if_exists=False)`                                          | Create a partition                    |
+| `await drop_partition(table_path, partition_spec, ignore_if_not_exists=False)`                                        | Drop a partition                      |
+| `await list_partition_infos(table_path) -> list[PartitionInfo]`                                                       | List partitions                       |
+| `await get_latest_lake_snapshot(table_path) -> LakeSnapshot`                                                          | Get latest lake snapshot              |
+
+## `FlussTable`
+
+| Method                          |  Description                            |
+|---------------------------------|-----------------------------------------|
+| `new_scan() -> TableScan`       | Create a scan builder                   |
+| `new_append() -> TableAppend`   | Create an append builder for log tables |
+| `new_upsert() -> TableUpsert`   | Create an upsert builder for PK tables  |
+| `new_lookup() -> TableLookup`   | Create a lookup builder for PK tables   |
+| `get_table_info() -> TableInfo` | Get table metadata                      |
+| `get_table_path() -> TablePath` | Get table path                          |
+| `has_primary_key() -> bool`     | Check if table has a primary key        |
+
+## `TableScan`
+
+| Method                                                   |  Description                                                        |
+|----------------------------------------------------------|---------------------------------------------------------------------|
+| `.project(indices) -> TableScan`                         | Project columns by index                                            |
+| `.project_by_name(names) -> TableScan`                   | Project columns by name                                             |
+| `await .create_log_scanner() -> LogScanner`              | Create record-based scanner (for `poll()`)                          |
+| `await .create_record_batch_log_scanner() -> LogScanner` | Create batch-based scanner (for `poll_arrow()`, `to_arrow()`, etc.) |
+
+## `TableAppend`
+
+Builder for creating an `AppendWriter`. Obtain via `FlussTable.new_append()`.
+
+| Method                             |  Description             |
+|------------------------------------|--------------------------|
+| `.create_writer() -> AppendWriter` | Create the append writer |
+
+## `TableUpsert`
+
+Builder for creating an `UpsertWriter`. Obtain via `FlussTable.new_upsert()`.
+
+| Method                                             |  Description                               |
+|----------------------------------------------------|--------------------------------------------|
+| `.partial_update_by_name(columns) -> TableUpsert`  | Configure partial update by column names   |
+| `.partial_update_by_index(indices) -> TableUpsert` | Configure partial update by column indices |
+| `.create_writer() -> UpsertWriter`                 | Create the upsert writer                   |
+
+## `TableLookup`
+
+Builder for creating a `Lookuper`. Obtain via `FlussTable.new_lookup()`.
+
+| Method                           |  Description        |
+|----------------------------------|---------------------|
+| `.create_lookuper() -> Lookuper` | Create the lookuper |
+
+## `AppendWriter`
+
+| Method                                           |  Description                        |
+|--------------------------------------------------|-------------------------------------|
+| `.append(row) -> WriteResultHandle`              | Append a row (dict, list, or tuple) |
+| `.write_arrow(table)`                            | Write a PyArrow Table               |
+| `.write_arrow_batch(batch) -> WriteResultHandle` | Write a PyArrow RecordBatch         |
+| `.write_pandas(df)`                              | Write a Pandas DataFrame            |
+| `await .flush()`                                 | Flush all pending writes            |
+
+## `UpsertWriter`
+
+| Method                              |  Description                          |
+|-------------------------------------|---------------------------------------|
+| `.upsert(row) -> WriteResultHandle` | Upsert a row (insert or update by PK) |
+| `.delete(pk) -> WriteResultHandle`  | Delete a row by primary key           |
+| `await .flush()`                    | Flush all pending operations          |
+
+## `WriteResultHandle`
+
+| Method          |  Description                                 |
+|-----------------|----------------------------------------------|
+| `await .wait()` | Wait for server acknowledgment of this write |
+
+## `Lookuper`
+
+| Method                              |  Description                |
+|-------------------------------------|-----------------------------|
+| `await .lookup(pk) -> dict \| None` | Lookup a row by primary key |
+
+## `LogScanner`
+
+| Method                                                        |  Description                                                                     |
+|---------------------------------------------------------------|----------------------------------------------------------------------------------|
+| `.subscribe(bucket_id, start_offset)`                         | Subscribe to a bucket                                                            |
+| `.subscribe_buckets(bucket_offsets)`                          | Subscribe to multiple buckets (`{bucket_id: offset}`)                            |
+| `.subscribe_partition(partition_id, bucket_id, start_offset)` | Subscribe to a partition bucket                                                  |
+| `.subscribe_partition_buckets(partition_bucket_offsets)`      | Subscribe to multiple partition+bucket combos (`{(part_id, bucket_id): offset}`) |
+| `.unsubscribe(bucket_id)`                                     | Unsubscribe from a bucket (non-partitioned tables)                               |
+| `.unsubscribe_partition(partition_id, bucket_id)`             | Unsubscribe from a partition bucket                                              |
+| `.poll(timeout_ms) -> list[ScanRecord]`                       | Poll individual records (record scanner only)                                    |
+| `.poll_arrow(timeout_ms) -> pa.Table`                         | Poll as Arrow Table (batch scanner only)                                         |
+| `.poll_record_batch(timeout_ms) -> list[RecordBatch]`         | Poll batches with metadata (batch scanner only)                                  |
+| `.to_arrow() -> pa.Table`                                     | Read all subscribed data as Arrow Table (batch scanner only)                     |
+| `.to_pandas() -> pd.DataFrame`                                | Read all subscribed data as DataFrame (batch scanner only)                       |
+
+## `ScanRecord`
+
+| Property                     |  Description                                                        |
+|------------------------------|---------------------------------------------------------------------|
+| `.bucket -> TableBucket`     | Bucket this record belongs to                                       |
+| `.offset -> int`             | Record offset in the log                                            |
+| `.timestamp -> int`          | Record timestamp                                                    |
+| `.change_type -> ChangeType` | Change type (AppendOnly, Insert, UpdateBefore, UpdateAfter, Delete) |
+| `.row -> dict`               | Row data as `{column_name: value}`                                  |
+
+## `RecordBatch`
+
+| Property                   | Description                  |
+|----------------------------|------------------------------|
+| `.batch -> pa.RecordBatch` | Arrow RecordBatch data       |
+| `.bucket -> TableBucket`   | Bucket this batch belongs to |
+| `.base_offset -> int`      | First record offset          |
+| `.last_offset -> int`      | Last record offset           |
+
+## `Schema`
+
+| Method                                         |  Description               |
+|------------------------------------------------|----------------------------|
+| `Schema(schema: pa.Schema, primary_keys=None)` | Create from PyArrow schema |
+| `.get_column_names() -> list[str]`             | Get column names           |
+| `.get_column_types() -> list[str]`             | Get column type names      |
+
+## `TableDescriptor`
+
+| Method                                                                                                                                                                         | Description             |
+|--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|-------------------------|
+| `TableDescriptor(schema, *, partition_keys=None, bucket_count=None, bucket_keys=None, comment=None, log_format=None, kv_format=None, properties=None, custom_properties=None)` | Create table descriptor |
+| `.get_schema() -> Schema`                                                                                                                                                      | Get the schema          |
+
+## `TablePath`
+
+| Method / Property            | Description         |
+|------------------------------|---------------------|
+| `TablePath(database, table)` | Create a table path |
+| `.database_name -> str`      | Database name       |
+| `.table_name -> str`         | Table name          |
+
+## `TableInfo`
+
+| Property / Method                    |  Description                |
+|--------------------------------------|-----------------------------|
+| `.table_id -> int`                   | Table ID                    |
+| `.table_path -> TablePath`           | Table path                  |
+| `.num_buckets -> int`                | Number of buckets           |
+| `.schema_id -> int`                  | Schema ID                   |
+| `.comment -> str \| None`            | Table comment               |
+| `.created_time -> int`               | Creation timestamp          |
+| `.modified_time -> int`              | Last modification timestamp |
+| `.get_primary_keys() -> list[str]`   | Primary key columns         |
+| `.get_partition_keys() -> list[str]` | Partition columns           |
+| `.get_bucket_keys() -> list[str]`    | Bucket key columns          |
+| `.has_primary_key() -> bool`         | Has primary key?            |
+| `.is_partitioned() -> bool`          | Is partitioned?             |
+| `.get_schema() -> Schema`            | Get table schema            |
+| `.get_column_names() -> list[str]`   | Column names                |
+| `.get_column_count() -> int`         | Number of columns           |
+| `.get_properties() -> dict`          | All table properties        |
+| `.get_custom_properties() -> dict`   | Custom properties only      |
+
+## `PartitionInfo`
+
+| Property                 |  Description   |
+|--------------------------|----------------|
+| `.partition_id -> int`   | Partition ID   |
+| `.partition_name -> str` | Partition name |
+
+## `DatabaseDescriptor`
+
+| Method / Property                                          | Description       |
+|------------------------------------------------------------|-------------------|
+| `DatabaseDescriptor(comment=None, custom_properties=None)` | Create descriptor |
+| `.comment -> str \| None`                                  | Database comment  |
+| `.get_custom_properties() -> dict`                         | Custom properties |
+
+## `DatabaseInfo`
+
+| Property / Method                                  | Description                 |
+|----------------------------------------------------|-----------------------------|
+| `.database_name -> str`                            | Database name               |
+| `.created_time -> int`                             | Creation timestamp          |
+| `.modified_time -> int`                            | Last modification timestamp |
+| `.get_database_descriptor() -> DatabaseDescriptor` | Get descriptor              |
+
+## `LakeSnapshot`
+
+| Property / Method                                 | Description             |
+|---------------------------------------------------|-------------------------|
+| `.snapshot_id -> int`                             | Snapshot ID             |
+| `.table_buckets_offset -> dict[TableBucket, int]` | All bucket offsets      |
+| `.get_bucket_offset(bucket) -> int \| None`       | Get offset for a bucket |
+| `.get_table_buckets() -> list[TableBucket]`       | Get all buckets         |
+
+## `TableBucket`
+
+| Method / Property                                            | Description                            |
+|--------------------------------------------------------------|----------------------------------------|
+| `TableBucket(table_id, bucket)`                              | Create non-partitioned bucket          |
+| `TableBucket.with_partition(table_id, partition_id, bucket)` | Create partitioned bucket              |
+| `.table_id -> int`                                           | Table ID                               |
+| `.bucket_id -> int`                                          | Bucket ID                              |
+| `.partition_id -> int \| None`                               | Partition ID (None if non-partitioned) |
+
+## `FlussError`
+
+| Property             | Description                                                                         |
+|----------------------|-------------------------------------------------------------------------------------|
+| `.message -> str`    | Error message                                                                       |
+| `.error_code -> int` | Error code (`ErrorCode.CLIENT_ERROR` for client-side errors, server code otherwise) |
+
+Raised for all Fluss-specific errors (connection failures, table not found, schema mismatches, etc.). Inherits from `Exception`. See [Error Handling](./error-handling.md) for details on matching specific error codes.
+
+## Constants
+
+| Constant                     | Value         | Description                                         |
+|------------------------------|---------------|-----------------------------------------------------|
+| `fluss.EARLIEST_OFFSET`      | `-2`          | Start reading from earliest available offset        |
+| `fluss.OffsetType.EARLIEST`  | `"earliest"`  | For `list_offsets()`                                |
+| `fluss.OffsetType.LATEST`    | `"latest"`    | For `list_offsets()`                                |
+| `fluss.OffsetType.TIMESTAMP` | `"timestamp"` | For `list_offsets()` with timestamp                 |
+
+To start reading from the latest offset (only new records), resolve the current offset via `list_offsets` before subscribing:
+
+```python
+offsets = await admin.list_offsets(table_path, [0], fluss.OffsetType.LATEST)
+scanner.subscribe(bucket_id=0, start_offset=offsets[0])
+```
+
+## `ChangeType`
+
+| Value                         | Short String | Description                   |
+|-------------------------------|--------------|-------------------------------|
+| `ChangeType.AppendOnly` (0)   | `+A`         | Append-only                   |
+| `ChangeType.Insert` (1)       | `+I`         | Insert                        |
+| `ChangeType.UpdateBefore` (2) | `-U`         | Previous value of updated row |
+| `ChangeType.UpdateAfter` (3)  | `+U`         | New value of updated row      |
+| `ChangeType.Delete` (4)       | `-D`         | Delete                        |
diff --git a/fluss-rust/website/docs/user-guide/python/data-types.md b/fluss-rust/website/docs/user-guide/python/data-types.md
new file mode 100644
index 0000000000..6d7e78d16f
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/data-types.md
@@ -0,0 +1,66 @@
+---
+sidebar_position: 3
+---
+# Data Types
+
+The Python client uses PyArrow types for schema definitions:
+
+| PyArrow Type                                    | Fluss Type                        | Python Type         |
+|-------------------------------------------------|-----------------------------------|---------------------|
+| `pa.bool_()`                                    | Boolean                           | `bool`              |
+| `pa.int8()` / `int16()` / `int32()` / `int64()` | TinyInt / SmallInt / Int / BigInt | `int`               |
+| `pa.float32()` / `float64()`                    | Float / Double                    | `float`             |
+| `pa.string()`                                   | String                            | `str`               |
+| `pa.binary()`                                   | Bytes                             | `bytes`             |
+| `pa.date32()`                                   | Date                              | `datetime.date`     |
+| `pa.time32("ms")`                               | Time                              | `datetime.time`     |
+| `pa.timestamp("us")`                            | Timestamp (NTZ)                   | `datetime.datetime` |
+| `pa.timestamp("us", tz="UTC")`                  | TimestampLTZ                      | `datetime.datetime` |
+| `pa.decimal128(precision, scale)`               | Decimal                           | `decimal.Decimal`   |
+
+Python native types (`date`, `time`, `datetime`, `Decimal`) are accepted when appending rows, whether the row is a dict, list, or tuple.
+
+## Writing Data
+
+Rows can be dicts, lists, or tuples:
+
+```python
+from datetime import date, time, datetime
+from decimal import Decimal
+
+row = {
+    "user_id": 1,
+    "name": "Alice",
+    "active": True,
+    "score": 95.5,
+    "balance": Decimal("1234.56"),
+    "birth_date": date(1990, 3, 15),
+    "login_time": time(9, 30, 0),
+    "created_at": datetime(2024, 1, 1, 0, 0, 0),
+    "nickname": None,  # null value
+}
+handle = writer.append(row)
+```
+
+Lists and tuples must have values in column order:
+
+```python
+row = [1, "Alice", True, 95.5, Decimal("1234.56"), date(1990, 3, 15), time(9, 30, 0), datetime(2024, 1, 1), None]
+handle = writer.append(row)
+```
+
+## Reading Data
+
+```python
+records = scanner.poll(timeout_ms=1000)
+for record in records:
+    row = record.row  # dict[str, Any]
+    print(row["user_id"])     # int
+    print(row["name"])        # str
+    print(row["balance"])     # decimal.Decimal
+    print(row["birth_date"])  # datetime.date
+    print(row["created_at"])  # datetime.datetime
+
+    if row["nickname"] is None:
+        print("nickname is null")
+```
diff --git a/fluss-rust/website/docs/user-guide/python/error-handling.md b/fluss-rust/website/docs/user-guide/python/error-handling.md
new file mode 100644
index 0000000000..9fa482190a
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/error-handling.md
@@ -0,0 +1,109 @@
+---
+sidebar_position: 4
+---
+# Error Handling
+
+The client raises `fluss.FlussError` for all Fluss-specific errors. Each error carries a `message` and an `error_code`.
+
+## Basic Usage
+
+```python
+import fluss
+
+try:
+    await admin.create_table(table_path, table_descriptor)
+except fluss.FlussError as e:
+    print(f"Error (code {e.error_code}): {e.message}")
+```
+
+## Error Codes
+
+Server-side errors carry a specific error code (a positive value, or -1 for an unexpected server error). Client-side errors (connection failures, type mismatches, etc.) use `ErrorCode.CLIENT_ERROR` (-2). Use `fluss.ErrorCode` to match on specific codes:
+
+```python
+import fluss
+
+try:
+    await admin.drop_table(table_path)
+except fluss.FlussError as e:
+    if e.error_code == fluss.ErrorCode.TABLE_NOT_EXIST:
+        print("Table does not exist")
+    elif e.error_code == fluss.ErrorCode.PARTITION_NOT_EXISTS:
+        print("Partition does not exist")
+    elif e.error_code == fluss.ErrorCode.CLIENT_ERROR:
+        print(f"Client-side error: {e.message}")
+    else:
+        print(f"Server error (code {e.error_code}): {e.message}")
+```
+
+### Common Error Codes
+
+| Constant                                     | Code | Description                         |
+|----------------------------------------------|------|-------------------------------------|
+| `ErrorCode.CLIENT_ERROR`                     | -2   | Client-side error (not from server) |
+| `ErrorCode.UNKNOWN_SERVER_ERROR`             | -1   | Unexpected server error             |
+| `ErrorCode.NETWORK_EXCEPTION`                | 1    | Server disconnected before response |
+| `ErrorCode.DATABASE_NOT_EXIST`               | 4    | Database does not exist             |
+| `ErrorCode.DATABASE_ALREADY_EXIST`           | 6    | Database already exists             |
+| `ErrorCode.TABLE_NOT_EXIST`                  | 7    | Table does not exist                |
+| `ErrorCode.TABLE_ALREADY_EXIST`              | 8    | Table already exists                |
+| `ErrorCode.INVALID_TABLE_EXCEPTION`          | 15   | Invalid table operation             |
+| `ErrorCode.REQUEST_TIME_OUT`                 | 25   | Request timed out                   |
+| `ErrorCode.PARTITION_NOT_EXISTS`             | 36   | Partition does not exist            |
+| `ErrorCode.PARTITION_ALREADY_EXISTS`         | 42   | Partition already exists            |
+| `ErrorCode.PARTITION_SPEC_INVALID_EXCEPTION` | 43   | Invalid partition spec              |
+| `ErrorCode.LEADER_NOT_AVAILABLE_EXCEPTION`   | 44   | No leader available for partition   |
+
+See `fluss.ErrorCode` for the full list of named constants.
+
+## Common Error Scenarios
+
+### Connection Refused
+
+The Fluss cluster is not running or the address is incorrect.
+
+```python
+try:
+    config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
+    conn = await fluss.FlussConnection.create(config)
+except fluss.FlussError as e:
+    # error_code == ErrorCode.CLIENT_ERROR for connection failures
+    print(f"Cannot connect to cluster: {e.message}")
+```
+
+### Table Not Found
+
+The table does not exist or has been dropped.
+
+```python
+try:
+    await admin.drop_table(table_path)
+except fluss.FlussError as e:
+    if e.error_code == fluss.ErrorCode.TABLE_NOT_EXIST:
+        print("Table not found")
+```
+
+### Partition Not Found
+
+An operation references a partition that does not exist, for example dropping a partition that was never created.
+
+```python
+try:
+    await admin.drop_partition(table_path, {"region": "US"})
+except fluss.FlussError as e:
+    if e.error_code == fluss.ErrorCode.PARTITION_NOT_EXISTS:
+        print("Partition does not exist, create it first")
+```
+
+### Schema Mismatch
+
+Row data doesn't match the table schema.
+
+```python
+try:
+    writer.append({"wrong_column": "value"})
+    await writer.flush()
+except fluss.FlussError as e:
+    # error_code == ErrorCode.CLIENT_ERROR for type/schema mismatches
+    print(f"Schema mismatch: {e.message}")
+```
diff --git a/fluss-rust/website/docs/user-guide/python/example/_category_.json b/fluss-rust/website/docs/user-guide/python/example/_category_.json
new file mode 100644
index 0000000000..dd2229499b
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/example/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Example",
+  "position": 5
+}
diff --git a/fluss-rust/website/docs/user-guide/python/example/admin-operations.md b/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
new file mode 100644
index 0000000000..8c62ee78c9
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
@@ -0,0 +1,77 @@
+---
+sidebar_position: 3
+---
+# Admin Operations
+
+```python
+admin = await conn.get_admin()
+```
+
+## Databases
+
+```python
+await admin.create_database("my_database", ignore_if_exists=True)
+databases = await admin.list_databases()
+exists = await admin.database_exists("my_database")
+await admin.drop_database("my_database", ignore_if_not_exists=True, cascade=True)
+```
+
+## Tables
+
+Schemas are defined using PyArrow and wrapped in `fluss.Schema`:
+
+```python
+import pyarrow as pa
+
+schema = fluss.Schema(pa.schema([
+    pa.field("id", pa.int32()),
+    pa.field("name", pa.string()),
+    pa.field("amount", pa.int64()),
+]))
+
+table_path = fluss.TablePath("my_database", "my_table")
+await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
+
+table_info = await admin.get_table_info(table_path)
+tables = await admin.list_tables("my_database")
+await admin.drop_table(table_path, ignore_if_not_exists=True)
+```
+
+### TableDescriptor Options
+
+`TableDescriptor` accepts these optional parameters:
+
+| Parameter           | Description                                                                         |
+|---------------------|-------------------------------------------------------------------------------------|
+| `partition_keys`    | Column names to partition by (e.g. `["region"]`)                                    |
+| `bucket_count`      | Number of buckets (parallelism units) for the table                                 |
+| `bucket_keys`       | Columns used to determine bucket assignment                                         |
+| `comment`           | Table comment / description                                                         |
+| `log_format`        | Log storage format: `"ARROW"` or `"INDEXED"`                                        |
+| `kv_format`         | KV storage format for primary key tables: `"INDEXED"` or `"COMPACTED"`              |
+| `properties`        | Table configuration properties as a dict (e.g. `{"table.replication.factor": "1"}`) |
+| `custom_properties` | User-defined properties as a dict                                                   |
+
+## Offsets
+
+```python
+# Latest offsets for buckets
+offsets = await admin.list_offsets(table_path, bucket_ids=[0, 1], offset_type="latest")
+
+# By timestamp
+offsets = await admin.list_offsets(table_path, bucket_ids=[0], offset_type="timestamp", timestamp=1704067200000)
+
+# Per-partition offsets
+offsets = await admin.list_partition_offsets(table_path, partition_name="US", bucket_ids=[0], offset_type="latest")
+```
+
+## Lake Snapshot
+
+```python
+snapshot = await admin.get_latest_lake_snapshot(table_path)
+print(f"Snapshot ID: {snapshot.snapshot_id}")
+print(f"Table buckets: {snapshot.get_table_buckets()}")
+
+bucket = fluss.TableBucket(table_id=1, bucket=0)
+offset = snapshot.get_bucket_offset(bucket)
+```
diff --git a/fluss-rust/website/docs/user-guide/python/example/configuration.md b/fluss-rust/website/docs/user-guide/python/example/configuration.md
new file mode 100644
index 0000000000..c4ef4f3c69
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/example/configuration.md
@@ -0,0 +1,36 @@
+---
+sidebar_position: 2
+---
+# Configuration
+
+## Connection Setup
+
+```python
+import fluss
+
+config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
+conn = await fluss.FlussConnection.create(config)
+```
+
+The connection also supports context managers:
+
+```python
+with await fluss.FlussConnection.create(config) as conn:
+    ...
+```
+
+## Connection Configurations
+
+| Key                 | Description                                           | Default            |
+|---------------------|-------------------------------------------------------|--------------------|
+| `bootstrap.servers` | Coordinator server address                            | `127.0.0.1:9123`   |
+| `request.max.size`  | Maximum request size in bytes                         | `10485760` (10 MB) |
+| `writer.acks`       | Acknowledgment setting (`all` waits for all replicas) | `all`              |
+| `writer.retries`    | Number of retries on failure                          | `2147483647`       |
+| `writer.batch.size` | Batch size for writes in bytes                        | `2097152` (2 MB)   |
+
+Remember to close the connection when done:
+
+```python
+conn.close()
+```
diff --git a/fluss-rust/website/docs/user-guide/python/example/index.md b/fluss-rust/website/docs/user-guide/python/example/index.md
new file mode 100644
index 0000000000..389b648698
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/example/index.md
@@ -0,0 +1,46 @@
+---
+sidebar_position: 1
+---
+# Example
+
+Minimal working example: connect to Fluss, create a table, write data, and read it back.
+
+```python
+import asyncio
+import pyarrow as pa
+import fluss
+
+async def main():
+    # Connect
+    config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
+    conn = await fluss.FlussConnection.create(config)
+    admin = await conn.get_admin()
+
+    # Create a log table
+    schema = fluss.Schema(pa.schema([
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("score", pa.float32()),
+    ]))
+    table_path = fluss.TablePath("fluss", "quick_start")
+    await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
+
+    # Write
+    table = await conn.get_table(table_path)
+    writer = table.new_append().create_writer()
+    writer.append({"id": 1, "name": "Alice", "score": 95.5})
+    writer.append({"id": 2, "name": "Bob", "score": 87.0})
+    await writer.flush()
+
+    # Read
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner = await table.new_scan().create_record_batch_log_scanner()
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+    print(scanner.to_pandas())
+
+    # Cleanup
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+    conn.close()
+
+asyncio.run(main())
+```
diff --git a/fluss-rust/website/docs/user-guide/python/example/log-tables.md b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
new file mode 100644
index 0000000000..63903a4e46
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
@@ -0,0 +1,122 @@
+---
+sidebar_position: 4
+---
+# Log Tables
+
+Log tables are append-only tables without primary keys, suitable for event streaming.
+
+## Creating a Log Table
+
+```python
+import pyarrow as pa
+
+schema = fluss.Schema(pa.schema([
+    pa.field("id", pa.int32()),
+    pa.field("name", pa.string()),
+    pa.field("score", pa.float32()),
+]))
+
+table_path = fluss.TablePath("fluss", "events")
+await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
+```
+
+## Writing
+
+Rows can be appended as dicts, lists, or tuples. For bulk writes, use `write_arrow()`, `write_arrow_batch()`, or `write_pandas()`.
+
+Write methods like `append()` and `write_arrow_batch()` return a `WriteResultHandle`. You can ignore it for fire-and-forget semantics (flush at the end), or `await handle.wait()` to block until the server acknowledges that specific write.
+
+```python
+table = await conn.get_table(table_path)
+writer = table.new_append().create_writer()
+
+# Fire-and-forget: queue writes, flush at the end
+writer.append({"id": 1, "name": "Alice", "score": 95.5})
+writer.append([2, "Bob", 87.0])
+await writer.flush()
+
+# Per-record acknowledgment
+handle = writer.append({"id": 3, "name": "Charlie", "score": 91.0})
+await handle.wait()
+
+# Bulk writes
+writer.write_arrow(pa_table)          # PyArrow Table
+writer.write_arrow_batch(record_batch) # PyArrow RecordBatch
+writer.write_pandas(df)                # Pandas DataFrame
+await writer.flush()
+```
+
+## Reading
+
+There are two scanner types:
+- **Batch scanner** (`create_record_batch_log_scanner()`): returns Arrow Tables or DataFrames, best for analytics
+- **Record scanner** (`create_log_scanner()`): returns individual records with metadata (offset, timestamp, change type), best for streaming
+
+And two reading modes:
+- **`to_arrow()` / `to_pandas()`**: reads all data from subscribed buckets up to the current latest offset, then returns. Best for one-shot batch reads.
+- **`poll_arrow()` / `poll()` / `poll_record_batch()`**: return whatever data becomes available within the timeout. Call in a loop for continuous streaming.
+
+### Batch Read (One-Shot)
+
+```python
+num_buckets = (await admin.get_table_info(table_path)).num_buckets
+
+scanner = await table.new_scan().create_record_batch_log_scanner()
+scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+# Reads everything up to current latest offset, then returns
+arrow_table = scanner.to_arrow()
+df = scanner.to_pandas()
+```
+
+### Continuous Polling
+
+Use `poll_arrow()` or `poll()` in a loop for streaming consumption. The two loops below are alternatives; each runs until interrupted, so use one or the other:
+
+```python
+# Batch scanner: poll as Arrow Tables
+scanner = await table.new_scan().create_record_batch_log_scanner()
+scanner.subscribe(bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
+
+while True:
+    result = scanner.poll_arrow(timeout_ms=5000)
+    if result.num_rows > 0:
+        print(result.to_pandas())
+
+# Record scanner: poll individual records with metadata
+scanner = await table.new_scan().create_log_scanner()
+scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+while True:
+    for record in scanner.poll(timeout_ms=5000):
+        print(f"offset={record.offset}, change={record.change_type.short_string()}, row={record.row}")
+```
+
+### Unsubscribing
+
+To stop consuming from a bucket, use `unsubscribe()`:
+
+```python
+scanner.unsubscribe(bucket_id=0)
+```
+
+### Subscribe from Latest Offset
+
+To only consume new records (skip existing data), first resolve the current latest offset via `list_offsets`, then subscribe at that offset:
+
+```python
+admin = await conn.get_admin()
+offsets = await admin.list_offsets(table_path, [0], fluss.OffsetType.LATEST)
+latest = offsets[0]
+
+scanner = await table.new_scan().create_record_batch_log_scanner()
+scanner.subscribe(bucket_id=0, start_offset=latest)
+```
+
+## Column Projection
+
+```python
+scanner = await table.new_scan().project([0, 2]).create_record_batch_log_scanner()
+# or by name
+scanner = await table.new_scan().project_by_name(["id", "score"]).create_record_batch_log_scanner()
+```
diff --git a/fluss-rust/website/docs/user-guide/python/example/partitioned-tables.md b/fluss-rust/website/docs/user-guide/python/example/partitioned-tables.md
new file mode 100644
index 0000000000..f82809201b
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/example/partitioned-tables.md
@@ -0,0 +1,104 @@
+---
+sidebar_position: 6
+---
+# Partitioned Tables
+
+Partitioned tables distribute data across partitions based on column values. Partitions must exist before writing data; otherwise, by default, the client retries indefinitely.
+
+## Creating and Managing Partitions
+
+```python
+import pyarrow as pa
+
+schema = fluss.Schema(pa.schema([
+    pa.field("id", pa.int32()),
+    pa.field("region", pa.string()),
+    pa.field("value", pa.int64()),
+]))
+
+table_path = fluss.TablePath("fluss", "partitioned_events")
+await admin.create_table(
+    table_path,
+    fluss.TableDescriptor(schema, partition_keys=["region"], bucket_count=1),
+    ignore_if_exists=True,
+)
+
+# Create partitions
+await admin.create_partition(table_path, {"region": "US"}, ignore_if_exists=True)
+await admin.create_partition(table_path, {"region": "EU"}, ignore_if_exists=True)
+
+# List partitions
+partition_infos = await admin.list_partition_infos(table_path)
+```
+
+## Writing
+
+Same as non-partitioned tables: include partition column values in each row. **Partitions must exist before writing data; otherwise, by default, the client retries indefinitely.**
+
+```python
+table = await conn.get_table(table_path)
+writer = table.new_append().create_writer()
+writer.append({"id": 1, "region": "US", "value": 100})
+writer.append({"id": 2, "region": "EU", "value": 200})
+await writer.flush()
+```
+
+## Reading
+
+Use `subscribe_partition()` or `subscribe_partition_buckets()` instead of `subscribe()`:
+
+```python
+scanner = await table.new_scan().create_record_batch_log_scanner()
+
+# Subscribe to individual partitions
+for p in partition_infos:
+    scanner.subscribe_partition(partition_id=p.partition_id, bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
+
+# Or batch-subscribe
+scanner.subscribe_partition_buckets({
+    (p.partition_id, 0): fluss.EARLIEST_OFFSET for p in partition_infos
+})
+
+print(scanner.to_pandas())
+```
+
+### Unsubscribing
+
+To stop consuming from a specific partition bucket, use `unsubscribe_partition()`:
+
+```python
+scanner.unsubscribe_partition(partition_id=partition_infos[0].partition_id, bucket_id=0)
+```
+
+## Partitioned Primary Key Tables
+
+Partition columns must be part of the primary key. Partitions must exist before upserting data; otherwise, by default, the client retries indefinitely.
+
+```python
+schema = fluss.Schema(
+    pa.schema([
+        pa.field("user_id", pa.int32()),
+        pa.field("region", pa.string()),
+        pa.field("score", pa.int64()),
+    ]),
+    primary_keys=["user_id", "region"],
+)
+
+table_path = fluss.TablePath("fluss", "partitioned_users")
+await admin.create_table(
+    table_path,
+    fluss.TableDescriptor(schema, partition_keys=["region"]),
+    ignore_if_exists=True,
+)
+
+await admin.create_partition(table_path, {"region": "US"}, ignore_if_exists=True)
+
+table = await conn.get_table(table_path)
+writer = table.new_upsert().create_writer()
+writer.upsert({"user_id": 1, "region": "US", "score": 1234})
+await writer.flush()
+
+# Lookup includes partition columns
+lookuper = table.new_lookup().create_lookuper()
+result = await lookuper.lookup({"user_id": 1, "region": "US"})
+```
diff --git a/fluss-rust/website/docs/user-guide/python/example/primary-key-tables.md b/fluss-rust/website/docs/user-guide/python/example/primary-key-tables.md
new file mode 100644
index 0000000000..cd61e5084c
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/example/primary-key-tables.md
@@ -0,0 +1,61 @@
+---
+sidebar_position: 5
+---
+# Primary Key Tables
+
+Primary key tables support upsert, delete, and point lookup operations.
+
+## Creating a Primary Key Table
+
+Pass `primary_keys` to `fluss.Schema`:
+
+```python
+import pyarrow as pa
+
+schema = fluss.Schema(
+    pa.schema([
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("age", pa.int64()),
+    ]),
+    primary_keys=["id"],
+)
+table_path = fluss.TablePath("fluss", "users")
+await admin.create_table(table_path, fluss.TableDescriptor(schema, bucket_count=3), ignore_if_exists=True)
+```
+
+## Upsert, Delete, Lookup
+
+```python
+table = await conn.get_table(table_path)
+
+# Upsert (fire-and-forget, flush at the end)
+writer = table.new_upsert().create_writer()
+writer.upsert({"id": 1, "name": "Alice", "age": 25})
+writer.upsert({"id": 2, "name": "Bob", "age": 30})
+await writer.flush()
+
+# Per-record acknowledgment (for read-after-write)
+handle = writer.upsert({"id": 3, "name": "Charlie", "age": 35})
+await handle.wait()
+
+# Delete by primary key
+handle = writer.delete({"id": 2})
+await handle.wait()
+
+# Lookup
+lookuper = table.new_lookup().create_lookuper()
+result = await lookuper.lookup({"id": 1})
+if result:
+    print(f"Found: name={result['name']}, age={result['age']}")
+```
+
+## Partial Updates
+
+Update specific columns while preserving others:
+
+```python
+partial_writer = table.new_upsert().partial_update_by_name(["id", "age"]).create_writer()
+partial_writer.upsert({"id": 1, "age": 27})  # only updates age
+await partial_writer.flush()
+```
diff --git a/fluss-rust/website/docs/user-guide/python/installation.md b/fluss-rust/website/docs/user-guide/python/installation.md
new file mode 100644
index 0000000000..4182dbb431
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/python/installation.md
@@ -0,0 +1,41 @@
+---
+sidebar_position: 1
+---
+# Installation
+
+```bash
+pip install pyfluss
+```
+
+## Building From Source (Optional)
+
+**Prerequisites:** Python 3.9+, Rust 1.85+
+
+```bash
+git clone https://github.com/apache/fluss-rust.git
+cd fluss-rust/bindings/python
+```
+
+Install [maturin](https://github.com/PyO3/maturin):
+
+```bash
+pip install maturin
+```
+
+Build and install:
+
+```bash
+# Development mode (editable)
+maturin develop
+
+# Or build a wheel
+maturin build --release
+pip install target/wheels/fluss-*.whl
+```
+
+Verify:
+
+```python
+import fluss
+print("Fluss Python bindings installed successfully!")
+```
diff --git a/fluss-rust/website/docs/user-guide/rust/_category_.json b/fluss-rust/website/docs/user-guide/rust/_category_.json
new file mode 100644
index 0000000000..cdec432dad
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Rust",
+  "position": 1
+}
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
new file mode 100644
index 0000000000..d5d0671542
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -0,0 +1,443 @@
+---
+sidebar_position: 2
+---
+# API Reference
+
+Complete API reference for the Fluss Rust client.
+
+## `Config`
+
+| Field                             | Type     | Default            | Description                                             |
+|-----------------------------------|----------|--------------------|---------------------------------------------------------|
+| `bootstrap_servers`               | `String` | `"127.0.0.1:9123"` | Coordinator server address                              |
+| `writer_request_max_size`         | `i32`    | `10485760` (10 MB) | Maximum request size in bytes                           |
+| `writer_acks`                     | `String` | `"all"`            | Acknowledgment setting (`"all"` waits for all replicas) |
+| `writer_retries`                  | `i32`    | `i32::MAX`         | Number of retries on failure                            |
+| `writer_batch_size`               | `i32`    | `2097152` (2 MB)   | Batch size for writes in bytes                          |
+| `scanner_remote_log_prefetch_num` | `usize`  | `4`                | Number of remote log segments to prefetch               |
+| `remote_file_download_thread_num` | `usize`  | `3`                | Number of threads for remote log downloads              |
+
+## `FlussConnection`
+
+| Method                                                                        | Description                                    |
+|-------------------------------------------------------------------------------|------------------------------------------------|
+| `async fn new(config: Config) -> Result<Self>`                                | Create a new connection to a Fluss cluster     |
+| `async fn get_admin(&self) -> Result<FlussAdmin>`                             | Get the admin interface for cluster management |
+| `async fn get_table(&self, table_path: &TablePath) -> Result<FlussTable<'_>>` | Get a table for read/write operations          |
+| `fn config(&self) -> &Config`                                                 | Get a reference to the connection config       |
+
+## `FlussAdmin`
+
+### Database Operations
+
+| Method                                                                                                                       | Description                |
+|------------------------------------------------------------------------------------------------------------------------------|----------------------------|
+| `async fn create_database(&self, name: &str, descriptor: Option<&DatabaseDescriptor>, ignore_if_exists: bool) -> Result<()>` | Create a database          |
+| `async fn drop_database(&self, name: &str, ignore_if_not_exists: bool, cascade: bool) -> Result<()>`                         | Drop a database            |
+| `async fn list_databases(&self) -> Result<Vec<String>>`                                                                      | List all databases         |
+| `async fn database_exists(&self, name: &str) -> Result<bool>`                                                                | Check if a database exists |
+| `async fn get_database_info(&self, name: &str) -> Result<DatabaseInfo>`                                                      | Get database metadata      |
+
+### Table Operations
+
+| Method                                                                                                                     | Description               |
+|----------------------------------------------------------------------------------------------------------------------------|---------------------------|
+| `async fn create_table(&self, table_path: &TablePath, descriptor: &TableDescriptor, ignore_if_exists: bool) -> Result<()>` | Create a table            |
+| `async fn drop_table(&self, table_path: &TablePath, ignore_if_not_exists: bool) -> Result<()>`                             | Drop a table              |
+| `async fn get_table_info(&self, table_path: &TablePath) -> Result<TableInfo>`                                              | Get table metadata        |
+| `async fn list_tables(&self, database_name: &str) -> Result<Vec<String>>`                                                  | List tables in a database |
+| `async fn table_exists(&self, table_path: &TablePath) -> Result<bool>`                                                     | Check if a table exists   |
+
+### Partition Operations
+
+| Method                                                                                                                   | Description         |
+|--------------------------------------------------------------------------------------------------------------------------|---------------------|
+| `async fn list_partition_infos(&self, table_path: &TablePath) -> Result<Vec<PartitionInfo>>`                             | List all partitions |
+| `async fn create_partition(&self, table_path: &TablePath, spec: &PartitionSpec, ignore_if_exists: bool) -> Result<()>`   | Create a partition  |
+| `async fn drop_partition(&self, table_path: &TablePath, spec: &PartitionSpec, ignore_if_not_exists: bool) -> Result<()>` | Drop a partition    |
+
+### Offset Operations
+
+| Method                                                                                                                                                           |  Description                          |
+|------------------------------------------------------------------------------------------------------------------------------------------------------------------|---------------------------------------|
+| `async fn list_offsets(&self, table_path: &TablePath, bucket_ids: &[i32], offset_spec: OffsetSpec) -> Result<HashMap<i32, i64>>`                                 | Get offsets for buckets               |
+| `async fn list_partition_offsets(&self, table_path: &TablePath, partition_name: &str, bucket_ids: &[i32], offset_spec: OffsetSpec) -> Result<HashMap<i32, i64>>` | Get offsets for a partition's buckets |
+
+### Lake Operations
+
+| Method                                                                                     |  Description                 |
+|--------------------------------------------------------------------------------------------|------------------------------|
+| `async fn get_latest_lake_snapshot(&self, table_path: &TablePath) -> Result<LakeSnapshot>` | Get the latest lake snapshot |
+
+## `FlussTable<'a>`
+
+| Method                                        | Description                             |
+|-----------------------------------------------|-----------------------------------------|
+| `fn get_table_info(&self) -> &TableInfo`      | Get table metadata                      |
+| `fn new_append(&self) -> Result<TableAppend>` | Create an append builder for log tables |
+| `fn new_scan(&self) -> TableScan<'_>`         | Create a scan builder                   |
+| `fn new_lookup(&self) -> Result<TableLookup>` | Create a lookup builder for PK tables   |
+| `fn new_upsert(&self) -> Result<TableUpsert>` | Create an upsert builder for PK tables  |
+| `fn has_primary_key(&self) -> bool`           | Check if the table has a primary key    |
+| `fn table_path(&self) -> &TablePath`          | Get the table path                      |
+
+## `TableAppend`
+
+| Method                                            | Description             |
+|---------------------------------------------------|-------------------------|
+| `fn create_writer(&self) -> Result<AppendWriter>` | Create an append writer |
+
+## `AppendWriter`
+
+| Method                                                                          | Description                                       |
+|---------------------------------------------------------------------------------|---------------------------------------------------|
+| `fn append(&self, row: &impl InternalRow) -> Result<WriteResultFuture>`         | Append a row; returns a future for acknowledgment |
+| `fn append_arrow_batch(&self, batch: RecordBatch) -> Result<WriteResultFuture>` | Append an Arrow RecordBatch                       |
+| `async fn flush(&self) -> Result<()>`                                           | Flush all pending writes to the server            |
+
+## `TableScan<'a>`
+
+| Method                                                                      | Description                             |
+|-----------------------------------------------------------------------------|-----------------------------------------|
+| `fn project(self, indices: &[usize]) -> Result<Self>`                       | Project columns by index                |
+| `fn project_by_name(self, names: &[&str]) -> Result<Self>`                  | Project columns by name                 |
+| `fn create_log_scanner(self) -> Result<LogScanner>`                         | Create a record-based log scanner       |
+| `fn create_record_batch_log_scanner(self) -> Result<RecordBatchLogScanner>` | Create an Arrow batch-based log scanner |
+
+## `LogScanner`
+
+| Method                                                                                                    | Description                                              |
+|-----------------------------------------------------------------------------------------------------------|----------------------------------------------------------|
+| `async fn subscribe(&self, bucket_id: i32, start_offset: i64) -> Result<()>`                              | Subscribe to a bucket                                    |
+| `async fn subscribe_buckets(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()>`                     | Subscribe to multiple buckets                            |
+| `async fn subscribe_partition(&self, partition_id: i64, bucket_id: i32, start_offset: i64) -> Result<()>` | Subscribe to a partition bucket                          |
+| `async fn subscribe_partition_buckets(&self, offsets: &HashMap<(i64, i32), i64>) -> Result<()>`           | Subscribe to multiple partition-bucket pairs             |
+| `async fn unsubscribe(&self, bucket_id: i32) -> Result<()>`                                               | Unsubscribe from a bucket (non-partitioned tables)       |
+| `async fn unsubscribe_partition(&self, partition_id: i64, bucket_id: i32) -> Result<()>`                  | Unsubscribe from a partition bucket (partitioned tables) |
+| `async fn poll(&self, timeout: Duration) -> Result<ScanRecords>`                                          | Poll for records                                         |
+
+## `RecordBatchLogScanner`
+
+| Method                                                                                                    | Description                                              |
+|-----------------------------------------------------------------------------------------------------------|----------------------------------------------------------|
+| `async fn subscribe(&self, bucket_id: i32, start_offset: i64) -> Result<()>`                              | Subscribe to a bucket                                    |
+| `async fn subscribe_buckets(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()>`                     | Subscribe to multiple buckets                            |
+| `async fn subscribe_partition(&self, partition_id: i64, bucket_id: i32, start_offset: i64) -> Result<()>` | Subscribe to a partition bucket                          |
+| `async fn subscribe_partition_buckets(&self, offsets: &HashMap<(i64, i32), i64>) -> Result<()>`           | Subscribe to multiple partition-bucket pairs             |
+| `async fn unsubscribe(&self, bucket_id: i32) -> Result<()>`                                               | Unsubscribe from a bucket (non-partitioned tables)       |
+| `async fn unsubscribe_partition(&self, partition_id: i64, bucket_id: i32) -> Result<()>`                  | Unsubscribe from a partition bucket (partitioned tables) |
+| `async fn poll(&self, timeout: Duration) -> Result<Vec<ScanBatch>>`                                       | Poll for Arrow record batches                            |
+| `fn is_partitioned(&self) -> bool`                                                                        | Check if the table is partitioned                        |
+| `fn get_subscribed_buckets(&self) -> Vec<(TableBucket, i64)>`                                             | Get all current subscriptions as (bucket, offset) pairs  |
+
+## `ScanRecord`
+
+| Method                                 | Description                            |
+|----------------------------------------|----------------------------------------|
+| `fn row(&self) -> &dyn InternalRow`    | Get the row data                       |
+| `fn offset(&self) -> i64`              | Record offset in the log               |
+| `fn timestamp(&self) -> i64`           | Record timestamp                       |
+| `fn change_type(&self) -> &ChangeType` | Change type (AppendOnly, Insert, etc.) |
+
+## `ScanRecords`
+
+| Method                                                                   | Description                       |
+|--------------------------------------------------------------------------|-----------------------------------|
+| `fn count(&self) -> usize`                                               | Number of records                 |
+| `fn is_empty(&self) -> bool`                                             | Whether the result set is empty   |
+| `fn records(&self, bucket: &TableBucket) -> &[ScanRecord]`               | Get records for a specific bucket |
+| `fn records_by_buckets(&self) -> &HashMap<TableBucket, Vec<ScanRecord>>` | Get all records grouped by bucket |
+
+`ScanRecords` also implements `IntoIterator`, so you can iterate over all records directly:
+
+```rust
+for record in records {
+    println!("offset={}", record.offset());
+}
+```
+
+## `ScanBatch`
+
+| Method                             | Description                    |
+|------------------------------------|--------------------------------|
+| `fn bucket(&self) -> &TableBucket` | Bucket this batch belongs to   |
+| `fn batch(&self) -> &RecordBatch`  | Arrow RecordBatch data         |
+| `fn base_offset(&self) -> i64`     | First record offset            |
+| `fn last_offset(&self) -> i64`     | Last record offset             |
+| `fn num_records(&self) -> usize`   | Number of records in the batch |
+
+## `TableUpsert`
+
+| Method                                                                                | Description                                       |
+|---------------------------------------------------------------------------------------|---------------------------------------------------|
+| `fn create_writer(&self) -> Result<UpsertWriter>`                                     | Create an upsert writer                           |
+| `fn partial_update(&self, column_indices: Option<Vec<usize>>) -> Result<TableUpsert>` | Create a partial update builder by column indices |
+| `fn partial_update_with_column_names(&self, names: &[&str]) -> Result<TableUpsert>`   | Create a partial update builder by column names   |
+
+## `UpsertWriter`
+
+| Method                                                                  | Description                           |
+|-------------------------------------------------------------------------|---------------------------------------|
+| `fn upsert(&self, row: &impl InternalRow) -> Result<WriteResultFuture>` | Upsert a row (insert or update by PK) |
+| `fn delete(&self, row: &impl InternalRow) -> Result<WriteResultFuture>` | Delete a row by primary key           |
+| `async fn flush(&self) -> Result<()>`                                   | Flush all pending operations          |
+
+## `TableLookup`
+
+| Method                                          |  Description                        |
+|-------------------------------------------------|-------------------------------------|
+| `fn create_lookuper(&self) -> Result<Lookuper>` | Create a lookuper for point lookups |
+
+## `Lookuper`
+
+| Method                                                                       |  Description                |
+|------------------------------------------------------------------------------|-----------------------------|
+| `async fn lookup(&mut self, key: &impl InternalRow) -> Result<LookupResult>` | Lookup a row by primary key |
+
+## `LookupResult`
+
+| Method                                                         |  Description                     |
+|----------------------------------------------------------------|----------------------------------|
+| `fn get_single_row(&self) -> Result<Option<impl InternalRow>>` | Get a single row from the result |
+| `fn get_rows(&self) -> Vec<impl InternalRow>`                  | Get all rows from the result     |
+
+## `WriteResultFuture`
+
+| Description                                                                                                                                   |
+|-----------------------------------------------------------------------------------------------------------------------------------------------|
+| Implements `Future<Output = Result<(), Error>>`. Await to wait for server acknowledgment. Returned by `append()`, `upsert()`, and `delete()`. |
+
+Usage:
+
+```rust
+// Fire-and-forget (batched)
+writer.append(&row)?;
+writer.flush().await?;
+
+// Per-record acknowledgment
+writer.append(&row)?.await?;
+```
+
+## `Schema`
+
+| Method                                         |  Description                             |
+|------------------------------------------------|------------------------------------------|
+| `fn builder() -> SchemaBuilder`                | Create a schema builder                  |
+| `fn columns(&self) -> &[Column]`               | Get all columns                          |
+| `fn primary_key(&self) -> Option<&PrimaryKey>` | Get primary key (None if no primary key) |
+| `fn column_names(&self) -> Vec<&str>`          | Get all column names                     |
+| `fn primary_key_indexes(&self) -> Vec<usize>`  | Get primary key column indices           |
+
+## `SchemaBuilder`
+
+| Method                                               |  Description            |
+|------------------------------------------------------|-------------------------|
+| `fn column(name: &str, data_type: DataType) -> Self` | Add a column            |
+| `fn primary_key(keys: Vec<&str>) -> Self`            | Set primary key columns |
+| `fn build() -> Result<Schema>`                       | Build the schema        |
+
+## `TableDescriptor`
+
+| Method                                             |  Description                         |
+|----------------------------------------------------|--------------------------------------|
+| `fn builder() -> TableDescriptorBuilder`           | Create a table descriptor builder    |
+| `fn schema(&self) -> &Schema`                      | Get the table schema                 |
+| `fn partition_keys(&self) -> &[String]`            | Get partition key column names       |
+| `fn has_primary_key(&self) -> bool`                | Check if the table has a primary key |
+| `fn properties(&self) -> &HashMap<String, String>` | Get all table properties             |
+| `fn comment(&self) -> Option<&str>`                | Get table comment                    |
+
+## `TableDescriptorBuilder`
+
+| Method                                                                           |  Description                                |
+|----------------------------------------------------------------------------------|---------------------------------------------|
+| `fn schema(schema: Schema) -> Self`                                              | Set the schema                              |
+| `fn log_format(format: LogFormat) -> Self`                                       | Set log format (e.g., `LogFormat::ARROW`)   |
+| `fn kv_format(format: KvFormat) -> Self`                                         | Set KV format (e.g., `KvFormat::COMPACTED`) |
+| `fn property(key: &str, value: &str) -> Self`                                    | Set a table property                        |
+| `fn partitioned_by(keys: Vec<&str>) -> Self`                                     | Set partition columns                       |
+| `fn distributed_by(bucket_count: Option<i32>, bucket_keys: Vec<String>) -> Self` | Set bucket distribution                     |
+| `fn comment(comment: &str) -> Self`                                              | Set table comment                           |
+| `fn build() -> Result<TableDescriptor>`                                          | Build the table descriptor                  |
+
+## `TablePath`
+
+| Method                                                |  Description        |
+|-------------------------------------------------------|---------------------|
+| `TablePath::new(database: &str, table: &str) -> Self` | Create a table path |
+| `fn database(&self) -> &str`                          | Get database name   |
+| `fn table(&self) -> &str`                             | Get table name      |
+
+## `TableInfo`
+
+| Field / Method       | Description                                         |
+|----------------------|-----------------------------------------------------|
+| `.table_path`        | `TablePath` -- Table path                           |
+| `.table_id`          | `i64` -- Table ID                                   |
+| `.schema_id`         | `i32` -- Schema ID                                  |
+| `.schema`            | `Schema` -- Table schema                            |
+| `.primary_keys`      | `Vec<String>` -- Primary key column names           |
+| `.partition_keys`    | `Vec<String>` -- Partition key column names         |
+| `.num_buckets`       | `i32` -- Number of buckets                          |
+| `.properties`        | `HashMap<String, String>` -- All table properties   |
+| `.custom_properties` | `HashMap<String, String>` -- Custom properties only |
+| `.comment`           | `Option<String>` -- Table comment                   |
+| `.created_time`      | `i64` -- Creation timestamp                         |
+| `.modified_time`     | `i64` -- Last modification timestamp                |
+
+## `TableBucket`
+
+| Method                                                                                              | Description                                |
+|-----------------------------------------------------------------------------------------------------|--------------------------------------------|
+| `TableBucket::new(table_id: i64, bucket_id: i32) -> Self`                                           | Create a non-partitioned bucket            |
+| `TableBucket::new_with_partition(table_id: i64, partition_id: Option<i64>, bucket_id: i32) -> Self` | Create a partitioned bucket                |
+| `fn table_id(&self) -> i64`                                                                         | Get table ID                               |
+| `fn partition_id(&self) -> Option<i64>`                                                             | Get partition ID (None if non-partitioned) |
+| `fn bucket_id(&self) -> i32`                                                                        | Get bucket ID                              |
+
+## `PartitionSpec`
+
+| Method                                                      | Description                                           |
+|-------------------------------------------------------------|-------------------------------------------------------|
+| `PartitionSpec::new(spec_map: HashMap<&str, &str>) -> Self` | Create from a map of partition column names to values |
+| `fn get_spec_map(&self) -> &HashMap<String, String>`        | Get the partition spec map                            |
+
+## `PartitionInfo`
+
+| Method                                   |  Description       |
+|------------------------------------------|--------------------|
+| `fn get_partition_id(&self) -> i64`      | Get partition ID   |
+| `fn get_partition_name(&self) -> String` | Get partition name |
+
+## `DatabaseDescriptor`
+
+| Method                                                    | Description                          |
+|-----------------------------------------------------------|--------------------------------------|
+| `fn builder() -> DatabaseDescriptorBuilder`               | Create a database descriptor builder |
+| `fn comment(&self) -> Option<&str>`                       | Get database comment                 |
+| `fn custom_properties(&self) -> &HashMap<String, String>` | Get custom properties                |
+
+## `DatabaseDescriptorBuilder`
+
+| Method                                                                                    | Description                   |
+|-------------------------------------------------------------------------------------------|-------------------------------|
+| `fn comment(comment: impl Into<String>) -> Self`                                          | Set database comment          |
+| `fn custom_properties(properties: HashMap<impl Into<String>, impl Into<String>>) -> Self` | Set custom properties         |
+| `fn custom_property(key: impl Into<String>, value: impl Into<String>) -> Self`            | Set a single custom property  |
+| `fn build() -> DatabaseDescriptor`                                                        | Build the database descriptor |
+
+## `DatabaseInfo`
+
+| Method                                                 | Description                     |
+|--------------------------------------------------------|---------------------------------|
+| `fn database_name(&self) -> &str`                      | Get database name               |
+| `fn created_time(&self) -> i64`                        | Get creation timestamp          |
+| `fn modified_time(&self) -> i64`                       | Get last modification timestamp |
+| `fn database_descriptor(&self) -> &DatabaseDescriptor` | Get the database descriptor     |
+
+## `LakeSnapshot`
+
+| Field                   | Description                                       |
+|-------------------------|---------------------------------------------------|
+| `.snapshot_id`          | `i64` -- Snapshot ID                              |
+| `.table_buckets_offset` | `HashMap<TableBucket, i64>` -- All bucket offsets |
+
+## `GenericRow<'a>`
+
+| Method                                                             | Description                                      |
+|--------------------------------------------------------------------|--------------------------------------------------|
+| `GenericRow::new(field_count: usize) -> Self`                      | Create a new row with the given number of fields |
+| `fn set_field(&mut self, pos: usize, value: impl Into<Datum<'a>>)` | Set a field value by position                    |
+| `GenericRow::from_data(data: Vec<impl Into<Datum<'a>>>) -> Self`   | Create a row from existing field data            |
+
+Implements the `InternalRow` trait (see below).
+
+## `InternalRow` trait
+
+| Method                                                                         |  Description                            |
+|--------------------------------------------------------------------------------|-----------------------------------------|
+| `fn get_boolean(&self, idx: usize) -> bool`                                    | Get boolean value                       |
+| `fn get_byte(&self, idx: usize) -> i8`                                         | Get tinyint value                       |
+| `fn get_short(&self, idx: usize) -> i16`                                       | Get smallint value                      |
+| `fn get_int(&self, idx: usize) -> i32`                                         | Get int value                           |
+| `fn get_long(&self, idx: usize) -> i64`                                        | Get bigint value                        |
+| `fn get_float(&self, idx: usize) -> f32`                                       | Get float value                         |
+| `fn get_double(&self, idx: usize) -> f64`                                      | Get double value                        |
+| `fn get_string(&self, idx: usize) -> &str`                                     | Get string value                        |
+| `fn get_decimal(&self, idx: usize, precision: usize, scale: usize) -> Decimal` | Get decimal value                       |
+| `fn get_date(&self, idx: usize) -> Date`                                       | Get date value                          |
+| `fn get_time(&self, idx: usize) -> Time`                                       | Get time value                          |
+| `fn get_timestamp_ntz(&self, idx: usize, precision: u32) -> TimestampNtz`      | Get timestamp without timezone value    |
+| `fn get_timestamp_ltz(&self, idx: usize, precision: u32) -> TimestampLtz`      | Get timestamp with local timezone value |
+| `fn get_bytes(&self, idx: usize) -> &[u8]`                                     | Get bytes value                         |
+| `fn get_binary(&self, idx: usize, length: usize) -> &[u8]`                     | Get fixed-length binary value           |
+| `fn get_char(&self, idx: usize, length: usize) -> &str`                        | Get fixed-length char value             |
+
+## `ChangeType`
+
+| Value                      | Short String  | Description                      |
+|----------------------------|---------------|----------------------------------|
+| `ChangeType::AppendOnly`   | `+A`          | Append-only record               |
+| `ChangeType::Insert`       | `+I`          | Inserted row                     |
+| `ChangeType::UpdateBefore` | `-U`          | Previous value of an updated row |
+| `ChangeType::UpdateAfter`  | `+U`          | New value of an updated row      |
+| `ChangeType::Delete`       | `-D`          | Deleted row                      |
+
+| Method                           | Description                         |
+|----------------------------------|-------------------------------------|
+| `fn short_string(&self) -> &str` | Get the short string representation |
+
+## `OffsetSpec`
+
+| Variant                      | Description                                     |
+|------------------------------|-------------------------------------------------|
+| `OffsetSpec::Earliest`       | Start from the earliest available offset        |
+| `OffsetSpec::Latest`         | Start from the latest offset (only new records) |
+| `OffsetSpec::Timestamp(i64)` | Start from a specific timestamp in milliseconds |
+
+## Constants
+
+| Constant                         | Value  | Description                                             |
+|----------------------------------|--------|---------------------------------------------------------|
+| `fluss::client::EARLIEST_OFFSET` | `-2`   | Start reading from the earliest available offset        |
+
+To start reading from the latest offset (only new records), resolve the current offset via `list_offsets` before subscribing:
+
+```rust
+use fluss::rpc::message::OffsetSpec;
+
+let offsets = admin.list_offsets(&table_path, &[0], OffsetSpec::Latest).await?;
+let latest = offsets[&0];
+log_scanner.subscribe(0, latest).await?;
+```
+
+## `DataTypes` factory
+
+| Method                                           | Returns    | Description                        |
+|--------------------------------------------------|------------|------------------------------------|
+| `DataTypes::boolean()`                           | `DataType` | Boolean type                       |
+| `DataTypes::tinyint()`                           | `DataType` | 8-bit signed integer               |
+| `DataTypes::smallint()`                          | `DataType` | 16-bit signed integer              |
+| `DataTypes::int()`                               | `DataType` | 32-bit signed integer              |
+| `DataTypes::bigint()`                            | `DataType` | 64-bit signed integer              |
+| `DataTypes::float()`                             | `DataType` | 32-bit floating point              |
+| `DataTypes::double()`                            | `DataType` | 64-bit floating point              |
+| `DataTypes::string()`                            | `DataType` | Variable-length string             |
+| `DataTypes::bytes()`                             | `DataType` | Variable-length byte array         |
+| `DataTypes::date()`                              | `DataType` | Date (days since epoch)            |
+| `DataTypes::time()`                              | `DataType` | Time (milliseconds since midnight) |
+| `DataTypes::timestamp()`                         | `DataType` | Timestamp without timezone         |
+| `DataTypes::timestamp_ltz()`                     | `DataType` | Timestamp with local timezone      |
+| `DataTypes::decimal(precision: u32, scale: u32)` | `DataType` | Fixed-point decimal                |
+| `DataTypes::char(length: u32)`                   | `DataType` | Fixed-length string                |
+| `DataTypes::binary(length: usize)`               | `DataType` | Fixed-length byte array            |
+| `DataTypes::array(element: DataType)`            | `DataType` | Array of elements                  |
+| `DataTypes::map(key: DataType, value: DataType)` | `DataType` | Map of key-value pairs             |
+| `DataTypes::row(fields: Vec<DataField>)`         | `DataType` | Nested row type                    |
+
+## `DataField`
+
+| Method                                                                                                   | Description         |
+|----------------------------------------------------------------------------------------------------------|---------------------|
+| `DataField::new(name: impl Into<String>, data_type: DataType, description: Option<String>) -> DataField` | Create a data field |
+| `fn name(&self) -> &str`                                                                                 | Get the field name  |
diff --git a/fluss-rust/website/docs/user-guide/rust/data-types.md b/fluss-rust/website/docs/user-guide/rust/data-types.md
new file mode 100644
index 0000000000..fe050bfc3c
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/data-types.md
@@ -0,0 +1,80 @@
+---
+sidebar_position: 3
+---
+# Data Types
+
+| Fluss Type      | Rust Type      | Getter                               | Setter                         |
+|-----------------|----------------|--------------------------------------|--------------------------------|
+| `BOOLEAN`       | `bool`         | `get_boolean(idx)`                   | `set_field(idx, bool)`         |
+| `TINYINT`       | `i8`           | `get_byte(idx)`                      | `set_field(idx, i8)`           |
+| `SMALLINT`      | `i16`          | `get_short(idx)`                     | `set_field(idx, i16)`          |
+| `INT`           | `i32`          | `get_int(idx)`                       | `set_field(idx, i32)`          |
+| `BIGINT`        | `i64`          | `get_long(idx)`                      | `set_field(idx, i64)`          |
+| `FLOAT`         | `f32`          | `get_float(idx)`                     | `set_field(idx, f32)`          |
+| `DOUBLE`        | `f64`          | `get_double(idx)`                    | `set_field(idx, f64)`          |
+| `CHAR`          | `&str`         | `get_char(idx, length)`              | `set_field(idx, &str)`         |
+| `STRING`        | `&str`         | `get_string(idx)`                    | `set_field(idx, &str)`         |
+| `DECIMAL`       | `Decimal`      | `get_decimal(idx, precision, scale)` | `set_field(idx, Decimal)`      |
+| `DATE`          | `Date`         | `get_date(idx)`                      | `set_field(idx, Date)`         |
+| `TIME`          | `Time`         | `get_time(idx)`                      | `set_field(idx, Time)`         |
+| `TIMESTAMP`     | `TimestampNtz` | `get_timestamp_ntz(idx, precision)`  | `set_field(idx, TimestampNtz)` |
+| `TIMESTAMP_LTZ` | `TimestampLtz` | `get_timestamp_ltz(idx, precision)`  | `set_field(idx, TimestampLtz)` |
+| `BYTES`         | `&[u8]`        | `get_bytes(idx)`                     | `set_field(idx, &[u8])`        |
+| `BINARY(n)`     | `&[u8]`        | `get_binary(idx, length)`            | `set_field(idx, &[u8])`        |
+
+## Constructing Special Types
+
+Primitive types (`bool`, `i8`, `i16`, `i32`, `i64`, `f32`, `f64`, `&str`, `&[u8]`) can be passed directly to `set_field`. The following types require explicit construction:
+
+```rust
+use fluss::row::{Date, Time, TimestampNtz, TimestampLtz, Decimal};
+
+// Date: days since Unix epoch
+let date = Date::new(19738);
+
+// Time: milliseconds since midnight
+let time = Time::new(43200000);
+
+// Timestamp without timezone: milliseconds since epoch
+// DataTypes::timestamp() defaults to precision 6 (microseconds).
+// Use DataTypes::timestamp_with_precision(p) for a different precision (0–9).
+let ts = TimestampNtz::new(1704067200000);
+
+// Timestamp with local timezone: milliseconds since epoch
+// DataTypes::timestamp_ltz() also defaults to precision 6.
+let ts_ltz = TimestampLtz::new(1704067200000);
+
+// Decimal: from an unscaled long value with precision and scale
+let decimal = Decimal::from_unscaled_long(12345, 10, 2)?; // represents 123.45
+```
+
+## Creating Rows from Data
+
+`GenericRow::from_data` accepts a `Vec<Datum>`. Because multiple crates implement `From<&str>`, Rust cannot infer the target type from `.into()` alone. Annotate the vector type explicitly:
+
+```rust
+use fluss::row::{Datum, GenericRow};
+
+let data: Vec<Datum> = vec![1i32.into(), "hello".into(), Datum::Null];
+let row = GenericRow::from_data(data);
+```
+
+## Reading Row Data
+
+```rust
+use fluss::row::InternalRow;
+
+for record in scan_records {
+    let row = record.row();
+
+    if row.is_null_at(0) {
+        // field is null
+    }
+    let id: i32 = row.get_int(0);
+    let name: &str = row.get_string(1);
+    let score: f32 = row.get_float(2);
+    let date: Date = row.get_date(3);
+    let ts: TimestampNtz = row.get_timestamp_ntz(4, 6);
+    let decimal: Decimal = row.get_decimal(5, 10, 2);
+}
+```
diff --git a/fluss-rust/website/docs/user-guide/rust/error-handling.md b/fluss-rust/website/docs/user-guide/rust/error-handling.md
new file mode 100644
index 0000000000..35ede6c85c
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/error-handling.md
@@ -0,0 +1,180 @@
+---
+sidebar_position: 4
+---
+# Error Handling
+
+The Fluss Rust client uses a unified `Error` type and a `Result<T>` alias for all fallible operations.
+
+## Basic Usage
+
+```rust
+use fluss::error::{Error, Result};
+
+// All operations return Result<T>
+let conn = FlussConnection::new(config).await?;
+let admin = conn.get_admin().await?;
+let table = conn.get_table(&table_path).await?;
+```
+
+Use the `?` operator to propagate errors, or `match` on specific variants for fine-grained handling.
+
+## Matching Error Variants
+
+```rust
+use fluss::error::Error;
+
+match result {
+    Ok(val) => {
+        // handle success
+    }
+    Err(Error::RpcError { message, .. }) => {
+        eprintln!("RPC failure: {}", message);
+    }
+    Err(Error::UnsupportedOperation { message }) => {
+        eprintln!("Unsupported: {}", message);
+    }
+    Err(Error::FlussAPIError { api_error }) => {
+        eprintln!("Server error: {}", api_error);
+    }
+    Err(e) => {
+        eprintln!("Unexpected error: {}", e);
+    }
+}
+```
+
+## Error Variants
+
+| Variant                        | Description                                                  |
+|--------------------------------|--------------------------------------------------------------|
+| `UnexpectedError`              | General unexpected errors with a message and optional source |
+| `IoUnexpectedError`            | I/O errors (network, file system)                            |
+| `RemoteStorageUnexpectedError` | Remote storage errors (OpenDAL backend failures)             |
+| `RpcError`                     | RPC communication failures (connection refused, timeout)     |
+| `RowConvertError`              | Row conversion failures (type mismatch, invalid data)        |
+| `ArrowError`                   | Arrow data handling errors (schema mismatch, encoding)       |
+| `IllegalArgument`              | Invalid arguments passed to an API method                    |
+| `UnsupportedOperation`         | Operation not supported on the table type                    |
+| `FlussAPIError`                | Server-side API errors returned by the Fluss cluster         |
+
+Server-side errors are represented as `FlussAPIError` with a specific error code. Use the `api_error()` helper to match them ergonomically:
+
+```rust
+use fluss::error::FlussError;
+
+match result {
+    Err(ref e) if e.api_error() == Some(FlussError::InvalidTableException) => {
+        eprintln!("Invalid table: {}", e);
+    }
+    Err(ref e) if e.api_error() == Some(FlussError::PartitionNotExists) => {
+        eprintln!("Partition does not exist: {}", e);
+    }
+    Err(ref e) if e.api_error() == Some(FlussError::LeaderNotAvailableException) => {
+        eprintln!("Leader not available: {}", e);
+    }
+    _ => {}
+}
+```
+
+## Common Error Scenarios
+
+### Connection Refused
+
+The Fluss cluster is not running or the address is incorrect.
+
+```rust
+let result = FlussConnection::new(config).await;
+match result {
+    Err(Error::RpcError { message, .. }) => {
+        eprintln!("Cannot connect to cluster: {}", message);
+    }
+    _ => {}
+}
+```
+
+### Table Not Found
+
+The table does not exist or has been dropped.
+
+```rust
+use fluss::error::{Error, FlussError};
+
+// Admin operations return FlussError::TableNotExist (code 7)
+let result = admin.drop_table(&table_path, false).await;
+match result {
+    Err(ref e) if e.api_error() == Some(FlussError::TableNotExist) => {
+        eprintln!("Table not found: {}", e);
+    }
+    _ => {}
+}
+
+// conn.get_table() wraps the error differently, so match on FlussAPIError directly
+let result = conn.get_table(&table_path).await;
+match result {
+    Err(Error::FlussAPIError { ref api_error }) => {
+        eprintln!("Server error (code {}): {}", api_error.code, api_error.message);
+    }
+    _ => {}
+}
+```
+
+### Partition Not Found
+
+The partition does not exist on a partitioned table.
+
+```rust
+use fluss::error::FlussError;
+
+let result = admin.drop_partition(&table_path, &spec, false).await;
+match result {
+    Err(ref e) if e.api_error() == Some(FlussError::PartitionNotExists) => {
+        eprintln!("Partition does not exist: {}", e);
+    }
+    _ => {}
+}
+```
+
+### Schema Mismatch
+
+Row data does not match the expected table schema.
+
+```rust
+let result = writer.append(&row);
+match result {
+    Err(Error::RowConvertError { .. }) => {
+        eprintln!("Row does not match table schema");
+    }
+    _ => {}
+}
+```
+
+## Using `Result<T>` in Application Code
+
+The `fluss::error::Result<T>` type alias makes it easy to use Fluss errors with the `?` operator in your application functions:
+
+```rust
+use fluss::error::Result;
+
+async fn my_pipeline() -> Result<()> {
+    let conn = FlussConnection::new(config).await?;
+    let admin = conn.get_admin().await?;
+    let table = conn.get_table(&table_path).await?;
+    let writer = table.new_append()?.create_writer()?;
+    writer.append(&row)?;
+    writer.flush().await?;
+    Ok(())
+}
+```
+
+For applications that use other error types alongside Fluss errors, you can convert with the standard `From` / `Into` traits or use a crate such as `anyhow`:
+
+```rust
+use anyhow::Result;
+
+#[tokio::main]
+async fn main() -> Result<()> {
+    let conn = FlussConnection::new(config).await?;
+    // fluss::error::Error implements std::error::Error,
+    // so it converts into anyhow::Error automatically
+    Ok(())
+}
+```
diff --git a/fluss-rust/website/docs/user-guide/rust/example/_category_.json b/fluss-rust/website/docs/user-guide/rust/example/_category_.json
new file mode 100644
index 0000000000..dd2229499b
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/example/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Example",
+  "position": 5
+}
diff --git a/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md b/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md
new file mode 100644
index 0000000000..7fcc4017a6
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md
@@ -0,0 +1,118 @@
+---
+sidebar_position: 3
+---
+# Admin Operations
+
+## Get Admin Interface
+
+```rust
+let admin = conn.get_admin().await?;
+```
+
+## Database Operations
+
+```rust
+// Create database
+admin.create_database("my_database", None, true).await?;
+
+// List all databases
+let databases = admin.list_databases().await?;
+println!("Databases: {:?}", databases);
+
+// Check if database exists
+let exists = admin.database_exists("my_database").await?;
+
+// Get database information
+let db_info = admin.get_database_info("my_database").await?;
+
+// Drop database
+admin.drop_database("my_database", true, false).await?;
+```
+
+## Table Operations
+
+```rust
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .column("amount", DataTypes::bigint())
+            .build()?,
+    )
+    .build()?;
+
+let table_path = TablePath::new("my_database", "my_table");
+
+// Create table
+admin.create_table(&table_path, &table_descriptor, true).await?;
+
+// Get table information
+let table_info = admin.get_table_info(&table_path).await?;
+println!("Table: {}", table_info);
+
+// List tables in database
+let tables = admin.list_tables("my_database").await?;
+
+// Check if table exists
+let exists = admin.table_exists(&table_path).await?;
+
+// Drop table
+admin.drop_table(&table_path, true).await?;
+```
+
+## Partition Operations
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+// List all partitions
+let partitions = admin.list_partition_infos(&table_path).await?;
+
+// List partitions matching a spec
+let mut filter = HashMap::new();
+filter.insert("year", "2024");
+let spec = PartitionSpec::new(filter);
+let partitions = admin.list_partition_infos_with_spec(&table_path, Some(&spec)).await?;
+
+// Create partition
+admin.create_partition(&table_path, &spec, true).await?;
+
+// Drop partition
+admin.drop_partition(&table_path, &spec, true).await?;
+```
+
+## Offset Operations
+
+```rust
+use fluss::rpc::message::OffsetSpec;
+
+let bucket_ids = vec![0, 1, 2];
+
+// Get earliest offsets
+let earliest = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Earliest).await?;
+
+// Get latest offsets
+let latest = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Latest).await?;
+
+// Get offsets for a specific timestamp
+let timestamp_ms = 1704067200000; // 2024-01-01 00:00:00 UTC
+let offsets = admin.list_offsets(
+    &table_path, &bucket_ids, OffsetSpec::Timestamp(timestamp_ms),
+).await?;
+
+// Get offsets for a specific partition
+let partition_offsets = admin.list_partition_offsets(
+    &table_path, "partition_name", &bucket_ids, OffsetSpec::Latest,
+).await?;
+```
+
+## Lake Snapshot
+
+```rust
+let snapshot = admin.get_latest_lake_snapshot(&table_path).await?;
+println!("Snapshot ID: {}", snapshot.snapshot_id);
+```
diff --git a/fluss-rust/website/docs/user-guide/rust/example/configuration.md b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
new file mode 100644
index 0000000000..a84c24dcad
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
@@ -0,0 +1,26 @@
+---
+sidebar_position: 2
+---
+# Configuration
+
+## Connection Setup
+
+```rust
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+
+let mut config = Config::default();
+config.bootstrap_servers = "127.0.0.1:9123".to_string();
+
+let conn = FlussConnection::new(config).await?;
+```
+
+## Connection Configurations
+
+| Option                    | Description                                           | Default          |
+|---------------------------|-------------------------------------------------------|------------------|
+| `bootstrap_servers`       | Coordinator server address                            | `127.0.0.1:9123` |
+| `writer_request_max_size` | Maximum request size in bytes                         | 10 MB            |
+| `writer_acks`             | Acknowledgment setting (`all` waits for all replicas) | `all`            |
+| `writer_retries`          | Number of retries on failure                          | `i32::MAX`       |
+| `writer_batch_size`       | Batch size for writes                                 | 2 MB             |
diff --git a/fluss-rust/website/docs/user-guide/rust/example/index.md b/fluss-rust/website/docs/user-guide/rust/example/index.md
new file mode 100644
index 0000000000..dcee87b0f6
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/example/index.md
@@ -0,0 +1,56 @@
+---
+sidebar_position: 1
+---
+# Example
+
+A minimal working example: connect to Fluss, create a table, write data, and read it back.
+
+```rust
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+use fluss::error::Result;
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+use fluss::row::{GenericRow, InternalRow};
+use std::time::Duration;
+
+#[tokio::main]
+async fn main() -> Result<()> {
+    // Connect
+    let mut config = Config::default();
+    config.bootstrap_servers = "127.0.0.1:9123".to_string();
+    let conn = FlussConnection::new(config).await?;
+    let admin = conn.get_admin().await?;
+
+    // Create a log table
+    let table_path = TablePath::new("fluss", "quickstart_rust");
+    let descriptor = TableDescriptor::builder()
+        .schema(
+            Schema::builder()
+                .column("id", DataTypes::int())
+                .column("name", DataTypes::string())
+                .build()?,
+        )
+        .build()?;
+    admin.create_table(&table_path, &descriptor, true).await?;
+
+    // Write
+    let table = conn.get_table(&table_path).await?;
+    let writer = table.new_append()?.create_writer()?;
+    let mut row = GenericRow::new(2);
+    row.set_field(0, 1);
+    row.set_field(1, "hello");
+    writer.append(&row)?;
+    writer.flush().await?;
+
+    // Read
+    let scanner = table.new_scan().create_log_scanner()?;
+    scanner.subscribe(0, 0).await?;
+    let records = scanner.poll(Duration::from_secs(5)).await?;
+    for record in records {
+        let row = record.row();
+        println!("id={}, name={}", row.get_int(0), row.get_string(1));
+    }
+
+    Ok(())
+}
+```
diff --git a/fluss-rust/website/docs/user-guide/rust/example/log-tables.md b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
new file mode 100644
index 0000000000..3ba33542fb
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
@@ -0,0 +1,140 @@
+---
+sidebar_position: 4
+---
+# Log Tables
+
+Log tables are append-only tables without primary keys, suitable for event streaming.
+
+## Creating a Log Table
+
+```rust
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("event_id", DataTypes::int())
+            .column("event_type", DataTypes::string())
+            .column("timestamp", DataTypes::bigint())
+            .build()?,
+    )
+    .build()?;
+
+let table_path = TablePath::new("fluss", "events");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+## Writing to Log Tables
+
+```rust
+use fluss::row::{GenericRow, InternalRow};
+
+let table = conn.get_table(&table_path).await?;
+let append_writer = table.new_append()?.create_writer()?;
+
+let mut row = GenericRow::new(3);
+row.set_field(0, 1);                    // event_id
+row.set_field(1, "user_login");         // event_type
+row.set_field(2, 1704067200000i64);     // timestamp
+
+append_writer.append(&row)?;
+append_writer.flush().await?;
+```
+
+Write operations use a **fire-and-forget** pattern for efficient batching. Each call queues the write and returns a `WriteResultFuture` immediately. Call `flush()` to ensure all queued writes are sent to the server.
+
+For per-record acknowledgment:
+
+```rust
+append_writer.append(&row)?.await?;
+```
+
+## Reading from Log Tables
+
+```rust
+use std::time::Duration;
+
+let table = conn.get_table(&table_path).await?;
+let log_scanner = table.new_scan().create_log_scanner()?;
+
+// Subscribe to bucket 0 starting from offset 0
+log_scanner.subscribe(0, 0).await?;
+
+// Poll for records
+let records = log_scanner.poll(Duration::from_secs(10)).await?;
+
+for record in records {
+    let row = record.row();
+    println!(
+        "event_id={}, event_type={}, timestamp={} @ offset={}",
+        row.get_int(0),
+        row.get_string(1),
+        row.get_long(2),
+        record.offset()
+    );
+}
+```
+
+**Subscribe from special offsets:**
+
+```rust
+use fluss::client::EARLIEST_OFFSET;
+
+log_scanner.subscribe(0, EARLIEST_OFFSET).await?;  // from earliest
+log_scanner.subscribe(0, 42).await?;                // from specific offset
+```
+
+**Subscribe from latest offset (only new records):**
+
+To start reading only new records, first resolve the current latest offset via `list_offsets`, then subscribe at that offset:
+
+```rust
+use fluss::rpc::message::OffsetSpec;
+
+let admin = conn.get_admin().await?;
+let offsets = admin.list_offsets(&table_path, &[0], OffsetSpec::Latest).await?;
+let latest = offsets[&0];
+log_scanner.subscribe(0, latest).await?;
+```
+
+**Subscribe to all buckets:**
+
+```rust
+let num_buckets = table.get_table_info().get_num_buckets();
+for bucket_id in 0..num_buckets {
+    log_scanner.subscribe(bucket_id, 0).await?;
+}
+```
+
+**Subscribe to multiple buckets at once:**
+
+```rust
+use std::collections::HashMap;
+
+let mut bucket_offsets = HashMap::new();
+bucket_offsets.insert(0, 0i64);
+bucket_offsets.insert(1, 100i64);
+log_scanner.subscribe_buckets(&bucket_offsets).await?;
+```
+
+**Unsubscribe from a bucket:**
+
+```rust
+// Non-partitioned tables
+log_scanner.unsubscribe(bucket_id).await?;
+
+// Partitioned tables
+log_scanner.unsubscribe_partition(partition_id, bucket_id).await?;
+```
+
+## Column Projection
+
+```rust
+// Project by column index
+let scanner = table.new_scan().project(&[0, 2])?.create_log_scanner()?;
+
+// Project by column name
+let scanner = table.new_scan()
+    .project_by_name(&["event_id", "timestamp"])?
+    .create_log_scanner()?;
+```
diff --git a/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md b/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
new file mode 100644
index 0000000000..3edf4d88ce
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
@@ -0,0 +1,215 @@
+---
+sidebar_position: 6
+---
+# Partitioned Tables
+
+Partitioned tables distribute data across partitions based on partition column values, enabling efficient data organization and querying. Both log tables and primary key tables support partitioning.
+
+## Partitioned Log Tables
+
+### Creating a Partitioned Log Table
+
+```rust
+use fluss::metadata::{DataTypes, LogFormat, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("event_id", DataTypes::int())
+            .column("event_type", DataTypes::string())
+            .column("dt", DataTypes::string())
+            .column("region", DataTypes::string())
+            .build()?,
+    )
+    .partitioned_by(vec!["dt", "region"])
+    .log_format(LogFormat::ARROW)
+    .build()?;
+
+let table_path = TablePath::new("fluss", "partitioned_events");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+### Writing to Partitioned Log Tables
+
+**Partitions must exist before writing data; otherwise, the client will retry indefinitely by default.** Include partition column values in each row; the client routes records to the correct partition automatically.
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+let table = conn.get_table(&table_path).await?;
+
+// Create the partition before writing
+let mut partition_values = HashMap::new();
+partition_values.insert("dt", "2024-01-15");
+partition_values.insert("region", "US");
+admin.create_partition(&table_path, &PartitionSpec::new(partition_values), true).await?;
+
+let append_writer = table.new_append()?.create_writer()?;
+
+let mut row = GenericRow::new(4);
+row.set_field(0, 1);              // event_id
+row.set_field(1, "user_login");   // event_type
+row.set_field(2, "2024-01-15");   // dt (partition column)
+row.set_field(3, "US");           // region (partition column)
+
+append_writer.append(&row)?;
+append_writer.flush().await?;
+```
+
+### Reading from Partitioned Log Tables
+
+For partitioned tables, use partition-aware subscribe methods.
+
+```rust
+use std::time::Duration;
+
+let table = conn.get_table(&table_path).await?;
+let admin = conn.get_admin().await?;
+let partitions = admin.list_partition_infos(&table_path).await?;
+
+let log_scanner = table.new_scan().create_log_scanner()?;
+
+// Subscribe to each partition's buckets
+for partition_info in &partitions {
+    let partition_id = partition_info.get_partition_id();
+    let num_buckets = table.get_table_info().get_num_buckets();
+    for bucket_id in 0..num_buckets {
+        log_scanner.subscribe_partition(partition_id, bucket_id, 0).await?;
+    }
+}
+
+let records = log_scanner.poll(Duration::from_secs(10)).await?;
+for record in records {
+    println!("Record: {:?}", record.row());
+}
+```
+
+Subscribe to multiple partition-buckets at once:
+
+```rust
+use std::collections::HashMap;
+
+let mut partition_bucket_offsets = HashMap::new();
+partition_bucket_offsets.insert((partition_id, 0), 0i64);
+partition_bucket_offsets.insert((partition_id, 1), 0i64);
+log_scanner.subscribe_partition_buckets(&partition_bucket_offsets).await?;
+```
+
+### Managing Partitions
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+// Create a partition
+let mut partition_values = HashMap::new();
+partition_values.insert("dt", "2024-01-15");
+partition_values.insert("region", "EMEA");
+let spec = PartitionSpec::new(partition_values);
+admin.create_partition(&table_path, &spec, true).await?;
+
+// List all partitions
+let partitions = admin.list_partition_infos(&table_path).await?;
+for partition in &partitions {
+    println!(
+        "Partition: id={}, name={}",
+        partition.get_partition_id(),
+        partition.get_partition_name()
+    );
+}
+
+// List with filter
+let mut partial_values = HashMap::new();
+partial_values.insert("dt", "2024-01-15");
+let partial_spec = PartitionSpec::new(partial_values);
+let filtered = admin.list_partition_infos_with_spec(
+    &table_path, Some(&partial_spec),
+).await?;
+
+// Drop a partition
+admin.drop_partition(&table_path, &spec, true).await?;
+```
+
+## Partitioned Primary Key Tables
+
+Partitioned KV tables combine partitioning with primary key operations. Partition columns must be part of the primary key.
+
+### Creating a Partitioned Primary Key Table
+
+```rust
+use fluss::metadata::{DataTypes, KvFormat, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("user_id", DataTypes::int())
+            .column("region", DataTypes::string())
+            .column("zone", DataTypes::bigint())
+            .column("score", DataTypes::bigint())
+            .primary_key(vec!["user_id", "region", "zone"])
+            .build()?,
+    )
+    .partitioned_by(vec!["region", "zone"])
+    .kv_format(KvFormat::COMPACTED)
+    .build()?;
+
+let table_path = TablePath::new("fluss", "partitioned_users");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+### Writing to Partitioned Primary Key Tables
+
+**Partitions must exist before upserting data; otherwise, the client will retry indefinitely by default.**
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+let table = conn.get_table(&table_path).await?;
+
+// Create partitions first
+for (region, zone) in [("APAC", "1"), ("EMEA", "2"), ("US", "3")] {
+    let mut values = HashMap::new();
+    values.insert("region", region);
+    values.insert("zone", zone);
+    admin.create_partition(&table_path, &PartitionSpec::new(values), true).await?;
+}
+
+let table_upsert = table.new_upsert()?;
+let upsert_writer = table_upsert.create_writer()?;
+
+for (user_id, region, zone, score) in [
+    (1001, "APAC", 1i64, 1234i64),
+    (1002, "EMEA", 2, 2234),
+    (1003, "US", 3, 3234),
+] {
+    let mut row = GenericRow::new(4);
+    row.set_field(0, user_id);
+    row.set_field(1, region);
+    row.set_field(2, zone);
+    row.set_field(3, score);
+    upsert_writer.upsert(&row)?;
+}
+upsert_writer.flush().await?;
+```
+
+### Looking Up Records in Partitioned Tables
+
+Lookup requires all primary key columns, including partition columns.
+
+```rust
+let mut lookuper = table.new_lookup()?.create_lookuper()?;
+
+let mut key = GenericRow::new(3);
+key.set_field(0, 1001);    // user_id
+key.set_field(1, "APAC");  // region (partition column)
+key.set_field(2, 1i64);    // zone (partition column)
+
+let result = lookuper.lookup(&key).await?;
+if let Some(row) = result.get_single_row()? {
+    println!("Found: score={}", row.get_long(3));
+}
+```
+
+> **Note:** Scanning partitioned primary key tables is not supported. Use lookup operations instead.
diff --git a/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
new file mode 100644
index 0000000000..5b299cca3a
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
@@ -0,0 +1,114 @@
+---
+sidebar_position: 5
+---
+# Primary Key Tables
+
+Primary key tables (KV tables) support upsert, delete, and lookup operations.
+
+## Creating a Primary Key Table
+
+```rust
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .column("age", DataTypes::bigint())
+            .primary_key(vec!["id"])
+            .build()?,
+    )
+    .build()?;
+
+let table_path = TablePath::new("fluss", "users");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+## Upserting Records
+
+```rust
+use fluss::row::{GenericRow, InternalRow};
+
+let table = conn.get_table(&table_path).await?;
+let table_upsert = table.new_upsert()?;
+let upsert_writer = table_upsert.create_writer()?;
+
+for (id, name, age) in [(1, "Alice", 25i64), (2, "Bob", 30), (3, "Charlie", 35)] {
+    let mut row = GenericRow::new(3);
+    row.set_field(0, id);
+    row.set_field(1, name);
+    row.set_field(2, age);
+    upsert_writer.upsert(&row)?;
+}
+upsert_writer.flush().await?;
+```
+
+## Updating Records
+
+Upsert with the same primary key to update an existing record.
+
+```rust
+let mut row = GenericRow::new(3);
+row.set_field(0, 1);        // id (primary key)
+row.set_field(1, "Alice");
+row.set_field(2, 26i64);    // updated age
+
+upsert_writer.upsert(&row)?;
+upsert_writer.flush().await?;
+```
+
+## Deleting Records
+
+```rust
+// Only the primary key field needs to be set
+let mut row = GenericRow::new(3);
+row.set_field(0, 2);  // id of record to delete
+
+upsert_writer.delete(&row)?;
+upsert_writer.flush().await?;
+```
+
+## Partial Updates
+
+Update only specific columns while preserving others.
+
+```rust
+// By column indices
+let partial_upsert = table_upsert.partial_update(Some(vec![0, 2]))?;
+let partial_writer = partial_upsert.create_writer()?;
+
+let mut row = GenericRow::new(3);
+row.set_field(0, 1);       // id (primary key, required)
+row.set_field(2, 27i64);   // age (will be updated)
+// name will remain unchanged
+
+partial_writer.upsert(&row)?;
+partial_writer.flush().await?;
+
+// By column names
+let partial_upsert = table_upsert.partial_update_with_column_names(&["id", "age"])?;
+let partial_writer = partial_upsert.create_writer()?;
+```
+
+## Looking Up Records
+
+```rust
+let mut lookuper = table.new_lookup()?.create_lookuper()?;
+
+let mut key = GenericRow::new(1);
+key.set_field(0, 1);  // id to lookup
+
+let result = lookuper.lookup(&key).await?;
+
+if let Some(row) = result.get_single_row()? {
+    println!(
+        "Found: id={}, name={}, age={}",
+        row.get_int(0),
+        row.get_string(1),
+        row.get_long(2)
+    );
+} else {
+    println!("Record not found");
+}
+```
diff --git a/fluss-rust/website/docs/user-guide/rust/installation.md b/fluss-rust/website/docs/user-guide/rust/installation.md
new file mode 100644
index 0000000000..e698783195
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/installation.md
@@ -0,0 +1,76 @@
+---
+sidebar_position: 1
+---
+# Installation
+
+The Fluss Rust client is published to [crates.io](https://crates.io/crates/fluss-rs) as `fluss-rs`. The crate's library name is `fluss`, so you import it with `use fluss::...`.
+
+```toml
+[dependencies]
+fluss-rs = "0.1"
+tokio = { version = "1", features = ["full"] }
+```
+
+## Feature Flags
+
+```toml
+[dependencies]
+# Pick ONE of the entries below. Default features: memory and filesystem storage
+fluss-rs = "0.1"
+
+# With S3 storage support
+fluss-rs = { version = "0.1", features = ["storage-s3"] }
+
+# With OSS storage support
+fluss-rs = { version = "0.1", features = ["storage-oss"] }
+
+# All storage backends
+fluss-rs = { version = "0.1", features = ["storage-all"] }
+```
+
+Available features:
+- `storage-memory`: In-memory storage (enabled by default)
+- `storage-fs`: Local filesystem storage (enabled by default)
+- `storage-s3`: Amazon S3 storage
+- `storage-oss`: Alibaba OSS storage
+- `storage-all`: All storage backends
+
+## Git or Path Dependency
+
+For development against unreleased changes:
+
+```toml
+[dependencies]
+# From Git
+fluss = { git = "https://github.com/apache/fluss-rust.git", package = "fluss-rs" }
+
+# From local path
+fluss = { path = "/path/to/fluss-rust/crates/fluss", package = "fluss-rs" }
+```
+
+> **Note:** When using `git` or `path` dependencies, the `package = "fluss-rs"` field is required so that Cargo resolves the correct package while still allowing `use fluss::...` imports.
+
+## Building from Source
+
+**Prerequisites:** Rust 1.85+, Protobuf compiler (`protoc`)
+
+```bash
+git clone https://github.com/apache/fluss-rust.git
+cd fluss-rust
+```
+
+Install `protoc`:
+
+```bash
+# macOS
+brew install protobuf
+
+# Ubuntu/Debian
+sudo apt-get install protobuf-compiler
+```
+
+Build:
+
+```bash
+cargo build --workspace --all-targets
+```
diff --git a/fluss-rust/website/docusaurus.config.ts b/fluss-rust/website/docusaurus.config.ts
new file mode 100644
index 0000000000..0d974e95df
--- /dev/null
+++ b/fluss-rust/website/docusaurus.config.ts
@@ -0,0 +1,84 @@
+import {themes as prismThemes} from 'prism-react-renderer';
+import type {Config} from '@docusaurus/types';
+import type * as Preset from '@docusaurus/preset-classic';
+
+const config: Config = { // Docusaurus site configuration for the Fluss client docs site
+  title: 'Apache Fluss Clients',
+  tagline: 'Rust, Python, and C++ clients for Apache Fluss',
+  favicon: 'img/logo/fluss_favicon.svg',
+
+  url: 'https://fluss.apache.org/', // production origin; the site lives under baseUrl below
+  baseUrl: '/fluss-rust/',
+
+  organizationName: 'apache',
+  projectName: 'fluss-rust',
+
+  onBrokenLinks: 'throw', // fail the build when a broken link is detected
+
+  i18n: {
+    defaultLocale: 'en',
+    locales: ['en'],
+  },
+
+  presets: [
+    [
+      'classic',
+      {
+        docs: {
+          routeBasePath: '/', // serve the docs at the site root rather than under /docs
+          sidebarPath: './sidebars.ts',
+          editUrl: 'https://github.com/apache/fluss-rust/edit/main/website/',
+        },
+        blog: false, // blog plugin disabled
+        theme: {
+          customCss: './src/css/custom.css',
+        },
+      } satisfies Preset.Options,
+    ],
+  ],
+
+  themeConfig: {
+    image: 'img/logo/png/colored_logo.png',
+    colorMode: {
+      defaultMode: 'light',
+      disableSwitch: true, // no light/dark toggle is shown
+    },
+    navbar: {
+      title: '', // no text title next to the logo
+      logo: {
+        alt: 'Fluss',
+        src: 'img/logo/svg/colored_logo.svg',
+      },
+      items: [
+        {
+          type: 'docSidebar',
+          sidebarId: 'docsSidebar', // must match the sidebar key exported from sidebars.ts
+          position: 'left',
+          label: 'Client Docs',
+        },
+        {
+          href: 'https://fluss.apache.org/',
+          label: 'Fluss',
+          position: 'left',
+        },
+        {
+          href: 'https://github.com/apache/fluss-rust',
+          position: 'right',
+          className: 'header-github-link', // styled in src/css/custom.css (icon via ::before)
+          'aria-label': 'GitHub repository',
+        },
+      ],
+    },
+    footer: {
+      style: 'dark',
+      copyright: `Copyright © ${new Date().getFullYear()} The Apache Software Foundation, Licensed under the Apache License, Version 2.0.`, // year is computed when this config is evaluated
+    },
+    prism: {
+      theme: prismThemes.vsDark,
+      darkTheme: prismThemes.dracula, // NOTE(review): presumably unused while the color-mode switch is disabled — confirm
+      additionalLanguages: ['rust', 'toml', 'bash', 'cmake'],
+    },
+  } satisfies Preset.ThemeConfig,
+};
+
+export default config;
diff --git a/fluss-rust/website/package.json b/fluss-rust/website/package.json
new file mode 100644
index 0000000000..644a705184
--- /dev/null
+++ b/fluss-rust/website/package.json
@@ -0,0 +1,43 @@
+{
+  "name": "fluss-clients-website",
+  "version": "0.0.0",
+  "private": true,
+  "scripts": {
+    "docusaurus": "docusaurus",
+    "start": "docusaurus start",
+    "build": "docusaurus build",
+    "swizzle": "docusaurus swizzle",
+    "clear": "docusaurus clear",
+    "serve": "docusaurus serve"
+  },
+  "dependencies": {
+    "@docusaurus/core": "^3.9.2",
+    "@docusaurus/preset-classic": "^3.9.2",
+    "@mdx-js/react": "^3.0.0",
+    "clsx": "^2.0.0",
+    "prism-react-renderer": "^2.3.0",
+    "react": "^18.0.0",
+    "react-dom": "^18.0.0"
+  },
+  "devDependencies": {
+    "@docusaurus/module-type-aliases": "^3.9.2",
+    "@docusaurus/tsconfig": "^3.9.2",
+    "@docusaurus/types": "^3.9.2",
+    "typescript": "~5.5.2"
+  },
+  "browserslist": {
+    "production": [
+      ">0.5%",
+      "not dead",
+      "not op_mini all"
+    ],
+    "development": [
+      "last 3 chrome version",
+      "last 3 firefox version",
+      "last 5 safari version"
+    ]
+  },
+  "engines": {
+    "node": ">=20.0"
+  }
+}
diff --git a/fluss-rust/website/sidebars.ts b/fluss-rust/website/sidebars.ts
new file mode 100644
index 0000000000..51bdd5cf7a
--- /dev/null
+++ b/fluss-rust/website/sidebars.ts
@@ -0,0 +1,24 @@
+import type {SidebarsConfig} from '@docusaurus/plugin-content-docs';
+
+const sidebars: SidebarsConfig = { // sidebar definitions consumed via sidebarPath in docusaurus.config.ts
+  docsSidebar: [ // referenced by sidebarId 'docsSidebar' in the navbar config
+    'index',
+    {
+      type: 'category',
+      label: 'User Guide',
+      items: [
+        {type: 'autogenerated', dirName: 'user-guide'}, // items generated from the user-guide docs directory
+      ],
+    },
+    {
+      type: 'category',
+      label: 'Developer Guide',
+      items: [
+        'developer-guide/contributing', // explicit doc id
+      ],
+    },
+    'release',
+  ],
+};
+
+export default sidebars;
diff --git a/fluss-rust/website/src/css/custom.css b/fluss-rust/website/src/css/custom.css
new file mode 100644
index 0000000000..9143372f85
--- /dev/null
+++ b/fluss-rust/website/src/css/custom.css
@@ -0,0 +1,209 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *    http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/**
+ * Copied from the main fluss.apache.org website (fluss/website/src/css/custom.css)
+ * to ensure visual consistency.
+ */
+
+/* Import Inter font from Google Fonts */
+@import url('https://fonts.googleapis.com/css2?family=Inter:wght@400;500;600;700;800&display=swap');
+
+/* You can override the default Infima variables here. */
+:root {
+  --ifm-color-primary: #0071e3; /* base primary color; the six entries below are its darker/lighter shades */
+  --ifm-color-primary-dark: #0066cc;
+  --ifm-color-primary-darker: #0060c1;
+  --ifm-color-primary-darkest: #004f9f;
+  --ifm-color-primary-light: #007cfa;
+  --ifm-color-primary-lighter: #0682ff;
+  --ifm-color-primary-lightest: #2893ff;
+  --ifm-code-font-size: 90%;
+  --ifm-font-family-base: 'Inter', -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, 'Helvetica Neue', Arial, 'PingFang SC', 'Hiragino Sans GB', 'Microsoft YaHei', sans-serif; /* Inter comes from the Google Fonts @import above */
+  --docusaurus-highlighted-code-line-bg: #E2E9F3;
+
+  --ifm-menu-color-background-active: #edeefa99; /* 8-digit hex: trailing 99 is the alpha channel */
+  --ifm-menu-color-background-hover: #edeefa99;
+}
+
+
+.navbar__brand { /* font and color of the navbar brand area */
+  font-family: monaco; /* NOTE(review): no generic fallback family is listed — confirm this is intended */
+  color: inherit;
+}
+
+.header-github-link:hover { /* dim the link while hovered */
+  opacity: 0.6;
+}
+
+.header-github-link::before { /* 24x24 pseudo-element that carries the link's icon */
+  content: ''; /* empty content so the pseudo-element is generated */
+  width: 24px;
+  height: 24px;
+  display: flex;
+  background: url("data:image/svg+xml,%3Csvg viewBox='0 0 24 24' xmlns='http://www.w3.org/2000/svg'%3E%3Cpath d='M12 .297c-6.63 0-12 5.373-12 12 0 5.303 3.438 9.8 8.205 11.385.6.113.82-.258.82-.577 0-.285-.01-1.04-.015-2.04-3.338.724-4.042-1.61-4.042-1.61C4.422 18.07 3.633 17.7 3.633 17.7c-1.087-.744.084-.729.084-.729 1.205.084 1.838 1.236 1.838 1.236 1.07 1.835 2.809 1.305 3.495.998.108-.776.417-1.305.76-1.605-2.665-.3-5.466-1.332-5.466-5.93 0-1.31.465-2.38 1.235-3.22-.135-.303-.54-1.523.105-3.176 0 0 1.005-.322 3.3 1.23.96-.267 1.98-.399 3-.405 1.02.006 2.04.138 3 .405 2.28-1.552 3.285-1.23 3.285-1.23.645 1.653.24 2.873.12 3.176.765.84 1.23 1.91 1.23 3.22 0 4.61-2.805 5.625-5.475 5.92.42.36.81 1.096.81 2.22 0 1.606-.015 2.896-.015 3.286 0 .315.21.69.825.57C20.565 22.092 24 17.592 24 12.297c0-6.627-5.373-12-12-12'/%3E%3C/svg%3E")
+  no-repeat; /* inline SVG data URI, drawn once */
+}
+
+
+.menu__list-item { /* sidebar menu entries: slightly smaller, medium-weight text */
+  font-size: 0.95rem;
+  font-weight: 500;
+}
+
+.menu__link--sublist-caret:after { /* caret icon on collapsible menu links */
+  background: var(--ifm-menu-link-sublist-icon) 50% / 1.5rem 1.5rem; /* centered, sized 1.5rem x 1.5rem */
+}
+
+
+.markdown { /* typography, inline-code, table and list styling scoped to .markdown; uses nested rules */
+    padding-left: 1rem;
+    h1,
+    h2,
+    h3,
+    h4,
+    h5,
+    h6 { /* shared heading defaults; h1-h3 are refined further below */
+        color: #1d1d1d;
+        margin-bottom: 0.3125rem;
+        font-weight: 700;
+    }
+
+    b,
+    strong {
+        font-weight: 700;
+        color: #1d1d1d;
+    }
+
+    h1,
+    h1:first-child {
+        font-size: 2.5rem;
+        margin-bottom: 1.5rem;
+        margin-top: 0;
+    }
+
+    h2 {
+        font-size: 2rem;
+        margin-bottom: 1.25rem;
+        margin-top: 2rem;
+        padding-top: 2rem;
+        border-top: 1px solid #e6e7e9; /* divider line above each h2 */
+    }
+
+    h3 {
+        font-size: 1.5rem;
+        margin-bottom: 1.25rem;
+        margin-top: 1rem;
+    }
+    p {
+        line-height: 1.875;
+
+        code { /* inline code inside paragraphs; same declarations as `li > code` and `table tr code` below */
+          border-radius: 4px;
+          background-color: #edf2fa;
+          border: none;
+          padding: 3px 4px;
+          font-size: 14px;
+          color: #4c576c;
+      }
+    }
+
+    li > code {
+        border-radius: 4px;
+        background-color: #edf2fa;
+        border: none;
+        padding: 3px 4px;
+        font-size: 14px;
+        color: #4c576c;
+    }
+
+    table thead tr {
+        background-color: #f7f9fe;
+    }
+
+    table thead th {
+        background-color: #f7f9fe;
+        color: #1d1d1d;
+        font-size: 1rem;
+        font-weight: 500;
+    }
+
+    table tr {
+        border-bottom: none;
+        background-color: var(--global-colors-white); /* NOTE(review): --global-colors-white is not defined in this stylesheet — confirm it is provided elsewhere */
+        font-size: var(--global-font-size-small); /* NOTE(review): --global-font-size-small is not defined in this stylesheet — confirm it is provided elsewhere */
+
+        code {
+            border-radius: 4px;
+            background-color: #edf2fa;
+            border: none;
+            padding: 3px 4px;
+            font-size: 14px;
+            color: #4c576c;
+        }
+    }
+
+    table tr th {
+        padding: 0.53rem 0.8125rem;
+        border-color: #dfe5f0;
+    }
+
+    table tr td {
+        padding: 0.65rem 0.8125rem;
+        border-color: #dfe5f0;
+    }
+    a {
+        color: var(--ifm-color-primary); /* links use the primary color set in :root */
+    }
+    ul {
+        padding-left: 20px;
+        li {
+            margin-top: 4px;
+            position: relative;
+            list-style: initial;
+        }
+    }
+    ol {
+        padding-left: 20px;
+        li {
+            list-style: decimal;
+        }
+    }
+}
+
+.theme-doc-markdown { /* adjustments to the header element inside .theme-doc-markdown */
+    header {
+        margin-top: 1rem;
+
+        & + h1 { /* hides an h1 that immediately follows the header element */
+            display: none;
+        }
+    }
+}
+
+.breadcrumbs__item--active .breadcrumbs__link { /* active breadcrumb link */
+  background: var(--ifm-menu-color-background-active); /* same variable that :root sets for the active menu background */
+}
+
+.footer__copyright { /* small, centered, semi-transparent copyright line in the footer */
+    color: #dfe5f0;
+    font-size: .75rem;
+    line-height: 1.8;
+    opacity: .6;
+    text-align: center;
+    width: 98%;
+}
diff --git a/fluss-rust/website/static/img/logo/fluss_favicon.svg b/fluss-rust/website/static/img/logo/fluss_favicon.svg
new file mode 100644
index 0000000000..7c044d55d5
--- /dev/null
+++ b/fluss-rust/website/static/img/logo/fluss_favicon.svg
@@ -0,0 +1,19 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+<svg width="142" height="144" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" xml:space="preserve" overflow="hidden"><defs><clipPath id="clip0"><rect x="118" y="81" width="142" height="144"/></clipPath><clipPath id="clip1"><rect x="118" y="81" width="142" height="144"/></clipPath><clipPath id="clip2"><rect x="119" y="82" width="141" height="143"/></clipPath><clipPath id="clip3"><rect x="119" y="82" width="141" height="143"/></clipPath><clipPath id="clip4"><rect x="119" y="82" width="401" height="173"/></clipPath><linearGradient x1="59.1276" y1="1.49011" x2="59.1276" y2="126.123" gradientUnits="userSpaceOnUse" spreadMethod="pad" id="fill5"><stop offset="0" stop-color="#FFFFFF" stop-opacity="1"/><stop offset="0.335714" stop-color="#FFFFFF" stop-opacity="1"/><stop offset="1" stop-color="#96A1FF" stop-opacity="1"/></linearGradient><linearGradient x1="69.5384" y1="92.8835" x2="69.5384" y2="170.369" gradientUnits="userSpaceOnUse" spreadMethod="pad" id="fill6"><stop offset="0" stop-color="#002CDC" stop-opacity="1"/><stop offset="1" stop-color="#3B5FEE" stop-opacity="1"/></linearGradient></defs><g clip-path="url(#clip0)" transform="translate(-118 -81)"><g clip-path="url(#clip1)"><g clip-path="url(#clip2)"><g clip-path="url(#clip3)"><g clip-path="url(#clip4)"><path d="M53.1018 21.9594C53.1018 24.9913 51.0461 27.4492 48.5103 27.4492 45.9745 27.4492 43.9188 24.9913 43.9188 21.9594 43.9188 18.9274 45.9745 16.4695 48.5103 16.4695 51.0461 16.4695 53.1018 18.9274 53.1018 21.9594Z" fill="#000000" fill-rule="nonzero" fill-opacity="1" transform="matrix(0.650313 -0.761909 0.753395 0.657662 121.741 121.546)"/><path d="M113.737 21.7028C113.737 23.7968 111.727 25.4944 109.247 25.4944 106.767 25.4944 104.757 23.7968 104.757 21.7028 104.757 19.6088 106.767 17.9113 109.247 17.9113 111.727 17.9113 113.737 19.6088 113.737 21.7028Z" fill="#000000" fill-rule="nonzero" fill-opacity="1" transform="matrix(0.778888 -0.627162 0.620154 0.78769 130.596 151.964)"/><path 
d="M13.0434 119.963C9.0102 119.963 7.80818 118.503 7.50022 117.281 7.04326 115.443 8.52343 113.377 11.3546 111.877 20.9808 106.781 34.7494 96.6879 41.8523 85.0253L42.2993 84.2902 43.1636 84.3101C43.9483 84.3299 44.6139 84.6875 45.051 85.3134 46.2828 87.1214 45.2696 90.5089 42.647 97.8005 41.6039 100.711 40.5211 103.721 40.3224 105.291 39.4581 111.996 33.5374 116.089 20.5238 118.97 17.5337 119.636 15.0203 119.963 13.0434 119.963Z" fill="#B0B7F3" fill-rule="nonzero" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M20.8459 120.425 20.8476 120.425C33.9046 117.534 40.889 112.552 41.8007 105.478 41.918 104.551 42.6561 102.192 44.0149 98.4003L44.0492 98.3049C46.7341 90.84 47.4752 86.2251 46.2726 84.4602 45.5323 83.4001 44.5073 82.8535 43.1977 82.8203L41.4732 82.7807 40.5796 84.2502C37.4024 89.467 32.7408 94.6401 26.5948 99.7696 21.4547 104.06 16.1421 107.656 10.657 110.56 6.90856 112.546 5.37466 114.908 6.0553 117.645 6.69515 120.184 9.02453 121.454 13.0434 121.454 15.1638 121.454 17.7647 121.111 20.8459 120.425ZM38.8441 105.104C38.1113 110.789 31.8972 114.926 20.2017 117.515L20.2001 117.515C17.3313 118.154 14.9458 118.473 13.0434 118.473 10.5727 118.473 9.20664 117.955 8.94515 116.917 8.64093 115.694 9.67664 114.453 12.0523 113.194 17.7206 110.193 23.2046 106.481 28.5044 102.058 34.903 96.7173 39.7765 91.2982 43.1249 85.8004L43.1253 85.7997 43.1293 85.7998C43.4305 85.8074 43.6638 85.9297 43.8293 86.1666 44.4482 87.0751 43.5867 90.7849 41.2448 97.2962L41.2094 97.3949C39.7772 101.391 38.9888 103.961 38.8441 105.104Z" fill="#000000" fill-rule="evenodd" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M104.427 71.7641C102.46 71.7641 100.433 70.9892 98.8738 69.6382 98.0989 68.9726 91.3934 62.7638 93.4895 50.1277L94.1154 46.3428 96.2115 49.5615C97.2446 51.1608 99.1122 52.8695 101.089 54.6874 103.751 57.1312 106.761 59.9028 108.818 63.3003 110.586 66.2308 109.94 68.2673 109.404 69.221 108.5 70.8104 106.652 71.7641 104.437 
71.7641L104.427 71.7641Z" fill="#B0B7F3" fill-rule="nonzero" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M104.427 73.2542 104.437 73.2542C107.362 73.2542 109.45 72.1533 110.703 69.9515 111.947 67.7393 111.744 65.2651 110.093 62.5287 108.64 60.1293 105.975 57.1499 102.098 53.5906L102.02 53.5187C99.5929 51.2873 98.0731 49.6971 97.4601 48.7483L93.271 42.3156 92.0195 49.8838C91.0855 55.5146 91.6645 60.5553 93.7565 65.0058 94.9134 67.467 96.294 69.3866 97.8981 70.7645 99.8143 72.4243 101.991 73.2542 104.427 73.2542ZM108.105 68.4904C107.429 69.6795 106.206 70.274 104.437 70.274L104.427 70.274C102.731 70.274 101.206 69.6866 99.8494 68.5119 98.5616 67.4056 97.4296 65.8143 96.4536 63.738 94.6248 59.8475 94.1268 55.392 94.9596 50.3715L94.9598 50.37 94.9628 50.3746C95.7092 51.5302 97.3891 53.3095 100.002 55.7125L100.08 55.7843C103.75 59.1528 106.238 61.9153 107.543 64.0718 108.595 65.8145 108.782 67.2873 108.105 68.4904Z" fill="#000000" fill-rule="evenodd" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M35.1375 123.838C33.4288 116.447 35.813 108.579 38.1078 100.97 39.5482 96.1916 40.9191 91.6716 41.088 87.7476 41.4556 79.254 43.2437 62.7337 43.8894 56.952 42.9556 57.3096 41.5748 57.9951 39.7072 59.2766 35.8527 61.9389 24.1306 70.0352 14.3256 70.0352 13.7693 70.0352 13.2229 70.0054 12.7064 69.9557 9.74601 69.6676 7.40157 67.3629 7.00421 64.3529 6.77572 62.5946 6.86513 56.5547 17.7827 52.4718 20.8523 51.3393 23.7233 49.0246 27.3591 46.0841 30.091 43.8788 33.1904 41.3754 37.1442 38.723 38.4555 37.8289 39.8661 37.223 41.2271 36.6368 44.9822 35.0176 48.2207 33.6268 49.5916 26.5637 51.8565 14.9011 54.7374 8.91086 65.8536 4.23191 70.1054 2.44378 75.2016 1.49011 80.5759 1.49011 88.1457 1.49011 95.6857 3.37758 100.752 6.52668 109.147 11.752 111.938 23.1563 111.183 29.2161 110.289 36.3885 105.898 41.7231 96.9771 46.4418 95.0201 54.1009 93.1723 64.8695 94.9307 74.0982 95.1194 74.4161 95.4472 74.9724 95.5168 75.0916 97.2552 77.6944 
99.699 79.2739 102.053 80.7938 104.487 82.3634 107.011 83.9926 108.6 86.6946 109.723 88.6616 109.951 91.7709 109.286 96.2115L109.107 97.4532 107.855 97.483C100.235 97.6718 82.9495 98.844 73.4035 104.298 63.8576 109.752 47.267 117.063 37.5117 124.683L35.664 126.123 35.1375 123.848 35.1375 123.838Z" fill="url(#fill5)" fill-rule="nonzero" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M33.6475 124.004C32.5122 118.832 33.5168 111.033 36.6611 100.606L36.6812 100.54 36.716 100.424C38.5319 94.4006 39.493 90.1538 39.5993 87.6836 39.8524 81.8341 40.6886 72.4405 42.1077 59.5029 41.6156 59.7963 41.0965 60.1305 40.5503 60.5052 29.914 67.852 21.1724 71.5253 14.3256 71.5253 13.7495 71.5253 13.1622 71.4965 12.5637 71.439 8.42584 71.0363 6.08023 68.7393 5.52692 64.5479 5.26244 62.5126 5.73332 60.5004 6.93955 58.5114 8.80904 55.4286 12.2494 52.9501 17.2607 51.076 19.1687 50.3722 22.2224 48.322 26.422 44.9255L26.4427 44.9089C30.3576 41.7485 33.648 39.274 36.314 37.4855 37.2569 36.8426 38.6919 36.1062 40.6189 35.2763L40.6377 35.2682 40.647 35.2643C42.8894 34.2973 44.4268 33.4021 45.2593 32.5786 46.6182 31.2344 47.5747 29.1348 48.1288 26.2798 49.3784 19.8453 51.0584 15.0669 53.1688 11.9445 55.6817 8.22673 59.7173 5.19805 65.2756 2.85851 69.8068 0.952836 74.907 0 80.5759 0 88.9082 0 95.8958 1.75371 101.539 5.26112 105.66 7.82616 108.743 11.7457 110.788 17.0196 112.512 21.4644 113.136 25.5913 112.661 29.4004 111.753 36.6828 106.953 42.6971 98.2611 47.4434 95.6866 57.7621 95.0486 66.4696 96.3471 73.5659L96.4468 73.7343 96.7784 74.2975C97.8311 75.8552 99.8588 77.6034 102.862 79.5419 106.363 81.7999 108.704 83.9323 109.885 85.9391 111.177 88.2034 111.468 91.7011 110.759 96.4324L110.402 98.9129 107.89 98.9727C92.4457 99.3553 81.1966 101.561 74.1427 105.591 72.1164 106.749 68.5306 108.648 63.3855 111.289 51.1261 117.582 42.8072 122.437 38.429 125.857L34.7387 128.734 33.6475 124.019 33.6475 124.004ZM36.5913 123.51 36.5893 123.502C35.5131 118.847 36.4881 111.502 39.5145 101.467L39.5344 
101.4 39.5694 101.284C41.4573 95.0218 42.4597 90.5311 42.5767 87.8117 42.8443 81.6283 43.7755 71.3969 45.3703 57.1174L45.642 54.6852 43.3565 55.5605C42.0479 56.0616 40.5505 56.8908 38.8641 58.0479 28.7324 65.046 20.553 68.5451 14.3256 68.5451 13.8447 68.5451 13.3525 68.5209 12.849 68.4725 10.2841 68.2229 8.82827 66.7847 8.4815 64.1579 7.93486 59.9511 11.2092 56.5209 18.3046 53.8674 20.5114 53.0533 23.8419 50.8451 28.2961 47.2428L28.3147 47.2278C32.1613 44.1225 35.3812 41.7001 37.9744 39.9605 38.7718 39.4168 40.0463 38.7678 41.7977 38.0135L41.8165 38.0055 41.8271 38.0009C44.4135 36.8856 46.2562 35.7844 47.3552 34.6973 49.1503 32.9216 50.3833 30.305 51.0544 26.8476 52.2266 20.8113 53.7545 16.3999 55.6379 13.6134 57.82 10.385 61.4179 7.71569 66.4317 5.60532 70.5929 3.85525 75.3077 2.98022 80.5759 2.98022 88.3411 2.98022 94.8043 4.58423 99.9653 7.79224 103.522 10.0063 106.203 13.4413 108.009 18.0973 109.552 22.075 110.117 25.7199 109.704 29.0319 108.904 35.4499 104.429 40.8141 96.2803 45.1246L95.6968 45.4333 95.5334 46.0729C92.6847 57.2217 91.9958 66.6564 93.4669 74.3771L93.5157 74.633 93.8821 75.2523 94.2542 75.8841 94.2777 75.9192C95.5524 77.8278 97.8749 79.8699 101.245 82.0457 104.351 84.0485 106.374 85.85 107.316 87.4501 108.254 89.0937 108.419 91.9405 107.811 95.9906L107.811 95.9935C91.8678 96.3892 80.1521 98.7261 72.6643 103.004 70.6767 104.14 67.1302 106.017 62.0248 108.638 49.5979 115.016 41.1212 119.972 36.5945 123.508L36.5913 123.51Z" fill="#000000" fill-rule="evenodd" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M78.4791 81.8435C70.5319 82.8369 65.5649 78.8635 65.5649 71.4128 65.5649 63.9622 66.5583 52.0413 72.0219 43.5973 78.8168 37.4978 95.8935 40.9551 95.367 44.0942 92.3868 49.5578 90.609 62.996 89.4066 71.4128 88.9099 74.8897 86.4264 80.8501 78.4791 81.8435Z" fill="#FFFFFF" fill-rule="nonzero" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M91.7908 33.4185C93.877 30.8356 96.3605 29.0475 96.4598 27.6567 
96.5592 26.2659 91.7908 24.1798 89.9033 24.4778 88.0159 24.7758 83.6449 27.6567 83.7442 29.2461 83.8436 30.8356 87.4198 32.3257 89.2079 33.6171 89.0093 35.4052 86.0787 37.1636 83.8336 37.1636 80.8335 37.1636 77.3765 35.4748 77.1679 36.2695 76.8996 37.3126 80.2474 38.8822 83.8336 38.8822 86.337 38.8822 87.8967 37.9881 89.1881 36.8258 90.3901 35.7529 91.304 36.2993 91.7213 36.6371 92.6948 37.4318 94.6717 37.9881 96.2711 37.9881 98.0989 37.9881 101.029 36.5278 100.751 35.8821 100.304 34.8191 98.1387 36.3987 96.5294 36.3987 93.1816 36.3987 91.4729 34.5112 91.7709 33.4185L91.7908 33.4185Z" fill="#000000" fill-rule="nonzero" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M75.1016 22.7288C75.1016 24.4845 74.0786 25.9077 72.8167 25.9077 71.5548 25.9077 70.5319 24.4845 70.5319 22.7288 70.5319 20.9732 71.5548 19.5499 72.8167 19.5499 74.0786 19.5499 75.1016 20.9732 75.1016 22.7288Z" fill="#000000" fill-rule="nonzero" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M104.794 22.729C104.794 24.375 103.86 25.7092 102.708 25.7092 101.556 25.7092 100.622 24.375 100.622 22.729 100.622 21.0831 101.556 19.7488 102.708 19.7488 103.86 19.7488 104.794 21.0831 104.794 22.729Z" fill="#000000" fill-rule="nonzero" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M78.499 104.944C76.8301 105.526 73.2704 106.904 67.8199 109.076 67.4159 107.917 67.6311 106.444 68.4656 104.655 72.5386 97.4036 70.1544 92.1385 84.8568 88.6616 79.6911 91.2444 78.8964 94.5227 78.7971 100.582 78.8103 102.258 78.711 103.715 78.499 104.953L78.499 104.944Z" fill="#000000" fill-rule="nonzero" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M1.12754e-05 139.014C7.84267 140.529 19.5771 141.638 26.868 139.856 37.4497 137.271 48.9674 125.97 63.3225 114.135 77.6778 102.3 102.565 95.1492 122.32 101.933 128.024 103.894 130.941 107.816 130.941 107.915 129.266 106.826 127.493 105.637 125.719 104.845 117.246 100.983 107.097 100.884 
98.1318 102.963 96.8509 103.261 95.6687 103.558 94.3878 103.954 93.2055 104.35 91.9246 104.746 90.7424 105.142 89.56 105.538 88.3778 106.034 87.1954 106.529 86.013 107.024 84.8308 107.618 83.747 108.113 82.5647 108.708 81.4809 109.302 80.3971 109.995 79.3133 110.688 78.2295 111.283 77.1458 112.075 76.062 112.768 75.0767 113.561 73.9929 114.254 73.0077 115.046 71.9239 115.839 71.0371 116.631 67.2932 119.899 63.8448 123.564 60.3964 127.03 46.6027 141.787 36.5531 149.71 15.3701 150.403 11.9217 150.502 3.3499 150.205 0.0985432 148.522 23.6463 166.052 59.8052 171.4 78.6237 170.211 98.4274 169.023 121.679 160.604 127.986 144.956 115.473 135.646 111.531 150.899 101.481 145.848 91.432 140.796 97.6391 128.615 107.197 121.187 116.753 113.759 123.463 114.422 126.99 115.878 132.498 118.146 132.626 122.474 132.32 123.564 131.936 124.95 130.843 125.842 129.759 126.733 132.813 126.238 134.783 125.544 137.148 123.167 139.02 120.592 139.414 117.621 138.823 114.551 137.837 108.906 134.587 103.558 129.956 100.388 118.724 92.4652 104.408 92.1186 90.6044 93.525 75.057 95.1096 56.1007 105.717 40.9473 117.384 31.7746 124.445 16.0597 135.953 0 139.024L1.12754e-05 139.014ZM76.5546 140.004C67.0961 150.998 51.263 158.307 35.3708 157.138 27.6858 156.573 22.661 155.454 21.5772 154.464 33.7944 155.85 48.2777 151.493 53.9922 147.828 59.7066 144.164 66.6035 135.547 70.3475 132.972 74.0915 130.397 76.259 130.992 77.5399 131.883 79.7074 133.27 79.1163 137.033 76.5546 140.004Z" fill="url(#fill6)" fill-rule="nonzero" transform="matrix(1 0 0 1.0113 119 82.3391)"/><path d="M71.5253 45.2C75.4989 47.1868 80.9627 48.677 86.4264 48.6769 90.0688 48.6769 93.3802 48.1802 96.3604 47.1868L98.844 43.7099C91.8901 47.0213 82.7839 47.518 71.5253 45.2Z" fill="#000000" fill-rule="nonzero" fill-opacity="1" transform="matrix(1 0 0 1.0113 119 82.3391)"/></g></g></g></g></g></svg>
\ No newline at end of file
diff --git a/fluss-rust/website/static/img/logo/png/colored_logo.png b/fluss-rust/website/static/img/logo/png/colored_logo.png
new file mode 100644
index 0000000000000000000000000000000000000000..2cd7dd3749494998b019b51f206077d65501c352
GIT binary patch
literal 45184
zcmZs@by!r}_Xj*6S40UB1Emy|5v5hS6bu@{k!}!_?q)y`5D>f$64KHg(lG-9j)-)3
z=Kw?30Q2rM-tX^y|9E*Gy_dbuS$plZJ}dV=eo$3@MsxPsSr`mPBllcZ4F)@{41<vu
zoH-3f7Mdn^z<<ab)t)_u6|^%ifnO*bAIrTw1Ae^Dm<GdO*I{z9k6yaPuZ-!0i4S?R
z?Hce#EBtow9sIob+~wUro7L>(_PnD^3xE8n160V!8)X$KZ&`&3iJ)bt^(#%21kZ3s
z&#vA5kbjQbom-k>m)rh)ryO&xWu*eorIBF8f>lbL?$4($ypf|n-K4knam0ObE%u-T
z`T9h?58<4XBgK|XG+#Ct>%%PNEX5YsCOEz(<D*%6SEwRZ*)Y?tt~XT`(O!i|uu=lf
zVbp)}oXB7rk?p0F=21a;qB}b;&S*jthD8+c`cG+<f@eg6?I~{7<Or@VsiuqK!=Xv(
z3JSQi+#AP{Xy3FCca_P%<e1)o#*65{c+zIZrN{>w*2B%QX3${rKkpcl72JEy%2y-a
z>vKXwFg{^-N1dumb=)$l|3JTgT(l=&xobP@-ojp~dMR*+92)dhPVf9~8dhPp_>uHG
zEWhQ&$t*_4^M?G{8<2Kju-?xm-k<BXKloIv$y_9jOfrjX^9&8dormc9*1dLcn=EC%
znK&zvevvc%+yEOhb37rY^(Df2=`b}l)e-NRiv1{k2`4v~TSDSi8Uwb_^qd@J{j1oT
zj+WMj(Tlo4P*y}#^qNVf+Itv@tOUET-*J?Qub*7|!9K1y;HFZ-l^kkeRjsDO7&2(x
zmJ9LqKEL@t)z5CPYi}J~m%kQZ?N*}6RiMQhe0TdX^o-#*3V4x$!$n%f@<%Pbo}ZnJ
ze2wHU(Fdi6lJ?<S?I4>cKdL658^86oO1Hpbz@bW)JGvDipZyCh;oMro_KoyhXC3oD
z%4rMn8X^nbRX@gu0`I(k7ilJ&_9|Q(n!oc)RgX_e#Dn#-rC3UhyL{l(c9FgW-4f#c
zfeJLw$lpMvs1VM23bpEW`^RUa+?>1N;o;wMawKIU?^4`>9)VqqOvR>DGG>xHew)1<
zVNV*XOktLIf1ATCDT-C*;#LxAth4GOj-lHlx(LO3Dspr!f;0%rn>!!V=@;+FR!3S8
zmi$melv;s;Bkxt+_G3AgBP-HlMb8}0C@yMY$>i6jDM^s<U246-my%2iNVP>!lO9r!
z{MM+?p{nuBF`298U;~mO%upV@$e0}Nk;K(l3nx9Mdp)Q=zz=svT2Aj+mGlswvIqr7
z*e{2wi;1KsIzO15QDV%F@=QvjMYfZM7%MN5GjJr&jl;8R*hHWq;Rzl2D=^s*XBE_|
z*?1Glq>3_;ths(2+mDfIUR!Y!VOR9sj0W1gud|1<8!yoOU5J)*Tfpd>L%RoQAwE%$
zcxe$%?d3P$qN!ve)k21>E+Y`D)!B5iO~woFpj9T%zD_^qEAi#q`_5bG7hBCNQ@tL+
zb8<o&8ygdZ80f`pDWIopW;43~sb`h%dTjC8@$y%`vz+Og`LF&}8-8=2{@;--k}30~
zVyU)m%W$Wu+nP05SXtLZod($ds?h0q1jC}nJqe`%j<7z5s?oBA7I6xaut+l<0{x9N
z4~-=mGGsd#pydMP?Z}UR6{FSA^eI&8y^r0dT^XVA{QEDjIPnH`QWW(3DAKD+kcS2*
z19F{HbU0mN24pRMNDdY+e7I2qjaz(~q^Rz5(`QJbBA5z}EDdxS$-Z2D37K*|njyY^
zr#sdqSF~q57?8`#$q^P8w>nza4En3X(p$DRx%bAS;s}`v<*t3!dX5U5`G#zB@l3~m
ztZdw)g`gE+uzrUJQZGD3W#ux<V_k;E9jdszPp*Xw@ry&+@J*;ocOp}L9uf@1UHjg8
zta|8GNU*I<xw|Eb2AI-w&N9^tVe0an0P)lBujpHBu4~2MAbI<;#LfhGN2Vs!ry(9Q
z2p2b+ZiMn#U4d2<>jX0>6W<iMb`i;SKe|YsQ>RS?<DMW8N~~XvSx9P^zWI(}S1u$t
zQ~rwmD|yaDkGFPak6v)5>-}Jmae+ANj7g~;gqy?d*(hY38k$`gOIq=y9bM}J)c-Y+
z@FOIjQJQq{NPw2?6l$O%TyK^RTKp{%4VJSGx>2Jh%lxG29CtLtZGF?#-vQpAOne!B
z6u!#szFlwefVsqy9+yO{)shrmkbG9W7OVEqo#aC^o<%V1Hi)y^aO*X_5iyr>dPF0(
zE!q+%*nH?cxx(G-!H8KsMql;Fh8A9VD4`rveGw-&MR^lob1qr_-HSn^Z~N8d5(sF1
zP{t#k&$;4fJ;!_Ga(3o4unlg#(_!tj49x>y1S=*MXIh}g7%w+asqgt|Cc#)J7=Fk&
ziYZ>4Xv)7q($S!T&=($<sLQx%XY-#0|F~4vO3e^InjHwy(tF#&M$3}tPsK9o+cFI5
zb<`=d_v6{V2QRKtK~lV<08ss5oP$r>#|`>@H<%T!I7Vp<lTh9k^xM6-=zJk%fC^01
zkH<iZM47-eLU|#*f8jaBVJ3(>)`*#i1@kb^dR4v7;>gdP6r!rhS2UIhB>Ia<lL6Ve
z@>dLPNJini!MAdTV2D`$pe|pm%cCG6p{U={=*(>_al{4@VF0maw}I;{P4QN*x=M3?
z#klr#wh`~PxZKeT>f|d-&@*G*K);_-J1I7D5ykC1MM54c&fl;k9$ERYK+Dl?YCuF%
z9`U!(%eW8FD|aA`Jqb_rOyG)En4;QF%hZPl{S{t}xP<cHm8uT70w<MH@-v@t=y{9K
z$pG(?J9@CrkF4)dcee#0(F~poTsEGVT{QZ|)9CbwD9T#U%BKfC?fDo`R|*eT@wt|9
z?)SPQN$yM(@Rd~Mpp~y3o(cY}gNuB^*^g}@8Ti&2W%2AHLW0e%FbOJZI3f@%$km5w
zAHoB10*a7%)U#GqK_+(zhf2v0ga<C=6avc@6%C2sdPq!C3pwyw+ll|wY&<rEo1DDP
zUQLBnlOLe4<JJu5B>B0)o1E;gtjE;k?-lSYtUMe$b!BxSvKz#|-A!E@+k|cTQxMaP
z{${0i-^x}|_3Ez{C@R)XYt`iIh@+(&-)pO&-NIJNm_6dQjjMF~eY_pp(_1q#asxO<
zbmFGu5*F%aqlP^#p~nmrZSLy9sGo-iYvnCGNR}C?;#vMBBILnr#&tPV+wmhaD{J}g
zDEFTPV*xjas_%UV#*ADBC6BmxG{2Y9o_$<h$Te1js=A8vr0F+uQvp737nY|jpY$3l
zS|x21{1^1g_fMd;>VvQ5oNE^<bX>R`czXC80?~I3{lR|NjIH7!vrc=}noPL1yD>!N
zsfr!>f`ap!c+$Xct-(kB4Aa{dO$~#OmPqEyc)Ec~m-h>gVb1Wf65ljxYgAf?usfOT
zLi_pu^ZtNB*;@SPlxjnh0lU2X$+W2s(^N``3qJ0543&vDJWsDJ{&KoFs_DO;wo8&|
z3@b#puj>1OQbGH9oozW4K8TsG=i}?k)K)2lMb4?;_y-Eh(stzLY1*!rzxH<b<N6Gz
zZ9N3ilBnt$pr<V!+mR1AJVndMh-SC*(M&RO>O;dYGb-gt?d<jhy)ONqFy#VAzm%QR
z0*}O@DQ7SxdsnZ%x6EEm&qBbeW-Y0_@j3R~e{;zxk)Kf|56d>bF3sKd5?Oc}v2`Ef
zqW=7-ZZ(YYy!ou>C$*5A92buxNiD9+1IH5$4GqZ#K?h#rcf_x5?vXH66cI&VT)k`!
zB~cmexY~$9_jdO$j_7X7&uZEr3^ddUYUC5Q_qyKCIcV((>y+<?lVr{3pgg^owkEf;
zxZZU5>4CdmJNl`}LIZOgXZp01%DcZl;k8<?xLljfasY)oostWUB9BK~;Q3_T+u|)E
zuG%vG19Z?%4DoZFgcMf|D(Z|QZCCo3_`O4C7R3k0l7wZJo=Int1_nJ_&&OW`eua1C
zi|SzjGWzh0Qv104p0pNEG<K_ETT8)zfRytZ;``1j%P09J=B(aYQ1|f$sZ^$|%+(*c
zD$euTL!)Y;cy4G-Sn7kEdwW-ty8T*)Mj}18;%^H>2uKc(14+%PPj98J_xYUhv?|t=
zZLe~=I`B&bJ2hqW5`m~DrO}KR8>nRe;6}A99<u}m1^J&-D$mKeKnia4SKl#Y$=Urt
z03(TMd!2gbb^s}4+X3xA3|bZy7GBJv&M*#^aUA;vNG@G~m@zyLTuRML0+~m=-3R_a
z4xPV|&3BUGkL_d2pUhtswfv>C{=*_|16A*J;VE_mf=Y?>GCAqxh4y)&DfZCjZ%$NV
za-3ABq3v8}hq9-4YO-87al<lgXLYJn7dJQI!-Gdrt#hXSsG+>wLQxD8^yqF3D}3et
zR$S5doSdg@Ul*-ON`?c{xfdS>Ejbv+W`FIlGz(5OHYQp7@`d=KLbWl<n2CU`FmD?a
zCtVjQFI76DJg8BoejXkz(h(C88o!l=!-RlRqWd<)E1v)e{V&coI(2<6-j)3=qT&%;
zkbhdnS&o#A@5Te){E}d`AsKI&5gVyC8?O-kq7@y$L4!yqVLmxeYl%GBoRdAOjP;Wm
zS9BTc4^~l-7<JdAxDs5%J6@L|+gJkEAzT|4F4_M;cZ~!nhfN6&Rdl8qed=3$1o5C4
z1XlU{ZGM!49!TtMc}kONM6~xgCH8Ad)CSI~P!$Wic~jUZsdw!HUoUEsx<|DU<xQ=`
zu1F2RRr)^I!jq8GbxJ?^jxIEQ*X5zSZ*+tX{68jPi>(6eubgc-(=V+6A6uX%Ulv{?
zXiM;-2Emo1Q0pz88ww-7#Za&-qOMcAV>mLBDvM{3P`Z{4&<Fi=mN6Ifn!^s)yh}hR
zMYcY9=$4<Z2+h>b&e?Ux`Yqj*9@?9!nBvo`8ml11S6?H!uJts>_Nr}ngI($NDpY6F
z#z<C0%iTY=kSgncf=ag2@1huW&3Enm;am!y7YGQWAhrCmIv3y8#z6mFYt_ISA<JBD
z07YDwiK&BI1_zclMec)K?U2C;)#yk}lb%IMKVN`$sV+%O_19+yje>77{7~2KnW~}g
zaQ^W(Y{K9&j<Kq7UAbcJwe@&y8lPQP{2FA(^=XVbp~bDmk{ci&1qDY~q{}cxsj-;X
z03zZUc9p6TRNG+pfpH2~U^H{V7G{rw;=iLhsFigXe&SKh-(H+nEBm{&bfLqFaCFO3
zT-6Q6Z@@F*gfljd_yS3BU{chUQxDer$z-hcR#|azq?-6nue!C>S?!$$Iv+lLx2gB{
zCXj-0tKNm#ppM|6BN)oocG{2t8kQiU%vj9~mr&Hc`t{zlDJvD@*Jk4vo-qaSj_|Uu
zCyh6%*{OR-NDq4+emQ7X)cd~p6&ZwUa6wN+q}tME=-|}D)_k-Hv=5lmt!I=*ExQ~K
zjIvy)l*%i-sa4eEl?-^HIp0UET}Fl%9y6TI``Bsf3G(--R<kAB>?<B|&@@avGIgf@
zRsaXJCeWn`8V552SaN6w^{#zk1lqIqKMPfSLhDE6bopyMy6kGQRpaLyM}L+`wkxe+
z!=nfDybZbryed(Se-`S*FP$pY<O0R(%-m}6C$+okot&Y~?Ckwm3q8(sOLQSqcFx_L
z9MKar4o!<dG<S8qNY$=!a&sG;HA0*LEgl%G(hu0*;5pE&P+V-Ya@iQsk>^yCx3{zF
z^!x<M_qXrQk7#$W_8<^?S7`g}4+)a^hl8hioGYqyd6@dtAs5<%C-C)8k?<u=&*^dP
z^F8X;=Bv)(36b4*7e<HTua8toR|{tl7}qSHOCiO)Fk^60Xk}RRFaBbN@~~DOzsK@R
zZZ@AXjD92LPgSiP;3NlV8PX%>7i@#vm0lIoIzW=245aRRGUBi;d`m-?F)H+2AIoK&
zfY7z!x4A9nH8NKPdPiLr3-l5(;pm{|5u@OOyZwKW2ixYrdfbWEFR&YE4amJa#FW}n
zEU}HRYQ53M^L=Iy#pAU=@{5bo;q(bFUrW)L@q7xk(R)una^5U@GQ~-=Y6jh^;YJ5x
z-PZ&pl~*|X8y(VllG5-~zA+$3ga?&gdxws|=j2Q;E-qH%ku|j}fmS0?CqtmMKugCI
zQG$4XqZ-<<Z{locV*vd<iGb)C!cUiYYM-)JCT3`c022GJzq-08);YW~1FU%?R|oX$
zy$r^}C6w6vC6sbpav%{HCY@2vx(P~s2|E|zT)iI`u`c&Ptg5M93+1aIDS(DbxiW{D
zC4fU@K^Xibs*nXPZ_6E#`aX_!cIWA*+{U}YQ{*nqKO_;Pe8*sO>)A8E5BJvnzPkX2
zNKJD2_2CfE{G(FmI-81~)IZTaqjdSk1JWDMKs@^wT7jHlQk?reN7WZ&Xaj?mVEh%p
zZD(q;aj~U^+Iv!Z>l?Lb|Kp8_Hmy=rYx;*0zjI}sJ!xlA4UjN9zk$G9Z^)I}+<9w(
zIk!*Vf;>JqCkI5>$D~Z-^fSB1;lT*mw0=Pg3!cdf0NAv2IxS)W9MFQL?aXij_p{bI
zMGB63v&*4RX5&W&BmXX{95Z8z<d)%ONPfm0#DQR9f)wogow~0K=};>CV8De3ROohB
zQ~vryqpX7C&yAhB(jByPbgl^$K9=-<84%6Dww(L|`}P1fW-J(2cJ=G5pdcy3isr|*
zY=brrOv2LMqTo!UBP5&7n-a<y+@M#m*i{}arvRk<myQRZ<1}Z%{{SR5|Ej&UbgZW+
z8*NPsakd}<udaK>)C0ux)b#(8gYJLbf%^}%{+0>8kGF+mqnHEd$vt`<cu{9i^^gQr
zV<t^S9T>l!TkImGGJW$L?@7YBXr5K@=9iHLPcnRjYVz-x;=io$nJ8n4B)NO@jxvs2
zm{`{o<5#&Jdj?#Wi#2C?<VC`EOxFQbnCfU-`nlv{W^UTH9UY7rki8enX$}uk-N+~W
z4rTwlOU<HW)vTm$-Rlz0<~ert?byx9YGTFs;pKkyelx-Xp6fC_z1}|@{|WN+@2b{~
zmM#Yi@^ny6#D@khEf=}AY^Vp+L&EeWa~yUMS1T1yYRQzm{U9Yi4iqU3KAu}`s6t}<
z#8RzmOVnSzHr#(XAUtc49o^FKC}iR=zkl<JVL((X)W2i@7F~49SYm^~t_Xuddi|L*
z%7MJk6jE9;=S3uUTH3rgt|-f=^tnuomoDL6A#e=)pp>IyidH*2Trv1Z>$Bt9aW+5<
zwEw3~s(Ov(VLRvb#0b6O*dz6=?uFK};h5%wMkj74yh1LO7Px)jCGCzLYE;n3mlwXt
z7I;k3XZ<g*GUt=ftyr&RbrH#f?1SsdF_vYvRh&Et7tz2|pP%FM``xU(H_pizX+=fK
z02sL&TGnSR>?KjiLlvD?14HxgLw)e~7%piMoKx}zdK3+!eCpTI99h6E^S>D)<HLrQ
zqFD<|Nt6;VN;BcGBeWW(Y3r?mv-MGUpaz!}=~#lzSyei?9G{P;eSZ2{c>FU%2yOMZ
z0CzW<Mfv2ctyY8|d=M7#t1}yNNSR}z>2khQbNY^u!wX*rts)0eU$8X(Q~vj|h+7w{
z!v1PXjy^szIyGINgPxu^OVs|^@Ccx}Gh~RiPKl@6Irs++H~Y8YQAmb{0tLb&FqW3C
zX)lgK3_8T$-zh%uO_|J_iS7n5C3#K|81r7`YVt(;Guc>9m)9xg{MU>oYzuRmU*)E0
z+i6jm-=Br+;7ZB!J#jh&&jM=|;1)}N7wJL^C?-y(Aw{&Azv56y;t#2gxJri`%D%@9
zvt{6N${Rl1s8eQUPIK$<RP#D$MKH4<oLRM>G#SC4K!#fHdq(;2OKRJJ;z^6Z_*SCR
z2^B6sRM|r3uK+EZluo&4im;@`>nD~(s*NI%A;H1VSYz4nNl7P5jr$IDle2u(ZBWKg
z&&v2~=}(J7F|DE+6BA(;?kH|-!Si%7L#wGxD7s+ULH(>csQ3Tu2qbmPv>}?9Y;`>`
zyljY#9x1(=t>8%#{_Cy_FX@M0_KX$ZY++9FGL;OVk0~8yDi@kywpXWQXmqt^N@QkX
zVL?hnN}Dl-S&jJn`&<6_{C(W*<}{_PevLsmTDLi=kS%`So3uN9JN7&s5$(i|*?*rY
zTibYY^p?z#@k}`Ntb4{iuosjTVJR40L}w;kanZf#%goHITYVy6TT8z&A7|foa<G&n
z8ODn|m>zC_@&15RjSMopL)pw)@bkF?af)yL5+8T`^xO4D=i9<T^xV7y>c{up`8fJQ
z4E?}rl9YjzFgO$Nrh#<Cp<>sKX6B}Ab5`PIVEj-qrdCZJ?vJ`Zeo{VcdmLosLo&DB
zCJM@KPL5}xesZ!+HzQ{Eo8a@s+GG1@zFQ{o1EwM4`;T<@PF{S^B)RJqmQzcmH=nhp
zv=BFtJTsW%R<__^l+7dURn6gwac2IWr2H(Q30+FK`CdoIQ5oG&A<V(!v9_^m^q4NS
zHxO5R79Q~{9M4+)THvfL8^6F}Av<5DM?#y+hKoyu#?r7Ys#czH@nb49X~CL-RMU`5
z2Tv7H*+TEgHMMl=X2R|D^94254EU%jcKYe8kGU&=RZW%+-1J%Z$L)2{9d|0*5)fxp
zpygtOWt{t>K_s1(z{_pq8o1pZ$6Wn-?&nHWMO1-raOi^2LEFUWo2Gmn6PAXTHCCkf
z68J||Pa`_jU!Nmsa903C)gDvEaW6-2+^=1ld#<~r!vWP#tng?B`VBwLh}ERw@qM`D
zzcWTDR1BNtI*MndC~`??BNEvTJ1J*$cHn_hDrY7Ba&$*RxjkCQ8lL?VlE8Z7R!qXz
zn~!r79_M0P_-c0#4+xoN|F!ew3TQB|!oz=j=B`tW$%(TGaU+b#Ydn%|x>uMe^>ToY
z_(6Gm^UB}moFNEOOO?P|*9T<Z=RD%meSm4XZ%|O}A^+dHk>0e*4o=KbRuV@anCT?M
zBl>b8%>4zZdmd8f20Knziuw@fNfkHWRf4dHS9mywrxb2VWp*D+BnYfwFk6}LzKuJm
zH?<L%8)<)87ACUAd+p1xh1q)J-t#1hzNeajbQR<4UHw!Xd-x4E?hz~Ql@r~vE1qH2
zs;=vU<8JWPEyZ~7(bbW1U&bo$7-q?5Dn@cma)u>kA(jTFtx=hkN4ph;o(Zb`bmL)e
zb6-$%Jp`P}iCv-X9!D5d<r$V{h*v6yOP)dn4Q$28#_P`2Iq$x;1#gym_2>j}_!o;3
zj~8OibI|vO(0lXfB+@~G%fsf$ThBTG#+idSVCl8H9%3U^s|kBpYbkdF@#E%au0vs@
zD%bbLS2erOso4726eYvWNtvzSq4~Rbt@yByseNm5o~=6mewz7$67SkqGM^!hUU=%@
zJ&BF<^wt4zN_zXs)~68Wl2z2tD68eEw5LlZuA~Gx{$ZbP2wK1{+`h?fTrQ&Gu54Mi
zqpnYks-QTv;V;BHh<rG<+fKOot!(|)lO}<`-HouOL4Opp#EyXb;uKKU1F5P{o~W33
zbdea3MSg`(4(>fi<Ay(*E&*L?ZT<oojvDdVM9&nyC$&aa;)+khIXxE59Eiu9Yc*2M
zGIV-LZSi%VMoQ+qb<uNChQ7-9LJo#TThDl_GRDL_aE{Q+OX~J`2>b+s!qzFWdfa)|
z<RM(3nV{QTSGRq#y{;R@jo;dA^N6SZnOoRgMZnEU70g>%l=P{&U9j)oN*i{Tf!Y1D
zr08ka;>}p`ec*6AW!^x$8IeNC2dn=Q#x1P%G>FZL)k7HTPuJdosr7MwJ>-Gg^Q!AK
zO>SSom}4Azhcmzis5L_@8~=6cVgYcnG39EI3l9fKs$A78xf*WieAL02drliiS#xqf
zf@c~{pap+=uH)i<9QF+nUi9K@t<b{X4c>OxIy{O%<wrH5p5#qTkR=yfgik$(CowR7
z$*FhDAn%}pNvr%kA3wV|+1Tk%m!P<db{>Df6NN21T1*Yy|C1`h&JGEV=z_fV(pz2I
zXJq7^pW6(j(71tyvxo71Xenc&)x^kF0Ta0)@2t|jJASW+aUs+&K6@EDWrxzEhQ-RD
z7XK|=K@4W`v1e<e{>dNn%Nr~A5#j_Z=e9$_n!<p%#ho2xv#KsF_v+$mG-apD#?Wb0
zqd_xaoM<-+@G$c)<#-J)1HeI-!&cjfDw>o2Od5GdRc;Pc(wp$lPMTijKH>Ke<r6_)
z)DatgdvQYYe|G_Pfo#~>!#$&Q-@<m3i|gEf;aNTB`v#_`j}bi|1D8cTCsd?%Z-cVY
zx;5^VCP+;#^7pDI<-g~klZ?6fnx0O)h*mMY@OOWBiT6s^6LG@IPMt!#Bi@^G*Y#Qc
zhp8a5vf<i_gdr8Z9YGN#H*)DvhcgNm8F$y?DgQ}i0F@RszwjI02kv*Ur|1$7Rvz|*
z7kjT1H}`o&$3OgZnAyK<Ex=`aWVqG*gs>X2ye%j~s3gv@5$(k{>pf=<3Z;51n3#Sr
z_#Q{f7?OKuK`k7<%Q9leL-H1zll~%-CzD<hYHismZ*3lY{<zbqLyYa<nlA2`wJ`O(
zbmEJ_6c-H4m<o@(nRv%1RS*-s=d%X1%OzAGQ9c?kC1)5`z2w&Za#Dm0w%DSSeoi?3
zOXsW~<v^X{YkI7PPLgX^*-oQAaR?AqImUjUPmz-ybww`cp}h?Xu`PDB8$Wl56=O()
zsvn<RG9RwmI}B&C5!9GQVuL0r41YW1O#tKUO!})PfyhbI1&F$%*Pc|~v>zpicb3>A
zgXW$5okm^aAP3*UA6mbb{__|NXC5-N(^OTT_(->w__lf#j<-zb04lojtM~-*kXM(o
zNA3UE?mGVt#mpVRfpv_v;*A&xFYvaCHmYi`#G`xN>paH<xUQ^Znp^G)zv+QktHtw5
zl;U24{r7wV5>00Tr&HiGLf$|u(IkjYl}<cnW`-`0ZG3k5ZQ#`Rh_Wj&R@Q~pnch;{
z<=vO;hH-@z75RbyHLKouq%b>s;>mPsjn!*{7&~5*7Ixfvg9`xiX_jdO>Y`X62c5Xx
zYGa2!wXOSLYm&DWz0_u=OB{BVeQzu}1c_8P$f)hv0`Xny_Pmft2LyH<36<`(K3Hce
z^J9j?7vJDd0E}vKNJ{6p?HT{z<oeDArNhw?b^&L9)RFgHJbbQ0vOKs$GAi}nhzM)o
z=CSgdp{Dgl`*QQX<(1!l7TF6e0_?PnK|a1I(2>3Y!f!$R&U!oyww?7d0>w;I*nO~n
zYM{ehK<s`2W^RfHxm*0?XfY|#`Px@m*-=k?!*%pTHa7-gA#kS<W5027_*+9k*UP;)
z$|I4>BwoXfd?ggH%9!(4!)ntHEJ6a=vLsLHJ(N+am->h8%ObopM)Wz%znu7F4ht~b
z*7|Jt<cRTmX~;My^c#0D+{BVmD}?M2?yrQtgjy5T2zKE&+bPRz$Aztxd+1&V&g~SO
zQPm<yWmK2WF8+ps6mLh*W|1B&G8&Xgzkzi4$PrL$?q>#m@|KW$CzkD(eMeo(CH&3p
zs*WfsC1&0g{{elB>6~u_@$wJUMPN-gKrwAZOzQ@jb7viTK{)%kVR?pbcK?8~AfadW
zTNPs-Tl-;$w+p@0?#;0dGl$q47|B%qj_b82Kj%Zw?e=J()pm4LmAL=7fBt5~NGE;I
z;f&IqLU5S!oZ50z4CYI}_#G=(K=Ad%D{VNkB_-*KcxUM4_Zzh5vGpEyTw?u-8~5y~
zj`u@Ln&{g)>>E{C5&QbE%y9Fv&Mi~VA3PPRv@i|S4=+$d*Ej79&6xVk)ac?C*kUHu
z*<Eo#-_hVM2BL?Oc4_A-!6T)msP^QrnP9tEr=)C|^7np$w;b4^ru=r=^M4W@HU5)N
zp?XTy+NqNTWNDb^8ox@jrq|l{(EU+!$18FAR>Mwxpy8gzq~C4izPeMnE?nq&6uoHe
zFbn}xocPh4<c*vdwltH@XAS32`Qp;ff0dSPA{~z{>a$5GtM#r}JK*b<+$wJet~w^^
zHHrB+^*^yF3Euf<N5o6`YJkqRaEeTl&x%6LX<_AgGAH=^J*~iONNg{m9z0_l8XkoC
zoJ80^GOavm6F(OfR5AL37j>7N)+8v!b**a8@O)uMZ`8zLzoE1~@_71qr>`)~@kC{c
zs{Z=i`U!~IE3uOAQ0@t06OQE-Eh~S7PohG3ktbl2_s4bwM8X6MgRj-&9%h@Jo+=v<
zGAJ#@$kX*XLq4mUhfc)^&EP9IXThg(V>=5NUUt3X+Ba}Y39Dz^dH8bR%kgMO$H2^1
zp`eC}txZ%=v2IqhTuxaTS)IPRcK?j2CeMh0$yeqRaj`)7*7-zO=?&0%YL|yLmdvI{
z2?wWeg*fXA0|pY-Rev@Yq$+}?woJb7AD!`t9d%r0y!IO>v^xi7ZJURnP4jVg0x`CW
z+FMmq#@To-9D}SXJK-&CSM6-0Bfl3(pD_gm{wQsYY-`WBJoeI4Z>08yoDJ3Ncu+50
z8)e+aG6n^h3+r4CPQJby8FxpL9A7KPymcRWQBV}%O4|`KIA8v2z!3xsSD9+-)E*x#
zT;4e7m|K*_)hU*Td&W^u?!>7P`gPvjsA@PlT>cfbJnS(+U>m<JE(eaYeK`U+?22Dj
z`<~8$EGew3jm1W+uWCzTFQalH(W&jr>i5ds<u|RzTvFqDhHA~C53;KV_xpFDy^4G>
z3!Ld27#=f_0W!<mt0PXioiKI$+%iCBv@|Xh`(Uz%^Qa7eMDe#XG_GW(l6SbPLQ(2Y
zazx9NWt<jI$<aXv_cV5bpGlh+^>U$oZxnTU%LBMSW_aVqFm8Zn!h)#OK+^0~IJgy4
zz!B6LU=Pkf_%8glhOE}fTYy<4(Q#|1uRB*M!f#dcILcFNtth&My??<W&Zc%3p(o=e
zky-giTGtGz^a)TA{qndI)I4^1t&?fHRCp7a$|fI`C^q5|yU$UF({O7VipF4e&6D=@
z&Y`kH>^FVSnLo(VBFr^f|Gr!ncxX~kZWbBO=O48kc8F{zvWKLjC&t_c>OSYa*FGpj
zKzY#aRubMzvp~-y_Q9(|=Y+SOp)FICKvFyt1_p2V_>X!Fyh_K|#Y$#OH?{;V$zsmq
zBf`MZA#j};mV7eKT@hF*jOIi&l_L8v-t4pX=w-X`1<c8xJ01zLd5x&Rt%S67A9Bzj
z#eXER03v}opM-KacGV!k%erc84l7kbt0;O_DFoQd>RL^Yp*}vFD~{1eQ{VHUO)c>n
zqe3AnIALBawnB@t{#W`s`j;En1>=WQ5(N6}-l2knhhDp##Lfvuvmw3cr8biOOmB27
zEI!w8j7_ViWBh@W7%~g-TrFF)LVirg$~7qip6tr*)PvsIvRwK(i)50`Y0_{AA1rI+
z>@XhN<d3luM>+VGTr>-`F0PrCIE$-<>)?a}X95XtgN`3&teb*sIrG*7<b01se!5>^
zEDwi5W__vi)%cfXYZ5)>eUcjoPmYGz@U=lLhU6$qfa@e}f}o5u4ancE(Uo03mKKVQ
z&QBh&mfU-fdSCCOa6>kbgBGG9jRYO&`lx#&u6s>0p>E%5icBr(kN@GwUOUAsvsyD3
z)qSaGXW3Fn@+ao7ZysD&fq$?aM5Ve`)NP$qg0f0ziSs_4j0R||Tl}~P+#KVFzp?Tm
zxQCSJxn^<Z%0NVk_vXfvqxZzaB3!3wWu2nnS{3|>?7=aAUzE|J2T}s0g07>FG25bK
zS-0QsNm<<e!jqiwmrTEzof^Jmq0htOq%Wh)Yi171X3&&0Lfx`6s*$VB>q>L`6iRz+
zN&z1s$9w-wVeN3oiN~Q3GUa{#w#f*N!uMWmG!IN$4a$Oi-!Q300B6ho+MFj&67Atp
zW92QrvCn=os`4j8kZYiQ4NWjSPcVOrn|Pg7@W^ea>>9!LnWw<O2UJi!x`iKoZ=Ue7
z`OtP^b=A%>u8L-}zk-xl-pOheQO?P-H(stPe03#a44JBswP$*air}68fZd{58x469
zc871M+AcBPZw1p;V9r<I<W*5Bm2}c(5DYm67s3AGK*xl%@ZV&Ncl|cXay0io6+XuQ
zld+UV%K!V#B2YPNrxLxqx*lDf*_)jS-B&>x_dkOo&n4Xisjf@uqONE{qPA<$3-_He
zpCtSeujH_4_l~g(xN~O6HrxFVbyK-e3s--g90=r<U;kg1rWGv#E<Pdi(sRe%#hyx8
zsz??G!*}?q1hBN~yT9*gi2WQn;&(d?jrf`QOaS@3(Op?hI2*PS<c+r$_<(UHgZZ8~
zNnqvj*BVAX8Hy<rCCecS242SW#G#~w9r~|Uh1IyD57(YMv+)HS3zhXBaWvY`9rsT=
zN)mU>p9;P3QlixBCFA1*S9|`U$rpM!GiQ4m<|}bOre&%k(aYH03$Y_v257Q|<65we
z6I(Ico2Gg-gtZ63$HL7~MwOdBmIv<G2c{a0Q`N8x8#d3lGm6rM+Tenolf+An@ULwB
z<#k*q{S%2N=C$x7&5ot+9y?tfnN=fl-EVjiWo4$GPkIm2fo(f+0nnMBw5Q(#jth8=
zT-@X><72XnS7$c?()Qz!mR}oM1`>0pEjw76Q7W_OBo8aLTj~j77{bd4hM2D!`uSa_
zviy_$S3l`Nje=EMW?vqqExKjg$5p)UqBi8he2bYzRrTm`c2if9G<Bski7W41C~(M)
z4^NJoF?Ni|4PNG5mak#XS?>;K&d|9LRg5Lf`o@sl5R)+3rbG6~mz9B%XOtGTAr}HW
z#-(EA!cS||SU0}MY*Z}phweP-{oeP_s`LPnE`rzi5<O-RiT@ldK{)R|Fh)s#YJ{k+
ziG=*^)EAAJ-&ofx63XSQ?vr&JOIUQT=>-?qp#}kurytJ6xTXaDb$EJg4RW&nQ`PLs
zKTwz|DiwAf^rFWZ>jtAr<&jppPcnl<bsJ7xS=$kZ%%A~7BA&wVt=bZ~XlXPO4^r0S
zrF+6HUF$g&@T6ZGqmDQcm2q#^w`Ey^N7JZKXB|PV4>9AEzd&@$MSK*wUMax4#Mdi=
zt{FF%NyMi$s2U?E&0y4z?&?VgW$X&^Hb%=|>6HE}NZdW)4;F*CTgGFk8Sf6n##)Vf
z7i`WF{9joiOM=(2E+Q>lJx9~EvE8ioj%{$t@Wt9=>-2ku!B9m*Pw#(DC6V~^d%6OQ
zF(jL|2ONe3_>;0_j3nsAi1`GIu_PaTwDxsqyH3m;&JV<4c6Bddj>}Sm5lsVV!QfA`
zrOg>_w?i2}BU%X)9)Yuj!lu4G1C>C=#0QJ^4!uuUVDHlz7cOlIu|M$31sDB5S?l6`
z8cq*xM2f6B*+y8a_`6OdOpoCuE9Z}<##}Qs+XP$VcB={zSR9gI`Rs~~Yx3pdlbe-y
zb)GJ$K`2|hX#ZM@jg8WrIB}?r<HUc_NbTP^UUMBl-`R9!pT=0Ijeyws0NNHwpR-f>
zBv0r>1(V@#9_M(>ApbX6LwZxf-FwP+{cM<=sKwU@ztDvW6(tajJR9oD6QYc=9KD2M
za0^mRv?;qFTj3x91dZ8N9eridy${7&d%Bpf4z201PW0Vc0~r=lx{)ynIxVp?rdgak
zubK~?zrF`VAN06%tBv0)+%1`KSXsZ}$&?tmytDD^6yAE14-@3eDbJsuJChqM%%w-+
z$xZUm0`e3<M2Tr}mDZXLj0C2bG~n29W1O#YQMs#St7X-Rk$cA)%c~VNf{j=Di@fWN
zR`$_H+gI3DCB*q<uhgf3yNYNMa1|eAPu}|W9_7SPa;8o}SuE=~xLfaj#<<!mAl(Ih
zMit~n*M8wiD=}+JdZsd3;XAmSP&+{0(`zx<?04ZSu&(AvYGw9aG4br_;i6kt^2~bI
zJoXw6Lp&?`Z9U>6T}Nlq+I=hwLZXykI$uo|KaRtkj}TuUcRRs#JQxcws`kwW(zcMh
zL?B%CGx~qS{>4aI;BetfyGysCQYuB&s?~qK)cO6kWMa+3HHYvZlTGzWsK!Aet*Q&v
zi$vn#ed}$3q2Dz&FhgHpR@$X1Ni>Y*hZ0j{u$TaF&!gyH6Ymlm)}F)8E5#@1@E>0s
zozt}U#<#;X6STvEHQRXhk+?#1;x~Qwxim_-vEz!=yZuuwB?)cK_JbQhY#*V_c@(7K
zPh^{{@wLRSyH>oPfr=HOddPK2&mjtB4{IzxgS_9!L&|{_8_uhIoM$BN{~2L$tTLs)
z`3g6R$NM-s?z%a$YmMj=81TWMagAG{8Q%VVkDiDRec_2Y7D8_D`4B7-37Mi{TT-T(
z7X0E@eV@1)oX)VkI)i~_pLLAm<1#s_x;Aa@1@rB?`a@OEd`^>CER>P^E?0BFlX0GF
zY3wa3&SJ#&J%?G{k^J}L@)=dVOay;EgC>X^Fx|I`NaA-kAfmT_y9t+MuIAvx-5nM9
z^KR7UXwub{9arB){E`KM(#Gx`<I|Zh8VVZc>ETl?pT>jYV$@(1c8MS=vLL4LZv$_W
zu;>uT9B+lN-@I|RxrI+ZJ9FXkXX>$>{oq$9Yfj6ukf&Hz%A7WCtZ<Op1AR$8XAm{G
zJ4e8o0%I6I1w0dBzuHphlp`U$aIzFn6g%EeJ=d?Xa3m%3Ff=B=RIfC0=l8v?0Ut5^
z@s_xIPdKMIe<4-<I#}M;qR~CcmJDWLXw}f7)fXGJ0d8!14d^ZH=Nz4}#&I`$A@5`4
zWP8VLUB}(~m}fO}>?gdI1-D^y-{kOQ8Lt=dSfOtf;ERC&^Of0*)3fU<6&~hZ=EFQA
zc+7>!UOUW~v+HtYQLrW@Tt=b`0V+8|uAFtBHoiXeg@0haOXuVH-nx#upU*{9Iy<Gt
zTSuT+_w?Sb$1vk6Uq2`N%^tu}e*!=~=$G<7S>mq)cx?A$ktWUYr>V~G{gb@`>z-qm
zfg1I(%)Db?b%#hg)f`Pqjw(YMSg!^oUf3j816688NE>2zcz49c<*LT|=DnI#j2K@2
z_V0H43(4D;zP$v8ecJ+Ly9iK0)8?#?x7mR}-TM-H-BA9gq=<MAYI*dapsi(UXkLIY
zle@-UQF8Qq@8(I<h<~E>Le!8m@lvEp*&9c(;9X^DK<#x-R5_*e)xf29$N&B(o^U|&
zf$A3?-=_dP1z8}jrUJ>S${?zJ&oofotPnj}SV3yrm}o_y1Wp!fGUqvmoRRutk7l0f
z7lc?Mr{>Nj3MIJzdGjpu1ivEc>kUFwkv~XX?fd|oKFHA*bLq)~BipOt7sJ_XxDwt}
z(6(36t!4?X8nv+R%2rQWVqINxz)FpuL5xthU(hRa{M7sC>OzZz1Rbmq5*3H(FNsRP
z+%?b~t^Z#&s;C-*GMTCk#V;D1#d_$d38RBJo}5u;EC%v}Ys~e0h{mvO+(hO$T_ViQ
z;h)uRACFZyViU4k8Xe9Ef=*H{tG^x;m7<^jSCBZF=3y4Hc$;@LdNQ}x&fJXru^}P&
zWip^EuC2fE+M5wu1Dh!d$%obp_ud#0$zb&`;f*#lsoHe!5%v3XaZU-h&k8>Hk@@^p
z++qYLJEEk30rJ9?e>`?w(BnM8PZTVRAA9x8Yd<-qss<vuOepy3<aYdGCJ?!z>UgR0
zEfwsipbslL<E7#FCE*M4eA=$#U*w~UuAsNZg4vFH(sKvtc#)VfeMuTngE_l>9?2z#
z`LcqNqY_;6g{4LTwW$NOk+sCR_zWd5mH{pNGY9(hu{<)){CCO<SGw=L<2-10rF2x}
zy*XXvL=PKPB_Ru9<UiNJ#}B}4*aSW^i{g9o#?jFWPX%D=jMX!Dh|-eH<Ep5$N<{hS
z4veI|Ki(_GpilHpT!~oSiuj8hA(Y8t;AP)&(01c{3*3RO7A+jL_X4n#IBVyHzuiDJ
zQ>L8+A5Y{>)LJvuvg?k(dsW08yJ8bQ1}zFsP{E2K02g=KV~$shlfsjj138VW0V6Rh
zh07V;m+Cn|MfQ4Fe;9AY!IjB0GR~p50$Iz(ccPw+_SXYtSRfQb83S%4Wr0RFsmjFu
z2b)fRW*lyNp1<8&Rt&gtr(4*T4ekd+j_(+r;=;w$^IlE$H-5D7CPY+^A=!?H5_|>-
zCX9xa*Ie&$S^a{$-vF7hACP9f{x5rn$5%5rf@b0v5CM}EmG5kcFP6?`;Hs;XL^q2u
ziLUPZ0-!)8^EHCp@b>FGGTz3?{i}h@%6IPTi7-#-)-%JYpX4|$h^;B&+>12q->Oks
zN3T|3m^Mt1hi?f%xt{htBWbwfy{<Od4J01<TS-ChX%jp3*gt%?fJpfsDffa}&i4ht
zZs#{<We&&U;=SwbasB-5?&0j<la9RCaqi5oqdfI85ZF2;k72MK+*ajGL8(H^*7<l?
zQ4QDzNyj|E0n}&x=TDNKh{UVTI{@vud}?Io&@Bi7{_j=h!i2CGThN?xl)+JZwJXJ{
z+reD$1aYs6aB?(gvy~tVj-3P9Aqxfds_!=-SZO1XA4N|TU(sTP9s*+w>79La-}>LE
zvAX>+0Rlc;tf%1bTNVWn=oJAn6#fSm&pSa3zZEs0H^KKoF9fi1vAfOqJd77MLf4Gf
z{@*JYhK=sl7gka}vnE@bPnviiCgDMSLWzAO%e+=X5AOB=cbr@aav#38CXzl;Qxcy%
z07t!_WGo&_AOcw7)YwP)p3!R##dz+Ib=wY26_^^WJC$rwhu^pM7uO_I)b>v?B}amm
znc?|BuWy22TOO|<y))w!R@8<B7-NCtG$O(6trh7AhNnxrVzm8RLY*~$FZ$eI*CUH1
z`JYS8QXvh@HEaii;>MRY6p%vrlGxHJ?jP%VFz+1Kt`<A$gIl~%{th|a6~F(1;(@v~
z27LL{B|37@;DBu9_+UG~M?8KVT)^0Va`daCeI`{Zt|MwVz+DAa83MSl`|w}=s%!ig
zUrVoO;a_44n8R(guL~Q+zlzJ<RT<;jt2vr>{fb9>Zxbd$+?LWA|D1@`9sL_ob`5In
z!&zW3(EpIO2TCWo3a~dhGnf0btW5x?EA#vNf+l1##Q>_dM{$UM<;uzi%JKX3GA??}
zc;vn5bo{f8W9QV}XyTgjfKiRISlEV_9gHzm8!1K;+`&dY#K;S~y4lgoIFT86<gvzt
zRS|L!&i=C&c<3$#tY?gc?ul(U!_zlq$L7wvQXQrJuGJ@Wn7R`+H;3X0LVwG;E<JzN
zv8&5*kd$BqLiWf(Y^p_|ANic6yqF(W0I&;V_yV|p@qgTZ0^DcZ1EgJEj_^|VHJ?xW
z8ByD{!`$zR2810s7$*mvQ(Cl64I<6G0fP3Qi#57D$wQWFOx>b@SpqVK#sDt50M5QI
z6w=SdBr_}DC7G;~G>Ge?_U59ANsq+Bc3m-?;v%>`^wo{Jws?;8J(aQDMz#d(Gs&nC
zFOevtX*ZbRAn-cAFYYg#BBTNL$_d0-nmg=sL)a+tHI|sC(>e!gLmm1FhQy}Oi4Xff
zF++deT;Pv6R(CzPDJ2$RKn!aAI&qv1yp??;S>T=j`81ZBg>d!AA97~Hh%Y>okr%^l
zMQ;fkIlU@I3!H2tHbKAo$dh-))on9qB7EQ9md+fxQtd@x;XIkc=r^yrrj_e|yXcVw
zE1gPqBBK%Eq$1q>&#N(m?LywN{-1ep-=9_l{YJ;x<B{Eu^J&8oF>iu~PsW7?wh~uR
z_&Tq70&BgG#rNZ#3C(f|rvdS8NwUFbKz5TCfN!FKB2km(DgD5Pjh=Ak882J^++S1s
z874xY1GQXz9A1hRO>8*yzj713R~Jk?>hJ#Igr`H-t-TR&W;<LIe?`A>56N3m)&flC
zG2KO2vN-%L2(a~8p#3O(^L_5d($8;BWPqU90P_U+IF90@WZEAtI*)_&=$l}ZiEEvD
z$o<uwy$Tv7dCa&s7ji#!Yro88LE=Lvfg%~QnLwc7`lkN{%oPz}Gy+(mI^gR>D<<rV
z68&$q|7k7K3or7K#v%7W9yNBZhf4Kia)chURj52Kz<GSQTX(W6rgkLNQ6Y+#3#bCO
zT<+uoUp4^Jh%D%!<EqHdy=wxrh)Ah%M`85R(@XQhMrU7V@&+X(XqEfe;S4-Prd<sf
zU42Vv6i?Pi8a=%g@`z=~$}kMES3p}Z!r7O+z8Q*IQ2Y@3^j}DayktGA!qi)@YITp8
z0-*b9$FU7=Nd38}xH)@nBtAVDxkreD&80iK;**aWLUAMbqg-bu{=9+j+nYfB`vev4
znnmxDvuu@Qz9)blj1(M&A%t!Lr>TXAq+4Z~a7qtx47UYo3|LwkgWl^F6+dw0wc_~9
zrW)*^q`A4e^D)%A5k-f5P*JyJ##nuBQXHrr#_%AGVWRWpStPtO;l{S0+<QyI>UIgV
z?OM&*!M++B6|4s4z76uIZpRwB;L;R<nVH2Ec;nMio%2M`V!}dPNz%bDai8T~|NS4l
zywgd<?>YHx?Kh{dv(t_YU$3WNj^s(c0l%H1Cvy@Dm6cEn`M==)+qCET|Ly`@DS|{)
z61<76nu#lTY2N_J$m=zIv3AGzBJBjOB<p;(i9>wd#SL2nVJ%`K()gGtbz%aq!6+v?
zRKr_$aZ)}a)1DJd^LtXeI~5cEPVb7TA1(88Pir7K4ZNS}@ibTOwVXduJ(XPb|L2I`
za5M`~v@)Xa{*E~P?~e^7p`6NDW4#8d^z`8fVTpmqvVUF;oM3i(w1`;V{Ek-Qh<crx
z@<?I@=9d{RX#H5p`8Y^YAi{Ob=RD@HHFW>V>b9g@+=vl1;T9Q;Pni-N>O9Q{sbl4}
zB%7D~Vf5FTC!A73n3yL3$X>Q9KlUDybHwFWphpi!@Xt5)hz$agy=$ZJ);q}bbJA}h
z69uN^`vDl$|AmlxTD7pPg>WOCCcek0GgzV3n(mE!ELCbr2p@(j>{o}E8!O&p;L*`?
zVQD|X)H7Yq#>51i!qtJ@>p~6$>QV!l4_5?FdCj+{pEGnQ@bbdh|8PsF8yzb#YxURl
z8DQZ=uhT_sq(sbGw21eEPt|vop!^r|8>a!(p^6pa2Ym7hSXBJU-k&t@I3=pgK;0cR
zjIEdq=vG5f<_i+@xOB?Jzs_NH|8@788i?-t3=Vq19jwp5u<3t;mA7*kUmISSlJFZt
z6gO^IXYo9p)2qk~X6$X=j^frSC_X9xh8tQ~IBkCN+lWcVH645p9aLj;#_$$k!tfpV
z>&_bJH-~92%`7CZZ_(*F`|qUh8F2Q+x?};*$XL028pkpr1`>18%mrbs1U>VilDQXL
z#N|TnnRA$uVBRB#aF%p%Fi0@TgFoBdkzsN&`z59RpJ$xZ1baS(Xjo9@Zy(5`LFf|n
zH51;%1_JIM=O}qPy{;1Vd{%v1IHfc}8AiP%@6j5?J)m<EOV=@@SHad4bn?4B_Sso*
z5c&zyA><ICs%`Ru35}bdQO@-2tUZs$>3_iRb~1FODCgykcon-JSx3D!wBZX1!LhG$
zSv(2q6`A|ynC~HU#J<M;E5zCmmNdXGtUl%=zgzBE$-UZ1N7pySZya0L@3e0y*>eP$
z>%P{`cL`Z7JUSHcnZGIG68VFTt-chh8KE+ihyN!-St;ZIA3)`H$&);A)nUB~Byp#b
zArOI!u*<{e1}e&1&2<1UeVB2?<)C?xFYzA9hqG7}$`8G{34@&ic@`;xgn_oMv=Stv
zf0AmfL)Q;JT7s2Ie{Dz@d&H}1zuin8`o}=Wwr*!epEw{X9$|1$HYXC1W5#;IN0tEx
zXiR~O@)VFbbnpgMML^=<o39j3YLn97oo7FED`^9<8*SG?Zu-Tw?q2iVehHOV^w>I;
z_Hyuj^|9LkvA0GI$~C|RP(E5fXZtr|Uom#Zlbr${)~cA>w<bd<7}23p*(_j!F@6G=
zjY$T7g@^$Oq`q3-m*ZdCD}1t__p=!kqzA;I8p8FKg3b0V42pZ?<1L13Isw-{$({=`
z$7b}sExY!o=riu(tD+L3L(|VDi_;$s+#D5GXuq1dHj*{ijE5PvT@b4gtNC7&SmrLo
zNOs!f)MMLE@IG>iU)QNt2S0z3SCgx?Fnu}pGiwO3FeJ6smY0`T@h5I?USwe$5C2BU
zM!|D8v*Y03bJ`s{B>pvwV7S#x=)4NkjGEEVI-X+N+u@z4)!tPIdzE0?XG#IP<0mJV
ztj&+fuv(;$w@YD=?$%wTxX_d)@HK2>j4x04(Q~au3Ru(X{)bw(65oREqnoU-jQjxQ
z<Xcxn$qeZPoyc!jc2cd}=-cCLY6w)mej{5yYVd>m^_7T?j~1%JkM6v3L|<i<GTOQX
zXCPYiWQ-l{Zsg{jtVbMb`|8c2z?lQA*XFhpd6pip6S?$9#tE9H^y>5S6@TEdT}a7@
zpFJ5$H8iU;g?~cf#7*wpyGGkSs4oYmu;2iignDwobdeK}6Zw5@ssz|OM-uzV*fKv>
zS9;~zaXuy{QNIiEj1wParzmcKbm^mAD=Qqm|13^$^;KzM?eAqJO!QJ6(Uk)xEpV8^
zP~ZJUw3X~WAT#JslK?A{<>{OmmX4^&(qE+bL;+}h2JAJbR~K2uUUt9vp!7|TjUzz`
zGtd|3!>dlES3FH2T@5($4J=7vus9E`4P;sL9*}xF(}bgGn`_#);W`V~<j8#@=)U<m
ziNuIY`NV#d%~AzDI4B9I>ZF1_EKXr~9!!%UP37N7b^R)kaQ!XtQpWq&Vi8G2pKsk4
zJvU}W6=!|8l!@6mK9?s-=6i7nyypnC7xOPz>>X2pGEDB=L!VdV5^L;$g->A@v93V8
zS#+N9hFSuMb?k?|RJur8zscLNZ6iyWNhdDbm<?_{ciuXDgg_f7L-Yzb#ds6q{%s;q
z8Kx<4Mbs|<C>i$90SMSz)Bc@VQO=?w-r77Be*t=Xeh;&>ch_A9Fp>wBj`{Z-U_x%g
z`}ccgm<iyY3hXEb1qMGG%fR{I064v&m*AR#@~?%ko-8owsgJfT^LozRm+mQplUWbc
z{R<2aEDA23v%N9cNfpU=2E1q_1BWS^G*d12Ydo>_(a>+kgMUOQ`3ofNtLYCO{balH
zf7qRR42SjJNuTgkC4bM*%c<UsT#R^?pt$BP4b;9{KCwPuAYWuA35@+ZAJ~}$SOdmw
z2<Z3z3RF&}AaVDDYS|dkb-Oy_YU&0n<&5C*Hsu;}f^FwpdtuA5t(QWE$dJ1f8H^k#
z8a6-q7|ut@BuYjx_ZaTW4Op6=1uVd_*ue4)cQLXW=>_68w=bE;sU$d~xw}=6ZO3>*
zYT`H%D^WKe(1kqw-4=VKxoN3GjDIEXeHn;A7(m*y2+-DkhcST}ei&qCbzTIj$QmXP
zg$-V8wqYC&`wgl#Rsk!ob{$@1{rZAEAb?}Z=Ri$=z&3z$hXAx<$tMQ(bIV_9g`VXs
zJWD&{n$Jen=3SlLKmQL`?*Y|x@`Vk@f-br?iU_DELP9lCq=*n!iu58)KtSmokzRwY
zC?G`$y-Jr3N-qJFV(3*MKq9>pLkkcf?}Xj`fA9NojvfMJelvG&dG5W>OkRB|*DRYo
zL?%0|_<T<iJr51-E)8ca=%2qwf<dIE!LC6vE^o>fQHK#=Q*Y@7dnwHTlt}{)26~e7
zKriW<VyZ%+D4NpH@Niv&kJ;;cl2F4G|0LH2=hZ8aL_1*AO`+fomsLUtT3|ufz5?wj
zD)ekfuPFp3DL-{ur!2qB`qi8>@1ALDv_hfSdc_y>PBCDX_`?^7wA_eWPSck48$5M$
zbhbjJ(@fwb8@A)$ErM`0hmhdHaf~x{{aneP&gtH_KZCF-fB%{rD+{vlQ^<+&s;7d2
zUN*&jUi2Q}kUkBtBI#4WaY34akv->Y9mzbuRV~stb5fdDQ|vFsS~o;M-00(zF}qDZ
zR)$7`OBbAaw(6Xg1<%}ZpL5m)+`7x7w_HzNSa<|0rEWH)U#aZgyL(`_m7e>GUJs<_
z%P--quQ93_obQ$QlCu!q8btI{UXyyzwdMn#t)F=KZ|O~3f^<_At*aRb^Vmu%!6qMD
zMu0U?!%xNxYNbIc$~=jy!iWdh@#kO=LJX6Nlt#vLcEv{Wyh`I{&fOXKYkylVPz=5Z
zmgE9V^4MAR(ScW-`g1Oi_51h&_RURwMRj4WClz#aIG<(M4LFjSSF7+R4%b#GO+G&R
z!zKdRAE22r&@zAI7Qs&fpn<z!DUeX$NT>!U{iZtk%8r=~tTZ6IC(N`4*u0=1KQU}-
z)L8;&XzHpf9$9U8Kpm;cM~Hvg10TKQfg81$;A9v>o{^UM&mBo$rcUY}@d95Qqt#sI
zn4kcfHJA|=A2)nb4z=Rs**=lxvbx(*Y?VSEoVoj&v{Sxe`}Jl2Y{!gyeXio4cqZqa
zKOh&%>43O3pJy~004-8TJf9++q11aPoe}8PRp3#%&cWi}>!6u^xgUocXWof3F<N$M
zz&|WVR!9!lDHM#{7*?h1P?pb9{DU^z&D!;@`h)u;q;0@hE<pNRU@x9uI-q+e2R4AC
zB~b0tNf7V?SS*0DZgV9+*VR3LRTa0LnzV3KZ`NKEexqti-2x`hjMzon>L!GS>L$KD
zLW6;Q8Zp7~U{jzfTc?N$#O=jLu#ct1@z3O4z?y?3)$W}y2nm6T`fW|RAf<emp2OID
zP1M;6KR;)mldI(|E)T7eC6=GC<^rnqTt2y31OBgTiU!^VQvTGrlAXTGnxoC*d+GG)
zuZ!!*xJe_*epTGjgju`8pRlj=cS1;hgG(k9rh=HOsvJum_|YO^b<=ntKHzhKOX>dC
zFZEqE;(z(-?&X^P-OAUS(llUa5BauCkt05iKO-|oLdP#nAYT>tBHZmc5vU1e+~x6`
zh+SN&)Gpe-SU~s#5J9n+<KIZ+?dhtU-f9~iyqD;Sxc44tBl%iVvyjBib{{rhN5afO
zTK)6X-0a=tzsGM<M&an^c4Rhm03(>mTi_+B?((%bu)|dV8ID~pBx-|n32viPe>c)a
zX>*}N&7N2S(@o<D`$oI-MWcUqpA}c8(J$KpE9Z1Tq$InqV1fK3<>(dnt0)UYn7dbe
z8!g7YH1CvfO^|;@SaewiP8nX3f|<$FT)ac@!x0+Hq1e{Lg|)bHD@wy9DN)i$BOzUA
zd>@fz<*|E!ynUnQulaTp{J{a+B){1Pm*PIT1Oy1+@qpOqW{2u$e(D|hU1&Kil$dLH
zkQopKly0>9n;dFM*;VrQTHX9UOMCb@(H6yTT~&OT&hh~YUKWuPWq%*851~oT3$Az>
zLp|3Ca$kZo{$K;X`WRoIW}Ayet`~?jwz`<a;8)}*wkuUfBokB*IfhZu4|7TQ!S|)t
zCaxy~JgE`tzvwRg9lZJ{CbsS7z2`r2i=jMRVyvpWH3k`GWz+y@M=|~7n-uf>YHRiw
zL+6u2`ofV}cz>Cy$`Z+l`ahl&mVO-ZYn>~VuOfJM7qZWPkaQ=&)LJ)@a#3Yob!MFS
zm{8X}4-U6v;b;NNd)F_faGc|TJkkgFDuC;rrXfEyo^;drAG{vmd)o8ec7?PU^26L^
zQvl73?*|XINw_-t=h2UTJNL;y{c+zgPL1hFCa)hi=jsQ)o<57m55BkMOH>#r<6RqQ
zAA2uFl2P2Vs8}C2gGUk>OY1pis#@!j<h3pM0HS;&Dy}MOiRI4H4-bwzdK0OXM=}DS
zOLqlWhB#FSz%okT#{i6E1H6pFo0O1&dGhr0X*1X@Np~KlP{L;ovF0q5f6dopmA4Mt
z!a!kGw>PXO89H*yp=ui=F8LklW0XmfTNAqj1|4;CkJ%D}Sz%7tDfj)qx5p3M%{Vd7
zj)Lk#Q5=Nc9S%(uDqOXUGo9*|`@NgJV9(N`*0MA+6(ZL6bD@*A%*E7K`Jcxs<Rpeb
zEw0xMEQgqKHpP!v=Onm)A1C>DE;&%<@|SlETk~_gHphz&r}~wm-uKv#N0=w#zs4O2
z?>EG7m~EIU`RBpK3HmW7KT+Mf^r>tyO;(|Q0c8M9HSknTYAq@A)z7XZc!oy+k9cxb
z*4!6<B9LA|nJaN(tKTDzJpIm{b)3!LMBPooJ$txp#y!W^-40KB>7Q3bzUiw*lJvFg
z%&rI((2B#-t+|&MMV1LhH6Cb=EGf*dj^Q>LG$D}g`ydp22X+ei*kV`4y(&B5H0||e
zEr$?fAeOBk9TAuk6iPS;P<{?g+_$yLTuhc1e7M4b6Jjv;oj_Q^In`j<+Lc`*%E-W1
zkPyD|B&n_Bb>w1beSK(`n3C~^-1uOQWVye!uyC9EU8Jlr&TXh)A6eOM%K#x$@y~zQ
z>i=~X_5clj<bs78rL1Zvr@~$6*)FxTxD1~$^&P>e$+eNBxRT2ab7($53EsWk4_<90
zN)oiZk*I#=2_Ch@oXOpt2E6NjANlK(84Kga!#3YVLPGD~R<4xqy>kUh&>a}FUj}#V
zr^~@Y@+))00ypf6J%<#d1gv~|@yb^KBNo!6a>mqDoI_%pIGYS^e2`WVyQAv9Jo7Wc
z=^Sh=#)cNSCGTJ39^Kn+CDjAVivqla&0u>*dLZVUD#X@NYOG}(aT_K|DGg%Xz%gmz
zuw`E!Ar39b4d$EvW)gA8$2o(}&j!vnft2IKr`Ny(v9tj<`S!2H)AuZ8U>cA3X4-=<
zl$%+=rng*X%f+WwW24nWKx_p+F|}(G4Me$jlxJlGYdf|E3$#?WUTSR2CC9!DE{+6o
zW+nphYV&JU)+OZ87}3E}u$dTUIiZL+)Y<VN6cJqQ7Z&dbwu$LxK#HnB*nNHxgvkpc
z0D%Vx0JD1oFuYP3_QBL@$Y_%7-<|#0Kl0OOlD;XD%?(`DQLH!tmws8EvPKNyOQYiW
z1gU7wC_}m91C;IP;A<@<-B*jG+DaEaorwW}8eV|+acUrpp3?Je_i{Ru($l9YdjcX0
za)x7I^G{aUda?vOvW@D5N9e8Qa(mR|xRDV`{uwnVPZ4iMK9FF{2JqSy;O^|@f;Sl$
zzNF@e=t=zPwT-DuTRV+|Z@TsxGkWAimzx+P7GHlQ3_f=B*QF|Aju;sc@lIsT8oSZP
zl3C2=zJIpZvmDt|_TE9V<RaMP=Xp=~>RSOGfK-%rEUZB(V*z__qyBxFMegWjQ8o3|
z60?a2JUd$tHoSHzlaRV{WVj<5*+x$8b95x*oN5i={lhhj@^0Z$89kj8?b=0?yit>k
zpj44HSuF12`yAx2#XG6&=laea8#y(regT&Hzcd^Q4E>Y4Zc-pai7YgM7i1LySbYaJ
zyvVZ$5}7Xte0BG3m4EP!6qG}KfmWXQH2G#H&9^i+-|gb$=N|Y$-o<Ccpsw_)`3M^h
zt>hl{B=-&nj3Gfk@FXPY+rLm2BK;(}q!pyMrP{h{JQ=^qa&=GTY6m(1Os@FSadzTS
z$5qvv)s!sU9=TCqWZ@u*Qq*WM=qNnyhkv#2<oK*;)($+4%L{Ye+wQ2~?Ul&Ua4r$l
zS(di^H+cL>XKG5l9o@6JPSx5%WQk!mNotNmXY>8p{Eyg`e(oM33hOLekvy<3{t({g
zQ70~U4?T7rT~m1Ss%l4u^}yW^#Ue}BYXu^h8g!x}<KiMCRirXkFF0WNtve0(PVInQ
zePE_S*z<wAoNp+Fe7c@128#*MraG)3V|9Bvyk+I?0z>m@mkZbMYnBx?8(F#1KKPe;
z#g-imfAyQMAF9gxB>gVAPw7~97!Z$k+Hkz<UC<@x6ce{`cq>F9$z5U`=Z#optDe3B
zRO7MW356JtU-unnM^vR$y7pG>ITOH(muU+AfIDly=5sw6B(L|HYJ>9_?Z4!9j0iPe
zQ!&tEP(^0DQ6$35uaIUOFXbn3s7S(llng$6@ZM2-p)c&gLdavFD@B4(#EAca(}ai?
zNbsFZ8qI4LG^9^Fsh|VZhcmz<vOwoYqW`a??D?ez5CK_q_hw&R6$w)kKns{MKBp>X
ztO_HeYWVdA%k&Zfr+(R}@SBF1-t-+TOLmG=E@J5@!uNS)8q%w5_KMqGZ#!qj;^_kK
z#_e$b&dh#w#Gx1JBsh2R8LRY<Iv%H!-^~FgcCEGTSw^YUBh3o3!-2o+j^vKY2o|PT
z)Mgz#G0NGEA6@mNG&uG$!ct^_*`>3(0l{tfsf0!fSi0IuI$+Be96DWl#doYJ$!2!$
zBTP3Td~Lw2s7Z`8E$}vwsD5Db8D_)D(-@$oLE*zux@o22zCzj?mQQv1vqCdlkD%7?
z5n~n=ia>6y`E+wAbS5WH)I%^flY=2<+y(e+O!Ar}k^p~jB8XZM>67Lz{uq?-?-Q;m
zAH(y~h{B-rX(}JumUw@)VHq(YKX%*7`{REsdqd8_Y`%7!4K|wna9!LxtQdJX&dZzl
z@FfLP10UXo`@bhOiqs%YD=@ERM3sPh8>}bJ++gLf*^r^uWLz6#E{?i{OD=N^`W)dp
zlOfNY!Lp>k17n6LDCx>V_3jnzVCFb~96!*Y9q5Xy{#?vVAoW?)OoOS{@-O4e%?yvl
zdlGJaX||Nl)~|l`g$cgL)z*~C`uma|CK8#(yd@5|22E5OtK@O1E~}BaP14aLC`5o7
zHCd=x@?ZaYlBTP`xlq%@c$pkuxrhr%XV{0Lr)g(cCGs46!Fi@cLAhtb2_8sPW_w}y
zdSzp9e^1q5nmwi6ak5YShL3g%6Fy!YH&2GIUY0`ux1HNa*3$bzp$!P6F6hDxNKbC*
zQ+3e5DBDOZGHaOnZAGY)ZgLh(i$-~{xN+)6?a{WA$-|@@T|NnS6=#6e6{rPuhmep9
zp+{+tQwP&<8--b!Uh0ckLHFfmI53`w_<Fy^_l`rw-cDgalJ*`QxtTq??u71+pZ-oB
zJ&hIpEM8=-_M2`Ld;@$TPV?6F|03o8GT5f%<c(=X(U&)a2Cbi&-$p&{%jXeGxE`jx
zx0~}aDputJU*g2?aifIknWfK0j=6}iqln4c+jo}Ko%}=^yW{!OW;n6I<q}bwZ4ngf
z#Xlw1y%YsjBg!7%wyYX&moMOZkdhuFa-L8Ai@*&EXXTo@(cWjoukPi9KT-`L7zKwX
zv_VE)CEQfVW-65$lm;LgZNf%<!m~EDTBW*|)3U_Vbt^n<cZx&c@>3i){B(XR+os6T
z+Z=VeDh|xG+oPw=g<V7$5ARkDvN?gh@X}?gbCB7Pg2#HoO=PhGRdXusmxQC=EsHJf
zb?CisvCQ~A<G$Q`p0~Ht^})|SIi0$c1lApP7Yfij`k7J%>H)WOsWmCG!ar5HKbpAH
zo~`qAzkw|e>tW*>UUgWd^Ca-f&4h-)&S$=)LllJMe|BS1?GW?snrFLqh4r#it%D3(
z-S${_l02_UP`~UQaeTk@#`12s#3sKk<Ell;w~l6D&(`mLa+zdLhm}QTc%~Kve?j=o
zWum_?(?iIhstVZw)ej9Sh|r)1l8JT3KJzk_fxcOMI#;0f<&!?2qfV%ky_HTs*dn?r
z6-J}DSIly#v+D?PQg-dpo|9WUIq8;>=;ThJW38Kvv9bKSYpT&gt#cJec&DRBS3To}
z)ihOJX6}f$->h6%ynaDK#;#tUxno?ct=W`V$h?D`?|3|^j^5rFetwqK`qHt^Jb8Be
zgs@IX$zuR-&K2f=+v5~&vwjE^<}-w9BIdqHhlDrMf;w9n|E0*<#O$4|rbF0v51tZM
zBegIO_hMf2;^Z=IA(~Y=EasR7VyeyF?mQXKxw9ZC7d3jFZ%2c8795SlL_p>4up+*e
zhs6ouwx0T(9O4-sRNPHEDWFVL8HzX2;zp~t`aT?gH)8fw_gU@v@%t8`h63oa$wxCu
zj4<c?*|^|4k4yUNa4wtEV_nv`L)Gw`U!(8`-9F`dZIud0*F(|C+VmtxANLjd2Zu0*
zH7r*Cm9hUVnMe+IEBET55wJl&J3TlZu0COBF{!I)FmE94<VGL{%qC7$Q2j=L-{?PS
zRX`R9q1s)H6hUWqDG>`L<Zy7yZd;Ea|2=fl6CL{y6<VW2JFL^ues7N(1>BRdw6e(P
zzQVPYal@HBQ>A)Ug<XsW&FOFlk9zRr@p_kJ@*1AwtU3ellls~Xoa0W5(2=_>YXUC8
z$vAfHH~$H)-uw)|wb(B1wQjk7-@)8dEj`@0k!T%nf|eTbX0OQf_O(mAJw5F?Io+42
z0?FIjwQN;<D9A~5Tu!Jfh$E+cd8|N16?m{xVY<T|ai@2G_ms|5^F8^h%J3~&yHH*L
zy>ee)Hqw+O&8yRcst0=2u1p%hK0!ujYYw!MiiqyNYDMru<NK3!V0YAjCU$7Q0+BRW
zCg<%3=)ghTQtiRHg3glCZH~V?d=GXm_|<d8$LFLVFVo+#3OQ8lc}bh)AYUNZ_D)8^
zj|~{$SPA06j#)}Lt6%jhqZEp@hwWjRWkWA~iIZ&(?){V1=~C)bLkmuZK3mmP?MM5-
zUmxTA)40rl262Jr(1V)ZM=;G(ur|@F*YFH#-&P7Tm>fT6DBAdMDrvM-Pq#ba``Vq-
zj9<Lz(BNX0@HFjKyZWeJfOk;tBqG`PuvCW8>9rii*s^oRX0bhRHBJ0zaq;%#ZvW%J
z*u?Xo0O~q0%h}*7TFD;5wtv(-6S0MrihX@9`Yz;@b#y#zU&}X*TJNX!gJORK)6Q3R
z4s}ffJ&?x`Ri`+TRTv$0w~9#<g+M3smOH!WUX#^({PK!ND7qe<Dh&yVHMuu(4ui)<
zwullU90ZHdNRqMOJNNqzFvRt8hgV+Dt}VG{O=;j<bvfX7%o<1=#!+4KM4mI2r+Y_!
zx<{6TM#dEi$ontWWgh*lSA^-TJMhs|&##OZ^inMO8}_rXz82@h+DVLDa@|QT-1(0S
zaOoy8YdcW-Q#P1&0JXG#Tt6FX0VQ!EXY7M!KH@}$Tu3X?OI!dwo?k#0h`OOR-b!b#
zbTIG?^?xB<-*xxK%_nC~Kkm}%#t*UMhZ-b7YN!{nTK+04CM1TZjofS<s1!pJL!7H;
z7yl`r8UvH|k^;rfqL5(YmV%NksH~~Ks`JCLAcpo!E|y95L?^i=$%uF(!}fYmv%WBY
zl=7(v9`sT0{%31;MZ&=$KHjbsGpF~ofs9-qiN9jG9Xu|&6)YiA-jMO+T8gF`W%aNv
zRF~D<wv?Y&v7R9Baxl2$vGM)&gByBsw>eD$r|S~ySD$_+^nM=MB3>He82(0!RKI1Z
zGNjAfO3I6mup0mEZGV*)nwa!Cciy<z?q+3>kpMc$e4W^R>GfP${%;y4Wq=a>H%E}}
z#bioz<I-0F-{)!7W-@8@Gx`oS0~gC&qe+r(SwbY?O%<{)GAw;qBT8Vhue~n4UzK5U
zg1t9}gtp^g-6AjT8f%$cl2$F;pv`6=l1`hp$vU_d4)~^pY<pH}+Lk=dJy<pGYP(t{
zF)VM8e2pYgCTH%O>r{+CKRRPBE_mM@fwI|LcVKr2@9RIEl!Kkwj9n_Jr_fh9DMU$m
zwZG#)sqZuSwTNeG_QqQl^Kpx?S4DA@IQl!jusWCyo8A?LWBcbSFB(_OZ(Q7-=g$Zg
ziADh9NX&T3HcKYv`221$xMRWwseDO|NT8HJ?MS_TM@?3!Q0a3_Qb=Wxig0c#=w?1~
z<iWBFq6f|Hw-e4Xs4d6ky@;DnbRB$*mmE2SH-20G!RY=l9pUwE<8x7-$l>r7awGhL
z-}H`EMRujZMA}Z_+I%sexaV}FeR+nt3xxa23_h_khU0?8CFAYSS$le!DpxgT{q($E
zSk~ZsH75Ut-L#oqp_UlJL_y_cdO|x|1Qz$$*&;to%zXNl5!qQw6Z;^%=o-H4OU6sO
zKo!Pf!Qe9MFMpU>!wU{E5&&nb^uH(<Z(M?{i`ou0${<gX?8Qhe1|rcMX^ra4Y(!!%
zo&~<b+3+j>{z91dfW2HaKMg}(<JQ4u3@m1K=A>})e+kY7Q2jslipPB$h6(Lt%UpK)
z-WP?dNT$`MwGCoWN=PW--aHF%P0NvaH2(|K#f>jE&3CR~x62WGt-frie(fAQ=Rl(}
z(*GUO4C>oXj^6DFnO*Bs)?`EOd#qG#;FRRgmUs_g;uG#J=uEU<ueU9Nd({mcG!U3P
zPM6kcQ=~1P(0#sI!hP!|0Mh)kIn%-tSM=PgZw!N=Wz8kZm^&8yW4AaWWub>bE#E?C
z>dbFyCt$^dvSYm?ly@@e+X$f-U7fD(FM#iC35`p=Y!xiOH}}!sx3^R1ep55OUF98p
z#NFBO9q!;6PkN?s-6+52;QLlt%`e|Q!Y4G=+Pk?>=*{9{2<O!bx6|qtz6>|KI`#4Y
z*8u<jN)>&7IP$1{rH>4@%4$<>wQ&au#AJ4VhVTcN9V(BeKn2=e*NBPCbRS>-LmLK<
zf5>}BE1960ES~tHgqwVCHtrWo$FAB4`9R`Nf8SuY$4N|o`Fgl=mo%K?N{S<Ra|oda
zjh>|L{0e^jC8xe8fCYFt&^zV_9`By0C?jkvFCxJcm&91|dbB!EtXoaCjf5+-1T5qS
znJftgy3}g$!FF28$`R!|WoQIU!_^|LTeaH;K6LaI?y%S!!U&B|i3}O$Tp}2~S`V&J
ziSi93$XK6VsPMRw{nT&3ME8;W^8Km%XNPVLYboy<o)lQ&ZNR+IX_e4yCAP3XxsEsp
zwPTaGGLELms@q@23sVJPbsb+QrmvC{0^`x*PVB0y!dz_~YVzEsU3;?DKUd9_*p<so
zUxjLo(zY7ckgy9;_FB`G7I*2jSpOAVp`$fr0VPdmgY&aLSu{&e^MHU2xy1sMf!ZXc
zc5omVYN)#G$P+%w?w*U4R+`YhUPkXMw{{ILWa1C_lU@lte2H0=X_!-Zv|TZoP26^K
z82Y&-7hRsN?q_3GzadM{s~J?+67G#S^2VYn7E+&f4n+!Ud%T*{WN44O=2G7FBQ=f?
zI6&^#K4IayRP3T&Xd$?K_jX#bm=CS>Nl+Dk&h~GjbqpvVd`+ryHg*E7`CgW(PvtkL
z6S7_3t^A6M{DwIw<hd!9S16dEZP`joPU2hFGQswx`PtY82E*2`h7F<ADX*SUr*L3x
zfhnyPcr&A{!n=R4@Uxg#18A+q7!bs)4uiUF*TMw7o&Iu(GH6fU2Xlag%|kPEHlgtj
zpeB(#I4{;aG@$%lODsV>C)OB1w)#NOc3X5zb$<BBXMX2+_1iGr_)yO^UwMylvT7Mp
z@f)v7kKeFCPP(wciRY#d&|A4Ur!aTp*BdiFcRPC!W%KXk4-+?MqKulL|0P{i*aA@m
z?Om=HmqB-+H7|jNfj6Y@heb#Gqm?#~+#TV>W*&T3;g<}|wrIUf+TJ&OMTRvy<0i#_
zIm-+yRM8$cHz1ok^0QJFSxlO7dS>Z=u-*AZ`va6JgC5DU`52R)&#Ys_?8d(ijlam`
zA+T_(*~g@3^AC&*lz)`)LY~ydJ$n9x_J2-7AqrKV?>l4j$tKxA49%Uq3fD3gF4OUA
z*49f1)h=rc9@{J4Qr|+>Hl~kIJR+6`54EBqRgTg^1<G^BQ!<`MEsm`$pl$gjC^~jy
zH6_nB+u|L6&nVV8tgU;M_;#fsO}oR}W+T>Xy4<pcYr#bUdJg<ph(ZWRZK&PhW8z0Z
zBGoXJWAiLfoz^ib{4Drq`F0)&JW{M86&HSaXj!&mDu)>i>)b;f)+pLY8Ol_d(Edt=
z(4MmpdXZFKRpo<3_D-qLKA^ND-cZtQ&8~j;<j;1L`-gGk<up>qeJfx8y<)aWmjnq)
z3pQVLd1QN6CeLTR;Aa%N@FwIRN&_Sq6J5en`C<@a8_8J4Di}<o-~DpnTp%jN!W51&
z>NXVH%Pmpgb1Q$Aw(c~`t1|mR=t~2~oxGrOPG;sAAB2)?hMViV22ze4Lpw1`)hELN
zqzngoMce*cV1v4+gO^5jc5xmRdmotk<bnEgQcG_>PpQqKG6s_fV4>D;b>@%<5Y=ez
zwQm@eYV8r-gbmROrL<iUCe^HifN+WzR-ytijPJWZIW*fl^Lwvmv?V1&lR#*69?g0x
z%xo0W>Erg^c#<m|7Fn&lWjwiQT=NqFL~__K87Dq-Xqytz&RN%I3LXy0pi)1i=}P3Z
z3qVAt0ph>q%^g8VD4jOff}VrMBu(I36gDisMpSMsHNQLZUW4tgwD%~q{ZQGuB5L;7
zrsN(`&<KuUz-uhdD01}Baq2q>8~eRFDj3l{?Au!Le3(W#=stam5iF}o3c&T_Vguxa
z#dMUBb+O6?HV_GI4Ge~cGBB!aexzq4c+WH3z+EV&ZEcBMl}+iLd?z)DzwB-mI&e4M
z(`}Q8kfaN6_003Z@s8+j)qBhP53_EscqVU}RK#ZQd!L0o{|h_`5`g`4=vS~sxp8K@
z$M|_z!YIW5t_#6wqqolR9Ib?nAtkNuf*&@eqqp*|Zi32H?Vu=@(r>a+=F?)SvZgfs
z-goRmlZoiuex7_=wp^d1f}hdLc5GZ2V6xV?sQC|-p~Lwns4cf)hTb&X>N7}Sd59i2
z5W}?aplV{q@Sy41IvZn>lix}#VMAm#`mcr_P0S@Vl1=kJRx_(+(4dI#2v5MZ4GJ7T
zuQrrL6^16)SH&Rx%yiwo5>BYbEXT8fa<cU`V=d{2AVxtT6-i5k(n>}(!C}|6iX2d6
z@NCsA&|@Gc{rEgg6#6?X<GElhh9UPUff!u0tVeikf=K2TNMbcu;8khEtGc$w`S0_t
z$F1J2g70iM@Byw;6tzbV3ikXPC#Ct42cEsA>H5aqK$MK1Q*+=+HaCsIJer@x%Nm2?
zyiI2BpCVh#9!fLY45<F36elOGMq-cWg(pcIDbHTeZ4<N8jyT9;TsI-5{}H%YsC=3z
z&zk{}uRSF{)v!pQCDQ4izEO!{l0#*ab4&2vKf1M%gX2g|232zo6y<Sp=nXuXTw+w2
z_^f|+*e=1mRxpRP)tQ5i_1fkL^S{OZvIi%F9v_z-02$$WV*NCSmTJ;qdBt-<!cCa}
zfk{8;O&~2x(|iBic%z6*FEYTZxw4`3N-S6si{EM8XpVq6U@zGF>^%637w9=(6NrJ<
z*MQdh{TaRE12{yVBeY~hgPcsKz_{f2|H_zdvy1n2kV}g(W7m!t<HmjI?DL!M-Q`lL
zWbLDfMx^wc{HeC&bQ5vMY^T~udAw~G*Z1RaalJE{ZsQwxG%jh~lTSTEHObw`flU2D
zE<vs2$GP$V;PxPp`v5^pn~C3dHD$K`k^{E4tb^lRN%h1$IZ5T}^#kpRwVBgoiYZvq
zgqPBWv7lwfb6E)|G7j&@UqsvI8yH+G!}gt+saogffM}>a4+$6p3+uuFMn-d?7&?87
zigGk`wa&p3xZ;Ow*TbeBt9&I>=7WXyJNtR)6=$-cnZ0&i<E}#zexxatVCE7*W~52x
zwGm>rYTeXY@hHd5ZqPl02!8|!H$Z^uq^b3E_GzFyZ)3fIoWhhRxe}vE>PPx|8(8<i
z0%!$gqvyh5YfA3hwNPRM1H4R#C*HG>;&);wqSGyX3RKiI=uk@16`rcY?IFR4u6D2q
zkWvQ6Scz<4KC;c`c^#|Hg89O;dbYM|<aAiiqL4@GfJ_91gCY`k+|D4SRtjK>1ihvT
zMg;Q)!)AB;0o~DB`G#%^gb2h5qzVbB&3+07>j#4|sQT{(#gOEh|H3}=6J*p{!P~?H
z!`El$3@2lmp;ZyV!p{1|Kf-}#ly8a@fVuofaQW0+JAFFzBXC&(K|rX-Iq}=rCsQ2s
zG^krQcXy0jCMiH2i1(Kt#}$s;6^J=Hn<kdo_|VJXlGIUhD6>)dhic~c7^B3Mz!Lw5
zC|^B6LFg9o4qb4a9BO?oG~f^n3c1kI`{%8j+~}J|z{qd?MfEDx`s>k;fMmOAP=J?H
zM6DF8+>R0@grNFuQ8~M-7$9AY7X6@S>Qh+^%uD|+{42W`>;CSQ;FiOgd)+4A0-)5g
zAq!{_JU^p$|47yNs|w&dUdDm8#4*XP<<|T+#hin%)}PyuLczRtI2*VB%}|~Tb;0$N
zW+3mcF!hz@_TC>qLJ@&t;k2Nc)yv^_N8DeQ-MMY|n;s%H1x>a{2$-kBNT6vz+KJU*
zDbg7%hSx$XUPc9XzLGP;F~W?aNPFfZvmGdhq~gaDlra?R{wk)(C*gSu%u~O(LIpd~
zep=c<#k(=+1mqhSjLPXcCcj;6B3z!LO6N)$_~{@hGAV?BHiVHWZ}QVQ8hXQarrhU(
zje@M-8>e5@S$JdPiw1|~qeO{2$n|0^@Qgvhwpp4_8J`|S*Q-0lU}#Fb9<p8>28sei
zM5mck(-@RqL5)P8IKlrPLqUtU@9DARLF}VaM>)F={ModqPM|=AE1s`+_6RDckaHO4
zkuqSV?ikw0L<r+(^rGli`4NWnv<xkxoQ|Zf&*L?owWCBFu$z@8yUP`P6~m5AH~-c4
z<1Wf~@ob+^p|W1g7phfW$+IY?50VX;8SnOPe@eB_MA@a+PI$%#f!VtgM!8!xb!wPv
zLc=oS*S1B_Q8*rY!f@Esv8w0qyw-*#zJ^kDo#mbB>?>Efsnf@$;$ypPx%KXwqRIW_
zFzIG<XKD{^UD@q$VZ@`|>W^GNT6b7<F_FqXh`J|_BL^$D^zHb^4=JI}8#h=s2pmrJ
zJ$`in2**ZK<j4z$H%~!=694W0xLo7vHhUNqJdF{gPCv3#iLebKNPzj%Y*BRfTis-B
zW8w7YPr{O<_8lj;A`x69jC@oC!hgLJECrqxyP?DAwcL8PJWOJHSXnRTW48`e;5q_Z
zZZp!4{&hdXiq*tRA9~9VNMHI?ncx+l7sIqWpiL4WuS67-Zz_Cp9q*Vb@t!YP+u-;y
zf#;x6{!2l_^YgdmQrN%jEPUvE73MVYO8gqOEgsjVcegt_$TtS_x|oD(dr4hUL!n3j
zgc?bopGe?J<vSm!a%=J{@htGZbcF-g@h-GFAh)o7b$EgB<Bl9Ekl#Q!vQpiq^(T4{
zEMO0w#*)^|=ae%)XMl@c%61hYQI!fcbU)M9XmN&0jZPeYhxpci8qEI~QQdp5Vw0->
zAXo=B8U`Fa3->Td1*94rw}(N5UFf+DHXP(u8u#>{G134&*4!Ok90A#QS&A|jHvQ$9
z#IvuRgR%8OIFiUZx=Y7%)Go#(vD3p#3XrEYeSW+Zy8Mv}nn5xCnB!5d4Gn>HQc04h
zEn8P0-4-$HyY8D4USokM6-MnWu6XUt{5P0l`AwtO<7t!*Zoebm+z&cX%M8@h79gvO
zR!S|_F~M2Hn}0-Jf6N|P{noR2*v@^X*fpfS>Ef}WaO7^`zsql4(f`45IfZI3V&{AP
z&QN>nixrl>@UJgTD}KF}e6__w<=3qMB2zx*bM`V%{K3GLx(dgss-FUtBC&&%M%-5U
zO=HB@xwmt~>&fMZJC)nYiXg@El>tJe_Q@KNqh-@^Ubjv|V=hyvJF(Y3Gq-zhkz}t5
z2A=`B669oO^!f@lZufT%We^*>zA1W8>Q=*bpdSi+0x|GLQ@MfpgP%XtHjUj#NU%)T
z%{cYW&V?#g%#R<e2<OIN_w(f8r9#IEx8S5b+KY>CMjoazC#>)8Y40A-;H)p@<Ul30
zZ%nO)zGDXLg1Oob{K&IW;mfpO1BK;t%6r=gU;>(*(L1}TWRDWH8~UqFwy$j&<WQ|t
z648n%^3ZApU@Q)TC<XK04v8Lx;Ft#OG8ILza^u&kh%s>q(IL>N+WuqxfA8o)18LIz
z*Z)L+1fkp1FI(Il(!x!TEcjGYIKYN?#Hm018G;%(OKpuOD7(b`rnXX=stEZFPX(9a
z!bcsd5;&_UqzFXO`?Lc^|2lyv61}pf{MyoJs{f21;k^l3czj1zZh66Y({nzow(L3r
zG+hx<{<j>c3L8*{-ViGM+T<l1{I9hur0VRWI_OGhR=ap8UI`CG39xvUsCY}AjbBfM
z6Yv13dl(DXP-X|%$am6qT2GI(gelwN4`Q_Tzv-!k)di26JzhS%7kQ|1x7xcq@kK7%
zcV`gzh;nZ43hXaOyxjxg)Eq#F)pStvwbP54KdqBvsd90hV|al>1O&r9=J#^uwr%7L
zts|*FR62&H!A?u6%|GflcfYM0r@~qyl5pf^M!N?0-7ZJ}9v+Mm5NsVvWcC=04Smo?
z^7qtZkwc}`?Gw9v24jL3fYUTG8)sH*+ihNSFA3j_+Nn*((dd;JE_v-uw^#S~btJ_c
z%p6=ARzNozVC8S{LPb7O({xDxOHkev@tf;aR)2_a0GKBr%fhxT>r2ZKbo8#4OB?A^
z7mPpir6B19`skg9hH%1PKZZHSJ^2rpx$#~bq3GW+gWkIsA+1~vA1u8CUc7GKp54ll
zGGTYKw_eX<h0}ZbL29`Td_d#|eo%wO{hebZBfSKJPGvb9NKGk<cosB%+BOdLuxCnD
z{!5<>IJ8`#n(n3_kZKGX9bbS+#Ad<UBocYGzWU?p1k=hxzXgMu9;oGgm;dck4G1<p
zW=+GKb<DkX{I_uj!-KVR1t4RTm&d8JPalmtI;kTczp|3B^2vMF12wV9aO7)`0I9-~
z=rTs(hTDXY3C@p3aTsb$Qj5A<?>(6sLtw$kyZI{ZEFdlfa8N@*5a>-dy-7}__*+)&
zNj?CCq*89Juh8i1gTro`o)gYLT6S-KSbt)~pj!E%=BeO@a!Ki)aIBtGo{m}l-a1ud
z)Wg`undq&@&3wpVngl2M8sQPJJ^C}3TpLKbAv3%E>c}yFX1q|;I|F+;#o<(p-e<AA
zr(x5VTsg-^!|`2*tri#vUpK%BO*etNGO+&Se#4_+O)k2>ee{_7?%(!8Hz83p{o%kk
z<*s$LN+`i0gBN@RSn;!Stx<}UMFoNP_iKHXE)XTuk7Oz9^y<p;f-EUfeAAWjKmDOm
z7<_zKFcm#)%FWEx6aUsW_K^Fl-N<vhc6-B!U|}W}zA0;FD=yq52u^YwpYi$h0>I>_
z8aeZ7#jEYMKF&>yWun9KEWoE+Zcyn)_5y$=eJ>#qfmSZ4duh5*<B|l3<ri>wM!#m|
z9>@)jJnT)=EAmO6cty&a9(WeTEEzshEqP-c3(w37f$nA3_zF{ZX<;c&vm`U!XTFnI
z$d}M=&Da6NHg@Vr+Jno<>;c+m+b3;yEEE#p{V#kCP#Vjtrq}biIt*}C6B;Cgb)55k
z=K5FkhQdew2D`{m*SY2xEH13C+aeO?q_>00G;pSCg)S&FjO9mZHgi0vn(#BA{u7iR
zgfS->nM#lc4Q&J;*gXuVde5&rxtj(_t(A;it#EbXP2@4h6rvHC3U1rK2^`I640y($
zU)X!diB$TbdyQYN`?$HBeW&b3Iqt|KPe)g_%|r4FsC+6vZF~3@PXTxDZ3Z?L@J9S%
zH_#EZsd|HX);s=QYH5>~e=qp2`~5ou6Ngp4Yvqo6%Wbk}ovTLs$A+!gvFb122;?@s
zAE6;^s`^Us*Y<<=4ybd`x|-k1_g8dQB^VB>2{)0RBiYccvXe@`0gMeEVKx1!=S_d2
zz_v|REuUc1logL`voP>~J)l}~)@N(Y!-sEGI~pqyT#wQyc?}eZXEcvX01e|8M#mAS
z<5%MH05kuwnMhDXxdyv~?)VqUb)k{XohfziZf}Qu{pli)w4eMQX^H;V>=%x9ik0<b
zU;+hcjr+k2lv245%zHQ?ey-S6j-8Pe{1dUiyg?TT$3XO!>B>0rs`!vopCeedeA>pP
z<9tFHCVI!NbL|!RdE7Wt#h1>t%A9sPy4<<OGl0vu(7b!M*QS}+5Na|ye<UX|tOLtb
zc9MI_#k^#*V^`O$BevHEJDj&t4bP`rGi>w+d)bh##48XMy0mKbY6=AX&!-N>!dW9n
z3rF-)HaeH{SdaEbZ|Xb0Ijx_qFXkNL@`Uyp5y&f@8}VH*TXK&^td%5mm%fCTuQxxo
zE`yzZhPCtS?_J}zo3K;e`eHS}{e=4uW32B7Gj!kN^jWgeC&#H!Xzx8H|13%Q34{_A
zYQ90?P@mvtDKYPP1K&|yO!@;nzuH6?_{7qgkg!2R!h4SfzPjJbZVO?A_TLBg!4OCm
zHNkz9P<{OmjcgSa9y70GuEb9@$voHanhqBcuLd6<NsIc;Uiz=oN}JLX%dXf`pqR5A
z5<h$>O<82r^>5y+cO+wNCig3Vg=Ln=O$e~0^<@8jw;qIz&IQCZYQi(E*6)c&Wm&DO
z%v4mU$X&r491N>(&3y=tR7e%QB|weY7pP$j5b`0LX<W3j964#u3Gv!(ueNs@l`X)I
zls$_HC0H=13C8$3*Kd-LGQcql8T&o)xWd_g62p;ua29!Wy18?m=tCY+U-?;*)-leb
z#syu!HrKr@<YBbjA@#V^b*e-v)yt_?;JPTgbMHtDQSuy=OdhYhYt-;N5w>sqMf0JP
zv^SNia_by8{ie-Fk9wgH2gozG=}YeL#SLz>H8O&InbYpyH3ldmRSB(d+_V+fY>Ma0
zQo$B{7Sx9@Gs;7q)JvrWi*jv0aJu8vuN8?Uz;HX;-O4T)<<x3D*Itft+Jiv71v%95
z4%w;LZ0icwFDc^We;?FjBMH(zHPmQetgaGr!a|?8-@LIMyCtS;vrc?pt|NlZtk)hf
z&N<J`FT!#fz)1Pf1UT*}Y_N9CF1O9$ibq5nDOEh7XLdcXao;n?G+U9OJp!CXxuF{$
zz1?LLSAD+3*d)dmvAg+4R{OtIxZ{Gc?Z@C?lTUoc5>G{P=MMQyea*&_d9LGA^3i=#
zg8U?`m+COJs*UB+;*g{F!t@del_hg>sA;X-Mus)TV53LY+QQ5gGHf6fsj8s&QEgpJ
zsJrV7nonDM!v3XJQILG<xwO?6;9%CZ8G>Kd4;p{p0^##b3gcgJC7`GH6s^=w`f?8T
zgb#IK<BT=tbDkQ|@4BOYC`(zRlogMoogXwd#~-vz1<!GnSCyj@e>MEp8`;cIeApf#
zvc_MM+bHRkr?_;V@vGIkufAm{fyPHl;)dS$Dw-i`wNY9a#0*=IcF_(1{Bf(Nt$jnh
z412nJPMf%EY&j)6&6KCV6@rxaYUa?oj_4!J`uU6ejveNtUmHjJ8&HmV({S}d&ID^;
zLV^Sw6CHHE#47_%*klU<$rro8)QA>OYRx7~PC?#(TmTFG(uM6kTl8578FYsrAEN;~
zQ`!_n)xHOv$#E6RzI@X8FMQ!X5vanTNlt`gS8~?tSi|k2z{uH{w9Bh7tjC0lK^1Z)
zI#gg|Ly&!)CCo!GhZI^j6zF?*ftV4qjV9sboezRq_?_d2@{1VULYFSg)ph#&r-^$7
zpFeCk1<3%3%yD;_b1}G)^jaSTuTO5?2Dskaby@8v<ZYSpw?*FfhK$ae<j6CY@|n}=
zBuU-gjm-7WKvEKN+Zh?09y<4mtx5_h*hP`P*`+S}5FD;kl_``#HFjzVh~aMid@!R^
z?7q~mM@YOh?f+xO5*<V9joXpoeTW(RU+s_U#O~W)q>KNhJ-B;OQ!G*hju_V2L_QUB
zIFj!9mR<JD!*{0Kk<w<9K-^xEo4CW0i5v7VPUOA~H_#_^GL_&J!tX>{XW<56HGCt2
zZlTPcn7b=pJ7=p`VNw5_(4vxI6?HkcWnd>(zXRR!7i|*cCp&SSTYQ>>ZS(m2Ex6pv
zCSRr7`!Df|LXGKcA`d-xqwvTLyx9G9AuUpNL&anyK{91Dfe1ICZmq+gRK4o1BpkN4
z7%Qv(-b#rx2fs0G^%<Lch(}eO{G0$%#{dp-XUttlkevE~+WYx@H(!uhhng#SYzGfo
zMz-XMJIR7<8?no_QHLk$<+`<xs57}3?B(GtGd>AAvW8hTVR3jOZHaL3F96OcK?Ljj
z*$uA~+pY;+Yk&_O9MoA|2N!HWII>AqnM28qOjePMk<+xLAfr1`{zfYvRqGJYE=v|0
zeuy@ca2Vvloea?u`oK{~B;zdx5#$o}rEsU@pY!6)Er%I|_~9WaWHScZ2J-kISxo1T
ztyDBh*`@WDT;u-R1wVRlCuNGXB9w~#_Cq!aZ4HI_d&tLX%G-yRx|#N^u9sXG>gJ}@
z(4U-Pb#pQJwj2JU75Lq56AlN!F6lfB9L+PLi3&{d*mc;SmduTDvJ%{%{JYvvIEvi-
zYd`~0uT*Dk(LiV?UwexPm(2)Wl3e3TZ29J@qHa9-AdN&(=s#^kMd6n(fI2cnx78ok
zBuriABlz(#=nwAt9lPO0F9k6+EAUu%_F|RE5nCseiB+j`8vXn$+*H-lgfgXq;|@4%
z6}r)_7RmuP3mN|)awy++$p@kE^3pq|qKEx#N`MfQnRcW}mToWfPgC5g{`39D^5@D0
z6CBMRI$(!tseON_F{oc=13Bs^%L3En%o=Zlf!*+$mxA4@azmXq5pRaP-s5vNjdx5`
zCj_NV`6`dAR2WV=4f%L~)a{@BXjFwOSb1!Adwxb4$-A$b!CQ&_G`Lhf)e?frPosnj
zG#JpGg=7IV{ag*CA}7Sl^dH`%I;gOpTBB*=BEQTs_q+|J(UK_^l9v;wa^bt}`)Boh
zP4lha_%U;OD5lG}PhM=;Pi6BC3e+T={Tm#(k<IU6l$L*0c<<3S;9itiK)*ve)BK#r
z*tO>di)qe-dYUKlzYHnP8Qnu`#${8FiNufXfhC+T-hJ!8&vsy@m;^gZPYS=0In3|@
zihiobMy-KH4JnrHj>_K;|JzuS`IK@qTZHsB7+ymOlt>^NajD;!R0C>HGlQ;EX;QQK
zO#OGK!J1Z3T$4+_-O(v2S>2N58Cy<TekTQ@zZlClTD_m+f|LoJ@%K%FZ6|Y+<3DAA
zRb-s*4?stqs%eUFI)#u*e4jy^$TzyHW)new`sESW)%x$xV(pCOm(;e5%}2;lg|sPu
z+^U(b0Kw!9GjrZF=_2WGS-kQIaAE+!DbS3+#h$P+(|;-H3`F>my&PbAo)A{*BX)<-
zuePNi$~t7n^|bnM*(t95=A7`v7T1S1Rh4W0zwYX1TSt8g!K<$*GdyJh1(V~lg(USr
z`FWR)-l~@`2Bnp20wNqvNs0V3$6Y`ZeRIRee57vShQFb+-(Ej=%ex(^HMMVX47ER`
z#^NHwmOKX>9mWrv%4mHPd2U>?|04nls<V)QA4MVboRH_nl5<FLi`Scw<;&gF!T2wZ
zZLhM|t#ghMZ5mq=G9pb>tE|7^;_AB%ov*8#N@PY7G=&xQ?-TBXp1LJQ)z8;Ji0rW-
zrp2}ckH@-8j6|oh$7|rIhyJ6OhN**=$+$~yJ{g(KC5MQ)xXLT-L_K=Hit<wwc{8J6
z?<GuYGJjFL?F8hxBG_AMQTt<n%HA?PlgNcn?z|wk8qj6z&l1!qOJ!%p+h2@uZZ;p<
z(Xu)kz%`_(|29hI)?^ynMyEZHd6+Y!T&Lpz?WB*R@afw>ym#@Ra|$0X>m7VGo$(y9
z0=@Z9Zx^A_9%bNU4+l3E(D<_EE;hJJqC}0f%Dc4@Ym(SD5}K0j3fsL{G|#IFb^5Tp
zJK(4;K^&nwXSrz=tZhmiRweI<_#=zX6m(Mpu;O!#JoaQC8fysHXAVv*t;MI4{ZtL-
zcl%LnCAhqwZZ2=N&w?RiFe+G|avwY)SEAYD^XMQ)2I!|ZtYw)f|G4pG<)@E{|3ifW
z@LR7MnNR8esODR>TbczOu!K6(FU-T#60v0;uPG>>(E&+)Je_;sk;!MzLIx*c9%br4
zqs+U0N@0b{=@Go%uc(*{<?b_{Qf{Igf3E_|(P)!XN%p5q5AV~RI&J|SpEaO$!PfgS
z(J*B70Q2v6Q8ItzbrytBg-7bNVbmo=F{up2h<22~)RToCc;S`z3KwMxR^<9QLS_{0
zU4+32mCLQYS0zYd3iW?npq{%w&X^(b)3PUMhC#&z;(k0~+D}jn^{fOxF>0jP%6N|l
z<%{dMybvV6>_<{way$uFgdbJF$SfUgFCPZ4g@Yf*(Qe9%xvtgTw^FTgAml;<J^@S|
z@F|(=(=8(~!5}qtS~ch?Atit6NssD&9#lGfzG!w6<;ThFWZgRu>y20TjUx3edz;9N
zfzJ6_Wz{5UbTI46#WA;nuggAr`e{g*&BuK*_wh;GV@o>&Jg@bw-0m4$xhphZonN!1
zeS>Gc?M36?169uW6}>(;Uzz@L;5poD&3oR@8Tzt0wC5mOQmbw-KxoF~z)pQ<?gRKV
zSqXHx;fOol4DmspOE+=L%I_%5cLQjLv@qDT%Qtenb-3u{7$8I&+cI;yz~-G-wi?uL
zP-j>eRW|7T8aRY5mRmWo&J4m63yY5dI&3YrO5zosOecqedSdKGgb>1$hp9+2U-hUb
zNH&_Q)MD|ibHJ1HPeU{KrPf18W{?-<=}+H)v8|8Ce&<Df8@GvtDTkL?h=Nb*&hG$|
zL)?vjM1KfGF9T=&4)_gZACoNWfzz3XU)+&sKlOK}v>JfRAgu^e5eSuPBrQ0hUEbQr
zC=ib2+v*hq=B^3P^$iuT_-gG4jKM(M0sY=`YT)VJbFd4}i&!_i`Xz6|+M)<t5!cE3
zbu2b6E*)9rKQrmk=&86tUk|?<0`0$HvTry>kdWFNVGsc{<DUy7TqgS8va18ys0zda
z-IC>hrDll77mA$c&J;=PrSY|A{avPcDc7Azsm~tJl+VFbe^d2}Wgey9y8T2X0T2;=
zw#Yb-#`vQayfShPgNE-22e0f7;CuY>%6{8dMf8N+Lz7AVeM>(iF`MTgPo=2cP+)VV
zcXHQy!%~8HB_=NNeY4pdP#xHb$#b_!_!Np+=m{q6q^#aYbGCVQC5xzUy)^ZWQ0?`;
zeH#_0GS<C2u(?GTOgr+24ruqw3V>COkK&_87$MQKfJaD&WV>aVFi`g=NU5ZS11G0u
z^xHBgNjIOyM*FvoNn#m{mZw5~oPKq<deZ^aO`ct0#=9siy*~r3pT%x>0Ww@f?%k@#
zcQP$@2qPB{ck3#{mi$QJah8lyl7H22jiAR#EZB|+^~rWblzS<0<l~IQ4T-j`RQslt
zbC9djQ-E~v_PJHPDz<UAYJ4HPMb-D==+q9zzooawGpS`ab-g`#_dA!sOgFylp4n`w
z?T>fEq32t&6ifIaTo|S0_i7oZVZkIPa6Qm@!!ISaj%gwq@A${`?pLX^-p_a$74)G5
zU=FrL?+a_-T9j_F2faS~?)x5VqTg{I1nV}=w|CL*lC0i?VZfW>mydGMyHETpA=VPS
z=fIH+2;?K5$b0oB<u>{m8O105UdacU-4xjP7GVtkDFb6|KU<^_4nHhf7q$HHmK7pw
zHin?Ssr+gnD#*xpO)G(f<~2#Kci@=Wbg8q6v-1#Ml^pw+f${W}b@jEWsxzubgUc)O
zsF;NMW!f~S&F)65SV<tQ>T9OUuhlf|O21{<W;qo=vmG;^kJ53TG^hUI^HxRsyXc*~
zE@eQ8xn{Hc))C8zZTn1`y#enYx|}KSZTHg+J)hCz9yR#9B?yBWyEAoIz1)=sxFrXt
zlRVojiMdLSQh3-VyfE-=z&aV+enTa1%yF7Mj9WYzPy{>z^+}Mq1kkNC`Ri65>w}0h
zwi8P90&16U%%s-Oa2BM01;Kh3)Yx0_XQ+RAOE>xSeQfTxh+gc^#epY=)7CWS4uwc{
zFoN|@<MT`=b*YMIRt%NJ;q1Ho0q!tlcLBmfJ#`Xw%u#?qTHbt9gn++u%nsKnQxD7{
z?)h29DNwo&!wf9g9gJ+~nyGIN7R&nQ!;>KaZA+jK>aY=WDg`}Tx5sbX(qVe)19T-J
z%aNl!P9Zs{tqj~0uuA2KP`^sA=_d1GT1$L*gp7?!`Z42s6yuy~x}Kj3l;lI8k@ZFT
zawugJlD5d!vb?kJQZ6zdPyQ--0+MJB!ZUS*Aeul_A|tO#EsOV_>9RA!{o$NO?M6eV
zQGe(YDaUu;eX|v3+tZG8cP{x9ikt{A`tL5L|GoFwer>KGp*v*O!T-aRGOTr|xB7&;
zbIv<VyBZo?s?naHFu@XL*mxLq{L#SRjsqD@vAogNk>YW+T(iw!r$!3wQ*^!cK%ugW
z;@<8UUm}D!MP~#lg@XW3eMpmO*O5naVP!GHN01o%fAxG+7g9N~zXsRWIducQ?z6Kx
z_5wK+KH~|Fc8@u(uUvxgL@y@@9Z)~J0Ro``?bYYn_lR0ZC^?VS8vZlZ*XeL)z6jjY
z5d%fZ(Q_XV!?PViy`zM$r@Be36$q4d*vZjb?X^WAQCQq1eegl`KA?N{Pq!Y7XZmQ$
z{KU9kyaH}P0B<OcF!R}P-|yU3?yeV(<G6u#oJ^G*UuyR~h{M6RAEbo)tj03c9fq4|
zsxadT10#|#m;%;qQrvT7uGz#))tB23k0%L9jQFNVI|!IfG|bS9ICFW?K9gF!uqzxD
zNj3HFUsKRoToIHf<m^;|fs9@c;@(&`*mBfR*gRRe9-nOC^siZzpBfQNl@YkYi*bFd
z^`Yf~+1C%y_a)@i8yDXn{%#j{?Si-Jw7dB2*1Abtzq!~>^vhuli}X3r-2pqxY(CI}
zxxci?-3u;l1)6^jCN%zP$9vbSYrY+@ri#Hl)N<Jl#LkB1m;q<5LE7})tu@tA=fHb}
zlnGrgma6=IBnSy`*jI8%L+O-(4}=6?p_*c2kB#pM7}*F%REvLAuZwlhJP(ZuiGiZo
zFvN>P#_QBk2>OVvLr*lt729@AHwn_T$^~2q(3DdeVq>kIfwZwyx;L1z`+oZ7A6%m@
zU3Rs}YF5?zqx@8rWZnbz3U1t@z6Giwmhftqs*wMusqYSJGU@uxuIsv%M^-_xfb6cJ
zDH01!5O77sP&KFsAw;Q43m`4Dpgt^01T={RLX#5Qh=70)YCse)gd#0;BGQBap-M~0
zJ9m7(>-z40Gjry&IrBSbGBf`n=WxcJo~i<8*$Q^1TuIrDUD4-P;XK<u9^e71yp1fN
zid=c-{uhqRKtqP2L}x$nBs5MACx71l@hfDlgA6@66PJaD7e1Cdj#wvNSu>F~l>2^E
zXNVKG2Q$SE;hjNgM~{%sYoy%CpDy?{Vn0YpAU0svGnZYd1-0<x12_LrGfJ|ieO#3*
znsN$=<E@jpVz9Ar_SRTPa#p=+^>y%Q1-M%3bKgGY%!f}D)-yt{Cp*qmIqjM`)SsRC
zO{s$q<XO(RySH^7d$T_wA#Gx=LHR*R&f-C+ANU-)Ue~gR`7Bp@`U`E$zU93*vw~?Q
zaaur?XYuR1Bv5IXTt(!{`#^$Q6*Q{RM)o=OCk&}a{SJf53O|nd0y+^r?=rk4x<f7u
zS=y1@{q_+M2&0PefTvWC*H)|ycA(?gO^!Q9e?L21DP+D)F8@})ZyayI!Fq7dwuqY&
z<O2PH5PZKUU6!=~8o#ckTVywK{BuGZO8RTN!$!2yLUw=c{P>Xy#m$T-@Pn6pD*uXI
zK0<){0GD%#0kxE!N||g!hXfU1CGK|_v#goA^8IyA(Mpa!a!j40ROpR9@SP`WW=ps&
zjLk|n3uH>aGM<^dLXa2DfVhf8RL?Rz{sp0Hb)>p!^Ia-GHtSD;RLJ*ypG0+-%7_04
zoB^H3<_nSJwoS!_Y&|uXP2u%UZ~_u*R2_;tk&aw?Ee8<O`#5pohV*f8iOALHiPgGZ
zft$`W?6V($#SkA6Q*g8ne$C&~**;s3w!#s21ktz8j4@+E1#KUd+Hy`FBBJbCjR$A0
zr{Rtk?fo!M1XU-6>40f)<^np)DiqHQUW=3K^;eh^=MEx%haX0>iIpzgr{~okpO@PB
z{dP2tuUYk%Ol?n8*eC7DS=`=V9;SaZ`K!M$nK}8>!}BL)jD4M4$2>-rUr|%H5q`oA
zp7ZNABPahE^<kDVHN}&9){@GCPk7z%`Be3)r3yfb%iC_~*x({56iTnI{p*GI3r3jp
zyht4DR!x6Gcz93Br4QKZ`Ed-*84~ZyWBH52qaw?ji?;kX*;$=53aQX$iY!H?qV^LO
zM{rGo>Aw#o@>XZM?zwq3_!`b0LzvqLo8!d2!rA=Q{*Cd594*C}guIC!--#sHfQjDH
zFJ4IMpCGF5yA1S3xF3KtPwdL`G8p`LOhFgHAYw(6chpk_wYX5Bn0txrB(pM-w?Hai
z?Rv1^T>a^{;MkMcUnBZ;4hH|sd?yzSnZQv4_<vQLwP&}Vr`wqvhN>!C>86j&DLPs>
z)gTTvSSmVA!G%}4C6PMP1t0z>pgcm*C@9xQ*oNoEkcc_~k7O-aYxA!?X?eNDO)LxZ
zauQ|vE5_X14K?;?f^PP*<I9P##gQ9mlqG`Ks?aLx4KzsHz;?tA2ghn6y57%0R8C$Q
zb{e!HX=xV0k)FOjSAFoq+c;6pNowK#A14x)hQv;qSi^jT-OF@AD`r%Y3~o)?2<i%O
zEKPN6Ns={$efg&^UD?}|lMX?&la~W+b?{<xbxOCbMR{ilcbSHX(Wy^B$s&E5`hAzV
zt)3|{!>nENa%N)(|E0J5!%B6G!&t{NSv9bR9C?Xarny5ql?8-C8kI!u%N1u9dTi!j
z_xb3vSN_+ExlQF9JgN7&0h5g1tu?4Lb0v>|ccj9<dgZ5xYc{(9JOF=e=)*&X-wa6A
zK;{-@!HcuG&3esWgB&OKBgt41!?P^7daXaF!`40N>6gu2bLY(H9dM)@qv)Dl_wxpX
zn6DilQnd&6l->Io3W*1DnCi&`A(d_&^jt+{#yxF>x-uQKZ`6$o&05PqE{y$mKbyy`
zYRD<!HlaFPRyXcX;K^#)OXr|Y?$iLxkpr9Sv1hk^x%vMq>L%0n1R96!RJ`ZH@W;US
zNFC2cYnT@a7mSBa@=7KXbcZH%JEk;{;Mi(P*S#4xy=cDPLXRIli~q})n3VC8MCI4x
zfV=L}YYptG<+D<g6(-y?E&kg{wLMZt<5Byun>_(`)@3VfH+!-T>Aj%i_X4vw9q`^M
zt%L8E^&gk6SmnbGJQ@2TVi7f-y`IY?WnnMoiEf9@8{hxUr0~k#tz^EwwZ_>C{0#O|
zYMgD{N~$DsFc)Wmv|32CyM;+R*Q@BhDOa@7Jv;3XDjZP+?@ek{)y-ilR)RG1F)o=E
zgh0(9v&FN$1Kk00{E+h_|C>v9PAx%eR{gXC!^7%4yY6oRlH2dwHKP!)b;R)yqTJNW
zqbkNqU%o?B!Jj92`S#yeltufc><$Z)@~qUrj}9D-(7qX!T602$x&;QStgX9=K@*)h
zGYa0<u9gifWDg$6SIxJHKf_v?FI0^;d+UB1JF9QsY<0%;;Cs<ww@Rn^vAAq&px@5q
zJiX(WLq!c|hw51?FkA-kLgw55&Cr#;%m}RYRaHzMCD~&L?S<`IcRu4i7=NlBr^zyF
zwxOws^O+xbJ>R)@N2{ts6fB#+atsq)(r1PQZ!Dr%tSH^oSqt1g*oRxYe)wic7v~c*
zpp8y?$2e<4NbK`+_^2Jtp(K0eO|)z2G6MzkuQ7oZF9Lp9@h{aGF2ZqBE;?&P^Fv?G
za}3w&?KkaU3IF1K+g^nI7LPpgAAJB-A_^)Nw-)ARn6%??SG8SVdk_MWWsu)T9o+LA
zwbwG9ga}JyEMP;Q?(OCa^5PtF)Ipc-Lo+}320Wl6`_z%hvy9?w3d!69`>8>WN~d&o
z7Af)NeYCDUaB4LOs-y*K7Ck?=?NME}(|otIIt>Kh19^+-4XTF9un_Mnkz{8-Q1yom
ze7d_+nK^$!+jQZz_*oc>GuCVu5NYR{crMUj*Osysy&NOk&pm1P0%<^S`QRhuQ^T%X
zZ%gf-6dWu!2mQV7q9Ucgh0Ot{Q7!Q_L7|lU|MmvTIH4M?r1zZ=zQo`3fR!fdf+&3V
z`7&M&8uI*^rC)A$ujiJLXtwSs?Ni+!RpTrx?~-U8*RbL(^3}itc^m)v<x8GgCX}Ph
zU9P;*<n-+{eu$!HP8!9Y+njn<VtiJo+yZ8wW4_xV=L#Bn*{$+Vd1bR&=Qbx%y>P7M
zU_+v1_1*R~%$Zoeew}a&Mj2-H_HhQ#d(GjHz;D}Y`b)(i8q$-qmFRGW^PusKq9?`)
z+Wzz11dYKAHcm8a{i--yzIi#-ZD^@ZCSYcB<VF%4)1GZ3Hc}mfYckCBO{p3PHNWur
zOq?2a^F_piVk65hn#t~fV{g+EhvD0~6=tU^gjv{m{UKqHt~u$Hoq#c6MM#~kg<=k}
zkLFA2{O&snHp)*k80@d6mt+nQ@u?djpZ-;W-l?kG8Y#WIMFg70pUxQ}bSzqE78}qO
z(392671)&WiNG8<2fI0+Z+Iy9NYwZvOYQ#TE>TL^b&~Um<u{Xs$qRyz17*1moByMx
z2&gq~i?d#&oURzKy<245{d|IqpaEsRi+|@>He~!lJ8_ANtMC=izn&olJQi5eU2IUY
zR+~p)M>XqfpGZ`<TP4~1cY{?wO+;~%I(KIsQD-fKo!#N|jUU=sV74)k%=8g=bX9VF
zNm=qj1I2qLn9yPS_ZSAy%+|QCe*^&+PPwXcX9*%<+3c~Z$eyp8lr_KkN|P?Xu1nM;
zh#Giv6Ls+g1ne<Y4$42hCN+lcUHDiX1oViM!r$xfdJc`IVnRRX?`-Uz)LU+oHB6q(
z_=XFc$m#GyqhCIqURS^jIjwOF{f5|eEA(_hL-YNuGCgrx{M_<?vLSDJyKRT^(-x7X
z^<rLpug*~a5mz;`Kx1u6<7n^tm4RsEO6Tr$0=6(xcG@oK&Q9eW;3;ERNEWzqdO+-_
znLk-!R=?QzJz=5UjM*`|Nxp%uD71Nes9`z2`Wba(>Rg#HRfEJAYvCCj)Re<(p5d3+
zW^&W7tK||pf#-++d#&_Va^=*G$szxIlmch<Bh#c@?9|20=S<$sub!W2rB(|^CJl(}
z<0U)f8kPw;^Lq!C-)>nPzzjPjj;j42b9wl`e-8q7EE_$lQms)|`Hw}xyghN2!V}`<
z`=6UGhlpaTh4_2%s#wdskm1c&t>c>hTC2<c;@i^}<lOtE0l0!Ei~8aJ0ixxld)NMv
z$|Di26W9BPQzJiUy~rKm)>Vx5q}DMAga`UG<+Hu-^Y4GZz#0%r0W18Zn(X~*mQYT6
zrGZBKc4bjM<#Q^K2)E!PN@N6UH4~d8n0{Ysw37Cw&(A!G)cZJZVsKoQgV>x)Gw2g{
zK{XDYT|1Nqo=h-D`)rxg*gdaAN~<D4sK2dy-*A3WDfw1m(*yZ)vm5Qs!Z8I=c{Lan
z2J^V3awmV*(5Bfcsdr3Sgh~;<z_Y&+6^@J_7Ha#5^$3Bq&H#;WH0wjC(A9N-u;7tO
z>($BYKHw`aDM9tiSo9E=_nSGp?^K$v_xa29vfUUkUy`kbu}?}}m|+7E5w4RLtIDJ1
zJ#jAQ-G|2X$^^kbdkk%v+UyQ)m&D6u7YcdO;r#w0pQnw5y9dG+a+O=hkzac&THaL)
zpdJJN)NaSkY?8aqAyLFgcK@-F5Iq8wi!Q+%#11T|x1OJG8hqvjp_2$Im`d)5D)t~w
z)K2E9AQXw!v~PGNNN*@!qGGW;XE|OfMUcO9tW1E+Tw9U9p9j4{2K#bshjL}Xa=fX(
zR%}jo6R0^z%_1-UeZ6^2>a5lyoZ~yoRO$I&eG)YoWBf~`O12<!!}6vl`5lsM%SWR6
z_6RrRuD_vofGPusQ<0~ae$m;*3tsTBM*-LuusX*25XbhbFe4GQ#jZwJ*ZDaIa^W<I
z(pdzzA@GniIJIph9b-39ElmF*Mh+!ixh5!Awz{ITuc^MEQ#<CCNupodC^mdTU_s7<
zW_3nT*qatDsIpRe6QJm)oJYzzC8ixpN%u{A=tx<!b#-$3#7~vBZ4#d5OauT9{=>wm
zt?3$7Z_{s1II2q96_#@8T4<P1mw!f*B$V0$Lc2yF%V<Y!ZMs}Q(jF|m+kS#@s_ldi
zYk9QyoMO=)JJ)M6xZh1xIn_dhWUYeP(}6)}Te6S;QIOJ(IU6k*cwhi4n(G#pL2fp8
zsAP)vcAI5Of8Jytii0%w#D@P=mX*!=y487vc@Sr^zk0Q`<3z%_ph7oyylZ@x{K&Gl
z*T8Dm2t7a-S`J}eFQMNmvhO8%mG^I#CvLtWp&F67#bI^Pw9>d9r+I5>^#pjy_})6B
zn38Xh5lYM2#UCCC43YryHW3A<NBAB%5*k>wd^2|p&Y1af{J!xa&PP2n(u}%vYof{#
z2eo4S5>bK0+yxDnf1`xF4cNC?uZYs8<ZLt5O@v>&a&QQ!Sj)U40E04dk>%XcRCRX8
zn}xfsbuve%^jBw#@YZJzuLpC+7SQ9)>x149rHbo$>)wN5BpY?!EsPS9;rv|q=tAR>
z<*g)mk_8EltSFXI+ASBC{sCULuo0mW9VP482A$)d`=`-=ODnE<vE34_gj8Kt!!XVK
z=#>oWPPjG3wSM&04kdO#+b=p!^nf_w8pQOROWuj(CGNysO45m!@oHpvajGJc=8_1n
zUVT45le76{5}yR0EdT!X1Ihx`VZSDQfKh&h<ajJ$V0A_Br0??GXpmF_hL`$kk?nzL
z8n5(LeK|zJv81n!*^bWrw|KE(b533M@FcJ2a5UO&@=#*5<CHqmFQI0sCj-1{4*OE#
zbzNste^r|hsC%X1B9C2|D{$-W?Jm`^bXw%|cb&CpSox<!T{_`q_Bq{pFH6uR0uz*3
zi!7}Aq#JF7yX3R&lyR}VHBJ=LJ1of1c^~Ar^|qwZG3FXlDm9hK@V`ka;bu`T%19mO
zUh04o<{yoq?SylaMfmO)y*jgxRH7@Mnp?>>tcF2B_%^k%U+9E;LyX!NS5%ZWv67==
zaV}nsFrOxY6R^3G#{SKpA;NU7ja%OY*C)6;ckzIBxa<hKkP;lwgu6{xUFxk2aMo(v
za2zO|$HXASRA|M9)mTuv#m|!PbAzsnsKz(kT>oU!r?J3Ps+xPQYeSz+I~vD+0kGk}
zvvGFnJpAlQutvio230GBb?W7oqyTEQ`an%vVEmFn=(<NLyg0tM#_Ffp^CzOAbrDwa
zuA>$yDErwYY&hrBm|mkPgXqV`%Hds+f)8NTnIzek>`*#dj`b}IUBUYtfNGC5Ei-iQ
z_6<lCxy}Iv#gA23=4$@W;rq9zO{@U_b~U@E0mX`*s6qi^?)6N?`qr2H1BSEnN;X_n
zYq^GL|L4j#hy*)rgC)@!F!eU;lbqJ>N4*Eh1Z=tvWS~`1maYA?CO0>|*g*fff;v*+
zo5>cE5-`Ea_^^qBfqt5@zt)my?<JpvTPUib_`wf7u_zUr4;2i;v@A~)`KTE_F{)=}
z!V5%P^B$6^OdTof{txc$U;N4XR=$zd;%1^J+)D|PEyz-LZ?tJwB~?C<N;61OHqZEQ
zQKqg_Lp3g3f;V7qt(`w1!fnpu*M!o$t&#DXx=1hnaK~baX}3~$8un*7g-enJq2kot
z;jERp$+b$QBBHE&$b!))s^VEwQrcPSXzn>-)gpezm&AIe6T5Mo$`SlUXj>fNq=~;&
z8RxII0oh^GpTU*A?5;s&qkKm;*~32$<VY@)F%yHmv+4&wh~hb8BaNmK3<itP)1m>p
zK}^Jh)YmIt?nwxd(>|((;l6mTzT;@f_c<^Jvj{CwEOCZPtoD?|A_vZcpxcdy94+1@
zzPy-p-DEdFzCx*?kaspJyl;J3NOOIBT`P_^$3KCULrk``Yajz{_8@7_B$cNF61!;J
zb7%U0+L&v7Wv8xyV+q$3Bv===D}9&#13)`uVzINSB%Zt*!PWV^^4oG9=@B9P(zQzd
zzmnaGlP|%7<uz5dn?l@|P1?et(p}OYpT_VVkloz8rpt4c?6HLp9AMNft`LNV?P373
z+FgM!cj?D5-<gp*)%K!Y<;$b00}U)m+s{#J-o_ht+=HU<$<jy1li^9sbyF9B%xR>;
z;ySjj0HeKGF7!7fG>mX)St?m_|DCzOzLKgiQXl6Q>cp$&1%+FWD-zR04J+f2&))Xl
zW&;9?aJsU&JCUAM^?lp&@#|3<_FD3)pj8-lkMmtALp@vv-JFe_+S%H7APta;QRplE
z;ewCl{D!lbgAW!Kz6IT^A94sSdog9wn@QX<NX{AuYr$``)jlKjuXOFBf3*K(mf_tV
zvf7JJqS-L+A($5ugVb!|;l<->&E-~?sEy4_DR6UA-stGRsfVx0M8zm_#A^!4t`c!C
zJAd0g{eifZVqbmRUuJFJ))%8X#AB`du8^FH#<>5^Qti|Yv+byo5c1f(@W(i4Hx~xI
zY9WP(BCSUUK74h~eyXt5wAqH_x6S@G9x&4H$M-C8V*{MgW>0`b8w*12C*=LGof{Z(
zATp<9ZVJPkb`Cu=6qpCU=hjjV@0VAr3X`!t5*{$5gzTWtke1|+(nm)f!qF*5Gb_XE
zV-9PFAM}?PR4!s+UE#F6th`E?@&)nbxw^)iY1Ic}c){oV@%U{e@xQx!8lN%*BOk7Q
zG~YMc_GiEXWEi<j;5Ywxmqm65qm@Buac~FOG%VuLeM%(RQ#@6)h<8iGh>yD2hb2Be
z3>Ng#`Qw!G)kVSaAA`~|5y?vsdn~Ine7C-E_ZQ)>_LbSGQ#m*q^)*KV%bvYRS3ar5
z+nlZhB|SHfk*zg{+npsKYfi=@&&TFGV`l7Ck~MM67j)#cn97&|4q!?bhDSA7qFy|@
zX!g9S4XzH=7+hus2#+ls!bn1_73!bVnm^a9(^7z@k;O5xHEqX1&{qpz7p=q_wL(j9
z#NaiZvPjlW#T_azV@8&G_z#wDlW3s8_gK<UJhCAky@m{<*i!kH{B^N=48*;15@MeO
zwPc$&uw%bn_$fhat0WeUy!0+~q;943dBsY_szhf5m0o)<k+KxPy_3#id+3yR#UOEZ
zd?G6U!m4jL!VB0m!d8PyBTFm-<r5?EhLn7RL3IU<;D&+Q=nA0?o-a^m?_KIURFD-m
zts%2v<3q%>AKFf@_fLe>A(sQ}6x+-Mlf-Jh=xQFioXi>XUHb#iAf|1y9!k9Nl$FlG
zE7<c4&6yi$&L^Nw;qJxD67C|3LGPe~ozCd$j6iwF3A8tFj?mRf7uz7_BT{SGk3IHX
zB~hbQVAD?})L`9Lbq+Fcgn*&=z@bDspM>fo>N{V&CR4|ZRvi4=`ol`4mqFyKwC6oR
zkxG<g4}V@NSot~uk@pI9A9()*`A5{UAFO?!nDAr>no#Z)n_1YurrChIQ1BntudU%?
zg;r>Vf@#0>_N`%w*6?VSdJ*LvqRMTsVrriU#H``Nd6Jtc<e0Fbgj)8+&?V4{uUC}E
z{oc%L0P%YPIi@S|no`Y3@^)L?#0?k5y{OckH5e5J5#DwO^0u0OlulwPOPbE@voE8^
zs6>DLvq6cdG`OG)E+dv~;PgBIS}N632n!zy$8g?swtqh!r>W`eu80C2Aq8j3OSXqX
z(!G7N)-5P-24kkC<ENl1(j}6xcjbpZdceaU3vEDF(i`T|R3C-Zc?f9C=c8AfM!}En
zff)d4*H6@WQD&mD#@C`Q1KKO`R5d>;B%XJ-j71RLU)!XEYimL3`@S<NLnV6Su{k?~
zI8zEWIA8%3E*DEYQMJ&bR$THZ|7~=J&huOG^v<F*m3XMd$)7<q@h&Z4E;VXyYg*xF
zbe{rXU{4%Xjpo;)E(ylhLCTjHXJCkPSKp~B+Bqg^F&{&9dJZoK*U5lUjz>y=AI~^S
zhnIZcTQ?GOsX*c;TfmHiHQWg^Xskd^d5Dmn#swM2qrbAgp7!yAJP;OT4DxRe1&wNZ
zm#Tq2fDVjeoNZ(zBz3$&b)oh?i1(gu<|fD~Zo3B*pAKsqd@1#mh?cNFQu;DOaD~mi
zvuM=3HRy?hgeIBpUHg9Z+hR42oJHA8ro0nv%;}fevC=9j<=@I(*2n@;rX=;bT`Oau
zbC=&j$u@69ns{0<f7RC81(v=3QRhV4R+1NJS@k0~klP+9tu*#JkMdq=OO&&XiGIfo
ziH8(e>D*Z`SQiTVvnTs(IqdPw@4nK1T|3uTszy&$WD~?IEyo}Qg88!Dcrvq9%nDl>
z9OdWp)yzrio~p<}TkCkvt9WJq=PDFP9W^;B$u;%CN%@2;9UACC)nfU-T_aS6l%`Z9
zRM1y-9(1pEivz;EOmh9XimJ;C1C;PYTXh8kY#<pbo#VtU2NfYo-sm05-aAD%v6${+
zI)$8PY65E2>Lpk9*6Cj!ghMUfD(_H!>lhYgg1wF;m3Ps9#$`~{+%d99KQi=l&8BK{
zjePK8Mk6ul%)zv&(w`;Defp?&`_qp%F1;8ne2XfycM&Y3wK1dhQVx}fXBy@tm1mN^
zJwS{HJ?d}Z>>G9a>hDy9z}x<Y6b6d|TfItIh&(tZNrO?G>anc*j*2#Vf;$MRu0>g<
z?Qr&Kq>N-|=gS-ze^0sE+c*B0ZY}e6e?(xRhv%smwrTyoZf<L*ktVsW7}91ika{{l
zs`fXCx>;K7cJHHz{peKYtasUT%{P?$eP8p2%N3lKxEuonT`$DP0PT~g@(^kav)&N5
W9Nu-N2|Nx2eaK4|7xOOMe)xYmUaqhJ

literal 0
HcmV?d00001

diff --git a/fluss-rust/website/static/img/logo/svg/colored_logo.svg b/fluss-rust/website/static/img/logo/svg/colored_logo.svg
new file mode 100644
index 0000000000..3b136ac448
--- /dev/null
+++ b/fluss-rust/website/static/img/logo/svg/colored_logo.svg
@@ -0,0 +1,19 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" fill="none" version="1.1" width="403.4100341796875" height="171.5" viewBox="0 0 403.4100341796875 171.5"><defs><clipPath id="master_svg0_14_8989"><rect x="180" y="54.5" width="223.41001892089844" height="91.2300033569336" rx="0"/></clipPath><linearGradient x1="0.5" y1="0" x2="0.5" y2="1" id="master_svg1_14_05037"><stop offset="0%" stop-color="#FFFFFF" stop-opacity="1"/><stop offset="33.571428060531616%" stop-color="#FFFFFF" stop-opacity="1"/><stop offset="100%" stop-color="#96A1FF" stop-opacity="1"/></linearGradient><linearGradient x1="0.5" y1="0" x2="0.5" y2="1" id="master_svg2_14_2646"><stop offset="0%" stop-color="#002CDC" stop-opacity="1"/><stop offset="100%" stop-color="#3B5FEE" stop-opacity="1"/></linearGradient></defs><g><g clip-path="url(#master_svg0_14_8989)"><g><path d="M209.625,54.5L237.465,54.5L236.20499999999998,65.225L211.38,65.225C205.695,65.225,200.91,69.455,200.20499999999998,75.08L198.72,86.96000000000001L230.07,86.96000000000001L228.79500000000002,97.685L197.43,97.685L192.42,138.26C191.895,142.51999999999998,188.28,145.715,183.99,145.715L180,145.715L188.955,72.785C190.23,62.345,199.095,54.5,209.625,54.5Z" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><path d="M235.79966546875,127.715L244.72466796875,54.5L255.92966796875,54.5L247.00466796875,127.715L235.78466796875,127.715L235.79966546875,127.715Z" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><path 
d="M294.10490234375,117.00455078125L299.36990234375,73.41455078125L310.57490234375,73.41455078125L303.94490234375,127.72955078125L279.46490234375,127.72955078125C266.00990234375,127.72955078125,259.27490234375,121.54955078124999,259.27490234375,109.20455078124999C259.27490234375,107.70455078124999,259.37990234375,106.08455078125,259.57490334375,104.32955078124999L263.38490234375,73.41455364227L274.58990234375,73.41455364227L270.79490234375,104.61455078125C270.65990234375,105.45455078124999,270.59990234375,106.62455078125001,270.59990234375,108.12455078125001C270.59990234375,111.49955078125001,271.39490234375,113.83955078125,272.98490234375,115.14455078124999C274.57490234375,116.44955078125,277.15490234375,117.09455078125,280.73990234375,117.09455078125L294.08990234375,117.00455078125L294.10490234375,117.00455078125Z" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><path d="M327.360234375,128.1196875C321.375244375,127.9846875,316.215234375,127.7296875,311.865234375,127.3396875L312.765232375,120.81468749999999C313.080234375,118.5796875,315.090234375,116.9746875,317.340234375,117.16968750000001C321.870234375,117.54468750000001,325.635234375,117.78468749999999,328.635234375,117.88968750000001L331.950234375,117.88968750000001C336.105234375,117.88968750000001,339.015234375,117.3646875,340.680234375,116.3296875C342.330234375,115.29468750000001,343.365234375,113.79468750000001,343.755234375,111.84468749999999C343.815234375,111.51468750000001,343.860234375,111.06468749999999,343.860234375,110.4796875C343.860234375,108.8596875,343.605234375,107.7796875,343.080234375,107.2546875C342.630234375,106.53468749999999,341.880234375,106.0546875,340.845234375,105.78468749999999C339.810234375,105.5296875,337.815234375,105.2296875,334.890234375,104.9146875L332.655234375,104.6296875C329.280234375,104.3746875,326.055234375,103.7896875,322.995234375,102.8746875C320.595244375,101.9596875,318.810244375,100.6546875,317.625244375,98.9296875C316.455244375,97.2046875,31
5.870244375,94.9246875,315.870244375,92.0596875C315.870244375,91.4746875,315.930244375,90.46968749999999,316.065234375,89.0446875C316.515244375,85.0846875,317.655234375,81.9796875,319.485234375,79.7296875C321.300234375,77.4796875,323.835234375,75.8746875,327.090234375,74.8996875C330.345234375,73.9246885,334.530234375,73.4296875,339.660234375,73.4296875L343.665234375,73.4296875L357.420234375,73.5346875L356.610234375,80.1346875C356.355234375,82.26468750000001,354.540234375,83.8696875,352.395234375,83.8696875L338.415234375,83.8696875C335.550234375,83.8696875,333.375234375,84.0196875,331.875234375,84.3046875C330.375234375,84.6046875,329.295234375,85.0846875,328.605234375,85.7746875C327.915234375,86.4646875,327.480234375,87.4546875,327.285234375,88.7446875C327.225234375,89.0746875,327.180234375,89.4946875,327.180234375,90.0196875C327.180234375,91.0546875,327.480234375,91.9396875,328.050234375,92.6446875C328.695234375,93.4246875,329.655234375,93.9646875,330.930234375,94.2496875C332.190234375,94.5346875,334.560234375,94.8796875,337.995234375,95.2696875C342.090234375,95.6596875,345.435234375,96.2746875,348.045234375,97.1296875C350.325234375,97.9096875,352.050234375,99.2446875,353.265234375,101.1346875C354.465234375,103.0246875,355.065234375,105.4546875,355.065234375,108.4546875C355.065234375,109.8796875,355.005234375,110.9896875,354.870234375,111.7696875C354.090234375,117.81468749999999,351.810234375,122.0596875,348.045234375,124.4896875C344.280234375,126.91968750000001,338.490234375,128.1496875,330.690234375,128.1496875L327.375234375,128.1496875L327.360234375,128.1196875Z" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><path 
d="M373.3651171875,128.1196875C367.3801271875,127.9846875,362.2201171875,127.7296875,357.8701171875,127.3396875L358.7701151875,120.81468749999999C359.0851171875,118.5796875,361.0951171875,116.9746875,363.3451171875,117.16968750000001C367.8751171875,117.54468750000001,371.6401171875,117.78468749999999,374.6401171875,117.88968750000001L377.9551171875,117.88968750000001C382.1101171875,117.88968750000001,385.0201171875,117.3646875,386.6851171875,116.3296875C388.3351171875,115.29468750000001,389.3701171875,113.79468750000001,389.7601171875,111.84468749999999C389.8201171875,111.51468750000001,389.8652171875,111.06468749999999,389.8652171875,110.4796875C389.8652171875,108.8596875,389.6102171875,107.7796875,389.0851171875,107.2546875C388.6351171875,106.53468749999999,387.8851171875,106.0546875,386.8501171875,105.78468749999999C385.8151171875,105.5296875,383.8201171875,105.2296875,380.8951171875,104.9146875L378.6601171875,104.6296875C375.2851171875,104.3746875,372.0601171875,103.7896875,369.0001171875,102.8746875C366.6001371875,101.9596875,364.8151371875,100.6546875,363.6301371875,98.9296875C362.4601371875,97.2046875,361.8751371875,94.9246875,361.8751371875,92.0596875C361.8751371875,91.4746875,361.9351371875,90.46968749999999,362.0701371875,89.0446875C362.5201371875,85.0846875,363.6601271875,81.9796875,365.4901271875,79.7296875C367.3051271875,77.4796875,369.8401171875,75.8746875,373.0951171875,74.8996875C376.3501171875,73.9246885,380.5351171875,73.4296875,385.6651171875,73.4296875L389.6701171875,73.4296875L403.4251171875,73.5346875L402.6151171875,80.1346875C402.3601171875,82.26468750000001,400.5451171875,83.8696875,398.4001171875,83.8696875L384.4201171875,83.8696875C381.5551171875,83.8696875,379.3801171875,84.0196875,377.8801171875,84.3046875C376.3801171875,84.6046875,375.3001171875,85.0846875,374.6102171875,85.7746875C373.9202171875,86.4646875,373.4852171875,87.4546875,373.2901171875,88.7446875C373.2302171875,89.0746875,373.1851171875,89.4946875,373.1851171875,90.0196875C37
3.1851171875,91.0546875,373.4851171875,91.9396875,374.0551171875,92.6446875C374.7001171875,93.4246875,375.6601171875,93.9646875,376.9351171875,94.2496875C378.1951171875,94.5346875,380.5651171875,94.8796875,384.0001171875,95.2696875C388.0951171875,95.6596875,391.4402171875,96.2746875,394.0501171875,97.1296875C396.3301171875,97.9096875,398.0551171875,99.2446875,399.2701171875,101.1346875C400.4701171875,103.0246875,401.0701171875,105.4546875,401.0701171875,108.4546875C401.0701171875,109.8796875,401.0101171875,110.9896875,400.8751171875,111.7696875C400.0951171875,117.81468749999999,397.8151171875,122.0596875,394.0501171875,124.4896875C390.2851171875,126.91968750000001,384.4951171875,128.1496875,376.6951171875,128.1496875L373.3801171875,128.1496875L373.3651171875,128.1196875Z" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g></g><g><g transform="matrix(0.653420627117157,-0.7569950819015503,0.7569950819015503,0.653420627117157,2.759073555469513,39.02634325623512)"><ellipse cx="48.59999990463257" cy="22" rx="4.599999904632568" ry="5.5" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g transform="matrix(0.7823152542114258,-0.6228827238082886,0.6228827238082886,0.7823152542114258,11.673297647153959,69.30429944698699)"><ellipse cx="109.490234375" cy="21.751171827316284" rx="4.5" ry="3.799999952316284" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><path 
d="M13.130000372772216,120.75960174560547C9.070000372772217,120.75960174560547,7.860000372772217,119.28960174560547,7.550000172772217,118.05960174560548C7.0900003727722165,116.20960174560547,8.580000372772217,114.12960174560547,11.430000372772216,112.61960174560546C21.120020372772217,107.48960174560547,34.980020372772216,97.32960174560547,42.130020372772215,85.58959974560547L42.58002037277222,84.84960174560547L43.450020372772215,84.86959834560547C44.240020372772214,84.88959504560547,44.910020372772216,85.24959574560548,45.350020372772214,85.87960174560547C46.590020372772216,87.69960174560546,45.57002037277222,91.10960174560547,42.93002037277222,98.44960174560546C41.880020372772215,101.37960174560547,40.79002037277222,104.40960174560547,40.590020372772216,105.98960174560547C39.72002037277222,112.73960174560547,33.76002037277222,116.85960174560546,20.660020372772216,119.75960174560547C17.650020372772218,120.42960174560547,15.120000372772218,120.75960174560547,13.130000372772216,120.75960174560547Z" fill="#B0B7F3" fill-opacity="1"/><path 
d="M20.984220372772217,121.22410174560547L20.985920372772217,121.22380174560547Q40.701520372772215,116.85880174560546,42.07812037277222,106.17800174560547Q42.255220372772214,104.77850174560547,44.307020372772215,99.05340174560547L44.341520372772216,98.95730174560546Q48.395620372772214,87.68567174560548,46.579720372772215,85.02071874560546Q45.461820372772216,83.42004174560547,43.48442037277222,83.36999174560547L41.748420372772216,83.33009174560547L40.84892037277222,84.80936734560547Q36.05152037277222,92.68648174560546,26.771320372772216,100.43170174560547Q19.009920372772214,106.90940174560546,10.727740372772217,111.29410174560547Q5.067750372772217,114.29290174560546,6.0954903727722165,118.42620174560547Q7.061633372772217,122.25960174560547,13.130000372772216,122.25960174560547Q16.331720372772217,122.25960174560547,20.984220372772217,121.22410174560547ZM39.10192037277221,105.80120174560547Q37.995420372772216,114.38570174560547,20.33582037277222,118.29510174560548L20.33412037277222,118.29540174560546Q16.00248037277222,119.25960174560547,13.130010372772217,119.25960174560547Q9.399350372772217,119.25960174560547,9.004520372772216,117.69300174560547Q8.545160372772216,115.84560174560546,12.132260372772217,113.94510174560547Q20.691120372772218,109.41390174560547,28.693620372772216,102.73500174560547Q38.355220372772216,94.67132174560547,43.41112037277222,86.36983174560547L43.411520372772216,86.36911174560547L43.415520372772214,86.36920174560547Q43.87032037277222,86.38072174560547,44.120220372772216,86.73848174560547Q45.054720372772216,88.11024174560546,41.518520372772215,97.94190174560546L41.48292037277222,98.04130174560547Q39.320320372772215,104.07580174560547,39.10192037277221,105.80120174560547Z" fill-rule="evenodd" fill="#000000" fill-opacity="1"/></g><g><path 
d="M105.119969140625,72.2403791809082C103.139999140625,72.2403791809082,101.100009140625,71.4603791809082,99.529999140625,70.1003791809082C98.749999140625,69.4303791809082,91.999999140625,63.180379180908204,94.110000140625,50.460379180908205L94.739999140625,46.6503791809082L96.849999140625,49.890379180908205C97.889999140625,51.500379180908205,99.769999140625,53.2203791809082,101.759999140625,55.0503791809082C104.439969140625,57.5103791809082,107.469969140625,60.3003791809082,109.539969140625,63.7203791809082C111.319969140625,66.6703791809082,110.669969140625,68.7203791809082,110.12996914062501,69.6803791809082C109.219969140625,71.2803791809082,107.359969140625,72.2403791809082,105.12996914062501,72.2403791809082L105.119969140625,72.2403791809082Z" fill="#B0B7F3" fill-opacity="1"/><path d="M105.119969140625,73.7403791809082L105.12996914062501,73.7403791809082Q109.54646914062499,73.7403791809082,111.43736914062501,70.4157791809082Q113.316269140625,67.0754791809082,110.823269140625,62.943679180908205Q108.63036914062499,59.3206791809082,102.775339140625,53.9462591809082L102.696679140625,53.873929180908206Q99.032449140625,50.5045291809082,98.106959140625,49.071809180908204L93.889965140625,42.5964291809082L92.630219140625,50.2149091809082Q91.219869140625,58.717179180908204,94.378749140625,65.4372791809082Q96.125649140625,69.1535791809082,98.547879140625,71.2341791809082Q101.441109140625,73.7403791809082,105.119969140625,73.7403791809082ZM108.822669140625,68.9449791809082Q107.801469140625,70.7403791809082,105.12996914062501,70.7403791809082L105.119969140625,70.7403791809082Q102.559789140625,70.7403791809082,100.512119140625,68.9665791809082Q98.567499140625,67.29617918090821,97.093749140625,64.1609791809082Q94.332310140625,58.2864791809082,95.589779140625,50.7058491809082L95.590029140625,50.7043291809082L95.593039140625,50.708949180908206Q96.720139140625,52.453799180908206,100.666059140625,56.0822291809082L100.744649140625,56.1544991809082Q106.285869140625,61.24077918090820
6,108.256769140625,64.4970791809082Q109.844469140625,67.12837918090821,108.822669140625,68.9449791809082Z" fill-rule="evenodd" fill="#000000" fill-opacity="1"/></g><g><path d="M35.3707,124.66C33.6507,117.22,36.0507,109.3,38.3607,101.64C39.8107,96.83,41.1907,92.28,41.3607,88.33C41.7307,79.78,43.5307,63.15,44.1807,57.33C43.2407,57.69,41.8507,58.38,39.9707,59.67C36.0907,62.35,24.2907,70.5,14.42069,70.5C13.86069,70.5,13.310690000000001,70.47,12.79069,70.42C9.810690000000001,70.13,7.450694,67.81,7.0506941,64.78C6.820694,63.01,6.9106941,56.93,17.9007,52.82C20.9907,51.68,23.8807,49.35,27.5407,46.39C30.2907,44.17,33.4107,41.65,37.390699999999995,38.98C38.7107,38.08,40.1307,37.47,41.5007,36.88C45.2807,35.25,48.5407,33.85,49.9207,26.74C52.2007,15,55.1007,8.969999999999999,66.2907,4.26C70.5707,2.46,75.7007,1.5,81.1107,1.5C88.7307,1.5,96.3207,3.4,101.4207,6.57C109.871,11.83,112.681,23.31,111.921,29.41C111.021,36.63,106.6007,42,97.6207,46.75C95.6507,54.46,93.7907,65.3,95.5607,74.59C95.7507,74.91,96.0807,75.47,96.1507,75.59C97.9007,78.21,100.3607,79.8,102.7307,81.33C105.1807,82.91,107.721,84.55,109.321,87.27C110.451,89.25,110.681,92.38,110.011,96.85L109.831,98.1L108.571,98.13C100.9007,98.32,83.5,99.5,73.8907,104.99C64.28139999999999,110.48,47.5807,117.84,37.7607,125.51L35.9007,126.96L35.3707,124.67L35.3707,124.66Z" fill="url(#master_svg1_14_05037)" fill-opacity="1"/><path 
d="M33.8708,124.827Q32.1566,117.018,36.904399999999995,101.2737L36.9246,101.2069L36.9597,101.0905Q39.7016,91.9954,39.8621,88.2655Q40.2443,79.433,42.3872,59.8978Q41.6441,60.3409,40.8194,60.9068Q24.7591,72,14.42069,72Q13.55073,72,12.647120000000001,71.9131Q6.399075,71.3051,5.5636,64.97630000000001Q5.16425,61.9031,6.9856073,58.8997Q9.80846,54.2448,17.3753,51.415Q20.2562,50.3522,26.5974,45.2237L26.6182,45.2069Q32.5295,40.4349,36.555,37.7343Q37.9788,36.7635,40.8885,35.5104L40.9074,35.5023L40.9168,35.4983Q44.3026,34.0382,45.5597,32.794799999999995Q47.6115,30.7651,48.4482,26.4542Q50.3351,16.7384,53.5217,12.0238Q57.316,6.41009,65.7088,2.8774800000000003Q72.5508,0,81.1107,0Q93.6921,0,102.2126,5.29604Q108.435,9.16913,111.523,17.1326Q114.126,23.844,113.409,29.5955Q112.038,40.5916,98.9132,47.7583Q95.0259,63.339,96.9865,74.0541L97.0869,74.2237L97.4207,74.7906Q99.0102,77.1427,103.5443,80.0698Q108.831,83.4793,110.614,86.5095Q112.565,89.9284,111.494,97.0724L111.135,99.5694L108.606,99.6296Q85.2858,100.2073,74.6348,106.292Q71.5751,108.04,63.8062,112.028Q45.295,121.529,38.684,126.692L34.969300000000004,129.588L33.8708,124.842L33.8708,124.827ZM36.8341,124.33L36.8321,124.322Q35.2071,117.293,39.7767,102.14L39.7968,102.073L39.832,101.956Q42.6826,92.5007,42.8593,88.3945Q43.2633,79.0578,45.6714,57.4965L45.9449,55.0481L43.6442,55.9292Q41.6684,56.6859,39.122,58.4332Q23.8237,69,14.42069,69Q13.69459,69,12.93427,68.9269Q9.061399999999999,68.55,8.53779,64.5837Q7.71239,58.2316,18.426099999999998,54.2249Q21.7583,52.9956,28.4839,47.5563L28.5026,47.5412Q34.3108,42.8524,38.2264,40.2257Q39.4305,39.4047,42.0751,38.2658L42.094,38.2577L42.1047,38.2531Q46.0101,36.569,47.6695,34.9276Q50.38,32.246300000000005,51.3932,27.0258Q53.1633,17.9112,56.0072,13.7037Q59.302,8.82909,66.8726,5.64252Q73.1559,3,81.1107,3Q92.8358,3,100.6288,7.84396Q105.9994,11.18706,108.726,18.2174Q111.055,24.2236,110.432,29.2246Q109.224,38.9154,96.9193,45.4241L96.3319,45.7348L96.1674,46.3787Q91.866,63.2128,94.0872,74.8707L94.1363,75.1283L9
4.5052,75.7517L94.8797,76.3877L94.9034,76.4231Q96.8282,79.3049,101.9171,82.5902Q106.6065,85.6144,108.028,88.0305Q109.444,90.5122,108.527,96.6277L108.527,96.6306Q84.4528,97.228,73.1466,103.688Q70.1454,105.402,62.4364,109.359Q43.6724,118.989,36.8374,124.328L36.8341,124.33Z" fill-rule="evenodd" fill="#000000" fill-opacity="1"/></g><g><path d="M79,82.38669999999999C71,83.38669999999999,66.00000622869,79.3869,66.00000311434,71.8868C66,64.3867,67,52.3867,72.49993,43.88664C79.3399,37.74664,96.5299,41.226865,95.9999,44.38687C93,49.88672,91.21039999999999,63.414100000000005,90,71.8867C89.5,75.38669999999999,87,81.38669999999999,79,82.38669999999999Z" fill="#FFFFFF" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><path d="M92.40000255126954,33.64025049560547C94.50000255126953,31.04025049560547,97.00000255126953,29.24025049560547,97.10000255126953,27.840250495605467C97.20000255126953,26.44025049560547,92.40000255126954,24.340251495605468,90.50000255126953,24.64025119560547C88.60000255126953,24.94025049560547,84.19999255126953,27.840250495605467,84.30000255126953,29.44025049560547C84.40001255126953,31.04025049560547,88.00000255126953,32.54025049560547,89.80000255126953,33.84025049560547C89.60000255126953,35.64022049560547,86.65000255126954,37.41022049560547,84.39000255126953,37.41022049560547C81.37000255126954,37.41022049560547,77.88999955126953,35.71022049560547,77.68000035126953,36.510220495605466C77.41000355126953,37.56022049560547,80.78000255126953,39.14022049560547,84.39000255126953,39.14022049560547C86.90999255126953,39.14022049560547,88.48000255126954,38.24022049560547,89.78000255126953,37.07022049560547C90.99000255126953,35.99022049560547,91.91000255126953,36.54022049560547,92.33000255126953,36.88022049560547C93.31000255126953,37.68022049560547,95.30000255126953,38.24022049560547,96.91000255126953,38.24022049560547C98.75000255126953,38.24022049560547,101.70000255126953,36.77022049560547,101.42000255126953,36.120220495605466C100.97000255126953,35.050220495605
47,98.79000255126954,36.64022049560547,97.17000255126953,36.64022049560547C93.80000255126953,36.64022049560547,92.08000255126953,34.74022049560547,92.38000255126953,33.64025049560547L92.40000255126954,33.64025049560547Z" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><ellipse cx="73.29999995231628" cy="22.87967801094055" rx="2.299999952316284" ry="3.200000047683716" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><ellipse cx="103.39000082015991" cy="22.879873275756836" rx="2.0999999046325684" ry="3" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><path d="M79.02001440429687,105.64Q76.50000440429687,106.52,68.26999640429688,109.8Q67.65999640429688,108.05,68.91999840429688,105.35C73.01999440429688,98.05,70.61999440429688,92.75,85.42001440429688,89.25C80.22001440429688,91.85,79.42001440429688,95.15,79.32001440429687,101.25Q79.34001440429688,103.78,79.02001440429687,105.65L79.02001440429687,105.64Z" fill="#000000" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><path 
d="M0.0000113502,139.93639237060546C7.89472,141.46179237060545,19.707,142.57839237060546,27.0463,140.78379237060545C37.6982,138.18169237060548,49.2924,126.80629237060546,63.7428,114.89259237060547C78.1933,102.97880237060546,103.246,95.78070237060547,123.132,102.60992237060547C128.874,104.58389237060547,131.81,108.53189237060548,131.81,108.63159237060547C130.124,107.53499237060547,128.339,106.33859237060547,126.553,105.54099237060547C118.024,101.65284237060547,107.808,101.55314237060547,98.7831,103.64679237060547C97.4937,103.94589237060546,96.3036,104.24499237060547,95.0142,104.64369237060546C93.8241,105.04249237060547,92.5347,105.44129237060547,91.3446,105.84009237060548C90.1544,106.23889237060547,88.9643,106.73739237060546,87.7741,107.23589237060547C86.5839,107.73429237060547,85.3938,108.33249237060546,84.3028,108.83099237060547C83.1127,109.42919237060546,82.0217,110.02739237060547,80.9307,110.72519237060547C79.8397,111.42309237060547,78.7487,112.02129237060547,77.6578,112.81889237060547C76.5668,113.51679237060547,75.575,114.31429237060547,74.484,115.01219237060548C73.4922,115.80979237060546,72.4012,116.60739237060547,71.5086,117.40489237060547C67.7398,120.69489237060547,64.2685,124.38369237060547,60.7972,127.87309237060546C46.912,142.72789237060547,36.7957,150.70359237060546,15.4721,151.40149237060547C12.0008,151.50119237060545,3.37213,151.20209237060547,0.0991972,149.50729237060546C23.8032,167.15359237060545,60.2021,172.53729237060548,79.1455,171.34089237060547C99.0806,170.14449237060546,122.487,161.67029237060547,128.835,145.91819237060548C116.239,136.54669237060546,112.271,151.89999237060547,102.155,146.81549237060545C92.0388,141.73089237060546,98.2871,129.46829237060547,107.908,121.99099237060547C117.528,114.51369237060547,124.282,115.18169237060548,127.833,116.64719237060547C133.377,118.93029237060547,133.506,123.28699237060547,133.198,124.38369237060547C132.812,125.77949237060547,131.711,126.67669237060547,130.62,127.57399237060547C133.694,127.07549237060547
,135.678,126.37759237060547,138.058,123.98489237060546C139.943,121.39279237060546,140.339,118.40189237060547,139.744,115.31129237060547C138.752,109.62859237060547,135.48,104.24499237060547,130.818,101.05466237060547C119.512,93.07891737060547,105.101,92.72998037060547,91.2057,94.14567237060547C75.5551,95.74082237060547,56.473,106.41829237060547,41.2191,118.16259237060547C31.9855,125.27099237060547,16.1663,136.85579237060546,0,139.94639237060545L0.0000113502,139.93639237060546ZM77.0627,140.93339237060547C67.5414,151.99969237060546,51.6032,159.35729237060548,35.6055,158.18089237060548C27.8695,157.61259237060546,22.8114,156.48609237060546,21.7204,155.48909237060548C34.0187,156.88479237060545,48.5981,152.49819237060547,54.3505,148.80939237060545C60.1029,145.12059237060546,67.0455,136.44699237060547,70.8144,133.85489237060546C74.5832,131.26279237060547,76.7651,131.86099237060546,78.0545,132.75819237060546C80.2364,134.15399237060547,79.6414,137.94249237060546,77.0627,140.93339237060547Z" fill="url(#master_svg2_14_2646)" fill-opacity="1" style="mix-blend-mode:passthrough"/></g><g><path d="M72,45.5C76,47.5,81.50006,49.00005,87,49Q92.4999,48.99995,96.9999,47.49995L99.5,44Q89,49,72,45.5Z" fill="#000000" fill-opacity="1"/></g></g></g></svg>
\ No newline at end of file
diff --git a/fluss-rust/website/tsconfig.json b/fluss-rust/website/tsconfig.json
new file mode 100644
index 0000000000..d250afaedd
--- /dev/null
+++ b/fluss-rust/website/tsconfig.json
@@ -0,0 +1,6 @@
+{
+  "extends": "@docusaurus/tsconfig",
+  "compilerOptions": {
+    "baseUrl": "."
+  }
+}

From 6adf7fee6c47cf6e68c8cd74bc7d000c52f249a6 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 16 Feb 2026 00:26:31 +0000
Subject: [PATCH 146/287] chore: cleanup after docs review (#313)

---
 fluss-rust/bindings/cpp/examples/example.cpp  | 15 +++-
 fluss-rust/bindings/cpp/include/fluss.hpp     | 22 +++---
 fluss-rust/bindings/cpp/src/admin.cpp         | 45 +++++++++--
 fluss-rust/bindings/cpp/src/lib.rs            | 78 +++++++++++++------
 fluss-rust/bindings/python/example/example.py | 18 +++--
 fluss-rust/bindings/python/fluss/__init__.pyi | 46 +++++++----
 fluss-rust/bindings/python/src/admin.rs       | 54 ++++---------
 fluss-rust/bindings/python/src/lib.rs         | 52 ++++++++++---
 .../docs/user-guide/cpp/api-reference.md      | 14 ++--
 .../website/docs/user-guide/cpp/data-types.md |  2 +-
 .../cpp/example/admin-operations.md           |  8 +-
 .../cpp/example/partitioned-tables.md         |  2 +-
 .../docs/user-guide/python/api-reference.md   | 17 ++--
 .../python/example/admin-operations.md        |  6 +-
 .../python/example/configuration.md           |  4 +-
 .../user-guide/python/example/log-tables.md   |  2 +-
 16 files changed, 248 insertions(+), 137 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 2c7f55452d..2b7f331e66 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -286,7 +286,7 @@ int main() {
 
     std::unordered_map<int32_t, int64_t> earliest_offsets;
     check("list_earliest_offsets",
-          admin.ListOffsets(table_path, all_bucket_ids, fluss::OffsetQuery::Earliest(),
+          admin.ListOffsets(table_path, all_bucket_ids, fluss::OffsetSpec::Earliest(),
                             earliest_offsets));
     std::cout << "Earliest offsets:" << std::endl;
     for (const auto& [bucket_id, offset] : earliest_offsets) {
@@ -295,7 +295,7 @@ int main() {
 
     std::unordered_map<int32_t, int64_t> latest_offsets;
     check("list_latest_offsets", admin.ListOffsets(table_path, all_bucket_ids,
-                                                   fluss::OffsetQuery::Latest(), latest_offsets));
+                                                   fluss::OffsetSpec::Latest(), latest_offsets));
     std::cout << "Latest offsets:" << std::endl;
     for (const auto& [bucket_id, offset] : latest_offsets) {
         std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
@@ -310,7 +310,7 @@ int main() {
     std::unordered_map<int32_t, int64_t> timestamp_offsets;
     check("list_timestamp_offsets",
           admin.ListOffsets(table_path, all_bucket_ids,
-                            fluss::OffsetQuery::FromTimestamp(timestamp_ms), timestamp_offsets));
+                            fluss::OffsetSpec::Timestamp(timestamp_ms), timestamp_offsets));
     std::cout << "Offsets for timestamp " << timestamp_ms << " (1 hour ago):" << std::endl;
     for (const auto& [bucket_id, offset] : timestamp_offsets) {
         std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
@@ -507,7 +507,7 @@ int main() {
           admin.CreatePartition(partitioned_table_path, {{"region", "EU"}}, true));
     std::cout << "Created partitions: US, EU" << std::endl;
 
-    // List partitions
+    // List all partitions
     std::vector<fluss::PartitionInfo> partition_infos;
     check("list_partition_infos",
           admin.ListPartitionInfos(partitioned_table_path, partition_infos));
@@ -516,6 +516,13 @@ int main() {
                   << std::endl;
     }
 
+    // List partitions with partial spec filter
+    std::vector<fluss::PartitionInfo> us_partition_infos;
+    check("list_partition_infos_with_spec",
+          admin.ListPartitionInfos(partitioned_table_path, {{"region", "US"}}, us_partition_infos));
+    std::cout << "  Filtered (region=US): " << us_partition_infos.size() << " partition(s)"
+              << std::endl;
+
     // Write data to partitioned table
     fluss::Table partitioned_table;
     check("get_partitioned_table", conn.GetTable(partitioned_table_path, partitioned_table));
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index dd298823a4..30a8636baf 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -305,19 +305,19 @@ enum class DatumType {
 
 constexpr int64_t EARLIEST_OFFSET = -2;
 
-enum class OffsetSpec {
+enum class OffsetType {
     Earliest = 0,
     Latest = 1,
     Timestamp = 2,
 };
 
-struct OffsetQuery {
-    OffsetSpec spec;
+struct OffsetSpec {
+    OffsetType type;
     int64_t timestamp{0};
 
-    static OffsetQuery Earliest() { return {OffsetSpec::Earliest, 0}; }
-    static OffsetQuery Latest() { return {OffsetSpec::Latest, 0}; }
-    static OffsetQuery FromTimestamp(int64_t ts) { return {OffsetSpec::Timestamp, ts}; }
+    static OffsetSpec Earliest() { return {OffsetType::Earliest, 0}; }
+    static OffsetSpec Latest() { return {OffsetType::Latest, 0}; }
+    static OffsetSpec Timestamp(int64_t ts) { return {OffsetType::Timestamp, ts}; }
 };
 
 struct Result {
@@ -1000,15 +1000,19 @@ class Admin {
     Result GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& out);
 
     Result ListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
-                       const OffsetQuery& offset_query, std::unordered_map<int32_t, int64_t>& out);
+                       const OffsetSpec& offset_spec, std::unordered_map<int32_t, int64_t>& out);
 
     Result ListPartitionOffsets(const TablePath& table_path, const std::string& partition_name,
                                 const std::vector<int32_t>& bucket_ids,
-                                const OffsetQuery& offset_query,
+                                const OffsetSpec& offset_spec,
                                 std::unordered_map<int32_t, int64_t>& out);
 
     Result ListPartitionInfos(const TablePath& table_path, std::vector<PartitionInfo>& out);
 
+    Result ListPartitionInfos(const TablePath& table_path,
+                              const std::unordered_map<std::string, std::string>& partition_spec,
+                              std::vector<PartitionInfo>& out);
+
     Result CreatePartition(const TablePath& table_path,
                            const std::unordered_map<std::string, std::string>& partition_spec,
                            bool ignore_if_exists = false);
@@ -1035,7 +1039,7 @@ class Admin {
 
    private:
     Result DoListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
-                         const OffsetQuery& offset_query, std::unordered_map<int32_t, int64_t>& out,
+                         const OffsetSpec& offset_spec, std::unordered_map<int32_t, int64_t>& out,
                          const std::string* partition_name = nullptr);
 
     friend class Connection;
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index 0fb15b2746..8deb182dcd 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -107,7 +107,7 @@ Result Admin::GetLatestLakeSnapshot(const TablePath& table_path, LakeSnapshot& o
 
 // function for common list offsets functionality
 Result Admin::DoListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
-                            const OffsetQuery& offset_query,
+                            const OffsetSpec& offset_spec,
                             std::unordered_map<int32_t, int64_t>& out,
                             const std::string* partition_name) {
     if (!Available()) {
@@ -122,8 +122,8 @@ Result Admin::DoListOffsets(const TablePath& table_path, const std::vector<int32
     }
 
     ffi::FfiOffsetQuery ffi_query;
-    ffi_query.offset_type = static_cast<int32_t>(offset_query.spec);
-    ffi_query.timestamp = offset_query.timestamp;
+    ffi_query.offset_type = static_cast<int32_t>(offset_spec.type);
+    ffi_query.timestamp = offset_spec.timestamp;
 
     ffi::FfiListOffsetsResult ffi_result;
     if (partition_name != nullptr) {
@@ -145,16 +145,16 @@ Result Admin::DoListOffsets(const TablePath& table_path, const std::vector<int32
 }
 
 Result Admin::ListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
-                          const OffsetQuery& offset_query,
+                          const OffsetSpec& offset_spec,
                           std::unordered_map<int32_t, int64_t>& out) {
-    return DoListOffsets(table_path, bucket_ids, offset_query, out);
+    return DoListOffsets(table_path, bucket_ids, offset_spec, out);
 }
 
 Result Admin::ListPartitionOffsets(const TablePath& table_path, const std::string& partition_name,
                                    const std::vector<int32_t>& bucket_ids,
-                                   const OffsetQuery& offset_query,
+                                   const OffsetSpec& offset_spec,
                                    std::unordered_map<int32_t, int64_t>& out) {
-    return DoListOffsets(table_path, bucket_ids, offset_query, out, &partition_name);
+    return DoListOffsets(table_path, bucket_ids, offset_spec, out, &partition_name);
 }
 
 Result Admin::ListPartitionInfos(const TablePath& table_path, std::vector<PartitionInfo>& out) {
@@ -177,6 +177,37 @@ Result Admin::ListPartitionInfos(const TablePath& table_path, std::vector<Partit
     return result;
 }
 
+Result Admin::ListPartitionInfos(const TablePath& table_path,
+                                 const std::unordered_map<std::string, std::string>& partition_spec,
+                                 std::vector<PartitionInfo>& out) {
+    if (!Available()) {
+        return utils::make_client_error("Admin not available");
+    }
+
+    auto ffi_path = utils::to_ffi_table_path(table_path);
+
+    rust::Vec<ffi::FfiPartitionKeyValue> rust_spec;
+    for (const auto& [key, value] : partition_spec) {
+        ffi::FfiPartitionKeyValue kv;
+        kv.key = rust::String(key);
+        kv.value = rust::String(value);
+        rust_spec.push_back(std::move(kv));
+    }
+
+    auto ffi_result = admin_->list_partition_infos_with_spec(ffi_path, std::move(rust_spec));
+
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out.clear();
+        out.reserve(ffi_result.partition_infos.size());
+        for (const auto& pi : ffi_result.partition_infos) {
+            out.push_back({pi.partition_id, std::string(pi.partition_name)});
+        }
+    }
+
+    return result;
+}
+
 Result Admin::CreatePartition(const TablePath& table_path,
                               const std::unordered_map<std::string, std::string>& partition_spec,
                               bool ignore_if_exists) {
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 8a5bdfdd66..fab8edff84 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -302,6 +302,11 @@ mod ffi {
             self: &Admin,
             table_path: &FfiTablePath,
         ) -> FfiListPartitionInfosResult;
+        fn list_partition_infos_with_spec(
+            self: &Admin,
+            table_path: &FfiTablePath,
+            partition_spec: Vec<FfiPartitionKeyValue>,
+        ) -> FfiListPartitionInfosResult;
         fn create_partition(
             self: &Admin,
             table_path: &FfiTablePath,
@@ -735,30 +740,20 @@ impl Admin {
         &self,
         table_path: &ffi::FfiTablePath,
     ) -> ffi::FfiListPartitionInfosResult {
-        let path = fcore::metadata::TablePath::new(
-            table_path.database_name.clone(),
-            table_path.table_name.clone(),
-        );
-        let result = RUNTIME.block_on(async { self.inner.list_partition_infos(&path).await });
-        match result {
-            Ok(infos) => {
-                let partition_infos: Vec<ffi::FfiPartitionInfo> = infos
-                    .into_iter()
-                    .map(|info| ffi::FfiPartitionInfo {
-                        partition_id: info.get_partition_id(),
-                        partition_name: info.get_partition_name(),
-                    })
-                    .collect();
-                ffi::FfiListPartitionInfosResult {
-                    result: ok_result(),
-                    partition_infos,
-                }
-            }
-            Err(e) => ffi::FfiListPartitionInfosResult {
-                result: err_from_core_error(&e),
-                partition_infos: vec![],
-            },
-        }
+        self.do_list_partition_infos(table_path, None)
+    }
+
+    fn list_partition_infos_with_spec(
+        &self,
+        table_path: &ffi::FfiTablePath,
+        partition_spec: Vec<ffi::FfiPartitionKeyValue>,
+    ) -> ffi::FfiListPartitionInfosResult {
+        let spec_map: std::collections::HashMap<String, String> = partition_spec
+            .into_iter()
+            .map(|kv| (kv.key, kv.value))
+            .collect();
+        let spec = fcore::metadata::PartitionSpec::new(spec_map);
+        self.do_list_partition_infos(table_path, Some(&spec))
     }
     fn create_partition(
         &self,
@@ -939,6 +934,41 @@ impl Admin {
             },
         }
     }
+
+    fn do_list_partition_infos(
+        &self,
+        table_path: &ffi::FfiTablePath,
+        partial_partition_spec: Option<&fcore::metadata::PartitionSpec>,
+    ) -> ffi::FfiListPartitionInfosResult {
+        let path = fcore::metadata::TablePath::new(
+            table_path.database_name.clone(),
+            table_path.table_name.clone(),
+        );
+        let result = RUNTIME.block_on(async {
+            self.inner
+                .list_partition_infos_with_spec(&path, partial_partition_spec)
+                .await
+        });
+        match result {
+            Ok(infos) => {
+                let partition_infos: Vec<ffi::FfiPartitionInfo> = infos
+                    .into_iter()
+                    .map(|info| ffi::FfiPartitionInfo {
+                        partition_id: info.get_partition_id(),
+                        partition_name: info.get_partition_name(),
+                    })
+                    .collect();
+                ffi::FfiListPartitionInfosResult {
+                    result: ok_result(),
+                    partition_infos,
+                }
+            }
+            Err(e) => ffi::FfiListPartitionInfosResult {
+                result: err_from_core_error(&e),
+                partition_infos: vec![],
+            },
+        }
+    }
 }
 
 // Table implementation
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 4ea3bd6a47..9c2b7e308c 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -90,11 +90,11 @@ async def main():
     # Demo: List offsets
     print("\n--- Testing list_offsets() ---")
     try:
-        # Query latest offsets using OffsetType constant (recommended for type safety)
+        # Query latest offsets using OffsetSpec factory method
         offsets = await admin.list_offsets(
             table_path,
             bucket_ids=[0],
-            offset_type=fluss.OffsetType.LATEST
+            offset_spec=fluss.OffsetSpec.latest()
         )
         print(f"Latest offsets for table (before writes): {offsets}")
     except Exception as e:
@@ -248,11 +248,10 @@ async def main():
         # Demo: Check offsets after writes
         print("\n--- Checking offsets after writes ---")
         try:
-            # Query with string constant (alternative API - both strings and constants are supported)
             offsets = await admin.list_offsets(
                 table_path,
                 bucket_ids=[0],
-                offset_type="latest"  # Can also use "earliest" or "timestamp"
+                offset_spec=fluss.OffsetSpec.latest()
             )
             print(f"Latest offsets after writing 7 records: {offsets}")
         except Exception as e:
@@ -734,6 +733,13 @@ async def main():
         await partitioned_writer.flush()
         print("\nWrote 4 records (2 to US, 2 to EU)")
 
+        # Demo: list_partition_infos with partial spec filter
+        print("\n--- Testing list_partition_infos with spec ---")
+        us_partitions = await admin.list_partition_infos(
+            partitioned_table_path, partition_spec={"region": "US"}
+        )
+        print(f"Filtered partitions (region=US): {us_partitions}")
+
         # Demo: list_partition_offsets
         print("\n--- Testing list_partition_offsets ---")
 
@@ -743,7 +749,7 @@ async def main():
             partitioned_table_path,
             partition_name="US",
             bucket_ids=[0],
-            offset_type="latest"
+            offset_spec=fluss.OffsetSpec.latest()
         )
         print(f"US partition latest offsets: {us_offsets}")
 
@@ -752,7 +758,7 @@ async def main():
             partitioned_table_path,
             partition_name="EU",
             bucket_ids=[0],
-            offset_type="latest"
+            offset_spec=fluss.OffsetSpec.latest()
         )
         print(f"EU partition latest offsets: {eu_offsets}")
 
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index daccca8512..47eeb808b5 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -193,16 +193,15 @@ class FlussAdmin:
         self,
         table_path: TablePath,
         bucket_ids: List[int],
-        offset_type: str,
-        timestamp: Optional[int] = None,
+        offset_spec: "OffsetSpec",
     ) -> Dict[int, int]:
         """List offsets for the specified buckets.
 
         Args:
             table_path: Path to the table
             bucket_ids: List of bucket IDs to query
-            offset_type: "earliest", "latest", or "timestamp"
-            timestamp: Required when offset_type is "timestamp"
+            offset_spec: Offset specification (OffsetSpec.earliest(), OffsetSpec.latest(),
+                or OffsetSpec.timestamp(ts))
 
         Returns:
             Dict mapping bucket_id -> offset
@@ -213,8 +212,7 @@ class FlussAdmin:
         table_path: TablePath,
         partition_name: str,
         bucket_ids: List[int],
-        offset_type: str,
-        timestamp: Optional[int] = None,
+        offset_spec: "OffsetSpec",
     ) -> Dict[int, int]:
         """List offsets for buckets in a specific partition.
 
@@ -222,8 +220,8 @@ class FlussAdmin:
             table_path: Path to the table
             partition_name: Partition value (e.g., "US" not "region=US")
             bucket_ids: List of bucket IDs to query
-            offset_type: "earliest", "latest", or "timestamp"
-            timestamp: Required when offset_type is "timestamp"
+            offset_spec: Offset specification (OffsetSpec.earliest(), OffsetSpec.latest(),
+                or OffsetSpec.timestamp(ts))
 
         Returns:
             Dict mapping bucket_id -> offset
@@ -246,11 +244,15 @@ class FlussAdmin:
     async def list_partition_infos(
         self,
         table_path: TablePath,
+        partition_spec: Optional[Dict[str, str]] = None,
     ) -> List["PartitionInfo"]:
-        """List all partitions for a partitioned table.
+        """List partitions for a partitioned table.
 
         Args:
             table_path: Path to the table
+            partition_spec: Optional partial partition spec to filter results.
+                Dict mapping partition column name to value (e.g., {"region": "US"}).
+                If None, returns all partitions.
 
         Returns:
             List of PartitionInfo objects
@@ -839,12 +841,28 @@ class ErrorCode:
     INVALID_ALTER_TABLE_EXCEPTION: int
     DELETION_DISABLED_EXCEPTION: int
 
-class OffsetType:
-    """Offset type constants for list_offsets()."""
+class OffsetSpec:
+    """Offset specification for list_offsets(), matching Java's OffsetSpec.
 
-    EARLIEST: str
-    LATEST: str
-    TIMESTAMP: str
+    Use factory methods to create instances:
+        OffsetSpec.earliest()
+        OffsetSpec.latest()
+        OffsetSpec.timestamp(ts)
+    """
+
+    @staticmethod
+    def earliest() -> "OffsetSpec":
+        """Create an OffsetSpec for the earliest available offset."""
+        ...
+    @staticmethod
+    def latest() -> "OffsetSpec":
+        """Create an OffsetSpec for the latest available offset."""
+        ...
+    @staticmethod
+    def timestamp(ts: int) -> "OffsetSpec":
+        """Create an OffsetSpec for the offset at or after the given timestamp."""
+        ...
+    def __repr__(self) -> str: ...
 
 # Constant for earliest offset (-2)
 EARLIEST_OFFSET: int
diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
index d03ce7a21c..9a96bea1f6 100644
--- a/fluss-rust/bindings/python/src/admin.rs
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -16,7 +16,6 @@
 // under the License.
 
 use crate::*;
-use fcore::rpc::message::OffsetSpec;
 use pyo3::conversion::IntoPyObject;
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::sync::Arc;
@@ -27,23 +26,6 @@ pub struct FlussAdmin {
     __admin: Arc<fcore::client::FlussAdmin>,
 }
 
-/// Parse offset_type string into OffsetSpec
-fn parse_offset_spec(offset_type: &str, timestamp: Option<i64>) -> PyResult<OffsetSpec> {
-    match offset_type {
-        s if s.eq_ignore_ascii_case("earliest") => Ok(OffsetSpec::Earliest),
-        s if s.eq_ignore_ascii_case("latest") => Ok(OffsetSpec::Latest),
-        s if s.eq_ignore_ascii_case("timestamp") => {
-            let ts = timestamp.ok_or_else(|| {
-                FlussError::new_err("timestamp must be provided when offset_type='timestamp'")
-            })?;
-            Ok(OffsetSpec::Timestamp(ts))
-        }
-        _ => Err(FlussError::new_err(format!(
-            "Invalid offset_type: '{offset_type}'. Must be 'earliest', 'latest', or 'timestamp'"
-        ))),
-    }
-}
-
 /// Validate bucket IDs are non-negative
 fn validate_bucket_ids(bucket_ids: &[i32]) -> PyResult<()> {
     for &bucket_id in bucket_ids {
@@ -374,25 +356,20 @@ impl FlussAdmin {
     /// Args:
     ///     table_path: Path to the table
     ///     bucket_ids: List of bucket IDs to query
-    ///     offset_type: Type of offset to retrieve:
-    ///         - "earliest" or OffsetType.EARLIEST: Start of the log
-    ///         - "latest" or OffsetType.LATEST: End of the log
-    ///         - "timestamp" or OffsetType.TIMESTAMP: Offset at given timestamp (requires timestamp arg)
-    ///     timestamp: Required when offset_type is "timestamp", ignored otherwise
+    ///     offset_spec: Offset specification (OffsetSpec.earliest(), OffsetSpec.latest(),
+    ///         or OffsetSpec.timestamp(ts))
     ///
     /// Returns:
     ///     dict[int, int]: Mapping of bucket_id -> offset
-    #[pyo3(signature = (table_path, bucket_ids, offset_type, timestamp=None))]
     pub fn list_offsets<'py>(
         &self,
         py: Python<'py>,
         table_path: &TablePath,
         bucket_ids: Vec<i32>,
-        offset_type: &str,
-        timestamp: Option<i64>,
+        offset_spec: &OffsetSpec,
     ) -> PyResult<Bound<'py, PyAny>> {
         validate_bucket_ids(&bucket_ids)?;
-        let offset_spec = parse_offset_spec(offset_type, timestamp)?;
+        let offset_spec = offset_spec.inner.clone();
 
         let core_table_path = table_path.to_core();
         let admin = self.__admin.clone();
@@ -419,26 +396,21 @@ impl FlussAdmin {
     ///     table_path: Path to the table
     ///     partition_name: Partition value (e.g., "US" not "region=US")
     ///     bucket_ids: List of bucket IDs to query
-    ///     offset_type: Type of offset to retrieve:
-    ///         - "earliest" or OffsetType.EARLIEST: Start of the log
-    ///         - "latest" or OffsetType.LATEST: End of the log
-    ///         - "timestamp" or OffsetType.TIMESTAMP: Offset at given timestamp (requires timestamp arg)
-    ///     timestamp: Required when offset_type is "timestamp", ignored otherwise
+    ///     offset_spec: Offset specification (OffsetSpec.earliest(), OffsetSpec.latest(),
+    ///         or OffsetSpec.timestamp(ts))
     ///
     /// Returns:
     ///     dict[int, int]: Mapping of bucket_id -> offset
-    #[pyo3(signature = (table_path, partition_name, bucket_ids, offset_type, timestamp=None))]
     pub fn list_partition_offsets<'py>(
         &self,
         py: Python<'py>,
         table_path: &TablePath,
         partition_name: &str,
         bucket_ids: Vec<i32>,
-        offset_type: &str,
-        timestamp: Option<i64>,
+        offset_spec: &OffsetSpec,
     ) -> PyResult<Bound<'py, PyAny>> {
         validate_bucket_ids(&bucket_ids)?;
-        let offset_spec = parse_offset_spec(offset_type, timestamp)?;
+        let offset_spec = offset_spec.inner.clone();
 
         let core_table_path = table_path.to_core();
         let admin = self.__admin.clone();
@@ -493,24 +465,30 @@ impl FlussAdmin {
         })
     }
 
-    /// List all partitions for a partitioned table.
+    /// List partitions for a partitioned table.
     ///
     /// Args:
     ///     table_path: Path to the table
+    ///     partition_spec: Optional partial partition spec to filter results.
+    ///         Dict mapping partition column name to value (e.g., {"region": "US"}).
+    ///         If None, returns all partitions.
     ///
     /// Returns:
     ///     List[PartitionInfo]: List of partition info objects
+    #[pyo3(signature = (table_path, partition_spec=None))]
     pub fn list_partition_infos<'py>(
         &self,
         py: Python<'py>,
         table_path: &TablePath,
+        partition_spec: Option<std::collections::HashMap<String, String>>,
     ) -> PyResult<Bound<'py, PyAny>> {
         let core_table_path = table_path.to_core();
         let admin = self.__admin.clone();
+        let core_partition_spec = partition_spec.map(fcore::metadata::PartitionSpec::new);
 
         future_into_py(py, async move {
             let partition_infos = admin
-                .list_partition_infos(&core_table_path)
+                .list_partition_infos_with_spec(&core_table_path, core_partition_spec.as_ref())
                 .await
                 .map_err(|e| FlussError::new_err(format!("Failed to list partitions: {e}")))?;
 
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 801db2c87b..553c8a925e 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -50,21 +50,53 @@ static TOKIO_RUNTIME: LazyLock<Runtime> = LazyLock::new(|| {
         .expect("Failed to create Tokio runtime")
 });
 
-/// Offset type constants for list_offsets()
+/// Offset specification for list_offsets(), matching Java's OffsetSpec.
+///
+/// Use factory methods to create instances:
+///   OffsetSpec.earliest()
+///   OffsetSpec.latest()
+///   OffsetSpec.timestamp(ts)
 #[pyclass]
 #[derive(Clone)]
-pub struct OffsetType;
+pub struct OffsetSpec {
+    pub(crate) inner: fcore::rpc::message::OffsetSpec,
+}
 
 #[pymethods]
-impl OffsetType {
-    #[classattr]
-    const EARLIEST: &'static str = "earliest";
+impl OffsetSpec {
+    /// Create an OffsetSpec for the earliest available offset.
+    #[staticmethod]
+    fn earliest() -> Self {
+        Self {
+            inner: fcore::rpc::message::OffsetSpec::Earliest,
+        }
+    }
+
+    /// Create an OffsetSpec for the latest available offset.
+    #[staticmethod]
+    fn latest() -> Self {
+        Self {
+            inner: fcore::rpc::message::OffsetSpec::Latest,
+        }
+    }
 
-    #[classattr]
-    const LATEST: &'static str = "latest";
+    /// Create an OffsetSpec for the offset at or after the given timestamp.
+    #[staticmethod]
+    fn timestamp(ts: i64) -> Self {
+        Self {
+            inner: fcore::rpc::message::OffsetSpec::Timestamp(ts),
+        }
+    }
 
-    #[classattr]
-    const TIMESTAMP: &'static str = "timestamp";
+    fn __repr__(&self) -> String {
+        match &self.inner {
+            fcore::rpc::message::OffsetSpec::Earliest => "OffsetSpec.earliest()".to_string(),
+            fcore::rpc::message::OffsetSpec::Latest => "OffsetSpec.latest()".to_string(),
+            fcore::rpc::message::OffsetSpec::Timestamp(ts) => {
+                format!("OffsetSpec.timestamp({ts})")
+            }
+        }
+    }
 }
 
 #[pymodule]
@@ -92,7 +124,7 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<ScanRecord>()?;
     m.add_class::<RecordBatch>()?;
     m.add_class::<PartitionInfo>()?;
-    m.add_class::<OffsetType>()?;
+    m.add_class::<OffsetSpec>()?;
     m.add_class::<WriteResultHandle>()?;
     m.add_class::<DatabaseDescriptor>()?;
     m.add_class::<DatabaseInfo>()?;
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index 00ff8086d8..47c9307de7 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -68,8 +68,8 @@ Complete API reference for the Fluss C++ client.
 
 | Method                                                                                                                                                                                                  | Description                             |
 |---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|-----------------------------------------|
-| `ListOffsets(const TablePath& path, const std::vector<int32_t>& bucket_ids, const OffsetQuery& query, std::unordered_map<int32_t, int64_t>& out) -> Result`                                             | Get offsets for buckets                 |
-| `ListPartitionOffsets(const TablePath& path, const std::string& partition_name, const std::vector<int32_t>& bucket_ids, const OffsetQuery& query, std::unordered_map<int32_t, int64_t>& out) -> Result` | Get offsets for a partition's buckets   |
+| `ListOffsets(const TablePath& path, const std::vector<int32_t>& bucket_ids, const OffsetSpec& query, std::unordered_map<int32_t, int64_t>& out) -> Result`                                             | Get offsets for buckets                 |
+| `ListPartitionOffsets(const TablePath& path, const std::string& partition_name, const std::vector<int32_t>& bucket_ids, const OffsetSpec& query, std::unordered_map<int32_t, int64_t>& out) -> Result` | Get offsets for a partition's buckets   |
 
 ### Lake Operations
 
@@ -423,13 +423,13 @@ When using `table.NewRow()`, the `Set()` method auto-routes to the correct type
 | `bucket_id`    | `int32_t` | Bucket ID    |
 | `offset`       | `int64_t` | Offset value |
 
-## `OffsetQuery`
+## `OffsetSpec`
 
 | Method                                             | Description                             |
 |----------------------------------------------------|-----------------------------------------|
-| `OffsetQuery::Earliest()`                          | Query for the earliest available offset |
-| `OffsetQuery::Latest()`                            | Query for the latest offset             |
-| `OffsetQuery::FromTimestamp(int64_t timestamp_ms)` | Query offset at a specific timestamp    |
+| `OffsetSpec::Earliest()`                          | Query for the earliest available offset |
+| `OffsetSpec::Latest()`                            | Query for the latest offset             |
+| `OffsetSpec::Timestamp(int64_t timestamp_ms)`     | Query offset at a specific timestamp    |
 
 ## Constants
 
@@ -441,7 +441,7 @@ To start reading from the latest offset (only new records), resolve the current
 
 ```cpp
 std::unordered_map<int32_t, int64_t> offsets;
-admin.ListOffsets(table_path, {0}, fluss::OffsetQuery::Latest(), offsets);
+admin.ListOffsets(table_path, {0}, fluss::OffsetSpec::Latest(), offsets);
 scanner.Subscribe(0, offsets[0]);
 ```
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/data-types.md b/fluss-rust/website/docs/user-guide/cpp/data-types.md
index 11712fac55..fb01ac2845 100644
--- a/fluss-rust/website/docs/user-guide/cpp/data-types.md
+++ b/fluss-rust/website/docs/user-guide/cpp/data-types.md
@@ -105,6 +105,6 @@ To start reading from the latest offset, resolve the current offset via `ListOff
 
 ```cpp
 std::unordered_map<int32_t, int64_t> offsets;
-admin.ListOffsets(table_path, {0}, fluss::OffsetQuery::Latest(), offsets);
+admin.ListOffsets(table_path, {0}, fluss::OffsetSpec::Latest(), offsets);
 scanner.Subscribe(0, offsets[0]);
 ```
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md b/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md
index 1a33012616..850660ea3a 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md
@@ -120,23 +120,23 @@ std::vector<int32_t> bucket_ids = {0, 1, 2};
 // Query earliest offsets
 std::unordered_map<int32_t, int64_t> earliest_offsets;
 admin.ListOffsets(table_path, bucket_ids,
-                  fluss::OffsetQuery::Earliest(), earliest_offsets);
+                  fluss::OffsetSpec::Earliest(), earliest_offsets);
 
 // Query latest offsets
 std::unordered_map<int32_t, int64_t> latest_offsets;
 admin.ListOffsets(table_path, bucket_ids,
-                  fluss::OffsetQuery::Latest(), latest_offsets);
+                  fluss::OffsetSpec::Latest(), latest_offsets);
 
 // Query offsets for a specific timestamp
 std::unordered_map<int32_t, int64_t> timestamp_offsets;
 admin.ListOffsets(table_path, bucket_ids,
-                  fluss::OffsetQuery::FromTimestamp(timestamp_ms),
+                  fluss::OffsetSpec::Timestamp(timestamp_ms),
                   timestamp_offsets);
 
 // Query partition offsets
 std::unordered_map<int32_t, int64_t> partition_offsets;
 admin.ListPartitionOffsets(table_path, "partition_name",
-                           bucket_ids, fluss::OffsetQuery::Latest(),
+                           bucket_ids, fluss::OffsetSpec::Latest(),
                            partition_offsets);
 ```
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md b/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md
index 6a6927f561..371ee3e020 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md
@@ -103,7 +103,7 @@ admin.ListPartitionInfos(table_path, partition_infos);
 std::vector<int32_t> bucket_ids = {0, 1, 2};
 std::unordered_map<int32_t, int64_t> offsets;
 admin.ListPartitionOffsets(table_path, "2024-01-15$US",
-                           bucket_ids, fluss::OffsetQuery::Latest(), offsets);
+                           bucket_ids, fluss::OffsetSpec::Latest(), offsets);
 ```
 
 ## Partitioned Primary Key Tables
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index 321e25e6b7..af03058a04 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -43,8 +43,8 @@ Supports `with` statement (context manager).
 | `await get_table_info(table_path) -> TableInfo`                                                                       | Get table metadata                    |
 | `await list_tables(database_name) -> list[str]`                                                                       | List tables in a database             |
 | `await table_exists(table_path) -> bool`                                                                              | Check if a table exists               |
-| `await list_offsets(table_path, bucket_ids, offset_type, timestamp=None) -> dict[int, int]`                           | Get offsets for buckets               |
-| `await list_partition_offsets(table_path, partition_name, bucket_ids, offset_type, timestamp=None) -> dict[int, int]` | Get offsets for a partition's buckets |
+| `await list_offsets(table_path, bucket_ids, offset_spec) -> dict[int, int]`                           | Get offsets for buckets               |
+| `await list_partition_offsets(table_path, partition_name, bucket_ids, offset_spec) -> dict[int, int]` | Get offsets for a partition's buckets |
 | `await create_partition(table_path, partition_spec, ignore_if_exists=False)`                                          | Create a partition                    |
 | `await drop_partition(table_path, partition_spec, ignore_if_not_exists=False)`                                        | Drop a partition                      |
 | `await list_partition_infos(table_path) -> list[PartitionInfo]`                                                       | List partitions                       |
@@ -264,14 +264,19 @@ Raised for all Fluss-specific errors (connection failures, table not found, sche
 | Constant                     | Value         | Description                                         |
 |------------------------------|---------------|-----------------------------------------------------|
 | `fluss.EARLIEST_OFFSET`      | `-2`          | Start reading from earliest available offset        |
-| `fluss.OffsetType.EARLIEST`  | `"earliest"`  | For `list_offsets()`                                |
-| `fluss.OffsetType.LATEST`    | `"latest"`    | For `list_offsets()`                                |
-| `fluss.OffsetType.TIMESTAMP` | `"timestamp"` | For `list_offsets()` with timestamp                 |
+
+## `OffsetSpec`
+
+| Method                      | Description                                      |
+|-----------------------------|--------------------------------------------------|
+| `OffsetSpec.earliest()`     | Earliest available offset                        |
+| `OffsetSpec.latest()`       | Latest offset                                    |
+| `OffsetSpec.timestamp(ts)`  | Offset at or after the given timestamp (millis)  |
 
 To start reading from the latest offset (only new records), resolve the current offset via `list_offsets` before subscribing:
 
 ```python
-offsets = await admin.list_offsets(table_path, [0], fluss.OffsetType.LATEST)
+offsets = await admin.list_offsets(table_path, [0], fluss.OffsetSpec.latest())
 scanner.subscribe(bucket_id=0, start_offset=offsets[0])
 ```
 
diff --git a/fluss-rust/website/docs/user-guide/python/example/admin-operations.md b/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
index 8c62ee78c9..4561a3fad6 100644
--- a/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
+++ b/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
@@ -56,13 +56,13 @@ await admin.drop_table(table_path, ignore_if_not_exists=True)
 
 ```python
 # Latest offsets for buckets
-offsets = await admin.list_offsets(table_path, bucket_ids=[0, 1], offset_type="latest")
+offsets = await admin.list_offsets(table_path, bucket_ids=[0, 1], offset_spec=fluss.OffsetSpec.latest())
 
 # By timestamp
-offsets = await admin.list_offsets(table_path, bucket_ids=[0], offset_type="timestamp", timestamp=1704067200000)
+offsets = await admin.list_offsets(table_path, bucket_ids=[0], offset_spec=fluss.OffsetSpec.timestamp(1704067200000))
 
 # Per-partition offsets
-offsets = await admin.list_partition_offsets(table_path, partition_name="US", bucket_ids=[0], offset_type="latest")
+offsets = await admin.list_partition_offsets(table_path, partition_name="US", bucket_ids=[0], offset_spec=fluss.OffsetSpec.latest())
 ```
 
 ## Lake Snapshot
diff --git a/fluss-rust/website/docs/user-guide/python/example/configuration.md b/fluss-rust/website/docs/user-guide/python/example/configuration.md
index c4ef4f3c69..9686fc6247 100644
--- a/fluss-rust/website/docs/user-guide/python/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/python/example/configuration.md
@@ -24,10 +24,10 @@ with await fluss.FlussConnection.create(config) as conn:
 | Key                 | Description                                           | Default            |
 |---------------------|-------------------------------------------------------|--------------------|
 | `bootstrap.servers` | Coordinator server address                            | `127.0.0.1:9123`   |
-| `request.max.size`  | Maximum request size in bytes                         | `10485760` (10 MB) |
+| `writer.request-max-size`  | Maximum request size in bytes                  | `10485760` (10 MB) |
 | `writer.acks`       | Acknowledgment setting (`all` waits for all replicas) | `all`              |
 | `writer.retries`    | Number of retries on failure                          | `2147483647`       |
-| `writer.batch.size` | Batch size for writes in bytes                        | `2097152` (2 MB)   |
+| `writer.batch-size` | Batch size for writes in bytes                        | `2097152` (2 MB)   |
 
 Remember to close the connection when done:
 
diff --git a/fluss-rust/website/docs/user-guide/python/example/log-tables.md b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
index 63903a4e46..6e44e0610d 100644
--- a/fluss-rust/website/docs/user-guide/python/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
@@ -106,7 +106,7 @@ To only consume new records (skip existing data), first resolve the current late
 
 ```python
 admin = await conn.get_admin()
-offsets = await admin.list_offsets(table_path, [0], fluss.OffsetType.LATEST)
+offsets = await admin.list_offsets(table_path, [0], fluss.OffsetSpec.latest())
 latest = offsets[0]
 
 scanner = await table.new_scan().create_record_batch_log_scanner()

From 32347c74344b38b41483af542492a0adadd72d16 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Mon, 16 Feb 2026 00:37:16 +0000
Subject: [PATCH 147/287] chore: Fix API error not being propagated on python
 side. (#340)

---
 fluss-rust/bindings/python/src/admin.rs          | 12 +++++-------
 fluss-rust/crates/fluss/src/client/connection.rs | 15 +++++++++++++--
 fluss-rust/crates/fluss/src/error.rs             |  9 +++++++++
 3 files changed, 27 insertions(+), 9 deletions(-)

diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
index 9a96bea1f6..30db37506b 100644
--- a/fluss-rust/bindings/python/src/admin.rs
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -345,7 +345,7 @@ impl FlussAdmin {
             admin
                 .drop_table(&core_table_path, ignore_if_not_exists)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to drop table: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| Ok(py.None()))
         })
@@ -378,7 +378,7 @@ impl FlussAdmin {
             let offsets = admin
                 .list_offsets(&core_table_path, &bucket_ids, offset_spec)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to list offsets: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| {
                 let dict = pyo3::types::PyDict::new(py);
@@ -420,9 +420,7 @@ impl FlussAdmin {
             let offsets = admin
                 .list_partition_offsets(&core_table_path, &partition_name, &bucket_ids, offset_spec)
                 .await
-                .map_err(|e| {
-                    FlussError::new_err(format!("Failed to list partition offsets: {e}"))
-                })?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| {
                 let dict = pyo3::types::PyDict::new(py);
@@ -459,7 +457,7 @@ impl FlussAdmin {
             admin
                 .create_partition(&core_table_path, &core_partition_spec, ignore_if_exists)
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to create partition: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| Ok(py.None()))
         })
@@ -490,7 +488,7 @@ impl FlussAdmin {
             let partition_infos = admin
                 .list_partition_infos_with_spec(&core_table_path, core_partition_spec.as_ref())
                 .await
-                .map_err(|e| FlussError::new_err(format!("Failed to list partitions: {e}")))?;
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
             Python::attach(|py| {
                 let py_list = pyo3::types::PyList::empty(py);
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index b370682afd..a17e57fb5f 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -24,7 +24,7 @@ use crate::rpc::RpcClient;
 use parking_lot::RwLock;
 use std::sync::Arc;
 
-use crate::error::Result;
+use crate::error::{Error, FlussError, Result};
 use crate::metadata::TablePath;
 
 pub struct FlussConnection {
@@ -88,7 +88,18 @@ impl FlussConnection {
 
     pub async fn get_table(&self, table_path: &TablePath) -> Result<FlussTable<'_>> {
         self.metadata.update_table_metadata(table_path).await?;
-        let table_info = self.metadata.get_cluster().get_table(table_path)?.clone();
+        let table_info = self
+            .metadata
+            .get_cluster()
+            .get_table(table_path)
+            .map_err(|e| {
+                if e.api_error() == Some(FlussError::InvalidTableException) {
+                    Error::table_not_exist(format!("Table not found: {table_path}"))
+                } else {
+                    e
+                }
+            })?
+            .clone();
         Ok(FlussTable::new(self, self.metadata.clone(), table_info))
     }
 }
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index af9f274c77..59524a6387 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -112,6 +112,15 @@ pub enum Error {
 /// These create `FlussAPIError` with the correct protocol error code,
 /// consistent with Java where e.g. `InvalidTableException` always carries code 15.
 impl Error {
+    pub fn table_not_exist(message: impl Into<String>) -> Self {
+        Error::FlussAPIError {
+            api_error: ApiError {
+                code: FlussError::TableNotExist.code(),
+                message: message.into(),
+            },
+        }
+    }
+
     pub fn invalid_table(message: impl Into<String>) -> Self {
         Error::FlussAPIError {
             api_error: ApiError {

From e1ec842165590bb993f8d1d3bad70927b0218768 Mon Sep 17 00:00:00 2001
From: Nikhil Negi <95623427+niknegi@users.noreply.github.com>
Date: Mon, 16 Feb 2026 06:14:27 +0530
Subject: [PATCH 148/287] chore: added Default Implementations for Missing
 Types (#326)

---
 .../crates/fluss/src/metadata/datatype.rs     | 23 +++++++++++++++++--
 1 file changed, 21 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 3da270bc6a..66f68f445c 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -390,6 +390,12 @@ impl CharType {
     }
 }
 
+impl Default for CharType {
+    fn default() -> Self {
+        Self::new(1)
+    }
+}
+
 impl Display for CharType {
     fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
         write!(f, "CHAR({})", self.length)?;
@@ -503,6 +509,13 @@ impl DecimalType {
     }
 }
 
+impl Default for DecimalType {
+    fn default() -> Self {
+        Self::new(Self::DEFAULT_PRECISION, Self::DEFAULT_SCALE)
+            .expect("Invalid default decimal precision or scale")
+    }
+}
+
 impl Display for DecimalType {
     fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
         write!(f, "DECIMAL({}, {})", self.precision, self.scale)?;
@@ -548,13 +561,13 @@ impl Display for DateType {
     }
 }
 
-#[derive(Default, Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize, Deserialize)]
 pub struct TimeType {
     nullable: bool,
     precision: u32,
 }
 
-impl TimeType {
+impl Default for TimeType {
     fn default() -> Self {
         Self::new(Self::DEFAULT_PRECISION).expect("Invalid default time precision")
     }
@@ -798,6 +811,12 @@ impl BinaryType {
     }
 }
 
+impl Default for BinaryType {
+    fn default() -> Self {
+        Self::new(Self::DEFAULT_LENGTH)
+    }
+}
+
 impl Display for BinaryType {
     fn fmt(&self, f: &mut Formatter<'_>) -> std::fmt::Result {
         write!(f, "BINARY({})", self.length)?;

From 5333e45c6635f02d5018f5bcb4479b04572f241b Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Mon, 16 Feb 2026 19:37:24 +0800
Subject: [PATCH 149/287] chore: default cpp builds to release mode (#345)

---
 fluss-rust/bindings/cpp/CMakeLists.txt | 4 ++--
 fluss-rust/bindings/cpp/README.md      | 3 +++
 fluss-rust/bindings/cpp/ci.sh          | 7 ++++---
 3 files changed, 9 insertions(+), 5 deletions(-)

diff --git a/fluss-rust/bindings/cpp/CMakeLists.txt b/fluss-rust/bindings/cpp/CMakeLists.txt
index 05c58ea73d..a8f527edad 100644
--- a/fluss-rust/bindings/cpp/CMakeLists.txt
+++ b/fluss-rust/bindings/cpp/CMakeLists.txt
@@ -32,7 +32,7 @@ find_package(Threads REQUIRED)
 find_package(Arrow REQUIRED)
 
 if (NOT CMAKE_BUILD_TYPE)
-    set(CMAKE_BUILD_TYPE Debug)
+    set(CMAKE_BUILD_TYPE Release)
 endif()
 
 set(CMAKE_CXX_STANDARD 17)
@@ -122,4 +122,4 @@ add_dependencies(fluss_cpp cargo_build)
 if (FLUSS_ENABLE_ADDRESS_SANITIZER)
     target_compile_options(fluss_cpp PRIVATE -fsanitize=leak,address,undefined -fno-omit-frame-pointer -fno-common -O1)
     target_link_options(fluss_cpp PRIVATE -fsanitize=leak,address,undefined)
-endif()
\ No newline at end of file
+endif()
diff --git a/fluss-rust/bindings/cpp/README.md b/fluss-rust/bindings/cpp/README.md
index 539e313024..1a8d9f2f64 100644
--- a/fluss-rust/bindings/cpp/README.md
+++ b/fluss-rust/bindings/cpp/README.md
@@ -22,12 +22,15 @@ cmake ..
 cmake --build .
 ```
 
+By default, the build uses the `Release` configuration when `CMAKE_BUILD_TYPE` is not specified.
+
 **With Bazel:**
 
 ```bash
 cd bindings/cpp
 bazel build //...
 ```
+`ci.sh` builds in optimized mode (`-c opt`) by default; set the `BAZEL_BUILD_FLAGS` environment variable to override.
 See [ci.sh](ci.sh) for the CI build sequence.
 
 
diff --git a/fluss-rust/bindings/cpp/ci.sh b/fluss-rust/bindings/cpp/ci.sh
index b5eb9676b6..ebf5f09205 100755
--- a/fluss-rust/bindings/cpp/ci.sh
+++ b/fluss-rust/bindings/cpp/ci.sh
@@ -19,6 +19,7 @@
 set -xe 
 
 DIR="$(cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd)"
+BAZEL_BUILD_FLAGS="${BAZEL_BUILD_FLAGS:--c opt}"
 
 # Set Bazel output base to bazel-build directory
 # This ensures all Bazel outputs are in bazel-build/.bazel-output-base
@@ -33,16 +34,16 @@ bazel() {
 }
 
 compile() {
-    bazel build //:fluss_cpp
+    bazel build ${BAZEL_BUILD_FLAGS} //:fluss_cpp
 }
 
 build_example() {
-    bazel build //:fluss_cpp_example
+    bazel build ${BAZEL_BUILD_FLAGS} //:fluss_cpp_example
 }
 
 run_example() {
     build_example
-    bazel run //:fluss_cpp_example
+    bazel run ${BAZEL_BUILD_FLAGS} //:fluss_cpp_example
 }
 
 clean() {

From c9e72e649206224399cbd991798a12c69b3e293f Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Tue, 17 Feb 2026 08:04:51 +0000
Subject: [PATCH 150/287] doc: Add missed API documentation update (#337)

---
 fluss-rust/docs/rust-client.md                      |   0
 .../docs/release/create-release.md}                 |  10 +++++++---
 .../docs/release}/generate-release-note.md          |   0
 .../docs/release}/verifying-a-release-candidate.md  |   0
 .../website/docs/user-guide/cpp/api-reference.md    |   3 ++-
 .../website/docs/user-guide/rust/api-reference.md   |  11 ++++++-----
 fluss-rust/website/sidebars.ts                      |   8 +++++++-
 .../assets => website/static/img}/release-guide.png | Bin
 8 files changed, 22 insertions(+), 10 deletions(-)
 delete mode 100644 fluss-rust/docs/rust-client.md
 rename fluss-rust/{docs/creating-a-release.md => website/docs/release/create-release.md} (97%)
 rename fluss-rust/{docs => website/docs/release}/generate-release-note.md (100%)
 rename fluss-rust/{docs => website/docs/release}/verifying-a-release-candidate.md (100%)
 rename fluss-rust/{docs/assets => website/static/img}/release-guide.png (100%)

diff --git a/fluss-rust/docs/rust-client.md b/fluss-rust/docs/rust-client.md
deleted file mode 100644
index e69de29bb2..0000000000
diff --git a/fluss-rust/docs/creating-a-release.md b/fluss-rust/website/docs/release/create-release.md
similarity index 97%
rename from fluss-rust/docs/creating-a-release.md
rename to fluss-rust/website/docs/release/create-release.md
index 8b4c868fbf..fc936f9a61 100644
--- a/fluss-rust/docs/creating-a-release.md
+++ b/fluss-rust/website/docs/release/create-release.md
@@ -1,3 +1,7 @@
+---
+sidebar_position: 4
+---
+
 # Creating a Fluss Rust Client Release
 
 This document describes in detail how to create a release of the **Fluss clients** (fluss-rust, fluss-python, fluss-cpp) from the [fluss-rust](https://github.com/apache/fluss-rust) repository. It is based on the [Creating a Fluss Release](https://fluss.apache.org/community/how-to-release/creating-a-fluss-release/) guide of the Apache Fluss project and the [release guide of Apache OpenDAL](https://nightlies.apache.org/opendal/opendal-docs-stable/community/release/); releases are source archives plus CI-published crates.io and PyPI.
@@ -6,7 +10,7 @@ Publishing software has legal consequences. This guide complements the foundatio
 
 ## Overview
 
-![Release process overview](assets/release-guide.png)
+![Release process overview](/img/release-guide.png)
 
 The release process consists of:
 
@@ -22,7 +26,7 @@ The release process consists of:
 
 Deciding to release and selecting a Release Manager is the first step. This is a consensus-based decision of the community.
 
-Anybody can propose a release (e.g. on the dev mailing list), giving a short rationale and nominating a committer as Release Manager (including themselves). Any objections should be resolved by consensus before starting.
+Anybody can propose a release (e.g. on the dev [mailing list](https://fluss.apache.org/community/welcome/)), giving a short rationale and nominating a committer as Release Manager (including themselves). Any objections should be resolved by consensus before starting.
 
 **Checklist to proceed**
 
@@ -360,7 +364,7 @@ svn commit -m "Remove RC after release fluss-rust ${RELEASE_VERSION}"
 2. Choose tag `$RELEASE_TAG`.
 3. Set the target to the release branch `release-${RELEASE_VERSION}` (i.e., the branch/commit used to create `$RELEASE_TAG`).
 4. Click **Generate release notes**, then add: notable changes, breaking changes (if any) from component upgrade docs, **official download link** (source archive and verification), and install instructions for fluss-rust, fluss-python, fluss-cpp.
-   - **Download link:** `https://downloads.apache.org/incubator/fluss/fluss-rust-${RELEASE_VERSION}/` (or the project download page). In the release description, include checksums and GPG verification steps.
+    - **Download link:** `https://downloads.apache.org/incubator/fluss/fluss-rust-${RELEASE_VERSION}/` (or the project download page). In the release description, include checksums and GPG verification steps.
 5. Click **Publish release**.
 
 ### 6. Update CHANGELOG.md on main
diff --git a/fluss-rust/docs/generate-release-note.md b/fluss-rust/website/docs/release/generate-release-note.md
similarity index 100%
rename from fluss-rust/docs/generate-release-note.md
rename to fluss-rust/website/docs/release/generate-release-note.md
diff --git a/fluss-rust/docs/verifying-a-release-candidate.md b/fluss-rust/website/docs/release/verifying-a-release-candidate.md
similarity index 100%
rename from fluss-rust/docs/verifying-a-release-candidate.md
rename to fluss-rust/website/docs/release/verifying-a-release-candidate.md
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index 47c9307de7..9cba2431b2 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -202,8 +202,9 @@ Complete API reference for the Fluss C++ client.
 
 When using `table.NewRow()`, the `Set()` method auto-routes to the correct type based on the schema:
 
-| Method                                                   |  Description                      |
+| Method                                                   | Description                       |
 |----------------------------------------------------------|-----------------------------------|
+| `Set(const std::string& name, std::nullptr_t)`           | Set field to null by column name  |
 | `Set(const std::string& name, bool value)`               | Set boolean by column name        |
 | `Set(const std::string& name, int32_t value)`            | Set integer by column name        |
 | `Set(const std::string& name, int64_t value)`            | Set big integer by column name    |
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index d5d0671542..0929ce68be 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -50,11 +50,12 @@ Complete API reference for the Fluss Rust client.
 
 ### Partition Operations
 
-| Method                                                                                                                   | Description         |
-|--------------------------------------------------------------------------------------------------------------------------|---------------------|
-| `async fn list_partition_infos(&self, table_path: &TablePath) -> Result<Vec<PartitionInfo>>`                             | List all partitions |
-| `async fn create_partition(&self, table_path: &TablePath, spec: &PartitionSpec, ignore_if_exists: bool) -> Result<()>`   | Create a partition  |
-| `async fn drop_partition(&self, table_path: &TablePath, spec: &PartitionSpec, ignore_if_not_exists: bool) -> Result<()>` | Drop a partition    |
+| Method                                                                                                                               | Description                     |
+|--------------------------------------------------------------------------------------------------------------------------------------|---------------------------------|
+| `async fn list_partition_infos(&self, table_path: &TablePath) -> Result<Vec<PartitionInfo>>`                                         | List all partitions             |
+| `async fn list_partition_infos_with_spec(&self, table_path: &TablePath, spec: Option<&PartitionSpec>) -> Result<Vec<PartitionInfo>>` | List partitions matching a spec |
+| `async fn create_partition(&self, table_path: &TablePath, spec: &PartitionSpec, ignore_if_exists: bool) -> Result<()>`               | Create a partition              |
+| `async fn drop_partition(&self, table_path: &TablePath, spec: &PartitionSpec, ignore_if_not_exists: bool) -> Result<()>`             | Drop a partition                |
 
 ### Offset Operations
 
diff --git a/fluss-rust/website/sidebars.ts b/fluss-rust/website/sidebars.ts
index 51bdd5cf7a..f6fbeaca64 100644
--- a/fluss-rust/website/sidebars.ts
+++ b/fluss-rust/website/sidebars.ts
@@ -17,7 +17,13 @@ const sidebars: SidebarsConfig = {
         'developer-guide/contributing',
       ],
     },
-    'release',
+    {
+      type: 'category',
+      label: 'Release',
+      items: [
+        {type: 'autogenerated', dirName: 'release'},
+      ],
+    },
   ],
 };
 
diff --git a/fluss-rust/docs/assets/release-guide.png b/fluss-rust/website/static/img/release-guide.png
similarity index 100%
rename from fluss-rust/docs/assets/release-guide.png
rename to fluss-rust/website/static/img/release-guide.png

From 919e218fb1b449ef21e0b9b7a3161f8c52c7d5a1 Mon Sep 17 00:00:00 2001
From: Nikhil Negi <95623427+niknegi@users.noreply.github.com>
Date: Tue, 17 Feb 2026 13:44:41 +0530
Subject: [PATCH 151/287] chore: added unit test cases and throw an exception
 when any field doesn't exist on RowType (#310)

---
 .../crates/fluss/src/metadata/datatype.rs     | 211 +++++++++++++++++-
 1 file changed, 209 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 66f68f445c..6d888d9de1 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -952,8 +952,12 @@ impl RowType {
     pub fn project_with_field_names(&self, field_names: &[String]) -> Result<RowType> {
         let indices: Vec<usize> = field_names
             .iter()
-            .filter_map(|pk| self.get_field_index(pk))
-            .collect();
+            .map(|name| {
+                self.get_field_index(name).ok_or_else(|| IllegalArgument {
+                    message: format!("Field '{}' does not exist in the row type", name),
+                })
+            })
+            .collect::<Result<Vec<_>>>()?;
 
         self.project(indices.as_slice())
     }
@@ -1424,6 +1428,10 @@ fn test_deeply_nested_types() {
     assert_eq!(nested.to_string(), "ARRAY<MAP<STRING, ROW<x INT, y INT>>>");
 }
 
+// ============================================================================
+// DecimalType validation tests
+// ============================================================================
+
 #[test]
 fn test_decimal_invalid_precision() {
     // DecimalType::with_nullable should return an error for invalid precision
@@ -1450,6 +1458,76 @@ fn test_decimal_invalid_scale() {
     );
 }
 
+// ============================================================================
+// DecimalType validation tests - edge cases
+// ============================================================================
+
+#[test]
+fn test_decimal_valid_precision_and_scale() {
+    // Valid: precision=10, scale=2
+    let result = DecimalType::with_nullable(true, 10, 2);
+    assert!(result.is_ok());
+    let decimal = result.unwrap();
+    assert_eq!(decimal.precision(), 10);
+    assert_eq!(decimal.scale(), 2);
+    // Nullable: should NOT contain "NOT NULL"
+    assert!(!decimal.to_string().contains("NOT NULL"));
+
+    // Valid: precision=38, scale=0
+    let result = DecimalType::with_nullable(true, 38, 0);
+    assert!(result.is_ok());
+    let decimal = result.unwrap();
+    assert_eq!(decimal.precision(), 38);
+    assert_eq!(decimal.scale(), 0);
+
+    // Valid: precision=1, scale=0
+    let result = DecimalType::with_nullable(false, 1, 0);
+    assert!(result.is_ok());
+    let decimal = result.unwrap();
+    assert_eq!(decimal.precision(), 1);
+    assert_eq!(decimal.scale(), 0);
+    // Non-nullable: should contain "NOT NULL"
+    assert!(decimal.to_string().contains("NOT NULL"));
+}
+
+#[test]
+fn test_decimal_invalid_precision_zero() {
+    // Invalid: precision=0 (edge case not covered by existing tests)
+    let result = DecimalType::with_nullable(true, 0, 0);
+    assert!(result.is_err());
+    assert!(
+        result
+            .unwrap_err()
+            .to_string()
+            .contains("Decimal precision must be between 1 and 38")
+    );
+}
+
+#[test]
+fn test_decimal_scale_equals_precision_boundary() {
+    // Boundary: precision=10, scale=10 (scale == precision is valid)
+    let result = DecimalType::with_nullable(true, 10, 10);
+    assert!(result.is_ok());
+    let decimal = result.unwrap();
+    assert_eq!(decimal.precision(), 10);
+    assert_eq!(decimal.scale(), 10);
+}
+
+// ============================================================================
+// TimeType validation tests
+// ============================================================================
+
+#[test]
+fn test_time_valid_precision() {
+    // Test all valid precision values 0 through 9
+    for precision in 0..=9 {
+        let result = TimeType::with_nullable(true, precision);
+        assert!(result.is_ok(), "precision {} should be valid", precision);
+        let time = result.unwrap();
+        assert_eq!(time.precision(), precision);
+    }
+}
+
 #[test]
 fn test_time_invalid_precision() {
     // TimeType::with_nullable should return an error for invalid precision
@@ -1463,6 +1541,21 @@ fn test_time_invalid_precision() {
     );
 }
 
+// ============================================================================
+// TimestampType validation tests
+// ============================================================================
+
+#[test]
+fn test_timestamp_valid_precision() {
+    // Test all valid precision values 0 through 9
+    for precision in 0..=9 {
+        let result = TimestampType::with_nullable(true, precision);
+        assert!(result.is_ok(), "precision {} should be valid", precision);
+        let timestamp_type = result.unwrap();
+        assert_eq!(timestamp_type.precision(), precision);
+    }
+}
+
 #[test]
 fn test_timestamp_invalid_precision() {
     // TimestampType::with_nullable should return an error for invalid precision
@@ -1488,3 +1581,117 @@ fn test_timestamp_ltz_invalid_precision() {
             .contains("Timestamp with local time zone precision must be between 0 and 9")
     );
 }
+
+// ============================================================================
+// RowType projection tests
+// ============================================================================
+
+#[test]
+fn test_row_type_project_valid_indices() {
+    // Create a 3-column row type
+    let row_type = RowType::with_data_types_and_field_names(
+        vec![DataTypes::int(), DataTypes::string(), DataTypes::bigint()],
+        vec!["id", "name", "age"],
+    );
+
+    // Valid projection by indices: [0, 2]
+    let projected = row_type.project(&[0, 2]).unwrap();
+    assert_eq!(projected.fields().len(), 2);
+    assert_eq!(projected.fields()[0].name, "id");
+    assert_eq!(projected.fields()[1].name, "age");
+}
+
+#[test]
+fn test_row_type_project_empty_indices() {
+    // Create a 3-column row type
+    let row_type = RowType::with_data_types_and_field_names(
+        vec![DataTypes::int(), DataTypes::string(), DataTypes::bigint()],
+        vec!["id", "name", "age"],
+    );
+
+    // Projection with an empty indices array should yield an empty RowType
+    let projected = row_type.project(&[]).unwrap();
+    assert_eq!(projected.fields().len(), 0);
+}
+
+#[test]
+fn test_row_type_project_with_field_names_valid() {
+    // Create a 3-column row type
+    let row_type = RowType::with_data_types_and_field_names(
+        vec![DataTypes::int(), DataTypes::string(), DataTypes::bigint()],
+        vec!["id", "name", "age"],
+    );
+
+    // Valid projection by names: ["id", "name"]
+    let projected = row_type
+        .project_with_field_names(&["id".to_string(), "name".to_string()])
+        .unwrap();
+    assert_eq!(projected.fields().len(), 2);
+    assert_eq!(projected.fields()[0].name, "id");
+    assert_eq!(projected.fields()[1].name, "name");
+}
+
+#[test]
+fn test_row_type_project_index_out_of_bounds() {
+    // Create a 3-column row type
+    let row_type = RowType::with_data_types_and_field_names(
+        vec![DataTypes::int(), DataTypes::string(), DataTypes::bigint()],
+        vec!["id", "name", "age"],
+    );
+
+    // Error: index out of bounds
+    let result = row_type.project(&[0, 5]);
+    assert!(result.is_err());
+    assert!(
+        result
+            .unwrap_err()
+            .to_string()
+            .contains("invalid field position: 5")
+    );
+}
+
+#[test]
+fn test_row_type_project_with_field_names_nonexistent() {
+    // Create a 3-column row type
+    let row_type = RowType::with_data_types_and_field_names(
+        vec![DataTypes::int(), DataTypes::string(), DataTypes::bigint()],
+        vec!["id", "name", "age"],
+    );
+
+    // Error: a non-existent field name must yield an Err whose message names the missing field
+    let result = row_type.project_with_field_names(&["nonexistent".to_string()]);
+    assert!(result.is_err());
+    assert!(
+        result
+            .unwrap_err()
+            .to_string()
+            .contains("Field 'nonexistent' does not exist in the row type")
+    );
+
+    // Mixed existing and non-existing names: the projection still fails and names the missing field
+    let result = row_type.project_with_field_names(&["id".to_string(), "nonexistent".to_string()]);
+    assert!(result.is_err());
+    assert!(
+        result
+            .unwrap_err()
+            .to_string()
+            .contains("Field 'nonexistent' does not exist in the row type")
+    );
+}
+
+#[test]
+fn test_row_type_project_duplicate_indices() {
+    // Create a 3-column row type
+    let row_type = RowType::with_data_types_and_field_names(
+        vec![DataTypes::int(), DataTypes::string(), DataTypes::bigint()],
+        vec!["id", "name", "age"],
+    );
+
+    // Projection with duplicate indices: [0, 0, 1]
+    // This documents the expected behavior - duplicates are allowed
+    let projected = row_type.project(&[0, 0, 1]).unwrap();
+    assert_eq!(projected.fields().len(), 3);
+    assert_eq!(projected.fields()[0].name, "id");
+    assert_eq!(projected.fields()[1].name, "id");
+    assert_eq!(projected.fields()[2].name, "name");
+}

From 1720ca046c9e66688121464b3ef938ee24ca9fa2 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Tue, 17 Feb 2026 08:48:55 +0000
Subject: [PATCH 152/287] chore: avoid data copy in CPP bindings (#330)

---
 fluss-rust/bindings/cpp/examples/example.cpp  | 185 +++-
 .../bindings/cpp/examples/kv_example.cpp      | 166 ++--
 fluss-rust/bindings/cpp/include/fluss.hpp     | 590 ++++++------
 fluss-rust/bindings/cpp/src/ffi_converter.hpp | 133 +--
 fluss-rust/bindings/cpp/src/lib.rs            | 906 +++++++++++++++---
 fluss-rust/bindings/cpp/src/table.cpp         | 601 ++++++++++--
 fluss-rust/bindings/cpp/src/types.rs          | 627 +++---------
 7 files changed, 1973 insertions(+), 1235 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index 2b7f331e66..ea966d8e6b 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -15,7 +15,10 @@
 // specific language governing permissions and limitations
 // under the License.
 
+#include <arrow/array/builder_binary.h>
+#include <arrow/array/builder_primitive.h>
 #include <arrow/record_batch.h>
+#include <arrow/type.h>
 
 #include <chrono>
 #include <iostream>
@@ -140,6 +143,18 @@ int main() {
         std::cout << "Row acknowledged by server" << std::endl;
     }
 
+    // Append a row with all fields null (matches Rust log_table.rs all_supported_datatypes)
+    {
+        fluss::GenericRow row;
+        size_t field_count = 8;
+        for (size_t i = 0; i < field_count; ++i) {
+            row.SetNull(i);
+        }
+        check("append_null_row", writer.Append(row));
+    }
+    check("flush_null", writer.Flush());
+    std::cout << "Wrote row with all fields null" << std::endl;
+
     // 6) Full scan — verify all column types including temporal
     fluss::LogScanner scanner;
     check("new_log_scanner", table.NewScan().CreateLogScanner(scanner));
@@ -155,41 +170,63 @@ int main() {
 
     std::cout << "Scanned records: " << records.Size() << std::endl;
     bool scan_ok = true;
-    for (const auto& rec : records.records) {
-        if (rec.row.GetType(4) != fluss::DatumType::Date) {
+    bool found_null_row = false;
+    for (const auto& rec : records) {
+        // Check if this is the all-null row (matches Rust: is_null_at for every column)
+        if (rec.row.IsNull(0)) {
+            found_null_row = true;
+            for (size_t i = 0; i < rec.row.FieldCount(); ++i) {
+                if (!rec.row.IsNull(i)) {
+                    std::cerr << "ERROR: column " << i << " should be null" << std::endl;
+                    scan_ok = false;
+                }
+            }
+            std::cout << "  [null row] all " << rec.row.FieldCount() << " fields are null"
+                      << std::endl;
+            continue;
+        }
+
+        // Non-null rows: verify types
+        if (rec.row.GetType(4) != fluss::TypeId::Date) {
             std::cerr << "ERROR: field 4 expected Date, got "
                       << static_cast<int>(rec.row.GetType(4)) << std::endl;
             scan_ok = false;
         }
-        if (rec.row.GetType(5) != fluss::DatumType::Time) {
+        if (rec.row.GetType(5) != fluss::TypeId::Time) {
             std::cerr << "ERROR: field 5 expected Time, got "
                       << static_cast<int>(rec.row.GetType(5)) << std::endl;
             scan_ok = false;
         }
-        if (rec.row.GetType(6) != fluss::DatumType::TimestampNtz) {
-            std::cerr << "ERROR: field 6 expected TimestampNtz, got "
+        if (rec.row.GetType(6) != fluss::TypeId::Timestamp) {
+            std::cerr << "ERROR: field 6 expected Timestamp, got "
                       << static_cast<int>(rec.row.GetType(6)) << std::endl;
             scan_ok = false;
         }
-        if (rec.row.GetType(7) != fluss::DatumType::TimestampLtz) {
+        if (rec.row.GetType(7) != fluss::TypeId::TimestampLtz) {
             std::cerr << "ERROR: field 7 expected TimestampLtz, got "
                       << static_cast<int>(rec.row.GetType(7)) << std::endl;
             scan_ok = false;
         }
 
-        auto date = rec.row.GetDate(4);
-        auto time = rec.row.GetTime(5);
-        auto ts_ntz = rec.row.GetTimestamp(6);
-        auto ts_ltz = rec.row.GetTimestamp(7);
+        // Name-based getters (equivalent to index-based above)
+        auto date = rec.row.GetDate("event_date");
+        auto time = rec.row.GetTime("event_time");
+        auto ts_ntz = rec.row.GetTimestamp("created_at");
+        auto ts_ltz = rec.row.GetTimestamp("updated_at");
 
-        std::cout << "  id=" << rec.row.GetInt32(0) << " name=" << rec.row.GetString(1)
-                  << " score=" << rec.row.GetFloat32(2) << " age=" << rec.row.GetInt32(3)
+        std::cout << "  id=" << rec.row.GetInt32("id") << " name=" << rec.row.GetString("name")
+                  << " score=" << rec.row.GetFloat32("score") << " age=" << rec.row.GetInt32("age")
                   << " date=" << date.Year() << "-" << date.Month() << "-" << date.Day()
                   << " time=" << time.Hour() << ":" << time.Minute() << ":" << time.Second()
                   << " ts_ntz=" << ts_ntz.epoch_millis << " ts_ltz=" << ts_ltz.epoch_millis << "+"
                   << ts_ltz.nano_of_millisecond << "ns" << std::endl;
     }
 
+    if (!found_null_row) {
+        std::cerr << "ERROR: did not find the all-null row" << std::endl;
+        scan_ok = false;
+    }
+
     if (!scan_ok) {
         std::cerr << "Full scan type verification FAILED!" << std::endl;
         std::exit(1);
@@ -210,18 +247,23 @@ int main() {
     check("poll_projected", projected_scanner.Poll(5000, projected_records));
 
     std::cout << "Projected records: " << projected_records.Size() << std::endl;
-    for (const auto& rec : projected_records.records) {
+    for (const auto& rec : projected_records) {
         if (rec.row.FieldCount() != 2) {
             std::cerr << "ERROR: expected 2 fields, got " << rec.row.FieldCount() << std::endl;
             scan_ok = false;
             continue;
         }
-        if (rec.row.GetType(0) != fluss::DatumType::Int32) {
-            std::cerr << "ERROR: projected field 0 expected Int32, got "
+        // Skip the all-null row
+        if (rec.row.IsNull(0)) {
+            std::cout << "  [null row] skipped" << std::endl;
+            continue;
+        }
+        if (rec.row.GetType(0) != fluss::TypeId::Int) {
+            std::cerr << "ERROR: projected field 0 expected Int, got "
                       << static_cast<int>(rec.row.GetType(0)) << std::endl;
             scan_ok = false;
         }
-        if (rec.row.GetType(1) != fluss::DatumType::TimestampLtz) {
+        if (rec.row.GetType(1) != fluss::TypeId::TimestampLtz) {
             std::cerr << "ERROR: projected field 1 expected TimestampLtz, got "
                       << static_cast<int>(rec.row.GetType(1)) << std::endl;
             scan_ok = false;
@@ -246,18 +288,23 @@ int main() {
     check("poll_name_projected", name_projected_scanner.Poll(5000, name_projected_records));
 
     std::cout << "Name-projected records: " << name_projected_records.Size() << std::endl;
-    for (const auto& rec : name_projected_records.records) {
+    for (const auto& rec : name_projected_records) {
         if (rec.row.FieldCount() != 2) {
             std::cerr << "ERROR: expected 2 fields, got " << rec.row.FieldCount() << std::endl;
             scan_ok = false;
             continue;
         }
-        if (rec.row.GetType(0) != fluss::DatumType::Int32) {
-            std::cerr << "ERROR: name-projected field 0 expected Int32, got "
+        // Skip the all-null row
+        if (rec.row.IsNull(0)) {
+            std::cout << "  [null row] skipped" << std::endl;
+            continue;
+        }
+        if (rec.row.GetType(0) != fluss::TypeId::Int) {
+            std::cerr << "ERROR: name-projected field 0 expected Int, got "
                       << static_cast<int>(rec.row.GetType(0)) << std::endl;
             scan_ok = false;
         }
-        if (rec.row.GetType(1) != fluss::DatumType::TimestampLtz) {
+        if (rec.row.GetType(1) != fluss::TypeId::TimestampLtz) {
             std::cerr << "ERROR: name-projected field 1 expected TimestampLtz, got "
                       << static_cast<int>(rec.row.GetType(1)) << std::endl;
             scan_ok = false;
@@ -404,7 +451,84 @@ int main() {
         }
     }
 
-    // 12) Decimal support example
+    // 12) AppendArrowBatch — write an Arrow RecordBatch directly
+    std::cout << "\n=== AppendArrowBatch Example ===" << std::endl;
+    {
+        // Build an Arrow RecordBatch matching sample_table_cpp_v1 schema:
+        //   id:INT, name:STRING, score:FLOAT, age:INT,
+        //   event_date:DATE, event_time:TIME, created_at:TIMESTAMP, updated_at:TIMESTAMP_LTZ
+        auto arrow_schema = arrow::schema({
+            arrow::field("id", arrow::int32()),
+            arrow::field("name", arrow::utf8()),
+            arrow::field("score", arrow::float32()),
+            arrow::field("age", arrow::int32()),
+            arrow::field("event_date", arrow::date32()),
+            arrow::field("event_time", arrow::time32(arrow::TimeUnit::MILLI)),
+            arrow::field("created_at", arrow::timestamp(arrow::TimeUnit::MICRO)),
+            arrow::field("updated_at", arrow::timestamp(arrow::TimeUnit::MICRO)),
+        });
+
+        arrow::Int32Builder id_builder;
+        arrow::StringBuilder name_builder;
+        arrow::FloatBuilder score_builder;
+        arrow::Int32Builder age_builder;
+        arrow::Date32Builder date_builder;
+        arrow::Time32Builder time_builder(arrow::time32(arrow::TimeUnit::MILLI),
+                                          arrow::default_memory_pool());
+        arrow::TimestampBuilder ts_ntz_builder(arrow::timestamp(arrow::TimeUnit::MICRO),
+                                               arrow::default_memory_pool());
+        arrow::TimestampBuilder ts_ltz_builder(arrow::timestamp(arrow::TimeUnit::MICRO),
+                                               arrow::default_memory_pool());
+
+        // Row 1
+        (void)id_builder.Append(200);
+        (void)name_builder.Append("ArrowAlice");
+        (void)score_builder.Append(88.5f);
+        (void)age_builder.Append(28);
+        (void)date_builder.Append(19888);               // days since epoch (19888 = 2024-06-14)
+        (void)time_builder.Append(52245000);            // 14:30:45 in ms
+        (void)ts_ntz_builder.Append(1718467200000000);  // micros
+        (void)ts_ltz_builder.Append(1718467200000000);
+
+        // Row 2
+        (void)id_builder.Append(201);
+        (void)name_builder.Append("ArrowBob");
+        (void)score_builder.Append(91.3f);
+        (void)age_builder.Append(33);
+        (void)date_builder.Append(20089);    // 2025-01-01
+        (void)time_builder.Append(3600000);  // 01:00:00
+        (void)ts_ntz_builder.Append(1735689600000000);
+        (void)ts_ltz_builder.Append(1735689600000000);
+
+        auto batch_result = arrow::RecordBatch::Make(
+            arrow_schema, 2,
+            {id_builder.Finish().ValueOrDie(), name_builder.Finish().ValueOrDie(),
+             score_builder.Finish().ValueOrDie(), age_builder.Finish().ValueOrDie(),
+             date_builder.Finish().ValueOrDie(), time_builder.Finish().ValueOrDie(),
+             ts_ntz_builder.Finish().ValueOrDie(), ts_ltz_builder.Finish().ValueOrDie()});
+
+        check("append_arrow_batch", writer.AppendArrowBatch(batch_result));
+        check("flush_arrow", writer.Flush());
+        std::cout << "Wrote 2 rows via AppendArrowBatch" << std::endl;
+
+        // Verify by scanning from latest offsets
+        fluss::LogScanner arrow_write_scanner;
+        check("new_arrow_write_scanner", table.NewScan().CreateLogScanner(arrow_write_scanner));
+        for (const auto& [bid, off] : latest_offsets) {
+            check("subscribe_arrow_write", arrow_write_scanner.Subscribe(bid, off));
+        }
+
+        fluss::ScanRecords arrow_write_records;
+        check("poll_arrow_write", arrow_write_scanner.Poll(5000, arrow_write_records));
+        std::cout << "Scanned " << arrow_write_records.Size()
+                  << " records written via AppendArrowBatch:" << std::endl;
+        for (const auto& rec : arrow_write_records) {
+            std::cout << "  id=" << rec.row.GetInt32(0) << " name=" << rec.row.GetString(1)
+                      << " score=" << rec.row.GetFloat32(2) << std::endl;
+        }
+    }
+
+    // 13) Decimal support example
     std::cout << "\n=== Decimal Support Example ===" << std::endl;
 
     fluss::TablePath decimal_table_path("fluss", "decimal_table_cpp_v1");
@@ -469,12 +593,12 @@ int main() {
 
     std::cout << "Scanned decimal records: " << decimal_records.Size() << std::endl;
     for (const auto& rec : decimal_records) {
-        std::cout << "  id=" << rec.row.GetInt32(0) << " price=" << rec.row.DecimalToString(1)
-                  << " amount=" << rec.row.DecimalToString(2)
+        std::cout << "  id=" << rec.row.GetInt32(0) << " price=" << rec.row.GetDecimalString(1)
+                  << " amount=" << rec.row.GetDecimalString(2)
                   << " is_decimal=" << rec.row.IsDecimal(1) << std::endl;
     }
 
-    // 13) Partitioned table example
+    // 14) Partitioned table example
     std::cout << "\n=== Partitioned Table Example ===" << std::endl;
 
     fluss::TablePath partitioned_table_path("fluss", "partitioned_table_cpp_v1");
@@ -553,7 +677,7 @@ int main() {
     check("flush_partitioned", partitioned_writer.Flush());
     std::cout << "Wrote " << partitioned_rows.size() << " rows to partitioned table" << std::endl;
 
-    // 13.1) subscribe_partition_buckets: subscribe to each partition individually
+    // 14.1) subscribe_partition_buckets: subscribe to each partition individually
     std::cout << "\n--- Testing SubscribePartitionBuckets ---" << std::endl;
     fluss::LogScanner partition_scanner;
     check("new_partition_scanner", partitioned_table.NewScan().CreateLogScanner(partition_scanner));
@@ -570,12 +694,13 @@ int main() {
               << std::endl;
     for (size_t i = 0; i < partition_records.Size(); ++i) {
         const auto& rec = partition_records[i];
-        std::cout << "  Record " << i << ": id=" << rec.row.GetInt32(0)
-                  << ", region=" << rec.row.GetString(1) << ", value=" << rec.row.GetInt64(2)
-                  << std::endl;
+        std::cout << "  Record " << i << ": partition_id="
+                  << (rec.partition_id.has_value() ? std::to_string(*rec.partition_id) : "none")
+                  << ", id=" << rec.row.GetInt32(0) << ", region=" << rec.row.GetString(1)
+                  << ", value=" << rec.row.GetInt64(2) << std::endl;
     }
 
-    // 13.2) subscribe_partition_buckets: batch subscribe to all partitions at once
+    // 14.2) subscribe_partition_buckets: batch subscribe to all partitions at once
     std::cout << "\n--- Testing SubscribePartitionBuckets (batch) ---" << std::endl;
     fluss::LogScanner partition_batch_scanner;
     check("new_partition_batch_scanner",
@@ -601,7 +726,7 @@ int main() {
                   << std::endl;
     }
 
-    // 13.3) UnsubscribePartition: unsubscribe from one partition, verify remaining
+    // 14.3) UnsubscribePartition: unsubscribe from one partition, verify remaining
     std::cout << "\n--- Testing UnsubscribePartition ---" << std::endl;
     fluss::LogScanner unsub_partition_scanner;
     check("new_unsub_partition_scanner",
diff --git a/fluss-rust/bindings/cpp/examples/kv_example.cpp b/fluss-rust/bindings/cpp/examples/kv_example.cpp
index b24a459d77..497894f5cc 100644
--- a/fluss-rust/bindings/cpp/examples/kv_example.cpp
+++ b/fluss-rust/bindings/cpp/examples/kv_example.cpp
@@ -138,19 +138,19 @@ int main() {
         auto pk_row = kv_table.NewRow();
         pk_row.Set("user_id", 1);
 
-        bool found = false;
-        fluss::GenericRow result_row;
-        check("lookup_1", lookuper.Lookup(pk_row, found, result_row));
-        if (found) {
-            auto date = result_row.GetDate(5);
-            auto time = result_row.GetTime(6);
-            auto created = result_row.GetTimestamp(7);
-            auto seen = result_row.GetTimestamp(8);
+        fluss::LookupResult result;
+        check("lookup_1", lookuper.Lookup(pk_row, result));
+        if (result.Found()) {
+            // Name-based getters — same data as index-based but self-documenting
+            auto date = result.GetDate("birth_date");
+            auto time = result.GetTime("login_time");
+            auto created = result.GetTimestamp("created_at");
+            auto seen = result.GetTimestamp("last_seen");
             std::cout << "Found user_id=1:"
-                      << "\n  name=" << result_row.GetString(1)
-                      << "\n  email=" << result_row.GetString(2)
-                      << "\n  score=" << result_row.GetFloat32(3)
-                      << "\n  balance=" << result_row.DecimalToString(4)
+                      << "\n  name=" << result.GetString("name")
+                      << "\n  email=" << result.GetString("email")
+                      << "\n  score=" << result.GetFloat32("score")
+                      << "\n  balance=" << result.GetDecimalString("balance")
                       << "\n  birth_date=" << date.Year() << "-" << date.Month() << "-"
                       << date.Day() << "\n  login_time=" << time.Hour() << ":" << time.Minute()
                       << ":" << time.Second() << "\n  created_at(ms)=" << created.epoch_millis
@@ -166,10 +166,9 @@ int main() {
         auto pk_row = kv_table.NewRow();
         pk_row.Set("user_id", 999);
 
-        bool found = false;
-        fluss::GenericRow result_row;
-        check("lookup_999", lookuper.Lookup(pk_row, found, result_row));
-        if (!found) {
+        fluss::LookupResult result;
+        check("lookup_999", lookuper.Lookup(pk_row, result));
+        if (!result.Found()) {
             std::cout << "user_id=999 not found (expected)" << std::endl;
         } else {
             std::cerr << "ERROR: Expected user_id=999 to not be found" << std::endl;
@@ -177,6 +176,57 @@ int main() {
         }
     }
 
+    // 4b) Null row round-trip (matches Rust kv_table.rs all_supported_datatypes)
+    //     Upsert a row with all non-PK fields null, lookup, verify IsNull
+    std::cout << "\n--- Null Row Round-Trip ---" << std::endl;
+    {
+        auto row = kv_table.NewRow();
+        row.Set("user_id", 100);
+        row.SetNull(1);  // name
+        row.SetNull(2);  // email
+        row.SetNull(3);  // score
+        row.SetNull(4);  // balance
+        row.SetNull(5);  // birth_date
+        row.SetNull(6);  // login_time
+        row.SetNull(7);  // created_at
+        row.SetNull(8);  // last_seen
+        fluss::WriteResult wr;
+        check("upsert_null_row", upsert_writer.Upsert(row, wr));
+        check("upsert_null_row_wait", wr.Wait());
+    }
+    {
+        auto pk_row = kv_table.NewRow();
+        pk_row.Set("user_id", 100);
+
+        fluss::LookupResult result;
+        check("lookup_null_row", lookuper.Lookup(pk_row, result));
+        if (!result.Found()) {
+            std::cerr << "ERROR: Expected to find user_id=100 (null row)" << std::endl;
+            std::exit(1);
+        }
+
+        // Verify PK is not null
+        if (result.IsNull(0)) {
+            std::cerr << "ERROR: PK (user_id) should not be null" << std::endl;
+            std::exit(1);
+        }
+
+        // Verify all nullable columns are null (matches Rust is_null_at assertions)
+        bool null_ok = true;
+        for (size_t i = 1; i < result.FieldCount(); ++i) {
+            if (!result.IsNull(i)) {
+                std::cerr << "ERROR: column " << i << " should be null" << std::endl;
+                null_ok = false;
+            }
+        }
+        if (null_ok) {
+            std::cout << "Null row verified: all " << (result.FieldCount() - 1)
+                      << " nullable fields are null" << std::endl;
+        } else {
+            std::exit(1);
+        }
+    }
+
     // 5) Update via upsert (overwrite existing key)
     std::cout << "\n--- Update via Upsert ---" << std::endl;
     {
@@ -200,13 +250,12 @@ int main() {
         auto pk_row = kv_table.NewRow();
         pk_row.Set("user_id", 1);
 
-        bool found = false;
-        fluss::GenericRow result_row;
-        check("lookup_updated", lookuper.Lookup(pk_row, found, result_row));
-        if (found && result_row.GetString(1) == "Alice Updated") {
-            std::cout << "Update verified: name=" << result_row.GetString(1)
-                      << " balance=" << result_row.DecimalToString(4)
-                      << " last_seen(ms)=" << result_row.GetTimestamp(8).epoch_millis << std::endl;
+        fluss::LookupResult result;
+        check("lookup_updated", lookuper.Lookup(pk_row, result));
+        if (result.Found() && result.GetString(1) == "Alice Updated") {
+            std::cout << "Update verified: name=" << result.GetString(1)
+                      << " balance=" << result.GetDecimalString(4)
+                      << " last_seen(ms)=" << result.GetTimestamp(8).epoch_millis << std::endl;
         } else {
             std::cerr << "ERROR: Update verification failed" << std::endl;
             std::exit(1);
@@ -229,10 +278,9 @@ int main() {
         auto pk_row = kv_table.NewRow();
         pk_row.Set("user_id", 2);
 
-        bool found = false;
-        fluss::GenericRow result_row;
-        check("lookup_deleted", lookuper.Lookup(pk_row, found, result_row));
-        if (!found) {
+        fluss::LookupResult result;
+        check("lookup_deleted", lookuper.Lookup(pk_row, result));
+        if (!result.Found()) {
             std::cout << "Delete verified: user_id=2 not found" << std::endl;
         } else {
             std::cerr << "ERROR: Expected user_id=2 to be deleted" << std::endl;
@@ -263,15 +311,14 @@ int main() {
         auto pk_row = kv_table.NewRow();
         pk_row.Set("user_id", 3);
 
-        bool found = false;
-        fluss::GenericRow result_row;
-        check("lookup_partial", lookuper.Lookup(pk_row, found, result_row));
-        if (found) {
+        fluss::LookupResult result;
+        check("lookup_partial", lookuper.Lookup(pk_row, result));
+        if (result.Found()) {
             std::cout << "Partial update verified:"
-                      << "\n  name=" << result_row.GetString(1) << " (unchanged)"
-                      << "\n  balance=" << result_row.DecimalToString(4) << " (updated)"
-                      << "\n  last_seen(ms)=" << result_row.GetTimestamp(8).epoch_millis
-                      << " (updated)" << std::endl;
+                      << "\n  name=" << result.GetString(1) << " (unchanged)"
+                      << "\n  balance=" << result.GetDecimalString(4) << " (updated)"
+                      << "\n  last_seen(ms)=" << result.GetTimestamp(8).epoch_millis << " (updated)"
+                      << std::endl;
         } else {
             std::cerr << "ERROR: Expected to find user_id=3" << std::endl;
             std::exit(1);
@@ -302,14 +349,13 @@ int main() {
         auto pk_row = kv_table.NewRow();
         pk_row.Set("user_id", 3);
 
-        bool found = false;
-        fluss::GenericRow result_row;
-        check("lookup_partial_idx", lookuper.Lookup(pk_row, found, result_row));
-        if (found) {
+        fluss::LookupResult result;
+        check("lookup_partial_idx", lookuper.Lookup(pk_row, result));
+        if (result.Found()) {
             std::cout << "Partial update by indices verified:"
-                      << "\n  name=" << result_row.GetString(1) << " (updated)"
-                      << "\n  balance=" << result_row.DecimalToString(4) << " (unchanged)"
-                      << "\n  last_seen(ms)=" << result_row.GetTimestamp(8).epoch_millis
+                      << "\n  name=" << result.GetString(1) << " (updated)"
+                      << "\n  balance=" << result.GetDecimalString(4) << " (unchanged)"
+                      << "\n  last_seen(ms)=" << result.GetTimestamp(8).epoch_millis
                       << " (unchanged)" << std::endl;
         } else {
             std::cerr << "ERROR: Expected to find user_id=3" << std::endl;
@@ -389,10 +435,9 @@ int main() {
         pk.Set("region", td.region);
         pk.Set("user_id", td.user_id);
 
-        bool found = false;
-        fluss::GenericRow result;
-        check("partitioned_lookup", partitioned_lookuper.Lookup(pk, found, result));
-        if (!found) {
+        fluss::LookupResult result;
+        check("partitioned_lookup", partitioned_lookuper.Lookup(pk, result));
+        if (!result.Found()) {
             std::cerr << "ERROR: Expected to find region=" << td.region << " user_id=" << td.user_id
                       << std::endl;
             std::exit(1);
@@ -420,10 +465,10 @@ int main() {
         auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", "US");
         pk.Set("user_id", 1);
-        bool found = false;
-        fluss::GenericRow result;
-        check("partitioned_lookup_updated", partitioned_lookuper.Lookup(pk, found, result));
-        if (!found || result.GetString(2) != "Gustave Updated" || result.GetInt64(3) != 999) {
+        fluss::LookupResult result;
+        check("partitioned_lookup_updated", partitioned_lookuper.Lookup(pk, result));
+        if (!result.Found() || result.GetString(2) != "Gustave Updated" ||
+            result.GetInt64(3) != 999) {
             std::cerr << "ERROR: Partition update verification failed" << std::endl;
             std::exit(1);
         }
@@ -436,10 +481,9 @@ int main() {
         auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", "UNKNOWN");
         pk.Set("user_id", 1);
-        bool found = false;
-        fluss::GenericRow result;
-        check("partitioned_lookup_unknown", partitioned_lookuper.Lookup(pk, found, result));
-        if (found) {
+        fluss::LookupResult result;
+        check("partitioned_lookup_unknown", partitioned_lookuper.Lookup(pk, result));
+        if (result.Found()) {
             std::cerr << "ERROR: Expected UNKNOWN partition lookup to return not found"
                       << std::endl;
             std::exit(1);
@@ -460,10 +504,9 @@ int main() {
         auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", "EU");
         pk.Set("user_id", 1);
-        bool found = false;
-        fluss::GenericRow result;
-        check("partitioned_lookup_deleted", partitioned_lookuper.Lookup(pk, found, result));
-        if (found) {
+        fluss::LookupResult result;
+        check("partitioned_lookup_deleted", partitioned_lookuper.Lookup(pk, result));
+        if (result.Found()) {
             std::cerr << "ERROR: Expected EU/1 to be deleted" << std::endl;
             std::exit(1);
         }
@@ -475,10 +518,9 @@ int main() {
         auto pk = partitioned_kv_table.NewRow();
         pk.Set("region", "EU");
         pk.Set("user_id", 2);
-        bool found = false;
-        fluss::GenericRow result;
-        check("partitioned_lookup_eu2", partitioned_lookuper.Lookup(pk, found, result));
-        if (!found || result.GetString(2) != "Maelle") {
+        fluss::LookupResult result;
+        check("partitioned_lookup_eu2", partitioned_lookuper.Lookup(pk, result));
+        if (!result.Found() || result.GetString(2) != "Maelle") {
             std::cerr << "ERROR: Expected EU/2 (Maelle) to still exist" << std::endl;
             std::exit(1);
         }
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 30a8636baf..00b5000eef 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -23,9 +23,12 @@
 #include <cstdint>
 #include <limits>
 #include <memory>
+#include <optional>
 #include <stdexcept>
 #include <string>
+#include <string_view>
 #include <unordered_map>
+#include <utility>
 #include <vector>
 
 // Forward declare Arrow classes to avoid including heavy Arrow headers in header
@@ -44,6 +47,9 @@ struct WriteResult;
 struct LogScanner;
 struct UpsertWriter;
 struct Lookuper;
+struct ScanResultInner;
+struct GenericRowInner;
+struct LookupResultInner;
 }  // namespace ffi
 
 /// Named constants for Fluss API error codes.
@@ -232,7 +238,16 @@ struct Timestamp {
     }
 };
 
+enum class ChangeType {
+    AppendOnly = 0,
+    Insert = 1,
+    UpdateBefore = 2,
+    UpdateAfter = 3,
+    Delete = 4,
+};
+
 enum class TypeId {
+    Unknown = 0,
     Boolean = 1,
     TinyInt = 2,
     SmallInt = 3,
@@ -247,6 +262,8 @@ enum class TypeId {
     Timestamp = 12,
     TimestampLtz = 13,
     Decimal = 14,
+    Char = 15,
+    Binary = 16,
 };
 
 class DataType {
@@ -274,6 +291,8 @@ class DataType {
     static DataType Decimal(int32_t precision, int32_t scale) {
         return DataType(TypeId::Decimal, precision, scale);
     }
+    static DataType Char(int32_t length) { return DataType(TypeId::Char, length, 0); }
+    static DataType Binary(int32_t length) { return DataType(TypeId::Binary, length, 0); }
 
     TypeId id() const { return id_; }
     int32_t precision() const { return precision_; }
@@ -285,24 +304,6 @@ class DataType {
     int32_t scale_{0};
 };
 
-enum class DatumType {
-    Null = 0,
-    Bool = 1,
-    Int32 = 2,
-    Int64 = 3,
-    Float32 = 4,
-    Float64 = 5,
-    String = 6,
-    Bytes = 7,
-    DecimalI64 = 8,
-    DecimalI128 = 9,
-    DecimalString = 10,
-    Date = 11,
-    Time = 12,
-    TimestampNtz = 13,
-    TimestampLtz = 14,
-};
-
 constexpr int64_t EARLIEST_OFFSET = -2;
 
 enum class OffsetType {
@@ -376,6 +377,7 @@ struct TableDescriptor {
     int32_t bucket_count{0};
     std::vector<std::string> bucket_keys;
     std::unordered_map<std::string, std::string> properties;
+    std::unordered_map<std::string, std::string> custom_properties;
     std::string comment;
 
     class Builder {
@@ -405,6 +407,19 @@ struct TableDescriptor {
             return *this;
         }
 
+        Builder& SetCustomProperty(std::string key, std::string value) {
+            custom_properties_[std::move(key)] = std::move(value);
+            return *this;
+        }
+
+        Builder& SetLogFormat(std::string format) {
+            return SetProperty("table.log.format", std::move(format));
+        }
+
+        Builder& SetKvFormat(std::string format) {
+            return SetProperty("table.kv.format", std::move(format));
+        }
+
         Builder& SetComment(std::string comment) {
             comment_ = std::move(comment);
             return *this;
@@ -413,7 +428,8 @@ struct TableDescriptor {
         TableDescriptor Build() {
             return TableDescriptor{std::move(schema_),     std::move(partition_keys_),
                                    bucket_count_,          std::move(bucket_keys_),
-                                   std::move(properties_), std::move(comment_)};
+                                   std::move(properties_), std::move(custom_properties_),
+                                   std::move(comment_)};
         }
 
        private:
@@ -422,6 +438,7 @@ struct TableDescriptor {
         int32_t bucket_count_{0};
         std::vector<std::string> bucket_keys_;
         std::unordered_map<std::string, std::string> properties_;
+        std::unordered_map<std::string, std::string> custom_properties_;
         std::string comment_;
     };
 
@@ -441,291 +458,85 @@ struct TableInfo {
     bool has_primary_key;
     bool is_partitioned;
     std::unordered_map<std::string, std::string> properties;
+    std::unordered_map<std::string, std::string> custom_properties;
     std::string comment;
     Schema schema;
 };
 
 namespace detail {
-struct FfiAccess;
-}
-
-struct Datum {
-    friend struct GenericRow;
-    friend struct detail::FfiAccess;
+struct ColumnInfo {
+    size_t index;
+    TypeId type_id;
+};
+using ColumnMap = std::unordered_map<std::string, ColumnInfo>;
 
-    static Datum Null() { return {}; }
-    static Datum Bool(bool v) {
-        Datum d;
-        d.type = DatumType::Bool;
-        d.bool_val = v;
-        return d;
-    }
-    static Datum Int32(int32_t v) {
-        Datum d;
-        d.type = DatumType::Int32;
-        d.i32_val = v;
-        return d;
-    }
-    static Datum Int64(int64_t v) {
-        Datum d;
-        d.type = DatumType::Int64;
-        d.i64_val = v;
-        return d;
+inline size_t ResolveColumn(const ColumnMap& map, const std::string& name) {
+    auto it = map.find(name);
+    if (it == map.end()) {
+        throw std::runtime_error("Unknown column '" + name + "'");
     }
-    static Datum Float32(float v) {
-        Datum d;
-        d.type = DatumType::Float32;
-        d.f32_val = v;
-        return d;
-    }
-    static Datum Float64(double v) {
-        Datum d;
-        d.type = DatumType::Float64;
-        d.f64_val = v;
-        return d;
-    }
-    static Datum String(std::string v) {
-        Datum d;
-        d.type = DatumType::String;
-        d.string_val = std::move(v);
-        return d;
-    }
-    static Datum Bytes(std::vector<uint8_t> v) {
-        Datum d;
-        d.type = DatumType::Bytes;
-        d.bytes_val = std::move(v);
-        return d;
-    }
-    static Datum Date(fluss::Date d) {
-        Datum dat;
-        dat.type = DatumType::Date;
-        dat.i32_val = d.days_since_epoch;
-        return dat;
-    }
-    static Datum Time(fluss::Time t) {
-        Datum dat;
-        dat.type = DatumType::Time;
-        dat.i32_val = t.millis_since_midnight;
-        return dat;
+    return it->second.index;
+}
+
+/// CRTP mixin that adds name-based getters to any class with index-based getters.
+/// Derived must provide: `size_t Resolve(const std::string&) const`
+/// and all the index-based getters (IsNull(idx), GetBool(idx), etc.).
+template <typename Derived>
+struct NamedGetters {
+    bool IsNull(const std::string& n) const { return Self().IsNull(Self().Resolve(n)); }
+    bool GetBool(const std::string& n) const { return Self().GetBool(Self().Resolve(n)); }
+    int32_t GetInt32(const std::string& n) const { return Self().GetInt32(Self().Resolve(n)); }
+    int64_t GetInt64(const std::string& n) const { return Self().GetInt64(Self().Resolve(n)); }
+    float GetFloat32(const std::string& n) const { return Self().GetFloat32(Self().Resolve(n)); }
+    double GetFloat64(const std::string& n) const { return Self().GetFloat64(Self().Resolve(n)); }
+    std::string_view GetString(const std::string& n) const {
+        return Self().GetString(Self().Resolve(n));
     }
-    static Datum TimestampNtz(fluss::Timestamp ts) {
-        Datum dat;
-        dat.type = DatumType::TimestampNtz;
-        dat.i64_val = ts.epoch_millis;
-        dat.i32_val = ts.nano_of_millisecond;
-        return dat;
+    std::pair<const uint8_t*, size_t> GetBytes(const std::string& n) const {
+        return Self().GetBytes(Self().Resolve(n));
     }
-    static Datum TimestampLtz(fluss::Timestamp ts) {
-        Datum dat;
-        dat.type = DatumType::TimestampLtz;
-        dat.i64_val = ts.epoch_millis;
-        dat.i32_val = ts.nano_of_millisecond;
-        return dat;
+    fluss::Date GetDate(const std::string& n) const { return Self().GetDate(Self().Resolve(n)); }
+    fluss::Time GetTime(const std::string& n) const { return Self().GetTime(Self().Resolve(n)); }
+    fluss::Timestamp GetTimestamp(const std::string& n) const {
+        return Self().GetTimestamp(Self().Resolve(n));
     }
-    // Stores the decimal string as-is. Rust side will parse via BigDecimal,
-    // look up (p,s) from the schema, validate, and create the Decimal.
-    static Datum DecimalString(std::string str) {
-        Datum d;
-        d.type = DatumType::DecimalString;
-        d.string_val = std::move(str);
-        return d;
+    std::string GetDecimalString(const std::string& n) const {
+        return Self().GetDecimalString(Self().Resolve(n));
     }
 
    private:
-    DatumType type{DatumType::Null};
-    bool bool_val{false};
-    int32_t i32_val{0};
-    int64_t i64_val{0};
-    float f32_val{0.0F};
-    double f64_val{0.0};
-    std::string string_val;
-    std::vector<uint8_t> bytes_val;
-    int32_t decimal_precision{0};  // Decimal: precision (total digits)
-    int32_t decimal_scale{0};      // Decimal: scale (digits after decimal point)
-    int64_t i128_hi{0};            // Decimal (i128): high 64 bits of unscaled value
-    int64_t i128_lo{0};            // Decimal (i128): low 64 bits of unscaled value
-
-    DatumType GetType() const { return type; }
-    bool IsNull() const { return type == DatumType::Null; }
-    bool GetBool() const { return bool_val; }
-    int32_t GetInt32() const { return i32_val; }
-    int64_t GetInt64() const { return i64_val; }
-    float GetFloat32() const { return f32_val; }
-    double GetFloat64() const { return f64_val; }
-    const std::string& GetString() const { return string_val; }
-    const std::vector<uint8_t>& GetBytes() const { return bytes_val; }
-    fluss::Date GetDate() const { return {i32_val}; }
-    fluss::Time GetTime() const { return {i32_val}; }
-    fluss::Timestamp GetTimestamp() const { return {i64_val, i32_val}; }
-
-    bool IsDecimal() const {
-        return type == DatumType::DecimalI64 || type == DatumType::DecimalI128 ||
-               type == DatumType::DecimalString;
-    }
-
-    std::string DecimalToString() const {
-        if (type == DatumType::DecimalI64) {
-            return FormatUnscaled64(i64_val, decimal_scale);
-        } else if (type == DatumType::DecimalI128) {
-            unsigned __int128 uval =
-                (static_cast<unsigned __int128>(static_cast<uint64_t>(i128_hi)) << 64) |
-                static_cast<unsigned __int128>(static_cast<uint64_t>(i128_lo));
-            __int128 val = static_cast<__int128>(uval);
-            return FormatUnscaled128(val, decimal_scale);
-        } else if (type == DatumType::DecimalString) {
-            return string_val;
-        }
-        return "";
-    }
-
-    static std::string FormatUnscaled64(int64_t unscaled, int32_t scale) {
-        bool negative = unscaled < 0;
-        uint64_t abs_val =
-            negative ? -static_cast<uint64_t>(unscaled) : static_cast<uint64_t>(unscaled);
-        std::string digits = std::to_string(abs_val);
-        if (scale <= 0) {
-            return (negative ? "-" : "") + digits;
-        }
-        while (static_cast<int32_t>(digits.size()) <= scale) {
-            digits = "0" + digits;
-        }
-        auto pos = digits.size() - static_cast<size_t>(scale);
-        return (negative ? "-" : "") + digits.substr(0, pos) + "." + digits.substr(pos);
-    }
-
-    static std::string FormatUnscaled128(__int128 val, int32_t scale) {
-        bool negative = val < 0;
-        unsigned __int128 abs_val =
-            negative ? -static_cast<unsigned __int128>(val) : static_cast<unsigned __int128>(val);
-        std::string digits;
-        if (abs_val == 0) {
-            digits = "0";
-        } else {
-            while (abs_val > 0) {
-                digits = static_cast<char>('0' + static_cast<int>(abs_val % 10)) + digits;
-                abs_val /= 10;
-            }
-        }
-        if (scale <= 0) {
-            return (negative ? "-" : "") + digits;
-        }
-        while (static_cast<int32_t>(digits.size()) <= scale) {
-            digits = "0" + digits;
-        }
-        auto pos = digits.size() - static_cast<size_t>(scale);
-        return (negative ? "-" : "") + digits.substr(0, pos) + "." + digits.substr(pos);
-    }
+    const Derived& Self() const { return static_cast<const Derived&>(*this); }
 };
+}  // namespace detail
 
-struct GenericRow {
-    friend struct detail::FfiAccess;
+class GenericRow {
+   public:
+    GenericRow();
+    explicit GenericRow(size_t field_count);
+    ~GenericRow() noexcept;
 
-    size_t FieldCount() const { return fields.size(); }
+    GenericRow(const GenericRow&) = delete;
+    GenericRow& operator=(const GenericRow&) = delete;
+    GenericRow(GenericRow&& other) noexcept;
+    GenericRow& operator=(GenericRow&& other) noexcept;
 
-    // ── Index-based getters ──────────────────────────────────────────
-    DatumType GetType(size_t idx) const { return GetField(idx).GetType(); }
-    bool IsNull(size_t idx) const { return GetField(idx).IsNull(); }
-    bool GetBool(size_t idx) const { return GetTypedField(idx, DatumType::Bool).GetBool(); }
-    int32_t GetInt32(size_t idx) const { return GetTypedField(idx, DatumType::Int32).GetInt32(); }
-    int64_t GetInt64(size_t idx) const { return GetTypedField(idx, DatumType::Int64).GetInt64(); }
-    float GetFloat32(size_t idx) const {
-        return GetTypedField(idx, DatumType::Float32).GetFloat32();
-    }
-    double GetFloat64(size_t idx) const {
-        return GetTypedField(idx, DatumType::Float64).GetFloat64();
-    }
-    const std::string& GetString(size_t idx) const {
-        return GetTypedField(idx, DatumType::String).GetString();
-    }
-    const std::vector<uint8_t>& GetBytes(size_t idx) const {
-        return GetTypedField(idx, DatumType::Bytes).GetBytes();
-    }
-    fluss::Date GetDate(size_t idx) const { return GetTypedField(idx, DatumType::Date).GetDate(); }
-    fluss::Time GetTime(size_t idx) const { return GetTypedField(idx, DatumType::Time).GetTime(); }
-    fluss::Timestamp GetTimestamp(size_t idx) const {
-        const auto& d = GetField(idx);
-        auto t = d.GetType();
-        if (t != DatumType::TimestampNtz && t != DatumType::TimestampLtz) {
-            throw std::runtime_error("GenericRow: field " + std::to_string(idx) +
-                                     " is not a Timestamp type");
-        }
-        return d.GetTimestamp();
-    }
-    bool IsDecimal(size_t idx) const { return GetField(idx).IsDecimal(); }
-    std::string DecimalToString(size_t idx) const {
-        const auto& d = GetField(idx);
-        if (!d.IsDecimal()) {
-            throw std::runtime_error("GenericRow: field " + std::to_string(idx) +
-                                     " is not a Decimal type");
-        }
-        return d.DecimalToString();
-    }
+    bool Available() const;
+    void Reset();
 
     // ── Index-based setters ──────────────────────────────────────────
-    void SetNull(size_t idx) {
-        EnsureSize(idx);
-        fields[idx] = Datum::Null();
-    }
-
-    void SetBool(size_t idx, bool v) {
-        EnsureSize(idx);
-        fields[idx] = Datum::Bool(v);
-    }
-
-    void SetInt32(size_t idx, int32_t v) {
-        EnsureSize(idx);
-        fields[idx] = Datum::Int32(v);
-    }
-
-    void SetInt64(size_t idx, int64_t v) {
-        EnsureSize(idx);
-        fields[idx] = Datum::Int64(v);
-    }
-
-    void SetFloat32(size_t idx, float v) {
-        EnsureSize(idx);
-        fields[idx] = Datum::Float32(v);
-    }
-
-    void SetFloat64(size_t idx, double v) {
-        EnsureSize(idx);
-        fields[idx] = Datum::Float64(v);
-    }
-
-    void SetString(size_t idx, std::string v) {
-        EnsureSize(idx);
-        fields[idx] = Datum::String(std::move(v));
-    }
-
-    void SetBytes(size_t idx, std::vector<uint8_t> v) {
-        EnsureSize(idx);
-        fields[idx] = Datum::Bytes(std::move(v));
-    }
-
-    void SetDate(size_t idx, fluss::Date d) {
-        EnsureSize(idx);
-        fields[idx] = Datum::Date(d);
-    }
-
-    void SetTime(size_t idx, fluss::Time t) {
-        EnsureSize(idx);
-        fields[idx] = Datum::Time(t);
-    }
-
-    void SetTimestampNtz(size_t idx, fluss::Timestamp ts) {
-        EnsureSize(idx);
-        fields[idx] = Datum::TimestampNtz(ts);
-    }
-
-    void SetTimestampLtz(size_t idx, fluss::Timestamp ts) {
-        EnsureSize(idx);
-        fields[idx] = Datum::TimestampLtz(ts);
-    }
-
-    void SetDecimal(size_t idx, const std::string& value) {
-        EnsureSize(idx);
-        fields[idx] = Datum::DecimalString(value);
-    }
+    void SetNull(size_t idx);
+    void SetBool(size_t idx, bool v);
+    void SetInt32(size_t idx, int32_t v);
+    void SetInt64(size_t idx, int64_t v);
+    void SetFloat32(size_t idx, float v);
+    void SetFloat64(size_t idx, double v);
+    void SetString(size_t idx, std::string v);
+    void SetBytes(size_t idx, std::vector<uint8_t> v);
+    void SetDate(size_t idx, fluss::Date d);
+    void SetTime(size_t idx, fluss::Time t);
+    void SetTimestampNtz(size_t idx, fluss::Timestamp ts);
+    void SetTimestampLtz(size_t idx, fluss::Timestamp ts);
+    void SetDecimal(size_t idx, const std::string& value);
 
     // ── Name-based setters (require schema — see Table::NewRow()) ───
     void Set(const std::string& name, std::nullptr_t) { SetNull(Resolve(name)); }
@@ -734,7 +545,7 @@ struct GenericRow {
     void Set(const std::string& name, int64_t v) { SetInt64(Resolve(name), v); }
     void Set(const std::string& name, float v) { SetFloat32(Resolve(name), v); }
     void Set(const std::string& name, double v) { SetFloat64(Resolve(name), v); }
-    // const char* overload to prevent "string literal" → bool conversion
+    // const char* overload to prevent "string literal" -> bool conversion
     void Set(const std::string& name, const char* v) {
         auto [idx, type] = ResolveColumn(name);
         if (type == TypeId::Decimal) {
@@ -776,13 +587,12 @@ struct GenericRow {
 
    private:
     friend class Table;
-    struct ColumnInfo {
-        size_t index;
-        TypeId type_id;
-    };
-    using ColumnMap = std::unordered_map<std::string, ColumnInfo>;
-    std::vector<Datum> fields;
-    std::shared_ptr<ColumnMap> column_map_;
+    friend class AppendWriter;
+    friend class UpsertWriter;
+    friend class Lookuper;
+
+    using ColumnInfo = detail::ColumnInfo;
+    using ColumnMap = detail::ColumnMap;
 
     size_t Resolve(const std::string& name) const { return ResolveColumn(name).index; }
 
@@ -799,48 +609,122 @@ struct GenericRow {
         return it->second;
     }
 
-    const Datum& GetField(size_t idx) const {
-        if (idx >= fields.size()) {
-            throw std::runtime_error("GenericRow: index " + std::to_string(idx) +
-                                     " out of bounds (size=" + std::to_string(fields.size()) + ")");
-        }
-        return fields[idx];
-    }
+    void Destroy() noexcept;
 
-    const Datum& GetTypedField(size_t idx, DatumType expected) const {
-        const auto& d = GetField(idx);
-        if (d.GetType() != expected) {
-            throw std::runtime_error("GenericRow: field " + std::to_string(idx) +
-                                     " type mismatch: expected " +
-                                     std::to_string(static_cast<int>(expected)) + ", got " +
-                                     std::to_string(static_cast<int>(d.GetType())));
-        }
-        return d;
-    }
+    ffi::GenericRowInner* inner_{nullptr};
+    std::shared_ptr<ColumnMap> column_map_;
+};
 
-    void EnsureSize(size_t idx) {
-        if (fields.size() <= idx) {
-            fields.resize(idx + 1);
+/// Read-only row view for scan results. Zero-copy access to string and bytes data.
+///
+/// WARNING: RowView borrows from ScanRecords. It must not outlive the ScanRecords
+/// that produced it (similar to std::string_view borrowing from std::string).
+class RowView : public detail::NamedGetters<RowView> {
+    friend struct detail::NamedGetters<RowView>;
+
+   public:
+    RowView(const ffi::ScanResultInner* inner, size_t record_idx,
+            const detail::ColumnMap* column_map)
+        : inner_(inner), record_idx_(record_idx), column_map_(column_map) {}
+
+    // ── Index-based getters ──────────────────────────────────────────
+    size_t FieldCount() const;
+    TypeId GetType(size_t idx) const;
+    bool IsNull(size_t idx) const;
+    bool GetBool(size_t idx) const;
+    int32_t GetInt32(size_t idx) const;
+    int64_t GetInt64(size_t idx) const;
+    float GetFloat32(size_t idx) const;
+    double GetFloat64(size_t idx) const;
+    std::string_view GetString(size_t idx) const;
+    std::pair<const uint8_t*, size_t> GetBytes(size_t idx) const;
+    fluss::Date GetDate(size_t idx) const;
+    fluss::Time GetTime(size_t idx) const;
+    fluss::Timestamp GetTimestamp(size_t idx) const;
+    bool IsDecimal(size_t idx) const;
+    std::string GetDecimalString(size_t idx) const;
+
+    // Name-based getters inherited from detail::NamedGetters<RowView>
+    using detail::NamedGetters<RowView>::IsNull;
+    using detail::NamedGetters<RowView>::GetBool;
+    using detail::NamedGetters<RowView>::GetInt32;
+    using detail::NamedGetters<RowView>::GetInt64;
+    using detail::NamedGetters<RowView>::GetFloat32;
+    using detail::NamedGetters<RowView>::GetFloat64;
+    using detail::NamedGetters<RowView>::GetString;
+    using detail::NamedGetters<RowView>::GetBytes;
+    using detail::NamedGetters<RowView>::GetDate;
+    using detail::NamedGetters<RowView>::GetTime;
+    using detail::NamedGetters<RowView>::GetTimestamp;
+    using detail::NamedGetters<RowView>::GetDecimalString;
+
+   private:
+    size_t Resolve(const std::string& name) const {
+        if (!column_map_) {
+            throw std::runtime_error("RowView: name-based access not available");
         }
+        return detail::ResolveColumn(*column_map_, name);
     }
+    const ffi::ScanResultInner* inner_;
+    size_t record_idx_;
+    const detail::ColumnMap* column_map_;  // borrowed from ScanRecords (same lifetime as inner_)
 };
 
+/// A single scan record. Contains metadata and a RowView for field access.
+///
+/// WARNING: ScanRecord contains a RowView that borrows from ScanRecords.
+/// It must not outlive the ScanRecords that produced it.
 struct ScanRecord {
     int32_t bucket_id;
+    std::optional<int64_t> partition_id;
     int64_t offset;
     int64_t timestamp;
-    GenericRow row;
+    ChangeType change_type;
+    RowView row;
 };
 
-struct ScanRecords {
-    std::vector<ScanRecord> records;
+class ScanRecords {
+   public:
+    ScanRecords() noexcept;
+    ~ScanRecords() noexcept;
+
+    ScanRecords(const ScanRecords&) = delete;
+    ScanRecords& operator=(const ScanRecords&) = delete;
+    ScanRecords(ScanRecords&& other) noexcept;
+    ScanRecords& operator=(ScanRecords&& other) noexcept;
 
-    size_t Size() const { return records.size(); }
-    bool Empty() const { return records.empty(); }
-    const ScanRecord& operator[](size_t idx) const { return records[idx]; }
+    size_t Size() const;
+    bool Empty() const;
+    ScanRecord operator[](size_t idx) const;
+
+    class Iterator {
+       public:
+        ScanRecord operator*() const;
+        Iterator& operator++() {
+            ++idx_;
+            return *this;
+        }
+        bool operator!=(const Iterator& other) const { return idx_ != other.idx_; }
 
-    auto begin() const { return records.begin(); }
-    auto end() const { return records.end(); }
+       private:
+        friend class ScanRecords;
+        Iterator(const ScanRecords* owner, size_t idx) : owner_(owner), idx_(idx) {}
+        const ScanRecords* owner_;
+        size_t idx_;
+    };
+
+    Iterator begin() const { return Iterator(this, 0); }
+    Iterator end() const { return Iterator(this, Size()); }
+
+    /// Returns the column name-to-index map (lazy-built, cached).
+    const std::shared_ptr<detail::ColumnMap>& GetColumnMap() const;
+
+   private:
+    friend class LogScanner;
+    void Destroy() noexcept;
+    void BuildColumnMap() const;
+    ffi::ScanResultInner* inner_{nullptr};
+    mutable std::shared_ptr<detail::ColumnMap> column_map_;
 };
 
 class ArrowRecordBatch {
@@ -927,6 +811,66 @@ struct DatabaseInfo {
     int64_t modified_time{0};
 };
 
+/// Read-only result for lookup operations.
+class LookupResult : public detail::NamedGetters<LookupResult> {
+    friend struct detail::NamedGetters<LookupResult>;
+
+   public:
+    LookupResult() noexcept;
+    ~LookupResult() noexcept;
+
+    LookupResult(const LookupResult&) = delete;
+    LookupResult& operator=(const LookupResult&) = delete;
+    LookupResult(LookupResult&& other) noexcept;
+    LookupResult& operator=(LookupResult&& other) noexcept;
+
+    bool Found() const;
+    size_t FieldCount() const;
+
+    // ── Index-based getters ──────────────────────────────────────────
+    TypeId GetType(size_t idx) const;
+    bool IsNull(size_t idx) const;
+    bool GetBool(size_t idx) const;
+    int32_t GetInt32(size_t idx) const;
+    int64_t GetInt64(size_t idx) const;
+    float GetFloat32(size_t idx) const;
+    double GetFloat64(size_t idx) const;
+    std::string_view GetString(size_t idx) const;
+    std::pair<const uint8_t*, size_t> GetBytes(size_t idx) const;
+    fluss::Date GetDate(size_t idx) const;
+    fluss::Time GetTime(size_t idx) const;
+    fluss::Timestamp GetTimestamp(size_t idx) const;
+    bool IsDecimal(size_t idx) const;
+    std::string GetDecimalString(size_t idx) const;
+
+    // Name-based getters inherited from detail::NamedGetters<LookupResult>
+    using detail::NamedGetters<LookupResult>::IsNull;
+    using detail::NamedGetters<LookupResult>::GetBool;
+    using detail::NamedGetters<LookupResult>::GetInt32;
+    using detail::NamedGetters<LookupResult>::GetInt64;
+    using detail::NamedGetters<LookupResult>::GetFloat32;
+    using detail::NamedGetters<LookupResult>::GetFloat64;
+    using detail::NamedGetters<LookupResult>::GetString;
+    using detail::NamedGetters<LookupResult>::GetBytes;
+    using detail::NamedGetters<LookupResult>::GetDate;
+    using detail::NamedGetters<LookupResult>::GetTime;
+    using detail::NamedGetters<LookupResult>::GetTimestamp;
+    using detail::NamedGetters<LookupResult>::GetDecimalString;
+
+   private:
+    friend class Lookuper;
+    size_t Resolve(const std::string& name) const {
+        if (!column_map_) {
+            BuildColumnMap();
+        }
+        return detail::ResolveColumn(*column_map_, name);
+    }
+    void Destroy() noexcept;
+    void BuildColumnMap() const;
+    ffi::LookupResultInner* inner_{nullptr};
+    mutable std::shared_ptr<detail::ColumnMap> column_map_;
+};
+
 class AppendWriter;
 class UpsertWriter;
 class Lookuper;
@@ -1206,6 +1150,8 @@ class AppendWriter {
 
     Result Append(const GenericRow& row);
     Result Append(const GenericRow& row, WriteResult& out);
+    Result AppendArrowBatch(const std::shared_ptr<arrow::RecordBatch>& batch);
+    Result AppendArrowBatch(const std::shared_ptr<arrow::RecordBatch>& batch, WriteResult& out);
     Result Flush();
 
    private:
@@ -1255,7 +1201,7 @@ class Lookuper {
 
     bool Available() const;
 
-    Result Lookup(const GenericRow& pk_row, bool& found, GenericRow& out);
+    Result Lookup(const GenericRow& pk_row, LookupResult& out);
 
    private:
     friend class Table;
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 3c918e569a..cff1a849a2 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -23,89 +23,6 @@
 #include "lib.rs.h"
 
 namespace fluss {
-
-namespace detail {
-struct FfiAccess {
-    static const std::vector<Datum>& fields(const GenericRow& row) { return row.fields; }
-    static std::vector<Datum>& fields(GenericRow& row) { return row.fields; }
-
-    static ffi::FfiDatum to_ffi_datum(const Datum& datum) {
-        ffi::FfiDatum ffi_datum;
-        ffi_datum.datum_type = static_cast<int32_t>(datum.type);
-        ffi_datum.bool_val = datum.bool_val;
-        ffi_datum.i32_val = datum.i32_val;
-        ffi_datum.i64_val = datum.i64_val;
-        ffi_datum.f32_val = datum.f32_val;
-        ffi_datum.f64_val = datum.f64_val;
-        ffi_datum.string_val = rust::String(datum.string_val);
-        ffi_datum.decimal_precision = datum.decimal_precision;
-        ffi_datum.decimal_scale = datum.decimal_scale;
-        ffi_datum.i128_hi = datum.i128_hi;
-        ffi_datum.i128_lo = datum.i128_lo;
-
-        rust::Vec<uint8_t> bytes;
-        for (auto b : datum.bytes_val) {
-            bytes.push_back(b);
-        }
-        ffi_datum.bytes_val = std::move(bytes);
-
-        return ffi_datum;
-    }
-
-    static Datum from_ffi_datum(const ffi::FfiDatum& ffi_datum) {
-        auto dtype = static_cast<DatumType>(ffi_datum.datum_type);
-        switch (dtype) {
-            case DatumType::Null:
-                return Datum::Null();
-            case DatumType::Bool:
-                return Datum::Bool(ffi_datum.bool_val);
-            case DatumType::Int32:
-                return Datum::Int32(ffi_datum.i32_val);
-            case DatumType::Int64:
-                return Datum::Int64(ffi_datum.i64_val);
-            case DatumType::Float32:
-                return Datum::Float32(ffi_datum.f32_val);
-            case DatumType::Float64:
-                return Datum::Float64(ffi_datum.f64_val);
-            case DatumType::String:
-                return Datum::String(std::string(ffi_datum.string_val));
-            case DatumType::Bytes: {
-                std::vector<uint8_t> bytes;
-                for (auto b : ffi_datum.bytes_val) {
-                    bytes.push_back(b);
-                }
-                return Datum::Bytes(std::move(bytes));
-            }
-            case DatumType::Date:
-                return Datum::Date(fluss::Date{ffi_datum.i32_val});
-            case DatumType::Time:
-                return Datum::Time(fluss::Time{ffi_datum.i32_val});
-            case DatumType::TimestampNtz:
-                return Datum::TimestampNtz(fluss::Timestamp{ffi_datum.i64_val, ffi_datum.i32_val});
-            case DatumType::TimestampLtz:
-                return Datum::TimestampLtz(fluss::Timestamp{ffi_datum.i64_val, ffi_datum.i32_val});
-            case DatumType::DecimalI64:
-            case DatumType::DecimalI128:
-            case DatumType::DecimalString: {
-                Datum d;
-                d.type = dtype;
-                d.i64_val = ffi_datum.i64_val;
-                d.decimal_precision = ffi_datum.decimal_precision;
-                d.decimal_scale = ffi_datum.decimal_scale;
-                d.i128_hi = ffi_datum.i128_hi;
-                d.i128_lo = ffi_datum.i128_lo;
-                if (dtype == DatumType::DecimalString) {
-                    d.string_val = std::string(ffi_datum.string_val);
-                }
-                return d;
-            }
-            default:
-                return Datum::Null();
-        }
-    }
-};
-}  // namespace detail
-
 namespace utils {
 
 inline Result make_error(int32_t code, std::string msg) { return Result{code, std::move(msg)}; }
@@ -195,23 +112,20 @@ inline ffi::FfiTableDescriptor to_ffi_table_descriptor(const TableDescriptor& de
     }
     ffi_desc.properties = std::move(props);
 
+    rust::Vec<ffi::HashMapValue> custom_props;
+    for (const auto& [k, v] : desc.custom_properties) {
+        ffi::HashMapValue prop;
+        prop.key = rust::String(k);
+        prop.value = rust::String(v);
+        custom_props.push_back(prop);
+    }
+    ffi_desc.custom_properties = std::move(custom_props);
+
     ffi_desc.comment = rust::String(desc.comment);
 
     return ffi_desc;
 }
 
-inline ffi::FfiGenericRow to_ffi_generic_row(const GenericRow& row) {
-    ffi::FfiGenericRow ffi_row;
-
-    rust::Vec<ffi::FfiDatum> ffi_fields;
-    for (const auto& field : detail::FfiAccess::fields(row)) {
-        ffi_fields.push_back(detail::FfiAccess::to_ffi_datum(field));
-    }
-    ffi_row.fields = std::move(ffi_fields);
-
-    return ffi_row;
-}
-
 inline Column from_ffi_column(const ffi::FfiColumn& ffi_col) {
     return Column{
         std::string(ffi_col.name),
@@ -263,37 +177,16 @@ inline TableInfo from_ffi_table_info(const ffi::FfiTableInfo& ffi_info) {
         info.properties[std::string(prop.key)] = std::string(prop.value);
     }
 
+    for (const auto& prop : ffi_info.custom_properties) {
+        info.custom_properties[std::string(prop.key)] = std::string(prop.value);
+    }
+
     info.comment = std::string(ffi_info.comment);
     info.schema = from_ffi_schema(ffi_info.schema);
 
     return info;
 }
 
-inline GenericRow from_ffi_generic_row(const ffi::FfiGenericRow& ffi_row) {
-    GenericRow row;
-
-    for (const auto& field : ffi_row.fields) {
-        detail::FfiAccess::fields(row).push_back(detail::FfiAccess::from_ffi_datum(field));
-    }
-
-    return row;
-}
-
-inline ScanRecord from_ffi_scan_record(const ffi::FfiScanRecord& ffi_record) {
-    return ScanRecord{ffi_record.bucket_id, ffi_record.offset, ffi_record.timestamp,
-                      from_ffi_generic_row(ffi_record.row)};
-}
-
-inline ScanRecords from_ffi_scan_records(const ffi::FfiScanRecords& ffi_records) {
-    ScanRecords records;
-
-    for (const auto& record : ffi_records.records) {
-        records.records.push_back(from_ffi_scan_record(record));
-    }
-
-    return records;
-}
-
 inline LakeSnapshot from_ffi_lake_snapshot(const ffi::FfiLakeSnapshot& ffi_snapshot) {
     LakeSnapshot snapshot;
     snapshot.snapshot_id = ffi_snapshot.snapshot_id;
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index fab8edff84..444b073578 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -76,6 +76,7 @@ mod ffi {
         bucket_count: i32,
         bucket_keys: Vec<String>,
         properties: Vec<HashMapValue>,
+        custom_properties: Vec<HashMapValue>,
         comment: String,
     }
 
@@ -92,6 +93,7 @@ mod ffi {
         has_primary_key: bool,
         is_partitioned: bool,
         properties: Vec<HashMapValue>,
+        custom_properties: Vec<HashMapValue>,
         comment: String,
         schema: FfiSchema,
     }
@@ -101,40 +103,8 @@ mod ffi {
         table_info: FfiTableInfo,
     }
 
-    struct FfiDatum {
-        datum_type: i32,
-        bool_val: bool,
-        i32_val: i32,
-        i64_val: i64,
-        f32_val: f32,
-        f64_val: f64,
-        string_val: String,
-        bytes_val: Vec<u8>,
-        decimal_precision: i32,
-        decimal_scale: i32,
-        i128_hi: i64,
-        i128_lo: i64,
-    }
-
-    struct FfiGenericRow {
-        fields: Vec<FfiDatum>,
-    }
-
-    struct FfiScanRecord {
-        bucket_id: i32,
-        offset: i64,
-        timestamp: i64,
-        row: FfiGenericRow,
-    }
-
-    struct FfiScanRecords {
-        records: Vec<FfiScanRecord>,
-    }
-
-    struct FfiScanRecordsResult {
-        result: FfiResult,
-        scan_records: FfiScanRecords,
-    }
+    // NOTE: FfiDatum, FfiGenericRow, FfiScanRecord, FfiScanRecords, FfiScanRecordsResult
+    // have been replaced by opaque types below (ScanResultInner, GenericRowInner, LookupResultInner).
 
     struct FfiArrowRecordBatch {
         array_ptr: usize,
@@ -192,11 +162,7 @@ mod ffi {
         bucket_offsets: Vec<FfiBucketOffsetPair>,
     }
 
-    struct FfiLookupResult {
-        result: FfiResult,
-        found: bool,
-        row: FfiGenericRow,
-    }
+    // NOTE: FfiLookupResult replaced by opaque LookupResultInner below.
 
     struct FfiLakeSnapshotResult {
         result: FfiResult,
@@ -261,6 +227,11 @@ mod ffi {
         type UpsertWriter;
         type Lookuper;
 
+        // Opaque types for optimized FFI
+        type ScanResultInner;
+        type GenericRowInner;
+        type LookupResultInner;
+
         // Connection
         fn new_connection(config: &FfiConfig) -> Result<*mut Connection>;
         unsafe fn delete_connection(conn: *mut Connection);
@@ -354,9 +325,31 @@ mod ffi {
         ) -> Result<*mut UpsertWriter>;
         fn new_lookuper(self: &Table) -> Result<*mut Lookuper>;
 
+        // GenericRowInner — opaque row for writes
+        fn new_generic_row(field_count: usize) -> Box<GenericRowInner>;
+        fn gr_reset(self: &mut GenericRowInner);
+        fn gr_set_null(self: &mut GenericRowInner, idx: usize);
+        fn gr_set_bool(self: &mut GenericRowInner, idx: usize, val: bool);
+        fn gr_set_i32(self: &mut GenericRowInner, idx: usize, val: i32);
+        fn gr_set_i64(self: &mut GenericRowInner, idx: usize, val: i64);
+        fn gr_set_f32(self: &mut GenericRowInner, idx: usize, val: f32);
+        fn gr_set_f64(self: &mut GenericRowInner, idx: usize, val: f64);
+        fn gr_set_str(self: &mut GenericRowInner, idx: usize, val: &str);
+        fn gr_set_bytes(self: &mut GenericRowInner, idx: usize, val: &[u8]);
+        fn gr_set_date(self: &mut GenericRowInner, idx: usize, days: i32);
+        fn gr_set_time(self: &mut GenericRowInner, idx: usize, millis: i32);
+        fn gr_set_ts_ntz(self: &mut GenericRowInner, idx: usize, millis: i64, nanos: i32);
+        fn gr_set_ts_ltz(self: &mut GenericRowInner, idx: usize, millis: i64, nanos: i32);
+        fn gr_set_decimal_str(self: &mut GenericRowInner, idx: usize, val: &str);
+
         // AppendWriter
         unsafe fn delete_append_writer(writer: *mut AppendWriter);
-        fn append(self: &mut AppendWriter, row: &FfiGenericRow) -> Result<Box<WriteResult>>;
+        fn append(self: &mut AppendWriter, row: &GenericRowInner) -> Result<Box<WriteResult>>;
+        fn append_arrow_batch(
+            self: &mut AppendWriter,
+            array_ptr: usize,
+            schema_ptr: usize,
+        ) -> Result<Box<WriteResult>>;
         fn flush(self: &mut AppendWriter) -> FfiResult;
 
         // WriteResult — dropped automatically via rust::Box, or call wait() for ack
@@ -364,13 +357,36 @@ mod ffi {
 
         // UpsertWriter
         unsafe fn delete_upsert_writer(writer: *mut UpsertWriter);
-        fn upsert(self: &mut UpsertWriter, row: &FfiGenericRow) -> Result<Box<WriteResult>>;
-        fn delete_row(self: &mut UpsertWriter, row: &FfiGenericRow) -> Result<Box<WriteResult>>;
+        fn upsert(self: &mut UpsertWriter, row: &GenericRowInner) -> Result<Box<WriteResult>>;
+        fn delete_row(self: &mut UpsertWriter, row: &GenericRowInner) -> Result<Box<WriteResult>>;
         fn upsert_flush(self: &mut UpsertWriter) -> FfiResult;
 
         // Lookuper
         unsafe fn delete_lookuper(lookuper: *mut Lookuper);
-        fn lookup(self: &mut Lookuper, pk_row: &FfiGenericRow) -> FfiLookupResult;
+        fn lookup(self: &mut Lookuper, pk_row: &GenericRowInner) -> Box<LookupResultInner>;
+
+        // LookupResultInner accessors
+        fn lv_has_error(self: &LookupResultInner) -> bool;
+        fn lv_error_code(self: &LookupResultInner) -> i32;
+        fn lv_error_message(self: &LookupResultInner) -> &str;
+        fn lv_found(self: &LookupResultInner) -> bool;
+        fn lv_field_count(self: &LookupResultInner) -> usize;
+        fn lv_column_name(self: &LookupResultInner, field: usize) -> Result<&str>;
+        fn lv_column_type(self: &LookupResultInner, field: usize) -> Result<i32>;
+        fn lv_is_null(self: &LookupResultInner, field: usize) -> Result<bool>;
+        fn lv_get_bool(self: &LookupResultInner, field: usize) -> Result<bool>;
+        fn lv_get_i32(self: &LookupResultInner, field: usize) -> Result<i32>;
+        fn lv_get_i64(self: &LookupResultInner, field: usize) -> Result<i64>;
+        fn lv_get_f32(self: &LookupResultInner, field: usize) -> Result<f32>;
+        fn lv_get_f64(self: &LookupResultInner, field: usize) -> Result<f64>;
+        fn lv_get_str(self: &LookupResultInner, field: usize) -> Result<&str>;
+        fn lv_get_bytes(self: &LookupResultInner, field: usize) -> Result<&[u8]>;
+        fn lv_get_date_days(self: &LookupResultInner, field: usize) -> Result<i32>;
+        fn lv_get_time_millis(self: &LookupResultInner, field: usize) -> Result<i32>;
+        fn lv_get_ts_millis(self: &LookupResultInner, field: usize) -> Result<i64>;
+        fn lv_get_ts_nanos(self: &LookupResultInner, field: usize) -> Result<i32>;
+        fn lv_is_ts_ltz(self: &LookupResultInner, field: usize) -> Result<bool>;
+        fn lv_get_decimal_str(self: &LookupResultInner, field: usize) -> Result<String>;
 
         // LogScanner
         unsafe fn delete_log_scanner(scanner: *mut LogScanner);
@@ -392,16 +408,44 @@ mod ffi {
         fn unsubscribe(self: &LogScanner, bucket_id: i32) -> FfiResult;
         fn unsubscribe_partition(self: &LogScanner, partition_id: i64, bucket_id: i32)
         -> FfiResult;
-        fn poll(self: &LogScanner, timeout_ms: i64) -> FfiScanRecordsResult;
+        fn poll(self: &LogScanner, timeout_ms: i64) -> Box<ScanResultInner>;
         fn poll_record_batch(self: &LogScanner, timeout_ms: i64) -> FfiArrowRecordBatchesResult;
         fn free_arrow_ffi_structures(array_ptr: usize, schema_ptr: usize);
+
+        // ScanResultInner accessors
+        fn sv_has_error(self: &ScanResultInner) -> bool;
+        fn sv_error_code(self: &ScanResultInner) -> i32;
+        fn sv_error_message(self: &ScanResultInner) -> &str;
+        fn sv_record_count(self: &ScanResultInner) -> usize;
+        fn sv_column_count(self: &ScanResultInner) -> usize;
+        fn sv_column_name(self: &ScanResultInner, field: usize) -> Result<&str>;
+        fn sv_column_type(self: &ScanResultInner, field: usize) -> Result<i32>;
+        fn sv_bucket_id(self: &ScanResultInner, rec: usize) -> i32;
+        fn sv_has_partition_id(self: &ScanResultInner, rec: usize) -> bool;
+        fn sv_partition_id(self: &ScanResultInner, rec: usize) -> i64;
+        fn sv_offset(self: &ScanResultInner, rec: usize) -> i64;
+        fn sv_timestamp(self: &ScanResultInner, rec: usize) -> i64;
+        fn sv_change_type(self: &ScanResultInner, rec: usize) -> i32;
+        fn sv_field_count(self: &ScanResultInner) -> usize;
+        fn sv_is_null(self: &ScanResultInner, rec: usize, field: usize) -> Result<bool>;
+        fn sv_get_bool(self: &ScanResultInner, rec: usize, field: usize) -> Result<bool>;
+        fn sv_get_i32(self: &ScanResultInner, rec: usize, field: usize) -> Result<i32>;
+        fn sv_get_i64(self: &ScanResultInner, rec: usize, field: usize) -> Result<i64>;
+        fn sv_get_f32(self: &ScanResultInner, rec: usize, field: usize) -> Result<f32>;
+        fn sv_get_f64(self: &ScanResultInner, rec: usize, field: usize) -> Result<f64>;
+        fn sv_get_str(self: &ScanResultInner, rec: usize, field: usize) -> Result<&str>;
+        fn sv_get_bytes(self: &ScanResultInner, rec: usize, field: usize) -> Result<&[u8]>;
+        fn sv_get_date_days(self: &ScanResultInner, rec: usize, field: usize) -> Result<i32>;
+        fn sv_get_time_millis(self: &ScanResultInner, rec: usize, field: usize) -> Result<i32>;
+        fn sv_get_ts_millis(self: &ScanResultInner, rec: usize, field: usize) -> Result<i64>;
+        fn sv_get_ts_nanos(self: &ScanResultInner, rec: usize, field: usize) -> Result<i32>;
+        fn sv_is_ts_ltz(self: &ScanResultInner, rec: usize, field: usize) -> Result<bool>;
+        fn sv_get_decimal_str(self: &ScanResultInner, rec: usize, field: usize) -> Result<String>;
     }
 }
 
 pub struct Connection {
     inner: Arc<fcore::client::FlussConnection>,
-    #[allow(dead_code)]
-    metadata: Option<Arc<fcore::client::Metadata>>,
 }
 
 pub struct Admin {
@@ -499,10 +543,7 @@ fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
 
     match conn {
         Ok(c) => {
-            let conn = Box::into_raw(Box::new(Connection {
-                inner: Arc::new(c),
-                metadata: None,
-            }));
+            let conn = Box::into_raw(Box::new(Connection { inner: Arc::new(c) }));
             Ok(conn)
         }
         Err(e) => Err(format!("Failed to connect: {e}")),
@@ -1136,9 +1177,10 @@ unsafe fn delete_append_writer(writer: *mut AppendWriter) {
 }
 
 impl AppendWriter {
-    fn append(&mut self, row: &ffi::FfiGenericRow) -> Result<Box<WriteResult>, String> {
+    fn append(&mut self, row: &GenericRowInner) -> Result<Box<WriteResult>, String> {
         let schema = self.table_info.get_schema();
-        let generic_row = types::ffi_row_to_core(row, Some(schema)).map_err(|e| e.to_string())?;
+        let generic_row =
+            types::resolve_row_types(&row.row, Some(schema)).map_err(|e| e.to_string())?;
 
         let result_future = self
             .inner
@@ -1150,6 +1192,39 @@ impl AppendWriter {
         }))
     }
 
+    fn append_arrow_batch(
+        &mut self,
+        array_ptr: usize,
+        schema_ptr: usize,
+    ) -> Result<Box<WriteResult>, String> {
+        use arrow::ffi::{FFI_ArrowArray, FFI_ArrowSchema};
+
+        // Safety: C++ allocates these via `new ArrowArray/ArrowSchema` after a successful
+        // `ExportRecordBatch`, so both pointers are valid heap allocations that we now own.
+        // NOTE(review): `Box::from_raw` frees via Rust's allocator, not C++ `delete` — confirm they match.
+        let ffi_array = unsafe { *Box::from_raw(array_ptr as *mut FFI_ArrowArray) };
+        let ffi_schema = unsafe { Box::from_raw(schema_ptr as *mut FFI_ArrowSchema) };
+
+        // Safety: `from_ffi` requires that the array and schema conform to the
+        // Arrow C Data Interface, which is guaranteed by C++'s ExportRecordBatch.
+        let array_data = unsafe { arrow::ffi::from_ffi(ffi_array, &ffi_schema) }
+            .map_err(|e| format!("Failed to import Arrow batch: {e}"))?;
+        // ffi_array is consumed by from_ffi; the ffi_schema Box is dropped when this function returns (incl. `?` paths)
+
+        // Reconstruct RecordBatch from the imported StructArray data
+        let struct_array = arrow::array::StructArray::from(array_data);
+        let batch = arrow::record_batch::RecordBatch::from(struct_array);
+
+        let result_future = self
+            .inner
+            .append_arrow_batch(batch)
+            .map_err(|e| format!("Failed to append Arrow batch: {e}"))?;
+
+        Ok(Box::new(WriteResult {
+            inner: Some(result_future),
+        }))
+    }
+
     fn flush(&mut self) -> ffi::FfiResult {
         let result = RUNTIME.block_on(async { self.inner.flush().await });
 
@@ -1194,9 +1269,10 @@ impl UpsertWriter {
         row
     }
 
-    fn upsert(&mut self, row: &ffi::FfiGenericRow) -> Result<Box<WriteResult>, String> {
+    fn upsert(&mut self, row: &GenericRowInner) -> Result<Box<WriteResult>, String> {
         let schema = self.table_info.get_schema();
-        let generic_row = types::ffi_row_to_core(row, Some(schema)).map_err(|e| e.to_string())?;
+        let generic_row =
+            types::resolve_row_types(&row.row, Some(schema)).map_err(|e| e.to_string())?;
         let generic_row = self.pad_row(generic_row);
 
         let result_future = self
@@ -1209,9 +1285,10 @@ impl UpsertWriter {
         }))
     }
 
-    fn delete_row(&mut self, row: &ffi::FfiGenericRow) -> Result<Box<WriteResult>, String> {
+    fn delete_row(&mut self, row: &GenericRowInner) -> Result<Box<WriteResult>, String> {
         let schema = self.table_info.get_schema();
-        let generic_row = types::ffi_row_to_core(row, Some(schema)).map_err(|e| e.to_string())?;
+        let generic_row =
+            types::resolve_row_types(&row.row, Some(schema)).map_err(|e| e.to_string())?;
         let generic_row = self.pad_row(generic_row);
 
         let result_future = self
@@ -1254,53 +1331,56 @@ impl Lookuper {
         row
     }
 
-    fn lookup(&mut self, pk_row: &ffi::FfiGenericRow) -> ffi::FfiLookupResult {
+    fn lookup(&mut self, pk_row: &GenericRowInner) -> Box<LookupResultInner> {
         let schema = self.table_info.get_schema();
-        let generic_row = match types::ffi_row_to_core(pk_row, Some(schema)) {
+        let generic_row = match types::resolve_row_types(&pk_row.row, Some(schema)) {
             Ok(r) => self.pad_row(r),
             Err(e) => {
-                return ffi::FfiLookupResult {
-                    result: client_err(e.to_string()),
-                    found: false,
-                    row: ffi::FfiGenericRow { fields: vec![] },
-                };
+                return Box::new(LookupResultInner::from_error(
+                    CLIENT_ERROR_CODE,
+                    e.to_string(),
+                ));
             }
         };
 
         let lookup_result = match RUNTIME.block_on(self.inner.lookup(&generic_row)) {
             Ok(r) => r,
             Err(e) => {
-                return ffi::FfiLookupResult {
-                    result: err_from_core_error(&e),
-                    found: false,
-                    row: ffi::FfiGenericRow { fields: vec![] },
-                };
+                let ffi_err = err_from_core_error(&e);
+                return Box::new(LookupResultInner::from_error(
+                    ffi_err.error_code,
+                    ffi_err.error_message,
+                ));
             }
         };
 
+        let columns = self.table_info.get_schema().columns().to_vec();
         match lookup_result.get_single_row() {
-            Ok(Some(row)) => match types::internal_row_to_ffi_row(&row, &self.table_info) {
-                Ok(ffi_row) => ffi::FfiLookupResult {
-                    result: ok_result(),
+            Ok(Some(row)) => match types::compacted_row_to_owned(&row, &self.table_info) {
+                Ok(owned_row) => Box::new(LookupResultInner {
+                    error: None,
                     found: true,
-                    row: ffi_row,
-                },
-                Err(e) => ffi::FfiLookupResult {
-                    result: client_err(e.to_string()),
-                    found: false,
-                    row: ffi::FfiGenericRow { fields: vec![] },
-                },
+                    row: Some(owned_row),
+                    columns,
+                }),
+                Err(e) => Box::new(LookupResultInner::from_error(
+                    CLIENT_ERROR_CODE,
+                    e.to_string(),
+                )),
             },
-            Ok(None) => ffi::FfiLookupResult {
-                result: ok_result(),
+            Ok(None) => Box::new(LookupResultInner {
+                error: None,
                 found: false,
-                row: ffi::FfiGenericRow { fields: vec![] },
-            },
-            Err(e) => ffi::FfiLookupResult {
-                result: err_from_core_error(&e),
-                found: false,
-                row: ffi::FfiGenericRow { fields: vec![] },
-            },
+                row: None,
+                columns,
+            }),
+            Err(e) => {
+                let ffi_err = err_from_core_error(&e);
+                Box::new(LookupResultInner::from_error(
+                    ffi_err.error_code,
+                    ffi_err.error_message,
+                ))
+            }
         }
     }
 }
@@ -1387,34 +1467,47 @@ impl LogScanner {
         dispatch_scanner!(self, unsubscribe_partition(partition_id, bucket_id))
     }
 
-    fn poll(&self, timeout_ms: i64) -> ffi::FfiScanRecordsResult {
+    fn poll(&self, timeout_ms: i64) -> Box<ScanResultInner> {
         let ScannerKind::Record(ref inner) = self.scanner else {
-            return ffi::FfiScanRecordsResult {
-                result: client_err("Record-based scanner not available".to_string()),
-                scan_records: ffi::FfiScanRecords { records: vec![] },
-            };
+            return Box::new(ScanResultInner::from_error(
+                CLIENT_ERROR_CODE,
+                "Record-based scanner not available".to_string(),
+            ));
         };
 
-        let timeout = Duration::from_millis(timeout_ms as u64);
+        let timeout = Duration::from_millis(timeout_ms.max(0) as u64);
         let result = RUNTIME.block_on(async { inner.poll(timeout).await });
 
         match result {
             Ok(records) => {
-                match types::core_scan_records_to_ffi(&records, &self.projected_columns) {
-                    Ok(scan_records) => ffi::FfiScanRecordsResult {
-                        result: ok_result(),
-                        scan_records,
-                    },
-                    Err(e) => ffi::FfiScanRecordsResult {
-                        result: client_err(e.to_string()),
-                        scan_records: ffi::FfiScanRecords { records: vec![] },
-                    },
+                let columns = self.projected_columns.clone();
+                // Flatten ScanRecords into a Vec<FlatScanRecord> — moves Arc<RecordBatch>, zero copy
+                let mut flat = Vec::with_capacity(records.count());
+                for (table_bucket, bucket_records) in records.into_records_by_buckets() {
+                    let bucket_id = table_bucket.bucket_id();
+                    let partition = table_bucket.partition_id();
+                    for record in bucket_records {
+                        flat.push(FlatScanRecord {
+                            bucket_id,
+                            has_partition_id: partition.is_some(),
+                            partition_id: partition.unwrap_or(0),
+                            record,
+                        });
+                    }
                 }
+                Box::new(ScanResultInner {
+                    error: None,
+                    records: flat,
+                    columns,
+                })
+            }
+            Err(e) => {
+                let ffi_err = err_from_core_error(&e);
+                Box::new(ScanResultInner::from_error(
+                    ffi_err.error_code,
+                    ffi_err.error_message,
+                ))
             }
-            Err(e) => ffi::FfiScanRecordsResult {
-                result: err_from_core_error(&e),
-                scan_records: ffi::FfiScanRecords { records: vec![] },
-            },
         }
     }
 
@@ -1426,7 +1519,7 @@ impl LogScanner {
             };
         };
 
-        let timeout = Duration::from_millis(timeout_ms as u64);
+        let timeout = Duration::from_millis(timeout_ms.max(0) as u64);
         let result = RUNTIME.block_on(async { inner_batch.poll(timeout).await });
 
         match result {
@@ -1447,3 +1540,602 @@ impl LogScanner {
         }
     }
 }
+
+// ============================================================================
+// Opaque types: GenericRowInner (write path)
+// ============================================================================
+
+pub struct GenericRowInner {
+    row: fcore::row::GenericRow<'static>,
+}
+
+fn new_generic_row(field_count: usize) -> Box<GenericRowInner> {
+    Box::new(GenericRowInner {
+        row: fcore::row::GenericRow::new(field_count),
+    })
+}
+
+impl GenericRowInner {
+    fn gr_reset(&mut self) {
+        let len = self.row.values.len();
+        self.row = fcore::row::GenericRow::new(len);
+    }
+
+    fn gr_set_null(&mut self, idx: usize) {
+        self.ensure_size(idx);
+        self.row.set_field(idx, fcore::row::Datum::Null);
+    }
+
+    fn gr_set_bool(&mut self, idx: usize, val: bool) {
+        self.ensure_size(idx);
+        self.row.set_field(idx, fcore::row::Datum::Bool(val));
+    }
+
+    fn gr_set_i32(&mut self, idx: usize, val: i32) {
+        self.ensure_size(idx);
+        self.row.set_field(idx, fcore::row::Datum::Int32(val));
+    }
+
+    fn gr_set_i64(&mut self, idx: usize, val: i64) {
+        self.ensure_size(idx);
+        self.row.set_field(idx, fcore::row::Datum::Int64(val));
+    }
+
+    fn gr_set_f32(&mut self, idx: usize, val: f32) {
+        self.ensure_size(idx);
+        self.row
+            .set_field(idx, fcore::row::Datum::Float32(val.into()));
+    }
+
+    fn gr_set_f64(&mut self, idx: usize, val: f64) {
+        self.ensure_size(idx);
+        self.row
+            .set_field(idx, fcore::row::Datum::Float64(val.into()));
+    }
+
+    fn gr_set_str(&mut self, idx: usize, val: &str) {
+        self.ensure_size(idx);
+        self.row.set_field(
+            idx,
+            fcore::row::Datum::String(std::borrow::Cow::Owned(val.to_string())),
+        );
+    }
+
+    fn gr_set_bytes(&mut self, idx: usize, val: &[u8]) {
+        self.ensure_size(idx);
+        self.row.set_field(
+            idx,
+            fcore::row::Datum::Blob(std::borrow::Cow::Owned(val.to_vec())),
+        );
+    }
+
+    fn gr_set_date(&mut self, idx: usize, days: i32) {
+        self.ensure_size(idx);
+        self.row
+            .set_field(idx, fcore::row::Datum::Date(fcore::row::Date::new(days)));
+    }
+
+    fn gr_set_time(&mut self, idx: usize, millis: i32) {
+        self.ensure_size(idx);
+        self.row
+            .set_field(idx, fcore::row::Datum::Time(fcore::row::Time::new(millis)));
+    }
+
+    fn gr_set_ts_ntz(&mut self, idx: usize, millis: i64, nanos: i32) {
+        self.ensure_size(idx);
+        // Prefer from_millis_nanos; if it returns Err, silently fall back to millis-only (nanos are discarded)
+        let ts = fcore::row::TimestampNtz::from_millis_nanos(millis, nanos)
+            .unwrap_or_else(|_| fcore::row::TimestampNtz::new(millis));
+        self.row.set_field(idx, fcore::row::Datum::TimestampNtz(ts));
+    }
+
+    fn gr_set_ts_ltz(&mut self, idx: usize, millis: i64, nanos: i32) {
+        self.ensure_size(idx);
+        let ts = fcore::row::TimestampLtz::from_millis_nanos(millis, nanos)
+            .unwrap_or_else(|_| fcore::row::TimestampLtz::new(millis));
+        self.row.set_field(idx, fcore::row::Datum::TimestampLtz(ts));
+    }
+
+    fn gr_set_decimal_str(&mut self, idx: usize, val: &str) {
+        self.ensure_size(idx);
+        // Store as string; resolve_row_types() will parse and validate against schema
+        self.row.set_field(
+            idx,
+            fcore::row::Datum::String(std::borrow::Cow::Owned(val.to_string())),
+        );
+    }
+
+    fn ensure_size(&mut self, idx: usize) {
+        if self.row.values.len() <= idx {
+            self.row.values.resize(idx + 1, fcore::row::Datum::Null);
+        }
+    }
+}
+
+// ============================================================================
+// Shared row-reading helpers (used by both ScanResultInner and LookupResultInner)
+// ============================================================================
+
+mod row_reader {
+    use fcore::row::InternalRow;
+    use fluss as fcore;
+
+    use crate::types;
+
+    /// Get column at `field`, or error if out of bounds.
+    fn get_column(
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<&fcore::metadata::Column, String> {
+        columns.get(field).ok_or_else(|| {
+            format!(
+                "field index {field} out of range ({} columns)",
+                columns.len()
+            )
+        })
+    }
+
+    /// Validate bounds, null, and type compatibility in a single pass.
+    /// Returns the data type on success for callers that need to dispatch on it.
+    fn validate<'a>(
+        row: &dyn InternalRow,
+        columns: &'a [fcore::metadata::Column],
+        field: usize,
+        getter: &str,
+        allowed: impl FnOnce(&fcore::metadata::DataType) -> bool,
+    ) -> Result<&'a fcore::metadata::DataType, String> {
+        let col = get_column(columns, field)?;
+        if row.is_null_at(field) {
+            return Err(format!("field {field} is null"));
+        }
+        let dt = col.data_type();
+        if !allowed(dt) {
+            return Err(format!(
+                "{getter}: column {field} has incompatible type {dt}"
+            ));
+        }
+        Ok(dt)
+    }
+
+    pub fn column_type(columns: &[fcore::metadata::Column], field: usize) -> Result<i32, String> {
+        Ok(types::core_data_type_to_ffi(
+            get_column(columns, field)?.data_type(),
+        ))
+    }
+
+    pub fn column_name(columns: &[fcore::metadata::Column], field: usize) -> Result<&str, String> {
+        Ok(get_column(columns, field)?.name())
+    }
+
+    pub fn is_null(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<bool, String> {
+        get_column(columns, field)?;
+        Ok(row.is_null_at(field))
+    }
+
+    pub fn get_bool(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<bool, String> {
+        validate(row, columns, field, "get_bool", |dt| {
+            matches!(dt, fcore::metadata::DataType::Boolean(_))
+        })?;
+        Ok(row.get_boolean(field))
+    }
+
+    pub fn get_i32(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<i32, String> {
+        let dt = validate(row, columns, field, "get_i32", |dt| {
+            matches!(
+                dt,
+                fcore::metadata::DataType::TinyInt(_)
+                    | fcore::metadata::DataType::SmallInt(_)
+                    | fcore::metadata::DataType::Int(_)
+            )
+        })?;
+        Ok(match dt {
+            fcore::metadata::DataType::TinyInt(_) => row.get_byte(field) as i32,
+            fcore::metadata::DataType::SmallInt(_) => row.get_short(field) as i32,
+            _ => row.get_int(field),
+        })
+    }
+
+    pub fn get_i64(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<i64, String> {
+        validate(row, columns, field, "get_i64", |dt| {
+            matches!(dt, fcore::metadata::DataType::BigInt(_))
+        })?;
+        Ok(row.get_long(field))
+    }
+
+    pub fn get_f32(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<f32, String> {
+        validate(row, columns, field, "get_f32", |dt| {
+            matches!(dt, fcore::metadata::DataType::Float(_))
+        })?;
+        Ok(row.get_float(field))
+    }
+
+    pub fn get_f64(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<f64, String> {
+        validate(row, columns, field, "get_f64", |dt| {
+            matches!(dt, fcore::metadata::DataType::Double(_))
+        })?;
+        Ok(row.get_double(field))
+    }
+
+    pub fn get_str<'a>(
+        row: &'a dyn InternalRow,
+        columns: &'a [fcore::metadata::Column],
+        field: usize,
+    ) -> Result<&'a str, String> {
+        let dt = validate(row, columns, field, "get_str", |dt| {
+            matches!(
+                dt,
+                fcore::metadata::DataType::Char(_) | fcore::metadata::DataType::String(_)
+            )
+        })?;
+        Ok(match dt {
+            fcore::metadata::DataType::Char(ct) => row.get_char(field, ct.length() as usize),
+            _ => row.get_string(field),
+        })
+    }
+    /// Returns a Binary field via `get_binary` (with the type's length) or Bytes via `get_bytes`.
+    pub fn get_bytes<'a>(
+        row: &'a dyn InternalRow,
+        columns: &'a [fcore::metadata::Column],
+        field: usize,
+    ) -> Result<&'a [u8], String> {
+        let dt = validate(row, columns, field, "get_bytes", |dt| {
+            matches!(
+                dt,
+                fcore::metadata::DataType::Binary(_) | fcore::metadata::DataType::Bytes(_)
+            )
+        })?;
+        Ok(match dt {
+            fcore::metadata::DataType::Binary(bt) => row.get_binary(field, bt.length()),
+            _ => row.get_bytes(field),
+        })
+    }
+    /// Returns `get_date(field).get_inner()` for a Date column; presumably days since epoch (confirm).
+    pub fn get_date_days(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<i32, String> {
+        validate(row, columns, field, "get_date_days", |dt| {
+            matches!(dt, fcore::metadata::DataType::Date(_))
+        })?;
+        Ok(row.get_date(field).get_inner())
+    }
+    /// Returns `get_time(field).get_inner()` for a Time column; presumably millis of day (confirm).
+    pub fn get_time_millis(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<i32, String> {
+        validate(row, columns, field, "get_time_millis", |dt| {
+            matches!(dt, fcore::metadata::DataType::Time(_))
+        })?;
+        Ok(row.get_time(field).get_inner())
+    }
+    /// Millisecond part of a Timestamp (`get_millisecond`) or TimestampLTz (`get_epoch_millisecond`).
+    pub fn get_ts_millis(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<i64, String> {
+        let dt = validate(row, columns, field, "get_ts_millis", |dt| {
+            matches!(
+                dt,
+                fcore::metadata::DataType::Timestamp(_)
+                    | fcore::metadata::DataType::TimestampLTz(_)
+            )
+        })?;
+        match dt {
+            fcore::metadata::DataType::TimestampLTz(ts) => Ok(row
+                .get_timestamp_ltz(field, ts.precision())
+                .get_epoch_millisecond()),
+            fcore::metadata::DataType::Timestamp(ts) => Ok(row
+                .get_timestamp_ntz(field, ts.precision())
+                .get_millisecond()),
+            dt => Err(format!("get_ts_millis: unexpected type {dt}")), // defensive fallback arm
+        }
+    }
+    /// Nano-of-millisecond part (`get_nano_of_millisecond`) of a Timestamp or TimestampLTz field.
+    pub fn get_ts_nanos(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<i32, String> {
+        let dt = validate(row, columns, field, "get_ts_nanos", |dt| {
+            matches!(
+                dt,
+                fcore::metadata::DataType::Timestamp(_)
+                    | fcore::metadata::DataType::TimestampLTz(_)
+            )
+        })?;
+        match dt {
+            fcore::metadata::DataType::TimestampLTz(ts) => Ok(row
+                .get_timestamp_ltz(field, ts.precision())
+                .get_nano_of_millisecond()),
+            fcore::metadata::DataType::Timestamp(ts) => Ok(row
+                .get_timestamp_ntz(field, ts.precision())
+                .get_nano_of_millisecond()),
+            dt => Err(format!("get_ts_nanos: unexpected type {dt}")), // defensive fallback arm
+        }
+    }
+    /// True when the column at `field` is TimestampLTz; a `get_column` error is passed through.
+    pub fn is_ts_ltz(columns: &[fcore::metadata::Column], field: usize) -> Result<bool, String> {
+        Ok(matches!(
+            get_column(columns, field)?.data_type(),
+            fcore::metadata::DataType::TimestampLTz(_)
+        ))
+    }
+    /// Formats a Decimal field as text (`to_big_decimal().to_string()`) using its precision/scale.
+    pub fn get_decimal_str(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<String, String> {
+        let dt = validate(row, columns, field, "get_decimal_str", |dt| {
+            matches!(dt, fcore::metadata::DataType::Decimal(_))
+        })?;
+        match dt {
+            fcore::metadata::DataType::Decimal(dd) => {
+                let decimal = row.get_decimal(field, dd.precision() as usize, dd.scale() as usize);
+                Ok(decimal.to_big_decimal().to_string())
+            }
+            dt => Err(format!("get_decimal_str: unexpected type {dt}")), // defensive fallback arm
+        }
+    }
+}
+
+// ============================================================================
+// Opaque types: ScanResultInner (scan read path)
+// ============================================================================
+/// A scan record with its bucket/partition ids; C++ reads `partition_id` only if `has_partition_id`.
+struct FlatScanRecord {
+    bucket_id: i32,
+    has_partition_id: bool,
+    partition_id: i64,
+    record: fcore::record::ScanRecord,
+}
+/// Scan result: an optional `(code, message)` error, the records, and the column metadata.
+pub struct ScanResultInner {
+    error: Option<(i32, String)>,
+    records: Vec<FlatScanRecord>,
+    columns: Vec<fcore::metadata::Column>,
+}
+
+impl ScanResultInner {
+    fn from_error(code: i32, msg: String) -> Self { // error-only result: no records, no columns
+        Self {
+            error: Some((code, msg)),
+            records: Vec::new(),
+            columns: Vec::new(),
+        }
+    }
+
+    fn sv_has_error(&self) -> bool {
+        self.error.is_some()
+    }
+    /// Error code, or 0 when no error is set.
+    fn sv_error_code(&self) -> i32 {
+        self.error.as_ref().map_or(0, |e| e.0)
+    }
+    /// Error message, or "" when no error is set.
+    fn sv_error_message(&self) -> &str {
+        self.error.as_ref().map_or("", |e| e.1.as_str())
+    }
+
+    fn sv_record_count(&self) -> usize {
+        self.records.len()
+    }
+    /// Number of columns; `sv_field_count` below returns the same value.
+    fn sv_column_count(&self) -> usize {
+        self.columns.len()
+    }
+    fn sv_column_name(&self, field: usize) -> Result<&str, String> {
+        row_reader::column_name(&self.columns, field)
+    }
+    fn sv_column_type(&self, field: usize) -> Result<i32, String> {
+        row_reader::column_type(&self.columns, field)
+    }
+
+    // Metadata accessors: `records[rec]` panics if out of range; C++ operator[] checks rec first.
+    fn sv_bucket_id(&self, rec: usize) -> i32 {
+        self.records[rec].bucket_id
+    }
+    fn sv_has_partition_id(&self, rec: usize) -> bool {
+        self.records[rec].has_partition_id
+    }
+    fn sv_partition_id(&self, rec: usize) -> i64 {
+        self.records[rec].partition_id
+    }
+    fn sv_offset(&self, rec: usize) -> i64 {
+        self.records[rec].record.offset()
+    }
+    fn sv_timestamp(&self, rec: usize) -> i64 {
+        self.records[rec].record.timestamp()
+    }
+    fn sv_change_type(&self, rec: usize) -> i32 {
+        self.records[rec].record.change_type().to_byte_value() as i32
+    }
+    fn sv_field_count(&self) -> usize {
+        self.columns.len()
+    }
+
+    // Field accessors: rec is unchecked here (C++ operator[] validates it); validate() checks field.
+    fn sv_is_null(&self, rec: usize, field: usize) -> Result<bool, String> {
+        row_reader::is_null(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_bool(&self, rec: usize, field: usize) -> Result<bool, String> {
+        row_reader::get_bool(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_i32(&self, rec: usize, field: usize) -> Result<i32, String> {
+        row_reader::get_i32(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_i64(&self, rec: usize, field: usize) -> Result<i64, String> {
+        row_reader::get_i64(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_f32(&self, rec: usize, field: usize) -> Result<f32, String> {
+        row_reader::get_f32(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_f64(&self, rec: usize, field: usize) -> Result<f64, String> {
+        row_reader::get_f64(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_str(&self, rec: usize, field: usize) -> Result<&str, String> {
+        row_reader::get_str(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_bytes(&self, rec: usize, field: usize) -> Result<&[u8], String> {
+        row_reader::get_bytes(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_date_days(&self, rec: usize, field: usize) -> Result<i32, String> {
+        row_reader::get_date_days(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_time_millis(&self, rec: usize, field: usize) -> Result<i32, String> {
+        row_reader::get_time_millis(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_ts_millis(&self, rec: usize, field: usize) -> Result<i64, String> {
+        row_reader::get_ts_millis(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_get_ts_nanos(&self, rec: usize, field: usize) -> Result<i32, String> {
+        row_reader::get_ts_nanos(self.records[rec].record.row(), &self.columns, field)
+    }
+    fn sv_is_ts_ltz(&self, _rec: usize, field: usize) -> Result<bool, String> { // schema-only
+        row_reader::is_ts_ltz(&self.columns, field)
+    }
+    fn sv_get_decimal_str(&self, rec: usize, field: usize) -> Result<String, String> {
+        row_reader::get_decimal_str(self.records[rec].record.row(), &self.columns, field)
+    }
+}
+
+// ============================================================================
+// Opaque types: LookupResultInner (lookup read path)
+// ============================================================================
+/// Lookup result: optional `(code, message)` error, found flag, the row if any, column metadata.
+pub struct LookupResultInner {
+    error: Option<(i32, String)>,
+    found: bool,
+    row: Option<fcore::row::GenericRow<'static>>,
+    columns: Vec<fcore::metadata::Column>,
+}
+
+impl LookupResultInner {
+    fn from_error(code: i32, msg: String) -> Self { // error-only result: not found, no row/columns
+        Self {
+            error: Some((code, msg)),
+            found: false,
+            row: None,
+            columns: Vec::new(),
+        }
+    }
+
+    fn lv_has_error(&self) -> bool {
+        self.error.is_some()
+    }
+    /// Error code, or 0 when no error is set.
+    fn lv_error_code(&self) -> i32 {
+        self.error.as_ref().map_or(0, |e| e.0)
+    }
+    /// Error message, or "" when no error is set.
+    fn lv_error_message(&self) -> &str {
+        self.error.as_ref().map_or("", |e| e.1.as_str())
+    }
+
+    fn lv_found(&self) -> bool {
+        self.found
+    }
+
+    fn lv_field_count(&self) -> usize {
+        self.columns.len()
+    }
+
+    fn lv_column_type(&self, field: usize) -> Result<i32, String> {
+        row_reader::column_type(&self.columns, field)
+    }
+
+    fn lv_column_name(&self, field: usize) -> Result<&str, String> {
+        row_reader::column_name(&self.columns, field)
+    }
+    /// Borrows the stored row, or returns a fixed error message when `row` is `None`.
+    fn lv_row(&self) -> Result<&fcore::row::GenericRow<'static>, String> {
+        self.row
+            .as_ref()
+            .ok_or_else(|| "no row available (not found or error)".to_string())
+    }
+
+    // Field accessors — get the row via lv_row() (Err if absent), then delegate to row_reader.
+    fn lv_is_null(&self, field: usize) -> Result<bool, String> {
+        let r = self.lv_row()?;
+        row_reader::is_null(r, &self.columns, field)
+    }
+    fn lv_get_bool(&self, field: usize) -> Result<bool, String> {
+        let r = self.lv_row()?;
+        row_reader::get_bool(r, &self.columns, field)
+    }
+    fn lv_get_i32(&self, field: usize) -> Result<i32, String> {
+        let r = self.lv_row()?;
+        row_reader::get_i32(r, &self.columns, field)
+    }
+    fn lv_get_i64(&self, field: usize) -> Result<i64, String> {
+        let r = self.lv_row()?;
+        row_reader::get_i64(r, &self.columns, field)
+    }
+    fn lv_get_f32(&self, field: usize) -> Result<f32, String> {
+        let r = self.lv_row()?;
+        row_reader::get_f32(r, &self.columns, field)
+    }
+    fn lv_get_f64(&self, field: usize) -> Result<f64, String> {
+        let r = self.lv_row()?;
+        row_reader::get_f64(r, &self.columns, field)
+    }
+    fn lv_get_str(&self, field: usize) -> Result<&str, String> {
+        let r = self.lv_row()?;
+        row_reader::get_str(r, &self.columns, field)
+    }
+    fn lv_get_bytes(&self, field: usize) -> Result<&[u8], String> {
+        let r = self.lv_row()?;
+        row_reader::get_bytes(r, &self.columns, field)
+    }
+    fn lv_get_date_days(&self, field: usize) -> Result<i32, String> {
+        let r = self.lv_row()?;
+        row_reader::get_date_days(r, &self.columns, field)
+    }
+    fn lv_get_time_millis(&self, field: usize) -> Result<i32, String> {
+        let r = self.lv_row()?;
+        row_reader::get_time_millis(r, &self.columns, field)
+    }
+    fn lv_get_ts_millis(&self, field: usize) -> Result<i64, String> {
+        let r = self.lv_row()?;
+        row_reader::get_ts_millis(r, &self.columns, field)
+    }
+    fn lv_get_ts_nanos(&self, field: usize) -> Result<i32, String> {
+        let r = self.lv_row()?;
+        row_reader::get_ts_nanos(r, &self.columns, field)
+    }
+    fn lv_is_ts_ltz(&self, field: usize) -> Result<bool, String> { // schema-only: no row needed
+        row_reader::is_ts_ltz(&self.columns, field)
+    }
+    fn lv_get_decimal_str(&self, field: usize) -> Result<String, String> {
+        let r = self.lv_row()?;
+        row_reader::get_decimal_str(r, &self.columns, field)
+    }
+}
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index 19fd72dd5f..76f1806d90 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -25,7 +25,7 @@
 #include "fluss.hpp"
 #include "lib.rs.h"
 #include "rust/cxx.h"
-// todo:  bindings/cpp/BUILD.bazel still doesn’t declare Arrow include/link dependencies.
+// todo:  bindings/cpp/BUILD.bazel still doesn't declare Arrow include/link dependencies.
 // In environments where Bazel does not already have Arrow available, this will fail at compile/link
 // time.
 #include <arrow/record_batch.h>
@@ -79,6 +79,378 @@ int Date::Day() const {
     return tm.tm_mday;
 }
 
+// NOLINTNEXTLINE(cppcoreguidelines-macro-usage)
+#define CHECK_INNER(name) /* throws std::logic_error when inner_ is null */               \
+    do {                                                                                  \
+        if (!inner_) throw std::logic_error(name ": not available (moved-from or null)"); \
+    } while (0)
+
+// ============================================================================
+// GenericRow — write-only row backed by opaque Rust GenericRowInner
+// ============================================================================
+// Default constructor: backs the row with a Rust GenericRowInner created with field count 0.
+GenericRow::GenericRow() {
+    auto box = ffi::new_generic_row(0);
+    inner_ = box.into_raw();
+}
+// Backs the row with a Rust GenericRowInner created for field_count fields.
+GenericRow::GenericRow(size_t field_count) {
+    auto box = ffi::new_generic_row(field_count);
+    inner_ = box.into_raw();
+}
+// Releases the Rust-side row, if any, through Destroy().
+GenericRow::~GenericRow() noexcept { Destroy(); }
+// Frees inner_ (if set) by adopting it into a temporary rust::Box; always drops column_map_.
+void GenericRow::Destroy() noexcept {
+    if (inner_) {
+        rust::Box<ffi::GenericRowInner>::from_raw(inner_);
+        inner_ = nullptr;
+    }
+    column_map_.reset();
+}
+// Move constructor: takes over inner_ and column_map_ and leaves other.inner_ null.
+GenericRow::GenericRow(GenericRow&& other) noexcept
+    : inner_(other.inner_), column_map_(std::move(other.column_map_)) {
+    other.inner_ = nullptr;
+}
+// Move assignment: frees the current row, then takes over other's inner_ and column_map_.
+GenericRow& GenericRow::operator=(GenericRow&& other) noexcept {
+    if (this != &other) {
+        Destroy();
+        inner_ = other.inner_;
+        column_map_ = std::move(other.column_map_);
+        other.inner_ = nullptr;
+    }
+    return *this;
+}
+// True while this object still holds a Rust-side row (inner_ is non-null).
+bool GenericRow::Available() const { return inner_ != nullptr; }
+// Calls gr_reset() on the Rust row; throws std::logic_error if inner_ is null.
+void GenericRow::Reset() {
+    CHECK_INNER("GenericRow");
+    inner_->gr_reset();
+}
+// Scalar setters: each throws std::logic_error if inner_ is null, else forwards to gr_set_*.
+void GenericRow::SetNull(size_t idx) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_null(idx);
+}
+void GenericRow::SetBool(size_t idx, bool v) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_bool(idx, v);
+}
+void GenericRow::SetInt32(size_t idx, int32_t v) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_i32(idx, v);
+}
+void GenericRow::SetInt64(size_t idx, int64_t v) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_i64(idx, v);
+}
+void GenericRow::SetFloat32(size_t idx, float v) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_f32(idx, v);
+}
+void GenericRow::SetFloat64(size_t idx, double v) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_f64(idx, v);
+}
+// Passes v to gr_set_str; throws std::logic_error if inner_ is null.
+void GenericRow::SetString(size_t idx, std::string v) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_str(idx, v);
+}
+// Passes v to gr_set_bytes as a rust::Slice over its data()/size(); throws if inner_ is null.
+void GenericRow::SetBytes(size_t idx, std::vector<uint8_t> v) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_bytes(idx, rust::Slice<const uint8_t>(v.data(), v.size()));
+}
+// Stores d.days_since_epoch via gr_set_date; throws std::logic_error if inner_ is null.
+void GenericRow::SetDate(size_t idx, fluss::Date d) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_date(idx, d.days_since_epoch);
+}
+// Stores t.millis_since_midnight via gr_set_time; throws std::logic_error if inner_ is null.
+void GenericRow::SetTime(size_t idx, fluss::Time t) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_time(idx, t.millis_since_midnight);
+}
+// Stores ts.epoch_millis and ts.nano_of_millisecond via gr_set_ts_ntz; throws if inner_ is null.
+void GenericRow::SetTimestampNtz(size_t idx, fluss::Timestamp ts) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_ts_ntz(idx, ts.epoch_millis, ts.nano_of_millisecond);
+}
+// Stores ts.epoch_millis and ts.nano_of_millisecond via gr_set_ts_ltz; throws if inner_ is null.
+void GenericRow::SetTimestampLtz(size_t idx, fluss::Timestamp ts) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_ts_ltz(idx, ts.epoch_millis, ts.nano_of_millisecond);
+}
+// Passes the decimal's string form to gr_set_decimal_str; throws if inner_ is null.
+void GenericRow::SetDecimal(size_t idx, const std::string& value) {
+    CHECK_INNER("GenericRow");
+    inner_->gr_set_decimal_str(idx, value);
+}
+
+// ============================================================================
+// RowView — zero-copy read-only row view for scan results
+// ============================================================================
+// Field count reported by the scan result, or 0 when inner_ is null.
+size_t RowView::FieldCount() const { return inner_ ? inner_->sv_field_count() : 0; }
+// Column type at idx, cast to TypeId; throws std::logic_error if inner_ is null.
+TypeId RowView::GetType(size_t idx) const {
+    CHECK_INNER("RowView");
+    return static_cast<TypeId>(inner_->sv_column_type(idx));
+}
+// Scalar getters for record_idx_: throw std::logic_error if inner_ is null, else query Rust.
+bool RowView::IsNull(size_t idx) const {
+    CHECK_INNER("RowView");
+    return inner_->sv_is_null(record_idx_, idx);  // a Rust Err surfaces as rust::Error (cxx)
+}
+bool RowView::GetBool(size_t idx) const {
+    CHECK_INNER("RowView");
+    return inner_->sv_get_bool(record_idx_, idx);
+}
+int32_t RowView::GetInt32(size_t idx) const {
+    CHECK_INNER("RowView");
+    return inner_->sv_get_i32(record_idx_, idx);
+}
+int64_t RowView::GetInt64(size_t idx) const {
+    CHECK_INNER("RowView");
+    return inner_->sv_get_i64(record_idx_, idx);
+}
+float RowView::GetFloat32(size_t idx) const {
+    CHECK_INNER("RowView");
+    return inner_->sv_get_f32(record_idx_, idx);
+}
+double RowView::GetFloat64(size_t idx) const {
+    CHECK_INNER("RowView");
+    return inner_->sv_get_f64(record_idx_, idx);
+}
+// Returns a view into Rust-owned string data (no copy); throws if inner_ is null.
+std::string_view RowView::GetString(size_t idx) const {
+    CHECK_INNER("RowView");
+    auto s = inner_->sv_get_str(record_idx_, idx);
+    return std::string_view(s.data(), s.size());
+}
+// Returns {pointer, length} into Rust-owned bytes (no copy); throws if inner_ is null.
+std::pair<const uint8_t*, size_t> RowView::GetBytes(size_t idx) const {
+    CHECK_INNER("RowView");
+    auto bytes = inner_->sv_get_bytes(record_idx_, idx);
+    return {bytes.data(), bytes.size()};
+}
+// Wraps the value from sv_get_date_days in a Date; throws std::logic_error if inner_ is null.
+Date RowView::GetDate(size_t idx) const {
+    CHECK_INNER("RowView");
+    return Date{inner_->sv_get_date_days(record_idx_, idx)};
+}
+// Wraps the value from sv_get_time_millis in a Time; throws std::logic_error if inner_ is null.
+Time RowView::GetTime(size_t idx) const {
+    CHECK_INNER("RowView");
+    return Time{inner_->sv_get_time_millis(record_idx_, idx)};
+}
+// Builds a Timestamp from two Rust calls: sv_get_ts_millis and sv_get_ts_nanos.
+Timestamp RowView::GetTimestamp(size_t idx) const {
+    CHECK_INNER("RowView");
+    return Timestamp{inner_->sv_get_ts_millis(record_idx_, idx),
+                     inner_->sv_get_ts_nanos(record_idx_, idx)};
+}
+// True when GetType(idx) is TypeId::Decimal; GetType throws if inner_ is null.
+bool RowView::IsDecimal(size_t idx) const { return GetType(idx) == TypeId::Decimal; }
+// Copies the decimal's text form from Rust into a std::string; throws if inner_ is null.
+std::string RowView::GetDecimalString(size_t idx) const {
+    CHECK_INNER("RowView");
+    return std::string(inner_->sv_get_decimal_str(record_idx_, idx));
+}
+
+// ============================================================================
+// ScanRecords — backed by opaque Rust ScanResultInner
+// ============================================================================
+// Defaulted constructor; members take the in-class defaults declared in the header.
+ScanRecords::ScanRecords() noexcept = default;
+// Releases the Rust-side scan result, if any, through Destroy().
+ScanRecords::~ScanRecords() noexcept { Destroy(); }
+// Frees inner_ via a temporary rust::Box and drops column_map_; no-op when inner_ is null.
+void ScanRecords::Destroy() noexcept {
+    if (inner_) {
+        rust::Box<ffi::ScanResultInner>::from_raw(inner_);
+        inner_ = nullptr;
+        column_map_.reset();
+    }
+}
+// Move constructor: takes over inner_ and column_map_ and leaves other.inner_ null.
+ScanRecords::ScanRecords(ScanRecords&& other) noexcept
+    : inner_(other.inner_), column_map_(std::move(other.column_map_)) {
+    other.inner_ = nullptr;
+}
+// Move assignment: frees the current result, then takes over other's inner_ and column_map_.
+ScanRecords& ScanRecords::operator=(ScanRecords&& other) noexcept {
+    if (this != &other) {
+        Destroy();
+        inner_ = other.inner_;
+        column_map_ = std::move(other.column_map_);
+        other.inner_ = nullptr;
+    }
+    return *this;
+}
+// Number of records in the result, or 0 when inner_ is null.
+size_t ScanRecords::Size() const { return inner_ ? inner_->sv_record_count() : 0; }
+// True when Size() is 0, which includes the null-inner_ case.
+bool ScanRecords::Empty() const { return Size() == 0; }
+// Rebuilds column_map_ as name -> {index, TypeId} from Rust metadata; no-op if inner_ is null.
+void ScanRecords::BuildColumnMap() const {
+    if (!inner_) return;
+    auto map = std::make_shared<detail::ColumnMap>();
+    auto count = inner_->sv_column_count();
+    for (size_t i = 0; i < count; ++i) {
+        auto name = inner_->sv_column_name(i);
+        (*map)[std::string(name.data(), name.size())] = {
+            i, static_cast<TypeId>(inner_->sv_column_type(i))};
+    }
+    column_map_ = std::move(map);
+}
+// Returns column_map_, building it on first use; it stays null while inner_ is null.
+const std::shared_ptr<detail::ColumnMap>& ScanRecords::GetColumnMap() const {
+    if (!column_map_) {
+        BuildColumnMap();
+    }
+    return column_map_;
+}
+// Record idx as metadata + RowView; throws logic_error (null inner_) or out_of_range (bad idx).
+ScanRecord ScanRecords::operator[](size_t idx) const {
+    if (!inner_) {
+        throw std::logic_error("ScanRecords: not available (moved-from or null)");
+    }
+    if (idx >= inner_->sv_record_count()) {
+        throw std::out_of_range("ScanRecords: index " + std::to_string(idx) + " out of range (" +
+                                std::to_string(inner_->sv_record_count()) + " records)");
+    }
+    return ScanRecord{inner_->sv_bucket_id(idx),
+                      inner_->sv_has_partition_id(idx)
+                          ? std::optional<int64_t>(inner_->sv_partition_id(idx))
+                          : std::nullopt,
+                      inner_->sv_offset(idx),
+                      inner_->sv_timestamp(idx),
+                      static_cast<ChangeType>(inner_->sv_change_type(idx)),
+                      RowView(inner_, idx, GetColumnMap().get())};  // raw ptrs: don't outlive *this
+}
+// Dereference yields owner_->operator[](idx_), including its null and range checks.
+ScanRecord ScanRecords::Iterator::operator*() const { return owner_->operator[](idx_); }
+
+// ============================================================================
+// LookupResult — backed by opaque Rust LookupResultInner
+// ============================================================================
+// Defaulted constructor; members take the in-class defaults declared in the header.
+LookupResult::LookupResult() noexcept = default;
+// Releases the Rust-side lookup result, if any, through Destroy().
+LookupResult::~LookupResult() noexcept { Destroy(); }
+// Frees inner_ via a temporary rust::Box and drops column_map_; no-op when inner_ is null.
+void LookupResult::Destroy() noexcept {
+    if (inner_) {
+        rust::Box<ffi::LookupResultInner>::from_raw(inner_);
+        inner_ = nullptr;
+        column_map_.reset();
+    }
+}
+// Move constructor: takes over inner_ and column_map_ and leaves other.inner_ null.
+LookupResult::LookupResult(LookupResult&& other) noexcept
+    : inner_(other.inner_), column_map_(std::move(other.column_map_)) {
+    other.inner_ = nullptr;
+}
+// Move assignment: frees the current result, then takes over other's inner_ and column_map_.
+LookupResult& LookupResult::operator=(LookupResult&& other) noexcept {
+    if (this != &other) {
+        Destroy();
+        inner_ = other.inner_;
+        column_map_ = std::move(other.column_map_);
+        other.inner_ = nullptr;
+    }
+    return *this;
+}
+// Rebuilds column_map_ as name -> {index, TypeId} from Rust metadata; no-op if inner_ is null.
+void LookupResult::BuildColumnMap() const {
+    if (!inner_) return;
+    auto map = std::make_shared<detail::ColumnMap>();
+    auto count = inner_->lv_field_count();
+    for (size_t i = 0; i < count; ++i) {
+        auto name = inner_->lv_column_name(i);
+        (*map)[std::string(name.data(), name.size())] = {
+            i, static_cast<TypeId>(inner_->lv_column_type(i))};
+    }
+    column_map_ = std::move(map);
+}
+// True only when inner_ is non-null and the Rust side reports the lookup as found.
+bool LookupResult::Found() const { return inner_ && inner_->lv_found(); }
+// Field count reported by the lookup result, or 0 when inner_ is null.
+size_t LookupResult::FieldCount() const { return inner_ ? inner_->lv_field_count() : 0; }
+// Column type at idx, cast to TypeId; throws std::logic_error if inner_ is null.
+TypeId LookupResult::GetType(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return static_cast<TypeId>(inner_->lv_column_type(idx));
+}
+// Scalar getters: throw std::logic_error if inner_ is null; Rust returns Err when no row exists.
+bool LookupResult::IsNull(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_is_null(idx);  // a Rust Err surfaces as rust::Error (cxx)
+}
+bool LookupResult::GetBool(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_bool(idx);
+}
+int32_t LookupResult::GetInt32(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_i32(idx);
+}
+int64_t LookupResult::GetInt64(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_i64(idx);
+}
+float LookupResult::GetFloat32(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_f32(idx);
+}
+double LookupResult::GetFloat64(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_f64(idx);
+}
+// Returns a view into Rust-owned string data (no copy); throws if inner_ is null.
+std::string_view LookupResult::GetString(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    auto s = inner_->lv_get_str(idx);
+    return std::string_view(s.data(), s.size());
+}
+// Returns {pointer, length} into Rust-owned bytes (no copy); throws if inner_ is null.
+std::pair<const uint8_t*, size_t> LookupResult::GetBytes(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    auto bytes = inner_->lv_get_bytes(idx);
+    return {bytes.data(), bytes.size()};
+}
+// Wraps the value from lv_get_date_days in a Date; throws std::logic_error if inner_ is null.
+Date LookupResult::GetDate(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return Date{inner_->lv_get_date_days(idx)};
+}
+// Wraps the value from lv_get_time_millis in a Time; throws std::logic_error if inner_ is null.
+Time LookupResult::GetTime(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return Time{inner_->lv_get_time_millis(idx)};
+}
+// Builds a Timestamp from two Rust calls: lv_get_ts_millis and lv_get_ts_nanos.
+Timestamp LookupResult::GetTimestamp(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return Timestamp{inner_->lv_get_ts_millis(idx), inner_->lv_get_ts_nanos(idx)};
+}
+// True when GetType(idx) is TypeId::Decimal; GetType throws if inner_ is null.
+bool LookupResult::IsDecimal(size_t idx) const { return GetType(idx) == TypeId::Decimal; }
+// Copies the decimal's text form from Rust into a std::string; throws if inner_ is null.
+std::string LookupResult::GetDecimalString(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return std::string(inner_->lv_get_decimal_str(idx));
+}
+
+// ============================================================================
+// Table
+// ============================================================================
+
 Table::Table() noexcept = default;
 
 Table::Table(ffi::Table* table) noexcept : table_(table) {}
@@ -117,7 +489,51 @@ TableLookup Table::NewLookup() { return TableLookup(table_); }
 
 TableScan Table::NewScan() { return TableScan(table_); }
 
-// TableAppend implementation
+const std::shared_ptr<GenericRow::ColumnMap>& Table::GetColumnMap() const {
+    if (!column_map_ && Available()) {  // build once; later calls reuse the cached map
+        auto info = GetTableInfo();
+        column_map_ = std::make_shared<GenericRow::ColumnMap>();
+        for (size_t i = 0; i < info.schema.columns.size(); ++i) {
+            (*column_map_)[info.schema.columns[i].name] = {i,
+                                                           info.schema.columns[i].data_type.id()};
+        }
+    }
+    return column_map_;  // still null if the table is unavailable and nothing was cached
+}
+// Creates a default-constructed GenericRow that shares this table's cached column map.
+GenericRow Table::NewRow() const {
+    GenericRow row;
+    row.column_map_ = GetColumnMap();
+    return row;
+}
+// Converts the Rust table info into a TableInfo; returns a default TableInfo when unavailable.
+TableInfo Table::GetTableInfo() const {
+    if (!Available()) {
+        return TableInfo{};
+    }
+    auto ffi_info = table_->get_table_info_from_table();
+    return utils::from_ffi_table_info(ffi_info);
+}
+// Copies database and table name out of the Rust path; default TablePath when unavailable.
+TablePath Table::GetTablePath() const {
+    if (!Available()) {
+        return TablePath{};
+    }
+    auto ffi_path = table_->get_table_path();
+    return TablePath{std::string(ffi_path.database_name), std::string(ffi_path.table_name)};
+}
+// Asks Rust whether the table has a primary key; false when the table is unavailable.
+bool Table::HasPrimaryKey() const {
+    if (!Available()) {
+        return false;
+    }
+    return table_->has_primary_key();
+}
+
+// ============================================================================
+// TableAppend
+// ============================================================================
+
 TableAppend::TableAppend(ffi::Table* table) noexcept : table_(table) {}
 
 Result TableAppend::CreateWriter(AppendWriter& out) {
@@ -135,7 +551,10 @@ Result TableAppend::CreateWriter(AppendWriter& out) {
     }
 }
 
-// TableUpsert implementation
+// ============================================================================
+// TableUpsert
+// ============================================================================
+
 TableUpsert::TableUpsert(ffi::Table* table) noexcept : table_(table) {}
 
 TableUpsert& TableUpsert::PartialUpdateByIndex(std::vector<size_t> column_indices) {
@@ -198,7 +617,10 @@ Result TableUpsert::CreateWriter(UpsertWriter& out) {
     }
 }
 
-// TableLookup implementation
+// ============================================================================
+// TableLookup
+// ============================================================================
+
 TableLookup::TableLookup(ffi::Table* table) noexcept : table_(table) {}
 
 Result TableLookup::CreateLookuper(Lookuper& out) {
@@ -216,7 +638,10 @@ Result TableLookup::CreateLookuper(Lookuper& out) {
     }
 }
 
-// TableScan implementation
+// ============================================================================
+// TableScan
+// ============================================================================
+
 TableScan::TableScan(ffi::Table* table) noexcept : table_(table) {}
 
 TableScan& TableScan::ProjectByIndex(std::vector<size_t> column_indices) {
@@ -278,48 +703,10 @@ Result TableScan::DoCreateScanner(LogScanner& out, bool is_record_batch) {
     }
 }
 
-const std::shared_ptr<GenericRow::ColumnMap>& Table::GetColumnMap() const {
-    if (!column_map_ && Available()) {
-        auto info = GetTableInfo();
-        column_map_ = std::make_shared<GenericRow::ColumnMap>();
-        for (size_t i = 0; i < info.schema.columns.size(); ++i) {
-            (*column_map_)[info.schema.columns[i].name] = {i,
-                                                           info.schema.columns[i].data_type.id()};
-        }
-    }
-    return column_map_;
-}
-
-GenericRow Table::NewRow() const {
-    GenericRow row;
-    row.column_map_ = GetColumnMap();
-    return row;
-}
-
-TableInfo Table::GetTableInfo() const {
-    if (!Available()) {
-        return TableInfo{};
-    }
-    auto ffi_info = table_->get_table_info_from_table();
-    return utils::from_ffi_table_info(ffi_info);
-}
+// ============================================================================
+// WriteResult
+// ============================================================================
 
-TablePath Table::GetTablePath() const {
-    if (!Available()) {
-        return TablePath{};
-    }
-    auto ffi_path = table_->get_table_path();
-    return TablePath{std::string(ffi_path.database_name), std::string(ffi_path.table_name)};
-}
-
-bool Table::HasPrimaryKey() const {
-    if (!Available()) {
-        return false;
-    }
-    return table_->has_primary_key();
-}
-
-// WriteResult implementation
 WriteResult::WriteResult() noexcept = default;
 
 WriteResult::WriteResult(ffi::WriteResult* inner) noexcept : inner_(inner) {}
@@ -358,7 +745,10 @@ Result WriteResult::Wait() {
     return utils::from_ffi_result(ffi_result);
 }
 
-// AppendWriter implementation
+// ============================================================================
+// AppendWriter
+// ============================================================================
+
 AppendWriter::AppendWriter() noexcept = default;
 
 AppendWriter::AppendWriter(ffi::AppendWriter* writer) noexcept : writer_(writer) {}
@@ -396,10 +786,12 @@ Result AppendWriter::Append(const GenericRow& row, WriteResult& out) {
     if (!Available()) {
         return utils::make_client_error("AppendWriter not available");
     }
+    if (!row.Available()) {
+        return utils::make_client_error("GenericRow not available");
+    }
 
     try {
-        auto ffi_row = utils::to_ffi_generic_row(row);
-        auto rust_box = writer_->append(ffi_row);
+        auto rust_box = writer_->append(*row.inner_);
         out = WriteResult(rust_box.into_raw());
         return utils::make_ok();
     } catch (const rust::Error& e) {
@@ -409,6 +801,47 @@ Result AppendWriter::Append(const GenericRow& row, WriteResult& out) {
     }
 }
 
+Result AppendWriter::AppendArrowBatch(const std::shared_ptr<arrow::RecordBatch>& batch) {
+    WriteResult wr;  // local result handle; it is destroyed when this overload returns
+    return AppendArrowBatch(batch, wr);
+}
+// Exports batch through the Arrow C Data Interface and hands it to Rust; out gets the result.
+Result AppendWriter::AppendArrowBatch(const std::shared_ptr<arrow::RecordBatch>& batch,
+                                      WriteResult& out) {
+    if (!Available()) {
+        return utils::make_client_error("AppendWriter not available");
+    }
+    if (!batch) {
+        return utils::make_client_error("Arrow RecordBatch is null");
+    }
+
+    // Export the batch into C Data Interface structs (c_array / c_schema).
+    struct ArrowArray c_array;
+    struct ArrowSchema c_schema;
+    auto status = arrow::ExportRecordBatch(*batch, &c_array, &c_schema);
+    if (!status.ok()) {
+        return utils::make_client_error("Failed to export Arrow batch: " + status.ToString());
+    }
+
+    // Heap-allocate copies for Rust. NOTE(review): a throwing `new` here is outside the try below.
+    auto* array_heap = new ArrowArray(std::move(c_array));
+    auto* schema_heap = new ArrowSchema(std::move(c_schema));
+
+    try {
+        // Rust takes ownership of both pointers immediately via Box::from_raw(),
+        // so after this call (success or exception) C++ must NOT free them.
+        auto result_box = writer_->append_arrow_batch(reinterpret_cast<size_t>(array_heap),
+                                                      reinterpret_cast<size_t>(schema_heap));
+        out.Destroy();  // presumably frees any result out already holds (defined elsewhere)
+        out.inner_ = result_box.into_raw();
+        return utils::make_ok();
+    } catch (const rust::Error& e) {
+        return utils::make_client_error(std::string(e.what()));
+    } catch (const std::exception& e) {
+        return utils::make_client_error(std::string(e.what()));
+    }
+}
+
 Result AppendWriter::Flush() {
     if (!Available()) {
         return utils::make_client_error("AppendWriter not available");
@@ -418,7 +851,10 @@ Result AppendWriter::Flush() {
     return utils::from_ffi_result(ffi_result);
 }
 
-// UpsertWriter implementation
+// ============================================================================
+// UpsertWriter
+// ============================================================================
+
 UpsertWriter::UpsertWriter() noexcept = default;
 
 UpsertWriter::UpsertWriter(ffi::UpsertWriter* writer) noexcept : writer_(writer) {}
@@ -456,10 +892,12 @@ Result UpsertWriter::Upsert(const GenericRow& row, WriteResult& out) {
     if (!Available()) {
         return utils::make_client_error("UpsertWriter not available");
     }
+    if (!row.Available()) {
+        return utils::make_client_error("GenericRow not available");
+    }
 
     try {
-        auto ffi_row = utils::to_ffi_generic_row(row);
-        auto rust_box = writer_->upsert(ffi_row);
+        auto rust_box = writer_->upsert(*row.inner_);
         out = WriteResult(rust_box.into_raw());
         return utils::make_ok();
     } catch (const rust::Error& e) {
@@ -478,10 +916,12 @@ Result UpsertWriter::Delete(const GenericRow& row, WriteResult& out) {
     if (!Available()) {
         return utils::make_client_error("UpsertWriter not available");
     }
+    if (!row.Available()) {
+        return utils::make_client_error("GenericRow not available");
+    }
 
     try {
-        auto ffi_row = utils::to_ffi_generic_row(row);
-        auto rust_box = writer_->delete_row(ffi_row);
+        auto rust_box = writer_->delete_row(*row.inner_);
         out = WriteResult(rust_box.into_raw());
         return utils::make_ok();
     } catch (const rust::Error& e) {
@@ -500,7 +940,10 @@ Result UpsertWriter::Flush() {
     return utils::from_ffi_result(ffi_result);
 }
 
-// Lookuper implementation
+// ============================================================================
+// Lookuper
+// ============================================================================
+
 Lookuper::Lookuper() noexcept = default;
 
 Lookuper::Lookuper(ffi::Lookuper* lookuper) noexcept : lookuper_(lookuper) {}
@@ -529,34 +972,29 @@ Lookuper& Lookuper::operator=(Lookuper&& other) noexcept {
 
 bool Lookuper::Available() const { return lookuper_ != nullptr; }
 
-Result Lookuper::Lookup(const GenericRow& pk_row, bool& found, GenericRow& out) {
+Result Lookuper::Lookup(const GenericRow& pk_row, LookupResult& out) {
     if (!Available()) {
         return utils::make_client_error("Lookuper not available");
     }
+    if (!pk_row.Available()) {  // checked before *pk_row.inner_ is dereferenced below
+        return utils::make_client_error("GenericRow not available");
+    }
 
-    try {
-        auto ffi_row = utils::to_ffi_generic_row(pk_row);
-        auto ffi_result = lookuper_->lookup(ffi_row);
-        auto result = utils::from_ffi_result(ffi_result.result);
-        if (!result.Ok()) {
-            found = false;
-            return result;
-        }
-        found = ffi_result.found;
-        if (found) {
-            out = utils::from_ffi_generic_row(ffi_result.row);
-        }
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        found = false;
-        return utils::make_client_error(e.what());
-    } catch (const std::exception& e) {
-        found = false;
-        return utils::make_client_error(e.what());
+    auto result_box = lookuper_->lookup(*pk_row.inner_);
+    if (result_box->lv_has_error()) {  // failure is reported through the returned box
+        return utils::make_error(result_box->lv_error_code(),
+                                 std::string(result_box->lv_error_message()));
     }
+
+    out.Destroy();  // presumably releases any handle `out` already holds - confirm
+    out.inner_ = result_box.into_raw();  // `out` takes over the pointer released by the box
+    return utils::make_ok();
 }
 
-// LogScanner implementation
+// ============================================================================
+// LogScanner
+// ============================================================================
+
 LogScanner::LogScanner() noexcept = default;
 
 LogScanner::LogScanner(ffi::LogScanner* scanner) noexcept : scanner_(scanner) {}
@@ -663,13 +1101,14 @@ Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
         return utils::make_client_error("LogScanner not available");
     }
 
-    auto ffi_result = scanner_->poll(timeout_ms);
-    auto result = utils::from_ffi_result(ffi_result.result);
-    if (!result.Ok()) {
-        return result;
+    auto result_box = scanner_->poll(timeout_ms);
+    if (result_box->sv_has_error()) {
+        return utils::make_error(result_box->sv_error_code(),
+                                 std::string(result_box->sv_error_message()));
     }
 
-    out = utils::from_ffi_scan_records(ffi_result.scan_records);
+    out.Destroy();
+    out.inner_ = result_box.into_raw();
     return utils::make_ok();
 }
 
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 17aa872109..073a16817f 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -17,20 +17,12 @@
 
 use crate::ffi;
 use anyhow::{Result, anyhow};
-use arrow::array::{
-    Date32Array, Decimal128Array, LargeBinaryArray, LargeStringArray, Time32MillisecondArray,
-    Time32SecondArray, Time64MicrosecondArray, Time64NanosecondArray, TimestampMicrosecondArray,
-    TimestampMillisecondArray, TimestampNanosecondArray, TimestampSecondArray,
-};
-use arrow::datatypes::{DataType as ArrowDataType, TimeUnit};
+use arrow::array::Array;
 use arrow::ffi::{FFI_ArrowArray, FFI_ArrowSchema};
-use fcore::row::InternalRow;
 use fluss as fcore;
 use std::borrow::Cow;
 use std::str::FromStr;
 
-use arrow::array::Array;
-
 pub const DATA_TYPE_BOOLEAN: i32 = 1;
 pub const DATA_TYPE_TINYINT: i32 = 2;
 pub const DATA_TYPE_SMALLINT: i32 = 3;
@@ -45,27 +37,10 @@ pub const DATA_TYPE_TIME: i32 = 11;
 pub const DATA_TYPE_TIMESTAMP: i32 = 12;
 pub const DATA_TYPE_TIMESTAMP_LTZ: i32 = 13;
 pub const DATA_TYPE_DECIMAL: i32 = 14;
+pub const DATA_TYPE_CHAR: i32 = 15;
+pub const DATA_TYPE_BINARY: i32 = 16;
 
-pub const DATUM_TYPE_NULL: i32 = 0;
-pub const DATUM_TYPE_BOOL: i32 = 1;
-pub const DATUM_TYPE_INT32: i32 = 2;
-pub const DATUM_TYPE_INT64: i32 = 3;
-pub const DATUM_TYPE_FLOAT32: i32 = 4;
-pub const DATUM_TYPE_FLOAT64: i32 = 5;
-pub const DATUM_TYPE_STRING: i32 = 6;
-pub const DATUM_TYPE_BYTES: i32 = 7;
-pub const DATUM_TYPE_DECIMAL_I64: i32 = 8;
-pub const DATUM_TYPE_DECIMAL_I128: i32 = 9;
-pub const DATUM_TYPE_DECIMAL_STRING: i32 = 10;
-pub const DATUM_TYPE_DATE: i32 = 11;
-pub const DATUM_TYPE_TIME: i32 = 12;
-pub const DATUM_TYPE_TIMESTAMP_NTZ: i32 = 13;
-pub const DATUM_TYPE_TIMESTAMP_LTZ: i32 = 14;
-
-const MILLIS_PER_SECOND: i64 = 1_000;
-const MICROS_PER_MILLI: i64 = 1_000;
-const NANOS_PER_MICRO: i64 = 1_000;
-const NANOS_PER_MILLI: i64 = 1_000_000;
+// DATUM_TYPE_* constants removed — no longer needed with opaque types.
 
 fn ffi_data_type_to_core(dt: i32, precision: u32, scale: u32) -> Result<fcore::metadata::DataType> {
     match dt {
@@ -90,11 +65,13 @@ fn ffi_data_type_to_core(dt: i32, precision: u32, scale: u32) -> Result<fcore::m
             let dt = fcore::metadata::DecimalType::new(precision, scale)?;
             Ok(fcore::metadata::DataType::Decimal(dt))
         }
+        DATA_TYPE_CHAR => Ok(fcore::metadata::DataTypes::char(precision)),
+        DATA_TYPE_BINARY => Ok(fcore::metadata::DataTypes::binary(precision as usize)),
         _ => Err(anyhow!("Unknown data type: {dt}")),
     }
 }
 
-fn core_data_type_to_ffi(dt: &fcore::metadata::DataType) -> i32 {
+pub fn core_data_type_to_ffi(dt: &fcore::metadata::DataType) -> i32 {
     match dt {
         fcore::metadata::DataType::Boolean(_) => DATA_TYPE_BOOLEAN,
         fcore::metadata::DataType::TinyInt(_) => DATA_TYPE_TINYINT,
@@ -110,6 +87,8 @@ fn core_data_type_to_ffi(dt: &fcore::metadata::DataType) -> i32 {
         fcore::metadata::DataType::Timestamp(_) => DATA_TYPE_TIMESTAMP,
         fcore::metadata::DataType::TimestampLTz(_) => DATA_TYPE_TIMESTAMP_LTZ,
         fcore::metadata::DataType::Decimal(_) => DATA_TYPE_DECIMAL,
+        fcore::metadata::DataType::Char(_) => DATA_TYPE_CHAR,
+        fcore::metadata::DataType::Binary(_) => DATA_TYPE_BINARY,
         _ => 0,
     }
 }
@@ -156,6 +135,15 @@ pub fn ffi_descriptor_to_core(
         builder = builder.property(&prop.key, &prop.value);
     }
 
+    if !descriptor.custom_properties.is_empty() {
+        let custom: std::collections::HashMap<String, String> = descriptor
+            .custom_properties
+            .iter()
+            .map(|kv| (kv.key.clone(), kv.value.clone()))
+            .collect();
+        builder = builder.custom_properties(custom);
+    }
+
     if !descriptor.comment.is_empty() {
         builder = builder.comment(&descriptor.comment);
     }
@@ -175,6 +163,8 @@ pub fn core_table_info_to_ffi(info: &fcore::metadata::TableInfo) -> ffi::FfiTabl
                 }
                 fcore::metadata::DataType::Timestamp(dt) => (dt.precision() as i32, 0),
                 fcore::metadata::DataType::TimestampLTz(dt) => (dt.precision() as i32, 0),
+                fcore::metadata::DataType::Char(dt) => (dt.length() as i32, 0),
+                fcore::metadata::DataType::Binary(dt) => (dt.length() as i32, 0),
                 _ => (0, 0),
             };
             ffi::FfiColumn {
@@ -201,6 +191,15 @@ pub fn core_table_info_to_ffi(info: &fcore::metadata::TableInfo) -> ffi::FfiTabl
         })
         .collect();
 
+    let custom_properties: Vec<ffi::HashMapValue> = info
+        .get_custom_properties()
+        .iter()
+        .map(|(k, v)| ffi::HashMapValue {
+            key: k.clone(),
+            value: v.clone(),
+        })
+        .collect();
+
     ffi::FfiTableInfo {
         table_id: info.get_table_id(),
         schema_id: info.get_schema_id(),
@@ -217,6 +216,7 @@ pub fn core_table_info_to_ffi(info: &fcore::metadata::TableInfo) -> ffi::FfiTabl
         has_primary_key: info.has_primary_key(),
         is_partitioned: info.is_partitioned(),
         properties,
+        custom_properties,
         comment: info.get_comment().unwrap_or("").to_string(),
         schema: ffi::FfiSchema {
             columns,
@@ -242,6 +242,7 @@ pub fn empty_table_info() -> ffi::FfiTableInfo {
         has_primary_key: false,
         is_partitioned: false,
         properties: vec![],
+        custom_properties: vec![],
         comment: String::new(),
         schema: ffi::FfiSchema {
             columns: vec![],
@@ -293,527 +294,127 @@ pub fn core_database_info_to_ffi(info: &fcore::metadata::DatabaseInfo) -> ffi::F
     }
 }
 
-/// Look up decimal (precision, scale) from schema for column `idx`.
-fn get_decimal_type(idx: usize, schema: Option<&fcore::metadata::Schema>) -> Result<(u32, u32)> {
-    let col = schema
-        .and_then(|s| s.columns().get(idx))
-        .ok_or_else(|| anyhow!("Schema not available for decimal column {idx}"))?;
-    match col.data_type() {
-        fcore::metadata::DataType::Decimal(dt) => Ok((dt.precision(), dt.scale())),
-        other => Err(anyhow!("Column {idx} is {other:?}, not Decimal")),
-    }
-}
-
-pub fn ffi_row_to_core<'a>(
-    row: &'a ffi::FfiGenericRow,
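+/// Resolve types in a GenericRow using schema metadata, returning an owned (`'static`) copy.
+/// Narrows Int32 → Int8/Int16 (erroring on overflow) and parses strings in Decimal columns;
+/// other values are copied unchanged. Used by both AppendWriter and UpsertWriter.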
+pub fn resolve_row_types(
+    row: &fcore::row::GenericRow<'_>,
     schema: Option<&fcore::metadata::Schema>,
-) -> Result<fcore::row::GenericRow<'a>> {
+) -> Result<fcore::row::GenericRow<'static>> {
     use fcore::row::Datum;
 
-    let mut generic_row = fcore::row::GenericRow::new(row.fields.len());
+    let mut out = fcore::row::GenericRow::new(row.values.len());
 
-    for (idx, field) in row.fields.iter().enumerate() {
-        let datum = match field.datum_type {
-            DATUM_TYPE_NULL => Datum::Null,
-            DATUM_TYPE_BOOL => Datum::Bool(field.bool_val),
-            DATUM_TYPE_INT32 => match schema
+    for (idx, datum) in row.values.iter().enumerate() {
+        let resolved = match datum {
+            Datum::Null => Datum::Null,
+            Datum::Bool(v) => Datum::Bool(*v),
+            Datum::Int32(v) => match schema
                 .and_then(|s| s.columns().get(idx))
                 .map(|c| c.data_type())
             {
-                Some(fcore::metadata::DataType::TinyInt(_)) => {
-                    Datum::Int8(i8::try_from(field.i32_val).map_err(|_| {
-                        anyhow!("Column {idx}: {} overflows TinyInt", field.i32_val)
-                    })?)
-                }
-                Some(fcore::metadata::DataType::SmallInt(_)) => {
-                    Datum::Int16(i16::try_from(field.i32_val).map_err(|_| {
-                        anyhow!("Column {idx}: {} overflows SmallInt", field.i32_val)
-                    })?)
-                }
-                _ => Datum::Int32(field.i32_val),
-            },
-            DATUM_TYPE_INT64 => Datum::Int64(field.i64_val),
-            DATUM_TYPE_FLOAT32 => Datum::Float32(field.f32_val.into()),
-            DATUM_TYPE_FLOAT64 => Datum::Float64(field.f64_val.into()),
-            DATUM_TYPE_STRING => Datum::String(Cow::Borrowed(field.string_val.as_str())),
-            DATUM_TYPE_BYTES => Datum::Blob(Cow::Borrowed(field.bytes_val.as_slice())),
-            DATUM_TYPE_DECIMAL_STRING => {
-                let (precision, scale) = get_decimal_type(idx, schema)?;
-                let bd =
-                    bigdecimal::BigDecimal::from_str(field.string_val.as_str()).map_err(|e| {
-                        anyhow!(
-                            "Column {idx}: invalid decimal string '{}': {e}",
-                            field.string_val
-                        )
-                    })?;
-                let decimal = fcore::row::Decimal::from_big_decimal(bd, precision, scale)
-                    .map_err(|e| anyhow!("Column {idx}: {e}"))?;
-                Datum::Decimal(decimal)
-            }
-            DATUM_TYPE_DECIMAL_I64 => {
-                let precision = field.decimal_precision as u32;
-                let scale = field.decimal_scale as u32;
-                let decimal =
-                    fcore::row::Decimal::from_unscaled_long(field.i64_val, precision, scale)
-                        .map_err(|e| anyhow!("Column {idx}: {e}"))?;
-                Datum::Decimal(decimal)
-            }
-            DATUM_TYPE_DECIMAL_I128 => {
-                let precision = field.decimal_precision as u32;
-                let scale = field.decimal_scale as u32;
-                let i128_val = ((field.i128_hi as i128) << 64) | (field.i128_lo as u64 as i128);
-                let decimal = fcore::row::Decimal::from_arrow_decimal128(
-                    i128_val,
-                    scale as i64,
-                    precision,
-                    scale,
-                )
-                .map_err(|e| anyhow!("Column {idx}: {e}"))?;
-                Datum::Decimal(decimal)
-            }
-            DATUM_TYPE_DATE => Datum::Date(fcore::row::Date::new(field.i32_val)),
-            DATUM_TYPE_TIME => Datum::Time(fcore::row::Time::new(field.i32_val)),
-            DATUM_TYPE_TIMESTAMP_NTZ => Datum::TimestampNtz(
-                fcore::row::TimestampNtz::from_millis_nanos(field.i64_val, field.i32_val)
-                    .map_err(|e| anyhow!("Column {idx}: {e}"))?,
-            ),
-            DATUM_TYPE_TIMESTAMP_LTZ => Datum::TimestampLtz(
-                fcore::row::TimestampLtz::from_millis_nanos(field.i64_val, field.i32_val)
-                    .map_err(|e| anyhow!("Column {idx}: {e}"))?,
-            ),
-            other => return Err(anyhow!("Column {idx}: unknown datum type {other}")),
-        };
-        generic_row.set_field(idx, datum);
-    }
-
-    Ok(generic_row)
-}
-
-pub fn core_scan_records_to_ffi(
-    records: &fcore::record::ScanRecords,
-    columns: &[fcore::metadata::Column],
-) -> Result<ffi::FfiScanRecords> {
-    let mut ffi_records = Vec::new();
-
-    // Iterate over all buckets and their records
-    for (table_bucket, bucket_records) in records.records_by_buckets() {
-        let bucket_id = table_bucket.bucket_id();
-        for record in bucket_records {
-            let row = record.row();
-            let fields = core_row_to_ffi_fields(row, columns)?;
-
-            ffi_records.push(ffi::FfiScanRecord {
-                bucket_id,
-                offset: record.offset(),
-                timestamp: record.timestamp(),
-                row: ffi::FfiGenericRow { fields },
-            });
-        }
-    }
-
-    Ok(ffi::FfiScanRecords {
-        records: ffi_records,
-    })
-}
-
-fn core_row_to_ffi_fields(
-    row: &fcore::row::ColumnarRow,
-    columns: &[fcore::metadata::Column],
-) -> Result<Vec<ffi::FfiDatum>> {
-    let record_batch = row.get_record_batch();
-    let schema = record_batch.schema();
-    let row_id = row.get_row_id();
-
-    let mut fields = Vec::with_capacity(schema.fields().len());
-
-    for (i, field) in schema.fields().iter().enumerate() {
-        if row.is_null_at(i) {
-            fields.push(ffi::FfiDatum::default());
-            continue;
-        }
-
-        let datum = match field.data_type() {
-            ArrowDataType::Boolean => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_BOOL,
-                bool_val: row.get_boolean(i),
-                ..Default::default()
-            },
-            ArrowDataType::Int8 => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_INT32,
-                i32_val: row.get_byte(i) as i32,
-                ..Default::default()
-            },
-            ArrowDataType::Int16 => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_INT32,
-                i32_val: row.get_short(i) as i32,
-                ..Default::default()
+                Some(fcore::metadata::DataType::TinyInt(_)) => Datum::Int8(
+                    i8::try_from(*v).map_err(|_| anyhow!("Column {idx}: {v} overflows TinyInt"))?,
+                ),
+                Some(fcore::metadata::DataType::SmallInt(_)) => Datum::Int16(
+                    i16::try_from(*v)
+                        .map_err(|_| anyhow!("Column {idx}: {v} overflows SmallInt"))?,
+                ),
+                _ => Datum::Int32(*v),
             },
-            ArrowDataType::Int32 => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_INT32,
-                i32_val: row.get_int(i),
-                ..Default::default()
-            },
-            ArrowDataType::Int64 => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_INT64,
-                i64_val: row.get_long(i),
-                ..Default::default()
-            },
-            ArrowDataType::Float32 => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_FLOAT32,
-                f32_val: row.get_float(i),
-                ..Default::default()
-            },
-            ArrowDataType::Float64 => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_FLOAT64,
-                f64_val: row.get_double(i),
-                ..Default::default()
-            },
-            ArrowDataType::Utf8 => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_STRING,
-                string_val: row.get_string(i).to_string(),
-                ..Default::default()
-            },
-            ArrowDataType::LargeUtf8 => {
-                let array = record_batch
-                    .column(i)
-                    .as_any()
-                    .downcast_ref::<LargeStringArray>()
-                    .ok_or_else(|| anyhow!("Column {i}: expected LargeUtf8 array"))?;
-                ffi::FfiDatum {
-                    datum_type: DATUM_TYPE_STRING,
-                    string_val: array.value(row_id).to_string(),
-                    ..Default::default()
-                }
-            }
-            ArrowDataType::Binary => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_BYTES,
-                bytes_val: row.get_bytes(i).to_vec(),
-                ..Default::default()
-            },
-            ArrowDataType::FixedSizeBinary(len) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_BYTES,
-                bytes_val: row.get_binary(i, *len as usize).to_vec(),
-                ..Default::default()
-            },
-            ArrowDataType::LargeBinary => {
-                let array = record_batch
-                    .column(i)
-                    .as_any()
-                    .downcast_ref::<LargeBinaryArray>()
-                    .ok_or_else(|| anyhow!("Column {i}: expected LargeBinary array"))?;
-                ffi::FfiDatum {
-                    datum_type: DATUM_TYPE_BYTES,
-                    bytes_val: array.value(row_id).to_vec(),
-                    ..Default::default()
-                }
-            }
-            ArrowDataType::Date32 => {
-                let array = record_batch
-                    .column(i)
-                    .as_any()
-                    .downcast_ref::<Date32Array>()
-                    .ok_or_else(|| anyhow!("Column {i}: expected Date32 array"))?;
-                ffi::FfiDatum {
-                    datum_type: DATUM_TYPE_DATE,
-                    i32_val: array.value(row_id),
-                    ..Default::default()
-                }
-            }
-            ArrowDataType::Timestamp(unit, _tz) => {
-                let datum_type = match columns.get(i).map(|c| c.data_type()) {
-                    Some(fcore::metadata::DataType::TimestampLTz(_)) => DATUM_TYPE_TIMESTAMP_LTZ,
-                    _ => DATUM_TYPE_TIMESTAMP_NTZ,
-                };
-                let mut datum = ffi::FfiDatum {
-                    datum_type,
-                    ..Default::default()
-                };
-                match unit {
-                    TimeUnit::Second => {
-                        let array = record_batch
-                            .column(i)
-                            .as_any()
-                            .downcast_ref::<TimestampSecondArray>()
-                            .ok_or_else(|| {
-                                anyhow!("Column {i}: expected Timestamp(second) array")
-                            })?;
-                        datum.i64_val = array.value(row_id) * MILLIS_PER_SECOND;
-                    }
-                    TimeUnit::Millisecond => {
-                        let array = record_batch
-                            .column(i)
-                            .as_any()
-                            .downcast_ref::<TimestampMillisecondArray>()
-                            .ok_or_else(|| {
-                                anyhow!("Column {i}: expected Timestamp(millisecond) array")
-                            })?;
-                        datum.i64_val = array.value(row_id);
-                    }
-                    TimeUnit::Microsecond => {
-                        let array = record_batch
-                            .column(i)
-                            .as_any()
-                            .downcast_ref::<TimestampMicrosecondArray>()
-                            .ok_or_else(|| {
-                                anyhow!("Column {i}: expected Timestamp(microsecond) array")
-                            })?;
-                        let micros = array.value(row_id);
-                        datum.i64_val = micros.div_euclid(MICROS_PER_MILLI);
-                        datum.i32_val =
-                            (micros.rem_euclid(MICROS_PER_MILLI) * NANOS_PER_MICRO) as i32;
-                    }
-                    TimeUnit::Nanosecond => {
-                        let array = record_batch
-                            .column(i)
-                            .as_any()
-                            .downcast_ref::<TimestampNanosecondArray>()
-                            .ok_or_else(|| {
-                                anyhow!("Column {i}: expected Timestamp(nanosecond) array")
-                            })?;
-                        let nanos = array.value(row_id);
-                        datum.i64_val = nanos.div_euclid(NANOS_PER_MILLI);
-                        datum.i32_val = nanos.rem_euclid(NANOS_PER_MILLI) as i32;
-                    }
-                }
-                datum
-            }
-            ArrowDataType::Time32(unit) => match unit {
-                TimeUnit::Second => {
-                    let array = record_batch
-                        .column(i)
-                        .as_any()
-                        .downcast_ref::<Time32SecondArray>()
-                        .ok_or_else(|| anyhow!("Column {i}: expected Time32(second) array"))?;
-                    ffi::FfiDatum {
-                        datum_type: DATUM_TYPE_TIME,
-                        i32_val: array.value(row_id) * MILLIS_PER_SECOND as i32,
-                        ..Default::default()
-                    }
-                }
-                TimeUnit::Millisecond => {
-                    let array = record_batch
-                        .column(i)
-                        .as_any()
-                        .downcast_ref::<Time32MillisecondArray>()
-                        .ok_or_else(|| anyhow!("Column {i}: expected Time32(millisecond) array"))?;
-                    ffi::FfiDatum {
-                        datum_type: DATUM_TYPE_TIME,
-                        i32_val: array.value(row_id),
-                        ..Default::default()
-                    }
-                }
-                _ => return Err(anyhow!("Column {i}: unsupported Time32 unit")),
-            },
-            ArrowDataType::Time64(unit) => match unit {
-                TimeUnit::Microsecond => {
-                    let array = record_batch
-                        .column(i)
-                        .as_any()
-                        .downcast_ref::<Time64MicrosecondArray>()
-                        .ok_or_else(|| anyhow!("Column {i}: expected Time64(microsecond) array"))?;
-                    ffi::FfiDatum {
-                        datum_type: DATUM_TYPE_TIME,
-                        i32_val: (array.value(row_id) / MICROS_PER_MILLI) as i32,
-                        ..Default::default()
-                    }
-                }
-                TimeUnit::Nanosecond => {
-                    let array = record_batch
-                        .column(i)
-                        .as_any()
-                        .downcast_ref::<Time64NanosecondArray>()
-                        .ok_or_else(|| anyhow!("Column {i}: expected Time64(nanosecond) array"))?;
-                    ffi::FfiDatum {
-                        datum_type: DATUM_TYPE_TIME,
-                        i32_val: (array.value(row_id) / NANOS_PER_MILLI) as i32,
-                        ..Default::default()
-                    }
-                }
-                _ => return Err(anyhow!("Column {i}: unsupported Time64 unit")),
-            },
-            ArrowDataType::Decimal128(precision, scale) => {
-                let array = record_batch
-                    .column(i)
-                    .as_any()
-                    .downcast_ref::<Decimal128Array>()
-                    .ok_or_else(|| anyhow!("Column {i}: expected Decimal128 array"))?;
-                let i128_val = array.value(row_id);
-
-                if fcore::row::Decimal::is_compact_precision(*precision as u32) {
-                    ffi::FfiDatum {
-                        datum_type: DATUM_TYPE_DECIMAL_I64,
-                        i64_val: i128_val as i64,
-                        decimal_precision: *precision as i32,
-                        decimal_scale: *scale as i32,
-                        ..Default::default()
-                    }
-                } else {
-                    ffi::FfiDatum {
-                        datum_type: DATUM_TYPE_DECIMAL_I128,
-                        i128_hi: (i128_val >> 64) as i64,
-                        i128_lo: i128_val as i64,
-                        decimal_precision: *precision as i32,
-                        decimal_scale: *scale as i32,
-                        ..Default::default()
+            Datum::Int64(v) => Datum::Int64(*v),
+            Datum::Float32(v) => Datum::Float32(*v),
+            Datum::Float64(v) => Datum::Float64(*v),
+            Datum::Int8(v) => Datum::Int8(*v),
+            Datum::Int16(v) => Datum::Int16(*v),
+            Datum::String(cow) => {
+                // Check if the schema column is Decimal — if so, parse the string as decimal
+                match schema
+                    .and_then(|s| s.columns().get(idx))
+                    .map(|c| c.data_type())
+                {
+                    Some(fcore::metadata::DataType::Decimal(dt)) => {
+                        let (precision, scale) = (dt.precision(), dt.scale());
+                        let bd = bigdecimal::BigDecimal::from_str(cow.as_ref()).map_err(|e| {
+                            anyhow!("Column {idx}: invalid decimal string '{}': {e}", cow)
+                        })?;
+                        let decimal = fcore::row::Decimal::from_big_decimal(bd, precision, scale)
+                            .map_err(|e| anyhow!("Column {idx}: {e}"))?;
+                        Datum::Decimal(decimal)
                     }
+                    _ => Datum::String(Cow::Owned(cow.to_string())),
                 }
             }
-            other => return Err(anyhow!("Column {i}: unsupported Arrow data type {other:?}")),
+            Datum::Blob(cow) => Datum::Blob(Cow::Owned(cow.to_vec())),
+            Datum::Decimal(d) => Datum::Decimal(d.clone()),
+            Datum::Date(d) => Datum::Date(*d),
+            Datum::Time(t) => Datum::Time(*t),
+            Datum::TimestampNtz(ts) => Datum::TimestampNtz(*ts),
+            Datum::TimestampLtz(ts) => Datum::TimestampLtz(*ts),
         };
-
-        fields.push(datum);
+        out.set_field(idx, resolved);
     }
 
-    Ok(fields)
+    Ok(out)
 }
 
-impl Default for ffi::FfiDatum {
-    fn default() -> Self {
-        Self {
-            datum_type: DATUM_TYPE_NULL,
-            bool_val: false,
-            i32_val: 0,
-            i64_val: 0,
-            f32_val: 0.0,
-            f64_val: 0.0,
-            string_val: String::new(),
-            bytes_val: vec![],
-            decimal_precision: 0,
-            decimal_scale: 0,
-            i128_hi: 0,
-            i128_lo: 0,
-        }
-    }
-}
-
-/// Convert any InternalRow to FfiGenericRow using Fluss schema metadata.
-/// Used for lookup results (CompactedRow) where Arrow schema is unavailable.
-pub fn internal_row_to_ffi_row(
+/// Convert a CompactedRow (lookup result) to an owned GenericRow<'static>.
+/// One copy for strings/bytes (Cow::Owned), but no second copy into FfiDatum.
+pub fn compacted_row_to_owned(
     row: &dyn fcore::row::InternalRow,
     table_info: &fcore::metadata::TableInfo,
-) -> Result<ffi::FfiGenericRow> {
+) -> Result<fcore::row::GenericRow<'static>> {
+    use fcore::row::Datum;
+
     let schema = table_info.get_schema();
     let columns = schema.columns();
-    let mut fields = Vec::with_capacity(columns.len());
+    let mut out = fcore::row::GenericRow::new(columns.len());
 
     for (i, col) in columns.iter().enumerate() {
         if row.is_null_at(i) {
-            fields.push(ffi::FfiDatum::default());
+            out.set_field(i, Datum::Null);
             continue;
         }
 
         let datum = match col.data_type() {
-            fcore::metadata::DataType::Boolean(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_BOOL,
-                bool_val: row.get_boolean(i),
-                ..Default::default()
-            },
-            fcore::metadata::DataType::TinyInt(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_INT32,
-                i32_val: row.get_byte(i) as i32,
-                ..Default::default()
-            },
-            fcore::metadata::DataType::SmallInt(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_INT32,
-                i32_val: row.get_short(i) as i32,
-                ..Default::default()
-            },
-            fcore::metadata::DataType::Int(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_INT32,
-                i32_val: row.get_int(i),
-                ..Default::default()
-            },
-            fcore::metadata::DataType::BigInt(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_INT64,
-                i64_val: row.get_long(i),
-                ..Default::default()
-            },
-            fcore::metadata::DataType::Float(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_FLOAT32,
-                f32_val: row.get_float(i),
-                ..Default::default()
-            },
-            fcore::metadata::DataType::Double(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_FLOAT64,
-                f64_val: row.get_double(i),
-                ..Default::default()
-            },
-            fcore::metadata::DataType::String(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_STRING,
-                string_val: row.get_string(i).to_string(),
-                ..Default::default()
-            },
-            fcore::metadata::DataType::Bytes(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_BYTES,
-                bytes_val: row.get_bytes(i).to_vec(),
-                ..Default::default()
-            },
-            fcore::metadata::DataType::Date(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_DATE,
-                i32_val: row.get_date(i).get_inner(),
-                ..Default::default()
-            },
-            fcore::metadata::DataType::Time(_) => ffi::FfiDatum {
-                datum_type: DATUM_TYPE_TIME,
-                i32_val: row.get_time(i).get_inner(),
-                ..Default::default()
-            },
+            fcore::metadata::DataType::Boolean(_) => Datum::Bool(row.get_boolean(i)),
+            fcore::metadata::DataType::TinyInt(_) => Datum::Int8(row.get_byte(i)),
+            fcore::metadata::DataType::SmallInt(_) => Datum::Int16(row.get_short(i)),
+            fcore::metadata::DataType::Int(_) => Datum::Int32(row.get_int(i)),
+            fcore::metadata::DataType::BigInt(_) => Datum::Int64(row.get_long(i)),
+            fcore::metadata::DataType::Float(_) => Datum::Float32(row.get_float(i).into()),
+            fcore::metadata::DataType::Double(_) => Datum::Float64(row.get_double(i).into()),
+            fcore::metadata::DataType::String(_) => {
+                Datum::String(Cow::Owned(row.get_string(i).to_string()))
+            }
+            fcore::metadata::DataType::Bytes(_) => {
+                Datum::Blob(Cow::Owned(row.get_bytes(i).to_vec()))
+            }
+            fcore::metadata::DataType::Date(_) => Datum::Date(row.get_date(i)),
+            fcore::metadata::DataType::Time(_) => Datum::Time(row.get_time(i)),
             fcore::metadata::DataType::Timestamp(dt) => {
-                let ts = row.get_timestamp_ntz(i, dt.precision());
-                ffi::FfiDatum {
-                    datum_type: DATUM_TYPE_TIMESTAMP_NTZ,
-                    i64_val: ts.get_millisecond(),
-                    i32_val: ts.get_nano_of_millisecond(),
-                    ..Default::default()
-                }
+                Datum::TimestampNtz(row.get_timestamp_ntz(i, dt.precision()))
             }
             fcore::metadata::DataType::TimestampLTz(dt) => {
-                let ts = row.get_timestamp_ltz(i, dt.precision());
-                ffi::FfiDatum {
-                    datum_type: DATUM_TYPE_TIMESTAMP_LTZ,
-                    i64_val: ts.get_epoch_millisecond(),
-                    i32_val: ts.get_nano_of_millisecond(),
-                    ..Default::default()
-                }
+                Datum::TimestampLtz(row.get_timestamp_ltz(i, dt.precision()))
             }
             fcore::metadata::DataType::Decimal(dt) => {
-                let precision = dt.precision();
-                let scale = dt.scale();
-                let decimal = row.get_decimal(i, precision as usize, scale as usize);
-                if fcore::row::Decimal::is_compact_precision(precision) {
-                    ffi::FfiDatum {
-                        datum_type: DATUM_TYPE_DECIMAL_I64,
-                        i64_val: decimal.to_unscaled_long().map_err(|e| {
-                            anyhow!("Column {i}: compact decimal conversion failed: {e}")
-                        })?,
-                        decimal_precision: precision as i32,
-                        decimal_scale: scale as i32,
-                        ..Default::default()
-                    }
-                } else {
-                    let bd = decimal.to_big_decimal();
-                    let (unscaled, _) = bd.into_bigint_and_exponent();
-                    use bigdecimal::ToPrimitive;
-                    let i128_val = unscaled.to_i128().ok_or_else(|| {
-                        anyhow!("Column {i}: decimal unscaled value does not fit in i128")
-                    })?;
-                    ffi::FfiDatum {
-                        datum_type: DATUM_TYPE_DECIMAL_I128,
-                        i128_hi: (i128_val >> 64) as i64,
-                        i128_lo: i128_val as i64,
-                        decimal_precision: precision as i32,
-                        decimal_scale: scale as i32,
-                        ..Default::default()
-                    }
-                }
+                let decimal = row.get_decimal(i, dt.precision() as usize, dt.scale() as usize);
+                Datum::Decimal(decimal)
+            }
+            fcore::metadata::DataType::Char(dt) => Datum::String(Cow::Owned(
+                row.get_char(i, dt.length() as usize).to_string(),
+            )),
+            fcore::metadata::DataType::Binary(dt) => {
+                Datum::Blob(Cow::Owned(row.get_binary(i, dt.length()).to_vec()))
             }
             other => return Err(anyhow!("Unsupported data type for column {i}: {other:?}")),
         };
 
-        fields.push(datum);
+        out.set_field(i, datum);
     }
 
-    Ok(ffi::FfiGenericRow { fields })
+    Ok(out)
 }
 
 pub fn core_lake_snapshot_to_ffi(snapshot: &fcore::metadata::LakeSnapshot) -> ffi::FfiLakeSnapshot {

From 9eadba8b46a2b9348a05c166cc5f6aafc6ac856e Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Tue, 17 Feb 2026 10:18:14 +0000
Subject: [PATCH 153/287] test: introduce python integration tests (#341)

---
 fluss-rust/.github/workflows/ci.yml           |  42 ++
 fluss-rust/.gitignore                         |   3 +
 .../bindings/python/GENERATED_README.md       |   1 +
 fluss-rust/bindings/python/pyproject.toml     |   5 +
 fluss-rust/bindings/python/test/conftest.py   | 137 ++++
 fluss-rust/bindings/python/test/test_admin.py | 301 ++++++++
 .../bindings/python/test/test_kv_table.py     | 428 +++++++++++
 .../bindings/python/test/test_log_table.py    | 675 ++++++++++++++++++
 .../docs/developer-guide/contributing.md      |  14 +-
 9 files changed, 1602 insertions(+), 4 deletions(-)
 create mode 100644 fluss-rust/bindings/python/GENERATED_README.md
 create mode 100644 fluss-rust/bindings/python/test/conftest.py
 create mode 100644 fluss-rust/bindings/python/test/test_admin.py
 create mode 100644 fluss-rust/bindings/python/test/test_kv_table.py
 create mode 100644 fluss-rust/bindings/python/test/test_log_table.py

diff --git a/fluss-rust/.github/workflows/ci.yml b/fluss-rust/.github/workflows/ci.yml
index e9048fb0e0..20bee8775f 100644
--- a/fluss-rust/.github/workflows/ci.yml
+++ b/fluss-rust/.github/workflows/ci.yml
@@ -137,3 +137,45 @@ jobs:
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
+
+  python-integration-test:
+    timeout-minutes: 60
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python: ["3.9", "3.10", "3.11", "3.12"]
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python }}
+
+      - name: Install uv
+        uses: astral-sh/setup-uv@v4
+
+      - name: Install protoc
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - name: Rust Cache
+        uses: actions/cache@v4
+        with:
+          path: |
+            ~/.cargo/registry
+            ~/.cargo/git
+            target
+          key: python-test-${{ runner.os }}-${{ matrix.python }}-${{ hashFiles('**/Cargo.lock') }}
+
+      - name: Build Python bindings
+        working-directory: bindings/python
+        run: |
+          uv sync --extra dev
+          uv run maturin develop
+
+      - name: Run Python integration tests
+        working-directory: bindings/python
+        run: uv run pytest test/ -v
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
diff --git a/fluss-rust/.gitignore b/fluss-rust/.gitignore
index 476f84e979..f251aab32d 100644
--- a/fluss-rust/.gitignore
+++ b/fluss-rust/.gitignore
@@ -28,9 +28,12 @@ __pycache__/
 *.egg-info/
 dist/
 build/
+.venv/
+uv.lock
 
 # CPP
 *CMakeFiles/
+.cache/
 
 # Website (Docusaurus)
 website/node_modules
diff --git a/fluss-rust/bindings/python/GENERATED_README.md b/fluss-rust/bindings/python/GENERATED_README.md
new file mode 100644
index 0000000000..0a011ba6ee
--- /dev/null
+++ b/fluss-rust/bindings/python/GENERATED_README.md
@@ -0,0 +1 @@
+This readme can be automatically generated by generate_readme.py.
\ No newline at end of file
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index 0be25a03db..f5b0b68d62 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -52,6 +52,7 @@ dev = [
     "pytest-asyncio>=0.25.3",
     "ruff>=0.9.10",
     "maturin>=1.8.2",
+    "testcontainers>=4.0.0",
 ]
 docs = [
     "pdoc>=15.0.4",
@@ -90,6 +91,10 @@ docstring-code-format = true
 [tool.ruff.lint.isort]
 known-first-party = ["fluss"]
 
+[tool.pytest.ini_options]
+asyncio_mode = "auto"
+asyncio_default_fixture_loop_scope = "session"
+
 [tool.mypy]
 python_version = "3.9"
 warn_return_any = true
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
new file mode 100644
index 0000000000..fbd7396ee8
--- /dev/null
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -0,0 +1,137 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Shared fixtures for Fluss Python integration tests.
+
+If FLUSS_BOOTSTRAP_SERVERS is set, tests connect to an existing cluster.
+Otherwise, a Fluss cluster is started automatically via testcontainers.
+
+Run with:
+    uv run maturin develop && uv run pytest test/ -v
+"""
+
+import os
+import socket
+import time
+
+import pytest
+import pytest_asyncio
+
+import fluss
+
+FLUSS_VERSION = "0.7.0"
+BOOTSTRAP_SERVERS_ENV = os.environ.get("FLUSS_BOOTSTRAP_SERVERS")
+
+
+def _wait_for_port(host, port, timeout=60):
+    """Poll host:port until a TCP connect succeeds or timeout seconds elapse."""
+    deadline = time.monotonic() + timeout  # monotonic: immune to wall-clock jumps
+    while time.monotonic() < deadline:
+        try:
+            with socket.create_connection((host, port), timeout=1):
+                return
+        except OSError:  # parent of ConnectionRefusedError and TimeoutError
+            time.sleep(1)
+    raise TimeoutError(f"Port {port} on {host} not available after {timeout}s")
+
+
+@pytest.fixture(scope="session")
+def fluss_cluster():
+    """Yield bootstrap servers for an existing cluster or a testcontainers one."""
+    if BOOTSTRAP_SERVERS_ENV:
+        yield BOOTSTRAP_SERVERS_ENV
+        return
+
+    from testcontainers.core.container import DockerContainer
+    from testcontainers.core.network import Network
+
+    network = Network()
+    network.create()
+
+    zookeeper = (
+        DockerContainer("zookeeper:3.9.2")
+        .with_network(network)
+        .with_name("zookeeper-python-test")
+    )
+
+    coordinator_props = "\n".join([
+        "zookeeper.address: zookeeper-python-test:2181",
+        "bind.listeners: INTERNAL://coordinator-server-python-test:0,"
+        " CLIENT://coordinator-server-python-test:9123",
+        "advertised.listeners: CLIENT://localhost:9123",
+        "internal.listener.name: INTERNAL",
+        "netty.server.num-network-threads: 1",
+        "netty.server.num-worker-threads: 3",
+    ])
+    coordinator = (
+        DockerContainer(f"fluss/fluss:{FLUSS_VERSION}")
+        .with_network(network)
+        .with_name("coordinator-server-python-test")
+        .with_bind_ports(9123, 9123)
+        .with_command("coordinatorServer")
+        .with_env("FLUSS_PROPERTIES", coordinator_props)
+    )
+
+    tablet_props = "\n".join([
+        "zookeeper.address: zookeeper-python-test:2181",
+        "bind.listeners: INTERNAL://tablet-server-python-test:0,"
+        " CLIENT://tablet-server-python-test:9123",
+        "advertised.listeners: CLIENT://localhost:9124",
+        "internal.listener.name: INTERNAL",
+        "tablet-server.id: 0",
+        "netty.server.num-network-threads: 1",
+        "netty.server.num-worker-threads: 3",
+    ])
+    tablet_server = (
+        DockerContainer(f"fluss/fluss:{FLUSS_VERSION}")
+        .with_network(network)
+        .with_name("tablet-server-python-test")
+        .with_bind_ports(9123, 9124)  # container port 9123 -> host port 9124
+        .with_command("tabletServer")
+        .with_env("FLUSS_PROPERTIES", tablet_props)
+    )
+    # ZooKeeper starts first because both servers are configured to reach it.
+    started = []
+    try:
+        for container in (zookeeper, coordinator, tablet_server):
+            container.start()
+            started.append(container)
+        _wait_for_port("localhost", 9123)
+        _wait_for_port("localhost", 9124)
+        # Extra wait for cluster to fully initialize
+        time.sleep(10)
+        yield "127.0.0.1:9123"
+    finally:
+        # Also runs when startup fails, so containers and the network never leak.
+        for container in reversed(started):
+            container.stop()
+        network.remove()
+
+
+@pytest_asyncio.fixture(scope="session")
+async def connection(fluss_cluster):
+    """Open one FlussConnection for the whole session; close it at teardown."""
+    settings = fluss.Config({"bootstrap.servers": fluss_cluster})
+    client = await fluss.FlussConnection.create(settings)
+    yield client
+    client.close()
+
+
+@pytest_asyncio.fixture(scope="session")
+async def admin(connection):
+    """Admin client obtained once per session from the shared connection."""
+    return await connection.get_admin()
diff --git a/fluss-rust/bindings/python/test/test_admin.py b/fluss-rust/bindings/python/test/test_admin.py
new file mode 100644
index 0000000000..f203400f89
--- /dev/null
+++ b/fluss-rust/bindings/python/test/test_admin.py
@@ -0,0 +1,301 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Integration tests for FlussAdmin operations.
+
+Mirrors the Rust integration tests in crates/fluss/tests/integration/admin.rs.
+"""
+
+import pyarrow as pa
+import pytest
+
+import fluss
+
+
+async def test_create_database(admin):
+    """Walk a database through create -> exists -> get_info -> drop."""
+    database = "py_test_create_database"
+
+    # Remove leftovers from an earlier aborted run.
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
+    assert not await admin.database_exists(database)
+
+    await admin.create_database(
+        database,
+        fluss.DatabaseDescriptor(
+            comment="test_db", custom_properties={"k1": "v1", "k2": "v2"}
+        ),
+        ignore_if_exists=False,
+    )
+    assert await admin.database_exists(database)
+
+    # The returned info must echo the name, comment and custom properties.
+    info = await admin.get_database_info(database)
+    assert info.database_name == database
+    stored = info.get_database_descriptor()
+    assert stored.comment == "test_db"
+    assert stored.get_custom_properties() == {"k1": "v1", "k2": "v2"}
+
+    await admin.drop_database(database, ignore_if_not_exists=False, cascade=True)
+    # After the drop the database must no longer be reported.
+    assert not await admin.database_exists(database)
+
+
+async def test_create_table(admin):
+    """Create a primary-key table, inspect it via exists/list/get_info, drop it."""
+    database = "py_test_create_table_db"
+
+    # Start from a clean slate in case an earlier run left the database behind.
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
+    assert not await admin.database_exists(database)
+
+    await admin.create_database(
+        database,
+        fluss.DatabaseDescriptor(comment="Database for test_create_table"),
+        ignore_if_exists=False,
+    )
+
+    table = "test_user_table"
+    path = fluss.TablePath(database, table)
+
+    # Four-column user table keyed on "id".
+    arrow_fields = [
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("age", pa.int32()),
+        pa.field("email", pa.string()),
+    ]
+    user_schema = fluss.Schema(pa.schema(arrow_fields), primary_keys=["id"])
+
+    # Three buckets keyed on id; replication factor 1.
+    descriptor = fluss.TableDescriptor(
+        user_schema,
+        bucket_count=3,
+        bucket_keys=["id"],
+        comment="Test table for user data (id, name, age, email)",
+        log_format="arrow",
+        kv_format="indexed",
+        properties={"table.replication.factor": "1"},
+    )
+
+    await admin.create_table(path, descriptor, ignore_if_exists=False)
+    assert await admin.table_exists(path)
+
+    # The new table must be the only entry listed for its database.
+    listed = await admin.list_tables(database)
+    assert len(listed) == 1
+    assert table in listed
+
+    # Metadata read back must match what the descriptor requested.
+    info = await admin.get_table_info(path)
+    assert info.comment == "Test table for user data (id, name, age, email)"
+    assert info.get_primary_keys() == ["id"]
+    assert info.num_buckets == 3
+    assert info.get_bucket_keys() == ["id"]
+    assert info.get_column_names() == ["id", "name", "age", "email"]
+
+    # Drop the table, then the database, checking each one disappears.
+    await admin.drop_table(path, ignore_if_not_exists=False)
+    assert not await admin.table_exists(path)
+
+    await admin.drop_database(database, ignore_if_not_exists=False, cascade=True)
+    assert not await admin.database_exists(database)
+
+
+async def test_partition_apis(admin):
+    """Create, list and drop one partition of a two-key partitioned table."""
+    database = "py_test_partition_apis_db"
+
+    # Drop and recreate the database so an earlier run cannot interfere.
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
+    await admin.create_database(
+        database,
+        fluss.DatabaseDescriptor(comment="Database for test_partition_apis"),
+        ignore_if_exists=True,
+    )
+
+    path = fluss.TablePath(database, "partitioned_table")
+
+    # Partition columns (dt, region) are part of the primary key.
+    arrow_fields = [
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("dt", pa.string()),
+        pa.field("region", pa.string()),
+    ]
+    partitioned_schema = fluss.Schema(
+        pa.schema(arrow_fields), primary_keys=["id", "dt", "region"]
+    )
+
+    descriptor = fluss.TableDescriptor(
+        partitioned_schema,
+        partition_keys=["dt", "region"],
+        bucket_count=3,
+        bucket_keys=["id"],
+        log_format="arrow",
+        kv_format="compacted",
+        properties={"table.replication.factor": "1"},
+    )
+
+    await admin.create_table(path, descriptor, ignore_if_exists=True)
+
+    # No partition has been created yet, so the listing must be empty.
+    before = await admin.list_partition_infos(path)
+    assert len(before) == 0
+
+    # Add the (2024-01-15, EMEA) partition.
+    await admin.create_partition(
+        path,
+        {"dt": "2024-01-15", "region": "EMEA"},
+        ignore_if_exists=False,
+    )
+
+    created = await admin.list_partition_infos(path)
+    assert len(created) == 1
+    assert created[0].partition_name == "2024-01-15$EMEA"
+
+    # Remove it again; the listing must be empty afterwards.
+    await admin.drop_partition(
+        path,
+        {"dt": "2024-01-15", "region": "EMEA"},
+        ignore_if_not_exists=False,
+    )
+
+    after = await admin.list_partition_infos(path)
+    assert len(after) == 0
+
+    await admin.drop_table(path, ignore_if_not_exists=True)
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
+
+
+async def test_fluss_error_response(admin):
+    """A failing admin call surfaces as FlussError with the matching error code."""
+    missing = fluss.TablePath("fluss", "py_not_exist")
+
+    with pytest.raises(fluss.FlussError) as raised:
+        await admin.get_table_info(missing)
+
+    assert raised.value.error_code == fluss.ErrorCode.TABLE_NOT_EXIST
+
+
+async def test_error_database_not_exist(admin):
+    """Every call on a missing database must fail with DATABASE_NOT_EXIST."""
+    missing_db = "py_no_such_db"
+
+    with pytest.raises(fluss.FlussError) as info_err:
+        await admin.get_database_info(missing_db)
+    assert info_err.value.error_code == fluss.ErrorCode.DATABASE_NOT_EXIST
+
+    # Strict drop: ignore_if_not_exists is off, so the miss must be reported.
+    with pytest.raises(fluss.FlussError) as drop_err:
+        await admin.drop_database(missing_db, ignore_if_not_exists=False)
+    assert drop_err.value.error_code == fluss.ErrorCode.DATABASE_NOT_EXIST
+
+    with pytest.raises(fluss.FlussError) as list_err:
+        await admin.list_tables(missing_db)
+    assert list_err.value.error_code == fluss.ErrorCode.DATABASE_NOT_EXIST
+
+
+async def test_error_database_already_exist(admin):
+    """Re-creating an existing database fails unless ignore_if_exists is set."""
+    database = "py_test_error_db_already_exist"
+
+    # Drop any leftover, then create the database once.
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
+    await admin.create_database(database, ignore_if_exists=False)
+
+    # A strict second create is rejected with DATABASE_ALREADY_EXIST.
+    with pytest.raises(fluss.FlussError) as duplicate:
+        await admin.create_database(database, ignore_if_exists=False)
+    assert duplicate.value.error_code == fluss.ErrorCode.DATABASE_ALREADY_EXIST
+
+    # A tolerant second create must not raise.
+    await admin.create_database(database, ignore_if_exists=True)
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
+
+
+async def test_error_table_already_exist(admin):
+    """Re-creating an existing table fails unless ignore_if_exists is set."""
+    database = "py_test_error_tbl_already_exist_db"
+
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
+    await admin.create_database(database, ignore_if_exists=True)
+
+    path = fluss.TablePath(database, "my_table")
+    arrow_schema = pa.schema(
+        [pa.field("id", pa.int32()), pa.field("name", pa.string())]
+    )
+    descriptor = fluss.TableDescriptor(
+        fluss.Schema(arrow_schema),
+        bucket_count=1,
+        properties={"table.replication.factor": "1"},
+    )
+
+    await admin.create_table(path, descriptor, ignore_if_exists=False)
+
+    # A strict second create is rejected with TABLE_ALREADY_EXIST.
+    with pytest.raises(fluss.FlussError) as duplicate:
+        await admin.create_table(path, descriptor, ignore_if_exists=False)
+    assert duplicate.value.error_code == fluss.ErrorCode.TABLE_ALREADY_EXIST
+
+    # A tolerant second create must not raise.
+    await admin.create_table(path, descriptor, ignore_if_exists=True)
+
+    await admin.drop_table(path, ignore_if_not_exists=True)
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
+
+
+async def test_error_table_not_exist(admin):
+    """Dropping a missing table fails unless ignore_if_not_exists is set."""
+    missing = fluss.TablePath("fluss", "py_no_such_table")
+
+    # Strict drop is rejected with TABLE_NOT_EXIST.
+    with pytest.raises(fluss.FlussError) as raised:
+        await admin.drop_table(missing, ignore_if_not_exists=False)
+    assert raised.value.error_code == fluss.ErrorCode.TABLE_NOT_EXIST
+
+    # Tolerant drop must not raise.
+    await admin.drop_table(missing, ignore_if_not_exists=True)
+
+
+async def test_error_table_not_partitioned(admin):
+    """Listing partitions of a table without partition keys must raise."""
+    database = "py_test_error_not_partitioned_db"
+
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
+    await admin.create_database(database, ignore_if_exists=True)
+
+    path = fluss.TablePath(database, "non_partitioned_table")
+    arrow_schema = pa.schema(
+        [pa.field("id", pa.int32()), pa.field("name", pa.string())]
+    )
+    descriptor = fluss.TableDescriptor(
+        fluss.Schema(arrow_schema),
+        bucket_count=1,
+        properties={"table.replication.factor": "1"},
+    )
+
+    await admin.create_table(path, descriptor, ignore_if_exists=False)
+
+    # No partition_keys were declared, so the partition listing is rejected.
+    with pytest.raises(fluss.FlussError) as raised:
+        await admin.list_partition_infos(path)
+    actual_code = raised.value.error_code
+    assert actual_code == fluss.ErrorCode.TABLE_NOT_PARTITIONED_EXCEPTION
+
+    await admin.drop_table(path, ignore_if_not_exists=True)
+    await admin.drop_database(database, ignore_if_not_exists=True, cascade=True)
diff --git a/fluss-rust/bindings/python/test/test_kv_table.py b/fluss-rust/bindings/python/test/test_kv_table.py
new file mode 100644
index 0000000000..98b0cee969
--- /dev/null
+++ b/fluss-rust/bindings/python/test/test_kv_table.py
@@ -0,0 +1,428 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Integration tests for KV (primary key) table operations.
+
+Mirrors the Rust integration tests in crates/fluss/tests/integration/kv_table.rs.
+"""
+
+import math
+from datetime import date, datetime, timezone
+from datetime import time as dt_time
+from decimal import Decimal
+
+import pyarrow as pa
+
+import fluss
+
+
+async def test_upsert_delete_and_lookup(connection, admin):
+    """Cover the KV lifecycle: insert, read back, overwrite, delete, and miss."""
+    kv_path = fluss.TablePath("fluss", "py_test_upsert_and_lookup")
+    await admin.drop_table(kv_path, ignore_if_not_exists=True)
+
+    kv_schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("id", pa.int32()),
+                pa.field("name", pa.string()),
+                pa.field("age", pa.int64()),
+            ]
+        ),
+        primary_keys=["id"],
+    )
+    descriptor = fluss.TableDescriptor(kv_schema)
+    await admin.create_table(kv_path, descriptor, ignore_if_exists=False)
+
+    kv_table = await connection.get_table(kv_path)
+    writer = kv_table.new_upsert().create_writer()
+
+    seed_rows = [(1, "Verso", 32), (2, "Noco", 25), (3, "Esquie", 35)]
+
+    # Queue the seed rows without awaiting each handle; only the flush is awaited.
+    for id_, name, age in seed_rows:
+        writer.upsert({"id": id_, "name": name, "age": age})
+    await writer.flush()
+
+    # Every seed row must come back by primary key with all columns intact.
+    reader = kv_table.new_lookup().create_lookuper()
+
+    for id_, want_name, want_age in seed_rows:
+        found = await reader.lookup({"id": id_})
+        assert found is not None, f"Row with id={id_} should exist"
+        assert found["id"] == id_
+        assert found["name"] == want_name
+        assert found["age"] == want_age
+
+    # Overwrite id=1 and wait on its handle before reading the new value.
+    ack = writer.upsert({"id": 1, "name": "Verso", "age": 33})
+    await ack.wait()
+
+    found = await reader.lookup({"id": 1})
+    assert found is not None
+    assert found["age"] == 33
+    assert found["name"] == "Verso"
+
+    # Delete id=1, again waiting on the handle so the lookup sees the removal.
+    ack = writer.delete({"id": 1})
+    await ack.wait()
+
+    found = await reader.lookup({"id": 1})
+    assert found is None, "Record 1 should not exist after delete"
+
+    # The delete must not have touched the neighbouring keys.
+    for id_ in [2, 3]:
+        found = await reader.lookup({"id": id_})
+        assert found is not None, f"Record {id_} should still exist"
+
+    # A key that was never written resolves to None rather than raising.
+    found = await reader.lookup({"id": 999})
+    assert found is None, "Non-existent key should return None"
+
+    await admin.drop_table(kv_path, ignore_if_not_exists=False)
+
+
+async def test_composite_primary_keys(connection, admin):
+    """Upsert, look up, and overwrite rows keyed by the (region, user_id) pair."""
+    pk_path = fluss.TablePath("fluss", "py_test_composite_pk")
+    await admin.drop_table(pk_path, ignore_if_not_exists=True)
+
+    pk_schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("region", pa.string()),
+                pa.field("user_id", pa.int32()),
+                pa.field("score", pa.int64()),
+            ]
+        ),
+        primary_keys=["region", "user_id"],
+    )
+    descriptor = fluss.TableDescriptor(pk_schema)
+    await admin.create_table(pk_path, descriptor, ignore_if_exists=False)
+
+    pk_table = await connection.get_table(pk_path)
+    writer = pk_table.new_upsert().create_writer()
+
+    seed_rows = [
+        ("US", 1, 100),
+        ("US", 2, 200),
+        ("EU", 1, 150),
+        ("EU", 2, 250),
+    ]
+
+    for area, uid, points in seed_rows:
+        writer.upsert({"region": area, "user_id": uid, "score": points})
+    await writer.flush()
+
+    reader = pk_table.new_lookup().create_lookuper()
+
+    # The (US, 1) pair was seeded with score 100.
+    hit = await reader.lookup({"region": "US", "user_id": 1})
+    assert hit is not None
+    assert hit["score"] == 100
+
+    # The (EU, 2) pair was seeded with score 250.
+    hit = await reader.lookup({"region": "EU", "user_id": 2})
+    assert hit is not None
+    assert hit["score"] == 250
+
+    # Overwrite (US, 1) and wait on the handle before reading the new score.
+    ack = writer.upsert({"region": "US", "user_id": 1, "score": 500})
+    await ack.wait()
+
+    hit = await reader.lookup({"region": "US", "user_id": 1})
+    assert hit is not None
+    assert hit["score"] == 500
+
+    await admin.drop_table(pk_path, ignore_if_not_exists=False)
+
+
+async def test_partial_update(connection, admin):
+    """A writer limited by column name changes only the columns it targets."""
+    pu_path = fluss.TablePath("fluss", "py_test_partial_update")
+    await admin.drop_table(pu_path, ignore_if_not_exists=True)
+
+    pu_schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("id", pa.int32()),
+                pa.field("name", pa.string()),
+                pa.field("age", pa.int64()),
+                pa.field("score", pa.int64()),
+            ]
+        ),
+        primary_keys=["id"],
+    )
+    descriptor = fluss.TableDescriptor(pu_schema)
+    await admin.create_table(pu_path, descriptor, ignore_if_exists=False)
+
+    target = await connection.get_table(pu_path)
+
+    # Seed one complete row through an unrestricted writer.
+    full_writer = target.new_upsert().create_writer()
+    ack = full_writer.upsert(
+        {"id": 1, "name": "Verso", "age": 32, "score": 6942}
+    )
+    await ack.wait()
+
+    reader = target.new_lookup().create_lookuper()
+    row = await reader.lookup({"id": 1})
+    assert row is not None
+    assert row["id"] == 1
+    assert row["name"] == "Verso"
+    assert row["age"] == 32
+    assert row["score"] == 6942
+
+    # The second writer targets only the key column and "score".
+    score_writer = (
+        target.new_upsert().partial_update_by_name(["id", "score"]).create_writer()
+    )
+    ack = score_writer.upsert({"id": 1, "score": 420})
+    await ack.wait()
+
+    row = await reader.lookup({"id": 1})
+    assert row is not None
+    assert row["id"] == 1
+    assert row["name"] == "Verso", "name should remain unchanged"
+    assert row["age"] == 32, "age should remain unchanged"
+    assert row["score"] == 420, "score should be updated to 420"
+
+    await admin.drop_table(pu_path, ignore_if_not_exists=False)
+
+
+async def test_partial_update_by_index(connection, admin):
+    """A writer limited by column position changes only the columns it targets."""
+    idx_path = fluss.TablePath("fluss", "py_test_partial_update_by_index")
+    await admin.drop_table(idx_path, ignore_if_not_exists=True)
+
+    idx_schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("id", pa.int32()),
+                pa.field("name", pa.string()),
+                pa.field("age", pa.int64()),
+                pa.field("score", pa.int64()),
+            ]
+        ),
+        primary_keys=["id"],
+    )
+    descriptor = fluss.TableDescriptor(idx_schema)
+    await admin.create_table(idx_path, descriptor, ignore_if_exists=False)
+
+    target = await connection.get_table(idx_path)
+
+    full_writer = target.new_upsert().create_writer()
+    ack = full_writer.upsert(
+        {"id": 1, "name": "Verso", "age": 32, "score": 6942}
+    )
+    await ack.wait()
+
+    # Positions 0 and 1 are "id" (the primary key) and "name" in the schema above.
+    name_writer = (
+        target.new_upsert().partial_update_by_index([0, 1]).create_writer()
+    )
+    ack = name_writer.upsert([1, "Verso Renamed"])
+    await ack.wait()
+
+    reader = target.new_lookup().create_lookuper()
+    row = await reader.lookup({"id": 1})
+    assert row is not None
+    assert row["name"] == "Verso Renamed", "name should be updated"
+    assert row["score"] == 6942, "score should remain unchanged"
+
+    await admin.drop_table(idx_path, ignore_if_not_exists=False)
+
+
+async def test_partitioned_table_upsert_and_lookup(connection, admin):
+    """Upsert, look up, and delete rows of a KV table partitioned by region."""
+    part_path = fluss.TablePath("fluss", "py_test_partitioned_kv_table")
+    await admin.drop_table(part_path, ignore_if_not_exists=True)
+
+    part_schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("region", pa.string()),
+                pa.field("user_id", pa.int32()),
+                pa.field("name", pa.string()),
+                pa.field("score", pa.int64()),
+            ]
+        ),
+        primary_keys=["region", "user_id"],
+    )
+    descriptor = fluss.TableDescriptor(
+        part_schema,
+        partition_keys=["region"],
+    )
+    await admin.create_table(part_path, descriptor, ignore_if_exists=False)
+
+    # Partitions are created explicitly, one per region value used below.
+    for part_value in ["US", "EU", "APAC"]:
+        await admin.create_partition(
+            part_path, {"region": part_value}, ignore_if_exists=True
+        )
+
+    kv_table = await connection.get_table(part_path)
+    writer = kv_table.new_upsert().create_writer()
+
+    seed_rows = [
+        ("US", 1, "Gustave", 100),
+        ("US", 2, "Lune", 200),
+        ("EU", 1, "Sciel", 150),
+        ("EU", 2, "Maelle", 250),
+        ("APAC", 1, "Noco", 300),
+    ]
+
+    for region, user_id, name, score in seed_rows:
+        writer.upsert(
+            {"region": region, "user_id": user_id, "name": name, "score": score}
+        )
+    await writer.flush()
+
+    reader = kv_table.new_lookup().create_lookuper()
+
+    # Every seed row must be found under its own (region, user_id) key.
+    for region, user_id, want_name, want_score in seed_rows:
+        hit = await reader.lookup({"region": region, "user_id": user_id})
+        assert hit is not None, f"Row ({region}, {user_id}) should exist"
+        assert hit["region"] == region
+        assert hit["user_id"] == user_id
+        assert hit["name"] == want_name
+        assert hit["score"] == want_score
+
+    # Overwrite one US row and wait on its handle before reading it back.
+    ack = writer.upsert(
+        {"region": "US", "user_id": 1, "name": "Gustave Updated", "score": 999}
+    )
+    await ack.wait()
+
+    hit = await reader.lookup({"region": "US", "user_id": 1})
+    assert hit is not None
+    assert hit["name"] == "Gustave Updated"
+    assert hit["score"] == 999
+
+    # A region with no partition yields None instead of an error.
+    hit = await reader.lookup({"region": "UNKNOWN_REGION", "user_id": 1})
+    assert hit is None, "Lookup in non-existent partition should return None"
+
+    # Remove one EU row, waiting on the handle so the lookup sees the delete.
+    ack = writer.delete({"region": "EU", "user_id": 1})
+    await ack.wait()
+
+    hit = await reader.lookup({"region": "EU", "user_id": 1})
+    assert hit is None, "Deleted record should not exist"
+
+    # The other row in the EU partition must be unaffected.
+    hit = await reader.lookup({"region": "EU", "user_id": 2})
+    assert hit is not None
+    assert hit["name"] == "Maelle"
+
+    await admin.drop_table(part_path, ignore_if_not_exists=False)
+
+
+async def test_all_supported_datatypes(connection, admin):
+    """Round-trip one row per supported column type, then a row of all nulls."""
+    types_path = fluss.TablePath("fluss", "py_test_kv_all_datatypes")
+    await admin.drop_table(types_path, ignore_if_not_exists=True)
+
+    types_schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("pk_int", pa.int32()),
+                pa.field("col_boolean", pa.bool_()),
+                pa.field("col_tinyint", pa.int8()),
+                pa.field("col_smallint", pa.int16()),
+                pa.field("col_int", pa.int32()),
+                pa.field("col_bigint", pa.int64()),
+                pa.field("col_float", pa.float32()),
+                pa.field("col_double", pa.float64()),
+                pa.field("col_string", pa.string()),
+                pa.field("col_decimal", pa.decimal128(10, 2)),
+                pa.field("col_date", pa.date32()),
+                pa.field("col_time", pa.time32("ms")),
+                pa.field("col_timestamp_ntz", pa.timestamp("us")),
+                pa.field("col_timestamp_ltz", pa.timestamp("us", tz="UTC")),
+                pa.field("col_bytes", pa.binary()),
+            ]
+        ),
+        primary_keys=["pk_int"],
+    )
+    descriptor = fluss.TableDescriptor(types_schema)
+    await admin.create_table(types_path, descriptor, ignore_if_exists=False)
+
+    kv_table = await connection.get_table(types_path)
+    writer = kv_table.new_upsert().create_writer()
+
+    # One value per column; the col_* integer columns hold their type's maximum.
+    full_row = {
+        "pk_int": 1,
+        "col_boolean": True,
+        "col_tinyint": 127,
+        "col_smallint": 32767,
+        "col_int": 2147483647,
+        "col_bigint": 9223372036854775807,
+        "col_float": 3.14,
+        "col_double": 2.718281828459045,
+        "col_string": "world of fluss python client",
+        "col_decimal": Decimal("123.45"),
+        "col_date": date(2026, 1, 23),
+        "col_time": dt_time(10, 13, 47, 123000),  # 123000 us == 123 ms
+        "col_timestamp_ntz": datetime(2026, 1, 23, 10, 13, 47, 123000),
+        "col_timestamp_ltz": datetime(2026, 1, 23, 10, 13, 47, 123000),  # naive input
+        "col_bytes": b"binary data",
+    }
+
+    ack = writer.upsert(full_row)
+    await ack.wait()
+
+    reader = kv_table.new_lookup().create_lookuper()
+    stored = await reader.lookup({"pk_int": 1})
+    assert stored is not None, "Row should exist"
+
+    assert stored["pk_int"] == 1
+    assert stored["col_boolean"] is True
+    assert stored["col_tinyint"] == 127
+    assert stored["col_smallint"] == 32767
+    assert stored["col_int"] == 2147483647
+    assert stored["col_bigint"] == 9223372036854775807
+    assert math.isclose(stored["col_float"], 3.14, rel_tol=1e-6)
+    assert math.isclose(stored["col_double"], 2.718281828459045, rel_tol=1e-15)
+    assert stored["col_string"] == "world of fluss python client"
+    assert stored["col_decimal"] == Decimal("123.45")
+    assert stored["col_date"] == date(2026, 1, 23)
+    assert stored["col_time"] == dt_time(10, 13, 47, 123000)
+    assert stored["col_timestamp_ntz"] == datetime(2026, 1, 23, 10, 13, 47, 123000)
+    assert stored["col_timestamp_ltz"] == datetime(
+        2026, 1, 23, 10, 13, 47, 123000, tzinfo=timezone.utc
+    )
+    assert stored["col_bytes"] == b"binary data"
+
+    # Second row: same columns, every non-key value set to None.
+    null_row = {"pk_int": 2}
+    for col in full_row:
+        if col != "pk_int":
+            null_row[col] = None
+    ack = writer.upsert(null_row)
+    await ack.wait()
+
+    stored = await reader.lookup({"pk_int": 2})
+    assert stored is not None, "Row with nulls should exist"
+    assert stored["pk_int"] == 2
+    for col in full_row:
+        if col != "pk_int":
+            assert stored[col] is None, f"{col} should be null"
+
+    await admin.drop_table(types_path, ignore_if_not_exists=False)
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
new file mode 100644
index 0000000000..3219f03c0d
--- /dev/null
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -0,0 +1,675 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Integration tests for log (append-only) table operations.
+
+Mirrors the Rust integration tests in crates/fluss/tests/integration/log_table.rs.
+"""
+
+import asyncio
+import time
+
+import pyarrow as pa
+
+import fluss
+
+
+async def test_append_and_scan(connection, admin):
+    """Append two Arrow batches to a log table and read all rows back as records."""
+    log_path = fluss.TablePath("fluss", "py_test_append_and_scan")
+    await admin.drop_table(log_path, ignore_if_not_exists=True)
+
+    log_schema = fluss.Schema(
+        pa.schema([pa.field("c1", pa.int32()), pa.field("c2", pa.string())])
+    )
+    descriptor = fluss.TableDescriptor(log_schema)
+    await admin.create_table(log_path, descriptor, ignore_if_exists=False)
+
+    log_table = await connection.get_table(log_path)
+    writer = log_table.new_append().create_writer()
+
+    first_batch = pa.RecordBatch.from_arrays(
+        [pa.array([1, 2, 3], type=pa.int32()), pa.array(["a1", "a2", "a3"])],
+        schema=pa.schema([pa.field("c1", pa.int32()), pa.field("c2", pa.string())]),
+    )
+    writer.write_arrow_batch(first_batch)
+
+    second_batch = pa.RecordBatch.from_arrays(
+        [pa.array([4, 5, 6], type=pa.int32()), pa.array(["a4", "a5", "a6"])],
+        schema=pa.schema([pa.field("c1", pa.int32()), pa.field("c2", pa.string())]),
+    )
+    writer.write_arrow_batch(second_batch)
+
+    await writer.flush()
+
+    # Read from the earliest offset of every bucket with the record-based scanner.
+    scanner = await log_table.new_scan().create_log_scanner()
+    n_buckets = (await admin.get_table_info(log_path)).num_buckets
+    scanner.subscribe_buckets({b: fluss.EARLIEST_OFFSET for b in range(n_buckets)})
+
+    records = _poll_records(scanner, expected_count=6)
+
+    assert len(records) == 6, f"Expected 6 records, got {len(records)}"
+
+    records.sort(key=lambda rec: rec.row["c1"])
+
+    want_c1 = [1, 2, 3, 4, 5, 6]
+    want_c2 = ["a1", "a2", "a3", "a4", "a5", "a6"]
+    for i, (rec, c1, c2) in enumerate(zip(records, want_c1, want_c2)):
+        assert rec.row["c1"] == c1, f"c1 mismatch at row {i}"
+        assert rec.row["c2"] == c2, f"c2 mismatch at row {i}"
+
+    # Dropping the bucket 0 subscription must be accepted on a live scanner.
+    scanner.unsubscribe(bucket_id=0)
+
+    await admin.drop_table(log_path, ignore_if_not_exists=False)
+
+
+async def test_append_dict_rows(connection, admin):
+    """Append rows given as dicts and as a list, then scan them back."""
+    log_path = fluss.TablePath("fluss", "py_test_append_dict_rows")
+    await admin.drop_table(log_path, ignore_if_not_exists=True)
+
+    log_schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    )
+    descriptor = fluss.TableDescriptor(log_schema)
+    await admin.create_table(log_path, descriptor, ignore_if_exists=False)
+
+    log_table = await connection.get_table(log_path)
+    writer = log_table.new_append().create_writer()
+
+    # Two rows are passed as column-name -> value dicts...
+    writer.append({"id": 1, "name": "Alice"})
+    writer.append({"id": 2, "name": "Bob"})
+    # ...and one as a positional list in schema order.
+    writer.append([3, "Charlie"])
+    await writer.flush()
+
+    scanner = await log_table.new_scan().create_log_scanner()
+    n_buckets = (await admin.get_table_info(log_path)).num_buckets
+    scanner.subscribe_buckets({b: fluss.EARLIEST_OFFSET for b in range(n_buckets)})
+
+    records = _poll_records(scanner, expected_count=3)
+    assert len(records) == 3
+
+    by_id = sorted((rec.row for rec in records), key=lambda row: row["id"])
+    assert by_id[0] == {"id": 1, "name": "Alice"}
+    assert by_id[1] == {"id": 2, "name": "Bob"}
+    assert by_id[2] == {"id": 3, "name": "Charlie"}
+
+    await admin.drop_table(log_path, ignore_if_not_exists=False)
+
+
+async def test_list_offsets(connection, admin):
+    """Check bucket 0's earliest, latest, and timestamp offsets around one append."""
+    table_path = fluss.TablePath("fluss", "py_test_list_offsets")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    )
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    await asyncio.sleep(2)  # Fixed pause to let the new table finish initializing
+
+    # Nothing has been written yet, so the earliest offset of bucket 0 must be 0
+    earliest = await admin.list_offsets(
+        table_path, bucket_ids=[0], offset_spec=fluss.OffsetSpec.earliest()
+    )
+    assert earliest[0] == 0
+
+    # ...and the latest offset of the still-empty bucket must be 0 as well
+    latest = await admin.list_offsets(
+        table_path, bucket_ids=[0], offset_spec=fluss.OffsetSpec.latest()
+    )
+    assert latest[0] == 0
+
+    before_append_ms = int(time.time() * 1000)  # client clock, epoch milliseconds
+
+    # Append three rows as one Arrow batch and wait for the flush
+    table = await connection.get_table(table_path)
+    append_writer = table.new_append().create_writer()
+    batch = pa.RecordBatch.from_arrays(
+        [
+            pa.array([1, 2, 3], type=pa.int32()),
+            pa.array(["alice", "bob", "charlie"]),
+        ],
+        schema=pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())]),
+    )
+    append_writer.write_arrow_batch(batch)
+    await append_writer.flush()
+
+    await asyncio.sleep(1)  # presumably keeps after_append_ms later than the write
+
+    after_append_ms = int(time.time() * 1000)
+
+    # The three appended rows move the latest offset of bucket 0 to 3
+    latest_after = await admin.list_offsets(
+        table_path, bucket_ids=[0], offset_spec=fluss.OffsetSpec.latest()
+    )
+    assert latest_after[0] == 3
+
+    # The earliest offset is unaffected by the append
+    earliest_after = await admin.list_offsets(
+        table_path, bucket_ids=[0], offset_spec=fluss.OffsetSpec.earliest()
+    )
+    assert earliest_after[0] == 0
+
+    # The timestamp captured before the append must resolve to offset 0
+    ts_before = await admin.list_offsets(
+        table_path,
+        bucket_ids=[0],
+        offset_spec=fluss.OffsetSpec.timestamp(before_append_ms),
+    )
+    assert ts_before[0] == 0
+
+    # The timestamp captured after the append must resolve to offset 3
+    ts_after = await admin.list_offsets(
+        table_path,
+        bucket_ids=[0],
+        offset_spec=fluss.OffsetSpec.timestamp(after_append_ms),
+    )
+    assert ts_after[0] == 3
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_project(connection, admin):
+    """Scan a log table through projections chosen by name and by index."""
+    proj_path = fluss.TablePath("fluss", "py_test_project")
+    await admin.drop_table(proj_path, ignore_if_not_exists=True)
+
+    proj_schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("col_a", pa.int32()),
+                pa.field("col_b", pa.string()),
+                pa.field("col_c", pa.int32()),
+            ]
+        )
+    )
+    descriptor = fluss.TableDescriptor(proj_schema)
+    await admin.create_table(proj_path, descriptor, ignore_if_exists=False)
+
+    log_table = await connection.get_table(proj_path)
+    writer = log_table.new_append().create_writer()
+
+    rows = pa.RecordBatch.from_arrays(
+        [
+            pa.array([1, 2, 3], type=pa.int32()),
+            pa.array(["x", "y", "z"]),
+            pa.array([10, 20, 30], type=pa.int32()),
+        ],
+        schema=pa.schema(
+            [
+                pa.field("col_a", pa.int32()),
+                pa.field("col_b", pa.string()),
+                pa.field("col_c", pa.int32()),
+            ]
+        ),
+    )
+    writer.write_arrow_batch(rows)
+    await writer.flush()
+
+    # Projection by name: keep only col_b and col_c.
+    named_scan = log_table.new_scan().project_by_name(["col_b", "col_c"])
+    named_scanner = await named_scan.create_log_scanner()
+    named_scanner.subscribe_buckets({0: 0})
+
+    named_records = _poll_records(named_scanner, expected_count=3)
+    assert len(named_records) == 3
+
+    named_records.sort(key=lambda rec: rec.row["col_c"])
+    want_col_b = ["x", "y", "z"]
+    want_col_c = [10, 20, 30]
+    for i, rec in enumerate(named_records):
+        assert rec.row["col_b"] == want_col_b[i]
+        assert rec.row["col_c"] == want_col_c[i]
+        # The unselected column must be absent from the row.
+        assert "col_a" not in rec.row
+
+    # Projection by position: indices [1, 0] select col_b and col_a.
+    indexed_scanner = await log_table.new_scan().project([1, 0]).create_log_scanner()
+    indexed_scanner.subscribe_buckets({0: 0})
+
+    indexed_records = _poll_records(indexed_scanner, expected_count=3)
+    assert len(indexed_records) == 3
+
+    indexed_records.sort(key=lambda rec: rec.row["col_a"])
+    for i, rec in enumerate(indexed_records):
+        assert rec.row["col_b"] == want_col_b[i]
+        assert rec.row["col_a"] == [1, 2, 3][i]
+        assert "col_c" not in rec.row
+
+    await admin.drop_table(proj_path, ignore_if_not_exists=False)
+
+
+async def test_poll_batches(connection, admin):
+    """Batch scanner: empty poll, continued offsets, mid-offset start, projection."""
+    table_path = fluss.TablePath("fluss", "py_test_poll_batches")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    )
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    await asyncio.sleep(1)  # presumably lets the new table initialize
+
+    table = await connection.get_table(table_path)
+    scanner = await table.new_scan().create_record_batch_log_scanner()
+    scanner.subscribe(bucket_id=0, start_offset=0)
+
+    # Polling before anything has been written must yield zero rows
+    result = scanner.poll_arrow(500)  # 500 is presumably a timeout in ms
+    assert result.num_rows == 0
+
+    writer = table.new_append().create_writer()
+    pa_schema = pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [pa.array([1, 2], type=pa.int32()), pa.array(["a", "b"])],
+            schema=pa_schema,
+        )
+    )
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [pa.array([3, 4], type=pa.int32()), pa.array(["c", "d"])],
+            schema=pa_schema,
+        )
+    )
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [pa.array([5, 6], type=pa.int32()), pa.array(["e", "f"])],
+            schema=pa_schema,
+        )
+    )
+    await writer.flush()
+
+    # Gather ids through _poll_arrow_ids (helper defined elsewhere in this file)
+    all_ids = _poll_arrow_ids(scanner, expected_count=6)
+    assert all_ids == [1, 2, 3, 4, 5, 6]
+
+    # The same scanner must continue after id 6: only the new ids 7 and 8 arrive
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [pa.array([7, 8], type=pa.int32()), pa.array(["g", "h"])],
+            schema=pa_schema,
+        )
+    )
+    await writer.flush()
+
+    new_ids = _poll_arrow_ids(scanner, expected_count=2)
+    assert new_ids == [7, 8]
+
+    # A fresh scanner starting at offset 3 skips the first three rows (ids 1-3)
+    trunc_scanner = await table.new_scan().create_record_batch_log_scanner()
+    trunc_scanner.subscribe(bucket_id=0, start_offset=3)
+
+    trunc_ids = _poll_arrow_ids(trunc_scanner, expected_count=5)
+    assert trunc_ids == [4, 5, 6, 7, 8]
+
+    # With project_by_name(["id"]) the first polled batch carries a single column
+    proj_scanner = (
+        await table.new_scan()
+        .project_by_name(["id"])
+        .create_record_batch_log_scanner()
+    )
+    proj_scanner.subscribe(bucket_id=0, start_offset=0)
+    batches = proj_scanner.poll_record_batch(10000)
+    assert len(batches) > 0
+    assert batches[0].batch.num_columns == 1
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_to_arrow_and_to_pandas(connection, admin):
+    """Check that to_arrow() and to_pandas() return every row and both columns."""
+    log_path = fluss.TablePath("fluss", "py_test_to_arrow_pandas")
+    await admin.drop_table(log_path, ignore_if_not_exists=True)
+
+    log_schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    )
+    descriptor = fluss.TableDescriptor(log_schema)
+    await admin.create_table(log_path, descriptor, ignore_if_exists=False)
+
+    log_table = await connection.get_table(log_path)
+    appender = log_table.new_append().create_writer()
+
+    columns = pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    appender.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [pa.array([1, 2, 3], type=pa.int32()), pa.array(["a", "b", "c"])],
+            schema=columns,
+        )
+    )
+    await appender.flush()
+
+    n_buckets = (await admin.get_table_info(log_path)).num_buckets
+
+    # First scanner: collect everything through to_arrow().
+    arrow_scanner = await log_table.new_scan().create_record_batch_log_scanner()
+    arrow_scanner.subscribe_buckets({b: fluss.EARLIEST_OFFSET for b in range(n_buckets)})
+    as_arrow = arrow_scanner.to_arrow()
+    assert as_arrow.num_rows == 3
+    assert as_arrow.schema.names == ["id", "name"]
+
+    # Second, independent scanner: collect everything through to_pandas().
+    frame_scanner = await log_table.new_scan().create_record_batch_log_scanner()
+    frame_scanner.subscribe_buckets({b: fluss.EARLIEST_OFFSET for b in range(n_buckets)})
+    frame = frame_scanner.to_pandas()
+    assert len(frame) == 3
+    assert list(frame.columns) == ["id", "name"]
+
+    await admin.drop_table(log_path, ignore_if_not_exists=False)
+
+
+async def test_partitioned_table_append_scan(connection, admin):
+    """Test append and scan on a partitioned log table."""
+    table_path = fluss.TablePath("fluss", "py_test_partitioned_log_append")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("id", pa.int32()),
+                pa.field("region", pa.string()),
+                pa.field("value", pa.int64()),
+            ]
+        )
+    )
+    table_descriptor = fluss.TableDescriptor(
+        schema,
+        partition_keys=["region"],
+    )
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    # Create partitions
+    for region in ["US", "EU"]:
+        await admin.create_partition(
+            table_path, {"region": region}, ignore_if_exists=True
+        )
+
+    await asyncio.sleep(2)  # Wait for partitions to be available
+
+    table = await connection.get_table(table_path)
+    append_writer = table.new_append().create_writer()
+
+    # Append rows
+    test_data = [
+        (1, "US", 100),
+        (2, "US", 200),
+        (3, "EU", 300),
+        (4, "EU", 400),
+    ]
+    for id_, region, value in test_data:
+        append_writer.append({"id": id_, "region": region, "value": value})
+    await append_writer.flush()
+
+    # Append arrow batches per partition
+    pa_schema = pa.schema(
+        [
+            pa.field("id", pa.int32()),
+            pa.field("region", pa.string()),
+            pa.field("value", pa.int64()),
+        ]
+    )
+    us_batch = pa.RecordBatch.from_arrays(
+        [
+            pa.array([5, 6], type=pa.int32()),
+            pa.array(["US", "US"]),
+            pa.array([500, 600], type=pa.int64()),
+        ],
+        schema=pa_schema,
+    )
+    append_writer.write_arrow_batch(us_batch)
+
+    eu_batch = pa.RecordBatch.from_arrays(
+        [
+            pa.array([7, 8], type=pa.int32()),
+            pa.array(["EU", "EU"]),
+            pa.array([700, 800], type=pa.int64()),
+        ],
+        schema=pa_schema,
+    )
+    append_writer.write_arrow_batch(eu_batch)
+    await append_writer.flush()
+
+    # Verify partition offsets
+    us_offsets = await admin.list_partition_offsets(
+        table_path,
+        partition_name="US",
+        bucket_ids=[0],
+        offset_spec=fluss.OffsetSpec.latest(),
+    )
+    assert us_offsets[0] == 4, "US partition should have 4 records"
+
+    eu_offsets = await admin.list_partition_offsets(
+        table_path,
+        partition_name="EU",
+        bucket_ids=[0],
+        offset_spec=fluss.OffsetSpec.latest(),
+    )
+    assert eu_offsets[0] == 4, "EU partition should have 4 records"
+
+    # Scan all partitions
+    scanner = await table.new_scan().create_log_scanner()
+    partition_infos = await admin.list_partition_infos(table_path)
+    for p in partition_infos:
+        scanner.subscribe_partition(
+            partition_id=p.partition_id, bucket_id=0, start_offset=0
+        )
+
+    expected = [
+        (1, "US", 100),
+        (2, "US", 200),
+        (3, "EU", 300),
+        (4, "EU", 400),
+        (5, "US", 500),
+        (6, "US", 600),
+        (7, "EU", 700),
+        (8, "EU", 800),
+    ]
+
+    records = _poll_records(scanner, expected_count=8)
+    assert len(records) == 8
+
+    collected = sorted(
+        [(r.row["id"], r.row["region"], r.row["value"]) for r in records],
+        key=lambda x: x[0],
+    )
+    assert collected == expected
+
+    # Test unsubscribe_partition: unsubscribe from EU, only US data should remain
+    unsub_scanner = await table.new_scan().create_log_scanner()
+    eu_partition_id = next(
+        p.partition_id for p in partition_infos if p.partition_name == "EU"
+    )
+    for p in partition_infos:
+        unsub_scanner.subscribe_partition(p.partition_id, 0, 0)
+    unsub_scanner.unsubscribe_partition(eu_partition_id, 0)
+
+    remaining = _poll_records(unsub_scanner, expected_count=4, timeout_s=5)
+    assert len(remaining) == 4
+    assert all(r.row["region"] == "US" for r in remaining)
+
+    # Test subscribe_partition_buckets (batch subscribe)
+    batch_scanner = await table.new_scan().create_log_scanner()
+    partition_bucket_offsets = {
+        (p.partition_id, 0): fluss.EARLIEST_OFFSET for p in partition_infos
+    }
+    batch_scanner.subscribe_partition_buckets(partition_bucket_offsets)
+
+    batch_records = _poll_records(batch_scanner, expected_count=8)
+    assert len(batch_records) == 8
+    batch_collected = sorted(
+        [(r.row["id"], r.row["region"], r.row["value"]) for r in batch_records],
+        key=lambda x: x[0],
+    )
+    assert batch_collected == expected
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_write_arrow(connection, admin):
+    """Test writing a full PyArrow Table via write_arrow()."""
+    table_path = fluss.TablePath("fluss", "py_test_write_arrow")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    )
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+
+    pa_schema = pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    arrow_table = pa.table(
+        {
+            "id": pa.array([1, 2, 3, 4, 5], type=pa.int32()),
+            "name": pa.array(["alice", "bob", "charlie", "dave", "eve"]),
+        },
+        schema=pa_schema,
+    )
+    writer.write_arrow(arrow_table)
+    await writer.flush()
+
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner = await table.new_scan().create_record_batch_log_scanner()
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+    result = scanner.to_arrow()
+    assert result.num_rows == 5
+
+    ids = sorted(result.column("id").to_pylist())
+    names = [
+        n
+        for _, n in sorted(
+            zip(result.column("id").to_pylist(), result.column("name").to_pylist())
+        )
+    ]
+    assert ids == [1, 2, 3, 4, 5]
+    assert names == ["alice", "bob", "charlie", "dave", "eve"]
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_write_pandas(connection, admin):
+    """Test writing a Pandas DataFrame via write_pandas()."""
+    import pandas as pd
+
+    table_path = fluss.TablePath("fluss", "py_test_write_pandas")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    )
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+
+    df = pd.DataFrame({"id": [10, 20, 30], "name": ["x", "y", "z"]})
+    writer.write_pandas(df)
+    await writer.flush()
+
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner = await table.new_scan().create_record_batch_log_scanner()
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+    result = scanner.to_pandas()
+    assert len(result) == 3
+
+    result_sorted = result.sort_values("id").reset_index(drop=True)
+    assert result_sorted["id"].tolist() == [10, 20, 30]
+    assert result_sorted["name"].tolist() == ["x", "y", "z"]
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_partitioned_table_to_arrow(connection, admin):
+    """Test to_arrow() on partitioned tables."""
+    table_path = fluss.TablePath("fluss", "py_test_partitioned_to_arrow")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("id", pa.int32()),
+                pa.field("region", pa.string()),
+                pa.field("value", pa.int64()),
+            ]
+        )
+    )
+    table_descriptor = fluss.TableDescriptor(schema, partition_keys=["region"])
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    for region in ["US", "EU"]:
+        await admin.create_partition(
+            table_path, {"region": region}, ignore_if_exists=True
+        )
+
+    await asyncio.sleep(2)
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+    writer.append({"id": 1, "region": "US", "value": 100})
+    writer.append({"id": 2, "region": "EU", "value": 200})
+    await writer.flush()
+
+    scanner = await table.new_scan().create_record_batch_log_scanner()
+    partition_infos = await admin.list_partition_infos(table_path)
+    for p in partition_infos:
+        scanner.subscribe_partition(p.partition_id, 0, fluss.EARLIEST_OFFSET)
+
+    arrow_table = scanner.to_arrow()
+    assert arrow_table.num_rows == 2
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+
+def _poll_records(scanner, expected_count, timeout_s=10):
+    """Poll a record-based scanner until expected_count records are collected."""
+    collected = []
+    deadline = time.monotonic() + timeout_s
+    while len(collected) < expected_count and time.monotonic() < deadline:
+        records = scanner.poll(5000)
+        collected.extend(records)
+    return collected
+
+
+def _poll_arrow_ids(scanner, expected_count, timeout_s=10):
+    """Poll a batch scanner and extract 'id' column values."""
+    all_ids = []
+    deadline = time.monotonic() + timeout_s
+    while len(all_ids) < expected_count and time.monotonic() < deadline:
+        arrow_table = scanner.poll_arrow(5000)
+        if arrow_table.num_rows > 0:
+            all_ids.extend(arrow_table.column("id").to_pylist())
+    return all_ids
diff --git a/fluss-rust/website/docs/developer-guide/contributing.md b/fluss-rust/website/docs/developer-guide/contributing.md
index eced106aad..38b792e8e6 100644
--- a/fluss-rust/website/docs/developer-guide/contributing.md
+++ b/fluss-rust/website/docs/developer-guide/contributing.md
@@ -82,7 +82,7 @@ cargo build --workspace --all-targets
 # Run unit tests
 cargo test --workspace
 
-# Run integration tests (requires a running Fluss cluster)
+# Run integration tests (requires Docker)
 RUST_TEST_THREADS=1 cargo test --features integration_tests --workspace
 
 # Run a single test
@@ -93,9 +93,15 @@ cargo test test_name
 
 ```bash
 cd bindings/python
-pip install maturin
-pip install -e ".[dev]"
-maturin develop
+
+# Install dev dependencies and build the extension
+uv sync --extra dev && uv run maturin develop
+
+# Run integration tests (requires Docker)
+uv run pytest test/ -v
+
+# To run against an existing cluster instead
+FLUSS_BOOTSTRAP_SERVERS=127.0.0.1:9123 uv run pytest test/ -v
 ```
 
 ### C++ Bindings

From 56d5ca1af8ca69200d44b860d238113475a5f411 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Tue, 17 Feb 2026 12:27:54 +0000
Subject: [PATCH 154/287] chore: Fix issue where interleaving non-Pk column
 with PK columns cause lookup panic (#346)

---
 fluss-rust/bindings/python/src/lookup.rs      |  4 +-
 fluss-rust/bindings/python/src/table.rs       | 52 ++++++++++++++++---
 .../bindings/python/test/test_kv_table.py     |  4 +-
 .../bindings/python/test/test_log_table.py    |  3 ++
 4 files changed, 53 insertions(+), 10 deletions(-)

diff --git a/fluss-rust/bindings/python/src/lookup.rs b/fluss-rust/bindings/python/src/lookup.rs
index 718f8e5038..e2edbf415a 100644
--- a/fluss-rust/bindings/python/src/lookup.rs
+++ b/fluss-rust/bindings/python/src/lookup.rs
@@ -15,7 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::table::{internal_row_to_dict, python_to_sparse_generic_row};
+use crate::table::{internal_row_to_dict, python_to_dense_generic_row};
 use crate::*;
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::sync::Arc;
@@ -53,7 +53,7 @@ impl Lookuper {
         pk: &Bound<'_, PyAny>,
     ) -> PyResult<Bound<'py, PyAny>> {
         let pk_indices = self.table_info.get_schema().primary_key_indexes();
-        let generic_row = python_to_sparse_generic_row(pk, &self.table_info, &pk_indices)?;
+        let generic_row = python_to_dense_generic_row(pk, &self.table_info, &pk_indices)?;
         let inner = self.inner.clone();
         let table_info = self.table_info.clone();
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 80852152e1..c3ea248e04 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -783,6 +783,7 @@ fn process_sequence(
     target_indices: &[usize],
     fields: &[fcore::metadata::DataField],
     datums: &mut [fcore::row::Datum<'static>],
+    sparse: bool,
 ) -> PyResult<()> {
     if seq.len()? != target_indices.len() {
         return Err(FlussError::new_err(format!(
@@ -794,7 +795,8 @@ fn process_sequence(
     for (i, &col_idx) in target_indices.iter().enumerate() {
         let field = &fields[col_idx];
         let value = seq.get_item(i)?;
-        datums[col_idx] = python_value_to_datum(&value, field.data_type())
+        let dest = if sparse { col_idx } else { i };
+        datums[dest] = python_value_to_datum(&value, field.data_type())
             .map_err(|e| FlussError::new_err(format!("Field '{}': {}", field.name(), e)))?;
     }
     Ok(())
@@ -806,12 +808,37 @@ pub fn python_to_sparse_generic_row(
     row: &Bound<PyAny>,
     table_info: &fcore::metadata::TableInfo,
     target_indices: &[usize],
+) -> PyResult<fcore::row::GenericRow<'static>> {
+    python_to_generic_row_inner(row, table_info, target_indices, true)
+}
+
+/// Build a dense GenericRow with exactly `target_indices.len()` fields,
+/// containing only the target column values in order.
+pub fn python_to_dense_generic_row(
+    row: &Bound<PyAny>,
+    table_info: &fcore::metadata::TableInfo,
+    target_indices: &[usize],
+) -> PyResult<fcore::row::GenericRow<'static>> {
+    python_to_generic_row_inner(row, table_info, target_indices, false)
+}
+
+/// Build a GenericRow from user input. When `sparse` is true, the row is full width and padded with nulls; otherwise it is dense and holds only the target columns, in order.
+fn python_to_generic_row_inner(
+    row: &Bound<PyAny>,
+    table_info: &fcore::metadata::TableInfo,
+    target_indices: &[usize],
+    sparse: bool,
 ) -> PyResult<fcore::row::GenericRow<'static>> {
     let row_type = table_info.row_type();
     let fields = row_type.fields();
     let target_names: Vec<&str> = target_indices.iter().map(|&i| fields[i].name()).collect();
 
-    let mut datums: Vec<fcore::row::Datum<'static>> = vec![fcore::row::Datum::Null; fields.len()];
+    let num_fields = if sparse {
+        fields.len()
+    } else {
+        target_indices.len()
+    };
+    let mut datums: Vec<fcore::row::Datum<'static>> = vec![fcore::row::Datum::Null; num_fields];
 
     let row_input: RowInput = row.extract().map_err(|_| {
         let type_name = row
@@ -849,19 +876,30 @@ pub fn python_to_sparse_generic_row(
                 let value = dict
                     .get_item(name)?
                     .ok_or_else(|| FlussError::new_err(format!("Missing field: {name}")))?;
-                datums[col_idx] = python_value_to_datum(&value, field.data_type())
+                let dest = if sparse { col_idx } else { i };
+                datums[dest] = python_value_to_datum(&value, field.data_type())
                     .map_err(|e| FlussError::new_err(format!("Field '{name}': {e}")))?;
             }
         }
 
         RowInput::List(list) => {
-            let seq = list.as_sequence();
-            process_sequence(seq, target_indices, fields, &mut datums)?;
+            process_sequence(
+                list.as_sequence(),
+                target_indices,
+                fields,
+                &mut datums,
+                sparse,
+            )?;
         }
 
         RowInput::Tuple(tuple) => {
-            let seq = tuple.as_sequence();
-            process_sequence(seq, target_indices, fields, &mut datums)?;
+            process_sequence(
+                tuple.as_sequence(),
+                target_indices,
+                fields,
+                &mut datums,
+                sparse,
+            )?;
         }
     }
 
diff --git a/fluss-rust/bindings/python/test/test_kv_table.py b/fluss-rust/bindings/python/test/test_kv_table.py
index 98b0cee969..36aa3e463b 100644
--- a/fluss-rust/bindings/python/test/test_kv_table.py
+++ b/fluss-rust/bindings/python/test/test_kv_table.py
@@ -101,12 +101,14 @@ async def test_composite_primary_keys(connection, admin):
     table_path = fluss.TablePath("fluss", "py_test_composite_pk")
     await admin.drop_table(table_path, ignore_if_not_exists=True)
 
+    # PK columns intentionally interleaved with non-PK column to verify
+    # that lookup correctly handles non-contiguous primary key indices.
     schema = fluss.Schema(
         pa.schema(
             [
                 pa.field("region", pa.string()),
-                pa.field("user_id", pa.int32()),
                 pa.field("score", pa.int64()),
+                pa.field("user_id", pa.int32()),
             ]
         ),
         primary_keys=["region", "user_id"],
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
index 3219f03c0d..09586aa8de 100644
--- a/fluss-rust/bindings/python/test/test_log_table.py
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -179,6 +179,9 @@ async def test_list_offsets(connection, admin):
     )
     assert ts_before[0] == 0
 
+    # Intentional sleep to avoid a race condition that raises FlussError(code=38): "The timestamp is invalid"
+    await asyncio.sleep(1)
+
     # Timestamp after append should resolve to offset 3
     ts_after = await admin.list_offsets(
         table_path,

From bb685325da75ca1ec3e8dc80a769513b5cd59b10 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Tue, 17 Feb 2026 13:01:59 +0000
Subject: [PATCH 155/287] chore: add API reference for CustomProperty (#336)

---
 .../docs/user-guide/cpp/api-reference.md      | 52 ++++++++++---------
 .../docs/user-guide/rust/api-reference.md     | 39 +++++++-------
 2 files changed, 48 insertions(+), 43 deletions(-)

diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index 9cba2431b2..681394ae48 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -286,15 +286,16 @@ When using `table.NewRow()`, the `Set()` method auto-routes to the correct type
 
 ## `TableDescriptor::Builder`
 
-| Method                                                                      |  Description               |
-|-----------------------------------------------------------------------------|----------------------------|
-| `SetSchema(const Schema& schema) -> Builder&`                               | Set the table schema       |
-| `SetPartitionKeys(const std::vector<std::string>& keys) -> Builder&`        | Set partition key columns  |
-| `SetBucketCount(int32_t count) -> Builder&`                                 | Set the number of buckets  |
-| `SetBucketKeys(const std::vector<std::string>& keys) -> Builder&`           | Set bucket key columns     |
-| `SetProperty(const std::string& key, const std::string& value) -> Builder&` | Set a table property       |
-| `SetComment(const std::string& comment) -> Builder&`                        | Set a table comment        |
-| `Build() -> TableDescriptor`                                                | Build the table descriptor |
+| Method                                                                            | Description                |
+|-----------------------------------------------------------------------------------|----------------------------|
+| `SetSchema(const Schema& schema) -> Builder&`                                     | Set the table schema       |
+| `SetPartitionKeys(const std::vector<std::string>& keys) -> Builder&`              | Set partition key columns  |
+| `SetBucketCount(int32_t count) -> Builder&`                                       | Set the number of buckets  |
+| `SetBucketKeys(const std::vector<std::string>& keys) -> Builder&`                 | Set bucket key columns     |
+| `SetProperty(const std::string& key, const std::string& value) -> Builder&`       | Set a table property       |
+| `SetCustomProperty(const std::string& key, const std::string& value) -> Builder&` | Set a custom property      |
+| `SetComment(const std::string& comment) -> Builder&`                              | Set a table comment        |
+| `Build() -> TableDescriptor`                                                      | Build the table descriptor |
 
 ## `DataType`
 
@@ -336,22 +337,23 @@ When using `table.NewRow()`, the `Set()` method auto-routes to the correct type
 
 ## `TableInfo`
 
-| Field             | Type                                           |  Description                        |
-|-------------------|------------------------------------------------|-------------------------------------|
-| `table_id`        | `int64_t`                                      | Table ID                            |
-| `schema_id`       | `int32_t`                                      | Schema ID                           |
-| `table_path`      | `TablePath`                                    | Table path                          |
-| `created_time`    | `int64_t`                                      | Creation timestamp                  |
-| `modified_time`   | `int64_t`                                      | Last modification timestamp         |
-| `primary_keys`    | `std::vector<std::string>`                     | Primary key columns                 |
-| `bucket_keys`     | `std::vector<std::string>`                     | Bucket key columns                  |
-| `partition_keys`  | `std::vector<std::string>`                     | Partition key columns               |
-| `num_buckets`     | `int32_t`                                      | Number of buckets                   |
-| `has_primary_key` | `bool`                                         | Whether the table has a primary key |
-| `is_partitioned`  | `bool`                                         | Whether the table is partitioned    |
-| `properties`      | `std::unordered_map<std::string, std::string>` | Table properties                    |
-| `comment`         | `std::string`                                  | Table comment                       |
-| `schema`          | `Schema`                                       | Table schema                        |
+| Field               | Type                                           | Description                         |
+|---------------------|------------------------------------------------|-------------------------------------|
+| `table_id`          | `int64_t`                                      | Table ID                            |
+| `schema_id`         | `int32_t`                                      | Schema ID                           |
+| `table_path`        | `TablePath`                                    | Table path                          |
+| `created_time`      | `int64_t`                                      | Creation timestamp                  |
+| `modified_time`     | `int64_t`                                      | Last modification timestamp         |
+| `primary_keys`      | `std::vector<std::string>`                     | Primary key columns                 |
+| `bucket_keys`       | `std::vector<std::string>`                     | Bucket key columns                  |
+| `partition_keys`    | `std::vector<std::string>`                     | Partition key columns               |
+| `num_buckets`       | `int32_t`                                      | Number of buckets                   |
+| `has_primary_key`   | `bool`                                         | Whether the table has a primary key |
+| `is_partitioned`    | `bool`                                         | Whether the table is partitioned    |
+| `properties`        | `std::unordered_map<std::string, std::string>` | Table properties                    |
+| `custom_properties` | `std::unordered_map<std::string, std::string>` | Custom properties                   |
+| `comment`           | `std::string`                                  | Table comment                       |
+| `schema`            | `Schema`                                       | Table schema                        |
 
 ## Temporal Types
 
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 0929ce68be..0134fbce31 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -239,27 +239,30 @@ writer.append(&row)?.await?;
 
 ## `TableDescriptor`
 
-| Method                                             |  Description                         |
-|----------------------------------------------------|--------------------------------------|
-| `fn builder() -> TableDescriptorBuilder`           | Create a table descriptor builder    |
-| `fn schema(&self) -> &Schema`                      | Get the table schema                 |
-| `fn partition_keys(&self) -> &[String]`            | Get partition key column names       |
-| `fn has_primary_key(&self) -> bool`                | Check if the table has a primary key |
-| `fn properties(&self) -> &HashMap<String, String>` | Get all table properties             |
-| `fn comment(&self) -> Option<&str>`                | Get table comment                    |
+| Method                                                    | Description                          |
+|-----------------------------------------------------------|--------------------------------------|
+| `fn builder() -> TableDescriptorBuilder`                  | Create a table descriptor builder    |
+| `fn schema(&self) -> &Schema`                             | Get the table schema                 |
+| `fn partition_keys(&self) -> &[String]`                   | Get partition key column names       |
+| `fn has_primary_key(&self) -> bool`                       | Check if the table has a primary key |
+| `fn properties(&self) -> &HashMap<String, String>`        | Get all table properties             |
+| `fn custom_properties(&self) -> &HashMap<String, String>` | Get custom properties                |
+| `fn comment(&self) -> Option<&str>`                       | Get table comment                    |
 
 ## `TableDescriptorBuilder`
 
-| Method                                                                           |  Description                                |
-|----------------------------------------------------------------------------------|---------------------------------------------|
-| `fn schema(schema: Schema) -> Self`                                              | Set the schema                              |
-| `fn log_format(format: LogFormat) -> Self`                                       | Set log format (e.g., `LogFormat::ARROW`)   |
-| `fn kv_format(format: KvFormat) -> Self`                                         | Set KV format (e.g., `KvFormat::COMPACTED`) |
-| `fn property(key: &str, value: &str) -> Self`                                    | Set a table property                        |
-| `fn partitioned_by(keys: Vec<&str>) -> Self`                                     | Set partition columns                       |
-| `fn distributed_by(bucket_count: Option<i32>, bucket_keys: Vec<String>) -> Self` | Set bucket distribution                     |
-| `fn comment(comment: &str) -> Self`                                              | Set table comment                           |
-| `fn build() -> Result<TableDescriptor>`                                          | Build the table descriptor                  |
+| Method                                                                                    | Description                                 |
+|-------------------------------------------------------------------------------------------|---------------------------------------------|
+| `fn schema(schema: Schema) -> Self`                                                       | Set the schema                              |
+| `fn log_format(format: LogFormat) -> Self`                                                | Set log format (e.g., `LogFormat::ARROW`)   |
+| `fn kv_format(format: KvFormat) -> Self`                                                  | Set KV format (e.g., `KvFormat::COMPACTED`) |
+| `fn property(key: &str, value: &str) -> Self`                                             | Set a table property                        |
+| `fn custom_property(key: impl Into<String>, value: impl Into<String>) -> Self`            | Set a single custom property                |
+| `fn custom_properties(properties: HashMap<impl Into<String>, impl Into<String>>) -> Self` | Set custom properties                       |
+| `fn partitioned_by(keys: Vec<&str>) -> Self`                                              | Set partition columns                       |
+| `fn distributed_by(bucket_count: Option<i32>, bucket_keys: Vec<String>) -> Self`          | Set bucket distribution                     |
+| `fn comment(comment: &str) -> Self`                                                       | Set table comment                           |
+| `fn build() -> Result<TableDescriptor>`                                                   | Build the table descriptor                  |
 
 ## `TablePath`
 

From 11299f2ce46cb7a00ba48b594e9cbbb3841b0e33 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Wed, 18 Feb 2026 01:05:25 +0000
Subject: [PATCH 156/287] chore: add missing ChangeType enum and doc in C++.
 Add test coverage for ChangeType in integration test. (#334)

---
 .../docs/user-guide/cpp/api-reference.md      | 39 ++++++++++++++++---
 1 file changed, 33 insertions(+), 6 deletions(-)

diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index 681394ae48..3b93916905 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -226,12 +226,14 @@ When using `table.NewRow()`, the `Set()` method auto-routes to the correct type
 
 ## `ScanRecord`
 
-| Field       | Type         |  Description                  |
-|-------------|--------------|-------------------------------|
-| `bucket_id` | `int32_t`    | Bucket this record belongs to |
-| `offset`    | `int64_t`    | Record offset in the log      |
-| `timestamp` | `int64_t`    | Record timestamp              |
-| `row`       | `GenericRow` | Row data                      |
+| Field          | Type                     | Description                                                         |
+|----------------|--------------------------|---------------------------------------------------------------------|
+| `bucket_id`    | `int32_t`                | Bucket this record belongs to                                       |
+| `partition_id` | `std::optional<int64_t>` | Partition ID (present only for partitioned tables)                  |
+| `offset`       | `int64_t`                | Record offset in the log                                            |
+| `timestamp`    | `int64_t`                | Record timestamp                                                    |
+| `change_type`  | `ChangeType`             | Change type (AppendOnly, Insert, UpdateBefore, UpdateAfter, Delete) |
+| `row`          | `RowView`                | Row data                                                            |
 
 ## `ScanRecords`
 
@@ -450,6 +452,31 @@ scanner.Subscribe(0, offsets[0]);
 
 ## Enums
 
+### `ChangeType`
+
+| Value          | Short String | Description                      |
+|----------------|--------------|----------------------------------|
+| `AppendOnly`   | `+A`         | Append-only record               |
+| `Insert`       | `+I`         | Inserted row                     |
+| `UpdateBefore` | `-U`         | Previous value of an updated row |
+| `UpdateAfter`  | `+U`         | New value of an updated row      |
+| `Delete`       | `-D`         | Deleted row                      |
+
+The following example shows how to convert a `ChangeType` value to its short string representation.
+
+```cpp
+inline const char* ChangeTypeShortString(ChangeType ct) {
+    switch (ct) {
+        case ChangeType::AppendOnly: return "+A";
+        case ChangeType::Insert: return "+I";
+        case ChangeType::UpdateBefore: return "-U";
+        case ChangeType::UpdateAfter: return "+U";
+        case ChangeType::Delete: return "-D";
+    }
+    throw std::invalid_argument("Unknown ChangeType");
+}
+```
+
 ### `TypeId`
 
 | Value          |  Description               |

From 70160fd0977b4c0ee047c8a6a3df8e180293421e Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Wed, 18 Feb 2026 01:42:34 +0000
Subject: [PATCH 157/287] chore: fix sparse to dense representation for CPP
 lookup (#348)

---
 .../bindings/cpp/examples/kv_example.cpp      | 29 ++++++++++---------
 fluss-rust/bindings/cpp/src/lib.rs            | 22 +++++++++-----
 2 files changed, 30 insertions(+), 21 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/kv_example.cpp b/fluss-rust/bindings/cpp/examples/kv_example.cpp
index 497894f5cc..46ed01f682 100644
--- a/fluss-rust/bindings/cpp/examples/kv_example.cpp
+++ b/fluss-rust/bindings/cpp/examples/kv_example.cpp
@@ -371,11 +371,13 @@ int main() {
     fluss::TablePath partitioned_kv_path("fluss", "partitioned_kv_cpp_v1");
     admin.DropTable(partitioned_kv_path, true);
 
+    // PK columns intentionally interleaved with non-PK columns to verify
+    // that lookup correctly builds a dense PK-only row (not sparse full-width).
     auto partitioned_kv_schema = fluss::Schema::NewBuilder()
                                      .AddColumn("region", fluss::DataType::String())
+                                     .AddColumn("score", fluss::DataType::BigInt())
                                      .AddColumn("user_id", fluss::DataType::Int())
                                      .AddColumn("name", fluss::DataType::String())
-                                     .AddColumn("score", fluss::DataType::BigInt())
                                      .SetPrimaryKeys({"region", "user_id"})
                                      .Build();
 
@@ -403,23 +405,24 @@ int main() {
           partitioned_kv_table.NewUpsert().CreateWriter(partitioned_writer));
 
     // Upsert rows across partitions
+    // Column order: region(0), score(1), user_id(2), name(3)
     struct TestRow {
         const char* region;
+        int64_t score;
         int32_t user_id;
         const char* name;
-        int64_t score;
     };
     TestRow test_data[] = {
-        {"US", 1, "Gustave", 100}, {"US", 2, "Lune", 200},   {"EU", 1, "Sciel", 150},
-        {"EU", 2, "Maelle", 250},  {"APAC", 1, "Noco", 300},
+        {"US", 100, 1, "Gustave"}, {"US", 200, 2, "Lune"},   {"EU", 150, 1, "Sciel"},
+        {"EU", 250, 2, "Maelle"},  {"APAC", 300, 1, "Noco"},
     };
 
     for (const auto& td : test_data) {
         auto row = partitioned_kv_table.NewRow();
         row.Set("region", td.region);
+        row.Set("score", td.score);
         row.Set("user_id", td.user_id);
         row.Set("name", td.name);
-        row.Set("score", td.score);
         check("partitioned_upsert", partitioned_writer.Upsert(row));
     }
     check("partitioned_flush", partitioned_writer.Flush());
@@ -442,7 +445,7 @@ int main() {
                       << std::endl;
             std::exit(1);
         }
-        if (result.GetString(2) != td.name || result.GetInt64(3) != td.score) {
+        if (result.GetString(3) != td.name || result.GetInt64(1) != td.score) {
             std::cerr << "ERROR: Data mismatch for region=" << td.region
                       << " user_id=" << td.user_id << std::endl;
             std::exit(1);
@@ -454,9 +457,9 @@ int main() {
     {
         auto row = partitioned_kv_table.NewRow();
         row.Set("region", "US");
+        row.Set("score", static_cast<int64_t>(999));
         row.Set("user_id", 1);
         row.Set("name", "Gustave Updated");
-        row.Set("score", static_cast<int64_t>(999));
         fluss::WriteResult wr;
         check("partitioned_update", partitioned_writer.Upsert(row, wr));
         check("partitioned_update_wait", wr.Wait());
@@ -467,13 +470,13 @@ int main() {
         pk.Set("user_id", 1);
         fluss::LookupResult result;
         check("partitioned_lookup_updated", partitioned_lookuper.Lookup(pk, result));
-        if (!result.Found() || result.GetString(2) != "Gustave Updated" ||
-            result.GetInt64(3) != 999) {
+        if (!result.Found() || result.GetString(3) != "Gustave Updated" ||
+            result.GetInt64(1) != 999) {
             std::cerr << "ERROR: Partition update verification failed" << std::endl;
             std::exit(1);
         }
-        std::cout << "Update verified: US/1 name=" << result.GetString(2)
-                  << " score=" << result.GetInt64(3) << std::endl;
+        std::cout << "Update verified: US/1 name=" << result.GetString(3)
+                  << " score=" << result.GetInt64(1) << std::endl;
     }
 
     // Lookup in non-existent partition
@@ -520,11 +523,11 @@ int main() {
         pk.Set("user_id", 2);
         fluss::LookupResult result;
         check("partitioned_lookup_eu2", partitioned_lookuper.Lookup(pk, result));
-        if (!result.Found() || result.GetString(2) != "Maelle") {
+        if (!result.Found() || result.GetString(3) != "Maelle") {
             std::cerr << "ERROR: Expected EU/2 (Maelle) to still exist" << std::endl;
             std::exit(1);
         }
-        std::cout << "EU/2 still exists: name=" << result.GetString(2) << std::endl;
+        std::cout << "EU/2 still exists: name=" << result.GetString(3) << std::endl;
     }
 
     check("drop_partitioned_kv", admin.DropTable(partitioned_kv_path, true));
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 444b073578..cb29882d16 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -1321,20 +1321,26 @@ unsafe fn delete_lookuper(lookuper: *mut Lookuper) {
 }
 
 impl Lookuper {
-    /// Pad row with Null to full schema width (same as UpsertWriter::pad_row).
-    /// Ensures the PK row is always full-width, matching Python's behavior.
-    fn pad_row<'a>(&self, mut row: fcore::row::GenericRow<'a>) -> fcore::row::GenericRow<'a> {
-        let num_columns = self.table_info.get_schema().columns().len();
-        if row.values.len() < num_columns {
-            row.values.resize(num_columns, fcore::row::Datum::Null);
+    /// Build a dense PK-only row from a (possibly sparse) input row.
+    /// The user may set PK values at their full schema positions (e.g. [0, 2])
+    /// via name-based Set(). We compact them into [0, 1, …] to match
+    /// the lookup_row_type the core KeyEncoder expects.
+    fn dense_pk_row<'a>(&self, mut row: fcore::row::GenericRow<'a>) -> fcore::row::GenericRow<'a> {
+        let pk_indices = self.table_info.get_schema().primary_key_indexes();
+        let mut dense = fcore::row::GenericRow::new(pk_indices.len());
+        for (dense_idx, &schema_idx) in pk_indices.iter().enumerate() {
+            if schema_idx < row.values.len() {
+                dense.values[dense_idx] =
+                    std::mem::replace(&mut row.values[schema_idx], fcore::row::Datum::Null);
+            }
         }
-        row
+        dense
     }
 
     fn lookup(&mut self, pk_row: &GenericRowInner) -> Box<LookupResultInner> {
         let schema = self.table_info.get_schema();
         let generic_row = match types::resolve_row_types(&pk_row.row, Some(schema)) {
-            Ok(r) => self.pad_row(r),
+            Ok(r) => self.dense_pk_row(r),
             Err(e) => {
                 return Box::new(LookupResultInner::from_error(
                     CLIENT_ERROR_CODE,

From 74c92415644c61bae680f10b00a36c443148bd73 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Wed, 18 Feb 2026 02:10:29 +0000
Subject: [PATCH 158/287] chore: add CI for documentation. Minor improvement
 and organisation of website (#350)

---
 fluss-rust/.github/workflows/ci.yml           |  6 +++
 fluss-rust/.github/workflows/docs-check.yml   | 49 +++++++++++++++++++
 .../docs/developer-guide/_category_.json      |  4 --
 fluss-rust/website/docs/index.md              |  6 +--
 .../docs/release/generate-release-note.md     |  8 +--
 .../release/verifying-a-release-candidate.md  |  8 +--
 .../user-guide/cpp/example/_category_.json    |  2 +-
 .../user-guide/python/example/_category_.json |  2 +-
 .../user-guide/rust/example/_category_.json   |  2 +-
 fluss-rust/website/sidebars.ts                | 11 ++---
 10 files changed, 72 insertions(+), 26 deletions(-)
 create mode 100644 fluss-rust/.github/workflows/docs-check.yml
 delete mode 100644 fluss-rust/website/docs/developer-guide/_category_.json

diff --git a/fluss-rust/.github/workflows/ci.yml b/fluss-rust/.github/workflows/ci.yml
index 20bee8775f..d51e3c07df 100644
--- a/fluss-rust/.github/workflows/ci.yml
+++ b/fluss-rust/.github/workflows/ci.yml
@@ -21,9 +21,15 @@ on:
   push:
     branches:
       - main
+    paths-ignore:
+      - 'website/**'
+      - '**/*.md'
   pull_request:
     branches:
       - main
+    paths-ignore:
+      - 'website/**'
+      - '**/*.md'
 
 concurrency:
   group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
diff --git a/fluss-rust/.github/workflows/docs-check.yml b/fluss-rust/.github/workflows/docs-check.yml
new file mode 100644
index 0000000000..6408c54189
--- /dev/null
+++ b/fluss-rust/.github/workflows/docs-check.yml
@@ -0,0 +1,49 @@
+################################################################################
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+################################################################################
+
+# This workflow is meant for checking broken links in the documentation.
+name: Check Documentation
+permissions:
+  contents: read
+on:
+  pull_request:
+    branches: [main]
+    paths:
+      - 'website/**'
+  push:
+    branches: [main]
+    paths:
+      - 'website/**'
+
+jobs:
+  test-deploy:
+    runs-on: ubuntu-latest
+    defaults:
+      run:
+        working-directory: ./website
+    steps:
+      - uses: actions/checkout@v6
+        with:
+          fetch-depth: 0
+      - uses: actions/setup-node@v6
+        with:
+          node-version: 24
+      - name: Install dependencies
+        run: npm install
+      - name: Test build website
+        run: npm run build -- --no-minify
diff --git a/fluss-rust/website/docs/developer-guide/_category_.json b/fluss-rust/website/docs/developer-guide/_category_.json
deleted file mode 100644
index cc7b01abbc..0000000000
--- a/fluss-rust/website/docs/developer-guide/_category_.json
+++ /dev/null
@@ -1,4 +0,0 @@
-{
-  "label": "Developer Guide",
-  "position": 3
-}
diff --git a/fluss-rust/website/docs/index.md b/fluss-rust/website/docs/index.md
index 4153813877..e7d5e08a87 100644
--- a/fluss-rust/website/docs/index.md
+++ b/fluss-rust/website/docs/index.md
@@ -8,7 +8,7 @@ title: Introduction
 
 [Apache Fluss](https://fluss.apache.org/) (incubating) is a streaming storage system built for real-time analytics, serving as the real-time data layer for Lakehouse architectures.
 
-This documentation covers the **Fluss client libraries** for Rust, Python, and C++, which are developed in the [fluss-rust](https://github.com/apache/fluss-rust) repository. These clients allow you to:
+This documentation covers the **Fluss client libraries** for Rust, Python, and C++, which are developed in the [fluss-rust](https://github.com/apache/fluss-rust) repository, and links to the [Java client](https://fluss.apache.org/docs/0.9/apis/java-client/), which is part of the [main Fluss project](https://github.com/apache/fluss). These clients allow you to:
 
 - **Create and manage** databases, tables, and partitions
 - **Write** data to log tables (append-only) and primary key tables (upsert/delete)
@@ -40,6 +40,6 @@ You need a running Fluss cluster to use any of the client libraries. See the [De
 
 ## How This Guide Is Organised
 
-The **User Guide** walks through installation, configuration, and working with each table type across all three languages. Code examples are shown side by side under **Rust**, **Python**, and **C++** headings.
+The **Clients** section walks through installation, configuration, and working with each table type across all three languages. Code examples are shown side by side under **Rust**, **Python**, and **C++** headings.
 
-The **Developer Guide** covers building from source, running tests, and the release process for contributors.
+The **Contributing** guide covers building from source, running tests, and the release process for contributors.
diff --git a/fluss-rust/website/docs/release/generate-release-note.md b/fluss-rust/website/docs/release/generate-release-note.md
index edbc43bdbd..9db04a5cab 100644
--- a/fluss-rust/website/docs/release/generate-release-note.md
+++ b/fluss-rust/website/docs/release/generate-release-note.md
@@ -1,10 +1,10 @@
 # Generate Release Note
 
-Use GitHub's **Generate release notes** to produce a draft from merged PRs between tags. Categories (Added, Fixed, Docs, etc.) are configured in [.github/release.yml](../.github/release.yml).
+Use GitHub's **Generate release notes** to produce a draft from merged PRs between tags. Categories (Added, Fixed, Docs, etc.) are configured in [.github/release.yml](https://github.com/apache/fluss-rust/blob/main/.github/release.yml).
 
-1. Go to [Create a new release](https://github.com/apache/fluss-rust/releases/new).
+1. Go to the GitHub [Create a new release](https://github.com/apache/fluss-rust/releases/new) page.
 2. In **Choose a tag**, pick the release tag (e.g. `v0.1.0`).
 3. Click **Generate release notes**.
-4. Copy the generated content for **CHANGELOG.md** or the GitHub Release description. When publishing the release, add the official download link, checksums/verification, and install instructions (see [creating-a-release.md](creating-a-release.md)).
+4. Copy the generated content for **CHANGELOG.md** or the GitHub Release description. When publishing the release, add the official download link, checksums/verification, and install instructions (see [Creating a Fluss Rust Client Release](create-release.md)).
 
-See [creating-a-fluss-rust-release.md](creating-a-fluss-rust-release.md) and [GitHub: Automatically generated release notes](https://docs.github.com/en/repositories/releasing-projects-on-github/automatically-generated-release-notes).
+See [Creating a Fluss Rust Client Release](create-release.md) and [GitHub: Automatically generated release notes](https://docs.github.com/en/repositories/releasing-projects-on-github/automatically-generated-release-notes).
diff --git a/fluss-rust/website/docs/release/verifying-a-release-candidate.md b/fluss-rust/website/docs/release/verifying-a-release-candidate.md
index dc70f723bd..ebb4d97df5 100644
--- a/fluss-rust/website/docs/release/verifying-a-release-candidate.md
+++ b/fluss-rust/website/docs/release/verifying-a-release-candidate.md
@@ -86,7 +86,7 @@ Unzip the source release archive and verify that:
 3. All dependencies have been checked for their license and the license is ASL 2.0 compatible ([ASF third-party license policy](http://www.apache.org/legal/resolved.html#category-x)).
 4. Compatible non-ASL 2.0 licenses are documented (e.g. in NOTICE or in dependency audit files such as `DEPENDENCIES*.tsv`).
 
-The project uses [cargo-deny](https://embarkstudios.github.io/cargo-deny/) for license checks; see [Creating a Fluss Rust Client Release](creating-a-release.md) for how the dependency list is generated before a release.
+The project uses [cargo-deny](https://embarkstudios.github.io/cargo-deny/) for license checks; see [Creating a Fluss Rust Client Release](create-release.md) for how the dependency list is generated before a release.
 
 ## Testing features
 
@@ -94,9 +94,9 @@ For any user-facing feature included in a release, we aim to ensure it is functi
 
 **Per-language verification:** For **Rust** and **C++**, build from the source release and write your own test cases to verify. For **Python**, the RC is published to **TestPyPI**; install the client from TestPyPI and write your own test cases (e.g. connect, create table, read/write) to verify. Use the README in each component as the entry point:
 
-- **Rust client:** You can depend on the RC via its git tag (e.g. in your `Cargo.toml`: `fluss-rs = { git = "https://github.com/apache/fluss-rust", tag = "v${RELEASE_VERSION}-rc${RC_NUM}" }`) and build your own test project to verify. Alternatively, build from the source release; see [crates/fluss/README.md](../crates/fluss/README.md).
-- **Python bindings:** See [bindings/python/README.md](../bindings/python/README.md) for how to add the Python client (for an RC, install from **TestPyPI**: `pip install -i https://test.pypi.org/simple/ pyfluss==${RELEASE_VERSION}`); then write test cases to verify.
-- **C++ bindings:** See [bindings/cpp/README.md](../bindings/cpp/README.md) for how to build and link the C++ client; then write test cases to verify.
+- **Rust client:** You can depend on the RC via its git tag (e.g. in your `Cargo.toml`: `fluss-rs = { git = "https://github.com/apache/fluss-rust", tag = "v${RELEASE_VERSION}-rc${RC_NUM}" }`) and build your own test project to verify. Alternatively, build from the source release; see [Rust Installation Guide](../user-guide/rust/installation.md).
+- **Python bindings:** See [Python Installation Guide](../user-guide/python/installation.md) for how to add the Python client (for an RC, install from **TestPyPI**: `pip install -i https://test.pypi.org/simple/ pyfluss==${RELEASE_VERSION}`); then write test cases to verify.
+- **C++ bindings:** See [C++ Installation Guide](../user-guide/cpp/installation.md) for how to build and link the C++ client; then write test cases to verify.
 
 ## Incubator release checklist
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/_category_.json b/fluss-rust/website/docs/user-guide/cpp/example/_category_.json
index dd2229499b..4d81ec12ae 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/_category_.json
+++ b/fluss-rust/website/docs/user-guide/cpp/example/_category_.json
@@ -1,4 +1,4 @@
 {
-  "label": "Example",
+  "label": "Examples",
   "position": 5
 }
diff --git a/fluss-rust/website/docs/user-guide/python/example/_category_.json b/fluss-rust/website/docs/user-guide/python/example/_category_.json
index dd2229499b..4d81ec12ae 100644
--- a/fluss-rust/website/docs/user-guide/python/example/_category_.json
+++ b/fluss-rust/website/docs/user-guide/python/example/_category_.json
@@ -1,4 +1,4 @@
 {
-  "label": "Example",
+  "label": "Examples",
   "position": 5
 }
diff --git a/fluss-rust/website/docs/user-guide/rust/example/_category_.json b/fluss-rust/website/docs/user-guide/rust/example/_category_.json
index dd2229499b..4d81ec12ae 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/_category_.json
+++ b/fluss-rust/website/docs/user-guide/rust/example/_category_.json
@@ -1,4 +1,4 @@
 {
-  "label": "Example",
+  "label": "Examples",
   "position": 5
 }
diff --git a/fluss-rust/website/sidebars.ts b/fluss-rust/website/sidebars.ts
index f6fbeaca64..1aea14b4ac 100644
--- a/fluss-rust/website/sidebars.ts
+++ b/fluss-rust/website/sidebars.ts
@@ -5,18 +5,13 @@ const sidebars: SidebarsConfig = {
     'index',
     {
       type: 'category',
-      label: 'User Guide',
+      label: 'Clients',
       items: [
         {type: 'autogenerated', dirName: 'user-guide'},
+        {type: 'link', label: 'Java', href: 'https://fluss.apache.org/docs/0.9/apis/java-client/'},
       ],
     },
-    {
-      type: 'category',
-      label: 'Developer Guide',
-      items: [
-        'developer-guide/contributing',
-      ],
-    },
+    'developer-guide/contributing',
     {
       type: 'category',
       label: 'Release',

From f79a9bd47b11eab592f8b448304c0fc2e87ae87a Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Wed, 18 Feb 2026 02:11:18 +0000
Subject: [PATCH 159/287] chore: update docs after opaque types CPP rework
 (#349)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |   3 +-
 .../docs/user-guide/cpp/api-reference.md      | 179 ++++++++++++------
 .../website/docs/user-guide/cpp/data-types.md |  98 +++++++---
 .../cpp/example/partitioned-tables.md         |   7 +-
 .../cpp/example/primary-key-tables.md         |  11 +-
 5 files changed, 202 insertions(+), 96 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 00b5000eef..a1a6b1f61e 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -716,10 +716,9 @@ class ScanRecords {
     Iterator begin() const { return Iterator(this, 0); }
     Iterator end() const { return Iterator(this, Size()); }
 
+   private:
     /// Returns the column name-to-index map (lazy-built, cached).
     const std::shared_ptr<detail::ColumnMap>& GetColumnMap() const;
-
-   private:
     friend class LogScanner;
     void Destroy() noexcept;
     void BuildColumnMap() const;
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index 3b93916905..a20739b038 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -145,9 +145,9 @@ Complete API reference for the Fluss C++ client.
 
 ## `Lookuper`
 
-| Method                                                                     |  Description                |
-|----------------------------------------------------------------------------|-----------------------------|
-| `Lookup(const GenericRow& pk_row, bool& found, GenericRow& out) -> Result` | Lookup a row by primary key |
+| Method                                                        |  Description                |
+|---------------------------------------------------------------|-----------------------------|
+| `Lookup(const GenericRow& pk_row, LookupResult& out) -> Result` | Lookup a row by primary key |
 
 ## `LogScanner`
 
@@ -164,21 +164,7 @@ Complete API reference for the Fluss C++ client.
 
 ## `GenericRow`
 
-### Index-Based Getters
-
-| Method                                         |  Description                   |
-|------------------------------------------------|--------------------------------|
-| `GetBool(size_t idx) -> bool`                  | Get boolean value at index     |
-| `GetInt32(size_t idx) -> int32_t`              | Get 32-bit integer at index    |
-| `GetInt64(size_t idx) -> int64_t`              | Get 64-bit integer at index    |
-| `GetFloat32(size_t idx) -> float`              | Get 32-bit float at index      |
-| `GetFloat64(size_t idx) -> double`             | Get 64-bit float at index      |
-| `GetString(size_t idx) -> std::string`         | Get string at index            |
-| `GetBytes(size_t idx) -> std::vector<uint8_t>` | Get binary data at index       |
-| `GetDate(size_t idx) -> Date`                  | Get date at index              |
-| `GetTime(size_t idx) -> Time`                  | Get time at index              |
-| `GetTimestamp(size_t idx) -> Timestamp`        | Get timestamp at index         |
-| `DecimalToString(size_t idx) -> std::string`   | Get decimal as string at index |
+`GenericRow` is a **write-only** row used for append, upsert, delete, and lookup key construction. For reading field values from scan or lookup results, see [`RowView`](#rowview) and [`LookupResult`](#lookupresult).
 
 ### Index-Based Setters
 
@@ -215,34 +201,121 @@ When using `table.NewRow()`, the `Set()` method auto-routes to the correct type
 | `Set(const std::string& name, const Time& value)`        | Set time by column name           |
 | `Set(const std::string& name, const Timestamp& value)`   | Set timestamp by column name      |
 
-### Row Inspection
+## `RowView`
+
+Read-only row view for scan results. Provides zero-copy access to string and bytes data.
+
+:::warning Lifetime
+`RowView` borrows from `ScanRecords`. It must not outlive the `ScanRecords` that produced it (similar to `std::string_view` borrowing from `std::string`).
+:::
 
-| Method                             |  Description                     |
-|------------------------------------|----------------------------------|
-| `FieldCount() -> size_t`           | Get the number of fields         |
-| `GetType(size_t idx) -> DatumType` | Get the datum type at index      |
-| `IsNull(size_t idx) -> bool`       | Check if field is null           |
-| `IsDecimal(size_t idx) -> bool`    | Check if field is a decimal type |
+### Index-Based Getters
+
+| Method                                                     |  Description                   |
+|------------------------------------------------------------|--------------------------------|
+| `FieldCount() -> size_t`                                   | Get the number of fields       |
+| `GetType(size_t idx) -> TypeId`                            | Get the type at index          |
+| `IsNull(size_t idx) -> bool`                               | Check if field is null         |
+| `GetBool(size_t idx) -> bool`                              | Get boolean value at index     |
+| `GetInt32(size_t idx) -> int32_t`                          | Get 32-bit integer at index    |
+| `GetInt64(size_t idx) -> int64_t`                          | Get 64-bit integer at index    |
+| `GetFloat32(size_t idx) -> float`                          | Get 32-bit float at index      |
+| `GetFloat64(size_t idx) -> double`                         | Get 64-bit float at index      |
+| `GetString(size_t idx) -> std::string_view`                | Get string at index (zero-copy)|
+| `GetBytes(size_t idx) -> std::pair<const uint8_t*, size_t>`| Get binary data at index (zero-copy)|
+| `GetDate(size_t idx) -> Date`                              | Get date at index              |
+| `GetTime(size_t idx) -> Time`                              | Get time at index              |
+| `GetTimestamp(size_t idx) -> Timestamp`                    | Get timestamp at index         |
+| `IsDecimal(size_t idx) -> bool`                            | Check if field is a decimal type|
+| `GetDecimalString(size_t idx) -> std::string`              | Get decimal as string at index |
+
+### Name-Based Getters
+
+| Method                                                  |  Description                       |
+|---------------------------------------------------------|------------------------------------|
+| `IsNull(const std::string& name) -> bool`               | Check if field is null by name     |
+| `GetBool(const std::string& name) -> bool`              | Get boolean by column name         |
+| `GetInt32(const std::string& name) -> int32_t`          | Get 32-bit integer by column name  |
+| `GetInt64(const std::string& name) -> int64_t`          | Get 64-bit integer by column name  |
+| `GetFloat32(const std::string& name) -> float`          | Get 32-bit float by column name    |
+| `GetFloat64(const std::string& name) -> double`         | Get 64-bit float by column name    |
+| `GetString(const std::string& name) -> std::string_view`| Get string by column name          |
+| `GetBytes(const std::string& name) -> std::pair<const uint8_t*, size_t>` | Get binary data by column name |
+| `GetDate(const std::string& name) -> Date`              | Get date by column name            |
+| `GetTime(const std::string& name) -> Time`              | Get time by column name            |
+| `GetTimestamp(const std::string& name) -> Timestamp`    | Get timestamp by column name       |
+| `GetDecimalString(const std::string& name) -> std::string` | Get decimal as string by column name |
 
 ## `ScanRecord`
 
-| Field          | Type                     | Description                                                         |
-|----------------|--------------------------|---------------------------------------------------------------------|
-| `bucket_id`    | `int32_t`                | Bucket this record belongs to                                       |
-| `partition_id` | `std::optional<int64_t>` | Partition ID (present only for partitioned tables)                  |
-| `offset`       | `int64_t`                | Record offset in the log                                            |
-| `timestamp`    | `int64_t`                | Record timestamp                                                    |
-| `change_type`  | `ChangeType`             | Change type (AppendOnly, Insert, UpdateBefore, UpdateAfter, Delete) |
-| `row`          | `RowView`                | Row data                                                            |
+:::warning Lifetime
+`ScanRecord` contains a `RowView` that borrows from `ScanRecords`. It must not outlive the `ScanRecords` that produced it.
+:::
+
+| Field          | Type                    |  Description                     |
+|----------------|-------------------------|----------------------------------|
+| `bucket_id`    | `int32_t`               | Bucket this record belongs to    |
+| `partition_id` | `std::optional<int64_t>`| Partition ID (if partitioned)    |
+| `offset`       | `int64_t`               | Record offset in the log         |
+| `timestamp`    | `int64_t`               | Record timestamp                 |
+| `change_type`  | `ChangeType`            | Type of change (see `ChangeType`)|
+| `row`          | `RowView`               | Read-only row view for field access |
 
 ## `ScanRecords`
 
-| Method                                        |  Description                               |
-|-----------------------------------------------|--------------------------------------------|
-| `Size() -> size_t`                            | Number of records                          |
-| `Empty() -> bool`                             | Check if empty                             |
-| `operator[](size_t idx) -> const ScanRecord&` | Access record by index                     |
-| `begin() / end()`                             | Iterator support for range-based for loops |
+| Method                                 |  Description                               |
+|----------------------------------------|--------------------------------------------|
+| `Size() -> size_t`                     | Number of records                          |
+| `Empty() -> bool`                      | Check if empty                             |
+| `operator[](size_t idx) -> ScanRecord` | Access record by index                     |
+| `begin() / end()`                      | Iterator support for range-based for loops |
+
+## `LookupResult`
+
+Read-only result for lookup operations. Provides zero-copy access to field values.
+
+### Metadata
+
+| Method                      |  Description                   |
+|-----------------------------|--------------------------------|
+| `Found() -> bool`           | Whether a matching row was found |
+| `FieldCount() -> size_t`    | Get the number of fields       |
+
+### Index-Based Getters
+
+| Method                                                     |  Description                   |
+|------------------------------------------------------------|--------------------------------|
+| `GetType(size_t idx) -> TypeId`                            | Get the type at index          |
+| `IsNull(size_t idx) -> bool`                               | Check if field is null         |
+| `GetBool(size_t idx) -> bool`                              | Get boolean value at index     |
+| `GetInt32(size_t idx) -> int32_t`                          | Get 32-bit integer at index    |
+| `GetInt64(size_t idx) -> int64_t`                          | Get 64-bit integer at index    |
+| `GetFloat32(size_t idx) -> float`                          | Get 32-bit float at index      |
+| `GetFloat64(size_t idx) -> double`                         | Get 64-bit float at index      |
+| `GetString(size_t idx) -> std::string_view`                | Get string at index (zero-copy)|
+| `GetBytes(size_t idx) -> std::pair<const uint8_t*, size_t>`| Get binary data at index (zero-copy)|
+| `GetDate(size_t idx) -> Date`                              | Get date at index              |
+| `GetTime(size_t idx) -> Time`                              | Get time at index              |
+| `GetTimestamp(size_t idx) -> Timestamp`                    | Get timestamp at index         |
+| `IsDecimal(size_t idx) -> bool`                            | Check if field is a decimal type|
+| `GetDecimalString(size_t idx) -> std::string`              | Get decimal as string at index |
+
+### Name-Based Getters
+
+| Method                                                  |  Description                       |
+|---------------------------------------------------------|------------------------------------|
+| `IsNull(const std::string& name) -> bool`               | Check if field is null by name     |
+| `GetBool(const std::string& name) -> bool`              | Get boolean by column name         |
+| `GetInt32(const std::string& name) -> int32_t`          | Get 32-bit integer by column name  |
+| `GetInt64(const std::string& name) -> int64_t`          | Get 64-bit integer by column name  |
+| `GetFloat32(const std::string& name) -> float`          | Get 32-bit float by column name    |
+| `GetFloat64(const std::string& name) -> double`         | Get 64-bit float by column name    |
+| `GetString(const std::string& name) -> std::string_view`| Get string by column name          |
+| `GetBytes(const std::string& name) -> std::pair<const uint8_t*, size_t>` | Get binary data by column name |
+| `GetDate(const std::string& name) -> Date`              | Get date by column name            |
+| `GetTime(const std::string& name) -> Time`              | Get time by column name            |
+| `GetTimestamp(const std::string& name) -> Timestamp`    | Get timestamp by column name       |
+| `GetDecimalString(const std::string& name) -> std::string` | Get decimal as string by column name |
 
 ## `ArrowRecordBatch`
 
@@ -496,25 +569,15 @@ inline const char* ChangeTypeShortString(ChangeType ct) {
 | `TimestampLtz` | Timestamp with timezone    |
 | `Decimal`      | Decimal                    |
 
-### `DatumType`
-
-| Value           | C++ Type               |  Description                    |
-|-----------------|------------------------|---------------------------------|
-| `Null`          | --                     | Null value                      |
-| `Bool`          | `bool`                 | Boolean                         |
-| `Int32`         | `int32_t`              | 32-bit integer                  |
-| `Int64`         | `int64_t`              | 64-bit integer                  |
-| `Float32`       | `float`                | 32-bit float                    |
-| `Float64`       | `double`               | 64-bit float                    |
-| `String`        | `std::string`          | String                          |
-| `Bytes`         | `std::vector<uint8_t>` | Binary data                     |
-| `DecimalI64`    | `int64_t`              | Decimal (64-bit internal)       |
-| `DecimalI128`   | `__int128`             | Decimal (128-bit internal)      |
-| `DecimalString` | `std::string`          | Decimal (string representation) |
-| `Date`          | `Date`                 | Date                            |
-| `Time`          | `Time`                 | Time                            |
-| `TimestampNtz`  | `Timestamp`            | Timestamp without timezone      |
-| `TimestampLtz`  | `Timestamp`            | Timestamp with timezone         |
+### `ChangeType`
+
+| Value          |  Description                                |
+|----------------|---------------------------------------------|
+| `AppendOnly`   | Append-only record (log tables)             |
+| `Insert`       | Inserted row (PK tables)                    |
+| `UpdateBefore` | Row value before an update (PK tables)      |
+| `UpdateAfter`  | Row value after an update (PK tables)       |
+| `Delete`       | Deleted row (PK tables)                     |
 
 ### `OffsetSpec`
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/data-types.md b/fluss-rust/website/docs/user-guide/cpp/data-types.md
index fb01ac2845..18121d3aa9 100644
--- a/fluss-rust/website/docs/user-guide/cpp/data-types.md
+++ b/fluss-rust/website/docs/user-guide/cpp/data-types.md
@@ -24,6 +24,8 @@ sidebar_position: 3
 
 ## GenericRow Setters
 
+`SetInt32` is used for `TinyInt`, `SmallInt`, and `Int` columns. For `TinyInt` and `SmallInt`, the value is validated at write time — an error is returned if it overflows the column's range (e.g., \[-128, 127\] for `TinyInt`, \[-32768, 32767\] for `SmallInt`).
+
 ```cpp
 fluss::GenericRow row;
 row.SetNull(0);
@@ -52,46 +54,90 @@ row.Set("created_at", fluss::Timestamp::FromMillis(1700000000000));
 row.Set("nickname", nullptr);    // set to null
 ```
 
-## GenericRow Getters
+## Reading Field Values
+
+Field values are read through `RowView` (from scan results) and `LookupResult` (from lookups), not through `GenericRow`. Both provide the same getter interface with zero-copy access to string and bytes data.
+
+:::warning Lifetime
+`RowView` borrows from `ScanRecords`. It must not outlive the `ScanRecords` that produced it (similar to `std::string_view` borrowing from `std::string`).
+:::
 
 ```cpp
-std::string name = result_row.GetString(1);
-float score = result_row.GetFloat32(3);
-std::string balance = result_row.DecimalToString(4);
-fluss::Date date = result_row.GetDate(5);
-fluss::Time time = result_row.GetTime(6);
-fluss::Timestamp ts = result_row.GetTimestamp(7);
+// DON'T — string_view dangles after ScanRecords is destroyed:
+std::string_view dangling;
+{
+    fluss::ScanRecords records;
+    scanner.Poll(5000, records);
+    dangling = records[0].row.GetString(0); // points into ScanRecords memory
+}
+// dangling is undefined behavior here — ScanRecords is gone!
+
+// DO — use values within ScanRecords lifetime, or copy when you need ownership:
+fluss::ScanRecords records;
+scanner.Poll(5000, records);
+for (const auto& rec : records) {
+    auto name = rec.row.GetString(0);              // zero-copy string_view
+    auto owned = std::string(rec.row.GetString(0)); // explicit copy when needed
+    process(owned);
+}
+```
+
+### From Scan Results (RowView)
+
+```cpp
+for (const auto& rec : records) {
+    auto name = rec.row.GetString(1);          // zero-copy string_view
+    float score = rec.row.GetFloat32(3);
+    auto balance = rec.row.GetDecimalString(4); // std::string (already owned)
+    fluss::Date date = rec.row.GetDate(5);
+    fluss::Time time = rec.row.GetTime(6);
+    fluss::Timestamp ts = rec.row.GetTimestamp(7);
+}
+```
+
+### From Lookup Results (LookupResult)
+
+```cpp
+fluss::LookupResult result;
+lookuper.Lookup(pk_row, result);
+if (result.Found()) {
+    auto name = result.GetString(1);  // zero-copy string_view
+    int64_t age = result.GetInt64(2);
+}
 ```
 
-## DatumType Enum
-
-| DatumType       | C++ Type               | Getter                 |
-|-----------------|------------------------|------------------------|
-| `Null`          | --                     | `IsNull(idx)`          |
-| `Bool`          | `bool`                 | `GetBool(idx)`         |
-| `Int32`         | `int32_t`              | `GetInt32(idx)`        |
-| `Int64`         | `int64_t`              | `GetInt64(idx)`        |
-| `Float32`       | `float`                | `GetFloat32(idx)`      |
-| `Float64`       | `double`               | `GetFloat64(idx)`      |
-| `String`        | `std::string`          | `GetString(idx)`       |
-| `Bytes`         | `std::vector<uint8_t>` | `GetBytes(idx)`        |
-| `Date`          | `Date`                 | `GetDate(idx)`         |
-| `Time`          | `Time`                 | `GetTime(idx)`         |
-| `TimestampNtz`  | `Timestamp`            | `GetTimestamp(idx)`    |
-| `TimestampLtz`  | `Timestamp`            | `GetTimestamp(idx)`    |
-| `DecimalString` | `std::string`          | `DecimalToString(idx)` |
+## TypeId Enum
+
+`TinyInt` and `SmallInt` values are widened to `int32_t` on read.
+
+| TypeId          | C++ Type                                    | Getter                    |
+|-----------------|---------------------------------------------|---------------------------|
+| `Boolean`       | `bool`                                      | `GetBool(idx)`            |
+| `TinyInt`       | `int32_t`                                   | `GetInt32(idx)`           |
+| `SmallInt`      | `int32_t`                                   | `GetInt32(idx)`           |
+| `Int`           | `int32_t`                                   | `GetInt32(idx)`           |
+| `BigInt`        | `int64_t`                                   | `GetInt64(idx)`           |
+| `Float`         | `float`                                     | `GetFloat32(idx)`         |
+| `Double`        | `double`                                    | `GetFloat64(idx)`         |
+| `String`        | `std::string_view`                          | `GetString(idx)`          |
+| `Bytes`         | `std::pair<const uint8_t*, size_t>`         | `GetBytes(idx)`           |
+| `Date`          | `Date`                                      | `GetDate(idx)`            |
+| `Time`          | `Time`                                      | `GetTime(idx)`            |
+| `Timestamp`     | `Timestamp`                                 | `GetTimestamp(idx)`       |
+| `TimestampLtz`  | `Timestamp`                                 | `GetTimestamp(idx)`       |
+| `Decimal`       | `std::string`                               | `GetDecimalString(idx)`   |
 
 ## Type Checking
 
 ```cpp
-if (rec.row.GetType(0) == fluss::DatumType::Int32) {
+if (rec.row.GetType(0) == fluss::TypeId::Int) {
     int32_t value = rec.row.GetInt32(0);
 }
 if (rec.row.IsNull(1)) {
     // field is null
 }
 if (rec.row.IsDecimal(2)) {
-    std::string decimal_str = rec.row.DecimalToString(2);
+    std::string decimal_str = rec.row.GetDecimalString(2);
 }
 ```
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md b/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md
index 371ee3e020..17c1c2057d 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/partitioned-tables.md
@@ -171,10 +171,9 @@ pk.Set("user_id", 1001);
 pk.Set("region", "APAC");
 pk.Set("zone", static_cast<int64_t>(1));
 
-bool found = false;
-fluss::GenericRow result;
-lookuper.Lookup(pk, found, result);
-if (found) {
+fluss::LookupResult result;
+lookuper.Lookup(pk, result);
+if (result.Found()) {
     std::cout << "score=" << result.GetInt64(3) << std::endl;
 }
 ```
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/primary-key-tables.md b/fluss-rust/website/docs/user-guide/cpp/example/primary-key-tables.md
index 7aa87e31a7..f26b5477a7 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/primary-key-tables.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/primary-key-tables.md
@@ -120,13 +120,12 @@ table.NewLookup().CreateLookuper(lookuper);
 auto pk_row = table.NewRow();
 pk_row.Set("id", 1);
 
-bool found = false;
-fluss::GenericRow result_row;
-lookuper.Lookup(pk_row, found, result_row);
+fluss::LookupResult result;
+lookuper.Lookup(pk_row, result);
 
-if (found) {
-    std::cout << "Found: name=" << result_row.GetString(1)
-              << ", age=" << result_row.GetInt64(2) << std::endl;
+if (result.Found()) {
+    std::cout << "Found: name=" << result.GetString(1)
+              << ", age=" << result.GetInt64(2) << std::endl;
 } else {
     std::cout << "Not found" << std::endl;
 }

From cb4a9b30684cc826ceed2a1f599abde802255940 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Thu, 19 Feb 2026 09:01:59 +0000
Subject: [PATCH 160/287] chore: make RowView shared_ptr (#353)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     | 29 ++++++++-------
 fluss-rust/bindings/cpp/src/table.cpp         | 35 ++++---------------
 .../docs/user-guide/cpp/api-reference.md      | 10 +++---
 .../website/docs/user-guide/cpp/data-types.md | 29 ++++++++-------
 .../docs/user-guide/cpp/example/log-tables.md | 28 +++++++++++++++
 5 files changed, 68 insertions(+), 63 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index a1a6b1f61e..27d1fcb9c1 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -617,15 +617,15 @@ class GenericRow {
 
 /// Read-only row view for scan results. Zero-copy access to string and bytes data.
 ///
-/// WARNING: RowView borrows from ScanRecords. It must not outlive the ScanRecords
-/// that produced it (similar to std::string_view borrowing from std::string).
+/// RowView shares ownership of the underlying scan data via reference counting,
+/// so it can safely outlive the ScanRecords that produced it.
 class RowView : public detail::NamedGetters<RowView> {
     friend struct detail::NamedGetters<RowView>;
 
    public:
-    RowView(const ffi::ScanResultInner* inner, size_t record_idx,
-            const detail::ColumnMap* column_map)
-        : inner_(inner), record_idx_(record_idx), column_map_(column_map) {}
+    RowView(std::shared_ptr<const ffi::ScanResultInner> inner, size_t record_idx,
+            std::shared_ptr<const detail::ColumnMap> column_map)
+        : inner_(std::move(inner)), record_idx_(record_idx), column_map_(std::move(column_map)) {}
 
     // ── Index-based getters ──────────────────────────────────────────
     size_t FieldCount() const;
@@ -665,15 +665,15 @@ class RowView : public detail::NamedGetters<RowView> {
         }
         return detail::ResolveColumn(*column_map_, name);
     }
-    const ffi::ScanResultInner* inner_;
+    std::shared_ptr<const ffi::ScanResultInner> inner_;
     size_t record_idx_;
-    const detail::ColumnMap* column_map_;  // borrowed from ScanRecords (same lifetime as inner_)
+    std::shared_ptr<const detail::ColumnMap> column_map_;
 };
 
 /// A single scan record. Contains metadata and a RowView for field access.
 ///
-/// WARNING: ScanRecord contains a RowView that borrows from ScanRecords.
-/// It must not outlive the ScanRecords that produced it.
+/// ScanRecord is a value type that can be freely copied, stored, and
+/// accumulated across multiple Poll() calls.
 struct ScanRecord {
     int32_t bucket_id;
     std::optional<int64_t> partition_id;
@@ -685,13 +685,13 @@ struct ScanRecord {
 
 class ScanRecords {
    public:
-    ScanRecords() noexcept;
-    ~ScanRecords() noexcept;
+    ScanRecords() noexcept = default;
+    ~ScanRecords() noexcept = default;
 
     ScanRecords(const ScanRecords&) = delete;
     ScanRecords& operator=(const ScanRecords&) = delete;
-    ScanRecords(ScanRecords&& other) noexcept;
-    ScanRecords& operator=(ScanRecords&& other) noexcept;
+    ScanRecords(ScanRecords&&) noexcept = default;
+    ScanRecords& operator=(ScanRecords&&) noexcept = default;
 
     size_t Size() const;
     bool Empty() const;
@@ -720,9 +720,8 @@ class ScanRecords {
     /// Returns the column name-to-index map (lazy-built, cached).
     const std::shared_ptr<detail::ColumnMap>& GetColumnMap() const;
     friend class LogScanner;
-    void Destroy() noexcept;
     void BuildColumnMap() const;
-    ffi::ScanResultInner* inner_{nullptr};
+    std::shared_ptr<ffi::ScanResultInner> inner_;
     mutable std::shared_ptr<detail::ColumnMap> column_map_;
 };
 
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index 76f1806d90..a697cea078 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -266,32 +266,7 @@ std::string RowView::GetDecimalString(size_t idx) const {
 // ScanRecords — backed by opaque Rust ScanResultInner
 // ============================================================================
 
-ScanRecords::ScanRecords() noexcept = default;
-
-ScanRecords::~ScanRecords() noexcept { Destroy(); }
-
-void ScanRecords::Destroy() noexcept {
-    if (inner_) {
-        rust::Box<ffi::ScanResultInner>::from_raw(inner_);
-        inner_ = nullptr;
-        column_map_.reset();
-    }
-}
-
-ScanRecords::ScanRecords(ScanRecords&& other) noexcept
-    : inner_(other.inner_), column_map_(std::move(other.column_map_)) {
-    other.inner_ = nullptr;
-}
-
-ScanRecords& ScanRecords::operator=(ScanRecords&& other) noexcept {
-    if (this != &other) {
-        Destroy();
-        inner_ = other.inner_;
-        column_map_ = std::move(other.column_map_);
-        other.inner_ = nullptr;
-    }
-    return *this;
-}
+// ScanRecords' constructor, destructor, and move operations are all defaulted in the header.
 
 size_t ScanRecords::Size() const { return inner_ ? inner_->sv_record_count() : 0; }
 
@@ -331,7 +306,7 @@ ScanRecord ScanRecords::operator[](size_t idx) const {
                       inner_->sv_offset(idx),
                       inner_->sv_timestamp(idx),
                       static_cast<ChangeType>(inner_->sv_change_type(idx)),
-                      RowView(inner_, idx, GetColumnMap().get())};
+                      RowView(inner_, idx, GetColumnMap())};
 }
 
 ScanRecord ScanRecords::Iterator::operator*() const { return owner_->operator[](idx_); }
@@ -1107,8 +1082,10 @@ Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
                                  std::string(result_box->sv_error_message()));
     }
 
-    out.Destroy();
-    out.inner_ = result_box.into_raw();
+    out.column_map_.reset();
+    out.inner_ = std::shared_ptr<ffi::ScanResultInner>(
+        result_box.into_raw(),
+        [](ffi::ScanResultInner* p) { rust::Box<ffi::ScanResultInner>::from_raw(p); });
     return utils::make_ok();
 }
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index a20739b038..a07dd6c6e0 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -203,10 +203,10 @@ When using `table.NewRow()`, the `Set()` method auto-routes to the correct type
 
 ## `RowView`
 
-Read-only row view for scan results. Provides zero-copy access to string and bytes data.
+Read-only row view for scan results. Provides zero-copy access to string and bytes data. `RowView` shares ownership of the underlying scan data via reference counting, so it can safely outlive the `ScanRecords` that produced it.
 
-:::warning Lifetime
-`RowView` borrows from `ScanRecords`. It must not outlive the `ScanRecords` that produced it (similar to `std::string_view` borrowing from `std::string`).
+:::note string_view Lifetime
+`GetString()` returns a `std::string_view` that borrows from the underlying scan data (`GetBytes()` likewise returns a non-owning pointer/size pair). These views are valid as long as the `ScanRecords`, or any `RowView` / `ScanRecord`, still referencing the same poll result is alive. Copy to `std::string` if you need the value after all references are gone.
 :::
 
 ### Index-Based Getters
@@ -248,9 +248,7 @@ Read-only row view for scan results. Provides zero-copy access to string and byt
 
 ## `ScanRecord`
 
-:::warning Lifetime
-`ScanRecord` contains a `RowView` that borrows from `ScanRecords`. It must not outlive the `ScanRecords` that produced it.
-:::
+`ScanRecord` is a value type that can be freely copied, stored, and accumulated across multiple `Poll()` calls. It shares ownership of the underlying scan data via reference counting.
 
 | Field          | Type                    |  Description                     |
 |----------------|-------------------------|----------------------------------|
diff --git a/fluss-rust/website/docs/user-guide/cpp/data-types.md b/fluss-rust/website/docs/user-guide/cpp/data-types.md
index 18121d3aa9..bfb296f2b9 100644
--- a/fluss-rust/website/docs/user-guide/cpp/data-types.md
+++ b/fluss-rust/website/docs/user-guide/cpp/data-types.md
@@ -58,28 +58,31 @@ row.Set("nickname", nullptr);    // set to null
 
 Field values are read through `RowView` (from scan results) and `LookupResult` (from lookups), not through `GenericRow`. Both provide the same getter interface with zero-copy access to string and bytes data.
 
-:::warning Lifetime
-`RowView` borrows from `ScanRecords`. It must not outlive the `ScanRecords` that produced it (similar to `std::string_view` borrowing from `std::string`).
+`ScanRecord` is a value type — it can be freely copied, stored, and accumulated across multiple `Poll()` calls. Each copy shares ownership of the underlying scan data via reference counting.
+
+:::note string_view Lifetime
+`GetString()` returns a `std::string_view` that borrows from the underlying data. The `string_view` is valid as long as the `ScanRecords`, or any `ScanRecord`, still referencing the same poll result is alive. Copy to `std::string` if you need the value after all of them are gone.
 :::
 
 ```cpp
-// DON'T — string_view dangles after ScanRecords is destroyed:
-std::string_view dangling;
-{
-    fluss::ScanRecords records;
-    scanner.Poll(5000, records);
-    dangling = records[0].row.GetString(0); // points into ScanRecords memory
-}
-// dangling is undefined behavior here — ScanRecords is gone!
-
-// DO — use values within ScanRecords lifetime, or copy when you need ownership:
+// ScanRecord is a value type — safe to store and accumulate:
+std::vector<fluss::ScanRecord> all_records;
 fluss::ScanRecords records;
 scanner.Poll(5000, records);
 for (const auto& rec : records) {
+    all_records.push_back(rec);                    // safe! ref-counted
     auto name = rec.row.GetString(0);              // zero-copy string_view
     auto owned = std::string(rec.row.GetString(0)); // explicit copy when needed
-    process(owned);
 }
+
+// DON'T — string_view dangles after all records referencing the data are destroyed:
+std::string_view dangling;
+{
+    fluss::ScanRecords records;
+    scanner.Poll(5000, records);
+    dangling = records[0].row.GetString(0);
+}
+// reading `dangling` is undefined behavior here — neither ScanRecords nor any ScanRecord keeps the data alive!
 ```
 
 ### From Scan Results (RowView)
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md b/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md
index c94bb84572..3a862c18e4 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md
@@ -62,6 +62,34 @@ for (const auto& rec : records) {
 }
 ```
 
+**Continuous polling:**
+
+```cpp
+while (running) {
+    fluss::ScanRecords records;
+    scanner.Poll(1000, records);
+    for (const auto& rec : records) {
+        process(rec);
+    }
+}
+```
+
+**Accumulating records across polls:**
+
+`ScanRecord` is a value type — it can be freely copied, stored, and accumulated. The underlying data stays alive via reference counting (zero-copy).
+
+```cpp
+std::vector<fluss::ScanRecord> all_records;
+while (all_records.size() < 1000) {
+    fluss::ScanRecords records;
+    scanner.Poll(1000, records);
+    for (const auto& rec : records) {
+        all_records.push_back(rec);  // ref-counted, no data copy
+    }
+}
+// all_records is valid — each record keeps its data alive
+```
+
 **Batch subscribe:**
 
 ```cpp

From eeb5200a78f21742fd489dd87916d4e5bea0da60 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Fri, 20 Feb 2026 16:02:40 +0000
Subject: [PATCH 161/287] chore: Scan results returned per bucket python/cpp
 (#351)

---
 fluss-rust/bindings/cpp/examples/example.cpp  | 300 +++++++-------
 fluss-rust/bindings/cpp/include/fluss.hpp     | 139 +++++--
 fluss-rust/bindings/cpp/src/lib.rs            | 254 ++++++++----
 fluss-rust/bindings/cpp/src/table.cpp         | 190 ++++++---
 fluss-rust/bindings/python/Cargo.toml         |   1 +
 fluss-rust/bindings/python/example/example.py |  31 +-
 fluss-rust/bindings/python/fluss/__init__.pyi |  62 ++-
 fluss-rust/bindings/python/src/lib.rs         |   1 +
 fluss-rust/bindings/python/src/table.rs       | 374 ++++++++++++++----
 .../bindings/python/test/test_log_table.py    |  83 +++-
 .../docs/user-guide/cpp/api-reference.md      |  65 ++-
 .../docs/user-guide/cpp/example/log-tables.md |  12 +
 .../docs/user-guide/python/api-reference.md   |  56 ++-
 .../user-guide/python/example/log-tables.md   |  11 +-
 .../user-guide/rust/example/log-tables.md     |  15 +
 15 files changed, 1167 insertions(+), 427 deletions(-)

diff --git a/fluss-rust/bindings/cpp/examples/example.cpp b/fluss-rust/bindings/cpp/examples/example.cpp
index ea966d8e6b..d86ee5cda7 100644
--- a/fluss-rust/bindings/cpp/examples/example.cpp
+++ b/fluss-rust/bindings/cpp/examples/example.cpp
@@ -168,58 +168,75 @@ int main() {
     fluss::ScanRecords records;
     check("poll", scanner.Poll(5000, records));
 
-    std::cout << "Scanned records: " << records.Size() << std::endl;
+    // Flat iteration over all records (regardless of bucket)
+    std::cout << "Scanned records: " << records.Count() << " across " << records.BucketCount()
+              << " buckets" << std::endl;
+    for (const auto& rec : records) {
+        std::cout << "  offset=" << rec.offset << " timestamp=" << rec.timestamp << std::endl;
+    }
+
+    // Per-bucket access (with type verification)
     bool scan_ok = true;
     bool found_null_row = false;
-    for (const auto& rec : records) {
-        // Check if this is the all-null row (matches Rust: is_null_at for every column)
-        if (rec.row.IsNull(0)) {
-            found_null_row = true;
-            for (size_t i = 0; i < rec.row.FieldCount(); ++i) {
-                if (!rec.row.IsNull(i)) {
-                    std::cerr << "ERROR: column " << i << " should be null" << std::endl;
-                    scan_ok = false;
+    for (const auto& tb : records.Buckets()) {
+        auto view = records.Records(tb);
+        std::cout << "  Bucket " << tb.bucket_id;
+        if (tb.partition_id.has_value()) {
+            std::cout << " (partition=" << *tb.partition_id << ")";
+        }
+        std::cout << ": " << view.Size() << " records" << std::endl;
+        for (const auto& rec : view) {
+            // Check if this is the all-null row
+            if (rec.row.IsNull(0)) {
+                found_null_row = true;
+                for (size_t i = 0; i < rec.row.FieldCount(); ++i) {
+                    if (!rec.row.IsNull(i)) {
+                        std::cerr << "ERROR: column " << i << " should be null" << std::endl;
+                        scan_ok = false;
+                    }
                 }
+                std::cout << "    [null row] all " << rec.row.FieldCount() << " fields are null"
+                          << std::endl;
+                continue;
             }
-            std::cout << "  [null row] all " << rec.row.FieldCount() << " fields are null"
-                      << std::endl;
-            continue;
-        }
-
-        // Non-null rows: verify types
-        if (rec.row.GetType(4) != fluss::TypeId::Date) {
-            std::cerr << "ERROR: field 4 expected Date, got "
-                      << static_cast<int>(rec.row.GetType(4)) << std::endl;
-            scan_ok = false;
-        }
-        if (rec.row.GetType(5) != fluss::TypeId::Time) {
-            std::cerr << "ERROR: field 5 expected Time, got "
-                      << static_cast<int>(rec.row.GetType(5)) << std::endl;
-            scan_ok = false;
-        }
-        if (rec.row.GetType(6) != fluss::TypeId::Timestamp) {
-            std::cerr << "ERROR: field 6 expected Timestamp, got "
-                      << static_cast<int>(rec.row.GetType(6)) << std::endl;
-            scan_ok = false;
-        }
-        if (rec.row.GetType(7) != fluss::TypeId::TimestampLtz) {
-            std::cerr << "ERROR: field 7 expected TimestampLtz, got "
-                      << static_cast<int>(rec.row.GetType(7)) << std::endl;
-            scan_ok = false;
-        }
 
-        // Name-based getters (equivalent to index-based above)
-        auto date = rec.row.GetDate("event_date");
-        auto time = rec.row.GetTime("event_time");
-        auto ts_ntz = rec.row.GetTimestamp("created_at");
-        auto ts_ltz = rec.row.GetTimestamp("updated_at");
+            // Non-null rows: verify types
+            if (rec.row.GetType(4) != fluss::TypeId::Date) {
+                std::cerr << "ERROR: field 4 expected Date, got "
+                          << static_cast<int>(rec.row.GetType(4)) << std::endl;
+                scan_ok = false;
+            }
+            if (rec.row.GetType(5) != fluss::TypeId::Time) {
+                std::cerr << "ERROR: field 5 expected Time, got "
+                          << static_cast<int>(rec.row.GetType(5)) << std::endl;
+                scan_ok = false;
+            }
+            if (rec.row.GetType(6) != fluss::TypeId::Timestamp) {
+                std::cerr << "ERROR: field 6 expected Timestamp, got "
+                          << static_cast<int>(rec.row.GetType(6)) << std::endl;
+                scan_ok = false;
+            }
+            if (rec.row.GetType(7) != fluss::TypeId::TimestampLtz) {
+                std::cerr << "ERROR: field 7 expected TimestampLtz, got "
+                          << static_cast<int>(rec.row.GetType(7)) << std::endl;
+                scan_ok = false;
+            }
 
-        std::cout << "  id=" << rec.row.GetInt32("id") << " name=" << rec.row.GetString("name")
-                  << " score=" << rec.row.GetFloat32("score") << " age=" << rec.row.GetInt32("age")
-                  << " date=" << date.Year() << "-" << date.Month() << "-" << date.Day()
-                  << " time=" << time.Hour() << ":" << time.Minute() << ":" << time.Second()
-                  << " ts_ntz=" << ts_ntz.epoch_millis << " ts_ltz=" << ts_ltz.epoch_millis << "+"
-                  << ts_ltz.nano_of_millisecond << "ns" << std::endl;
+            // Name-based getters
+            auto date = rec.row.GetDate("event_date");
+            auto time = rec.row.GetTime("event_time");
+            auto ts_ntz = rec.row.GetTimestamp("created_at");
+            auto ts_ltz = rec.row.GetTimestamp("updated_at");
+
+            std::cout << "    id=" << rec.row.GetInt32("id")
+                      << " name=" << rec.row.GetString("name")
+                      << " score=" << rec.row.GetFloat32("score")
+                      << " age=" << rec.row.GetInt32("age") << " date=" << date.Year() << "-"
+                      << date.Month() << "-" << date.Day() << " time=" << time.Hour() << ":"
+                      << time.Minute() << ":" << time.Second() << " ts_ntz=" << ts_ntz.epoch_millis
+                      << " ts_ltz=" << ts_ltz.epoch_millis << "+" << ts_ltz.nano_of_millisecond
+                      << "ns" << std::endl;
+        }
     }
 
     if (!found_null_row) {
@@ -246,32 +263,34 @@ int main() {
     fluss::ScanRecords projected_records;
     check("poll_projected", projected_scanner.Poll(5000, projected_records));
 
-    std::cout << "Projected records: " << projected_records.Size() << std::endl;
-    for (const auto& rec : projected_records) {
-        if (rec.row.FieldCount() != 2) {
-            std::cerr << "ERROR: expected 2 fields, got " << rec.row.FieldCount() << std::endl;
-            scan_ok = false;
-            continue;
-        }
-        // Skip the all-null row
-        if (rec.row.IsNull(0)) {
-            std::cout << "  [null row] skipped" << std::endl;
-            continue;
-        }
-        if (rec.row.GetType(0) != fluss::TypeId::Int) {
-            std::cerr << "ERROR: projected field 0 expected Int, got "
-                      << static_cast<int>(rec.row.GetType(0)) << std::endl;
-            scan_ok = false;
-        }
-        if (rec.row.GetType(1) != fluss::TypeId::TimestampLtz) {
-            std::cerr << "ERROR: projected field 1 expected TimestampLtz, got "
-                      << static_cast<int>(rec.row.GetType(1)) << std::endl;
-            scan_ok = false;
-        }
+    std::cout << "Projected records: " << projected_records.Count() << std::endl;
+    for (const auto& tb : projected_records.Buckets()) {
+        for (const auto& rec : projected_records.Records(tb)) {
+            if (rec.row.FieldCount() != 2) {
+                std::cerr << "ERROR: expected 2 fields, got " << rec.row.FieldCount() << std::endl;
+                scan_ok = false;
+                continue;
+            }
+            // Skip the all-null row
+            if (rec.row.IsNull(0)) {
+                std::cout << "  [null row] skipped" << std::endl;
+                continue;
+            }
+            if (rec.row.GetType(0) != fluss::TypeId::Int) {
+                std::cerr << "ERROR: projected field 0 expected Int, got "
+                          << static_cast<int>(rec.row.GetType(0)) << std::endl;
+                scan_ok = false;
+            }
+            if (rec.row.GetType(1) != fluss::TypeId::TimestampLtz) {
+                std::cerr << "ERROR: projected field 1 expected TimestampLtz, got "
+                          << static_cast<int>(rec.row.GetType(1)) << std::endl;
+                scan_ok = false;
+            }
 
-        auto ts = rec.row.GetTimestamp(1);
-        std::cout << "  id=" << rec.row.GetInt32(0) << " updated_at=" << ts.epoch_millis << "+"
-                  << ts.nano_of_millisecond << "ns" << std::endl;
+            auto ts = rec.row.GetTimestamp(1);
+            std::cout << "  id=" << rec.row.GetInt32(0) << " updated_at=" << ts.epoch_millis << "+"
+                      << ts.nano_of_millisecond << "ns" << std::endl;
+        }
     }
 
     // 7b) Projected scan by column names — same columns as above but using names
@@ -287,32 +306,34 @@ int main() {
     fluss::ScanRecords name_projected_records;
     check("poll_name_projected", name_projected_scanner.Poll(5000, name_projected_records));
 
-    std::cout << "Name-projected records: " << name_projected_records.Size() << std::endl;
-    for (const auto& rec : name_projected_records) {
-        if (rec.row.FieldCount() != 2) {
-            std::cerr << "ERROR: expected 2 fields, got " << rec.row.FieldCount() << std::endl;
-            scan_ok = false;
-            continue;
-        }
-        // Skip the all-null row
-        if (rec.row.IsNull(0)) {
-            std::cout << "  [null row] skipped" << std::endl;
-            continue;
-        }
-        if (rec.row.GetType(0) != fluss::TypeId::Int) {
-            std::cerr << "ERROR: name-projected field 0 expected Int, got "
-                      << static_cast<int>(rec.row.GetType(0)) << std::endl;
-            scan_ok = false;
-        }
-        if (rec.row.GetType(1) != fluss::TypeId::TimestampLtz) {
-            std::cerr << "ERROR: name-projected field 1 expected TimestampLtz, got "
-                      << static_cast<int>(rec.row.GetType(1)) << std::endl;
-            scan_ok = false;
-        }
+    std::cout << "Name-projected records: " << name_projected_records.Count() << std::endl;
+    for (const auto& tb : name_projected_records.Buckets()) {
+        for (const auto& rec : name_projected_records.Records(tb)) {
+            if (rec.row.FieldCount() != 2) {
+                std::cerr << "ERROR: expected 2 fields, got " << rec.row.FieldCount() << std::endl;
+                scan_ok = false;
+                continue;
+            }
+            // Skip the all-null row
+            if (rec.row.IsNull(0)) {
+                std::cout << "  [null row] skipped" << std::endl;
+                continue;
+            }
+            if (rec.row.GetType(0) != fluss::TypeId::Int) {
+                std::cerr << "ERROR: name-projected field 0 expected Int, got "
+                          << static_cast<int>(rec.row.GetType(0)) << std::endl;
+                scan_ok = false;
+            }
+            if (rec.row.GetType(1) != fluss::TypeId::TimestampLtz) {
+                std::cerr << "ERROR: name-projected field 1 expected TimestampLtz, got "
+                          << static_cast<int>(rec.row.GetType(1)) << std::endl;
+                scan_ok = false;
+            }
 
-        auto ts = rec.row.GetTimestamp(1);
-        std::cout << "  id=" << rec.row.GetInt32(0) << " updated_at=" << ts.epoch_millis << "+"
-                  << ts.nano_of_millisecond << "ns" << std::endl;
+            auto ts = rec.row.GetTimestamp(1);
+            std::cout << "  id=" << rec.row.GetInt32(0) << " updated_at=" << ts.epoch_millis << "+"
+                      << ts.nano_of_millisecond << "ns" << std::endl;
+        }
     }
 
     if (scan_ok) {
@@ -356,8 +377,8 @@ int main() {
 
     std::unordered_map<int32_t, int64_t> timestamp_offsets;
     check("list_timestamp_offsets",
-          admin.ListOffsets(table_path, all_bucket_ids,
-                            fluss::OffsetSpec::Timestamp(timestamp_ms), timestamp_offsets));
+          admin.ListOffsets(table_path, all_bucket_ids, fluss::OffsetSpec::Timestamp(timestamp_ms),
+                            timestamp_offsets));
     std::cout << "Offsets for timestamp " << timestamp_ms << " (1 hour ago):" << std::endl;
     for (const auto& [bucket_id, offset] : timestamp_offsets) {
         std::cout << "  Bucket " << bucket_id << ": offset=" << offset << std::endl;
@@ -381,15 +402,21 @@ int main() {
     fluss::ScanRecords batch_records;
     check("poll_batch", batch_scanner.Poll(5000, batch_records));
 
-    std::cout << "Scanned " << batch_records.Size() << " records from batch subscription"
+    std::cout << "Scanned " << batch_records.Count() << " records from batch subscription"
               << std::endl;
-    for (size_t i = 0; i < batch_records.Size() && i < 5; ++i) {
-        const auto& rec = batch_records[i];
-        std::cout << "  Record " << i << ": bucket_id=" << rec.bucket_id
-                  << ", offset=" << rec.offset << ", timestamp=" << rec.timestamp << std::endl;
-    }
-    if (batch_records.Size() > 5) {
-        std::cout << "  ... and " << (batch_records.Size() - 5) << " more records" << std::endl;
+    for (const auto& tb : batch_records.Buckets()) {
+        size_t shown = 0;
+        for (const auto& rec : batch_records.Records(tb)) {
+            if (shown < 5) {
+                std::cout << "  bucket_id=" << tb.bucket_id << ", offset=" << rec.offset
+                          << ", timestamp=" << rec.timestamp << std::endl;
+            }
+            ++shown;
+        }
+        if (shown > 5) {
+            std::cout << "  ... and " << (shown - 5) << " more records in bucket " << tb.bucket_id
+                      << std::endl;
+        }
     }
 
     // 9.1) Unsubscribe from a bucket
@@ -520,11 +547,13 @@ int main() {
 
         fluss::ScanRecords arrow_write_records;
         check("poll_arrow_write", arrow_write_scanner.Poll(5000, arrow_write_records));
-        std::cout << "Scanned " << arrow_write_records.Size()
+        std::cout << "Scanned " << arrow_write_records.Count()
                   << " records written via AppendArrowBatch:" << std::endl;
-        for (const auto& rec : arrow_write_records) {
-            std::cout << "  id=" << rec.row.GetInt32(0) << " name=" << rec.row.GetString(1)
-                      << " score=" << rec.row.GetFloat32(2) << std::endl;
+        for (const auto& tb : arrow_write_records.Buckets()) {
+            for (const auto& rec : arrow_write_records.Records(tb)) {
+                std::cout << "  id=" << rec.row.GetInt32(0) << " name=" << rec.row.GetString(1)
+                          << " score=" << rec.row.GetFloat32(2) << std::endl;
+            }
         }
     }
 
@@ -591,11 +620,13 @@ int main() {
     fluss::ScanRecords decimal_records;
     check("poll_decimal", decimal_scanner.Poll(5000, decimal_records));
 
-    std::cout << "Scanned decimal records: " << decimal_records.Size() << std::endl;
-    for (const auto& rec : decimal_records) {
-        std::cout << "  id=" << rec.row.GetInt32(0) << " price=" << rec.row.GetDecimalString(1)
-                  << " amount=" << rec.row.GetDecimalString(2)
-                  << " is_decimal=" << rec.row.IsDecimal(1) << std::endl;
+    std::cout << "Scanned decimal records: " << decimal_records.Count() << std::endl;
+    for (const auto& tb : decimal_records.Buckets()) {
+        for (const auto& rec : decimal_records.Records(tb)) {
+            std::cout << "  id=" << rec.row.GetInt32(0) << " price=" << rec.row.GetDecimalString(1)
+                      << " amount=" << rec.row.GetDecimalString(2)
+                      << " is_decimal=" << rec.row.IsDecimal(1) << std::endl;
+        }
     }
 
     // 14) Partitioned table example
@@ -690,14 +721,15 @@ int main() {
 
     fluss::ScanRecords partition_records;
     check("poll_partitioned", partition_scanner.Poll(5000, partition_records));
-    std::cout << "Scanned " << partition_records.Size() << " records from partitioned table"
+    std::cout << "Scanned " << partition_records.Count() << " records from partitioned table"
               << std::endl;
-    for (size_t i = 0; i < partition_records.Size(); ++i) {
-        const auto& rec = partition_records[i];
-        std::cout << "  Record " << i << ": partition_id="
-                  << (rec.partition_id.has_value() ? std::to_string(*rec.partition_id) : "none")
-                  << ", id=" << rec.row.GetInt32(0) << ", region=" << rec.row.GetString(1)
-                  << ", value=" << rec.row.GetInt64(2) << std::endl;
+    for (const auto& tb : partition_records.Buckets()) {
+        for (const auto& rec : partition_records.Records(tb)) {
+            std::cout << "  partition_id="
+                      << (tb.partition_id.has_value() ? std::to_string(*tb.partition_id) : "none")
+                      << ", id=" << rec.row.GetInt32(0) << ", region=" << rec.row.GetString(1)
+                      << ", value=" << rec.row.GetInt64(2) << std::endl;
+        }
     }
 
     // 14.2) subscribe_partition_buckets: batch subscribe to all partitions at once
@@ -717,13 +749,13 @@ int main() {
 
     fluss::ScanRecords partition_batch_records;
     check("poll_partition_batch", partition_batch_scanner.Poll(5000, partition_batch_records));
-    std::cout << "Scanned " << partition_batch_records.Size()
+    std::cout << "Scanned " << partition_batch_records.Count()
               << " records from batch partition subscription" << std::endl;
-    for (size_t i = 0; i < partition_batch_records.Size(); ++i) {
-        const auto& rec = partition_batch_records[i];
-        std::cout << "  Record " << i << ": id=" << rec.row.GetInt32(0)
-                  << ", region=" << rec.row.GetString(1) << ", value=" << rec.row.GetInt64(2)
-                  << std::endl;
+    for (const auto& tb : partition_batch_records.Buckets()) {
+        for (const auto& rec : partition_batch_records.Records(tb)) {
+            std::cout << "  id=" << rec.row.GetInt32(0) << ", region=" << rec.row.GetString(1)
+                      << ", value=" << rec.row.GetInt64(2) << std::endl;
+        }
     }
 
     // 14.3) UnsubscribePartition: unsubscribe from one partition, verify remaining
@@ -743,12 +775,12 @@ int main() {
 
     fluss::ScanRecords unsub_records;
     check("poll_after_unsub", unsub_partition_scanner.Poll(5000, unsub_records));
-    std::cout << "After unsubscribe, scanned " << unsub_records.Size() << " records" << std::endl;
-    for (size_t i = 0; i < unsub_records.Size(); ++i) {
-        const auto& rec = unsub_records[i];
-        std::cout << "  Record " << i << ": id=" << rec.row.GetInt32(0)
-                  << ", region=" << rec.row.GetString(1) << ", value=" << rec.row.GetInt64(2)
-                  << std::endl;
+    std::cout << "After unsubscribe, scanned " << unsub_records.Count() << " records" << std::endl;
+    for (const auto& tb : unsub_records.Buckets()) {
+        for (const auto& rec : unsub_records.Records(tb)) {
+            std::cout << "  id=" << rec.row.GetInt32(0) << ", region=" << rec.row.GetString(1)
+                      << ", value=" << rec.row.GetInt64(2) << std::endl;
+        }
     }
 
     // Cleanup
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 27d1fcb9c1..9ea7e416fc 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -507,6 +507,17 @@ struct NamedGetters {
    private:
     const Derived& Self() const { return static_cast<const Derived&>(*this); }
 };
+
+struct ScanData {
+    ffi::ScanResultInner* raw;
+    ColumnMap columns;
+
+    ScanData(ffi::ScanResultInner* r, ColumnMap cols) : raw(r), columns(std::move(cols)) {}
+    ~ScanData();
+
+    ScanData(const ScanData&) = delete;
+    ScanData& operator=(const ScanData&) = delete;
+};
 }  // namespace detail
 
 class GenericRow {
@@ -623,9 +634,8 @@ class RowView : public detail::NamedGetters<RowView> {
     friend struct detail::NamedGetters<RowView>;
 
    public:
-    RowView(std::shared_ptr<const ffi::ScanResultInner> inner, size_t record_idx,
-            std::shared_ptr<const detail::ColumnMap> column_map)
-        : inner_(std::move(inner)), record_idx_(record_idx), column_map_(std::move(column_map)) {}
+    RowView(std::shared_ptr<const detail::ScanData> data, size_t bucket_idx, size_t rec_idx)
+        : data_(std::move(data)), bucket_idx_(bucket_idx), rec_idx_(rec_idx) {}
 
     // ── Index-based getters ──────────────────────────────────────────
     size_t FieldCount() const;
@@ -660,14 +670,28 @@ class RowView : public detail::NamedGetters<RowView> {
 
    private:
     size_t Resolve(const std::string& name) const {
-        if (!column_map_) {
+        if (!data_) {
             throw std::runtime_error("RowView: name-based access not available");
         }
-        return detail::ResolveColumn(*column_map_, name);
+        return detail::ResolveColumn(data_->columns, name);
+    }
+    std::shared_ptr<const detail::ScanData> data_;
+    size_t bucket_idx_;
+    size_t rec_idx_;
+};
+
+/// Identifies a specific bucket, optionally within a partition.
+struct TableBucket {
+    int64_t table_id;
+    int32_t bucket_id;
+    std::optional<int64_t> partition_id;
+
+    bool operator==(const TableBucket& other) const {
+        return table_id == other.table_id && bucket_id == other.bucket_id &&
+               partition_id == other.partition_id;
     }
-    std::shared_ptr<const ffi::ScanResultInner> inner_;
-    size_t record_idx_;
-    std::shared_ptr<const detail::ColumnMap> column_map_;
+
+    bool operator!=(const TableBucket& other) const { return !(*this == other); }
 };
 
 /// A single scan record. Contains metadata and a RowView for field access.
@@ -675,14 +699,61 @@ class RowView : public detail::NamedGetters<RowView> {
 /// ScanRecord is a value type that can be freely copied, stored, and
 /// accumulated across multiple Poll() calls.
 struct ScanRecord {
-    int32_t bucket_id;
-    std::optional<int64_t> partition_id;
     int64_t offset;
     int64_t timestamp;
     ChangeType change_type;
     RowView row;
 };
 
+/// A view into a subset of scan results for a single bucket.
+///
+/// BucketView is a value type — it shares ownership of the underlying scan data
+/// via reference counting, so it can safely outlive the ScanRecords that produced it.
+class BucketView {
+   public:
+    BucketView(std::shared_ptr<const detail::ScanData> data, TableBucket bucket, size_t bucket_idx,
+               size_t count)
+        : data_(std::move(data)),
+          bucket_(std::move(bucket)),
+          bucket_idx_(bucket_idx),
+          count_(count) {}
+
+    /// The bucket these records belong to.
+    const TableBucket& Bucket() const { return bucket_; }
+
+    /// Number of records in this bucket.
+    size_t Size() const { return count_; }
+    bool Empty() const { return count_ == 0; }
+
+    /// Access a record by its position within this bucket (0-based).
+    ScanRecord operator[](size_t idx) const;
+
+    class Iterator {
+       public:
+        ScanRecord operator*() const;
+        Iterator& operator++() {
+            ++idx_;
+            return *this;
+        }
+        bool operator!=(const Iterator& other) const { return idx_ != other.idx_; }
+
+       private:
+        friend class BucketView;
+        Iterator(const BucketView* owner, size_t idx) : owner_(owner), idx_(idx) {}
+        const BucketView* owner_;
+        size_t idx_;
+    };
+
+    Iterator begin() const { return Iterator(this, 0); }
+    Iterator end() const { return Iterator(this, count_); }
+
+   private:
+    std::shared_ptr<const detail::ScanData> data_;
+    TableBucket bucket_;
+    size_t bucket_idx_;
+    size_t count_;
+};
+
 class ScanRecords {
    public:
     ScanRecords() noexcept = default;
@@ -693,36 +764,52 @@ class ScanRecords {
     ScanRecords(ScanRecords&&) noexcept = default;
     ScanRecords& operator=(ScanRecords&&) noexcept = default;
 
-    size_t Size() const;
-    bool Empty() const;
-    ScanRecord operator[](size_t idx) const;
+    /// Total number of records across all buckets.
+    size_t Count() const;
+    bool IsEmpty() const;
+
+    /// Number of distinct buckets with records.
+    size_t BucketCount() const;
+
+    /// List of distinct buckets that have records.
+    std::vector<TableBucket> Buckets() const;
+
+    /// Get a view of records for a specific bucket.
+    ///
+    /// Returns an empty BucketView if the bucket is not present (matches Rust/Java).
+    /// Note: O(B) linear scan. For iteration over all buckets, prefer BucketAt(idx).
+    BucketView Records(const TableBucket& bucket) const;
 
+    /// Get a view of records by bucket index (0-based). O(1).
+    ///
+    /// Throws std::out_of_range if idx >= BucketCount().
+    BucketView BucketAt(size_t idx) const;
+
+    /// Flat iterator over all records across all buckets (matches Java Iterable<ScanRecord>).
     class Iterator {
        public:
         ScanRecord operator*() const;
-        Iterator& operator++() {
-            ++idx_;
-            return *this;
+        Iterator& operator++();
+        bool operator!=(const Iterator& other) const {
+            return bucket_idx_ != other.bucket_idx_ || rec_idx_ != other.rec_idx_;
         }
-        bool operator!=(const Iterator& other) const { return idx_ != other.idx_; }
 
        private:
         friend class ScanRecords;
-        Iterator(const ScanRecords* owner, size_t idx) : owner_(owner), idx_(idx) {}
+        Iterator(const ScanRecords* owner, size_t bucket_idx, size_t rec_idx)
+            : owner_(owner), bucket_idx_(bucket_idx), rec_idx_(rec_idx) {}
         const ScanRecords* owner_;
-        size_t idx_;
+        size_t bucket_idx_;
+        size_t rec_idx_;
     };
 
-    Iterator begin() const { return Iterator(this, 0); }
-    Iterator end() const { return Iterator(this, Size()); }
+    Iterator begin() const;
+    Iterator end() const { return Iterator(this, BucketCount(), 0); }
 
    private:
-    /// Returns the column name-to-index map (lazy-built, cached).
-    const std::shared_ptr<detail::ColumnMap>& GetColumnMap() const;
     friend class LogScanner;
-    void BuildColumnMap() const;
-    std::shared_ptr<ffi::ScanResultInner> inner_;
-    mutable std::shared_ptr<detail::ColumnMap> column_map_;
+    ScanRecord RecordAt(size_t bucket, size_t rec_idx) const;
+    std::shared_ptr<const detail::ScanData> data_;
 };
 
 class ArrowRecordBatch {
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index cb29882d16..9f987b94a9 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -141,6 +141,14 @@ mod ffi {
         timestamp: i64,
     }
 
+    struct FfiBucketInfo {
+        table_id: i64,
+        bucket_id: i32,
+        has_partition_id: bool,
+        partition_id: i64,
+        record_count: usize,
+    }
+
     struct FfiBucketSubscription {
         bucket_id: i32,
         offset: i64,
@@ -420,27 +428,96 @@ mod ffi {
         fn sv_column_count(self: &ScanResultInner) -> usize;
         fn sv_column_name(self: &ScanResultInner, field: usize) -> Result<&str>;
         fn sv_column_type(self: &ScanResultInner, field: usize) -> Result<i32>;
-        fn sv_bucket_id(self: &ScanResultInner, rec: usize) -> i32;
-        fn sv_has_partition_id(self: &ScanResultInner, rec: usize) -> bool;
-        fn sv_partition_id(self: &ScanResultInner, rec: usize) -> i64;
-        fn sv_offset(self: &ScanResultInner, rec: usize) -> i64;
-        fn sv_timestamp(self: &ScanResultInner, rec: usize) -> i64;
-        fn sv_change_type(self: &ScanResultInner, rec: usize) -> i32;
+        fn sv_offset(self: &ScanResultInner, bucket: usize, rec: usize) -> i64;
+        fn sv_timestamp(self: &ScanResultInner, bucket: usize, rec: usize) -> i64;
+        fn sv_change_type(self: &ScanResultInner, bucket: usize, rec: usize) -> i32;
         fn sv_field_count(self: &ScanResultInner) -> usize;
-        fn sv_is_null(self: &ScanResultInner, rec: usize, field: usize) -> Result<bool>;
-        fn sv_get_bool(self: &ScanResultInner, rec: usize, field: usize) -> Result<bool>;
-        fn sv_get_i32(self: &ScanResultInner, rec: usize, field: usize) -> Result<i32>;
-        fn sv_get_i64(self: &ScanResultInner, rec: usize, field: usize) -> Result<i64>;
-        fn sv_get_f32(self: &ScanResultInner, rec: usize, field: usize) -> Result<f32>;
-        fn sv_get_f64(self: &ScanResultInner, rec: usize, field: usize) -> Result<f64>;
-        fn sv_get_str(self: &ScanResultInner, rec: usize, field: usize) -> Result<&str>;
-        fn sv_get_bytes(self: &ScanResultInner, rec: usize, field: usize) -> Result<&[u8]>;
-        fn sv_get_date_days(self: &ScanResultInner, rec: usize, field: usize) -> Result<i32>;
-        fn sv_get_time_millis(self: &ScanResultInner, rec: usize, field: usize) -> Result<i32>;
-        fn sv_get_ts_millis(self: &ScanResultInner, rec: usize, field: usize) -> Result<i64>;
-        fn sv_get_ts_nanos(self: &ScanResultInner, rec: usize, field: usize) -> Result<i32>;
-        fn sv_is_ts_ltz(self: &ScanResultInner, rec: usize, field: usize) -> Result<bool>;
-        fn sv_get_decimal_str(self: &ScanResultInner, rec: usize, field: usize) -> Result<String>;
+        fn sv_is_null(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<bool>;
+        fn sv_get_bool(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<bool>;
+        fn sv_get_i32(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<i32>;
+        fn sv_get_i64(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<i64>;
+        fn sv_get_f32(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<f32>;
+        fn sv_get_f64(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<f64>;
+        fn sv_get_str(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<&str>;
+        fn sv_get_bytes(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<&[u8]>;
+        fn sv_get_date_days(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<i32>;
+        fn sv_get_time_millis(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<i32>;
+        fn sv_get_ts_millis(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<i64>;
+        fn sv_get_ts_nanos(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<i32>;
+        fn sv_is_ts_ltz(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<bool>;
+        fn sv_get_decimal_str(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<String>;
+
+        fn sv_bucket_infos(self: &ScanResultInner) -> &Vec<FfiBucketInfo>;
     }
 }
 
@@ -1487,24 +1564,27 @@ impl LogScanner {
         match result {
             Ok(records) => {
                 let columns = self.projected_columns.clone();
-                // Flatten ScanRecords into a Vec<FlatScanRecord> — moves Arc<RecordBatch>, zero copy
-                let mut flat = Vec::with_capacity(records.count());
+                let mut total_count = 0usize;
+                let mut buckets = Vec::new();
+                let mut bucket_infos = Vec::new();
                 for (table_bucket, bucket_records) in records.into_records_by_buckets() {
-                    let bucket_id = table_bucket.bucket_id();
-                    let partition = table_bucket.partition_id();
-                    for record in bucket_records {
-                        flat.push(FlatScanRecord {
-                            bucket_id,
-                            has_partition_id: partition.is_some(),
-                            partition_id: partition.unwrap_or(0),
-                            record,
-                        });
-                    }
+                    let count = bucket_records.len();
+                    total_count += count;
+                    bucket_infos.push(ffi::FfiBucketInfo {
+                        table_id: table_bucket.table_id(),
+                        bucket_id: table_bucket.bucket_id(),
+                        has_partition_id: table_bucket.partition_id().is_some(),
+                        partition_id: table_bucket.partition_id().unwrap_or(0),
+                        record_count: count,
+                    });
+                    buckets.push((table_bucket, bucket_records));
                 }
                 Box::new(ScanResultInner {
                     error: None,
-                    records: flat,
+                    buckets,
                     columns,
+                    bucket_infos,
+                    total_count,
                 })
             }
             Err(e) => {
@@ -1917,28 +1997,29 @@ mod row_reader {
 // Opaque types: ScanResultInner (scan read path)
 // ============================================================================
 
-struct FlatScanRecord {
-    bucket_id: i32,
-    has_partition_id: bool,
-    partition_id: i64,
-    record: fcore::record::ScanRecord,
-}
-
 pub struct ScanResultInner {
     error: Option<(i32, String)>,
-    records: Vec<FlatScanRecord>,
+    buckets: Vec<(fcore::metadata::TableBucket, Vec<fcore::record::ScanRecord>)>,
     columns: Vec<fcore::metadata::Column>,
+    bucket_infos: Vec<ffi::FfiBucketInfo>,
+    total_count: usize,
 }
 
 impl ScanResultInner {
     fn from_error(code: i32, msg: String) -> Self {
         Self {
             error: Some((code, msg)),
-            records: Vec::new(),
+            buckets: Vec::new(),
             columns: Vec::new(),
+            bucket_infos: Vec::new(),
+            total_count: 0,
         }
     }
 
+    fn resolve(&self, bucket: usize, rec: usize) -> &fcore::record::ScanRecord {
+        &self.buckets[bucket].1[rec]
+    }
+
     fn sv_has_error(&self) -> bool {
         self.error.is_some()
     }
@@ -1952,7 +2033,7 @@ impl ScanResultInner {
     }
 
     fn sv_record_count(&self) -> usize {
-        self.records.len()
+        self.total_count
     }
 
     fn sv_column_count(&self) -> usize {
@@ -1965,71 +2046,70 @@ impl ScanResultInner {
         row_reader::column_type(&self.columns, field)
     }
 
-    // Metadata accessors — C++ validates rec in operator[] before calling these.
-    fn sv_bucket_id(&self, rec: usize) -> i32 {
-        self.records[rec].bucket_id
+    fn sv_offset(&self, bucket: usize, rec: usize) -> i64 {
+        self.resolve(bucket, rec).offset()
     }
-    fn sv_has_partition_id(&self, rec: usize) -> bool {
-        self.records[rec].has_partition_id
+    fn sv_timestamp(&self, bucket: usize, rec: usize) -> i64 {
+        self.resolve(bucket, rec).timestamp()
     }
-    fn sv_partition_id(&self, rec: usize) -> i64 {
-        self.records[rec].partition_id
-    }
-    fn sv_offset(&self, rec: usize) -> i64 {
-        self.records[rec].record.offset()
-    }
-    fn sv_timestamp(&self, rec: usize) -> i64 {
-        self.records[rec].record.timestamp()
-    }
-    fn sv_change_type(&self, rec: usize) -> i32 {
-        self.records[rec].record.change_type().to_byte_value() as i32
+    fn sv_change_type(&self, bucket: usize, rec: usize) -> i32 {
+        self.resolve(bucket, rec).change_type().to_byte_value() as i32
     }
     fn sv_field_count(&self) -> usize {
         self.columns.len()
     }
 
-    // Field accessors — C++ validates rec in operator[], validate() checks field.
-    fn sv_is_null(&self, rec: usize, field: usize) -> Result<bool, String> {
-        row_reader::is_null(self.records[rec].record.row(), &self.columns, field)
+    // Field accessors — C++ validates bounds in BucketView/RecordAt, validate() checks field.
+    fn sv_is_null(&self, bucket: usize, rec: usize, field: usize) -> Result<bool, String> {
+        row_reader::is_null(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_bool(&self, rec: usize, field: usize) -> Result<bool, String> {
-        row_reader::get_bool(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_bool(&self, bucket: usize, rec: usize, field: usize) -> Result<bool, String> {
+        row_reader::get_bool(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_i32(&self, rec: usize, field: usize) -> Result<i32, String> {
-        row_reader::get_i32(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_i32(&self, bucket: usize, rec: usize, field: usize) -> Result<i32, String> {
+        row_reader::get_i32(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_i64(&self, rec: usize, field: usize) -> Result<i64, String> {
-        row_reader::get_i64(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_i64(&self, bucket: usize, rec: usize, field: usize) -> Result<i64, String> {
+        row_reader::get_i64(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_f32(&self, rec: usize, field: usize) -> Result<f32, String> {
-        row_reader::get_f32(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_f32(&self, bucket: usize, rec: usize, field: usize) -> Result<f32, String> {
+        row_reader::get_f32(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_f64(&self, rec: usize, field: usize) -> Result<f64, String> {
-        row_reader::get_f64(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_f64(&self, bucket: usize, rec: usize, field: usize) -> Result<f64, String> {
+        row_reader::get_f64(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_str(&self, rec: usize, field: usize) -> Result<&str, String> {
-        row_reader::get_str(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_str(&self, bucket: usize, rec: usize, field: usize) -> Result<&str, String> {
+        row_reader::get_str(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_bytes(&self, rec: usize, field: usize) -> Result<&[u8], String> {
-        row_reader::get_bytes(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_bytes(&self, bucket: usize, rec: usize, field: usize) -> Result<&[u8], String> {
+        row_reader::get_bytes(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_date_days(&self, rec: usize, field: usize) -> Result<i32, String> {
-        row_reader::get_date_days(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_date_days(&self, bucket: usize, rec: usize, field: usize) -> Result<i32, String> {
+        row_reader::get_date_days(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_time_millis(&self, rec: usize, field: usize) -> Result<i32, String> {
-        row_reader::get_time_millis(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_time_millis(&self, bucket: usize, rec: usize, field: usize) -> Result<i32, String> {
+        row_reader::get_time_millis(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_ts_millis(&self, rec: usize, field: usize) -> Result<i64, String> {
-        row_reader::get_ts_millis(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_ts_millis(&self, bucket: usize, rec: usize, field: usize) -> Result<i64, String> {
+        row_reader::get_ts_millis(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_get_ts_nanos(&self, rec: usize, field: usize) -> Result<i32, String> {
-        row_reader::get_ts_nanos(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_ts_nanos(&self, bucket: usize, rec: usize, field: usize) -> Result<i32, String> {
+        row_reader::get_ts_nanos(self.resolve(bucket, rec).row(), &self.columns, field)
     }
-    fn sv_is_ts_ltz(&self, _rec: usize, field: usize) -> Result<bool, String> {
+    fn sv_is_ts_ltz(&self, _bucket: usize, _rec: usize, field: usize) -> Result<bool, String> {
         row_reader::is_ts_ltz(&self.columns, field)
     }
-    fn sv_get_decimal_str(&self, rec: usize, field: usize) -> Result<String, String> {
-        row_reader::get_decimal_str(self.records[rec].record.row(), &self.columns, field)
+    fn sv_get_decimal_str(
+        &self,
+        bucket: usize,
+        rec: usize,
+        field: usize,
+    ) -> Result<String, String> {
+        row_reader::get_decimal_str(self.resolve(bucket, rec).row(), &self.columns, field)
+    }
+
+    fn sv_bucket_infos(&self) -> &Vec<ffi::FfiBucketInfo> {
+        &self.bucket_infos
     }
 }
 
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index a697cea078..73035bb9b9 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -191,75 +191,91 @@ void GenericRow::SetDecimal(size_t idx, const std::string& value) {
     inner_->gr_set_decimal_str(idx, value);
 }
 
+// ============================================================================
+// ScanData — destructor must live in .cpp where rust::Box is visible
+// ============================================================================
+
+detail::ScanData::~ScanData() {
+    // Re-wrap the raw pointer in a rust::Box; the temporary is destroyed at the
+    // end of the statement, which releases the Rust-side ScanResultInner.
+    if (raw != nullptr) rust::Box<ffi::ScanResultInner>::from_raw(raw);
+}
+
 // ============================================================================
 // RowView — zero-copy read-only row view for scan results
 // ============================================================================
 
-size_t RowView::FieldCount() const { return inner_ ? inner_->sv_field_count() : 0; }
+// NOLINTNEXTLINE(cppcoreguidelines-macro-usage)
+#define CHECK_DATA(name)                                                                 \
+    do {                                                                                 \
+        if (!data_) throw std::logic_error(name ": not available (moved-from or null)"); \
+    } while (0)
+
+size_t RowView::FieldCount() const { return data_ ? data_->raw->sv_field_count() : 0; }
 
 TypeId RowView::GetType(size_t idx) const {
-    CHECK_INNER("RowView");
-    return static_cast<TypeId>(inner_->sv_column_type(idx));
+    CHECK_DATA("RowView");
+    return static_cast<TypeId>(data_->raw->sv_column_type(idx));
 }
 
 bool RowView::IsNull(size_t idx) const {
-    CHECK_INNER("RowView");
-    return inner_->sv_is_null(record_idx_, idx);
+    CHECK_DATA("RowView");
+    return data_->raw->sv_is_null(bucket_idx_, rec_idx_, idx);
 }
 bool RowView::GetBool(size_t idx) const {
-    CHECK_INNER("RowView");
-    return inner_->sv_get_bool(record_idx_, idx);
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_bool(bucket_idx_, rec_idx_, idx);
 }
 int32_t RowView::GetInt32(size_t idx) const {
-    CHECK_INNER("RowView");
-    return inner_->sv_get_i32(record_idx_, idx);
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_i32(bucket_idx_, rec_idx_, idx);
 }
 int64_t RowView::GetInt64(size_t idx) const {
-    CHECK_INNER("RowView");
-    return inner_->sv_get_i64(record_idx_, idx);
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_i64(bucket_idx_, rec_idx_, idx);
 }
 float RowView::GetFloat32(size_t idx) const {
-    CHECK_INNER("RowView");
-    return inner_->sv_get_f32(record_idx_, idx);
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_f32(bucket_idx_, rec_idx_, idx);
 }
 double RowView::GetFloat64(size_t idx) const {
-    CHECK_INNER("RowView");
-    return inner_->sv_get_f64(record_idx_, idx);
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_f64(bucket_idx_, rec_idx_, idx);
 }
 
 std::string_view RowView::GetString(size_t idx) const {
-    CHECK_INNER("RowView");
-    auto s = inner_->sv_get_str(record_idx_, idx);
+    CHECK_DATA("RowView");
+    auto s = data_->raw->sv_get_str(bucket_idx_, rec_idx_, idx);
     return std::string_view(s.data(), s.size());
 }
 
 std::pair<const uint8_t*, size_t> RowView::GetBytes(size_t idx) const {
-    CHECK_INNER("RowView");
-    auto bytes = inner_->sv_get_bytes(record_idx_, idx);
+    CHECK_DATA("RowView");
+    auto bytes = data_->raw->sv_get_bytes(bucket_idx_, rec_idx_, idx);
     return {bytes.data(), bytes.size()};
 }
 
 Date RowView::GetDate(size_t idx) const {
-    CHECK_INNER("RowView");
-    return Date{inner_->sv_get_date_days(record_idx_, idx)};
+    CHECK_DATA("RowView");
+    return Date{data_->raw->sv_get_date_days(bucket_idx_, rec_idx_, idx)};
 }
 
 Time RowView::GetTime(size_t idx) const {
-    CHECK_INNER("RowView");
-    return Time{inner_->sv_get_time_millis(record_idx_, idx)};
+    CHECK_DATA("RowView");
+    return Time{data_->raw->sv_get_time_millis(bucket_idx_, rec_idx_, idx)};
 }
 
 Timestamp RowView::GetTimestamp(size_t idx) const {
-    CHECK_INNER("RowView");
-    return Timestamp{inner_->sv_get_ts_millis(record_idx_, idx),
-                     inner_->sv_get_ts_nanos(record_idx_, idx)};
+    CHECK_DATA("RowView");
+    return Timestamp{data_->raw->sv_get_ts_millis(bucket_idx_, rec_idx_, idx),
+                     data_->raw->sv_get_ts_nanos(bucket_idx_, rec_idx_, idx)};
 }
 
 bool RowView::IsDecimal(size_t idx) const { return GetType(idx) == TypeId::Decimal; }
 
 std::string RowView::GetDecimalString(size_t idx) const {
-    CHECK_INNER("RowView");
-    return std::string(inner_->sv_get_decimal_str(record_idx_, idx));
+    CHECK_DATA("RowView");
+    return std::string(data_->raw->sv_get_decimal_str(bucket_idx_, rec_idx_, idx));
 }
 
 // ============================================================================
@@ -268,48 +284,94 @@ std::string RowView::GetDecimalString(size_t idx) const {
 
 // ScanRecords constructor, destructor, move operations are all defaulted in the header.
 
-size_t ScanRecords::Size() const { return inner_ ? inner_->sv_record_count() : 0; }
+size_t ScanRecords::Count() const { return data_ ? data_->raw->sv_record_count() : 0; }
 
-bool ScanRecords::Empty() const { return Size() == 0; }
+bool ScanRecords::IsEmpty() const { return Count() == 0; }
 
-void ScanRecords::BuildColumnMap() const {
-    if (!inner_) return;
-    auto map = std::make_shared<detail::ColumnMap>();
-    auto count = inner_->sv_column_count();
-    for (size_t i = 0; i < count; ++i) {
-        auto name = inner_->sv_column_name(i);
-        (*map)[std::string(name.data(), name.size())] = {
-            i, static_cast<TypeId>(inner_->sv_column_type(i))};
+ScanRecord ScanRecords::RecordAt(size_t bucket, size_t rec_idx) const {
+    if (!data_) {
+        throw std::logic_error("ScanRecords: not available (moved-from or null)");
     }
-    column_map_ = std::move(map);
+    return ScanRecord{data_->raw->sv_offset(bucket, rec_idx),
+                      data_->raw->sv_timestamp(bucket, rec_idx),
+                      static_cast<ChangeType>(data_->raw->sv_change_type(bucket, rec_idx)),
+                      RowView(data_, bucket, rec_idx)};
+}
+
+static TableBucket to_table_bucket(const ffi::FfiBucketInfo& g) {
+    return TableBucket{g.table_id, g.bucket_id,
+                       g.has_partition_id ? std::optional<int64_t>(g.partition_id) : std::nullopt};
+}
+
+size_t ScanRecords::BucketCount() const { return data_ ? data_->raw->sv_bucket_infos().size() : 0; }
+
+ScanRecord ScanRecords::Iterator::operator*() const {
+    return owner_->RecordAt(bucket_idx_, rec_idx_);
 }
 
-const std::shared_ptr<detail::ColumnMap>& ScanRecords::GetColumnMap() const {
-    if (!column_map_) {
-        BuildColumnMap();
+ScanRecords::Iterator ScanRecords::begin() const { return Iterator(this, 0, 0); }
+
+ScanRecords::Iterator& ScanRecords::Iterator::operator++() {
+    ++rec_idx_;
+    if (owner_->data_) {
+        const auto& infos = owner_->data_->raw->sv_bucket_infos();
+        while (bucket_idx_ < infos.size() && rec_idx_ >= infos[bucket_idx_].record_count) {
+            rec_idx_ = 0;
+            ++bucket_idx_;
+        }
     }
-    return column_map_;
+    return *this;
+}
+
+std::vector<TableBucket> ScanRecords::Buckets() const {
+    std::vector<TableBucket> result;
+    if (!data_) return result;
+    const auto& infos = data_->raw->sv_bucket_infos();
+    result.reserve(infos.size());
+    for (const auto& g : infos) {
+        result.push_back(to_table_bucket(g));
+    }
+    return result;
 }
 
-ScanRecord ScanRecords::operator[](size_t idx) const {
-    if (!inner_) {
+BucketView ScanRecords::Records(const TableBucket& bucket) const {
+    if (!data_) {
+        return BucketView({}, bucket, 0, 0);
+    }
+    const auto& infos = data_->raw->sv_bucket_infos();
+    for (size_t i = 0; i < infos.size(); ++i) {
+        TableBucket tb = to_table_bucket(infos[i]);
+        if (tb == bucket) {
+            return BucketView(data_, std::move(tb), i, infos[i].record_count);
+        }
+    }
+    return BucketView({}, bucket, 0, 0);
+}
+
+BucketView ScanRecords::BucketAt(size_t idx) const {
+    if (!data_) {
         throw std::logic_error("ScanRecords: not available (moved-from or null)");
     }
-    if (idx >= inner_->sv_record_count()) {
-        throw std::out_of_range("ScanRecords: index " + std::to_string(idx) + " out of range (" +
-                                std::to_string(inner_->sv_record_count()) + " records)");
+    const auto& infos = data_->raw->sv_bucket_infos();
+    if (idx >= infos.size()) {
+        throw std::out_of_range("ScanRecords::BucketAt: index " + std::to_string(idx) +
+                                " out of range (" + std::to_string(infos.size()) + " buckets)");
     }
-    return ScanRecord{inner_->sv_bucket_id(idx),
-                      inner_->sv_has_partition_id(idx)
-                          ? std::optional<int64_t>(inner_->sv_partition_id(idx))
-                          : std::nullopt,
-                      inner_->sv_offset(idx),
-                      inner_->sv_timestamp(idx),
-                      static_cast<ChangeType>(inner_->sv_change_type(idx)),
-                      RowView(inner_, idx, GetColumnMap())};
+    return BucketView(data_, to_table_bucket(infos[idx]), idx, infos[idx].record_count);
 }
 
-ScanRecord ScanRecords::Iterator::operator*() const { return owner_->operator[](idx_); }
+ScanRecord BucketView::operator[](size_t idx) const {
+    if (idx >= count_) {
+        throw std::out_of_range("BucketView: index " + std::to_string(idx) + " out of range (" +
+                                std::to_string(count_) + " records)");
+    }
+    return ScanRecord{data_->raw->sv_offset(bucket_idx_, idx),
+                      data_->raw->sv_timestamp(bucket_idx_, idx),
+                      static_cast<ChangeType>(data_->raw->sv_change_type(bucket_idx_, idx)),
+                      RowView(data_, bucket_idx_, idx)};
+}
+
+ScanRecord BucketView::Iterator::operator*() const { return owner_->operator[](idx_); }
 
 // ============================================================================
 // LookupResult — backed by opaque Rust LookupResultInner
@@ -1082,10 +1144,16 @@ Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
                                  std::string(result_box->sv_error_message()));
     }
 
-    out.column_map_.reset();
-    out.inner_ = std::shared_ptr<ffi::ScanResultInner>(
-        result_box.into_raw(),
-        [](ffi::ScanResultInner* p) { rust::Box<ffi::ScanResultInner>::from_raw(p); });
+    // Wrap raw pointer in ScanData immediately so it's never leaked on exception.
+    auto data = std::make_shared<detail::ScanData>(result_box.into_raw(), detail::ColumnMap{});
+    // Build column map eagerly — shared by all RowViews/BucketViews.
+    auto col_count = data->raw->sv_column_count();
+    for (size_t i = 0; i < col_count; ++i) {
+        auto name = data->raw->sv_column_name(i);
+        data->columns[std::string(name.data(), name.size())] = {
+            i, static_cast<TypeId>(data->raw->sv_column_type(i))};
+    }
+    out.data_ = std::move(data);
     return utils::make_ok();
 }
 
diff --git a/fluss-rust/bindings/python/Cargo.toml b/fluss-rust/bindings/python/Cargo.toml
index 804e1bbc0e..9cf20e3d7b 100644
--- a/fluss-rust/bindings/python/Cargo.toml
+++ b/fluss-rust/bindings/python/Cargo.toml
@@ -37,3 +37,4 @@ arrow-array = "57.0.0"
 pyo3-async-runtimes = { version = "0.26.0", features = ["tokio-runtime"] }
 jiff = { workspace = true }
 bigdecimal = "0.4"
+indexmap = "2"
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 9c2b7e308c..3564d91cc5 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -351,21 +351,26 @@ async def main():
 
         record_scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
-        # Poll returns List[ScanRecord] with per-record metadata
+        # Poll returns ScanRecords — records grouped by bucket
         print("\n--- Testing poll() method (record-by-record) ---")
         try:
-            records = record_scanner.poll(5000)
-            print(f"Number of records: {len(records)}")
-
-            # Show first few records with metadata
-            for i, record in enumerate(records[:5]):
-                print(f"  Record {i}: offset={record.offset}, "
-                      f"timestamp={record.timestamp}, "
-                      f"change_type={record.change_type}, "
-                      f"row={record.row}")
-
-            if len(records) > 5:
-                print(f"  ... and {len(records) - 5} more records")
+            scan_records = record_scanner.poll(5000)
+            print(f"Total records: {scan_records.count()}, buckets: {len(scan_records.buckets())}")
+
+            # Flat iteration over all records (regardless of bucket)
+            print(f"  Flat iteration: {scan_records.count()} records")
+            for record in scan_records:
+                print(f"    offset={record.offset}, timestamp={record.timestamp}")
+
+            # Per-bucket access
+            for bucket in scan_records.buckets():
+                bucket_recs = scan_records.records(bucket)
+                print(f"  Bucket {bucket}: {len(bucket_recs)} records")
+                for record in bucket_recs[:3]:
+                    print(f"    offset={record.offset}, "
+                          f"timestamp={record.timestamp}, "
+                          f"change_type={record.change_type}, "
+                          f"row={record.row}")
 
         except Exception as e:
             print(f"Error during poll: {e}")
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 47eeb808b5..4b7fa4e845 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -19,7 +19,7 @@
 
 from enum import IntEnum
 from types import TracebackType
-from typing import Dict, List, Optional, Tuple
+from typing import Dict, Iterator, List, Optional, Tuple, Union, overload
 
 import pandas as pd
 import pyarrow as pa
@@ -43,12 +43,12 @@ class ChangeType(IntEnum):
         ...
 
 class ScanRecord:
-    """Represents a single scan record with metadata."""
+    """Represents a single scan record with metadata.
+
+    The bucket is the key in ScanRecords, not on the individual record
+    (matches Rust/Java).
+    """
 
-    @property
-    def bucket(self) -> TableBucket:
-        """The bucket this record belongs to."""
-        ...
     @property
     def offset(self) -> int:
         """The position of this record in the log."""
@@ -90,6 +90,47 @@ class RecordBatch:
     def __str__(self) -> str: ...
     def __repr__(self) -> str: ...
 
+class ScanRecords:
+    """A collection of scan records grouped by bucket.
+
+    Returned by ``LogScanner.poll()``. Supports flat iteration
+    (``for rec in records``) and per-bucket access (``records.records(bucket)``).
+    """
+
+    def buckets(self) -> List[TableBucket]:
+        """List of distinct buckets that have records."""
+        ...
+    def records(self, bucket: TableBucket) -> List[ScanRecord]:
+        """Get records for a specific bucket. Returns empty list if bucket not present."""
+        ...
+    def count(self) -> int:
+        """Total number of records across all buckets."""
+        ...
+    def is_empty(self) -> bool:
+        """Whether the result set is empty."""
+        ...
+    def keys(self) -> List[TableBucket]:
+        """Mapping protocol: alias for ``buckets()``."""
+        ...
+    def values(self) -> Iterator[List[ScanRecord]]:
+        """Mapping protocol: lazy iterator over record lists, one per bucket."""
+        ...
+    def items(self) -> Iterator[Tuple[TableBucket, List[ScanRecord]]]:
+        """Mapping protocol: lazy iterator over ``(bucket, records)`` pairs."""
+        ...
+    def __len__(self) -> int: ...
+    @overload
+    def __getitem__(self, index: int) -> ScanRecord: ...
+    @overload
+    def __getitem__(self, index: slice) -> List[ScanRecord]: ...
+    @overload
+    def __getitem__(self, bucket: TableBucket) -> List[ScanRecord]: ...
+    def __getitem__(self, key: Union[int, slice, TableBucket]) -> Union[ScanRecord, List[ScanRecord]]: ...
+    def __contains__(self, bucket: TableBucket) -> bool: ...
+    def __iter__(self) -> Iterator[ScanRecord]: ...
+    def __str__(self) -> str: ...
+    def __repr__(self) -> str: ...
+
 class Config:
     def __init__(self, properties: Optional[Dict[str, str]] = None) -> None: ...
     @property
@@ -590,7 +631,7 @@ class LogScanner:
             bucket_id: The bucket ID within the partition
         """
         ...
-    def poll(self, timeout_ms: int) -> List[ScanRecord]:
+    def poll(self, timeout_ms: int) -> ScanRecords:
         """Poll for individual records with metadata.
 
         Requires a record-based scanner (created with new_scan().create_log_scanner()).
@@ -599,11 +640,12 @@ class LogScanner:
             timeout_ms: Timeout in milliseconds to wait for records.
 
         Returns:
-            List of ScanRecord objects, each containing bucket, offset, timestamp,
-            change_type, and row data as a dictionary.
+            ScanRecords grouped by bucket. Supports flat iteration
+            (``for rec in records``) and per-bucket access
+            (``records.buckets()``, ``records.records(bucket)``).
 
         Note:
-            Returns an empty list if no records are available or timeout expires.
+            Returns an empty ScanRecords if no records are available or timeout expires.
         """
         ...
     def poll_record_batch(self, timeout_ms: int) -> List[RecordBatch]:
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 553c8a925e..ebc0d54cc3 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -122,6 +122,7 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<TableBucket>()?;
     m.add_class::<ChangeType>()?;
     m.add_class::<ScanRecord>()?;
+    m.add_class::<ScanRecords>()?;
     m.add_class::<RecordBatch>()?;
     m.add_class::<PartitionInfo>()?;
     m.add_class::<OffsetSpec>()?;
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index c3ea248e04..bc2e956c1a 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -22,7 +22,14 @@ use arrow_pyarrow::{FromPyArrow, ToPyArrow};
 use arrow_schema::SchemaRef;
 use fluss::record::to_arrow_schema;
 use fluss::rpc::message::OffsetSpec;
-use pyo3::types::IntoPyDict;
+use indexmap::IndexMap;
+use pyo3::exceptions::{PyIndexError, PyRuntimeError, PyTypeError};
+use pyo3::sync::PyOnceLock;
+use pyo3::types::{
+    IntoPyDict, PyBool, PyByteArray, PyBytes, PyDate, PyDateAccess, PyDateTime, PyDelta,
+    PyDeltaAccess, PyDict, PyList, PySequence, PySlice, PyTime, PyTimeAccess, PyTuple, PyType,
+    PyTzInfo,
+};
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::collections::HashMap;
 use std::sync::Arc;
@@ -38,11 +45,12 @@ const MICROS_PER_DAY: i64 = 86_400_000_000;
 const NANOS_PER_MILLI: i64 = 1_000_000;
 const NANOS_PER_MICRO: i64 = 1_000;
 
-/// Represents a single scan record with metadata
+/// Represents a single scan record with metadata.
+///
+/// Matches Rust/Java: offset, timestamp, change_type, row.
+/// The bucket is the key in ScanRecords, not on the individual record.
 #[pyclass]
 pub struct ScanRecord {
-    #[pyo3(get)]
-    bucket: TableBucket,
     #[pyo3(get)]
     offset: i64,
     #[pyo3(get)]
@@ -50,21 +58,20 @@ pub struct ScanRecord {
     #[pyo3(get)]
     change_type: ChangeType,
     /// Store row as a Python dict directly
-    row_dict: Py<pyo3::types::PyDict>,
+    row_dict: Py<PyDict>,
 }
 
 #[pymethods]
 impl ScanRecord {
     /// Get the row data as a dictionary
     #[getter]
-    pub fn row(&self, py: Python) -> Py<pyo3::types::PyDict> {
+    pub fn row(&self, py: Python) -> Py<PyDict> {
         self.row_dict.clone_ref(py)
     }
 
     fn __str__(&self) -> String {
         format!(
-            "ScanRecord(bucket={}, offset={}, timestamp={}, change_type={})",
-            self.bucket.__str__(),
+            "ScanRecord(offset={}, timestamp={}, change_type={})",
             self.offset,
             self.timestamp,
             self.change_type.short_string()
@@ -80,13 +87,12 @@ impl ScanRecord {
     /// Create a ScanRecord from core types
     pub fn from_core(
         py: Python,
-        bucket: &fcore::metadata::TableBucket,
         record: &fcore::record::ScanRecord,
         row_type: &fcore::metadata::RowType,
     ) -> PyResult<Self> {
         let fields = row_type.fields();
         let row = record.row();
-        let dict = pyo3::types::PyDict::new(py);
+        let dict = PyDict::new(py);
 
         for (pos, field) in fields.iter().enumerate() {
             let value = datum_to_python_value(py, row, pos, field.data_type())?;
@@ -94,7 +100,6 @@ impl ScanRecord {
         }
 
         Ok(ScanRecord {
-            bucket: TableBucket::from_core(bucket.clone()),
             offset: record.offset(),
             timestamp: record.timestamp(),
             change_type: ChangeType::from_core(*record.change_type()),
@@ -155,6 +160,247 @@ impl RecordBatch {
     }
 }
 
+/// A collection of scan records grouped by bucket.
+///
+/// Returned by `LogScanner.poll()`. Records are grouped by `TableBucket`.
+#[pyclass]
+pub struct ScanRecords {
+    records_by_bucket: IndexMap<TableBucket, Vec<Py<ScanRecord>>>,
+    total_count: usize,
+}
+
+#[pymethods]
+impl ScanRecords {
+    /// List of distinct buckets that have records in this result.
+    pub fn buckets(&self) -> Vec<TableBucket> {
+        self.records_by_bucket.keys().cloned().collect()
+    }
+
+    /// Get records for a specific bucket.
+    ///
+    /// Returns an empty list if the bucket is not present (matches Rust/Java behavior).
+    pub fn records(&self, py: Python, bucket: &TableBucket) -> Vec<Py<ScanRecord>> {
+        self.records_by_bucket
+            .get(bucket)
+            .map(|recs| recs.iter().map(|r| r.clone_ref(py)).collect())
+            .unwrap_or_default()
+    }
+
+    /// Total number of records across all buckets.
+    pub fn count(&self) -> usize {
+        self.total_count
+    }
+
+    /// Whether the result set is empty.
+    pub fn is_empty(&self) -> bool {
+        self.total_count == 0
+    }
+
+    fn __len__(&self) -> usize {
+        self.total_count
+    }
+
+    /// Type-dispatched indexing:
+    ///   records[0]       → ScanRecord (flat index)
+    ///   records[-1]      → ScanRecord (negative index)
+    ///   records[1:3]     → list[ScanRecord] (slice)
+    ///   records[bucket]  → list[ScanRecord] (by bucket; empty if absent)
+    fn __getitem__(&self, py: Python, key: &Bound<'_, PyAny>) -> PyResult<Py<PyAny>> {
+        // Integer keys index the flat sequence of records across all buckets.
+        if let Ok(requested) = key.extract::<isize>() {
+            let len = self.total_count as isize;
+            // Negative indices count back from the end, as for Python lists.
+            let idx = if requested < 0 { requested + len } else { requested };
+            if idx < 0 || idx >= len {
+                // Report the index the caller passed, not the wrapped value.
+                return Err(PyIndexError::new_err(format!(
+                    "index {requested} out of range for ScanRecords of size {len}"
+                )));
+            }
+            // Walk the buckets in order, tracking how many records precede each.
+            let idx = idx as usize;
+            let mut offset = 0;
+            for recs in self.records_by_bucket.values() {
+                if idx < offset + recs.len() {
+                    return Ok(recs[idx - offset].clone_ref(py).into_any());
+                }
+                offset += recs.len();
+            }
+            return Err(PyRuntimeError::new_err(
+                "internal error: total_count out of sync with records",
+            ));
+        }
+        // Slices are resolved against the same flat sequence.
+        if let Ok(slice) = key.downcast::<PySlice>() {
+            let indices = slice.indices(self.total_count as isize)?;
+            let mut result: Vec<Py<ScanRecord>> = Vec::new();
+            let mut i = indices.start;
+            while (indices.step > 0 && i < indices.stop) || (indices.step < 0 && i > indices.stop) {
+                let idx = i as usize;
+                let mut offset = 0;
+                for recs in self.records_by_bucket.values() {
+                    if idx < offset + recs.len() {
+                        result.push(recs[idx - offset].clone_ref(py));
+                        break;
+                    }
+                    offset += recs.len();
+                }
+                i += indices.step;
+            }
+            // Propagate conversion failures as Python exceptions, not panics.
+            return Ok(result.into_pyobject(py)?.into_any().unbind());
+        }
+        // TableBucket keys select that bucket's records.
+        if let Ok(bucket) = key.extract::<TableBucket>() {
+            let recs = self.records(py, &bucket);
+            return Ok(recs.into_pyobject(py)?.into_any().unbind());
+        }
+        Err(PyTypeError::new_err("index must be int, slice, or TableBucket"))
+    }
+
+    /// Support `bucket in records`.
+    fn __contains__(&self, bucket: &TableBucket) -> bool {
+        self.records_by_bucket.contains_key(bucket)
+    }
+
+    /// Mapping protocol: alias for `buckets()`.
+    pub fn keys(&self) -> Vec<TableBucket> {
+        self.buckets()
+    }
+
+    /// Mapping protocol: iterate lazily over each bucket's `list[ScanRecord]`.
+    pub fn values(slf: Bound<'_, Self>) -> ScanRecordsBucketIter {
+        // Snapshot the bucket order; the temporary borrow is released at the
+        // end of this statement, before `slf` is moved into the iterator.
+        let bucket_keys = slf.borrow().buckets();
+        ScanRecordsBucketIter {
+            with_keys: false,
+            bucket_idx: 0,
+            bucket_keys,
+            owner: slf.unbind(),
+        }
+    }
+
+    /// Mapping protocol: iterate lazily over `(TableBucket, list[ScanRecord])` pairs.
+    pub fn items(slf: Bound<'_, Self>) -> ScanRecordsBucketIter {
+        // Snapshot the bucket order; the temporary borrow is released at the
+        // end of this statement, before `slf` is moved into the iterator.
+        let bucket_keys = slf.borrow().buckets();
+        ScanRecordsBucketIter {
+            with_keys: true,
+            bucket_idx: 0,
+            bucket_keys,
+            owner: slf.unbind(),
+        }
+    }
+
+    fn __str__(&self) -> String {
+        format!(
+            "ScanRecords(records={}, buckets={})",
+            self.total_count,
+            self.records_by_bucket.len()
+        )
+    }
+
+    fn __repr__(&self) -> String {
+        self.__str__()
+    }
+
+    /// Iterate over every record of every bucket as one flat sequence
+    /// (matches Java/Rust).
+    fn __iter__(slf: Bound<'_, Self>) -> ScanRecordsIter {
+        // The borrow guard is a temporary, so it is gone before `slf` is moved.
+        let bucket_keys = slf.borrow().buckets();
+        ScanRecordsIter {
+            bucket_idx: 0,
+            rec_idx: 0,
+            bucket_keys,
+            owner: slf.unbind(),
+        }
+    }
+}
+
+/// Flat iterator backing `ScanRecords.__iter__`: yields every record,
+/// bucket by bucket, following the order of `bucket_keys`.
+#[pyclass]
+struct ScanRecordsIter {
+    owner: Py<ScanRecords>,
+    bucket_keys: Vec<TableBucket>,
+    // Cursor: index into `bucket_keys`, then index within that bucket's records.
+    bucket_idx: usize,
+    rec_idx: usize,
+}
+
+#[pymethods]
+impl ScanRecordsIter {
+    fn __iter__(slf: PyRef<'_, Self>) -> PyRef<'_, Self> {
+        slf
+    }
+
+    /// Return the next record, or `None` once every bucket is exhausted.
+    fn __next__(&mut self, py: Python) -> Option<Py<ScanRecord>> {
+        let scan = self.owner.borrow(py);
+        while let Some(key) = self.bucket_keys.get(self.bucket_idx) {
+            let at = self.rec_idx;
+            if let Some(rec) = scan.records_by_bucket.get(key).and_then(|recs| recs.get(at)) {
+                self.rec_idx += 1;
+                return Some(rec.clone_ref(py));
+            }
+            // Bucket exhausted (or absent from the map): advance to the next one.
+            self.bucket_idx += 1;
+            self.rec_idx = 0;
+        }
+        None
+    }
+}
+
+/// Lazy iterator for `ScanRecords.items()` and `ScanRecords.values()`.
+///
+/// Yields one bucket at a time: `(TableBucket, list[ScanRecord])` for items,
+/// or `list[ScanRecord]` for values. Only materializes records for the
+/// current bucket on each `__next__` call.
+#[pyclass]
+pub struct ScanRecordsBucketIter {
+    owner: Py<ScanRecords>,
+    bucket_keys: Vec<TableBucket>,
+    bucket_idx: usize,
+    with_keys: bool,
+}
+
+#[pymethods]
+impl ScanRecordsBucketIter {
+    fn __iter__(slf: PyRef<'_, Self>) -> PyRef<'_, Self> {
+        slf
+    }
+
+    /// Yield the next bucket's records (paired with its key when `with_keys`).
+    ///
+    /// Conversion failures surface as Python exceptions rather than panics.
+    fn __next__(&mut self, py: Python) -> PyResult<Option<Py<PyAny>>> {
+        if self.bucket_idx >= self.bucket_keys.len() {
+            return Ok(None);
+        }
+        let bucket = &self.bucket_keys[self.bucket_idx];
+        let owner = self.owner.borrow(py);
+        // Clone handles for this bucket only; a bucket missing from the map yields [].
+        let recs = owner
+            .records_by_bucket
+            .get(bucket)
+            .map(|recs| recs.iter().map(|r| r.clone_ref(py)).collect::<Vec<_>>())
+            .unwrap_or_default();
+        let bucket = bucket.clone();
+        // Advance before converting, so a failed conversion still moves the cursor.
+        self.bucket_idx += 1;
+
+        let item = if self.with_keys {
+            (bucket, recs).into_pyobject(py)?.into_any()
+        } else {
+            recs.into_pyobject(py)?.into_any()
+        };
+        Ok(Some(item.unbind()))
+    }
+}
+
 /// Represents a Fluss table for data operations
 #[pyclass]
 pub struct FlussTable {
@@ -763,9 +1009,9 @@ impl AppendWriter {
 /// Represents different input shapes for a row
 #[derive(FromPyObject)]
 enum RowInput<'py> {
-    Dict(Bound<'py, pyo3::types::PyDict>),
-    Tuple(Bound<'py, pyo3::types::PyTuple>),
-    List(Bound<'py, pyo3::types::PyList>),
+    Dict(Bound<'py, PyDict>),
+    Tuple(Bound<'py, PyTuple>),
+    List(Bound<'py, PyList>),
 }
 
 /// Convert Python row (dict/list/tuple) to GenericRow requiring all schema columns.
@@ -779,7 +1025,7 @@ pub fn python_to_generic_row(
 
 /// Process a Python sequence (list or tuple) into datums at the target column positions.
 fn process_sequence(
-    seq: &Bound<pyo3::types::PySequence>,
+    seq: &Bound<PySequence>,
     target_indices: &[usize],
     fields: &[fcore::metadata::DataField],
     datums: &mut [fcore::row::Datum<'static>],
@@ -924,7 +1170,7 @@ fn python_value_to_datum(
         }
         fcore::metadata::DataType::TinyInt(_) => {
             // Strict type checking: reject bool for int columns
-            if value.is_instance_of::<pyo3::types::PyBool>() {
+            if value.is_instance_of::<PyBool>() {
                 return Err(FlussError::new_err(
                     "Expected int for TinyInt column, got bool. Use 0 or 1 explicitly.".to_string(),
                 ));
@@ -933,7 +1179,7 @@ fn python_value_to_datum(
             Ok(Datum::Int8(v))
         }
         fcore::metadata::DataType::SmallInt(_) => {
-            if value.is_instance_of::<pyo3::types::PyBool>() {
+            if value.is_instance_of::<PyBool>() {
                 return Err(FlussError::new_err(
                     "Expected int for SmallInt column, got bool. Use 0 or 1 explicitly."
                         .to_string(),
@@ -943,7 +1189,7 @@ fn python_value_to_datum(
             Ok(Datum::Int16(v))
         }
         fcore::metadata::DataType::Int(_) => {
-            if value.is_instance_of::<pyo3::types::PyBool>() {
+            if value.is_instance_of::<PyBool>() {
                 return Err(FlussError::new_err(
                     "Expected int for Int column, got bool. Use 0 or 1 explicitly.".to_string(),
                 ));
@@ -952,7 +1198,7 @@ fn python_value_to_datum(
             Ok(Datum::Int32(v))
         }
         fcore::metadata::DataType::BigInt(_) => {
-            if value.is_instance_of::<pyo3::types::PyBool>() {
+            if value.is_instance_of::<PyBool>() {
                 return Err(FlussError::new_err(
                     "Expected int for BigInt column, got bool. Use 0 or 1 explicitly.".to_string(),
                 ));
@@ -975,9 +1221,9 @@ fn python_value_to_datum(
         fcore::metadata::DataType::Bytes(_) | fcore::metadata::DataType::Binary(_) => {
             // Efficient extraction: downcast to specific type and use bulk copy.
             // PyBytes::as_bytes() and PyByteArray::to_vec() are O(n) bulk copies of the underlying data.
-            if let Ok(bytes) = value.downcast::<pyo3::types::PyBytes>() {
+            if let Ok(bytes) = value.downcast::<PyBytes>() {
                 Ok(bytes.as_bytes().to_vec().into())
-            } else if let Ok(bytearray) = value.downcast::<pyo3::types::PyByteArray>() {
+            } else if let Ok(bytearray) = value.downcast::<PyByteArray>() {
                 Ok(bytearray.to_vec().into())
             } else {
                 Err(FlussError::new_err(format!(
@@ -1067,11 +1313,11 @@ pub fn datum_to_python_value(
         }
         DataType::Bytes(_) => {
             let b = row.get_bytes(pos);
-            Ok(pyo3::types::PyBytes::new(py, b).into_any().unbind())
+            Ok(PyBytes::new(py, b).into_any().unbind())
         }
         DataType::Binary(binary_type) => {
             let b = row.get_binary(pos, binary_type.length());
-            Ok(pyo3::types::PyBytes::new(py, b).into_any().unbind())
+            Ok(PyBytes::new(py, b).into_any().unbind())
         }
         DataType::Decimal(decimal_type) => {
             let decimal = row.get_decimal(
@@ -1113,8 +1359,6 @@ fn rust_decimal_to_python(py: Python, decimal: &fcore::row::Decimal) -> PyResult
 
 /// Convert Rust Date (days since epoch) to Python datetime.date
 fn rust_date_to_python(py: Python, date: fcore::row::Date) -> PyResult<Py<PyAny>> {
-    use pyo3::types::PyDate;
-
     let days_since_epoch = date.get_inner();
     let epoch = jiff::civil::date(1970, 1, 1);
     let civil_date = epoch + jiff::Span::new().days(days_since_epoch as i64);
@@ -1130,8 +1374,6 @@ fn rust_date_to_python(py: Python, date: fcore::row::Date) -> PyResult<Py<PyAny>
 
 /// Convert Rust Time (millis since midnight) to Python datetime.time
 fn rust_time_to_python(py: Python, time: fcore::row::Time) -> PyResult<Py<PyAny>> {
-    use pyo3::types::PyTime;
-
     let millis = time.get_inner() as i64;
     let hours = millis / MILLIS_PER_HOUR;
     let minutes = (millis % MILLIS_PER_HOUR) / MILLIS_PER_MINUTE;
@@ -1151,8 +1393,6 @@ fn rust_time_to_python(py: Python, time: fcore::row::Time) -> PyResult<Py<PyAny>
 
 /// Convert Rust TimestampNtz to Python naive datetime
 fn rust_timestamp_ntz_to_python(py: Python, ts: fcore::row::TimestampNtz) -> PyResult<Py<PyAny>> {
-    use pyo3::types::PyDateTime;
-
     let millis = ts.get_millisecond();
     let nanos = ts.get_nano_of_millisecond();
     let total_micros = millis * MICROS_PER_MILLI + (nanos as i64 / NANOS_PER_MICRO);
@@ -1178,8 +1418,6 @@ fn rust_timestamp_ntz_to_python(py: Python, ts: fcore::row::TimestampNtz) -> PyR
 
 /// Convert Rust TimestampLtz to Python timezone-aware datetime (UTC)
 fn rust_timestamp_ltz_to_python(py: Python, ts: fcore::row::TimestampLtz) -> PyResult<Py<PyAny>> {
-    use pyo3::types::PyDateTime;
-
     let millis = ts.get_epoch_millisecond();
     let nanos = ts.get_nano_of_millisecond();
     let total_micros = millis * MICROS_PER_MILLI + (nanos as i64 / NANOS_PER_MICRO);
@@ -1212,7 +1450,7 @@ pub fn internal_row_to_dict(
 ) -> PyResult<Py<PyAny>> {
     let row_type = table_info.row_type();
     let fields = row_type.fields();
-    let dict = pyo3::types::PyDict::new(py);
+    let dict = PyDict::new(py);
 
     for (pos, field) in fields.iter().enumerate() {
         let value = datum_to_python_value(py, row, pos, field.data_type())?;
@@ -1224,29 +1462,26 @@ pub fn internal_row_to_dict(
 
 /// Cached decimal.Decimal type
 /// Uses PyOnceLock for thread-safety and subinterpreter compatibility.
-static DECIMAL_TYPE: pyo3::sync::PyOnceLock<Py<pyo3::types::PyType>> =
-    pyo3::sync::PyOnceLock::new();
+static DECIMAL_TYPE: PyOnceLock<Py<PyType>> = PyOnceLock::new();
 
 /// Cached UTC timezone
-static UTC_TIMEZONE: pyo3::sync::PyOnceLock<Py<PyAny>> = pyo3::sync::PyOnceLock::new();
+static UTC_TIMEZONE: PyOnceLock<Py<PyAny>> = PyOnceLock::new();
 
 /// Cached UTC epoch type
-static UTC_EPOCH: pyo3::sync::PyOnceLock<Py<PyAny>> = pyo3::sync::PyOnceLock::new();
+static UTC_EPOCH: PyOnceLock<Py<PyAny>> = PyOnceLock::new();
 
 /// Get the cached decimal.Decimal type, importing it once per interpreter.
-fn get_decimal_type(py: Python) -> PyResult<Bound<pyo3::types::PyType>> {
+fn get_decimal_type(py: Python) -> PyResult<Bound<PyType>> {
     let ty = DECIMAL_TYPE.get_or_try_init(py, || -> PyResult<_> {
         let decimal_mod = py.import("decimal")?;
-        let decimal_ty = decimal_mod
-            .getattr("Decimal")?
-            .downcast_into::<pyo3::types::PyType>()?;
+        let decimal_ty = decimal_mod.getattr("Decimal")?.downcast_into::<PyType>()?;
         Ok(decimal_ty.unbind())
     })?;
     Ok(ty.bind(py).clone())
 }
 
 /// Get the cached UTC timezone (datetime.timezone.utc), creating it once per interpreter.
-fn get_utc_timezone(py: Python) -> PyResult<Bound<pyo3::types::PyTzInfo>> {
+fn get_utc_timezone(py: Python) -> PyResult<Bound<PyTzInfo>> {
     let tz = UTC_TIMEZONE.get_or_try_init(py, || -> PyResult<_> {
         let datetime_mod = py.import("datetime")?;
         let timezone = datetime_mod.getattr("timezone")?;
@@ -1254,10 +1489,7 @@ fn get_utc_timezone(py: Python) -> PyResult<Bound<pyo3::types::PyTzInfo>> {
         Ok(utc.unbind())
     })?;
     // Downcast to PyTzInfo for use with PyDateTime::new()
-    Ok(tz
-        .bind(py)
-        .clone()
-        .downcast_into::<pyo3::types::PyTzInfo>()?)
+    Ok(tz.bind(py).clone().downcast_into::<PyTzInfo>()?)
 }
 
 /// Get the cached UTC epoch datetime, creating it once per interpreter.
@@ -1313,8 +1545,6 @@ fn python_decimal_to_datum(
 
 /// Convert Python datetime.date to Datum::Date.
 fn python_date_to_datum(value: &Bound<PyAny>) -> PyResult<fcore::row::Datum<'static>> {
-    use pyo3::types::{PyDate, PyDateAccess, PyDateTime};
-
     // Reject datetime.datetime (subclass of date) - use timestamp columns for those
     if value.downcast::<PyDateTime>().is_ok() {
         return Err(FlussError::new_err(
@@ -1351,8 +1581,6 @@ fn python_date_to_datum(value: &Bound<PyAny>) -> PyResult<fcore::row::Datum<'sta
 /// Sub-millisecond precision (microseconds not divisible by 1000) will raise an error
 /// to prevent silent data loss and ensure fail-fast behavior.
 fn python_time_to_datum(value: &Bound<PyAny>) -> PyResult<fcore::row::Datum<'static>> {
-    use pyo3::types::{PyTime, PyTimeAccess};
-
     let time = value.downcast::<PyTime>().map_err(|_| {
         FlussError::new_err(format!(
             "Expected datetime.time, got {}",
@@ -1411,8 +1639,6 @@ fn python_datetime_to_timestamp_ltz(value: &Bound<PyAny>) -> PyResult<fcore::row
 /// Uses integer arithmetic to avoid float precision issues.
 /// For clarity, tz-aware datetimes are rejected - use TimestampLtz for those.
 fn extract_datetime_components_ntz(value: &Bound<PyAny>) -> PyResult<(i64, i32)> {
-    use pyo3::types::PyDateTime;
-
     // Try PyDateTime first
     if let Ok(dt) = value.downcast::<PyDateTime>() {
         // Reject tz-aware datetime for NTZ - it's ambiguous what the user wants
@@ -1465,8 +1691,6 @@ fn extract_datetime_components_ntz(value: &Bound<PyAny>) -> PyResult<(i64, i32)>
 /// Extract epoch milliseconds for TimestampLtz (instant in time, UTC-based).
 /// For naive datetimes, assumes UTC. For aware datetimes, converts to UTC.
 fn extract_datetime_components_ltz(value: &Bound<PyAny>) -> PyResult<(i64, i32)> {
-    use pyo3::types::PyDateTime;
-
     // Try PyDateTime first
     if let Ok(dt) = value.downcast::<PyDateTime>() {
         // Check if timezone-aware
@@ -1506,11 +1730,7 @@ fn extract_datetime_components_ltz(value: &Bound<PyAny>) -> PyResult<(i64, i32)>
 }
 
 /// Convert datetime components to epoch milliseconds treating them as UTC
-fn datetime_to_epoch_millis_as_utc(
-    dt: &pyo3::Bound<'_, pyo3::types::PyDateTime>,
-) -> PyResult<(i64, i32)> {
-    use pyo3::types::{PyDateAccess, PyTimeAccess};
-
+fn datetime_to_epoch_millis_as_utc(dt: &Bound<'_, PyDateTime>) -> PyResult<(i64, i32)> {
     let year = dt.get_year();
     let month = dt.get_month();
     let day = dt.get_day();
@@ -1541,11 +1761,7 @@ fn datetime_to_epoch_millis_as_utc(
 /// Convert timezone-aware datetime to epoch milliseconds using Python's timedelta.
 /// This correctly handles timezone conversions by computing (dt - UTC_EPOCH).
 /// The UTC epoch is cached for performance.
-fn datetime_to_epoch_millis_utc_aware(
-    dt: &pyo3::Bound<'_, pyo3::types::PyDateTime>,
-) -> PyResult<(i64, i32)> {
-    use pyo3::types::{PyDelta, PyDeltaAccess};
-
+fn datetime_to_epoch_millis_utc_aware(dt: &Bound<'_, PyDateTime>) -> PyResult<(i64, i32)> {
     let py = dt.py();
     let epoch = get_utc_epoch(py)?;
 
@@ -1777,14 +1993,15 @@ impl LogScanner {
     ///     timeout_ms: Timeout in milliseconds to wait for records
     ///
     /// Returns:
-    ///     List of ScanRecord objects, each containing bucket, offset, timestamp,
-    ///     change_type, and row data as a dictionary.
+    ///     ScanRecords grouped by bucket. Supports flat iteration
+    ///     (`for rec in records`) and per-bucket access (`records.buckets()`,
+    ///     `records.records(bucket)`, `records[bucket]`).
     ///
     /// Note:
     ///     - Requires a record-based scanner (created with new_scan().create_log_scanner())
-    ///     - Returns an empty list if no records are available
-    ///     - When timeout expires, returns an empty list (NOT an error)
-    fn poll(&self, py: Python, timeout_ms: i64) -> PyResult<Vec<ScanRecord>> {
+    ///     - Returns an empty ScanRecords if no records are available
+    ///     - When timeout expires, returns an empty ScanRecords (NOT an error)
+    fn poll(&self, py: Python, timeout_ms: i64) -> PyResult<ScanRecords> {
         let scanner = self.scanner.as_record()?;
 
         if timeout_ms < 0 {
@@ -1798,19 +2015,26 @@ impl LogScanner {
             .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
             .map_err(|e| FlussError::from_core_error(&e))?;
 
-        // Convert ScanRecords to Python ScanRecord list
-        // Use projected_row_type to handle column projection correctly
+        // Convert core ScanRecords to Python ScanRecords grouped by bucket
         let row_type = &self.projected_row_type;
-        let mut result = Vec::new();
+        let mut records_by_bucket = IndexMap::new();
+        let mut total_count = 0usize;
 
         for (bucket, records) in scan_records.into_records_by_buckets() {
-            for record in records {
-                let scan_record = ScanRecord::from_core(py, &bucket, &record, row_type)?;
-                result.push(scan_record);
+            let py_bucket = TableBucket::from_core(bucket);
+            let mut py_records = Vec::with_capacity(records.len());
+            for record in &records {
+                let scan_record = ScanRecord::from_core(py, record, row_type)?;
+                py_records.push(Py::new(py, scan_record)?);
+                total_count += 1;
             }
+            records_by_bucket.insert(py_bucket, py_records);
         }
 
-        Ok(result)
+        Ok(ScanRecords {
+            records_by_bucket,
+            total_count,
+        })
     }
 
     /// Poll for batches with metadata.
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
index 09586aa8de..bfa9789734 100644
--- a/fluss-rust/bindings/python/test/test_log_table.py
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -492,11 +492,22 @@ async def test_partitioned_table_append_scan(connection, admin):
         (8, "EU", 800),
     ]
 
-    records = _poll_records(scanner, expected_count=8)
-    assert len(records) == 8
+    # Poll and verify per-bucket grouping
+    all_records = []
+    deadline = time.monotonic() + 10
+    while len(all_records) < 8 and time.monotonic() < deadline:
+        scan_records = scanner.poll(5000)
+        for bucket, bucket_records in scan_records.items():
+            assert bucket.partition_id is not None, "Partitioned table should have partition_id"
+            # All records in a bucket should belong to the same partition
+            regions = {r.row["region"] for r in bucket_records}
+            assert len(regions) == 1, f"Bucket has mixed regions: {regions}"
+            all_records.extend(bucket_records)
+
+    assert len(all_records) == 8
 
     collected = sorted(
-        [(r.row["id"], r.row["region"], r.row["value"]) for r in records],
+        [(r.row["id"], r.row["region"], r.row["value"]) for r in all_records],
         key=lambda x: x[0],
     )
     assert collected == expected
@@ -652,6 +663,70 @@ async def test_partitioned_table_to_arrow(connection, admin):
     await admin.drop_table(table_path, ignore_if_not_exists=False)
 
 
+async def test_scan_records_indexing_and_slicing(connection, admin):
+    """Test ScanRecords indexing, slicing (incl. negative steps), and iteration consistency."""
+    table_path = fluss.TablePath("fluss", "py_test_scan_records_indexing")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("val", pa.string())])
+    )
+    await admin.create_table(table_path, fluss.TableDescriptor(schema))
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [pa.array(list(range(1, 9)), type=pa.int32()),
+             pa.array([f"v{i}" for i in range(1, 9)])],
+            schema=pa.schema([pa.field("id", pa.int32()), pa.field("val", pa.string())]),
+        )
+    )
+    await writer.flush()
+
+    scanner = await table.new_scan().create_log_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+    # Poll until a single ScanRecords holds at least 2 records (needed for the slice tests)
+    sr = None
+    deadline = time.monotonic() + 10
+    while time.monotonic() < deadline:
+        sr = scanner.poll(5000)
+        if len(sr) >= 2:
+            break
+    assert sr is not None and len(sr) >= 2, "Expected at least 2 records"
+    n = len(sr)
+    offsets = [sr[i].offset for i in range(n)]
+
+    # Iteration and indexing must produce the same order
+    assert [r.offset for r in sr] == offsets
+
+    # Negative indexing
+    assert sr[-1].offset == offsets[-1]
+    assert sr[-n].offset == offsets[0]
+
+    # Verify slices match the same operation on the offsets reference list
+    test_slices = [
+        slice(1, n - 1),          # forward subrange
+        slice(None, None, -1),    # [::-1] full reverse
+        slice(n - 2, 0, -1),      # reverse with bounds
+        slice(n - 1, 0, -2),      # reverse with step
+        slice(None, None, 2),     # [::2]
+        slice(1, None, 3),        # [1::3]
+        slice(2, 2),              # empty
+    ]
+    for s in test_slices:
+        result = [r.offset for r in sr[s]]
+        assert result == offsets[s], f"slice {s}: got {result}, expected {offsets[s]}"
+
+    # Bucket-based indexing
+    for bucket in sr.buckets():
+        assert len(sr[bucket]) > 0
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
 # ---------------------------------------------------------------------------
 # Helpers
 # ---------------------------------------------------------------------------
@@ -667,6 +742,8 @@ def _poll_records(scanner, expected_count, timeout_s=10):
     return collected
 
 
+
+
 def _poll_arrow_ids(scanner, expected_count, timeout_s=10):
     """Poll a batch scanner and extract 'id' column values."""
     all_ids = []
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index a07dd6c6e0..433c5da9de 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -250,23 +250,60 @@ Read-only row view for scan results. Provides zero-copy access to string and byt
 
 `ScanRecord` is a value type that can be freely copied, stored, and accumulated across multiple `Poll()` calls. It shares ownership of the underlying scan data via reference counting.
 
-| Field          | Type                    |  Description                     |
-|----------------|-------------------------|----------------------------------|
-| `bucket_id`    | `int32_t`               | Bucket this record belongs to    |
-| `partition_id` | `std::optional<int64_t>`| Partition ID (if partitioned)    |
-| `offset`       | `int64_t`               | Record offset in the log         |
-| `timestamp`    | `int64_t`               | Record timestamp                 |
-| `change_type`  | `ChangeType`            | Type of change (see `ChangeType`)|
-| `row`          | `RowView`               | Read-only row view for field access |
+| Field         | Type         |  Description                                                        |
+|---------------|--------------|---------------------------------------------------------------------|
+| `offset`      | `int64_t`    | Record offset in the log                                            |
+| `timestamp`   | `int64_t`    | Record timestamp                                                    |
+| `change_type` | `ChangeType` | Change type (AppendOnly, Insert, UpdateBefore, UpdateAfter, Delete) |
+| `row`         | `RowView`    | Row data (value type, shares ownership via reference counting)      |
 
 ## `ScanRecords`
 
-| Method                                 |  Description                               |
-|----------------------------------------|--------------------------------------------|
-| `Size() -> size_t`                     | Number of records                          |
-| `Empty() -> bool`                      | Check if empty                             |
-| `operator[](size_t idx) -> ScanRecord` | Access record by index                     |
-| `begin() / end()`                      | Iterator support for range-based for loops |
+### Flat Access
+
+| Method                                  |  Description                               |
+|-----------------------------------------|--------------------------------------------|
+| `Count() -> size_t`                     | Total number of records across all buckets |
+| `IsEmpty() -> bool`                     | Check if empty                             |
+| `begin() / end()`                       | Iterator support for range-based for loops |
+
+Flat iteration over all records (regardless of bucket):
+
+```cpp
+for (const auto& rec : records) {
+    std::cout << "offset=" << rec.offset << std::endl;
+}
+```
+
+### Per-Bucket Access
+
+| Method                                                          |  Description                                                          |
+|-----------------------------------------------------------------|-----------------------------------------------------------------------|
+| `BucketCount() -> size_t`                                       | Number of distinct buckets                                            |
+| `Buckets() -> std::vector<TableBucket>`                         | List of distinct buckets                                              |
+| `Records(const TableBucket& bucket) -> BucketView`              | Records for a specific bucket (empty view if bucket not present)      |
+| `BucketAt(size_t idx) -> BucketView`                            | Records by bucket index (0-based, O(1))                               |
+
+## `BucketView`
+
+A view of records within a single bucket. Obtained from `ScanRecords::Records()` or `ScanRecords::BucketAt()`. `BucketView` is a value type — it shares ownership of the underlying scan data via reference counting, so it can safely outlive the `ScanRecords` that produced it.
+
+| Method                                     |  Description                               |
+|--------------------------------------------|--------------------------------------------|
+| `Size() -> size_t`                         | Number of records in this bucket           |
+| `Empty() -> bool`                          | Check if empty                             |
+| `Bucket() -> const TableBucket&`           | Get the bucket                             |
+| `operator[](size_t idx) -> ScanRecord`     | Access record by index within this bucket  |
+| `begin() / end()`                          | Iterator support for range-based for loops |
+
+## `TableBucket`
+
+| Field / Method                           |  Description                                    |
+|------------------------------------------|-------------------------------------------------|
+| `table_id -> int64_t`                    | Table ID                                        |
+| `bucket_id -> int32_t`                   | Bucket ID                                       |
+| `partition_id -> std::optional<int64_t>` | Partition ID (empty if non-partitioned)         |
+| `operator==(const TableBucket&) -> bool` | Equality comparison                             |
 
 ## `LookupResult`
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md b/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md
index 3a862c18e4..0125a4ce29 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/log-tables.md
@@ -60,6 +60,18 @@ for (const auto& rec : records) {
               << " timestamp=" << rec.row.GetInt64(2)
               << " @ offset=" << rec.offset << std::endl;
 }
+
+// Or per-bucket access
+for (const auto& bucket : records.Buckets()) {
+    auto view = records.Records(bucket);
+    std::cout << "Bucket " << bucket.bucket_id << ": "
+              << view.Size() << " records" << std::endl;
+    for (const auto& rec : view) {
+        std::cout << "  event_id=" << rec.row.GetInt32(0)
+                  << " event_type=" << rec.row.GetString(1)
+                  << " @ offset=" << rec.offset << std::endl;
+    }
+}
 ```
 
 **Continuous polling:**
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index af03058a04..27a57dc1b8 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -137,17 +137,69 @@ Builder for creating a `Lookuper`. Obtain via `FlussTable.new_lookup()`.
 | `.subscribe_partition_buckets(partition_bucket_offsets)`      | Subscribe to multiple partition+bucket combos (`{(part_id, bucket_id): offset}`) |
 | `.unsubscribe(bucket_id)`                                     | Unsubscribe from a bucket (non-partitioned tables)                               |
 | `.unsubscribe_partition(partition_id, bucket_id)`             | Unsubscribe from a partition bucket                                              |
-| `.poll(timeout_ms) -> list[ScanRecord]`                       | Poll individual records (record scanner only)                                    |
+| `.poll(timeout_ms) -> ScanRecords`                            | Poll individual records (record scanner only)                                    |
 | `.poll_arrow(timeout_ms) -> pa.Table`                         | Poll as Arrow Table (batch scanner only)                                         |
 | `.poll_record_batch(timeout_ms) -> list[RecordBatch]`         | Poll batches with metadata (batch scanner only)                                  |
 | `.to_arrow() -> pa.Table`                                     | Read all subscribed data as Arrow Table (batch scanner only)                     |
 | `.to_pandas() -> pd.DataFrame`                                | Read all subscribed data as DataFrame (batch scanner only)                       |
 
+## `ScanRecords`
+
+Returned by `LogScanner.poll()`. Records are grouped by bucket.
+
+> **Note:** Flat iteration and integer indexing traverse buckets in an arbitrary order that is consistent within a single `ScanRecords` instance but may differ between `poll()` calls. Use per-bucket access (`.items()`, `.records(bucket)`) when bucket ordering matters.
+
+```python
+scan_records = scanner.poll(timeout_ms=5000)
+
+# Sequence access
+scan_records[0]                              # first record
+scan_records[-1]                             # last record
+scan_records[:5]                             # first 5 records
+
+# Per-bucket access
+for bucket, records in scan_records.items():
+    for record in records:
+        print(f"bucket={bucket.bucket_id}, offset={record.offset}, row={record.row}")
+
+# Flat iteration
+for record in scan_records:
+    print(record.row)
+```
+
+### Methods
+
+| Method                                 |  Description                                                     |
+|----------------------------------------|------------------------------------------------------------------|
+| `.buckets() -> list[TableBucket]`      | List of distinct buckets                                         |
+| `.records(bucket) -> list[ScanRecord]` | Records for a specific bucket (empty list if bucket not present) |
+| `.count() -> int`                      | Total record count across all buckets                            |
+| `.is_empty() -> bool`                  | Check if empty                                                   |
+
+### Indexing
+
+| Expression                   | Returns              | Description                       |
+|------------------------------|----------------------|-----------------------------------|
+| `scan_records[0]`            | `ScanRecord`         | Record by flat index              |
+| `scan_records[-1]`           | `ScanRecord`         | Negative indexing                 |
+| `scan_records[1:5]`          | `list[ScanRecord]`   | Slice                             |
+| `scan_records[bucket]`       | `list[ScanRecord]`   | Records for a bucket              |
+
+### Mapping Protocol
+
+| Method / Protocol              | Description                                     |
+|--------------------------------|-------------------------------------------------|
+| `.keys()`                      | Same as `.buckets()`                            |
+| `.values()`                    | Lazy iterator over record lists, one per bucket |
+| `.items()`                     | Lazy iterator over `(bucket, records)` pairs    |
+| `len(scan_records)`            | Same as `.count()`                              |
+| `bucket in scan_records`       | Membership test                                 |
+| `for record in scan_records`   | Flat iteration over all records                 |
+
 ## `ScanRecord`
 
 | Property                     |  Description                                                        |
 |------------------------------|---------------------------------------------------------------------|
-| `.bucket -> TableBucket`     | Bucket this record belongs to                                       |
 | `.offset -> int`             | Record offset in the log                                            |
 | `.timestamp -> int`          | Record timestamp                                                    |
 | `.change_type -> ChangeType` | Change type (AppendOnly, Insert, UpdateBefore, UpdateAfter, Delete) |
diff --git a/fluss-rust/website/docs/user-guide/python/example/log-tables.md b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
index 6e44e0610d..adaa162ada 100644
--- a/fluss-rust/website/docs/user-guide/python/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
@@ -83,13 +83,20 @@ while True:
     if result.num_rows > 0:
         print(result.to_pandas())
 
-# Record scanner: poll individual records with metadata
+# Record scanner: poll individual records
 scanner = await table.new_scan().create_log_scanner()
 scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
 while True:
-    for record in scanner.poll(timeout_ms=5000):
+    scan_records = scanner.poll(timeout_ms=5000)
+
+    for record in scan_records:
         print(f"offset={record.offset}, change={record.change_type.short_string()}, row={record.row}")
+
+    # Or per-bucket access (dict-like)
+    for bucket, records in scan_records.items():
+        for record in records:
+            print(f"bucket={bucket.bucket_id}, offset={record.offset}, row={record.row}")
 ```
 
 ### Unsubscribing
diff --git a/fluss-rust/website/docs/user-guide/rust/example/log-tables.md b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
index 3ba33542fb..f5a4d0e25e 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
@@ -63,6 +63,21 @@ log_scanner.subscribe(0, 0).await?;
 // Poll for records
 let records = log_scanner.poll(Duration::from_secs(10)).await?;
 
+// Per-bucket access
+for (bucket, bucket_records) in records.records_by_buckets() {
+    println!("Bucket {}: {} records", bucket.bucket_id(), bucket_records.len());
+    for record in bucket_records {
+        let row = record.row();
+        println!(
+            "  event_id={}, event_type={} @ offset={}",
+            row.get_int(0),
+            row.get_string(1),
+            record.offset()
+        );
+    }
+}
+
+// Or flat iteration (consumes ScanRecords)
 for record in records {
     let row = record.row();
     println!(

From 0f4556061980ab953df6fd5f8bf737f5a3541656 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sun, 22 Feb 2026 02:55:42 +0000
Subject: [PATCH 162/287] chore: introduce c++ integration test (#352)

---
 .../.github/workflows/build_and_test_cpp.yml  |  78 ++
 .../workflows/build_and_test_python.yml       |  81 ++
 .../.github/workflows/build_and_test_rust.yml |  85 ++
 ...docs-check.yml => check_documentation.yml} |   4 +-
 .../check_license_and_formatting.yml          |  60 ++
 fluss-rust/.github/workflows/ci.yml           | 187 ----
 fluss-rust/bindings/cpp/CMakeLists.txt        |  23 +
 fluss-rust/bindings/cpp/test/test_admin.cpp   | 331 +++++++
 .../bindings/cpp/test/test_kv_table.cpp       | 733 +++++++++++++++
 .../bindings/cpp/test/test_log_table.cpp      | 831 ++++++++++++++++++
 fluss-rust/bindings/cpp/test/test_main.cpp    |  31 +
 fluss-rust/bindings/cpp/test/test_utils.h     | 315 +++++++
 .../bindings/python/test/test_log_table.py    |   4 +-
 .../fluss/tests/integration/log_table.rs      |  59 +-
 14 files changed, 2601 insertions(+), 221 deletions(-)
 create mode 100644 fluss-rust/.github/workflows/build_and_test_cpp.yml
 create mode 100644 fluss-rust/.github/workflows/build_and_test_python.yml
 create mode 100644 fluss-rust/.github/workflows/build_and_test_rust.yml
 rename fluss-rust/.github/workflows/{docs-check.yml => check_documentation.yml} (96%)
 create mode 100644 fluss-rust/.github/workflows/check_license_and_formatting.yml
 delete mode 100644 fluss-rust/.github/workflows/ci.yml
 create mode 100644 fluss-rust/bindings/cpp/test/test_admin.cpp
 create mode 100644 fluss-rust/bindings/cpp/test/test_kv_table.cpp
 create mode 100644 fluss-rust/bindings/cpp/test/test_log_table.cpp
 create mode 100644 fluss-rust/bindings/cpp/test/test_main.cpp
 create mode 100644 fluss-rust/bindings/cpp/test/test_utils.h

diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
new file mode 100644
index 0000000000..5cdd14d7e4
--- /dev/null
+++ b/fluss-rust/.github/workflows/build_and_test_cpp.yml
@@ -0,0 +1,78 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+name: C++ Build and Tests
+
+on:
+  push:
+    branches:
+      - main
+    paths-ignore:
+      - 'website/**'
+      - '**/*.md'
+  pull_request:
+    branches:
+      - main
+    paths-ignore:  # a PR that changes only ignored paths does not trigger this workflow
+      - 'website/**'
+      - '**/*.md'
+      - 'bindings/python/**'  # ignored for PRs only; the push trigger above does not list it
+  workflow_dispatch:  # also runnable manually
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
+  cancel-in-progress: true  # a newer run in the same group cancels the one still in progress
+
+jobs:
+  build-and-test-cpp:
+    timeout-minutes: 60
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install protoc
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - name: Install Apache Arrow C++  # registers the Apache Arrow APT source package, then installs libarrow-dev
+        run: |
+          sudo apt-get install -y -V ca-certificates lsb-release wget
+          wget https://apache.jfrog.io/artifactory/arrow/$(lsb_release --id --short | tr 'A-Z' 'a-z')/apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
+          sudo apt-get install -y -V ./apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
+          sudo apt-get update
+          sudo apt-get install -y -V libarrow-dev
+
+      - name: Rust Cache
+        uses: actions/cache@v4
+        with:
+          path: |
+            ~/.cargo/registry
+            ~/.cargo/git
+            target
+          key: cpp-test-${{ runner.os }}-${{ hashFiles('**/Cargo.lock') }}
+
+      - name: Build C++ bindings and tests  # FLUSS_ENABLE_TESTING=ON enables the test block in bindings/cpp/CMakeLists.txt
+        working-directory: bindings/cpp
+        run: |
+          cmake -B build -DFLUSS_ENABLE_TESTING=ON -DCMAKE_BUILD_TYPE=Debug
+          cmake --build build --parallel
+
+      - name: Run C++ integration tests  # ctest --timeout 300 sets the default per-test timeout, in seconds
+        working-directory: bindings/cpp
+        run: cd build && ctest --output-on-failure --timeout 300
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
new file mode 100644
index 0000000000..efb5caabdd
--- /dev/null
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -0,0 +1,81 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+name: Python Build and Tests
+
+on:
+  push:
+    branches:
+      - main
+    paths-ignore:
+      - 'website/**'
+      - '**/*.md'
+  pull_request:
+    branches:
+      - main
+    paths-ignore:  # a PR that changes only ignored paths does not trigger this workflow
+      - 'website/**'
+      - '**/*.md'
+      - 'bindings/cpp/**'  # ignored for PRs only; the push trigger above does not list it
+  workflow_dispatch:  # also runnable manually
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
+  cancel-in-progress: true  # a newer run in the same group cancels the one still in progress
+
+jobs:
+  build-and-test-python:
+    timeout-minutes: 60
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python: ["3.9", "3.10", "3.11", "3.12"]  # one job per interpreter version
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python }}
+
+      - name: Install uv
+        uses: astral-sh/setup-uv@v4
+
+      - name: Install protoc
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - name: Rust Cache
+        uses: actions/cache@v4
+        with:
+          path: |
+            ~/.cargo/registry
+            ~/.cargo/git
+            target
+          key: python-test-${{ runner.os }}-${{ matrix.python }}-${{ hashFiles('**/Cargo.lock') }}
+
+      - name: Build Python bindings  # syncs the "dev" extra with uv, then builds the extension via maturin develop
+        working-directory: bindings/python
+        run: |
+          uv sync --extra dev
+          uv run maturin develop
+
+      - name: Run Python integration tests  # runs pytest over bindings/python/test
+        working-directory: bindings/python
+        run: uv run pytest test/ -v
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
new file mode 100644
index 0000000000..c9e05b7428
--- /dev/null
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -0,0 +1,85 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+name: Rust Build and Tests
+
+on:
+  push:
+    branches:
+      - main
+    paths-ignore:
+      - 'website/**'
+      - '**/*.md'
+  pull_request:
+    branches:
+      - main
+    paths-ignore:  # a PR that changes only ignored paths does not trigger this workflow
+      - 'website/**'
+      - '**/*.md'
+      - 'bindings/python/**'  # both binding trees are ignored for PRs only, not for pushes
+      - 'bindings/cpp/**'
+  workflow_dispatch:  # also runnable manually
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
+  cancel-in-progress: true  # a newer run in the same group cancels the one still in progress
+
+jobs:
+  build-and-test-rust:
+    timeout-minutes: 60
+    runs-on: ${{ matrix.os }}
+    strategy:
+      matrix:
+        os:
+          - ubuntu-latest
+          - macos-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install protoc  # apt on Linux runners, Homebrew on macOS runners
+        run: |
+          if [ "$RUNNER_OS" = "Linux" ]; then
+            sudo apt-get update && sudo apt-get install -y protobuf-compiler
+          elif [ "$RUNNER_OS" = "macOS" ]; then
+            brew install protobuf
+          fi
+
+      - name: Rust Cache
+        uses: actions/cache@v4
+        with:
+          path: |
+            ~/.cargo/registry
+            ~/.cargo/git
+            target
+          key: rust-${{ runner.os }}-${{ hashFiles('**/Cargo.lock') }}
+
+      - name: Build  # the fluss_python and fluss-cpp binding crates are excluded from every cargo step in this job
+        run: cargo build --workspace --all-targets --exclude fluss_python --exclude fluss-cpp
+
+      - name: Unit Test
+        run: cargo test --all-targets --workspace --exclude fluss_python --exclude fluss-cpp
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
+
+      - name: Integration Test (Linux only)  # RUST_TEST_THREADS=1 runs tests one at a time; --nocapture shows their output
+        if: runner.os == 'Linux'
+        run: |
+          RUST_TEST_THREADS=1 cargo test --features integration_tests --all-targets --workspace --exclude fluss_python --exclude fluss-cpp -- --nocapture
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
diff --git a/fluss-rust/.github/workflows/docs-check.yml b/fluss-rust/.github/workflows/check_documentation.yml
similarity index 96%
rename from fluss-rust/.github/workflows/docs-check.yml
rename to fluss-rust/.github/workflows/check_documentation.yml
index 6408c54189..70e6a438d2 100644
--- a/fluss-rust/.github/workflows/docs-check.yml
+++ b/fluss-rust/.github/workflows/check_documentation.yml
@@ -17,7 +17,7 @@
 ################################################################################
 
 # This workflow is meant for checking broken links in the documentation.
-name: Check Documentation
+name: Documentation Check
 permissions:
   contents: read
 on:
@@ -31,7 +31,7 @@ on:
       - 'website/**'
 
 jobs:
-  test-deploy:
+  check-documentation:
     runs-on: ubuntu-latest
     defaults:
       run:
diff --git a/fluss-rust/.github/workflows/check_license_and_formatting.yml b/fluss-rust/.github/workflows/check_license_and_formatting.yml
new file mode 100644
index 0000000000..1b83b749e8
--- /dev/null
+++ b/fluss-rust/.github/workflows/check_license_and_formatting.yml
@@ -0,0 +1,60 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+name: License and Formatting Check
+
+on:
+  push:
+    branches:
+      - main
+    paths-ignore:
+      - 'website/**'
+      - '**/*.md'
+  pull_request:  # no paths-ignore here, so this check runs on every PR that targets main
+    branches:
+      - main
+  workflow_dispatch:  # also runnable manually
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
+  cancel-in-progress: true  # a newer run in the same group cancels the one still in progress
+
+jobs:
+  check-license-and-formatting:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Check License Header
+        uses: apache/skywalking-eyes/header@v0.6.0
+
+      - name: Install cargo-deny
+        uses: taiki-e/install-action@v2
+        with:
+          tool: cargo-deny@0.14.22  # pinned tool version
+
+      - name: Check dependency licenses (Apache-compatible)
+        run: cargo deny check licenses
+
+      - name: Install protoc  # installed before the clippy step below; presumably needed by a build script - confirm
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - name: Format
+        run: cargo fmt --all -- --check
+
+      - name: Clippy  # -D warnings turns every lint warning into an error
+        run: cargo clippy --all-targets --workspace -- -D warnings
diff --git a/fluss-rust/.github/workflows/ci.yml b/fluss-rust/.github/workflows/ci.yml
deleted file mode 100644
index d51e3c07df..0000000000
--- a/fluss-rust/.github/workflows/ci.yml
+++ /dev/null
@@ -1,187 +0,0 @@
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#   http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an
-# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied.  See the License for the
-# specific language governing permissions and limitations
-# under the License.
-
-name: CI
-
-on:
-  push:
-    branches:
-      - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
-  pull_request:
-    branches:
-      - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
-
-concurrency:
-  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
-  cancel-in-progress: true
-
-jobs:
-  check:
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Check License Header
-        uses: apache/skywalking-eyes/header@v0.6.0
-
-      - name: Install cargo-deny
-        uses: taiki-e/install-action@v2
-        with:
-          tool: cargo-deny@0.14.22
-
-      - name: Check dependency licenses (Apache-compatible)
-        run: cargo deny check licenses
-
-      - name: Install protoc
-        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
-
-      - name: Format
-        run: cargo fmt --all -- --check
-
-      - name: Clippy
-        run: cargo clippy --all-targets --workspace -- -D warnings
-
-  build:
-    runs-on: ${{ matrix.os }}
-    strategy:
-      matrix:
-        os:
-          - ubuntu-latest
-          - macos-latest
-        python: ["3.11", "3.12", "3.13"]
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Set up Python
-        uses: actions/setup-python@v5
-        with:
-          python-version: ${{ matrix.python }}
-
-      - name: Install protoc
-        run: |
-          if [ "$RUNNER_OS" = "Linux" ]; then
-            sudo apt-get update && sudo apt-get install -y protobuf-compiler
-          elif [ "$RUNNER_OS" = "macOS" ]; then
-            brew install protobuf
-          fi
-
-      - name: Rust Cache
-        uses: actions/cache@v4
-        with:
-          path: |
-            ~/.cargo/registry
-            ~/.cargo/git
-            target
-          key: build-${{ runner.os }}-${{ matrix.python }}-${{ hashFiles('**/Cargo.lock') }}
-
-      - name: Build
-        run: cargo build --workspace --all-targets
-
-  test:
-    runs-on: ${{ matrix.os }}
-    strategy:
-      matrix:
-        os:
-          - ubuntu-latest
-          - macos-latest
-        python: ["3.11", "3.12", "3.13"]
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Set up Python
-        uses: actions/setup-python@v5
-        with:
-          python-version: ${{ matrix.python }}
-
-      - name: Install protoc
-        run: |
-          if [ "$RUNNER_OS" = "Linux" ]; then
-            sudo apt-get update && sudo apt-get install -y protobuf-compiler
-          elif [ "$RUNNER_OS" = "macOS" ]; then
-            brew install protobuf
-          fi
-
-      - name: Rust Cache
-        uses: actions/cache@v4
-        with:
-          path: |
-            ~/.cargo/registry
-            ~/.cargo/git
-            target
-          key: test-${{ runner.os }}-${{ matrix.python }}-${{ hashFiles('**/Cargo.lock') }}
-
-      - name: Unit Test
-        run: cargo test --all-targets --workspace
-        env:
-          RUST_LOG: DEBUG
-          RUST_BACKTRACE: full
-
-      - name: Integration Test (Linux only)
-        if: runner.os == 'Linux'
-        run: |
-          RUST_TEST_THREADS=1 cargo test --features integration_tests --all-targets --workspace -- --nocapture
-        env:
-          RUST_LOG: DEBUG
-          RUST_BACKTRACE: full
-
-  python-integration-test:
-    timeout-minutes: 60
-    runs-on: ubuntu-latest
-    strategy:
-      matrix:
-        python: ["3.9", "3.10", "3.11", "3.12"]
-    steps:
-      - uses: actions/checkout@v4
-
-      - name: Set up Python
-        uses: actions/setup-python@v5
-        with:
-          python-version: ${{ matrix.python }}
-
-      - name: Install uv
-        uses: astral-sh/setup-uv@v4
-
-      - name: Install protoc
-        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
-
-      - name: Rust Cache
-        uses: actions/cache@v4
-        with:
-          path: |
-            ~/.cargo/registry
-            ~/.cargo/git
-            target
-          key: python-test-${{ runner.os }}-${{ matrix.python }}-${{ hashFiles('**/Cargo.lock') }}
-
-      - name: Build Python bindings
-        working-directory: bindings/python
-        run: |
-          uv sync --extra dev
-          uv run maturin develop
-
-      - name: Run Python integration tests
-        working-directory: bindings/python
-        run: uv run pytest test/ -v
-        env:
-          RUST_LOG: DEBUG
-          RUST_BACKTRACE: full
diff --git a/fluss-rust/bindings/cpp/CMakeLists.txt b/fluss-rust/bindings/cpp/CMakeLists.txt
index a8f527edad..6bd9fc79aa 100644
--- a/fluss-rust/bindings/cpp/CMakeLists.txt
+++ b/fluss-rust/bindings/cpp/CMakeLists.txt
@@ -123,3 +123,26 @@ if (FLUSS_ENABLE_ADDRESS_SANITIZER)
     target_compile_options(fluss_cpp PRIVATE -fsanitize=leak,address,undefined -fno-omit-frame-pointer -fno-common -O1)
     target_link_options(fluss_cpp PRIVATE -fsanitize=leak,address,undefined)
 endif()
+
+if (FLUSS_ENABLE_TESTING)  # opt-in: builds the GoogleTest-based fluss_cpp_test binary and registers it with CTest
+    FetchContent_Declare(
+        googletest
+        URL https://github.com/google/googletest/archive/refs/tags/v${FLUSS_GOOGLETEST_VERSION}.tar.gz
+    )
+    set(gtest_force_shared_crt ON CACHE BOOL "" FORCE)  # googletest option: use the shared CRT on MSVC
+    FetchContent_MakeAvailable(googletest)
+
+    enable_testing()
+
+    file(GLOB TEST_SOURCE_FILES CONFIGURE_DEPENDS "test/*.cpp")  # re-checked at build time so new test files are picked up
+    add_executable(fluss_cpp_test ${TEST_SOURCE_FILES})
+    target_link_libraries(fluss_cpp_test PRIVATE fluss_cpp GTest::gtest)  # no gtest_main; presumably test/test_main.cpp supplies main()
+    target_link_libraries(fluss_cpp_test PRIVATE Arrow::arrow_shared)
+    target_compile_definitions(fluss_cpp_test PRIVATE ARROW_FOUND)
+    target_include_directories(fluss_cpp_test PRIVATE
+        ${CPP_INCLUDE_DIR}
+        ${PROJECT_SOURCE_DIR}/test
+    )
+
+    add_test(NAME fluss_cpp_integration_tests COMMAND fluss_cpp_test)  # the single test entry that ctest runs
+endif()
diff --git a/fluss-rust/bindings/cpp/test/test_admin.cpp b/fluss-rust/bindings/cpp/test/test_admin.cpp
new file mode 100644
index 0000000000..b6bb25b789
--- /dev/null
+++ b/fluss-rust/bindings/cpp/test/test_admin.cpp
@@ -0,0 +1,331 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include <gtest/gtest.h>
+
+#include "test_utils.h"
+
+class AdminTest : public ::testing::Test {  // fixture for the Admin API tests in this file
+   protected:
+    fluss::Admin& admin() { return fluss_test::FlussTestEnvironment::Instance()->GetAdmin(); }  // Admin held by the test environment
+};
+
+TEST_F(AdminTest, CreateDatabase) {  // create -> exists -> info -> drop round trip for one database
+    auto& adm = admin();
+
+    std::string db_name = "test_create_database_cpp";
+
+    // The database must not exist before the test creates it
+    bool exists = true;  // starts as true, so ASSERT_FALSE below only passes if DatabaseExists writes it
+    ASSERT_OK(adm.DatabaseExists(db_name, exists));
+    ASSERT_FALSE(exists);
+
+    // Create the database with a comment and two custom properties
+    fluss::DatabaseDescriptor descriptor;
+    descriptor.comment = "test_db";
+    descriptor.properties = {{"k1", "v1"}, {"k2", "v2"}};
+    ASSERT_OK(adm.CreateDatabase(db_name, descriptor, false));
+
+    // The database must be reported as existing now
+    ASSERT_OK(adm.DatabaseExists(db_name, exists));
+    ASSERT_TRUE(exists);
+
+    // GetDatabaseInfo must echo the name, comment and properties set above
+    fluss::DatabaseInfo db_info;
+    ASSERT_OK(adm.GetDatabaseInfo(db_name, db_info));
+    EXPECT_EQ(db_info.database_name, db_name);
+    EXPECT_EQ(db_info.comment, "test_db");
+    EXPECT_EQ(db_info.properties.at("k1"), "v1");
+    EXPECT_EQ(db_info.properties.at("k2"), "v2");
+
+    // Drop the database; NOTE(review): the flags look like (ignore_if_not_exists, cascade) - confirm
+    ASSERT_OK(adm.DropDatabase(db_name, false, true));
+
+    // The database must be gone again
+    ASSERT_OK(adm.DatabaseExists(db_name, exists));
+    ASSERT_FALSE(exists);
+}
+
+TEST_F(AdminTest, CreateTable) {  // create -> exists -> list -> info -> drop round trip for one table
+    auto& adm = admin();
+
+    std::string db_name = "test_create_table_cpp_db";
+    fluss::DatabaseDescriptor db_desc;
+    db_desc.comment = "Database for test_create_table";
+
+    bool exists = true;  // seeded with the opposite of the expected value so the check below is not vacuous
+    ASSERT_OK(adm.DatabaseExists(db_name, exists));
+    ASSERT_FALSE(exists);
+
+    ASSERT_OK(adm.CreateDatabase(db_name, db_desc, false));
+
+    std::string table_name = "test_user_table";
+    fluss::TablePath table_path(db_name, table_name);
+
+    // Build a four-column schema with "id" as the primary key
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .AddColumn("age", fluss::DataType::Int(), "User's age (optional)")
+                      .AddColumn("email", fluss::DataType::String())
+                      .SetPrimaryKeys({"id"})
+                      .Build();
+
+    // Build the table descriptor: 3 buckets keyed on "id"
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetComment("Test table for user data (id, name, age, email)")
+                                .SetBucketCount(3)
+                                .SetBucketKeys({"id"})
+                                .SetProperty("table.replication.factor", "1")
+                                .SetLogFormat("arrow")
+                                .SetKvFormat("indexed")
+                                .Build();
+
+    // Create the table
+    ASSERT_OK(adm.CreateTable(table_path, table_descriptor, false));
+
+    // The table must be reported as existing (exists is false at this point)
+    ASSERT_OK(adm.TableExists(table_path, exists));
+    ASSERT_TRUE(exists);
+
+    // ListTables must return exactly the one table created above
+    std::vector<std::string> tables;
+    ASSERT_OK(adm.ListTables(db_name, tables));
+    ASSERT_EQ(tables.size(), 1u);
+    EXPECT_TRUE(std::find(tables.begin(), tables.end(), table_name) != tables.end());
+
+    // GetTableInfo must echo the descriptor values set above
+    fluss::TableInfo table_info;
+    ASSERT_OK(adm.GetTableInfo(table_path, table_info));
+
+    EXPECT_EQ(table_info.comment, "Test table for user data (id, name, age, email)");
+    EXPECT_EQ(table_info.primary_keys, std::vector<std::string>{"id"});
+    EXPECT_EQ(table_info.num_buckets, 3);
+    EXPECT_EQ(table_info.bucket_keys, std::vector<std::string>{"id"});
+
+    // Drop the table and verify it is gone
+    ASSERT_OK(adm.DropTable(table_path, false));
+    ASSERT_OK(adm.TableExists(table_path, exists));
+    ASSERT_FALSE(exists);
+
+    // Drop the database and verify it is gone
+    ASSERT_OK(adm.DropDatabase(db_name, false, true));
+    ASSERT_OK(adm.DatabaseExists(db_name, exists));
+    ASSERT_FALSE(exists);
+}
+
+TEST_F(AdminTest, PartitionApis) {  // create, list (with and without a spec filter) and drop one partition
+    auto& adm = admin();
+
+    std::string db_name = "test_partition_apis_cpp_db";
+    fluss::DatabaseDescriptor db_desc;
+    db_desc.comment = "Database for test_partition_apis";
+    ASSERT_OK(adm.CreateDatabase(db_name, db_desc, true));
+
+    fluss::TablePath table_path(db_name, "partitioned_table");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .AddColumn("dt", fluss::DataType::String())
+                      .AddColumn("region", fluss::DataType::String())
+                      .SetPrimaryKeys({"id", "dt", "region"})
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetBucketCount(3)
+                                .SetBucketKeys({"id"})
+                                .SetPartitionKeys({"dt", "region"})
+                                .SetProperty("table.replication.factor", "1")
+                                .SetLogFormat("arrow")
+                                .SetKvFormat("compacted")
+                                .Build();
+
+    ASSERT_OK(adm.CreateTable(table_path, table_descriptor, true));
+
+    // A freshly created partitioned table has no partitions
+    std::vector<fluss::PartitionInfo> partitions;
+    ASSERT_OK(adm.ListPartitionInfos(table_path, partitions));
+    ASSERT_TRUE(partitions.empty());
+
+    // Create a partition with a value for both partition keys
+    std::unordered_map<std::string, std::string> partition_spec = {
+        {"dt", "2024-01-15"}, {"region", "EMEA"}};
+    ASSERT_OK(adm.CreatePartition(table_path, partition_spec, false));
+
+    // Exactly one partition must be listed now
+    ASSERT_OK(adm.ListPartitionInfos(table_path, partitions));
+    ASSERT_EQ(partitions.size(), 1u);
+    EXPECT_EQ(partitions[0].partition_name, "2024-01-15$EMEA");  // dt and region values joined by '$'
+
+    // Listing with a partial spec (dt only) must still find the partition
+    std::unordered_map<std::string, std::string> partial_spec = {{"dt", "2024-01-15"}};
+    std::vector<fluss::PartitionInfo> partitions_with_spec;
+    ASSERT_OK(adm.ListPartitionInfos(table_path, partial_spec, partitions_with_spec));
+    ASSERT_EQ(partitions_with_spec.size(), 1u);
+    EXPECT_EQ(partitions_with_spec[0].partition_name, "2024-01-15$EMEA");
+
+    // Listing with a non-matching spec must succeed and return no partitions
+    std::unordered_map<std::string, std::string> non_matching_spec = {{"dt", "2024-01-16"}};
+    std::vector<fluss::PartitionInfo> empty_partitions;
+    ASSERT_OK(adm.ListPartitionInfos(table_path, non_matching_spec, empty_partitions));
+    ASSERT_TRUE(empty_partitions.empty());
+
+    // Drop the partition and verify the list is empty again
+    ASSERT_OK(adm.DropPartition(table_path, partition_spec, false));
+
+    ASSERT_OK(adm.ListPartitionInfos(table_path, partitions));
+    ASSERT_TRUE(partitions.empty());
+
+    // Cleanup
+    ASSERT_OK(adm.DropTable(table_path, true));
+    ASSERT_OK(adm.DropDatabase(db_name, true, true));
+}
+
+TEST_F(AdminTest, FlussErrorResponse) {  // a failed call must surface the error code in the result
+    auto& adm = admin();
+
+    fluss::TablePath table_path("fluss", "not_exist_cpp");  // presumably "fluss" is a pre-existing database - confirm
+
+    fluss::TableInfo info;
+    auto result = adm.GetTableInfo(table_path, info);
+    ASSERT_FALSE(result.Ok());
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::TABLE_NOT_EXIST);
+}
+
+TEST_F(AdminTest, ErrorDatabaseNotExist) {  // three calls on a missing database must all report DATABASE_NOT_EXIST
+    auto& adm = admin();
+
+    // GetDatabaseInfo on a non-existent database
+    fluss::DatabaseInfo info;
+    auto result = adm.GetDatabaseInfo("no_such_db_cpp", info);
+    ASSERT_FALSE(result.Ok());
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::DATABASE_NOT_EXIST);
+
+    // DropDatabase with the ignore flag off
+    result = adm.DropDatabase("no_such_db_cpp", false, false);
+    ASSERT_FALSE(result.Ok());
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::DATABASE_NOT_EXIST);
+
+    // ListTables on a non-existent database
+    std::vector<std::string> tables;
+    result = adm.ListTables("no_such_db_cpp", tables);
+    ASSERT_FALSE(result.Ok());
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::DATABASE_NOT_EXIST);
+}
+
+TEST_F(AdminTest, ErrorDatabaseAlreadyExist) {  // duplicate CreateDatabase fails unless the ignore flag is set
+    auto& adm = admin();
+
+    std::string db_name = "test_error_db_already_exist_cpp";
+    fluss::DatabaseDescriptor descriptor;
+
+    ASSERT_OK(adm.CreateDatabase(db_name, descriptor, false));
+
+    // Creating the same database again with the ignore flag off must fail
+    auto result = adm.CreateDatabase(db_name, descriptor, false);
+    ASSERT_FALSE(result.Ok());
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::DATABASE_ALREADY_EXIST);
+
+    // With the ignore flag on, the same call must succeed
+    ASSERT_OK(adm.CreateDatabase(db_name, descriptor, true));
+
+    // Cleanup
+    ASSERT_OK(adm.DropDatabase(db_name, true, true));
+}
+
+TEST_F(AdminTest, ErrorTableAlreadyExist) {  // duplicate CreateTable fails unless the ignore flag is set
+    auto& adm = admin();
+
+    std::string db_name = "test_error_tbl_already_exist_cpp_db";
+    fluss::DatabaseDescriptor db_desc;
+    ASSERT_OK(adm.CreateDatabase(db_name, db_desc, true));
+
+    fluss::TablePath table_path(db_name, "my_table");
+    auto schema = fluss::Schema::NewBuilder()  // no SetPrimaryKeys call on this schema
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .Build();
+    auto table_desc = fluss::TableDescriptor::NewBuilder()
+                          .SetSchema(schema)
+                          .SetBucketCount(1)
+                          .SetProperty("table.replication.factor", "1")
+                          .Build();
+
+    ASSERT_OK(adm.CreateTable(table_path, table_desc, false));
+
+    // Creating the same table again with the ignore flag off must fail
+    auto result = adm.CreateTable(table_path, table_desc, false);
+    ASSERT_FALSE(result.Ok());
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::TABLE_ALREADY_EXIST);
+
+    // With the ignore flag on, the same call must succeed
+    ASSERT_OK(adm.CreateTable(table_path, table_desc, true));
+
+    // Cleanup
+    ASSERT_OK(adm.DropTable(table_path, true));
+    ASSERT_OK(adm.DropDatabase(db_name, true, true));
+}
+
+TEST_F(AdminTest, ErrorTableNotExist) {  // DropTable on a missing table fails unless the ignore flag is set
+    auto& adm = admin();
+
+    fluss::TablePath table_path("fluss", "no_such_table_cpp");  // presumably "fluss" is a pre-existing database - confirm
+
+    // Dropping with the ignore flag off must report TABLE_NOT_EXIST
+    auto result = adm.DropTable(table_path, false);
+    ASSERT_FALSE(result.Ok());
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::TABLE_NOT_EXIST);
+
+    // Dropping with the ignore flag on must succeed
+    ASSERT_OK(adm.DropTable(table_path, true));
+}
+
+TEST_F(AdminTest, ErrorTableNotPartitioned) {  // partition listing on a table without partition keys must fail
+    auto& adm = admin();
+
+    std::string db_name = "test_error_not_partitioned_cpp_db";
+    fluss::DatabaseDescriptor db_desc;
+    ASSERT_OK(adm.CreateDatabase(db_name, db_desc, true));
+
+    fluss::TablePath table_path(db_name, "non_partitioned_table");
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .Build();
+    auto table_desc = fluss::TableDescriptor::NewBuilder()  // no SetPartitionKeys call on this descriptor
+                          .SetSchema(schema)
+                          .SetBucketCount(1)
+                          .SetProperty("table.replication.factor", "1")
+                          .Build();
+
+    ASSERT_OK(adm.CreateTable(table_path, table_desc, false));
+
+    // ListPartitionInfos on a non-partitioned table must report TABLE_NOT_PARTITIONED_EXCEPTION
+    std::vector<fluss::PartitionInfo> partitions;
+    auto result = adm.ListPartitionInfos(table_path, partitions);
+    ASSERT_FALSE(result.Ok());
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::TABLE_NOT_PARTITIONED_EXCEPTION);
+
+    // Cleanup
+    ASSERT_OK(adm.DropTable(table_path, true));
+    ASSERT_OK(adm.DropDatabase(db_name, true, true));
+}
diff --git a/fluss-rust/bindings/cpp/test/test_kv_table.cpp b/fluss-rust/bindings/cpp/test/test_kv_table.cpp
new file mode 100644
index 0000000000..9c4f7a02fb
--- /dev/null
+++ b/fluss-rust/bindings/cpp/test/test_kv_table.cpp
@@ -0,0 +1,733 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include <gtest/gtest.h>
+
+#include "test_utils.h"
+
+class KvTableTest : public ::testing::Test {  // Fixture: accessors into FlussTestEnvironment.
+   protected:
+    fluss::Admin& admin() { return fluss_test::FlussTestEnvironment::Instance()->GetAdmin(); }
+
+    fluss::Connection& connection() {
+        return fluss_test::FlussTestEnvironment::Instance()->GetConnection();
+    }
+};
+
+TEST_F(KvTableTest, UpsertDeleteAndLookup) {  // Upsert/update/delete round-trip on a PK table.
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_upsert_and_lookup_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .AddColumn("age", fluss::DataType::BigInt())
+                      .SetPrimaryKeys({"id"})
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    // Create the upsert writer used for all writes and deletes below
+    auto table_upsert = table.NewUpsert();
+    fluss::UpsertWriter upsert_writer;
+    ASSERT_OK(table_upsert.CreateWriter(upsert_writer));
+
+    // Upsert 3 rows without per-write results (fire-and-forget), then flush once
+    struct TestData {
+        int32_t id;
+        std::string name;
+        int64_t age;
+    };
+    std::vector<TestData> test_data = {{1, "Verso", 32}, {2, "Noco", 25}, {3, "Esquie", 35}};
+
+    for (const auto& d : test_data) {
+        fluss::GenericRow row(3);
+        row.SetInt32(0, d.id);
+        row.SetString(1, d.name);
+        row.SetInt64(2, d.age);
+        ASSERT_OK(upsert_writer.Upsert(row));
+    }
+    ASSERT_OK(upsert_writer.Flush());
+
+    // Create a lookuper from the same table handle
+    fluss::Lookuper lookuper;
+    ASSERT_OK(table.NewLookup().CreateLookuper(lookuper));
+
+    // Every upserted row must be found by primary key with all fields intact
+    for (const auto& d : test_data) {
+        fluss::GenericRow key(3);  // schema-width row; only the key column is set
+        key.SetInt32(0, d.id);
+
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found()) << "Row with id=" << d.id << " should exist";
+
+        EXPECT_EQ(result.GetInt32(0), d.id) << "id mismatch";
+        EXPECT_EQ(result.GetString(1), d.name) << "name mismatch";
+        EXPECT_EQ(result.GetInt64(2), d.age) << "age mismatch";
+    }
+
+    // Update record with id=1 and block on its WriteResult (await acknowledgment)
+    {
+        fluss::GenericRow updated_row(3);
+        updated_row.SetInt32(0, 1);
+        updated_row.SetString(1, "Verso");
+        updated_row.SetInt64(2, 33);
+        fluss::WriteResult wr;
+        ASSERT_OK(upsert_writer.Upsert(updated_row, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Verify the update: age is now 33, name is still "Verso"
+    {
+        fluss::GenericRow key(3);
+        key.SetInt32(0, 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(result.GetInt64(2), 33) << "Age should be updated";
+        EXPECT_EQ(result.GetString(1), "Verso") << "Name should remain unchanged";
+    }
+
+    // Delete record with id=1; only the key column is populated (await acknowledgment)
+    {
+        fluss::GenericRow delete_row(3);
+        delete_row.SetInt32(0, 1);
+        fluss::WriteResult wr;
+        ASSERT_OK(upsert_writer.Delete(delete_row, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Verify deletion: the lookup call itself succeeds but reports not found
+    {
+        fluss::GenericRow key(3);
+        key.SetInt32(0, 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_FALSE(result.Found()) << "Record 1 should not exist after delete";
+    }
+
+    // Verify records 2 and 3 are unaffected by the delete
+    for (int id : {2, 3}) {
+        fluss::GenericRow key(3);
+        key.SetInt32(0, id);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found()) << "Record " << id
+                                    << " should still exist after deleting record 1";
+    }
+
+    // Lookup a key that was never written (id=999)
+    {
+        fluss::GenericRow key(3);
+        key.SetInt32(0, 999);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_FALSE(result.Found()) << "Non-existent key should return not found";
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));  // cleanup
+}
+
+TEST_F(KvTableTest, CompositePrimaryKeys) {  // Lookup/update through a two-column primary key.
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_composite_pk_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("region", fluss::DataType::String())
+                      .AddColumn("score", fluss::DataType::BigInt())
+                      .AddColumn("user_id", fluss::DataType::Int())
+                      .SetPrimaryKeys({"region", "user_id"})
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    auto table_upsert = table.NewUpsert();
+    fluss::UpsertWriter upsert_writer;
+    ASSERT_OK(table_upsert.CreateWriter(upsert_writer));
+
+    // Insert records with composite keys; the key columns (region, user_id) are not adjacent
+    struct TestData {
+        std::string region;
+        int32_t user_id;
+        int64_t score;
+    };
+    std::vector<TestData> test_data = {
+        {"US", 1, 100}, {"US", 2, 200}, {"EU", 1, 150}, {"EU", 2, 250}};
+
+    for (const auto& d : test_data) {
+        auto row = table.NewRow();  // rows from the table are filled by column name
+        row.Set("region", d.region);
+        row.Set("score", d.score);
+        row.Set("user_id", d.user_id);
+        ASSERT_OK(upsert_writer.Upsert(row));
+    }
+    ASSERT_OK(upsert_writer.Flush());
+
+    // Create a lookuper from the same table handle
+    fluss::Lookuper lookuper;
+    ASSERT_OK(table.NewLookup().CreateLookuper(lookuper));
+
+    // Lookup (US, 1) - should return score 100
+    {
+        auto key = table.NewRow();
+        key.Set("region", "US");
+        key.Set("user_id", 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(result.GetInt64("score"), 100) << "Score for (US, 1) should be 100";
+    }
+
+    // Lookup (EU, 2) - should return score 250
+    {
+        auto key = table.NewRow();
+        key.Set("region", "EU");
+        key.Set("user_id", 2);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(result.GetInt64("score"), 250) << "Score for (EU, 2) should be 250";
+    }
+
+    // Update the (US, 1) score to 500 and block on its WriteResult (await acknowledgment)
+    {
+        auto update_row = table.NewRow();
+        update_row.Set("region", "US");
+        update_row.Set("user_id", 1);
+        update_row.Set("score", static_cast<int64_t>(500));
+        fluss::WriteResult wr;
+        ASSERT_OK(upsert_writer.Upsert(update_row, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Verify the update is visible through the same lookuper
+    {
+        auto key = table.NewRow();
+        key.Set("region", "US");
+        key.Set("user_id", 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(result.GetInt64("score"), 500) << "Row score should be updated";
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));  // cleanup
+}
+
+TEST_F(KvTableTest, PartialUpdate) {  // Partial update selected by column name.
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_partial_update_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .AddColumn("age", fluss::DataType::BigInt())
+                      .AddColumn("score", fluss::DataType::BigInt())
+                      .SetPrimaryKeys({"id"})
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    // Insert the initial record with all four columns through a regular upsert writer
+    auto table_upsert = table.NewUpsert();
+    fluss::UpsertWriter upsert_writer;
+    ASSERT_OK(table_upsert.CreateWriter(upsert_writer));
+
+    {
+        fluss::GenericRow row(4);
+        row.SetInt32(0, 1);
+        row.SetString(1, "Verso");
+        row.SetInt64(2, 32);
+        row.SetInt64(3, 6942);
+        fluss::WriteResult wr;
+        ASSERT_OK(upsert_writer.Upsert(row, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Verify the initial record before any partial update is applied
+    fluss::Lookuper lookuper;
+    ASSERT_OK(table.NewLookup().CreateLookuper(lookuper));
+
+    {
+        fluss::GenericRow key(4);
+        key.SetInt32(0, 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(result.GetInt32(0), 1);
+        EXPECT_EQ(result.GetString(1), "Verso");
+        EXPECT_EQ(result.GetInt64(2), 32);
+        EXPECT_EQ(result.GetInt64(3), 6942);
+    }
+
+    // Create a second writer restricted to columns "id" (the primary key) and "score"
+    auto partial_upsert = table.NewUpsert();
+    partial_upsert.PartialUpdateByName({"id", "score"});
+    fluss::UpsertWriter partial_writer;
+    ASSERT_OK(partial_upsert.CreateWriter(partial_writer));
+
+    // Write score=420 for id=1; the row is still schema-width (await acknowledgment)
+    {
+        fluss::GenericRow partial_row(4);
+        partial_row.SetInt32(0, 1);
+        partial_row.SetNull(1);  // not in partial update
+        partial_row.SetNull(2);  // not in partial update
+        partial_row.SetInt64(3, 420);
+        fluss::WriteResult wr;
+        ASSERT_OK(partial_writer.Upsert(partial_row, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Verify partial update - name and age keep their values despite the nulls written above
+    {
+        fluss::GenericRow key(4);
+        key.SetInt32(0, 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(result.GetInt32(0), 1) << "id should remain 1";
+        EXPECT_EQ(result.GetString(1), "Verso") << "name should remain unchanged";
+        EXPECT_EQ(result.GetInt64(2), 32) << "age should remain unchanged";
+        EXPECT_EQ(result.GetInt64(3), 420) << "score should be updated to 420";
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));  // cleanup
+}
+
+TEST_F(KvTableTest, PartialUpdateByIndex) {  // Partial update selected by column index.
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_partial_update_by_index_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .AddColumn("age", fluss::DataType::BigInt())
+                      .AddColumn("score", fluss::DataType::BigInt())
+                      .SetPrimaryKeys({"id"})
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    // Insert the initial record with all four columns through a regular upsert writer
+    auto table_upsert = table.NewUpsert();
+    fluss::UpsertWriter upsert_writer;
+    ASSERT_OK(table_upsert.CreateWriter(upsert_writer));
+
+    {
+        fluss::GenericRow row(4);
+        row.SetInt32(0, 1);
+        row.SetString(1, "Verso");
+        row.SetInt64(2, 32);
+        row.SetInt64(3, 6942);
+        fluss::WriteResult wr;
+        ASSERT_OK(upsert_writer.Upsert(row, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Verify the initial record before any partial update is applied
+    fluss::Lookuper lookuper;
+    ASSERT_OK(table.NewLookup().CreateLookuper(lookuper));
+
+    {
+        fluss::GenericRow key(4);
+        key.SetInt32(0, 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(result.GetInt32(0), 1);
+        EXPECT_EQ(result.GetString(1), "Verso");
+        EXPECT_EQ(result.GetInt64(2), 32);
+        EXPECT_EQ(result.GetInt64(3), 6942);
+    }
+
+    // Create a second writer restricted to column indices 0 (id, the primary key) and 3 (score)
+    auto partial_upsert = table.NewUpsert();
+    partial_upsert.PartialUpdateByIndex({0, 3});
+    fluss::UpsertWriter partial_writer;
+    ASSERT_OK(partial_upsert.CreateWriter(partial_writer));
+
+    // Write score=420 for id=1; the row is still schema-width (await acknowledgment)
+    {
+        fluss::GenericRow partial_row(4);
+        partial_row.SetInt32(0, 1);
+        partial_row.SetNull(1);  // not in partial update
+        partial_row.SetNull(2);  // not in partial update
+        partial_row.SetInt64(3, 420);
+        fluss::WriteResult wr;
+        ASSERT_OK(partial_writer.Upsert(partial_row, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Verify partial update - name and age keep their values despite the nulls written above
+    {
+        fluss::GenericRow key(4);
+        key.SetInt32(0, 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(result.GetInt32(0), 1) << "id should remain 1";
+        EXPECT_EQ(result.GetString(1), "Verso") << "name should remain unchanged";
+        EXPECT_EQ(result.GetInt64(2), 32) << "age should remain unchanged";
+        EXPECT_EQ(result.GetInt64(3), 420) << "score should be updated to 420";
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));  // cleanup
+}
+
+TEST_F(KvTableTest, PartitionedTableUpsertAndLookup) {  // KV round-trip on a partitioned table.
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_partitioned_kv_table_cpp");
+
+    // Create a partitioned KV table with region as partition key (region is also part of the PK)
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("region", fluss::DataType::String())
+                      .AddColumn("user_id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .AddColumn("score", fluss::DataType::BigInt())
+                      .SetPrimaryKeys({"region", "user_id"})
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetPartitionKeys({"region"})
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    // Create the US, EU and APAC partitions before any write
+    fluss_test::CreatePartitions(adm, table_path, "region", {"US", "EU", "APAC"});
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    auto table_upsert = table.NewUpsert();
+    fluss::UpsertWriter upsert_writer;
+    ASSERT_OK(table_upsert.CreateWriter(upsert_writer));
+
+    // Insert records spread across the three partitions (fire-and-forget, then flush)
+    struct TestData {
+        std::string region;
+        int32_t user_id;
+        std::string name;
+        int64_t score;
+    };
+    std::vector<TestData> test_data = {{"US", 1, "Gustave", 100}, {"US", 2, "Lune", 200},
+                                       {"EU", 1, "Sciel", 150},   {"EU", 2, "Maelle", 250},
+                                       {"APAC", 1, "Noco", 300}};
+
+    for (const auto& d : test_data) {
+        fluss::GenericRow row(4);
+        row.SetString(0, d.region);
+        row.SetInt32(1, d.user_id);
+        row.SetString(2, d.name);
+        row.SetInt64(3, d.score);
+        ASSERT_OK(upsert_writer.Upsert(row));
+    }
+    ASSERT_OK(upsert_writer.Flush());
+
+    // Create a lookuper from the same table handle
+    fluss::Lookuper lookuper;
+    ASSERT_OK(table.NewLookup().CreateLookuper(lookuper));
+
+    // Lookup every record by its (region, user_id) key and compare all four columns
+    for (const auto& d : test_data) {
+        fluss::GenericRow key(4);  // schema-width row; only the two key columns are set
+        key.SetString(0, d.region);
+        key.SetInt32(1, d.user_id);
+
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+
+        EXPECT_EQ(std::string(result.GetString(0)), d.region) << "region mismatch";
+        EXPECT_EQ(result.GetInt32(1), d.user_id) << "user_id mismatch";
+        EXPECT_EQ(std::string(result.GetString(2)), d.name) << "name mismatch";
+        EXPECT_EQ(result.GetInt64(3), d.score) << "score mismatch";
+    }
+
+    // Update (US, 1) within its partition and block on the WriteResult (await acknowledgment)
+    {
+        fluss::GenericRow updated_row(4);
+        updated_row.SetString(0, "US");
+        updated_row.SetInt32(1, 1);
+        updated_row.SetString(2, "Gustave Updated");
+        updated_row.SetInt64(3, 999);
+        fluss::WriteResult wr;
+        ASSERT_OK(upsert_writer.Upsert(updated_row, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Verify the update: both non-key columns carry the new values
+    {
+        fluss::GenericRow key(4);
+        key.SetString(0, "US");
+        key.SetInt32(1, 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(std::string(result.GetString(2)), "Gustave Updated");
+        EXPECT_EQ(result.GetInt64(3), 999);
+    }
+
+    // Lookup in a partition that was never created: the call succeeds and reports not found
+    {
+        fluss::GenericRow key(4);
+        key.SetString(0, "UNKNOWN_REGION");
+        key.SetInt32(1, 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_FALSE(result.Found()) << "Lookup in non-existent partition should return not found";
+    }
+
+    // Delete (EU, 1); only the key columns are populated (await acknowledgment)
+    {
+        fluss::GenericRow delete_key(4);
+        delete_key.SetString(0, "EU");
+        delete_key.SetInt32(1, 1);
+        fluss::WriteResult wr;
+        ASSERT_OK(upsert_writer.Delete(delete_key, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Verify deletion: the lookup call itself succeeds but reports not found
+    {
+        fluss::GenericRow key(4);
+        key.SetString(0, "EU");
+        key.SetInt32(1, 1);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_FALSE(result.Found()) << "Deleted record should not exist";
+    }
+
+    // Verify the other record in the same partition, (EU, 2), still exists
+    {
+        fluss::GenericRow key(4);
+        key.SetString(0, "EU");
+        key.SetInt32(1, 2);
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+        EXPECT_EQ(std::string(result.GetString(2)), "Maelle");
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));  // cleanup
+}
+
+TEST_F(KvTableTest, AllSupportedDatatypes) {  // Round-trips one value (and null) per column type.
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_all_datatypes_cpp");
+
+    // Create a table with one column per supported datatype, keyed by pk_int
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("pk_int", fluss::DataType::Int())
+                      .AddColumn("col_boolean", fluss::DataType::Boolean())
+                      .AddColumn("col_tinyint", fluss::DataType::TinyInt())
+                      .AddColumn("col_smallint", fluss::DataType::SmallInt())
+                      .AddColumn("col_int", fluss::DataType::Int())
+                      .AddColumn("col_bigint", fluss::DataType::BigInt())
+                      .AddColumn("col_float", fluss::DataType::Float())
+                      .AddColumn("col_double", fluss::DataType::Double())
+                      .AddColumn("col_char", fluss::DataType::Char(10))
+                      .AddColumn("col_string", fluss::DataType::String())
+                      .AddColumn("col_decimal", fluss::DataType::Decimal(10, 2))
+                      .AddColumn("col_date", fluss::DataType::Date())
+                      .AddColumn("col_time", fluss::DataType::Time())
+                      .AddColumn("col_timestamp", fluss::DataType::Timestamp())
+                      .AddColumn("col_timestamp_ltz", fluss::DataType::TimestampLtz())
+                      .AddColumn("col_bytes", fluss::DataType::Bytes())
+                      .AddColumn("col_binary", fluss::DataType::Binary(20))
+                      .SetPrimaryKeys({"pk_int"})
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    auto table_upsert = table.NewUpsert();
+    fluss::UpsertWriter upsert_writer;
+    ASSERT_OK(table_upsert.CreateWriter(upsert_writer));
+
+    // Test data: integer columns use the maximum value of their declared width
+    int32_t pk_int = 1;
+    bool col_boolean = true;
+    int32_t col_tinyint = 127;  // largest 8-bit signed value
+    int32_t col_smallint = 32767;  // largest 16-bit signed value
+    int32_t col_int = 2147483647;  // largest 32-bit signed value
+    int64_t col_bigint = 9223372036854775807LL;  // largest 64-bit signed value
+    float col_float = 3.14f;
+    double col_double = 2.718281828459045;
+    std::string col_char = "hello";
+    std::string col_string = "world of fluss rust client";
+    std::string col_decimal = "123.45";
+    auto col_date = fluss::Date::FromDays(20476);  // 2026-01-23
+    auto col_time = fluss::Time::FromMillis(36827000);  // 10:13:47
+    auto col_timestamp = fluss::Timestamp::FromMillis(1769163227123);  // 2026-01-23 10:13:47.123
+    auto col_timestamp_ltz = fluss::Timestamp::FromMillis(1769163227123);  // same epoch millis
+    std::vector<uint8_t> col_bytes = {'b', 'i', 'n', 'a', 'r', 'y', ' ', 'd', 'a', 't', 'a'};
+    std::vector<uint8_t> col_binary = {'f', 'i', 'x', 'e', 'd', ' ', 'b', 'i', 'n', 'a',
+                                       'r', 'y', ' ', 'd', 'a', 't', 'a', '!', '!', '!'};
+
+    // Upsert a row with all datatypes and wait for the write to be acknowledged
+    {
+        fluss::GenericRow row(17);
+        row.SetInt32(0, pk_int);
+        row.SetBool(1, col_boolean);
+        row.SetInt32(2, col_tinyint);
+        row.SetInt32(3, col_smallint);
+        row.SetInt32(4, col_int);
+        row.SetInt64(5, col_bigint);
+        row.SetFloat32(6, col_float);
+        row.SetFloat64(7, col_double);
+        row.SetString(8, col_char);
+        row.SetString(9, col_string);
+        row.SetDecimal(10, col_decimal);
+        row.SetDate(11, col_date);
+        row.SetTime(12, col_time);
+        row.SetTimestampNtz(13, col_timestamp);
+        row.SetTimestampLtz(14, col_timestamp_ltz);
+        row.SetBytes(15, col_bytes);
+        row.SetBytes(16, col_binary);
+        fluss::WriteResult wr;
+        ASSERT_OK(upsert_writer.Upsert(row, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Lookup the record by primary key
+    fluss::Lookuper lookuper;
+    ASSERT_OK(table.NewLookup().CreateLookuper(lookuper));
+
+    {
+        fluss::GenericRow key(17);
+        key.SetInt32(0, pk_int);
+
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+
+        // Verify all datatypes column by column
+        EXPECT_EQ(result.GetInt32(0), pk_int) << "pk_int mismatch";
+        EXPECT_EQ(result.GetBool(1), col_boolean) << "col_boolean mismatch";
+        EXPECT_EQ(result.GetInt32(2), col_tinyint) << "col_tinyint mismatch";
+        EXPECT_EQ(result.GetInt32(3), col_smallint) << "col_smallint mismatch";
+        EXPECT_EQ(result.GetInt32(4), col_int) << "col_int mismatch";
+        EXPECT_EQ(result.GetInt64(5), col_bigint) << "col_bigint mismatch";
+        EXPECT_NEAR(result.GetFloat32(6), col_float, 1e-6f) << "col_float mismatch";
+        EXPECT_NEAR(result.GetFloat64(7), col_double, 1e-15) << "col_double mismatch";
+        EXPECT_EQ(result.GetString(8), col_char) << "col_char mismatch";
+        EXPECT_EQ(result.GetString(9), col_string) << "col_string mismatch";
+        EXPECT_EQ(result.GetDecimalString(10), col_decimal) << "col_decimal mismatch";
+        EXPECT_EQ(result.GetDate(11).days_since_epoch, col_date.days_since_epoch) << "col_date mismatch";
+        EXPECT_EQ(result.GetTime(12).millis_since_midnight, col_time.millis_since_midnight) << "col_time mismatch";
+        EXPECT_EQ(result.GetTimestamp(13).epoch_millis, col_timestamp.epoch_millis)
+            << "col_timestamp mismatch";
+        EXPECT_EQ(result.GetTimestamp(14).epoch_millis, col_timestamp_ltz.epoch_millis)
+            << "col_timestamp_ltz mismatch";
+
+        auto [bytes_ptr, bytes_len] = result.GetBytes(15);  // fatal length check guards memcmp
+        ASSERT_EQ(bytes_len, col_bytes.size()) << "col_bytes length mismatch";
+        EXPECT_TRUE(std::memcmp(bytes_ptr, col_bytes.data(), bytes_len) == 0)
+            << "col_bytes mismatch";
+
+        auto [binary_ptr, binary_len] = result.GetBytes(16);  // fatal length check guards memcmp
+        ASSERT_EQ(binary_len, col_binary.size()) << "col_binary length mismatch";
+        EXPECT_TRUE(std::memcmp(binary_ptr, col_binary.data(), binary_len) == 0)
+            << "col_binary mismatch";
+    }
+
+    // Test with null values: every column except the primary key is set to null
+    {
+        fluss::GenericRow row_with_nulls(17);
+        row_with_nulls.SetInt32(0, 2);  // pk_int = 2
+        for (size_t i = 1; i < 17; ++i) {
+            row_with_nulls.SetNull(i);
+        }
+        fluss::WriteResult wr;
+        ASSERT_OK(upsert_writer.Upsert(row_with_nulls, wr));
+        ASSERT_OK(wr.Wait());
+    }
+
+    // Lookup row with nulls: the key reads back and all other columns report null
+    {
+        fluss::GenericRow key(17);
+        key.SetInt32(0, 2);
+
+        fluss::LookupResult result;
+        ASSERT_OK(lookuper.Lookup(key, result));
+        ASSERT_TRUE(result.Found());
+
+        EXPECT_EQ(result.GetInt32(0), 2) << "pk_int mismatch";
+        for (size_t i = 1; i < 17; ++i) {
+            EXPECT_TRUE(result.IsNull(i)) << "column " << i << " should be null";
+        }
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));  // cleanup
+}
diff --git a/fluss-rust/bindings/cpp/test/test_log_table.cpp b/fluss-rust/bindings/cpp/test/test_log_table.cpp
new file mode 100644
index 0000000000..47ab6f25c3
--- /dev/null
+++ b/fluss-rust/bindings/cpp/test/test_log_table.cpp
@@ -0,0 +1,831 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include <arrow/api.h>
+#include <gtest/gtest.h>
+
+#include <algorithm>
+#include <chrono>
+#include <thread>
+#include <tuple>
+
+#include "test_utils.h"
+
+class LogTableTest : public ::testing::Test {
+   protected:
+    // Single lookup point for the environment object that the accessors below delegate to.
+    static auto* Env() { return fluss_test::FlussTestEnvironment::Instance(); }
+
+    fluss::Admin& admin() { return Env()->GetAdmin(); }
+    fluss::Connection& connection() { return Env()->GetConnection(); }
+};
+
+TEST_F(LogTableTest, AppendRecordBatchAndScan) {
+    // Writes two Arrow batches to a 3-bucket log table, then scans them back flat and per bucket.
+    auto& adm = admin();
+    auto& conn = connection();
+    fluss::TablePath table_path("fluss", "test_append_record_batch_and_scan_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("c1", fluss::DataType::Int())
+                      .AddColumn("c2", fluss::DataType::String())
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetBucketCount(3)
+                                .SetBucketKeys({"c1"})
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    // One append writer is shared by both Arrow batches below
+    auto table_append = table.NewAppend();
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table_append.CreateWriter(append_writer));
+
+    // Batch 1 (c1 = 1..3); a failed builder append now aborts the test instead of being ignored
+    {
+        auto c1 = arrow::Int32Builder();
+        ASSERT_TRUE(c1.AppendValues({1, 2, 3}).ok());
+        auto c2 = arrow::StringBuilder();
+        ASSERT_TRUE(c2.AppendValues({"a1", "a2", "a3"}).ok());
+
+        auto batch = arrow::RecordBatch::Make(
+            arrow::schema({arrow::field("c1", arrow::int32()), arrow::field("c2", arrow::utf8())}),
+            3, {c1.Finish().ValueOrDie(), c2.Finish().ValueOrDie()});
+
+        ASSERT_OK(append_writer.AppendArrowBatch(batch));
+    }
+
+    {
+        auto c1 = arrow::Int32Builder();
+        ASSERT_TRUE(c1.AppendValues({4, 5, 6}).ok());
+        auto c2 = arrow::StringBuilder();
+        ASSERT_TRUE(c2.AppendValues({"a4", "a5", "a6"}).ok());
+
+        auto batch = arrow::RecordBatch::Make(
+            arrow::schema({arrow::field("c1", arrow::int32()), arrow::field("c2", arrow::utf8())}),
+            3, {c1.Finish().ValueOrDie(), c2.Finish().ValueOrDie()});
+
+        ASSERT_OK(append_writer.AppendArrowBatch(batch));
+    }
+
+    ASSERT_OK(append_writer.Flush());
+
+    // Fresh table handle for scanning; subscribe every bucket from the earliest offset
+    fluss::Table scan_table;
+    ASSERT_OK(conn.GetTable(table_path, scan_table));
+    int32_t num_buckets = scan_table.GetTableInfo().num_buckets;
+    ASSERT_EQ(num_buckets, 3) << "Table should have 3 buckets";
+
+    auto table_scan = scan_table.NewScan();
+    fluss::LogScanner log_scanner;
+    ASSERT_OK(table_scan.CreateLogScanner(log_scanner));
+
+    for (int32_t bucket_id = 0; bucket_id < num_buckets; ++bucket_id) {
+        ASSERT_OK(log_scanner.Subscribe(bucket_id, fluss::EARLIEST_OFFSET));
+    }
+
+    // Collect (c1, c2) pairs from all buckets; sorted below because arrival order is not asserted
+    std::vector<std::pair<int32_t, std::string>> records;
+    fluss_test::PollRecords(log_scanner, 6, [](const fluss::ScanRecord& rec) {
+        return std::make_pair(rec.row.GetInt32(0), std::string(rec.row.GetString(1)));
+    }, records);
+    ASSERT_EQ(records.size(), 6u) << "Expected 6 records";
+    std::sort(records.begin(), records.end());
+
+    std::vector<std::pair<int32_t, std::string>> expected = {
+        {1, "a1"}, {2, "a2"}, {3, "a3"}, {4, "a4"}, {5, "a5"}, {6, "a6"}};
+    EXPECT_EQ(records, expected);
+
+    // Second, independent scanner: read the same data through the per-bucket BucketView API
+    {
+        fluss::Table bucket_table;
+        ASSERT_OK(conn.GetTable(table_path, bucket_table));
+        auto bucket_scan = bucket_table.NewScan();
+        fluss::LogScanner bucket_scanner;
+        ASSERT_OK(bucket_scan.CreateLogScanner(bucket_scanner));
+
+        for (int32_t bid = 0; bid < num_buckets; ++bid) {
+            ASSERT_OK(bucket_scanner.Subscribe(bid, fluss::EARLIEST_OFFSET));
+        }
+
+        std::vector<std::pair<int32_t, std::string>> bucket_records;
+        auto bucket_deadline = std::chrono::steady_clock::now() + std::chrono::seconds(10);
+        size_t buckets_with_data = 0;
+        while (bucket_records.size() < 6 && std::chrono::steady_clock::now() < bucket_deadline) {
+            fluss::ScanRecords scan_records;
+            ASSERT_OK(bucket_scanner.Poll(500, scan_records));
+
+            // NOTE(review): counts non-empty views per poll, not distinct buckets.
+            for (size_t b = 0; b < scan_records.BucketCount(); ++b) {
+                auto bucket_view = scan_records.BucketAt(b);
+                if (!bucket_view.Empty()) {
+                    buckets_with_data++;
+                }
+                for (auto rec : bucket_view) {
+                    bucket_records.emplace_back(rec.row.GetInt32(0),
+                                                std::string(rec.row.GetString(1)));
+                }
+            }
+        }
+
+        ASSERT_EQ(bucket_records.size(), 6u) << "Expected 6 records via per-bucket iteration";
+        EXPECT_GT(buckets_with_data, 1u) << "Records should be distributed across multiple buckets";
+
+        std::sort(bucket_records.begin(), bucket_records.end());
+        EXPECT_EQ(bucket_records, expected);
+    }
+
+    // Unsubscribing bucket 0 on the first scanner must succeed
+    ASSERT_OK(log_scanner.Unsubscribe(0));
+
+    // Verify unsubscribe_partition fails on a non-partitioned table
+    auto unsub_result = log_scanner.UnsubscribePartition(0, 0);
+    ASSERT_FALSE(unsub_result.Ok())
+        << "unsubscribe_partition should fail on a non-partitioned table";
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, ListOffsets) {
+    // Checks Earliest/Latest/Timestamp offsets of bucket 0 before and after appending 3 rows.
+    auto& adm = admin();
+    auto& conn = connection();
+    fluss::TablePath table_path("fluss", "test_list_offsets_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    // Fixed 2 s pause, presumably to let the new table finish initializing
+    std::this_thread::sleep_for(std::chrono::seconds(2));
+
+    // Earliest offset should be 0 for empty table
+    std::unordered_map<int32_t, int64_t> earliest_offsets;
+    ASSERT_OK(adm.ListOffsets(table_path, {0}, fluss::OffsetSpec::Earliest(), earliest_offsets));
+    EXPECT_EQ(earliest_offsets[0], 0) << "Earliest offset should be 0 for bucket 0";
+
+    // Latest offset should be 0 for empty table
+    std::unordered_map<int32_t, int64_t> latest_offsets;
+    ASSERT_OK(adm.ListOffsets(table_path, {0}, fluss::OffsetSpec::Latest(), latest_offsets));
+    EXPECT_EQ(latest_offsets[0], 0) << "Latest offset should be 0 for empty table";
+
+    auto before_append_ms =
+        std::chrono::duration_cast<std::chrono::milliseconds>(
+            std::chrono::system_clock::now().time_since_epoch())
+            .count();
+
+    // Append 3 rows as one Arrow batch; builder failures abort the test instead of being ignored
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+    auto table_append = table.NewAppend();
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table_append.CreateWriter(append_writer));
+
+    {
+        auto id_builder = arrow::Int32Builder();
+        ASSERT_TRUE(id_builder.AppendValues({1, 2, 3}).ok());
+        auto name_builder = arrow::StringBuilder();
+        ASSERT_TRUE(name_builder.AppendValues({"alice", "bob", "charlie"}).ok());
+
+        auto batch = arrow::RecordBatch::Make(
+            arrow::schema(
+                {arrow::field("id", arrow::int32()), arrow::field("name", arrow::utf8())}),
+            3, {id_builder.Finish().ValueOrDie(), name_builder.Finish().ValueOrDie()});
+
+        ASSERT_OK(append_writer.AppendArrowBatch(batch));
+    }
+    ASSERT_OK(append_writer.Flush());
+
+    std::this_thread::sleep_for(std::chrono::seconds(1));
+
+    auto after_append_ms =
+        std::chrono::duration_cast<std::chrono::milliseconds>(
+            std::chrono::system_clock::now().time_since_epoch())
+            .count();
+
+    // Latest offset after appending should be 3
+    std::unordered_map<int32_t, int64_t> latest_after;
+    ASSERT_OK(adm.ListOffsets(table_path, {0}, fluss::OffsetSpec::Latest(), latest_after));
+    EXPECT_EQ(latest_after[0], 3) << "Latest offset should be 3 after appending 3 records";
+
+    // Earliest offset should still be 0
+    std::unordered_map<int32_t, int64_t> earliest_after;
+    ASSERT_OK(adm.ListOffsets(table_path, {0}, fluss::OffsetSpec::Earliest(), earliest_after));
+    EXPECT_EQ(earliest_after[0], 0) << "Earliest offset should still be 0";
+
+    // Wall-clock time captured before the append should resolve to offset 0
+    std::unordered_map<int32_t, int64_t> ts_offsets;
+    ASSERT_OK(adm.ListOffsets(table_path, {0}, fluss::OffsetSpec::Timestamp(before_append_ms),
+                              ts_offsets));
+    EXPECT_EQ(ts_offsets[0], 0)
+        << "Timestamp before append should resolve to offset 0";
+
+    // Wall-clock time captured 1 s after the flush should resolve to offset 3
+    std::unordered_map<int32_t, int64_t> ts_after_offsets;
+    ASSERT_OK(adm.ListOffsets(table_path, {0}, fluss::OffsetSpec::Timestamp(after_append_ms),
+                              ts_after_offsets));
+    EXPECT_EQ(ts_after_offsets[0], 3)
+        << "Timestamp after append should resolve to offset 3";
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, TestProject) {
+    // Scans a 3-column log table through a name-based and an index-based column projection.
+    auto& adm = admin();
+    auto& conn = connection();
+    fluss::TablePath table_path("fluss", "test_project_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("col_a", fluss::DataType::Int())
+                      .AddColumn("col_b", fluss::DataType::String())
+                      .AddColumn("col_c", fluss::DataType::Int())
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    // Append 3 rows as one Arrow batch; builder failures abort the test instead of being ignored
+    auto table_append = table.NewAppend();
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table_append.CreateWriter(append_writer));
+
+    {
+        auto col_a_builder = arrow::Int32Builder();
+        ASSERT_TRUE(col_a_builder.AppendValues({1, 2, 3}).ok());
+        auto col_b_builder = arrow::StringBuilder();
+        ASSERT_TRUE(col_b_builder.AppendValues({"x", "y", "z"}).ok());
+        auto col_c_builder = arrow::Int32Builder();
+        ASSERT_TRUE(col_c_builder.AppendValues({10, 20, 30}).ok());
+
+        auto batch = arrow::RecordBatch::Make(
+            arrow::schema({arrow::field("col_a", arrow::int32()),
+                           arrow::field("col_b", arrow::utf8()),
+                           arrow::field("col_c", arrow::int32())}),
+            3,
+            {col_a_builder.Finish().ValueOrDie(), col_b_builder.Finish().ValueOrDie(),
+             col_c_builder.Finish().ValueOrDie()});
+
+        ASSERT_OK(append_writer.AppendArrowBatch(batch));
+    }
+    ASSERT_OK(append_writer.Flush());
+
+    // Projection by name: col_b and col_c are read back at projected positions 0 and 1
+    {
+        fluss::Table proj_table;
+        ASSERT_OK(conn.GetTable(table_path, proj_table));
+        auto scan = proj_table.NewScan();
+        scan.ProjectByName({"col_b", "col_c"});
+        fluss::LogScanner scanner;
+        ASSERT_OK(scan.CreateLogScanner(scanner));
+
+        ASSERT_OK(scanner.Subscribe(0, 0));
+
+        fluss::ScanRecords records;
+        ASSERT_OK(scanner.Poll(10000, records));
+
+        ASSERT_EQ(records.Count(), 3u) << "Should have 3 records with project_by_name";
+
+        std::vector<std::string> expected_col_b = {"x", "y", "z"};
+        std::vector<int32_t> expected_col_c = {10, 20, 30};
+
+        // Collect and sort by col_c to get deterministic order
+        std::vector<std::pair<std::string, int32_t>> collected;
+        for (auto rec : records) {
+            collected.emplace_back(std::string(rec.row.GetString(0)), rec.row.GetInt32(1));
+        }
+        std::sort(collected.begin(), collected.end(),
+                  [](const auto& a, const auto& b) { return a.second < b.second; });
+
+        for (size_t i = 0; i < 3; ++i) {
+            EXPECT_EQ(collected[i].first, expected_col_b[i]) << "col_b mismatch at index " << i;
+            EXPECT_EQ(collected[i].second, expected_col_c[i]) << "col_c mismatch at index " << i;
+        }
+    }
+
+    // Projection by index {1, 0}: col_b comes first, col_a second (reordered vs. the schema)
+    {
+        fluss::Table proj_table;
+        ASSERT_OK(conn.GetTable(table_path, proj_table));
+        auto scan = proj_table.NewScan();
+        scan.ProjectByIndex({1, 0});
+        fluss::LogScanner scanner;
+        ASSERT_OK(scan.CreateLogScanner(scanner));
+
+        ASSERT_OK(scanner.Subscribe(0, 0));
+
+        fluss::ScanRecords records;
+        ASSERT_OK(scanner.Poll(10000, records));
+
+        ASSERT_EQ(records.Count(), 3u);
+
+        std::vector<std::string> expected_col_b = {"x", "y", "z"};
+        std::vector<int32_t> expected_col_a = {1, 2, 3};
+
+        std::vector<std::pair<std::string, int32_t>> collected;
+        for (auto rec : records) {
+            collected.emplace_back(std::string(rec.row.GetString(0)), rec.row.GetInt32(1));
+        }
+        std::sort(collected.begin(), collected.end(),
+                  [](const auto& a, const auto& b) { return a.second < b.second; });
+
+        for (size_t i = 0; i < 3; ++i) {
+            EXPECT_EQ(collected[i].first, expected_col_b[i]) << "col_b mismatch at index " << i;
+            EXPECT_EQ(collected[i].second, expected_col_a[i]) << "col_a mismatch at index " << i;
+        }
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, TestPollBatches) {
+    // Exercises the Arrow record-batch scanner: empty poll, offsets, mid-offset start, projection.
+    auto& adm = admin();
+    auto& conn = connection();
+    fluss::TablePath table_path("fluss", "test_poll_batches_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("name", fluss::DataType::String())
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    std::this_thread::sleep_for(std::chrono::seconds(1));
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    auto scan = table.NewScan();
+    fluss::LogScanner scanner;
+    ASSERT_OK(scan.CreateRecordBatchLogScanner(scanner));
+    ASSERT_OK(scanner.Subscribe(0, 0));
+
+    // Test 1: Empty table should return empty result
+    {
+        fluss::ArrowRecordBatches batches;
+        ASSERT_OK(scanner.PollRecordBatch(500, batches));
+        ASSERT_TRUE(batches.Empty());
+    }
+
+    // Writer plus a helper that builds an (id, name) Arrow batch from two parallel vectors
+    auto table_append = table.NewAppend();
+    fluss::AppendWriter writer;
+    ASSERT_OK(table_append.CreateWriter(writer));
+
+    auto make_batch = [](std::vector<int32_t> ids, std::vector<std::string> names) {
+        auto id_builder = arrow::Int32Builder();
+        EXPECT_TRUE(id_builder.AppendValues(ids).ok());
+        auto name_builder = arrow::StringBuilder();
+        EXPECT_TRUE(name_builder.AppendValues(names).ok());
+        return arrow::RecordBatch::Make(
+            arrow::schema(
+                {arrow::field("id", arrow::int32()), arrow::field("name", arrow::utf8())}),
+            static_cast<int64_t>(ids.size()),
+            {id_builder.Finish().ValueOrDie(), name_builder.Finish().ValueOrDie()});
+    };
+
+    ASSERT_OK(writer.AppendArrowBatch(make_batch({1, 2}, {"a", "b"})));
+    ASSERT_OK(writer.AppendArrowBatch(make_batch({3, 4}, {"c", "d"})));
+    ASSERT_OK(writer.AppendArrowBatch(make_batch({5, 6}, {"e", "f"})));
+    ASSERT_OK(writer.Flush());
+
+    // Flattens column 0 (read as Int32) of every polled batch into one vector, in batch order
+    auto extract_ids = [](const fluss::ArrowRecordBatches& batches) {
+        std::vector<int32_t> ids;
+        for (const auto& batch : batches) {
+            auto arr =
+                std::static_pointer_cast<arrow::Int32Array>(batch->GetArrowRecordBatch()->column(0));
+            for (int64_t i = 0; i < arr->length(); ++i) {
+                ids.push_back(arr->Value(i));
+            }
+        }
+        return ids;
+    };
+
+    // Test 2: Poll until we get all 6 records
+    std::vector<int32_t> all_ids;
+    fluss_test::PollRecordBatches(scanner, 6, extract_ids, all_ids);
+    ASSERT_EQ(all_ids, (std::vector<int32_t>{1, 2, 3, 4, 5, 6}));
+
+    // Test 3: Append more and verify offset continuation (no duplicates)
+    ASSERT_OK(writer.AppendArrowBatch(make_batch({7, 8}, {"g", "h"})));
+    ASSERT_OK(writer.Flush());
+
+    std::vector<int32_t> new_ids;
+    fluss_test::PollRecordBatches(scanner, 2, extract_ids, new_ids);
+    ASSERT_EQ(new_ids, (std::vector<int32_t>{7, 8}));
+
+    // Test 4: Subscribing at offset 3 (inside the second batch) must skip ids 1..3
+    {
+        fluss::Table trunc_table;
+        ASSERT_OK(conn.GetTable(table_path, trunc_table));
+        auto trunc_scan = trunc_table.NewScan();
+        fluss::LogScanner trunc_scanner;
+        ASSERT_OK(trunc_scan.CreateRecordBatchLogScanner(trunc_scanner));
+        ASSERT_OK(trunc_scanner.Subscribe(0, 3));
+
+        std::vector<int32_t> trunc_ids;
+        fluss_test::PollRecordBatches(trunc_scanner, 5, extract_ids, trunc_ids);
+        ASSERT_EQ(trunc_ids, (std::vector<int32_t>{4, 5, 6, 7, 8}));
+    }
+
+    // Test 5: Projection should only return requested columns
+    {
+        fluss::Table proj_table;
+        ASSERT_OK(conn.GetTable(table_path, proj_table));
+        auto proj_scan = proj_table.NewScan();
+        proj_scan.ProjectByName({"id"});
+        fluss::LogScanner proj_scanner;
+        ASSERT_OK(proj_scan.CreateRecordBatchLogScanner(proj_scanner));
+        ASSERT_OK(proj_scanner.Subscribe(0, 0));
+
+        fluss::ArrowRecordBatches proj_batches;
+        ASSERT_OK(proj_scanner.PollRecordBatch(10000, proj_batches));
+
+        ASSERT_FALSE(proj_batches.Empty());
+        EXPECT_EQ(proj_batches[0]->GetArrowRecordBatch()->num_columns(), 1)
+            << "Projected batch should have 1 column (id), not 2";
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, AllSupportedDatatypes) {
+    // Round-trips one fully populated row and one all-null row through a 16-column log table.
+    auto& adm = admin();
+    auto& conn = connection();
+    fluss::TablePath table_path("fluss", "test_log_all_datatypes_cpp");
+
+    // One column per datatype under test; the column order fixes the indices used below
+    auto schema =
+        fluss::Schema::NewBuilder()
+            .AddColumn("col_tinyint", fluss::DataType::TinyInt())
+            .AddColumn("col_smallint", fluss::DataType::SmallInt())
+            .AddColumn("col_int", fluss::DataType::Int())
+            .AddColumn("col_bigint", fluss::DataType::BigInt())
+            .AddColumn("col_float", fluss::DataType::Float())
+            .AddColumn("col_double", fluss::DataType::Double())
+            .AddColumn("col_boolean", fluss::DataType::Boolean())
+            .AddColumn("col_char", fluss::DataType::Char(10))
+            .AddColumn("col_string", fluss::DataType::String())
+            .AddColumn("col_decimal", fluss::DataType::Decimal(10, 2))
+            .AddColumn("col_date", fluss::DataType::Date())
+            .AddColumn("col_time", fluss::DataType::Time())
+            .AddColumn("col_timestamp", fluss::DataType::Timestamp())
+            .AddColumn("col_timestamp_ltz", fluss::DataType::TimestampLtz())
+            .AddColumn("col_bytes", fluss::DataType::Bytes())
+            .AddColumn("col_binary", fluss::DataType::Binary(4))
+            .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    size_t field_count = table.GetTableInfo().schema.columns.size();
+
+    auto table_append = table.NewAppend();
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table_append.CreateWriter(append_writer));
+
+    // Expected values for the populated row (integer columns hold each type's maximum)
+    int32_t col_tinyint = 127;
+    int32_t col_smallint = 32767;
+    int32_t col_int = 2147483647;
+    int64_t col_bigint = 9223372036854775807LL;
+    float col_float = 3.14f;
+    double col_double = 2.718281828459045;
+    bool col_boolean = true;
+    std::string col_char = "hello";
+    std::string col_string = "world of fluss rust client";
+    std::string col_decimal = "123.45";
+    auto col_date = fluss::Date::FromDays(20476);           // 2026-01-23
+    auto col_time = fluss::Time::FromMillis(36827000);       // 10:13:47
+    auto col_timestamp = fluss::Timestamp::FromMillisNanos(1769163227123, 456000);
+    auto col_timestamp_ltz = fluss::Timestamp::FromMillisNanos(1769163227123, 456000);
+    std::vector<uint8_t> col_bytes = {'b', 'i', 'n', 'a', 'r', 'y', ' ', 'd', 'a', 't', 'a'};
+    std::vector<uint8_t> col_binary = {0xDE, 0xAD, 0xBE, 0xEF};
+
+    // Row 1: every column set; tinyint and smallint are written through SetInt32
+    {
+        fluss::GenericRow row(field_count);
+        row.SetInt32(0, col_tinyint);
+        row.SetInt32(1, col_smallint);
+        row.SetInt32(2, col_int);
+        row.SetInt64(3, col_bigint);
+        row.SetFloat32(4, col_float);
+        row.SetFloat64(5, col_double);
+        row.SetBool(6, col_boolean);
+        row.SetString(7, col_char);
+        row.SetString(8, col_string);
+        row.SetDecimal(9, col_decimal);
+        row.SetDate(10, col_date);
+        row.SetTime(11, col_time);
+        row.SetTimestampNtz(12, col_timestamp);
+        row.SetTimestampLtz(13, col_timestamp_ltz);
+        row.SetBytes(14, col_bytes);
+        row.SetBytes(15, col_binary);
+        ASSERT_OK(append_writer.Append(row));
+    }
+
+    // Row 2: every column explicitly set to null
+    {
+        fluss::GenericRow row_with_nulls(field_count);
+        for (size_t i = 0; i < field_count; ++i) {
+            row_with_nulls.SetNull(i);
+        }
+        ASSERT_OK(append_writer.Append(row_with_nulls));
+    }
+
+    ASSERT_OK(append_writer.Flush());
+
+    // Read back bucket 0 from offset 0 through a separately obtained Table handle
+    fluss::Table scan_table;
+    ASSERT_OK(conn.GetTable(table_path, scan_table));
+    auto table_scan = scan_table.NewScan();
+    fluss::LogScanner log_scanner;
+    ASSERT_OK(table_scan.CreateLogScanner(log_scanner));
+    ASSERT_OK(log_scanner.Subscribe(0, 0));
+
+    // Collect 2 records via the fluss_test::PollRecords helper, keeping each ScanRecord as-is
+    std::vector<fluss::ScanRecord> all_records;
+    fluss_test::PollRecords(log_scanner, 2,
+        [](const fluss::ScanRecord& rec) { return rec; }, all_records);
+    ASSERT_EQ(all_records.size(), 2u) << "Expected 2 records";
+
+    // Record 0 must equal the populated row; timestamps are compared on millis and nanos
+    auto& row = all_records[0].row;
+
+    EXPECT_EQ(row.GetInt32(0), col_tinyint) << "col_tinyint mismatch";
+    EXPECT_EQ(row.GetInt32(1), col_smallint) << "col_smallint mismatch";
+    EXPECT_EQ(row.GetInt32(2), col_int) << "col_int mismatch";
+    EXPECT_EQ(row.GetInt64(3), col_bigint) << "col_bigint mismatch";
+    EXPECT_NEAR(row.GetFloat32(4), col_float, 1e-6f) << "col_float mismatch";
+    EXPECT_NEAR(row.GetFloat64(5), col_double, 1e-15) << "col_double mismatch";
+    EXPECT_EQ(row.GetBool(6), col_boolean) << "col_boolean mismatch";
+    EXPECT_EQ(row.GetString(7), col_char) << "col_char mismatch";
+    EXPECT_EQ(row.GetString(8), col_string) << "col_string mismatch";
+    EXPECT_EQ(row.GetDecimalString(9), col_decimal) << "col_decimal mismatch";
+    EXPECT_EQ(row.GetDate(10).days_since_epoch, col_date.days_since_epoch) << "col_date mismatch";
+    EXPECT_EQ(row.GetTime(11).millis_since_midnight, col_time.millis_since_midnight)
+        << "col_time mismatch";
+    EXPECT_EQ(row.GetTimestamp(12).epoch_millis, col_timestamp.epoch_millis)
+        << "col_timestamp millis mismatch";
+    EXPECT_EQ(row.GetTimestamp(12).nano_of_millisecond, col_timestamp.nano_of_millisecond)
+        << "col_timestamp nanos mismatch";
+    EXPECT_EQ(row.GetTimestamp(13).epoch_millis, col_timestamp_ltz.epoch_millis)
+        << "col_timestamp_ltz millis mismatch";
+    EXPECT_EQ(row.GetTimestamp(13).nano_of_millisecond, col_timestamp_ltz.nano_of_millisecond)
+        << "col_timestamp_ltz nanos mismatch";
+
+    auto [bytes_ptr, bytes_len] = row.GetBytes(14);
+    EXPECT_EQ(bytes_len, col_bytes.size()) << "col_bytes length mismatch";
+    EXPECT_TRUE(std::memcmp(bytes_ptr, col_bytes.data(), bytes_len) == 0)
+        << "col_bytes mismatch";
+
+    auto [binary_ptr, binary_len] = row.GetBytes(15);
+    EXPECT_EQ(binary_len, col_binary.size()) << "col_binary length mismatch";
+    EXPECT_TRUE(std::memcmp(binary_ptr, col_binary.data(), binary_len) == 0)
+        << "col_binary mismatch";
+
+    // Record 1 must report null for every column
+    auto& null_row = all_records[1].row;
+    for (size_t i = 0; i < field_count; ++i) {
+        EXPECT_TRUE(null_row.IsNull(i)) << "column " << i << " should be null";
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, PartitionedTableAppendScan) {
+    // Appends rows and Arrow batches to a table partitioned by region, then scans per partition.
+    auto& adm = admin();
+    auto& conn = connection();
+    fluss::TablePath table_path("fluss", "test_partitioned_log_append_cpp");
+
+    // Create a partitioned log table
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("region", fluss::DataType::String())
+                      .AddColumn("value", fluss::DataType::BigInt())
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetPartitionKeys({"region"})
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    // Create the two partitions written to below
+    fluss_test::CreatePartitions(adm, table_path, "region", {"US", "EU"});
+
+    // Fixed 2 s pause, presumably to let the new partitions become available
+    std::this_thread::sleep_for(std::chrono::seconds(2));
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    auto table_append = table.NewAppend();
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table_append.CreateWriter(append_writer));
+
+    // Row-by-row appends: two rows per region
+    struct TestData {
+        int32_t id;
+        std::string region;
+        int64_t value;
+    };
+    std::vector<TestData> test_data = {{1, "US", 100}, {2, "US", 200}, {3, "EU", 300}, {4, "EU", 400}};
+
+    for (const auto& d : test_data) {
+        fluss::GenericRow row(3);
+        row.SetInt32(0, d.id);
+        row.SetString(1, d.region);
+        row.SetInt64(2, d.value);
+        ASSERT_OK(append_writer.Append(row));
+    }
+    ASSERT_OK(append_writer.Flush());
+
+    // One Arrow batch per region; builder failures abort the test instead of being ignored
+    {
+        auto id_builder = arrow::Int32Builder();
+        ASSERT_TRUE(id_builder.AppendValues({5, 6}).ok());
+        auto region_builder = arrow::StringBuilder();
+        ASSERT_TRUE(region_builder.AppendValues({"US", "US"}).ok());
+        auto value_builder = arrow::Int64Builder();
+        ASSERT_TRUE(value_builder.AppendValues({500, 600}).ok());
+
+        auto batch = arrow::RecordBatch::Make(
+            arrow::schema({arrow::field("id", arrow::int32()),
+                           arrow::field("region", arrow::utf8()),
+                           arrow::field("value", arrow::int64())}),
+            2,
+            {id_builder.Finish().ValueOrDie(), region_builder.Finish().ValueOrDie(),
+             value_builder.Finish().ValueOrDie()});
+
+        ASSERT_OK(append_writer.AppendArrowBatch(batch));
+    }
+
+    {
+        auto id_builder = arrow::Int32Builder();
+        ASSERT_TRUE(id_builder.AppendValues({7, 8}).ok());
+        auto region_builder = arrow::StringBuilder();
+        ASSERT_TRUE(region_builder.AppendValues({"EU", "EU"}).ok());
+        auto value_builder = arrow::Int64Builder();
+        ASSERT_TRUE(value_builder.AppendValues({700, 800}).ok());
+
+        auto batch = arrow::RecordBatch::Make(
+            arrow::schema({arrow::field("id", arrow::int32()),
+                           arrow::field("region", arrow::utf8()),
+                           arrow::field("value", arrow::int64())}),
+            2,
+            {id_builder.Finish().ValueOrDie(), region_builder.Finish().ValueOrDie(),
+             value_builder.Finish().ValueOrDie()});
+
+        ASSERT_OK(append_writer.AppendArrowBatch(batch));
+    }
+    ASSERT_OK(append_writer.Flush());
+
+    // Each partition received 2 rows + 2 batch rows, so bucket 0's latest offset should be 4
+    std::unordered_map<int32_t, int64_t> us_offsets;
+    ASSERT_OK(adm.ListPartitionOffsets(table_path, "US", {0}, fluss::OffsetSpec::Latest(),
+                                       us_offsets));
+    EXPECT_EQ(us_offsets[0], 4) << "US partition should have 4 records";
+
+    std::unordered_map<int32_t, int64_t> eu_offsets;
+    ASSERT_OK(adm.ListPartitionOffsets(table_path, "EU", {0}, fluss::OffsetSpec::Latest(),
+                                       eu_offsets));
+    EXPECT_EQ(eu_offsets[0], 4) << "EU partition should have 4 records";
+
+    // Subscribe to all partitions and scan
+    fluss::Table scan_table;
+    ASSERT_OK(conn.GetTable(table_path, scan_table));
+    auto table_scan = scan_table.NewScan();
+    fluss::LogScanner log_scanner;
+    ASSERT_OK(table_scan.CreateLogScanner(log_scanner));
+
+    std::vector<fluss::PartitionInfo> partition_infos;
+    ASSERT_OK(adm.ListPartitionInfos(table_path, partition_infos));
+
+    for (const auto& pi : partition_infos) {
+        ASSERT_OK(log_scanner.SubscribePartitionBuckets(pi.partition_id, 0, 0));
+    }
+
+    // Collect (id, region, value) tuples; sorted below because arrival order is not asserted
+    using Record = std::tuple<int32_t, std::string, int64_t>;
+    auto extract_record = [](const fluss::ScanRecord& rec) -> Record {
+        return {rec.row.GetInt32(0), std::string(rec.row.GetString(1)), rec.row.GetInt64(2)};
+    };
+    std::vector<Record> collected;
+    fluss_test::PollRecords(log_scanner, 8, extract_record, collected);
+
+    ASSERT_EQ(collected.size(), 8u) << "Expected 8 records total";
+    std::sort(collected.begin(), collected.end());
+
+    std::vector<Record> expected = {{1, "US", 100},  {2, "US", 200},  {3, "EU", 300},
+                                    {4, "EU", 400},  {5, "US", 500},  {6, "US", 600},
+                                    {7, "EU", 700},  {8, "EU", 800}};
+    EXPECT_EQ(collected, expected);
+
+    // Test unsubscribe_partition: unsubscribe EU, should only get US data
+    {
+        fluss::Table unsub_table;
+        ASSERT_OK(conn.GetTable(table_path, unsub_table));
+        auto unsub_scan = unsub_table.NewScan();
+        fluss::LogScanner unsub_scanner;
+        ASSERT_OK(unsub_scan.CreateLogScanner(unsub_scanner));
+
+        int64_t eu_partition_id = -1;
+        for (const auto& pi : partition_infos) {
+            ASSERT_OK(unsub_scanner.SubscribePartitionBuckets(pi.partition_id, 0, 0));
+            if (pi.partition_name == "EU") {
+                eu_partition_id = pi.partition_id;
+            }
+        }
+        ASSERT_GE(eu_partition_id, 0) << "EU partition should exist";
+
+        ASSERT_OK(unsub_scanner.UnsubscribePartition(eu_partition_id, 0));
+
+        std::vector<Record> us_only;
+        fluss_test::PollRecords(unsub_scanner, 4, extract_record, us_only);
+
+        ASSERT_EQ(us_only.size(), 4u) << "Should receive exactly 4 US records";
+        for (const auto& [id, region, val] : us_only) {
+            EXPECT_EQ(region, "US") << "After unsubscribe EU, only US data should be read";
+        }
+    }
+
+    // Test subscribe_partition_buckets (batch subscribe)
+    {
+        fluss::Table batch_table;
+        ASSERT_OK(conn.GetTable(table_path, batch_table));
+        auto batch_scan = batch_table.NewScan();
+        fluss::LogScanner batch_scanner;
+        ASSERT_OK(batch_scan.CreateLogScanner(batch_scanner));
+
+        std::vector<fluss::PartitionBucketSubscription> subs;
+        for (const auto& pi : partition_infos) {
+            subs.push_back({pi.partition_id, 0, 0});
+        }
+        ASSERT_OK(batch_scanner.SubscribePartitionBuckets(subs));
+
+        std::vector<Record> batch_collected;
+        fluss_test::PollRecords(batch_scanner, 8, extract_record, batch_collected);
+        ASSERT_EQ(batch_collected.size(), 8u);
+        std::sort(batch_collected.begin(), batch_collected.end());
+        EXPECT_EQ(batch_collected, expected);
+    }
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
diff --git a/fluss-rust/bindings/cpp/test/test_main.cpp b/fluss-rust/bindings/cpp/test/test_main.cpp
new file mode 100644
index 0000000000..8c2e2d966f
--- /dev/null
+++ b/fluss-rust/bindings/cpp/test/test_main.cpp
@@ -0,0 +1,31 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include <gtest/gtest.h>
+
+#include "test_utils.h"
+
+int main(int argc, char** argv) {
+    // Let GoogleTest consume its own command-line flags before anything else runs.
+    ::testing::InitGoogleTest(&argc, argv);
+    // The environment's SetUp()/TearDown() manage the Fluss cluster for the whole run.
+    auto* cluster_env = fluss_test::FlussTestEnvironment::Instance();
+    ::testing::AddGlobalTestEnvironment(cluster_env);
+    return RUN_ALL_TESTS();
+}
diff --git a/fluss-rust/bindings/cpp/test/test_utils.h b/fluss-rust/bindings/cpp/test/test_utils.h
new file mode 100644
index 0000000000..bae523775f
--- /dev/null
+++ b/fluss-rust/bindings/cpp/test/test_utils.h
@@ -0,0 +1,349 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#pragma once
+
+#include <gtest/gtest.h>
+
+#include <algorithm>
+#include <chrono>
+#include <cstdint>
+#include <cstdio>
+#include <cstdlib>
+#include <cstring>
+#include <iostream>
+#include <string>
+#include <thread>
+#include <unordered_map>
+#include <vector>
+
+#ifdef _WIN32
+#include <winsock2.h>
+#include <ws2tcpip.h>
+#pragma comment(lib, "ws2_32.lib")
+#else
+#include <arpa/inet.h>
+#include <netinet/in.h>
+#include <sys/socket.h>
+#include <unistd.h>
+#endif
+
+#include "fluss.hpp"
+
+// Assert/expect that a fluss Result is OK; on failure its error_message is reported.
+// The argument is evaluated exactly once, so ASSERT_OK(admin.DropTable(...)) does not re-run
+// the call when building the failure message.
+#define ASSERT_OK(result) ASSERT_TRUE(::fluss_test::ResultToAssertion(result))
+#define EXPECT_OK(result) EXPECT_TRUE(::fluss_test::ResultToAssertion(result))
+
+namespace fluss_test {
+
+/// Convert a Result-like value (anything with Ok() and error_message) into a GoogleTest
+/// AssertionResult. Backs ASSERT_OK / EXPECT_OK so their argument is evaluated only once.
+template <typename ResultT>
+::testing::AssertionResult ResultToAssertion(ResultT&& result) {
+    if (result.Ok()) {
+        return ::testing::AssertionSuccess();
+    }
+    return ::testing::AssertionFailure() << result.error_message;
+}
+
+static constexpr const char* kFlussVersion = "0.7.0";
+static constexpr const char* kNetworkName = "fluss-cpp-test-network";
+static constexpr const char* kZookeeperName = "zookeeper-cpp-test";
+static constexpr const char* kCoordinatorName = "coordinator-server-cpp-test";
+static constexpr const char* kTabletServerName = "tablet-server-cpp-test";
+// Host ports the coordinator / tablet server CLIENT listeners are published on.
+static constexpr int kCoordinatorPort = 9123;
+static constexpr int kTabletServerPort = 9124;
+
+/// Execute a shell command and return the value reported by std::system().
+inline int RunCommand(const std::string& cmd) {
+    return std::system(cmd.c_str());
+}
+
+/// Wait until a TCP port is accepting connections, or timeout.
+///
+/// `host` must be a dotted-decimal IPv4 address (it is parsed with inet_pton, not resolved);
+/// returns false immediately if it cannot be parsed. Otherwise retries a connect every 500 ms
+/// and returns true on the first success, or false once `timeout_seconds` have elapsed.
+/// NOTE(review): on Windows, Winsock presumably needs WSAStartup() before socket() can
+/// succeed; nothing in this header calls it - confirm before relying on the _WIN32 path.
+inline bool WaitForPort(const std::string& host, int port, int timeout_seconds = 60) {
+    struct sockaddr_in addr {};
+    addr.sin_family = AF_INET;
+    addr.sin_port = htons(static_cast<uint16_t>(port));
+    // An unparsable host would leave sin_addr zeroed and probe the wrong address.
+    if (inet_pton(AF_INET, host.c_str(), &addr.sin_addr) != 1) {
+        return false;
+    }
+
+    auto deadline =
+        std::chrono::steady_clock::now() + std::chrono::seconds(timeout_seconds);
+
+    while (std::chrono::steady_clock::now() < deadline) {
+        int sock = socket(AF_INET, SOCK_STREAM, 0);
+        if (sock < 0) {
+            std::this_thread::sleep_for(std::chrono::milliseconds(500));
+            continue;
+        }
+
+        int result = connect(sock, reinterpret_cast<struct sockaddr*>(&addr), sizeof(addr));
+#ifdef _WIN32
+        closesocket(sock);
+#else
+        close(sock);
+#endif
+        if (result == 0) {
+            return true;
+        }
+
+        std::this_thread::sleep_for(std::chrono::milliseconds(500));
+    }
+    return false;
+}
+
+/// Manages a Docker-based Fluss cluster for integration testing.
+///
+/// If the FLUSS_BOOTSTRAP_SERVERS environment variable is set and non-empty, no containers
+/// are started and that address is used as-is (Stop() then becomes a no-op).
+class FlussTestCluster {
+   public:
+    FlussTestCluster() = default;
+
+    /// Start ZooKeeper, a coordinator and a tablet server via `docker run`, waiting for the
+    /// published ports to accept connections. Returns false if any step fails.
+    bool Start() {
+        const char* env_servers = std::getenv("FLUSS_BOOTSTRAP_SERVERS");
+        if (env_servers && std::strlen(env_servers) > 0) {
+            bootstrap_servers_ = env_servers;
+            external_cluster_ = true;
+            std::cout << "Using external cluster: " << bootstrap_servers_ << std::endl;
+            return true;
+        }
+
+        std::cout << "Starting Fluss cluster via Docker..." << std::endl;
+
+        // Create network
+        RunCommand(std::string("docker network create ") + kNetworkName + " 2>/dev/null || true");
+
+        // Start ZooKeeper
+        std::string zk_cmd = std::string("docker run -d --rm") +
+                              " --name " + kZookeeperName +
+                              " --network " + kNetworkName +
+                              " zookeeper:3.9.2";
+        if (RunCommand(zk_cmd) != 0) {
+            std::cerr << "Failed to start ZooKeeper" << std::endl;
+            return false;
+        }
+
+        // ZooKeeper's port is not published to the host, so there is nothing to probe;
+        // give it a fixed grace period before starting the Fluss servers.
+        std::this_thread::sleep_for(std::chrono::seconds(5));
+
+        // Start Coordinator Server. "\\n" is left for the shell's printf to expand.
+        std::string coord_props =
+            "zookeeper.address: " + std::string(kZookeeperName) + ":2181\\n"
+            "bind.listeners: INTERNAL://" + std::string(kCoordinatorName) + ":0, CLIENT://" +
+            std::string(kCoordinatorName) + ":9123\\n"
+            "advertised.listeners: CLIENT://localhost:" + std::to_string(kCoordinatorPort) + "\\n"
+            "internal.listener.name: INTERNAL\\n"
+            "netty.server.num-network-threads: 1\\n"
+            "netty.server.num-worker-threads: 3";
+
+        std::string coord_cmd = std::string("docker run -d --rm") +
+                                " --name " + kCoordinatorName +
+                                " --network " + kNetworkName +
+                                " -p " + std::to_string(kCoordinatorPort) + ":9123" +
+                                " -e FLUSS_PROPERTIES=\"$(printf '" + coord_props + "')\"" +
+                                " fluss/fluss:" + kFlussVersion +
+                                " coordinatorServer";
+        if (RunCommand(coord_cmd) != 0) {
+            std::cerr << "Failed to start Coordinator Server" << std::endl;
+            Stop();
+            return false;
+        }
+
+        // Wait for coordinator to be ready
+        if (!WaitForPort("127.0.0.1", kCoordinatorPort)) {
+            std::cerr << "Coordinator Server did not become ready" << std::endl;
+            Stop();
+            return false;
+        }
+
+        // Start Tablet Server
+        std::string ts_props =
+            "zookeeper.address: " + std::string(kZookeeperName) + ":2181\\n"
+            "bind.listeners: INTERNAL://" + std::string(kTabletServerName) + ":0, CLIENT://" +
+            std::string(kTabletServerName) + ":9123\\n"
+            "advertised.listeners: CLIENT://localhost:" + std::to_string(kTabletServerPort) + "\\n"
+            "internal.listener.name: INTERNAL\\n"
+            "tablet-server.id: 0\\n"
+            "netty.server.num-network-threads: 1\\n"
+            "netty.server.num-worker-threads: 3";
+
+        std::string ts_cmd = std::string("docker run -d --rm") +
+                             " --name " + kTabletServerName +
+                             " --network " + kNetworkName +
+                             " -p " + std::to_string(kTabletServerPort) + ":9123" +
+                             " -e FLUSS_PROPERTIES=\"$(printf '" + ts_props + "')\"" +
+                             " fluss/fluss:" + kFlussVersion +
+                             " tabletServer";
+        if (RunCommand(ts_cmd) != 0) {
+            std::cerr << "Failed to start Tablet Server" << std::endl;
+            Stop();
+            return false;
+        }
+
+        // Wait for tablet server to be ready
+        if (!WaitForPort("127.0.0.1", kTabletServerPort)) {
+            std::cerr << "Tablet Server did not become ready" << std::endl;
+            Stop();
+            return false;
+        }
+
+        bootstrap_servers_ = "127.0.0.1:" + std::to_string(kCoordinatorPort);
+        std::cout << "Fluss cluster started successfully." << std::endl;
+        return true;
+    }
+
+    /// Stop the containers and remove the network created by Start(). Errors are ignored;
+    /// does nothing when an external cluster is in use.
+    void Stop() {
+        if (external_cluster_) return;
+
+        std::cout << "Stopping Fluss cluster..." << std::endl;
+        RunCommand(std::string("docker stop ") + kTabletServerName + " 2>/dev/null || true");
+        RunCommand(std::string("docker stop ") + kCoordinatorName + " 2>/dev/null || true");
+        RunCommand(std::string("docker stop ") + kZookeeperName + " 2>/dev/null || true");
+        RunCommand(std::string("docker network rm ") + kNetworkName + " 2>/dev/null || true");
+        std::cout << "Fluss cluster stopped." << std::endl;
+    }
+
+    const std::string& GetBootstrapServers() const { return bootstrap_servers_; }
+
+   private:
+    std::string bootstrap_servers_;
+    bool external_cluster_{false};
+};
+
+/// GoogleTest Environment that manages the Fluss cluster lifecycle.
+class FlussTestEnvironment : public ::testing::Environment {
+   public:
+    /// Process-wide instance. It is intentionally never deleted here: it is meant to be
+    /// registered via ::testing::AddGlobalTestEnvironment(), which takes ownership of it.
+    static FlussTestEnvironment* Instance() {
+        static FlussTestEnvironment* instance = new FlussTestEnvironment();
+        return instance;
+    }
+
+    void SetUp() override {
+        if (!cluster_.Start()) {
+            GTEST_SKIP() << "Failed to start Fluss cluster. Skipping integration tests.";
+        }
+
+        // Retry connection creation until the coordinator is fully initialized.
+        fluss::Configuration config;
+        config.bootstrap_servers = cluster_.GetBootstrapServers();
+
+        auto deadline =
+            std::chrono::steady_clock::now() + std::chrono::seconds(60);
+        while (std::chrono::steady_clock::now() < deadline) {
+            auto result = fluss::Connection::Create(config, connection_);
+            if (result.Ok()) {
+                auto admin_result = connection_.GetAdmin(admin_);
+                if (admin_result.Ok()) {
+                    std::cout << "Connected to Fluss cluster." << std::endl;
+                    return;
+                }
+            }
+            std::cout << "Waiting for Fluss cluster to be ready..." << std::endl;
+            std::this_thread::sleep_for(std::chrono::seconds(2));
+        }
+        GTEST_SKIP() << "Fluss cluster did not become ready within timeout.";
+    }
+
+    void TearDown() override {
+        cluster_.Stop();
+    }
+
+    fluss::Connection& GetConnection() { return connection_; }
+    fluss::Admin& GetAdmin() { return admin_; }
+    const std::string& GetBootstrapServers() const { return cluster_.GetBootstrapServers(); }
+
+   private:
+    FlussTestEnvironment() = default;
+
+    FlussTestCluster cluster_;
+    fluss::Connection connection_;
+    fluss::Admin admin_;
+};
+
+/// Helper: create a table (assert success). Drops existing table first if it exists.
+/// The ASSERT only returns from this helper; callers that must stop on failure should check
+/// ::testing::Test::HasFatalFailure() (or wrap the call in ASSERT_NO_FATAL_FAILURE).
+inline void CreateTable(fluss::Admin& admin, const fluss::TablePath& path,
+                        const fluss::TableDescriptor& descriptor) {
+    admin.DropTable(path, true);  // ignore if not exists
+    auto result = admin.CreateTable(path, descriptor, false);
+    ASSERT_OK(result);
+}
+
+/// Helper: create partitions for a partitioned table.
+inline void CreatePartitions(fluss::Admin& admin, const fluss::TablePath& path,
+                             const std::string& partition_column,
+                             const std::vector<std::string>& values) {
+    for (const auto& value : values) {
+        std::unordered_map<std::string, std::string> spec;
+        spec[partition_column] = value;
+        auto result = admin.CreatePartition(path, spec, true);
+        ASSERT_OK(result);
+    }
+}
+
+/// Poll a LogScanner for ScanRecords until `expected_count` items are collected or timeout.
+/// `extract_fn` is called for each ScanRecord and should return a value of type T.
+template <typename T, typename ExtractFn>
+void PollRecords(fluss::LogScanner& scanner, size_t expected_count,
+                 ExtractFn extract_fn, std::vector<T>& out) {
+    auto deadline = std::chrono::steady_clock::now() + std::chrono::seconds(10);
+    while (out.size() < expected_count && std::chrono::steady_clock::now() < deadline) {
+        fluss::ScanRecords records;
+        ASSERT_OK(scanner.Poll(1000, records));
+        for (auto rec : records) {
+            out.push_back(extract_fn(rec));
+        }
+    }
+}
+
+/// Poll a LogScanner for ArrowRecordBatches until `expected_count` items are collected or timeout.
+/// `extract_fn` is called with the full ArrowRecordBatches and should return a std::vector<T>.
+template <typename T, typename ExtractFn>
+void PollRecordBatches(fluss::LogScanner& scanner, size_t expected_count,
+                       ExtractFn extract_fn, std::vector<T>& out) {
+    auto deadline = std::chrono::steady_clock::now() + std::chrono::seconds(10);
+    while (out.size() < expected_count && std::chrono::steady_clock::now() < deadline) {
+        fluss::ArrowRecordBatches batches;
+        ASSERT_OK(scanner.PollRecordBatch(1000, batches));
+        auto items = extract_fn(batches);
+        out.insert(out.end(), items.begin(), items.end());
+    }
+}
+
+}  // namespace fluss_test
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
index bfa9789734..dd1a4d4f3e 100644
--- a/fluss-rust/bindings/python/test/test_log_table.py
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -36,7 +36,9 @@ async def test_append_and_scan(connection, admin):
     schema = fluss.Schema(
         pa.schema([pa.field("c1", pa.int32()), pa.field("c2", pa.string())])
     )
-    table_descriptor = fluss.TableDescriptor(schema)
+    table_descriptor = fluss.TableDescriptor(
+        schema, bucket_count=3, bucket_keys=["c1"]
+    )
     await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
 
     table = await connection.get_table(table_path)
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 76420676c0..eac72e5c78 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -39,7 +39,7 @@ mod table_test {
     };
     use arrow::array::record_batch;
     use fluss::client::{EARLIEST_OFFSET, FlussTable, TableScan};
-    use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
+    use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
     use fluss::record::ScanRecord;
     use fluss::row::InternalRow;
     use fluss::rpc::message::OffsetSpec;
@@ -79,6 +79,7 @@ mod table_test {
                     .build()
                     .expect("Failed to build schema"),
             )
+            .distributed_by(Some(3), vec!["c1".to_string()])
             .build()
             .expect("Failed to build table");
 
@@ -127,38 +128,34 @@ mod table_test {
                 .expect("Failed to subscribe with EARLIEST_OFFSET");
         }
 
-        // Poll for records
-        let scan_records = log_scanner
-            .poll(tokio::time::Duration::from_secs(10))
-            .await
-            .expect("Failed to poll records");
-
-        // Verify the scanned records
-        let table_bucket = TableBucket::new(table.get_table_info().table_id, 0);
-        let records = scan_records.records(&table_bucket);
-
-        assert_eq!(records.len(), 6, "Expected 6 records");
-
-        // Verify record contents match what was appended
-        let expected_c1_values = vec![1, 2, 3, 4, 5, 6];
-        let expected_c2_values = vec!["a1", "a2", "a3", "a4", "a5", "a6"];
-
-        for (i, record) in records.iter().enumerate() {
-            let row = record.row();
-            assert_eq!(
-                row.get_int(0),
-                expected_c1_values[i],
-                "c1 value mismatch at row {}",
-                i
-            );
-            assert_eq!(
-                row.get_string(1),
-                expected_c2_values[i],
-                "c2 value mismatch at row {}",
-                i
-            );
+        // Poll for records across all buckets
+        let mut collected: Vec<(i32, String)> = Vec::new();
+        let start_time = std::time::Instant::now();
+        while collected.len() < 6 && start_time.elapsed() < Duration::from_secs(10) {
+            let scan_records = log_scanner
+                .poll(Duration::from_millis(500))
+                .await
+                .expect("Failed to poll records");
+            for rec in scan_records {
+                let row = rec.row();
+                collected.push((row.get_int(0), row.get_string(1).to_string()));
+            }
         }
 
+        assert_eq!(collected.len(), 6, "Expected 6 records");
+
+        // Sort and verify record contents
+        collected.sort();
+        let expected: Vec<(i32, String)> = vec![
+            (1, "a1".to_string()),
+            (2, "a2".to_string()),
+            (3, "a3".to_string()),
+            (4, "a4".to_string()),
+            (5, "a5".to_string()),
+            (6, "a6".to_string()),
+        ];
+        assert_eq!(collected, expected);
+
         // Test unsubscribe: unsubscribe from bucket 0, verify no error
         log_scanner
             .unsubscribe(0)

From 58e9de57c13b3a0c9296c7c4a2de37d0a10f53b5 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sun, 22 Feb 2026 02:57:48 +0000
Subject: [PATCH 163/287] chore: add notes on lake snapshot (#359)

---
 .../website/docs/user-guide/cpp/example/admin-operations.md   | 4 ++++
 .../docs/user-guide/python/example/admin-operations.md        | 4 ++++
 .../website/docs/user-guide/rust/example/admin-operations.md  | 4 ++++
 3 files changed, 12 insertions(+)

diff --git a/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md b/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md
index 850660ea3a..0f08549a0e 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/admin-operations.md
@@ -142,6 +142,10 @@ admin.ListPartitionOffsets(table_path, "partition_name",
 
 ## Lake Snapshot
 
+:::note
+Lake snapshots require [lake integration](https://fluss.apache.org/docs/maintenance/tiered-storage/overview/) (e.g. Paimon or Iceberg) to be enabled on the server. Without it, `GetLatestLakeSnapshot` will return an error.
+:::
+
 ```cpp
 fluss::LakeSnapshot snapshot;
 admin.GetLatestLakeSnapshot(table_path, snapshot);
diff --git a/fluss-rust/website/docs/user-guide/python/example/admin-operations.md b/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
index 4561a3fad6..ba3748a050 100644
--- a/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
+++ b/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
@@ -67,6 +67,10 @@ offsets = await admin.list_partition_offsets(table_path, partition_name="US", bu
 
 ## Lake Snapshot
 
+:::note
+Lake snapshots require [lake integration](https://fluss.apache.org/docs/maintenance/tiered-storage/overview/) (e.g. Paimon or Iceberg) to be enabled on the server. Without it, `get_latest_lake_snapshot` will raise an error.
+:::
+
 ```python
 snapshot = await admin.get_latest_lake_snapshot(table_path)
 print(f"Snapshot ID: {snapshot.snapshot_id}")
diff --git a/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md b/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md
index 7fcc4017a6..d18ad0eca5 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md
@@ -112,6 +112,10 @@ let partition_offsets = admin.list_partition_offsets(
 
 ## Lake Snapshot
 
+:::note
+Lake snapshots require [lake integration](https://fluss.apache.org/docs/maintenance/tiered-storage/overview/) (e.g. Paimon or Iceberg) to be enabled on the server. Without it, `get_latest_lake_snapshot` will return an error.
+:::
+
 ```rust
 let snapshot = admin.get_latest_lake_snapshot(&table_path).await?;
 println!("Snapshot ID: {}", snapshot.snapshot_id);

From 60d3f41e6e63ee65613bf66ae2dca786e91546c9 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 22 Feb 2026 02:59:32 +0000
Subject: [PATCH 164/287] chore: introduce max poll records config option
 (#355)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |  2 +
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |  1 +
 fluss-rust/bindings/cpp/src/lib.rs            |  2 +
 fluss-rust/bindings/python/fluss/__init__.pyi |  4 ++
 fluss-rust/bindings/python/src/config.rs      | 56 ++++++++++++++-----
 .../crates/fluss/src/client/table/scanner.rs  |  5 +-
 fluss-rust/crates/fluss/src/config.rs         |  7 +++
 .../docs/user-guide/cpp/api-reference.md      |  1 +
 .../docs/user-guide/python/api-reference.md   | 15 ++---
 .../python/example/configuration.md           |  3 +
 .../docs/user-guide/rust/api-reference.md     |  1 +
 11 files changed, 73 insertions(+), 24 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 9ea7e416fc..9a62828c01 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -983,6 +983,8 @@ struct Configuration {
     size_t scanner_remote_log_prefetch_num{4};
     // Number of threads for downloading remote log data
     size_t remote_file_download_thread_num{3};
+    // Maximum number of records returned in a single call to Poll() for LogScanner
+    size_t scanner_log_max_poll_records{500};
 };
 
 class Connection {
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index cff1a849a2..370429bc97 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -53,6 +53,7 @@ inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi_config.writer_batch_size = config.writer_batch_size;
     ffi_config.scanner_remote_log_prefetch_num = config.scanner_remote_log_prefetch_num;
     ffi_config.remote_file_download_thread_num = config.remote_file_download_thread_num;
+    ffi_config.scanner_log_max_poll_records = config.scanner_log_max_poll_records;
     return ffi_config;
 }
 
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 9f987b94a9..fad98cf10f 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -45,6 +45,7 @@ mod ffi {
         writer_batch_size: i32,
         scanner_remote_log_prefetch_num: usize,
         remote_file_download_thread_num: usize,
+        scanner_log_max_poll_records: usize,
     }
 
     struct FfiResult {
@@ -614,6 +615,7 @@ fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
         writer_batch_size: config.writer_batch_size,
         scanner_remote_log_prefetch_num: config.scanner_remote_log_prefetch_num,
         remote_file_download_thread_num: config.remote_file_download_thread_num,
+        scanner_log_max_poll_records: config.scanner_log_max_poll_records,
     };
 
     let conn = RUNTIME.block_on(async { fcore::client::FlussConnection::new(config).await });
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 4b7fa4e845..6f9ae0b35d 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -161,6 +161,10 @@ class Config:
     def remote_file_download_thread_num(self) -> int: ...
     @remote_file_download_thread_num.setter
     def remote_file_download_thread_num(self, num: int) -> None: ...
+    @property
+    def scanner_log_max_poll_records(self) -> int: ...
+    @scanner_log_max_poll_records.setter
+    def scanner_log_max_poll_records(self, num: int) -> None: ...
 
 class FlussConnection:
     @staticmethod
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index 237ab6fae0..fdf90b7ee1 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -43,32 +43,46 @@ impl Config {
                         config.bootstrap_servers = value;
                     }
                     "writer.request-max-size" => {
-                        if let Ok(size) = value.parse::<i32>() {
-                            config.writer_request_max_size = size;
-                        }
+                        config.writer_request_max_size = value.parse::<i32>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
+                        })?;
                     }
                     "writer.acks" => {
                         config.writer_acks = value;
                     }
                     "writer.retries" => {
-                        if let Ok(retries) = value.parse::<i32>() {
-                            config.writer_retries = retries;
-                        }
+                        config.writer_retries = value.parse::<i32>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
+                        })?;
                     }
                     "writer.batch-size" => {
-                        if let Ok(size) = value.parse::<i32>() {
-                            config.writer_batch_size = size;
-                        }
+                        config.writer_batch_size = value.parse::<i32>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
+                        })?;
                     }
                     "scanner.remote-log.prefetch-num" => {
-                        if let Ok(num) = value.parse::<usize>() {
-                            config.scanner_remote_log_prefetch_num = num;
-                        }
+                        config.scanner_remote_log_prefetch_num =
+                            value.parse::<usize>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
                     }
                     "remote-file.download-thread-num" => {
-                        if let Ok(num) = value.parse::<usize>() {
-                            config.remote_file_download_thread_num = num;
-                        }
+                        config.remote_file_download_thread_num =
+                            value.parse::<usize>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
+                    }
+                    "scanner.log.max-poll-records" => {
+                        config.scanner_log_max_poll_records =
+                            value.parse::<usize>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
                     }
                     _ => {
                         return Err(FlussError::new_err(format!("Unknown property: {key}")));
@@ -163,6 +177,18 @@ impl Config {
     fn set_remote_file_download_thread_num(&mut self, num: usize) {
         self.inner.remote_file_download_thread_num = num;
     }
+
+    /// Maximum number of records a single LogScanner `poll()` call returns.
+    #[getter]
+    fn scanner_log_max_poll_records(&self) -> usize {
+        self.inner.scanner_log_max_poll_records
+    }
+
+    /// Set the max records per LogScanner `poll()` call; stored as-is, with no validation here.
+    #[setter]
+    fn set_scanner_log_max_poll_records(&mut self, num: usize) {
+        self.inner.scanner_log_max_poll_records = num;
+    }
 }
 
 impl Config {
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 0900267b80..4b6f809567 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -636,6 +636,7 @@ struct LogFetcher {
     security_token_manager: Arc<SecurityTokenManager>,
     log_fetch_buffer: Arc<LogFetchBuffer>,
     nodes_with_pending_fetch_requests: Arc<Mutex<HashSet<i32>>>,
+    max_poll_records: usize,
 }
 
 struct FetchResponseContext {
@@ -694,6 +695,7 @@ impl LogFetcher {
             security_token_manager,
             log_fetch_buffer,
             nodes_with_pending_fetch_requests: Arc::new(Mutex::new(HashSet::new())),
+            max_poll_records: config.scanner_log_max_poll_records,
         })
     }
 
@@ -1092,9 +1094,8 @@ impl LogFetcher {
     /// Collect completed fetches from buffer
     /// Reference: LogFetchCollector.collectFetch in Java
     fn collect_fetches(&self) -> Result<HashMap<TableBucket, Vec<ScanRecord>>> {
-        const MAX_POLL_RECORDS: usize = 500; // Default max poll records
         let mut result: HashMap<TableBucket, Vec<ScanRecord>> = HashMap::new();
-        let mut records_remaining = MAX_POLL_RECORDS;
+        let mut records_remaining = self.max_poll_records;
 
         let collect_result: Result<()> = {
             while records_remaining > 0 {
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 92f0b0d95c..ecf7e122b7 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -24,6 +24,7 @@ const DEFAULT_WRITER_BATCH_SIZE: i32 = 2 * 1024 * 1024;
 const DEFAULT_RETRIES: i32 = i32::MAX;
 const DEFAULT_PREFETCH_NUM: usize = 4;
 const DEFAULT_DOWNLOAD_THREADS: usize = 3;
+const DEFAULT_MAX_POLL_RECORDS: usize = 500;
 
 const DEFAULT_ACKS: &str = "all";
 
@@ -54,6 +55,11 @@ pub struct Config {
     /// Default: 3 (matching Java REMOTE_FILE_DOWNLOAD_THREAD_NUM)
     #[arg(long, default_value_t = DEFAULT_DOWNLOAD_THREADS)]
     pub remote_file_download_thread_num: usize,
+
+    /// Maximum number of records returned in a single call to poll() for LogScanner.
+    /// Default: 500 (matching Java CLIENT_SCANNER_LOG_MAX_POLL_RECORDS)
+    #[arg(long, default_value_t = DEFAULT_MAX_POLL_RECORDS)]
+    pub scanner_log_max_poll_records: usize,
 }
 
 impl Default for Config {
@@ -66,6 +72,7 @@ impl Default for Config {
             writer_batch_size: DEFAULT_WRITER_BATCH_SIZE,
             scanner_remote_log_prefetch_num: DEFAULT_PREFETCH_NUM,
             remote_file_download_thread_num: DEFAULT_DOWNLOAD_THREADS,
+            scanner_log_max_poll_records: DEFAULT_MAX_POLL_RECORDS,
         }
     }
 }
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index 433c5da9de..c18778b290 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -24,6 +24,7 @@ Complete API reference for the Fluss C++ client.
 | `writer_batch_size`               | `int32_t`     | `2097152` (2 MB)     | Batch size for writes in bytes                                  |
 | `scanner_remote_log_prefetch_num` | `size_t`      | `4`                  | Number of remote log segments to prefetch                       |
 | `remote_file_download_thread_num` | `size_t`      | `3`                  | Number of threads for remote log downloads                      |
+| `scanner_log_max_poll_records`    | `size_t`      | `500`                | Maximum number of records returned in a single Poll()           |
 
 ## `Connection`
 
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index 27a57dc1b8..fa62fd9a7e 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -10,13 +10,14 @@ Complete API reference for the Fluss Python client.
 | Method / Property                  | Description                                               |
 |------------------------------------|-----------------------------------------------------------|
 | `Config(properties: dict = None)`  | Create config from a dict of key-value pairs              |
-| `.bootstrap_servers`               | Get/set coordinator server address                        |
-| `.writer_request_max_size`         | Get/set max request size in bytes                         |
-| `.writer_acks`                     | Get/set acknowledgment setting (`"all"` for all replicas) |
-| `.writer_retries`                  | Get/set number of retries on failure                      |
-| `.writer_batch_size`               | Get/set write batch size in bytes                         |
-| `.scanner_remote_log_prefetch_num` | Get/set number of remote log segments to prefetch         |
-| `.remote_file_download_thread_num` | Get/set number of threads for remote log downloads        |
+| `bootstrap_servers`                | Get/set coordinator server address                        |
+| `writer_request_max_size`          | Get/set max request size in bytes                         |
+| `writer_acks`                      | Get/set acknowledgment setting (`"all"` for all replicas) |
+| `writer_retries`                   | Get/set number of retries on failure                      |
+| `writer_batch_size`                | Get/set write batch size in bytes                         |
+| `scanner_remote_log_prefetch_num`  | Get/set number of remote log segments to prefetch         |
+| `remote_file_download_thread_num`  | Get/set number of threads for remote log downloads        |
+| `scanner_log_max_poll_records`     | Get/set max number of records returned in a single poll() |
 
 ## `FlussConnection`
 
diff --git a/fluss-rust/website/docs/user-guide/python/example/configuration.md b/fluss-rust/website/docs/user-guide/python/example/configuration.md
index 9686fc6247..f2828c4f90 100644
--- a/fluss-rust/website/docs/user-guide/python/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/python/example/configuration.md
@@ -28,6 +28,9 @@ with await fluss.FlussConnection.create(config) as conn:
 | `writer.acks`       | Acknowledgment setting (`all` waits for all replicas) | `all`              |
 | `writer.retries`    | Number of retries on failure                          | `2147483647`       |
 | `writer.batch-size` | Batch size for writes in bytes                        | `2097152` (2 MB)   |
+| `scanner.remote-log.prefetch-num` | Number of remote log segments to prefetch | `4`                |
+| `remote-file.download-thread-num` | Number of threads for remote log downloads | `3`               |
+| `scanner.log.max-poll-records` | Max records returned in a single poll()       | `500`              |
 
 Remember to close the connection when done:
 
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 0134fbce31..a38cd7d034 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -16,6 +16,7 @@ Complete API reference for the Fluss Rust client.
 | `writer_batch_size`               | `i32`    | `2097152` (2 MB)   | Batch size for writes in bytes                          |
 | `scanner_remote_log_prefetch_num` | `usize`  | `4`                | Number of remote log segments to prefetch               |
 | `remote_file_download_thread_num` | `usize`  | `3`                | Number of threads for remote log downloads              |
+| `scanner_log_max_poll_records`    | `usize`  | `500`              | Maximum number of records returned in a single poll()   |
 
 ## `FlussConnection`
 

From 30a8bae774b58235f91088e21c394dd9d9719ace Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqidong1991@gmail.com>
Date: Sun, 22 Feb 2026 15:41:08 +0100
Subject: [PATCH 165/287] chore: fix broken link and version mismatch in README
 (#364)

---
 fluss-rust/README.md | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/fluss-rust/README.md b/fluss-rust/README.md
index dafe19c880..a88ec2f3ae 100644
--- a/fluss-rust/README.md
+++ b/fluss-rust/README.md
@@ -24,10 +24,10 @@ If your cluster does not fulfill these software requirements you will need to in
 Fluss requires the JAVA_HOME environment variable to be set on all nodes and point to the directory of your Java installation.
 
 #### Fluss Setup
-Go to the [downloads](https://fluss.apache.org/downloads/) page and download the Fluss-0.6.0. Make sure to pick the Fluss package matching your Java version. After downloading the latest release, extract it:
+Go to the [downloads](https://fluss.apache.org/downloads/) page and download the latest Fluss release (currently 0.8.0). Make sure to pick the Fluss package matching your Java version. After downloading the latest release, extract it:
 ```shell
-tar -xzf fluss-0.7-SNAPSHOT-bin.tgz
-cd fluss-0.7-SNAPSHOT/
+tar -xzf fluss-0.8.0-incubating-bin.tgz
+cd fluss-0.8.0-incubating/
 ```
 You can start Fluss local cluster by running the following command:
 ```shell
@@ -118,7 +118,7 @@ Then, stop your Fluss cluster. Go to your Fluss home, stop it via the following
 ## Documentation
 
 - [Development Guide](DEVELOPMENT.md) – Build, test, and contribute to fluss-rust.
-- [Release Guide](docs/creating-a-release.md) – How to build, release, and sign official Fluss client packages (Rust, Python, C++).
+- [Release Guide](website/docs/release/create-release.md) – How to build, release, and sign official Fluss client packages (Rust, Python, C++).
 
 ## License
 

From d1d8323810e9363bbe4fe6b5dfbef34e10e46cb4 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Mon, 23 Feb 2026 13:22:07 +0000
Subject: [PATCH 166/287] chore: fix IT failure from additional table
 properties (#368)

---
 .../crates/fluss/tests/integration/admin.rs      | 16 +++++++++++-----
 1 file changed, 11 insertions(+), 5 deletions(-)

diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index 121158c1d5..c0745dc6a1 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -200,11 +200,17 @@ mod admin_test {
             "Bucket keys mismatch"
         );
 
-        assert_eq!(
-            table_info.get_properties(),
-            table_descriptor.properties(),
-            "Properties mismatch"
-        );
+        // The server may add extra default properties, so verify that all
+        // expected properties are present rather than requiring an exact match.
+        let actual_props = table_info.get_properties();
+        for (key, value) in table_descriptor.properties() {
+            assert_eq!(
+                actual_props.get(key),
+                Some(value),
+                "Property mismatch for key '{}'",
+                key
+            );
+        }
 
         // drop table
         admin

From 6fd0ab205aef7e7a3ce721517b7ca64c276c6255 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Tue, 24 Feb 2026 03:51:11 +0000
Subject: [PATCH 167/287] chore: rename BucketView to BucketRecords (#370)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     | 26 +++++++++----------
 fluss-rust/bindings/cpp/src/lib.rs            |  2 +-
 fluss-rust/bindings/cpp/src/table.cpp         | 20 +++++++-------
 .../bindings/cpp/test/test_log_table.cpp      |  8 +++---
 .../docs/user-guide/cpp/api-reference.md      |  8 +++---
 5 files changed, 32 insertions(+), 32 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 9a62828c01..6b56ba20bc 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -705,14 +705,14 @@ struct ScanRecord {
     RowView row;
 };
 
-/// A view into a subset of scan results for a single bucket.
+/// A bundle of scan records belonging to a single bucket.
 ///
-/// BucketView is a value type — it shares ownership of the underlying scan data
+/// BucketRecords is a value type — it shares ownership of the underlying scan data
 /// via reference counting, so it can safely outlive the ScanRecords that produced it.
-class BucketView {
+class BucketRecords {
    public:
-    BucketView(std::shared_ptr<const detail::ScanData> data, TableBucket bucket, size_t bucket_idx,
-               size_t count)
+    BucketRecords(std::shared_ptr<const detail::ScanData> data, TableBucket bucket,
+                  size_t bucket_idx, size_t count)
         : data_(std::move(data)),
           bucket_(std::move(bucket)),
           bucket_idx_(bucket_idx),
@@ -738,9 +738,9 @@ class BucketView {
         bool operator!=(const Iterator& other) const { return idx_ != other.idx_; }
 
        private:
-        friend class BucketView;
-        Iterator(const BucketView* owner, size_t idx) : owner_(owner), idx_(idx) {}
-        const BucketView* owner_;
+        friend class BucketRecords;
+        Iterator(const BucketRecords* owner, size_t idx) : owner_(owner), idx_(idx) {}
+        const BucketRecords* owner_;
         size_t idx_;
     };
 
@@ -774,16 +774,16 @@ class ScanRecords {
     /// List of distinct buckets that have records.
     std::vector<TableBucket> Buckets() const;
 
-    /// Get a view of records for a specific bucket.
+    /// Get records for a specific bucket.
     ///
-    /// Returns an empty BucketView if the bucket is not present (matches Rust/Java).
+    /// Returns an empty BucketRecords if the bucket is not present (matches Rust/Java).
     /// Note: O(B) linear scan. For iteration over all buckets, prefer BucketAt(idx).
-    BucketView Records(const TableBucket& bucket) const;
+    BucketRecords Records(const TableBucket& bucket) const;
 
-    /// Get a view of records by bucket index (0-based). O(1).
+    /// Get records by bucket index (0-based). O(1).
     ///
     /// Throws std::out_of_range if idx >= BucketCount().
-    BucketView BucketAt(size_t idx) const;
+    BucketRecords BucketAt(size_t idx) const;
 
     /// Flat iterator over all records across all buckets (matches Java Iterable<ScanRecord>).
     class Iterator {
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index fad98cf10f..5a1b3dbdb8 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -2061,7 +2061,7 @@ impl ScanResultInner {
         self.columns.len()
     }
 
-    // Field accessors — C++ validates bounds in BucketView/RecordAt, validate() checks field.
+    // Field accessors — C++ validates bounds in BucketRecords/RecordAt, validate() checks field.
     fn sv_is_null(&self, bucket: usize, rec: usize, field: usize) -> Result<bool, String> {
         row_reader::is_null(self.resolve(bucket, rec).row(), &self.columns, field)
     }
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index 73035bb9b9..b0b7029d22 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -334,21 +334,21 @@ std::vector<TableBucket> ScanRecords::Buckets() const {
     return result;
 }
 
-BucketView ScanRecords::Records(const TableBucket& bucket) const {
+BucketRecords ScanRecords::Records(const TableBucket& bucket) const {
     if (!data_) {
-        return BucketView({}, bucket, 0, 0);
+        return BucketRecords({}, bucket, 0, 0);
     }
     const auto& infos = data_->raw->sv_bucket_infos();
     for (size_t i = 0; i < infos.size(); ++i) {
         TableBucket tb = to_table_bucket(infos[i]);
         if (tb == bucket) {
-            return BucketView(data_, std::move(tb), i, infos[i].record_count);
+            return BucketRecords(data_, std::move(tb), i, infos[i].record_count);
         }
     }
-    return BucketView({}, bucket, 0, 0);
+    return BucketRecords({}, bucket, 0, 0);
 }
 
-BucketView ScanRecords::BucketAt(size_t idx) const {
+BucketRecords ScanRecords::BucketAt(size_t idx) const {
     if (!data_) {
         throw std::logic_error("ScanRecords: not available (moved-from or null)");
     }
@@ -357,12 +357,12 @@ BucketView ScanRecords::BucketAt(size_t idx) const {
         throw std::out_of_range("ScanRecords::BucketAt: index " + std::to_string(idx) +
                                 " out of range (" + std::to_string(infos.size()) + " buckets)");
     }
-    return BucketView(data_, to_table_bucket(infos[idx]), idx, infos[idx].record_count);
+    return BucketRecords(data_, to_table_bucket(infos[idx]), idx, infos[idx].record_count);
 }
 
-ScanRecord BucketView::operator[](size_t idx) const {
+ScanRecord BucketRecords::operator[](size_t idx) const {
     if (idx >= count_) {
-        throw std::out_of_range("BucketView: index " + std::to_string(idx) + " out of range (" +
+        throw std::out_of_range("BucketRecords: index " + std::to_string(idx) + " out of range (" +
                                 std::to_string(count_) + " records)");
     }
     return ScanRecord{data_->raw->sv_offset(bucket_idx_, idx),
@@ -371,7 +371,7 @@ ScanRecord BucketView::operator[](size_t idx) const {
                       RowView(data_, bucket_idx_, idx)};
 }
 
-ScanRecord BucketView::Iterator::operator*() const { return owner_->operator[](idx_); }
+ScanRecord BucketRecords::Iterator::operator*() const { return owner_->operator[](idx_); }
 
 // ============================================================================
 // LookupResult — backed by opaque Rust LookupResultInner
@@ -1146,7 +1146,7 @@ Result LogScanner::Poll(int64_t timeout_ms, ScanRecords& out) {
 
     // Wrap raw pointer in ScanData immediately so it's never leaked on exception.
     auto data = std::make_shared<detail::ScanData>(result_box.into_raw(), detail::ColumnMap{});
-    // Build column map eagerly — shared by all RowViews/BucketViews.
+    // Build column map eagerly — shared by all RowViews/BucketRecords.
     auto col_count = data->raw->sv_column_count();
     for (size_t i = 0; i < col_count; ++i) {
         auto name = data->raw->sv_column_name(i);
diff --git a/fluss-rust/bindings/cpp/test/test_log_table.cpp b/fluss-rust/bindings/cpp/test/test_log_table.cpp
index 47ab6f25c3..7d316faf34 100644
--- a/fluss-rust/bindings/cpp/test/test_log_table.cpp
+++ b/fluss-rust/bindings/cpp/test/test_log_table.cpp
@@ -119,7 +119,7 @@ TEST_F(LogTableTest, AppendRecordBatchAndScan) {
         {1, "a1"}, {2, "a2"}, {3, "a3"}, {4, "a4"}, {5, "a5"}, {6, "a6"}};
     EXPECT_EQ(records, expected);
 
-    // Verify per-bucket iteration via BucketView
+    // Verify per-bucket iteration via BucketRecords
     {
         fluss::Table bucket_table;
         ASSERT_OK(conn.GetTable(table_path, bucket_table));
@@ -140,11 +140,11 @@ TEST_F(LogTableTest, AppendRecordBatchAndScan) {
 
             // Iterate by bucket
             for (size_t b = 0; b < scan_records.BucketCount(); ++b) {
-                auto bucket_view = scan_records.BucketAt(b);
-                if (!bucket_view.Empty()) {
+                auto bkt_records = scan_records.BucketAt(b);
+                if (!bkt_records.Empty()) {
                     buckets_with_data++;
                 }
-                for (auto rec : bucket_view) {
+                for (auto rec : bkt_records) {
                     bucket_records.emplace_back(rec.row.GetInt32(0),
                                                 std::string(rec.row.GetString(1)));
                 }
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index c18778b290..30d89a9c23 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -282,12 +282,12 @@ for (const auto& rec : records) {
 |-----------------------------------------------------------------|-----------------------------------------------------------------------|
 | `BucketCount() -> size_t`                                       | Number of distinct buckets                                            |
 | `Buckets() -> std::vector<TableBucket>`                         | List of distinct buckets                                              |
-| `Records(const TableBucket& bucket) -> BucketView`              | Records for a specific bucket (empty view if bucket not present)      |
-| `BucketAt(size_t idx) -> BucketView`                            | Records by bucket index (0-based, O(1))                               |
+| `Records(const TableBucket& bucket) -> BucketRecords`              | Records for a specific bucket (empty if bucket not present)           |
+| `BucketAt(size_t idx) -> BucketRecords`                            | Records by bucket index (0-based, O(1))                               |
 
-## `BucketView`
+## `BucketRecords`
 
-A view of records within a single bucket. Obtained from `ScanRecords::Records()` or `ScanRecords::BucketAt()`. `BucketView` is a value type — it shares ownership of the underlying scan data via reference counting, so it can safely outlive the `ScanRecords` that produced it.
+A bundle of scan records belonging to a single bucket. Obtained from `ScanRecords::Records()` or `ScanRecords::BucketAt()`. `BucketRecords` is a value type — it shares ownership of the underlying scan data via reference counting, so it can safely outlive the `ScanRecords` that produced it.
 
 | Method                                         |  Description                               |
 |------------------------------------------------|--------------------------------------------|

From 48624420c5a670e3346114fc80eacb995298d2ff Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Wed, 25 Feb 2026 02:05:48 +0100
Subject: [PATCH 168/287] feat: Add round robin bucket assigner (#360)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |  2 +
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |  1 +
 fluss-rust/bindings/cpp/src/lib.rs            | 11 ++++
 fluss-rust/bindings/python/src/config.rs      | 11 ++++
 .../fluss/src/client/write/bucket_assigner.rs | 66 +++++++++++++++++++
 .../fluss/src/client/write/writer_client.rs   | 30 +++++++--
 fluss-rust/crates/fluss/src/config.rs         | 27 +++++++-
 .../user-guide/cpp/example/configuration.md   |  1 +
 .../python/example/configuration.md           | 21 +++---
 .../user-guide/rust/example/configuration.md  | 15 +++--
 10 files changed, 160 insertions(+), 25 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 6b56ba20bc..f17cafc1aa 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -979,6 +979,8 @@ struct Configuration {
     int32_t writer_retries{std::numeric_limits<int32_t>::max()};
     // Writer batch size in bytes (2 MB)
     int32_t writer_batch_size{2 * 1024 * 1024};
+    // Bucket assigner for tables without bucket keys: "sticky" or "round_robin"
+    std::string writer_bucket_no_key_assigner{"sticky"};
     // Number of remote log batches to prefetch during scanning
     size_t scanner_remote_log_prefetch_num{4};
     // Number of threads for downloading remote log data
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 370429bc97..a2e7fa2616 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -51,6 +51,7 @@ inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi_config.writer_acks = rust::String(config.writer_acks);
     ffi_config.writer_retries = config.writer_retries;
     ffi_config.writer_batch_size = config.writer_batch_size;
+    ffi_config.writer_bucket_no_key_assigner = rust::String(config.writer_bucket_no_key_assigner);
     ffi_config.scanner_remote_log_prefetch_num = config.scanner_remote_log_prefetch_num;
     ffi_config.remote_file_download_thread_num = config.remote_file_download_thread_num;
     ffi_config.scanner_log_max_poll_records = config.scanner_log_max_poll_records;
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 5a1b3dbdb8..9fbdc8ff1f 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -43,6 +43,7 @@ mod ffi {
         writer_acks: String,
         writer_retries: i32,
         writer_batch_size: i32,
+        writer_bucket_no_key_assigner: String,
         scanner_remote_log_prefetch_num: usize,
         remote_file_download_thread_num: usize,
         scanner_log_max_poll_records: usize,
@@ -607,12 +608,22 @@ fn err_from_core_error(e: &fcore::error::Error) -> ffi::FfiResult {
 
 // Connection implementation
 fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
+    let assigner_type = match config.writer_bucket_no_key_assigner.as_str() {
+        "round_robin" => fluss::config::NoKeyAssigner::RoundRobin,
+        "sticky" => fluss::config::NoKeyAssigner::Sticky,
+        other => {
+            return Err(format!(
+                "Unknown bucket assigner type: '{other}', expected 'sticky' or 'round_robin'"
+            ));
+        }
+    };
     let config = fluss::config::Config {
         bootstrap_servers: config.bootstrap_servers.to_string(),
         writer_request_max_size: config.writer_request_max_size,
         writer_acks: config.writer_acks.to_string(),
         writer_retries: config.writer_retries,
         writer_batch_size: config.writer_batch_size,
+        writer_bucket_no_key_assigner: assigner_type,
         scanner_remote_log_prefetch_num: config.scanner_remote_log_prefetch_num,
         remote_file_download_thread_num: config.remote_file_download_thread_num,
         scanner_log_max_poll_records: config.scanner_log_max_poll_records,
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index fdf90b7ee1..75056a5226 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -84,6 +84,17 @@ impl Config {
                                 ))
                             })?;
                     }
+                    "writer.bucket.no-key-assigner" => {
+                        config.writer_bucket_no_key_assigner = match value.as_str() {
+                            "round_robin" => fcore::config::NoKeyAssigner::RoundRobin,
+                            "sticky" => fcore::config::NoKeyAssigner::Sticky,
+                            other => {
+                                return Err(FlussError::new_err(format!(
+                                    "Unknown bucket assigner type: {other}, expected 'sticky' or 'round_robin'"
+                                )));
+                            }
+                        };
+                    }
                     _ => {
                         return Err(FlussError::new_err(format!("Unknown property: {key}")));
                     }
diff --git a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
index 7fcd20ba54..8ad38e3d42 100644
--- a/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
+++ b/fluss-rust/crates/fluss/src/client/write/bucket_assigner.rs
@@ -106,6 +106,44 @@ impl BucketAssigner for StickyBucketAssigner {
     }
 }
 
+/// A [BucketAssigner] that, unlike [StickyBucketAssigner], assigns each record to the next
+/// bucket in a rotating sequence, providing even data distribution across all buckets.
+pub struct RoundRobinBucketAssigner {
+    table_path: Arc<PhysicalTablePath>, // key for the per-record available-bucket lookup
+    num_buckets: i32, // modulus used when no available buckets are reported
+    counter: AtomicI32, // bumped once per assignment; starts at a random value
+}
+
+impl RoundRobinBucketAssigner {
+    pub fn new(table_path: Arc<PhysicalTablePath>, num_buckets: i32) -> Self {
+        let mut rng = rand::rng(); // source of the random initial counter value
+        Self {
+            table_path,
+            num_buckets,
+            counter: AtomicI32::new(rng.random()), // may be negative; assign_bucket masks the sign
+        }
+    }
+}
+
+impl BucketAssigner for RoundRobinBucketAssigner {
+    fn abort_if_batch_full(&self) -> bool {
+        false // constant; WriterClient forwards this flag to the accumulator's append call
+    }
+
+    fn on_new_batch(&self, _cluster: &Cluster, _prev_bucket_id: i32) {} // no-op
+
+    fn assign_bucket(&self, _bucket_key: Option<&Bytes>, cluster: &Cluster) -> Result<i32> {
+        let next_value = self.counter.fetch_add(1, Ordering::Relaxed); // wraps around on overflow
+        let available_buckets = cluster.get_available_buckets_for_table_path(&self.table_path);
+        if available_buckets.is_empty() {
+            Ok((next_value & i32::MAX) % self.num_buckets) // none available: rotate over all ids
+        } else {
+            let idx = (next_value & i32::MAX) % available_buckets.len() as i32; // mask keeps >= 0
+            Ok(available_buckets[idx as usize].bucket_id())
+        }
+    }
+}
+
 /// A [BucketAssigner] which assigns based on a modulo hashing function
 pub struct HashBucketAssigner {
     num_buckets: i32,
@@ -173,6 +211,34 @@ mod tests {
         assert!((0..2).contains(&next_bucket));
     }
 
+    #[test]
+    fn round_robin_assigner_cycles_through_buckets() {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let num_buckets = 3;
+        let cluster = build_cluster(&table_path, 1, num_buckets);
+        let physical = Arc::new(PhysicalTablePath::of(Arc::new(table_path)));
+        let assigner = RoundRobinBucketAssigner::new(physical, num_buckets);
+
+        let mut seen = Vec::new(); // bucket ids in the order they were assigned (two passes)
+        for _ in 0..(num_buckets * 2) {
+            let bucket = assigner.assign_bucket(None, &cluster).expect("bucket");
+            assert!((0..num_buckets).contains(&bucket));
+            seen.push(bucket);
+        }
+
+        // NOTE(review): period-3 check can fail if the random counter crosses 0 or wraps mid-loop.
+        assert_eq!(seen[0], seen[3]);
+        assert_eq!(seen[1], seen[4]);
+        assert_eq!(seen[2], seen[5]);
+    }
+
+    #[test]
+    fn round_robin_assigner_does_not_abort_on_batch_full() {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let physical = Arc::new(PhysicalTablePath::of(Arc::new(table_path)));
+        let assigner = RoundRobinBucketAssigner::new(physical, 3);
+        assert!(!assigner.abort_if_batch_full()); // the flag is a constant `false` for round-robin
+    }
+
     #[test]
     fn hash_bucket_assigner_requires_key() {
         let assigner = HashBucketAssigner::new(3, <dyn BucketingFunction>::of(None));
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index 41ef4bbb42..23f523c8bf 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -19,11 +19,12 @@ use crate::BucketId;
 use crate::bucketing::BucketingFunction;
 use crate::client::metadata::Metadata;
 use crate::client::write::bucket_assigner::{
-    BucketAssigner, HashBucketAssigner, StickyBucketAssigner,
+    BucketAssigner, HashBucketAssigner, RoundRobinBucketAssigner, StickyBucketAssigner,
 };
 use crate::client::write::sender::Sender;
 use crate::client::{RecordAccumulator, ResultHandle, WriteRecord};
 use crate::config::Config;
+use crate::config::NoKeyAssigner;
 use crate::error::{Error, Result};
 use crate::metadata::{PhysicalTablePath, TableInfo};
 use bytes::Bytes;
@@ -99,7 +100,12 @@ impl WriterClient {
         let (bucket_assigner, bucket_id) =
             self.assign_bucket(&record.table_info, bucket_key, physical_table_path)?;
 
-        let mut result = self.accumulate.append(record, bucket_id, &cluster, true)?;
+        let mut result = self.accumulate.append(
+            record,
+            bucket_id,
+            &cluster,
+            bucket_assigner.abort_if_batch_full(),
+        )?;
 
         if result.abort_record_for_new_batch {
             let prev_bucket_id = bucket_id;
@@ -125,10 +131,14 @@ impl WriterClient {
             if let Some(assigner) = self.bucket_assigners.get(table_path) {
                 assigner.clone()
             } else {
-                let assigner =
-                    Self::create_bucket_assigner(table_info, Arc::clone(table_path), bucket_key)?;
+                let assigner = Self::create_bucket_assigner(
+                    table_info,
+                    Arc::clone(table_path),
+                    bucket_key,
+                    &self.config,
+                )?;
                 self.bucket_assigners
-                    .insert(Arc::clone(table_path), Arc::clone(&assigner.clone()));
+                    .insert(Arc::clone(table_path), Arc::clone(&assigner));
                 assigner
             }
         };
@@ -164,6 +174,7 @@ impl WriterClient {
         table_info: &Arc<TableInfo>,
         table_path: Arc<PhysicalTablePath>,
         bucket_key: Option<&Bytes>,
+        config: &Config,
     ) -> Result<Arc<dyn BucketAssigner>> {
         if bucket_key.is_some() {
             let datalake_format = table_info.get_table_config().get_datalake_format()?;
@@ -173,8 +184,13 @@ impl WriterClient {
                 function,
             )))
         } else {
-            // TODO: Wire up toi use round robin/sticky according to ConfigOptions.CLIENT_WRITER_BUCKET_NO_KEY_ASSIGNER
-            Ok(Arc::new(StickyBucketAssigner::new(table_path)))
+            match config.writer_bucket_no_key_assigner {
+                NoKeyAssigner::Sticky => Ok(Arc::new(StickyBucketAssigner::new(table_path))),
+                NoKeyAssigner::RoundRobin => Ok(Arc::new(RoundRobinBucketAssigner::new(
+                    table_path,
+                    table_info.num_buckets,
+                ))),
+            }
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index ecf7e122b7..6ff4327f46 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -15,8 +15,9 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use clap::Parser;
+use clap::{Parser, ValueEnum};
 use serde::{Deserialize, Serialize};
+use std::fmt;
 
 const DEFAULT_BOOTSTRAP_SERVER: &str = "127.0.0.1:9123";
 const DEFAULT_REQUEST_MAX_SIZE: i32 = 10 * 1024 * 1024;
@@ -28,6 +29,26 @@ const DEFAULT_MAX_POLL_RECORDS: usize = 500;
 
 const DEFAULT_ACKS: &str = "all";
 
+/// Bucket assigner strategy for tables without bucket keys.
+/// Matches Java `client.writer.bucket.no-key-assigner`.
+#[derive(Debug, Clone, Copy, PartialEq, Eq, ValueEnum, Deserialize, Serialize)]
+#[serde(rename_all = "snake_case")] // NOTE(review): ValueEnum defaults to kebab-case ("round-robin" on the CLI) — confirm
+pub enum NoKeyAssigner {
+    /// Sticks to one bucket until the batch is full, then switches.
+    Sticky,
+    /// Assigns each record to the next bucket in a rotating sequence.
+    RoundRobin,
+}
+
+impl fmt::Display for NoKeyAssigner {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        f.write_str(match self {
+            Self::Sticky => "sticky", // same spellings the C++/Python bindings accept
+            Self::RoundRobin => "round_robin",
+        })
+    }
+}
+
 #[derive(Parser, Debug, Clone, Deserialize, Serialize)]
 #[command(author, version, about, long_about = None)]
 pub struct Config {
@@ -46,6 +67,9 @@ pub struct Config {
     #[arg(long, default_value_t = DEFAULT_WRITER_BATCH_SIZE)]
     pub writer_batch_size: i32,
 
+    #[arg(long, value_enum, default_value_t = NoKeyAssigner::Sticky)]
+    pub writer_bucket_no_key_assigner: NoKeyAssigner,
+
     /// Maximum number of remote log segments to prefetch
     /// Default: 4 (matching Java CLIENT_SCANNER_REMOTE_LOG_PREFETCH_NUM)
     #[arg(long, default_value_t = DEFAULT_PREFETCH_NUM)]
@@ -70,6 +94,7 @@ impl Default for Config {
             writer_acks: String::from(DEFAULT_ACKS),
             writer_retries: i32::MAX,
             writer_batch_size: DEFAULT_WRITER_BATCH_SIZE,
+            writer_bucket_no_key_assigner: NoKeyAssigner::Sticky,
             scanner_remote_log_prefetch_num: DEFAULT_PREFETCH_NUM,
             remote_file_download_thread_num: DEFAULT_DOWNLOAD_THREADS,
             scanner_log_max_poll_records: DEFAULT_MAX_POLL_RECORDS,
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
index 518a5845ff..715e3c63fd 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
@@ -30,6 +30,7 @@ config.writer_request_max_size = 10 * 1024 * 1024;     // Max request size (10 M
 config.writer_acks = "all";                      // Wait for all replicas
 config.writer_retries = std::numeric_limits<int32_t>::max();  // Retry on failure
 config.writer_batch_size = 2 * 1024 * 1024;     // Batch size (2 MB)
+config.writer_bucket_no_key_assigner = "sticky"; // "sticky" or "round_robin"
 config.scanner_remote_log_prefetch_num = 4;      // Remote log prefetch count
 config.remote_file_download_thread_num = 3;  // Download threads
 ```
diff --git a/fluss-rust/website/docs/user-guide/python/example/configuration.md b/fluss-rust/website/docs/user-guide/python/example/configuration.md
index f2828c4f90..466bf0dd38 100644
--- a/fluss-rust/website/docs/user-guide/python/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/python/example/configuration.md
@@ -21,16 +21,17 @@ with await fluss.FlussConnection.create(config) as conn:
 
 ## Connection Configurations
 
-| Key                 | Description                                           | Default            |
-|---------------------|-------------------------------------------------------|--------------------|
-| `bootstrap.servers` | Coordinator server address                            | `127.0.0.1:9123`   |
-| `writer.request-max-size`  | Maximum request size in bytes                  | `10485760` (10 MB) |
-| `writer.acks`       | Acknowledgment setting (`all` waits for all replicas) | `all`              |
-| `writer.retries`    | Number of retries on failure                          | `2147483647`       |
-| `writer.batch-size` | Batch size for writes in bytes                        | `2097152` (2 MB)   |
-| `scanner.remote-log.prefetch-num` | Number of remote log segments to prefetch | `4`                |
-| `remote-file.download-thread-num` | Number of threads for remote log downloads | `3`               |
-| `scanner.log.max-poll-records` | Max records returned in a single poll()       | `500`              |
+| Key                                | Description                                                                          | Default            |
+|------------------------------------|--------------------------------------------------------------------------------------|--------------------|
+| `bootstrap.servers`               | Coordinator server address                                                            | `127.0.0.1:9123`   |
+| `writer.request-max-size`         | Maximum request size in bytes                                                         | `10485760` (10 MB) |
+| `writer.acks`                     | Acknowledgment setting (`all` waits for all replicas)                                 | `all`              |
+| `writer.retries`                  | Number of retries on failure                                                          | `2147483647`       |
+| `writer.batch-size`               | Batch size for writes in bytes                                                        | `2097152` (2 MB)   |
+| `writer.bucket.no-key-assigner`   | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin`  | `sticky`           |
+| `scanner.remote-log.prefetch-num` | Number of remote log segments to prefetch                                             | `4`                |
+| `remote-file.download-thread-num` | Number of threads for remote log downloads                                            | `3`                |
+| `scanner.log.max-poll-records`    | Max records returned in a single poll()                                               | `500`              |
 
 Remember to close the connection when done:
 
diff --git a/fluss-rust/website/docs/user-guide/rust/example/configuration.md b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
index a84c24dcad..92b9bf2f1d 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
@@ -17,10 +17,11 @@ let conn = FlussConnection::new(config).await?;
 
 ## Connection Configurations
 
-| Option                    | Description                                           | Default          |
-|---------------------------|-------------------------------------------------------|------------------|
-| `bootstrap_servers`       | Coordinator server address                            | `127.0.0.1:9123` |
-| `writer_request_max_size` | Maximum request size in bytes                         | 10 MB            |
-| `writer_acks`             | Acknowledgment setting (`all` waits for all replicas) | `all`            |
-| `writer_retries`          | Number of retries on failure                          | `i32::MAX`       |
-| `writer_batch_size`       | Batch size for writes                                 | 2 MB             |
+| Option                          | Description                                                                          | Default          |
+|---------------------------------|--------------------------------------------------------------------------------------|------------------|
+| `bootstrap_servers`             | Coordinator server address                                                           | `127.0.0.1:9123` |
+| `writer_request_max_size`       | Maximum request size in bytes                                                        | 10 MB            |
+| `writer_acks`                   | Acknowledgment setting (`all` waits for all replicas)                                | `all`            |
+| `writer_retries`                | Number of retries on failure                                                         | `i32::MAX`       |
+| `writer_batch_size`             | Batch size for writes                                                                | 2 MB             |
+| `writer_bucket_no_key_assigner` | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`         |

From 81b06aed4a47be29014d8c4301d0ee186e6cf673 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Fri, 27 Feb 2026 01:58:28 +0000
Subject: [PATCH 169/287] chore: Fix panic / crashes in Rust and C++ (#365)

---
 fluss-rust/bindings/cpp/src/lib.rs            |  80 +--
 fluss-rust/bindings/cpp/src/types.rs          |  34 +-
 fluss-rust/bindings/python/src/table.rs       |  56 ++-
 .../crates/examples/src/example_kv_table.rs   |   8 +-
 .../src/example_partitioned_kv_table.rs       |  10 +-
 .../crates/examples/src/example_table.rs      |   6 +-
 .../crates/fluss/src/client/table/append.rs   |  17 +
 .../src/client/table/partition_getter.rs      |   2 +-
 .../crates/fluss/src/client/table/scanner.rs  |  10 +-
 .../crates/fluss/src/client/table/upsert.rs   |   2 +-
 fluss-rust/crates/fluss/src/record/arrow.rs   |   2 +-
 .../fluss/src/record/kv/kv_record_batch.rs    |   2 +-
 .../src/record/kv/kv_record_batch_builder.rs  |   8 +-
 fluss-rust/crates/fluss/src/row/column.rs     | 465 ++++++++++--------
 .../fluss/src/row/compacted/compacted_row.rs  | 105 ++--
 .../src/row/encode/compacted_key_encoder.rs   |   2 +-
 .../crates/fluss/src/row/field_getter.rs      |  45 +-
 fluss-rust/crates/fluss/src/row/mod.rs        | 231 ++++++---
 .../crates/fluss/src/row/row_decoder.rs       |   8 +-
 .../fluss/tests/integration/kv_table.rs       | 266 ++++++----
 .../fluss/tests/integration/log_table.rs      | 200 ++++++--
 .../tests/integration/table_remote_scan.rs    |  14 +-
 22 files changed, 977 insertions(+), 596 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 9fbdc8ff1f..32dbf7d030 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -1784,7 +1784,7 @@ mod row_reader {
         allowed: impl FnOnce(&fcore::metadata::DataType) -> bool,
     ) -> Result<&'a fcore::metadata::DataType, String> {
         let col = get_column(columns, field)?;
-        if row.is_null_at(field) {
+        if row.is_null_at(field).map_err(|e| e.to_string())? {
             return Err(format!("field {field} is null"));
         }
         let dt = col.data_type();
@@ -1812,7 +1812,7 @@ mod row_reader {
         field: usize,
     ) -> Result<bool, String> {
         get_column(columns, field)?;
-        Ok(row.is_null_at(field))
+        row.is_null_at(field).map_err(|e| e.to_string())
     }
 
     pub fn get_bool(
@@ -1823,7 +1823,7 @@ mod row_reader {
         validate(row, columns, field, "get_bool", |dt| {
             matches!(dt, fcore::metadata::DataType::Boolean(_))
         })?;
-        Ok(row.get_boolean(field))
+        row.get_boolean(field).map_err(|e| e.to_string())
     }
 
     pub fn get_i32(
@@ -1839,11 +1839,17 @@ mod row_reader {
                     | fcore::metadata::DataType::Int(_)
             )
         })?;
-        Ok(match dt {
-            fcore::metadata::DataType::TinyInt(_) => row.get_byte(field) as i32,
-            fcore::metadata::DataType::SmallInt(_) => row.get_short(field) as i32,
-            _ => row.get_int(field),
-        })
+        match dt {
+            fcore::metadata::DataType::TinyInt(_) => row
+                .get_byte(field)
+                .map(|v| v as i32)
+                .map_err(|e| e.to_string()),
+            fcore::metadata::DataType::SmallInt(_) => row
+                .get_short(field)
+                .map(|v| v as i32)
+                .map_err(|e| e.to_string()),
+            _ => row.get_int(field).map_err(|e| e.to_string()),
+        }
     }
 
     pub fn get_i64(
@@ -1854,7 +1860,7 @@ mod row_reader {
         validate(row, columns, field, "get_i64", |dt| {
             matches!(dt, fcore::metadata::DataType::BigInt(_))
         })?;
-        Ok(row.get_long(field))
+        row.get_long(field).map_err(|e| e.to_string())
     }
 
     pub fn get_f32(
@@ -1865,7 +1871,7 @@ mod row_reader {
         validate(row, columns, field, "get_f32", |dt| {
             matches!(dt, fcore::metadata::DataType::Float(_))
         })?;
-        Ok(row.get_float(field))
+        row.get_float(field).map_err(|e| e.to_string())
     }
 
     pub fn get_f64(
@@ -1876,7 +1882,7 @@ mod row_reader {
         validate(row, columns, field, "get_f64", |dt| {
             matches!(dt, fcore::metadata::DataType::Double(_))
         })?;
-        Ok(row.get_double(field))
+        row.get_double(field).map_err(|e| e.to_string())
     }
 
     pub fn get_str<'a>(
@@ -1890,10 +1896,12 @@ mod row_reader {
                 fcore::metadata::DataType::Char(_) | fcore::metadata::DataType::String(_)
             )
         })?;
-        Ok(match dt {
-            fcore::metadata::DataType::Char(ct) => row.get_char(field, ct.length() as usize),
-            _ => row.get_string(field),
-        })
+        match dt {
+            fcore::metadata::DataType::Char(ct) => row
+                .get_char(field, ct.length() as usize)
+                .map_err(|e| e.to_string()),
+            _ => row.get_string(field).map_err(|e| e.to_string()),
+        }
     }
 
     pub fn get_bytes<'a>(
@@ -1907,10 +1915,12 @@ mod row_reader {
                 fcore::metadata::DataType::Binary(_) | fcore::metadata::DataType::Bytes(_)
             )
         })?;
-        Ok(match dt {
-            fcore::metadata::DataType::Binary(bt) => row.get_binary(field, bt.length()),
-            _ => row.get_bytes(field),
-        })
+        match dt {
+            fcore::metadata::DataType::Binary(bt) => row
+                .get_binary(field, bt.length())
+                .map_err(|e| e.to_string()),
+            _ => row.get_bytes(field).map_err(|e| e.to_string()),
+        }
     }
 
     pub fn get_date_days(
@@ -1921,7 +1931,9 @@ mod row_reader {
         validate(row, columns, field, "get_date_days", |dt| {
             matches!(dt, fcore::metadata::DataType::Date(_))
         })?;
-        Ok(row.get_date(field).get_inner())
+        row.get_date(field)
+            .map(|d| d.get_inner())
+            .map_err(|e| e.to_string())
     }
 
     pub fn get_time_millis(
@@ -1932,7 +1944,9 @@ mod row_reader {
         validate(row, columns, field, "get_time_millis", |dt| {
             matches!(dt, fcore::metadata::DataType::Time(_))
         })?;
-        Ok(row.get_time(field).get_inner())
+        row.get_time(field)
+            .map(|t| t.get_inner())
+            .map_err(|e| e.to_string())
     }
 
     pub fn get_ts_millis(
@@ -1948,12 +1962,14 @@ mod row_reader {
             )
         })?;
         match dt {
-            fcore::metadata::DataType::TimestampLTz(ts) => Ok(row
+            fcore::metadata::DataType::TimestampLTz(ts) => row
                 .get_timestamp_ltz(field, ts.precision())
-                .get_epoch_millisecond()),
-            fcore::metadata::DataType::Timestamp(ts) => Ok(row
+                .map(|v| v.get_epoch_millisecond())
+                .map_err(|e| e.to_string()),
+            fcore::metadata::DataType::Timestamp(ts) => row
                 .get_timestamp_ntz(field, ts.precision())
-                .get_millisecond()),
+                .map(|v| v.get_millisecond())
+                .map_err(|e| e.to_string()),
             dt => Err(format!("get_ts_millis: unexpected type {dt}")),
         }
     }
@@ -1971,12 +1987,14 @@ mod row_reader {
             )
         })?;
         match dt {
-            fcore::metadata::DataType::TimestampLTz(ts) => Ok(row
+            fcore::metadata::DataType::TimestampLTz(ts) => row
                 .get_timestamp_ltz(field, ts.precision())
-                .get_nano_of_millisecond()),
-            fcore::metadata::DataType::Timestamp(ts) => Ok(row
+                .map(|v| v.get_nano_of_millisecond())
+                .map_err(|e| e.to_string()),
+            fcore::metadata::DataType::Timestamp(ts) => row
                 .get_timestamp_ntz(field, ts.precision())
-                .get_nano_of_millisecond()),
+                .map(|v| v.get_nano_of_millisecond())
+                .map_err(|e| e.to_string()),
             dt => Err(format!("get_ts_nanos: unexpected type {dt}")),
         }
     }
@@ -1998,7 +2016,9 @@ mod row_reader {
         })?;
         match dt {
             fcore::metadata::DataType::Decimal(dd) => {
-                let decimal = row.get_decimal(field, dd.precision() as usize, dd.scale() as usize);
+                let decimal = row
+                    .get_decimal(field, dd.precision() as usize, dd.scale() as usize)
+                    .map_err(|e| e.to_string())?;
                 Ok(decimal.to_big_decimal().to_string())
             }
             dt => Err(format!("get_decimal_str: unexpected type {dt}")),
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 073a16817f..f8efe677f4 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -371,42 +371,42 @@ pub fn compacted_row_to_owned(
     let mut out = fcore::row::GenericRow::new(columns.len());
 
     for (i, col) in columns.iter().enumerate() {
-        if row.is_null_at(i) {
+        if row.is_null_at(i)? {
             out.set_field(i, Datum::Null);
             continue;
         }
 
         let datum = match col.data_type() {
-            fcore::metadata::DataType::Boolean(_) => Datum::Bool(row.get_boolean(i)),
-            fcore::metadata::DataType::TinyInt(_) => Datum::Int8(row.get_byte(i)),
-            fcore::metadata::DataType::SmallInt(_) => Datum::Int16(row.get_short(i)),
-            fcore::metadata::DataType::Int(_) => Datum::Int32(row.get_int(i)),
-            fcore::metadata::DataType::BigInt(_) => Datum::Int64(row.get_long(i)),
-            fcore::metadata::DataType::Float(_) => Datum::Float32(row.get_float(i).into()),
-            fcore::metadata::DataType::Double(_) => Datum::Float64(row.get_double(i).into()),
+            fcore::metadata::DataType::Boolean(_) => Datum::Bool(row.get_boolean(i)?),
+            fcore::metadata::DataType::TinyInt(_) => Datum::Int8(row.get_byte(i)?),
+            fcore::metadata::DataType::SmallInt(_) => Datum::Int16(row.get_short(i)?),
+            fcore::metadata::DataType::Int(_) => Datum::Int32(row.get_int(i)?),
+            fcore::metadata::DataType::BigInt(_) => Datum::Int64(row.get_long(i)?),
+            fcore::metadata::DataType::Float(_) => Datum::Float32(row.get_float(i)?.into()),
+            fcore::metadata::DataType::Double(_) => Datum::Float64(row.get_double(i)?.into()),
             fcore::metadata::DataType::String(_) => {
-                Datum::String(Cow::Owned(row.get_string(i).to_string()))
+                Datum::String(Cow::Owned(row.get_string(i)?.to_string()))
             }
             fcore::metadata::DataType::Bytes(_) => {
-                Datum::Blob(Cow::Owned(row.get_bytes(i).to_vec()))
+                Datum::Blob(Cow::Owned(row.get_bytes(i)?.to_vec()))
             }
-            fcore::metadata::DataType::Date(_) => Datum::Date(row.get_date(i)),
-            fcore::metadata::DataType::Time(_) => Datum::Time(row.get_time(i)),
+            fcore::metadata::DataType::Date(_) => Datum::Date(row.get_date(i)?),
+            fcore::metadata::DataType::Time(_) => Datum::Time(row.get_time(i)?),
             fcore::metadata::DataType::Timestamp(dt) => {
-                Datum::TimestampNtz(row.get_timestamp_ntz(i, dt.precision()))
+                Datum::TimestampNtz(row.get_timestamp_ntz(i, dt.precision())?)
             }
             fcore::metadata::DataType::TimestampLTz(dt) => {
-                Datum::TimestampLtz(row.get_timestamp_ltz(i, dt.precision()))
+                Datum::TimestampLtz(row.get_timestamp_ltz(i, dt.precision())?)
             }
             fcore::metadata::DataType::Decimal(dt) => {
-                let decimal = row.get_decimal(i, dt.precision() as usize, dt.scale() as usize);
+                let decimal = row.get_decimal(i, dt.precision() as usize, dt.scale() as usize)?;
                 Datum::Decimal(decimal)
             }
             fcore::metadata::DataType::Char(dt) => Datum::String(Cow::Owned(
-                row.get_char(i, dt.length() as usize).to_string(),
+                row.get_char(i, dt.length() as usize)?.to_string(),
             )),
             fcore::metadata::DataType::Binary(dt) => {
-                Datum::Blob(Cow::Owned(row.get_binary(i, dt.length()).to_vec()))
+                Datum::Blob(Cow::Owned(row.get_binary(i, dt.length())?.to_vec()))
             }
             other => return Err(anyhow!("Unsupported data type for column {i}: {other:?}")),
         };
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index bc2e956c1a..660cd6be16 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -1256,91 +1256,119 @@ pub fn datum_to_python_value(
     use fcore::metadata::DataType;
 
     // Check for null first
-    if row.is_null_at(pos) {
+    if row
+        .is_null_at(pos)
+        .map_err(|e| FlussError::from_core_error(&e))?
+    {
         return Ok(py.None());
     }
 
     match data_type {
         DataType::Boolean(_) => Ok(row
             .get_boolean(pos)
+            .map_err(|e| FlussError::from_core_error(&e))?
             .into_pyobject(py)?
             .to_owned()
             .into_any()
             .unbind()),
         DataType::TinyInt(_) => Ok(row
             .get_byte(pos)
+            .map_err(|e| FlussError::from_core_error(&e))?
             .into_pyobject(py)?
             .to_owned()
             .into_any()
             .unbind()),
         DataType::SmallInt(_) => Ok(row
             .get_short(pos)
+            .map_err(|e| FlussError::from_core_error(&e))?
             .into_pyobject(py)?
             .to_owned()
             .into_any()
             .unbind()),
         DataType::Int(_) => Ok(row
             .get_int(pos)
+            .map_err(|e| FlussError::from_core_error(&e))?
             .into_pyobject(py)?
             .to_owned()
             .into_any()
             .unbind()),
         DataType::BigInt(_) => Ok(row
             .get_long(pos)
+            .map_err(|e| FlussError::from_core_error(&e))?
             .into_pyobject(py)?
             .to_owned()
             .into_any()
             .unbind()),
         DataType::Float(_) => Ok(row
             .get_float(pos)
+            .map_err(|e| FlussError::from_core_error(&e))?
             .into_pyobject(py)?
             .to_owned()
             .into_any()
             .unbind()),
         DataType::Double(_) => Ok(row
             .get_double(pos)
+            .map_err(|e| FlussError::from_core_error(&e))?
             .into_pyobject(py)?
             .to_owned()
             .into_any()
             .unbind()),
         DataType::String(_) => {
-            let s = row.get_string(pos);
+            let s = row
+                .get_string(pos)
+                .map_err(|e| FlussError::from_core_error(&e))?;
             Ok(s.into_pyobject(py)?.into_any().unbind())
         }
         DataType::Char(char_type) => {
-            let s = row.get_char(pos, char_type.length() as usize);
+            let s = row
+                .get_char(pos, char_type.length() as usize)
+                .map_err(|e| FlussError::from_core_error(&e))?;
             Ok(s.into_pyobject(py)?.into_any().unbind())
         }
         DataType::Bytes(_) => {
-            let b = row.get_bytes(pos);
+            let b = row
+                .get_bytes(pos)
+                .map_err(|e| FlussError::from_core_error(&e))?;
             Ok(PyBytes::new(py, b).into_any().unbind())
         }
         DataType::Binary(binary_type) => {
-            let b = row.get_binary(pos, binary_type.length());
+            let b = row
+                .get_binary(pos, binary_type.length())
+                .map_err(|e| FlussError::from_core_error(&e))?;
             Ok(PyBytes::new(py, b).into_any().unbind())
         }
         DataType::Decimal(decimal_type) => {
-            let decimal = row.get_decimal(
-                pos,
-                decimal_type.precision() as usize,
-                decimal_type.scale() as usize,
-            );
+            let decimal = row
+                .get_decimal(
+                    pos,
+                    decimal_type.precision() as usize,
+                    decimal_type.scale() as usize,
+                )
+                .map_err(|e| FlussError::from_core_error(&e))?;
             rust_decimal_to_python(py, &decimal)
         }
         DataType::Date(_) => {
-            let date = row.get_date(pos);
+            let date = row
+                .get_date(pos)
+                .map_err(|e| FlussError::from_core_error(&e))?;
             rust_date_to_python(py, date)
         }
         DataType::Time(_) => {
-            let time = row.get_time(pos);
+            let time = row
+                .get_time(pos)
+                .map_err(|e| FlussError::from_core_error(&e))?;
             rust_time_to_python(py, time)
         }
         DataType::Timestamp(ts_type) => {
-            let ts = row.get_timestamp_ntz(pos, ts_type.precision());
+            let ts = row
+                .get_timestamp_ntz(pos, ts_type.precision())
+                .map_err(|e| FlussError::from_core_error(&e))?;
             rust_timestamp_ntz_to_python(py, ts)
         }
         DataType::TimestampLTz(ts_type) => {
-            let ts = row.get_timestamp_ltz(pos, ts_type.precision());
+            let ts = row
+                .get_timestamp_ltz(pos, ts_type.precision())
+                .map_err(|e| FlussError::from_core_error(&e))?;
             rust_timestamp_ltz_to_python(py, ts)
         }
         _ => Err(FlussError::new_err(format!(
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 90788b1401..8fb60baa24 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -75,8 +75,8 @@ pub async fn main() -> Result<()> {
         let row = result.get_single_row()?.unwrap();
         println!(
             "Found id={id}: name={}, age={}",
-            row.get_string(1),
-            row.get_long(2)
+            row.get_string(1)?,
+            row.get_long(2)?
         );
     }
 
@@ -92,8 +92,8 @@ pub async fn main() -> Result<()> {
     let row = result.get_single_row()?.unwrap();
     println!(
         "Verified update: name={}, age={}",
-        row.get_string(1),
-        row.get_long(2)
+        row.get_string(1)?,
+        row.get_long(2)?
     );
 
     println!("\n=== Deleting ===");
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index e0471785d2..9cd2e7df86 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -90,9 +90,9 @@ pub async fn main() -> Result<()> {
         let row = result.get_single_row()?.unwrap();
         println!(
             "Found id={id}: region={}, zone={}, score={}",
-            row.get_string(1),
-            row.get_long(2),
-            row.get_long(3)
+            row.get_string(1)?,
+            row.get_long(2)?,
+            row.get_long(3)?
         );
     }
 
@@ -109,8 +109,8 @@ pub async fn main() -> Result<()> {
     let row = result.get_single_row()?.unwrap();
     println!(
         "Verified update: region={}, zone={}",
-        row.get_string(1),
-        row.get_long(2)
+        row.get_string(1)?,
+        row.get_long(2)?
     );
 
     println!("\n=== Deleting ===");
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index cfe1627b24..e4ad1fbdfc 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -83,9 +83,9 @@ pub async fn main() -> Result<()> {
             let row = record.row();
             println!(
                 "{{{}, {}, {}}}@{}",
-                row.get_int(0),
-                row.get_string(1),
-                row.get_long(2),
+                row.get_int(0)?,
+                row.get_string(1)?,
+                row.get_long(2)?,
                 record.offset()
             );
         }
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
index 942253fa19..a58433f386 100644
--- a/fluss-rust/crates/fluss/src/client/table/append.rs
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -17,6 +17,7 @@
 
 use crate::client::table::partition_getter::{PartitionGetter, get_physical_path};
 use crate::client::{WriteRecord, WriteResultFuture, WriterClient};
+use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::metadata::{PhysicalTablePath, TableInfo, TablePath};
 use crate::row::{ColumnarRow, InternalRow};
@@ -69,6 +70,21 @@ pub struct AppendWriter {
 }
 
 impl AppendWriter {
+    /// Returns `IllegalArgument` when `row`'s field count differs from the table schema's.
+    fn check_field_count<R: InternalRow>(&self, row: &R) -> Result<()> {
+        let expected = self.table_info.get_row_type().fields().len();
+        let actual = row.get_field_count();
+        if actual == expected {
+            return Ok(());
+        }
+        Err(IllegalArgument {
+            message: format!(
+                "The field count of the row does not match the table schema. \
+                 Expected: {expected}, Actual: {actual}"
+            ),
+        })
+    }
+
     /// Appends a row to the table.
     ///
     /// This method returns a [`WriteResultFuture`] immediately after queueing the write,
@@ -81,6 +97,7 @@ impl AppendWriter {
     /// A [`WriteResultFuture`] that can be awaited to wait for server acknowledgment,
     /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
     pub fn append<R: InternalRow>(&self, row: &R) -> Result<WriteResultFuture> {
+        self.check_field_count(row)?;
         let physical_table_path = Arc::new(get_physical_path(
             &self.table_path,
             self.partition_getter.as_ref(),
diff --git a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
index a1aad2d83e..1115ded3bd 100644
--- a/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
+++ b/fluss-rust/crates/fluss/src/client/table/partition_getter.rs
@@ -87,7 +87,7 @@ impl PartitionGetter {
         let mut partition_values = Vec::with_capacity(self.partitions.len());
 
         for (data_type, field_getter) in &self.partitions {
-            let value = field_getter.get_field(row);
+            let value = field_getter.get_field(row)?;
             if value.is_null() {
                 return Err(IllegalArgument {
                     message: "Partition value shouldn't be null.".to_string(),
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 4b6f809567..3ec9106d66 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -114,9 +114,9 @@ impl<'a> TableScan<'a> {
     ///         let row = record.row();
     ///         println!(
     ///             "{{{}, {}, {}}}@{}",
-    ///             row.get_int(0),
-    ///             row.get_string(2),
-    ///             row.get_string(3),
+    ///             row.get_int(0)?,
+    ///             row.get_string(2)?,
+    ///             row.get_string(3)?,
     ///             record.offset()
     ///         );
     ///     }
@@ -188,8 +188,8 @@ impl<'a> TableScan<'a> {
     ///         let row = record.row();
     ///         println!(
     ///             "{{{}, {}}}@{}",
-    ///             row.get_int(0),
-    ///             row.get_string(1),
+    ///             row.get_int(0)?,
+    ///             row.get_string(1)?,
     ///             record.offset()
     ///         );
     ///     }
diff --git a/fluss-rust/crates/fluss/src/client/table/upsert.rs b/fluss-rust/crates/fluss/src/client/table/upsert.rs
index 7057b9013d..52ec37b37b 100644
--- a/fluss-rust/crates/fluss/src/client/table/upsert.rs
+++ b/fluss-rust/crates/fluss/src/client/table/upsert.rs
@@ -328,7 +328,7 @@ impl UpsertWriter {
         })?;
         encoder.start_new_row()?;
         for (pos, field_getter) in self.field_getters.iter().enumerate() {
-            let datum = field_getter.get_field(row);
+            let datum = field_getter.get_field(row)?;
             encoder.encode_field(pos, datum)?;
         }
         encoder.finish_row()
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 7fb9d34a0e..ea27836e52 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -355,7 +355,7 @@ impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
 
     fn append(&mut self, row: &dyn InternalRow) -> Result<bool> {
         for (idx, getter) in self.field_getters.iter().enumerate() {
-            let datum = getter.get_field(row);
+            let datum = getter.get_field(row)?;
             let field_type = self.table_schema.field(idx).data_type();
             let builder =
                 self.arrow_column_builders
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
index eb89d69cda..14ff2e91b4 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch.rs
@@ -445,7 +445,7 @@ mod tests {
         assert_eq!(record1.key().as_ref(), key1);
         assert!(!record1.is_deletion());
         let row1 = record1.row(&*decoder).unwrap();
-        assert_eq!(row1.get_bytes(0), &[1, 2, 3, 4, 5]);
+        assert_eq!(row1.get_bytes(0).unwrap(), &[1, 2, 3, 4, 5]);
 
         let record2 = iter.next().unwrap().unwrap();
         assert_eq!(record2.key().as_ref(), key2);
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
index 837076482e..0e806337fd 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_batch_builder.rs
@@ -555,14 +555,14 @@ mod tests {
                 1 => {
                     assert_eq!(rec.key().as_ref(), key1);
                     let row = rec.row(&*decoder).unwrap();
-                    assert_eq!(row.get_int(0), 42);
-                    assert_eq!(row.get_string(1), "hello");
+                    assert_eq!(row.get_int(0)?, 42);
+                    assert_eq!(row.get_string(1)?, "hello");
                 }
                 2 => {
                     assert_eq!(rec.key().as_ref(), key2);
                     let row = rec.row(&*decoder).unwrap();
-                    assert_eq!(row.get_int(0), 100);
-                    assert_eq!(row.get_string(1), "world");
+                    assert_eq!(row.get_int(0)?, 100);
+                    assert_eq!(row.get_string(1)?, "world");
                 }
                 3 => {
                     assert_eq!(rec.key().as_ref(), key3);
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 50db32b14d..c07fe97c5c 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -15,15 +15,17 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
 use crate::row::InternalRow;
-use arrow::array::{
-    Array, AsArray, BinaryArray, Date32Array, Decimal128Array, FixedSizeBinaryArray, Float32Array,
-    Float64Array, Int8Array, Int16Array, Int32Array, Int64Array, RecordBatch, StringArray,
-    Time32MillisecondArray, Time32SecondArray, Time64MicrosecondArray, Time64NanosecondArray,
-    TimestampMicrosecondArray, TimestampMillisecondArray, TimestampNanosecondArray,
-    TimestampSecondArray,
+use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
+use arrow::array::{Array, AsArray, BinaryArray, RecordBatch, StringArray};
+use arrow::datatypes::{
+    DataType as ArrowDataType, Date32Type, Decimal128Type, Float32Type, Float64Type, Int8Type,
+    Int16Type, Int32Type, Int64Type, Time32MillisecondType, Time32SecondType,
+    Time64MicrosecondType, Time64NanosecondType, TimeUnit, TimestampMicrosecondType,
+    TimestampMillisecondType, TimestampNanosecondType, TimestampSecondType,
 };
-use arrow::datatypes::{DataType as ArrowDataType, TimeUnit};
 use std::sync::Arc;
 
 #[derive(Clone)]
@@ -59,6 +61,18 @@ impl ColumnarRow {
         &self.record_batch
     }
 
+    fn column(&self, pos: usize) -> Result<&Arc<dyn Array>> {
+        self.record_batch
+            .columns()
+            .get(pos)
+            .ok_or_else(|| IllegalArgument {
+                message: format!(
+                    "column index {pos} out of bounds (batch has {} columns)",
+                    self.record_batch.num_columns()
+                ),
+            })
+    }
+
     /// Generic helper to read timestamp from Arrow, handling all TimeUnit conversions.
     /// Like Java, the precision parameter is ignored - conversion is determined by Arrow TimeUnit.
     fn read_timestamp_from_arrow<T>(
@@ -66,114 +80,133 @@ impl ColumnarRow {
         pos: usize,
         _precision: u32,
         construct_compact: impl FnOnce(i64) -> T,
-        construct_with_nanos: impl FnOnce(i64, i32) -> crate::error::Result<T>,
-    ) -> T {
-        let schema = self.record_batch.schema();
-        let arrow_field = schema.field(pos);
-        let column = self.record_batch.column(pos);
-
-        // Read value based on the actual Arrow timestamp type
-        let value = match arrow_field.data_type() {
-            ArrowDataType::Timestamp(TimeUnit::Second, _) => column
-                .as_any()
-                .downcast_ref::<TimestampSecondArray>()
-                .expect("Expected TimestampSecondArray")
-                .value(self.row_id),
-            ArrowDataType::Timestamp(TimeUnit::Millisecond, _) => column
-                .as_any()
-                .downcast_ref::<TimestampMillisecondArray>()
-                .expect("Expected TimestampMillisecondArray")
-                .value(self.row_id),
-            ArrowDataType::Timestamp(TimeUnit::Microsecond, _) => column
-                .as_any()
-                .downcast_ref::<TimestampMicrosecondArray>()
-                .expect("Expected TimestampMicrosecondArray")
-                .value(self.row_id),
-            ArrowDataType::Timestamp(TimeUnit::Nanosecond, _) => column
-                .as_any()
-                .downcast_ref::<TimestampNanosecondArray>()
-                .expect("Expected TimestampNanosecondArray")
-                .value(self.row_id),
-            other => panic!("Expected Timestamp column at position {pos}, got {other:?}"),
+        construct_with_nanos: impl FnOnce(i64, i32) -> Result<T>,
+    ) -> Result<T> {
+        let column = self.column(pos)?;
+
+        // Read value and time unit based on the actual Arrow timestamp type
+        let (value, time_unit) = match column.data_type() {
+            ArrowDataType::Timestamp(TimeUnit::Second, _) => (
+                column
+                    .as_primitive_opt::<TimestampSecondType>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!("expected TimestampSecondArray at position {pos}"),
+                    })?
+                    .value(self.row_id),
+                TimeUnit::Second,
+            ),
+            ArrowDataType::Timestamp(TimeUnit::Millisecond, _) => (
+                column
+                    .as_primitive_opt::<TimestampMillisecondType>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!("expected TimestampMillisecondArray at position {pos}"),
+                    })?
+                    .value(self.row_id),
+                TimeUnit::Millisecond,
+            ),
+            ArrowDataType::Timestamp(TimeUnit::Microsecond, _) => (
+                column
+                    .as_primitive_opt::<TimestampMicrosecondType>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!("expected TimestampMicrosecondArray at position {pos}"),
+                    })?
+                    .value(self.row_id),
+                TimeUnit::Microsecond,
+            ),
+            ArrowDataType::Timestamp(TimeUnit::Nanosecond, _) => (
+                column
+                    .as_primitive_opt::<TimestampNanosecondType>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!("expected TimestampNanosecondArray at position {pos}"),
+                    })?
+                    .value(self.row_id),
+                TimeUnit::Nanosecond,
+            ),
+            other => {
+                return Err(IllegalArgument {
+                    message: format!("expected Timestamp column at position {pos}, got {other:?}"),
+                });
+            }
         };
 
         // Convert based on Arrow TimeUnit
-        let (millis, nanos) = match arrow_field.data_type() {
-            ArrowDataType::Timestamp(time_unit, _) => match time_unit {
-                TimeUnit::Second => (value * 1000, 0),
-                TimeUnit::Millisecond => (value, 0),
-                TimeUnit::Microsecond => {
-                    // Use Euclidean division so that nanos is always non-negative,
-                    // even for timestamps before the Unix epoch.
-                    let millis = value.div_euclid(1000);
-                    let nanos = (value.rem_euclid(1000) * 1000) as i32;
-                    (millis, nanos)
-                }
-                TimeUnit::Nanosecond => {
-                    // Use Euclidean division so that nanos is always in [0, 999_999].
-                    let millis = value.div_euclid(1_000_000);
-                    let nanos = value.rem_euclid(1_000_000) as i32;
-                    (millis, nanos)
-                }
-            },
-            _ => unreachable!(),
+        let (millis, nanos) = match time_unit {
+            TimeUnit::Second => (value * 1000, 0),
+            TimeUnit::Millisecond => (value, 0),
+            TimeUnit::Microsecond => {
+                // Use Euclidean division so that nanos is always non-negative,
+                // even for timestamps before the Unix epoch.
+                let millis = value.div_euclid(1000);
+                let nanos = (value.rem_euclid(1000) * 1000) as i32;
+                (millis, nanos)
+            }
+            TimeUnit::Nanosecond => {
+                // Use Euclidean division so that nanos is always in [0, 999_999].
+                let millis = value.div_euclid(1_000_000);
+                let nanos = value.rem_euclid(1_000_000) as i32;
+                (millis, nanos)
+            }
         };
 
         if nanos == 0 {
-            construct_compact(millis)
+            Ok(construct_compact(millis))
         } else {
-            // nanos is guaranteed to be in valid range [0, 999_999] by arithmetic
-            construct_with_nanos(millis, nanos).expect("nanos in valid range by construction")
+            construct_with_nanos(millis, nanos)
         }
     }
 
     /// Read date value from Arrow Date32Array
-    fn read_date_from_arrow(&self, pos: usize) -> i32 {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<Date32Array>()
-            .expect("Expected Date32Array")
-            .value(self.row_id)
+    fn read_date_from_arrow(&self, pos: usize) -> Result<i32> {
+        Ok(self
+            .column(pos)?
+            .as_primitive_opt::<Date32Type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected Date32Array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
     /// Read time value from Arrow Time32/Time64 arrays, converting to milliseconds
-    fn read_time_from_arrow(&self, pos: usize) -> i32 {
-        let schema = self.record_batch.schema();
-        let arrow_field = schema.field(pos);
-        let column = self.record_batch.column(pos);
+    fn read_time_from_arrow(&self, pos: usize) -> Result<i32> {
+        let column = self.column(pos)?;
 
-        match arrow_field.data_type() {
+        match column.data_type() {
             ArrowDataType::Time32(TimeUnit::Second) => {
                 let value = column
-                    .as_any()
-                    .downcast_ref::<Time32SecondArray>()
-                    .expect("Expected Time32SecondArray")
+                    .as_primitive_opt::<Time32SecondType>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!("expected Time32SecondArray at position {pos}"),
+                    })?
                     .value(self.row_id);
-                value * 1000 // Convert seconds to milliseconds
+                Ok(value * 1000) // Convert seconds to milliseconds
             }
-            ArrowDataType::Time32(TimeUnit::Millisecond) => column
-                .as_any()
-                .downcast_ref::<Time32MillisecondArray>()
-                .expect("Expected Time32MillisecondArray")
-                .value(self.row_id),
+            ArrowDataType::Time32(TimeUnit::Millisecond) => Ok(column
+                .as_primitive_opt::<Time32MillisecondType>()
+                .ok_or_else(|| IllegalArgument {
+                    message: format!("expected Time32MillisecondArray at position {pos}"),
+                })?
+                .value(self.row_id)),
             ArrowDataType::Time64(TimeUnit::Microsecond) => {
                 let value = column
-                    .as_any()
-                    .downcast_ref::<Time64MicrosecondArray>()
-                    .expect("Expected Time64MicrosecondArray")
+                    .as_primitive_opt::<Time64MicrosecondType>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!("expected Time64MicrosecondArray at position {pos}"),
+                    })?
                     .value(self.row_id);
-                (value / 1000) as i32 // Convert microseconds to milliseconds
+                Ok((value / 1000) as i32) // Convert microseconds to milliseconds
             }
             ArrowDataType::Time64(TimeUnit::Nanosecond) => {
                 let value = column
-                    .as_any()
-                    .downcast_ref::<Time64NanosecondArray>()
-                    .expect("Expected Time64NanosecondArray")
+                    .as_primitive_opt::<Time64NanosecondType>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!("expected Time64NanosecondArray at position {pos}"),
+                    })?
                     .value(self.row_id);
-                (value / 1_000_000) as i32 // Convert nanoseconds to milliseconds
+                Ok((value / 1_000_000) as i32) // Convert nanoseconds to milliseconds
             }
-            other => panic!("Expected Time column at position {pos}, got {other:?}"),
+            other => Err(IllegalArgument {
+                message: format!("expected Time column at position {pos}, got {other:?}"),
+            }),
         }
     }
 }
@@ -183,106 +216,121 @@ impl InternalRow for ColumnarRow {
         self.record_batch.num_columns()
     }
 
-    fn is_null_at(&self, pos: usize) -> bool {
-        self.record_batch.column(pos).is_null(self.row_id)
+    fn is_null_at(&self, pos: usize) -> Result<bool> {
+        Ok(self.column(pos)?.is_null(self.row_id))
     }
 
-    fn get_boolean(&self, pos: usize) -> bool {
-        self.record_batch
-            .column(pos)
-            .as_boolean()
-            .value(self.row_id)
+    fn get_boolean(&self, pos: usize) -> Result<bool> {
+        Ok(self
+            .column(pos)?
+            .as_boolean_opt()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected boolean array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_byte(&self, pos: usize) -> i8 {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<Int8Array>()
-            .expect("Expect byte array")
-            .value(self.row_id)
+    fn get_byte(&self, pos: usize) -> Result<i8> {
+        Ok(self
+            .column(pos)?
+            .as_primitive_opt::<Int8Type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected byte array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_short(&self, pos: usize) -> i16 {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<Int16Array>()
-            .expect("Expect short array")
-            .value(self.row_id)
+    fn get_short(&self, pos: usize) -> Result<i16> {
+        Ok(self
+            .column(pos)?
+            .as_primitive_opt::<Int16Type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected short array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_int(&self, pos: usize) -> i32 {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<Int32Array>()
-            .expect("Expect int array")
-            .value(self.row_id)
+    fn get_int(&self, pos: usize) -> Result<i32> {
+        Ok(self
+            .column(pos)?
+            .as_primitive_opt::<Int32Type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected int array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_long(&self, pos: usize) -> i64 {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<Int64Array>()
-            .expect("Expect long array")
-            .value(self.row_id)
+    fn get_long(&self, pos: usize) -> Result<i64> {
+        Ok(self
+            .column(pos)?
+            .as_primitive_opt::<Int64Type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected long array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_float(&self, pos: usize) -> f32 {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<Float32Array>()
-            .expect("Expect float32 array")
-            .value(self.row_id)
+    fn get_float(&self, pos: usize) -> Result<f32> {
+        Ok(self
+            .column(pos)?
+            .as_primitive_opt::<Float32Type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected float32 array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_double(&self, pos: usize) -> f64 {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<Float64Array>()
-            .expect("Expect float64 array")
-            .value(self.row_id)
+    fn get_double(&self, pos: usize) -> Result<f64> {
+        Ok(self
+            .column(pos)?
+            .as_primitive_opt::<Float64Type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected float64 array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_char(&self, pos: usize, _length: usize) -> &str {
-        self.record_batch
-            .column(pos)
+    fn get_char(&self, pos: usize, _length: usize) -> Result<&str> {
+        Ok(self
+            .column(pos)?
             .as_any()
             .downcast_ref::<StringArray>()
-            .expect("Expected String array for char type")
-            .value(self.row_id)
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected String array for char type at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_string(&self, pos: usize) -> &str {
-        self.record_batch
-            .column(pos)
+    fn get_string(&self, pos: usize) -> Result<&str> {
+        Ok(self
+            .column(pos)?
             .as_any()
             .downcast_ref::<StringArray>()
-            .expect("Expected String array.")
-            .value(self.row_id)
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected String array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> crate::row::Decimal {
+    fn get_decimal(
+        &self,
+        pos: usize,
+        precision: usize,
+        scale: usize,
+    ) -> Result<crate::row::Decimal> {
         use arrow::datatypes::DataType;
 
-        let column = self.record_batch.column(pos);
+        let column = self.column(pos)?;
         let array = column
-            .as_any()
-            .downcast_ref::<Decimal128Array>()
-            .unwrap_or_else(|| {
-                panic!(
-                    "Expected Decimal128Array at column {}, found: {:?}",
-                    pos,
+            .as_primitive_opt::<Decimal128Type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!(
+                    "expected Decimal128Array at column {pos}, found: {:?}",
                     column.data_type()
-                )
-            });
+                ),
+            })?;
 
         // Contract: caller must check is_null_at() before calling get_decimal.
-        // Calling on null value violates the contract and returns garbage data
         debug_assert!(
             !array.is_null(self.row_id),
             "get_decimal called on null value at pos {} row {}",
@@ -290,12 +338,16 @@ impl InternalRow for ColumnarRow {
             self.row_id
         );
 
-        // Read scale from Arrow schema field metadata
-        let schema = self.record_batch.schema();
-        let field = schema.field(pos);
-        let arrow_scale = match field.data_type() {
+        // Read scale from Arrow column data type
+        let arrow_scale = match column.data_type() {
             DataType::Decimal128(_p, s) => *s as i64,
-            dt => panic!("Expected Decimal128 data type at column {pos}, found: {dt:?}"),
+            dt => {
+                return Err(IllegalArgument {
+                    message: format!(
+                        "expected Decimal128 data type at column {pos}, found: {dt:?}"
+                    ),
+                });
+            }
         };
 
         let i128_val = array.value(self.row_id);
@@ -307,60 +359,53 @@ impl InternalRow for ColumnarRow {
             precision as u32,
             scale as u32,
         )
-        .unwrap_or_else(|e| {
-            panic!(
-                "Failed to create Decimal at column {} row {}: {}",
-                pos, self.row_id, e
-            )
-        })
     }
 
-    fn get_date(&self, pos: usize) -> crate::row::datum::Date {
-        crate::row::datum::Date::new(self.read_date_from_arrow(pos))
+    fn get_date(&self, pos: usize) -> Result<Date> {
+        Ok(Date::new(self.read_date_from_arrow(pos)?))
     }
 
-    fn get_time(&self, pos: usize) -> crate::row::datum::Time {
-        crate::row::datum::Time::new(self.read_time_from_arrow(pos))
+    fn get_time(&self, pos: usize) -> Result<Time> {
+        Ok(Time::new(self.read_time_from_arrow(pos)?))
     }
 
-    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampNtz {
-        // Like Java's ArrowTimestampNtzColumnVector, we ignore the precision parameter
-        // and determine the conversion from the Arrow column's TimeUnit.
+    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> Result<TimestampNtz> {
         self.read_timestamp_from_arrow(
             pos,
             precision,
-            crate::row::datum::TimestampNtz::new,
-            crate::row::datum::TimestampNtz::from_millis_nanos,
+            TimestampNtz::new,
+            TimestampNtz::from_millis_nanos,
         )
     }
 
-    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampLtz {
-        // Like Java's ArrowTimestampLtzColumnVector, we ignore the precision parameter
-        // and determine the conversion from the Arrow column's TimeUnit.
+    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> Result<TimestampLtz> {
         self.read_timestamp_from_arrow(
             pos,
             precision,
-            crate::row::datum::TimestampLtz::new,
-            crate::row::datum::TimestampLtz::from_millis_nanos,
+            TimestampLtz::new,
+            TimestampLtz::from_millis_nanos,
         )
     }
 
-    fn get_binary(&self, pos: usize, _length: usize) -> &[u8] {
-        self.record_batch
-            .column(pos)
-            .as_any()
-            .downcast_ref::<FixedSizeBinaryArray>()
-            .expect("Expected binary array.")
-            .value(self.row_id)
+    fn get_binary(&self, pos: usize, _length: usize) -> Result<&[u8]> {
+        Ok(self
+            .column(pos)?
+            .as_fixed_size_binary_opt()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected binary array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 
-    fn get_bytes(&self, pos: usize) -> &[u8] {
-        self.record_batch
-            .column(pos)
+    fn get_bytes(&self, pos: usize) -> Result<&[u8]> {
+        Ok(self
+            .column(pos)?
             .as_any()
             .downcast_ref::<BinaryArray>()
-            .expect("Expected bytes array.")
-            .value(self.row_id)
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected bytes array at position {pos}"),
+            })?
+            .value(self.row_id))
     }
 }
 
@@ -368,8 +413,8 @@ impl InternalRow for ColumnarRow {
 mod tests {
     use super::*;
     use arrow::array::{
-        BinaryArray, BooleanArray, Float32Array, Float64Array, Int8Array, Int16Array, Int32Array,
-        Int64Array, StringArray,
+        BinaryArray, BooleanArray, Decimal128Array, Float32Array, Float64Array, Int8Array,
+        Int16Array, Int32Array, Int64Array, StringArray,
     };
     use arrow::datatypes::{DataType, Field, Schema};
 
@@ -407,16 +452,16 @@ mod tests {
 
         let mut row = ColumnarRow::new(Arc::new(batch));
         assert_eq!(row.get_field_count(), 10);
-        assert!(row.get_boolean(0));
-        assert_eq!(row.get_byte(1), 1);
-        assert_eq!(row.get_short(2), 2);
-        assert_eq!(row.get_int(3), 3);
-        assert_eq!(row.get_long(4), 4);
-        assert_eq!(row.get_float(5), 1.25);
-        assert_eq!(row.get_double(6), 2.5);
-        assert_eq!(row.get_string(7), "hello");
-        assert_eq!(row.get_bytes(8), b"data");
-        assert_eq!(row.get_char(9, 2), "ab");
+        assert!(row.get_boolean(0).unwrap());
+        assert_eq!(row.get_byte(1).unwrap(), 1);
+        assert_eq!(row.get_short(2).unwrap(), 2);
+        assert_eq!(row.get_int(3).unwrap(), 3);
+        assert_eq!(row.get_long(4).unwrap(), 4);
+        assert_eq!(row.get_float(5).unwrap(), 1.25);
+        assert_eq!(row.get_double(6).unwrap(), 2.5);
+        assert_eq!(row.get_string(7).unwrap(), "hello");
+        assert_eq!(row.get_bytes(8).unwrap(), b"data");
+        assert_eq!(row.get_char(9, 2).unwrap(), "ab");
         row.set_row_id(0);
         assert_eq!(row.get_row_id(), 0);
     }
@@ -465,12 +510,12 @@ mod tests {
 
         // Verify decimal values
         assert_eq!(
-            row.get_decimal(0, 10, 2),
+            row.get_decimal(0, 10, 2).unwrap(),
             crate::row::Decimal::from_big_decimal(BigDecimal::new(BigInt::from(12345), 2), 10, 2)
                 .unwrap()
         );
         assert_eq!(
-            row.get_decimal(1, 20, 5),
+            row.get_decimal(1, 20, 5).unwrap(),
             crate::row::Decimal::from_big_decimal(
                 BigDecimal::new(BigInt::from(1234567890), 5),
                 20,
@@ -479,7 +524,7 @@ mod tests {
             .unwrap()
         );
         assert_eq!(
-            row.get_decimal(2, 38, 10),
+            row.get_decimal(2, 38, 10).unwrap(),
             crate::row::Decimal::from_big_decimal(
                 BigDecimal::new(BigInt::from(999999999999999999i128), 10),
                 38,
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index 232220720c..918ebdfd5f 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -16,9 +16,11 @@
 // under the License.
 
 use crate::client::WriteFormat;
+use crate::error::Result;
 use crate::metadata::RowType;
 use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
-use crate::row::{GenericRow, InternalRow};
+use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
+use crate::row::{Decimal, GenericRow, InternalRow};
 use std::sync::{Arc, OnceLock};
 
 // Reference implementation:
@@ -81,74 +83,80 @@ impl<'a> InternalRow for CompactedRow<'a> {
         self.arity
     }
 
-    fn is_null_at(&self, pos: usize) -> bool {
-        self.deserializer.get_row_type().fields().as_slice()[pos]
-            .data_type
-            .is_nullable()
-            && self.reader.is_null_at(pos)
+    fn is_null_at(&self, pos: usize) -> Result<bool> {
+        let fields = self.deserializer.get_row_type().fields();
+        if pos >= fields.len() {
+            return Err(crate::error::Error::IllegalArgument {
+                message: format!(
+                    "position {pos} out of bounds (row has {} fields)",
+                    fields.len()
+                ),
+            });
+        }
+        Ok(fields.as_slice()[pos].data_type.is_nullable() && self.reader.is_null_at(pos))
     }
 
-    fn get_boolean(&self, pos: usize) -> bool {
+    fn get_boolean(&self, pos: usize) -> Result<bool> {
         self.decoded_row().get_boolean(pos)
     }
 
-    fn get_byte(&self, pos: usize) -> i8 {
+    fn get_byte(&self, pos: usize) -> Result<i8> {
         self.decoded_row().get_byte(pos)
     }
 
-    fn get_short(&self, pos: usize) -> i16 {
+    fn get_short(&self, pos: usize) -> Result<i16> {
         self.decoded_row().get_short(pos)
     }
 
-    fn get_int(&self, pos: usize) -> i32 {
+    fn get_int(&self, pos: usize) -> Result<i32> {
         self.decoded_row().get_int(pos)
     }
 
-    fn get_long(&self, pos: usize) -> i64 {
+    fn get_long(&self, pos: usize) -> Result<i64> {
         self.decoded_row().get_long(pos)
     }
 
-    fn get_float(&self, pos: usize) -> f32 {
+    fn get_float(&self, pos: usize) -> Result<f32> {
         self.decoded_row().get_float(pos)
     }
 
-    fn get_double(&self, pos: usize) -> f64 {
+    fn get_double(&self, pos: usize) -> Result<f64> {
         self.decoded_row().get_double(pos)
     }
 
-    fn get_char(&self, pos: usize, length: usize) -> &str {
+    fn get_char(&self, pos: usize, length: usize) -> Result<&str> {
         self.decoded_row().get_char(pos, length)
     }
 
-    fn get_string(&self, pos: usize) -> &str {
+    fn get_string(&self, pos: usize) -> Result<&str> {
         self.decoded_row().get_string(pos)
     }
 
-    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> crate::row::Decimal {
+    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Result<Decimal> {
         self.decoded_row().get_decimal(pos, precision, scale)
     }
 
-    fn get_date(&self, pos: usize) -> crate::row::datum::Date {
+    fn get_date(&self, pos: usize) -> Result<Date> {
         self.decoded_row().get_date(pos)
     }
 
-    fn get_time(&self, pos: usize) -> crate::row::datum::Time {
+    fn get_time(&self, pos: usize) -> Result<Time> {
         self.decoded_row().get_time(pos)
     }
 
-    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampNtz {
+    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> Result<TimestampNtz> {
         self.decoded_row().get_timestamp_ntz(pos, precision)
     }
 
-    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> crate::row::datum::TimestampLtz {
+    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> Result<TimestampLtz> {
         self.decoded_row().get_timestamp_ltz(pos, precision)
     }
 
-    fn get_binary(&self, pos: usize, length: usize) -> &[u8] {
+    fn get_binary(&self, pos: usize, length: usize) -> Result<&[u8]> {
         self.decoded_row().get_binary(pos, length)
     }
 
-    fn get_bytes(&self, pos: usize) -> &[u8] {
+    fn get_bytes(&self, pos: usize) -> Result<&[u8]> {
         self.decoded_row().get_bytes(pos)
     }
 
@@ -203,15 +211,15 @@ mod tests {
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
         assert_eq!(row.get_field_count(), 9);
-        assert!(row.get_boolean(0));
-        assert_eq!(row.get_byte(1), 1);
-        assert_eq!(row.get_short(2), 100);
-        assert_eq!(row.get_int(3), 1000);
-        assert_eq!(row.get_long(4), 10000);
-        assert_eq!(row.get_float(5), 1.5);
-        assert_eq!(row.get_double(6), 2.5);
-        assert_eq!(row.get_string(7), "Hello World");
-        assert_eq!(row.get_bytes(8), &[1, 2, 3, 4, 5]);
+        assert!(row.get_boolean(0).unwrap());
+        assert_eq!(row.get_byte(1).unwrap(), 1);
+        assert_eq!(row.get_short(2).unwrap(), 100);
+        assert_eq!(row.get_int(3).unwrap(), 1000);
+        assert_eq!(row.get_long(4).unwrap(), 10000);
+        assert_eq!(row.get_float(5).unwrap(), 1.5);
+        assert_eq!(row.get_double(6).unwrap(), 2.5);
+        assert_eq!(row.get_string(7).unwrap(), "Hello World");
+        assert_eq!(row.get_bytes(8).unwrap(), &[1, 2, 3, 4, 5]);
 
         // Test with nulls and negative values
         let row_type = RowType::with_data_types(vec![
@@ -228,13 +236,13 @@ mod tests {
         let bytes = writer.to_bytes();
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
-        assert!(!row.is_null_at(0));
-        assert!(row.is_null_at(1));
-        assert!(!row.is_null_at(2));
-        assert_eq!(row.get_int(0), -42);
-        assert_eq!(row.get_double(2), 2.71);
+        assert!(!row.is_null_at(0).unwrap());
+        assert!(row.is_null_at(1).unwrap());
+        assert!(!row.is_null_at(2).unwrap());
+        assert_eq!(row.get_int(0).unwrap(), -42);
+        assert_eq!(row.get_double(2).unwrap(), 2.71);
         // Verify caching works on repeated reads
-        assert_eq!(row.get_int(0), -42);
+        assert_eq!(row.get_int(0).unwrap(), -42);
     }
 
     #[test]
@@ -285,30 +293,33 @@ mod tests {
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
         // Verify all values
-        assert_eq!(row.get_date(0).get_inner(), 19651);
-        assert_eq!(row.get_time(1).get_inner(), 34200000);
-        assert_eq!(row.get_timestamp_ntz(2, 3).get_millisecond(), 1698235273182);
+        assert_eq!(row.get_date(0).unwrap().get_inner(), 19651);
+        assert_eq!(row.get_time(1).unwrap().get_inner(), 34200000);
+        assert_eq!(
+            row.get_timestamp_ntz(2, 3).unwrap().get_millisecond(),
+            1698235273182
+        );
         assert_eq!(
-            row.get_timestamp_ltz(3, 3).get_epoch_millisecond(),
+            row.get_timestamp_ltz(3, 3).unwrap().get_epoch_millisecond(),
             1698235273182
         );
-        let read_ts_ntz = row.get_timestamp_ntz(4, 6);
+        let read_ts_ntz = row.get_timestamp_ntz(4, 6).unwrap();
         assert_eq!(read_ts_ntz.get_millisecond(), 1698235273182);
         assert_eq!(read_ts_ntz.get_nano_of_millisecond(), 123456);
-        let read_ts_ltz = row.get_timestamp_ltz(5, 9);
+        let read_ts_ltz = row.get_timestamp_ltz(5, 9).unwrap();
         assert_eq!(read_ts_ltz.get_epoch_millisecond(), 1698235273182);
         assert_eq!(read_ts_ltz.get_nano_of_millisecond(), 987654);
         // Assert on Decimal equality
-        assert_eq!(row.get_decimal(6, 10, 2), small_decimal);
-        assert_eq!(row.get_decimal(7, 28, 10), large_decimal);
+        assert_eq!(row.get_decimal(6, 10, 2).unwrap(), small_decimal);
+        assert_eq!(row.get_decimal(7, 28, 10).unwrap(), large_decimal);
 
         // Assert on Decimal components to catch any regressions
-        let read_small_decimal = row.get_decimal(6, 10, 2);
+        let read_small_decimal = row.get_decimal(6, 10, 2).unwrap();
         assert_eq!(read_small_decimal.precision(), 10);
         assert_eq!(read_small_decimal.scale(), 2);
         assert_eq!(read_small_decimal.to_unscaled_long().unwrap(), 12345);
 
-        let read_large_decimal = row.get_decimal(7, 28, 10);
+        let read_large_decimal = row.get_decimal(7, 28, 10).unwrap();
         assert_eq!(read_large_decimal.precision(), 28);
         assert_eq!(read_large_decimal.scale(), 10);
         assert_eq!(
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
index 563c1c960e..d201450be4 100644
--- a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
@@ -83,7 +83,7 @@ impl KeyEncoder for CompactedKeyEncoder {
 
         // iterate all the fields of the row, and encode each field
         for (pos, field_getter) in self.field_getters.iter().enumerate() {
-            match &field_getter.get_field(row) {
+            match &field_getter.get_field(row)? {
                 Datum::Null => {
                     return Err(IllegalArgument {
                         message: format!("Cannot encode key with null value at position: {pos:?}"),
diff --git a/fluss-rust/crates/fluss/src/row/field_getter.rs b/fluss-rust/crates/fluss/src/row/field_getter.rs
index cbffa4d09f..d6b9fc94d7 100644
--- a/fluss-rust/crates/fluss/src/row/field_getter.rs
+++ b/fluss-rust/crates/fluss/src/row/field_getter.rs
@@ -15,6 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::error::Result;
 use crate::metadata::{DataType, RowType};
 use crate::row::{Datum, InternalRow};
 
@@ -24,11 +25,11 @@ pub enum FieldGetter {
     NonNullable(InnerFieldGetter),
 }
 impl FieldGetter {
-    pub fn get_field<'a>(&self, row: &'a dyn InternalRow) -> Datum<'a> {
+    pub fn get_field<'a>(&self, row: &'a dyn InternalRow) -> Result<Datum<'a>> {
         match self {
             FieldGetter::Nullable(getter) => {
-                if row.is_null_at(getter.pos()) {
-                    Datum::Null
+                if row.is_null_at(getter.pos())? {
+                    Ok(Datum::Null)
                 } else {
                     getter.get_field(row)
                 }
@@ -151,33 +152,33 @@ pub enum InnerFieldGetter {
 }
 
 impl InnerFieldGetter {
-    pub fn get_field<'a>(&self, row: &'a dyn InternalRow) -> Datum<'a> {
-        match self {
-            InnerFieldGetter::Char { pos, len } => Datum::from(row.get_char(*pos, *len)),
-            InnerFieldGetter::String { pos } => Datum::from(row.get_string(*pos)),
-            InnerFieldGetter::Bool { pos } => Datum::from(row.get_boolean(*pos)),
-            InnerFieldGetter::Binary { pos, len } => Datum::from(row.get_binary(*pos, *len)),
-            InnerFieldGetter::Bytes { pos } => Datum::from(row.get_bytes(*pos)),
-            InnerFieldGetter::TinyInt { pos } => Datum::from(row.get_byte(*pos)),
-            InnerFieldGetter::SmallInt { pos } => Datum::from(row.get_short(*pos)),
-            InnerFieldGetter::Int { pos } => Datum::from(row.get_int(*pos)),
-            InnerFieldGetter::BigInt { pos } => Datum::from(row.get_long(*pos)),
-            InnerFieldGetter::Float { pos } => Datum::from(row.get_float(*pos)),
-            InnerFieldGetter::Double { pos } => Datum::from(row.get_double(*pos)),
+    pub fn get_field<'a>(&self, row: &'a dyn InternalRow) -> Result<Datum<'a>> {
+        Ok(match self {
+            InnerFieldGetter::Char { pos, len } => Datum::from(row.get_char(*pos, *len)?),
+            InnerFieldGetter::String { pos } => Datum::from(row.get_string(*pos)?),
+            InnerFieldGetter::Bool { pos } => Datum::from(row.get_boolean(*pos)?),
+            InnerFieldGetter::Binary { pos, len } => Datum::from(row.get_binary(*pos, *len)?),
+            InnerFieldGetter::Bytes { pos } => Datum::from(row.get_bytes(*pos)?),
+            InnerFieldGetter::TinyInt { pos } => Datum::from(row.get_byte(*pos)?),
+            InnerFieldGetter::SmallInt { pos } => Datum::from(row.get_short(*pos)?),
+            InnerFieldGetter::Int { pos } => Datum::from(row.get_int(*pos)?),
+            InnerFieldGetter::BigInt { pos } => Datum::from(row.get_long(*pos)?),
+            InnerFieldGetter::Float { pos } => Datum::from(row.get_float(*pos)?),
+            InnerFieldGetter::Double { pos } => Datum::from(row.get_double(*pos)?),
             InnerFieldGetter::Decimal {
                 pos,
                 precision,
                 scale,
-            } => Datum::Decimal(row.get_decimal(*pos, *precision, *scale)),
-            InnerFieldGetter::Date { pos } => Datum::Date(row.get_date(*pos)),
-            InnerFieldGetter::Time { pos } => Datum::Time(row.get_time(*pos)),
+            } => Datum::Decimal(row.get_decimal(*pos, *precision, *scale)?),
+            InnerFieldGetter::Date { pos } => Datum::Date(row.get_date(*pos)?),
+            InnerFieldGetter::Time { pos } => Datum::Time(row.get_time(*pos)?),
             InnerFieldGetter::Timestamp { pos, precision } => {
-                Datum::TimestampNtz(row.get_timestamp_ntz(*pos, *precision))
+                Datum::TimestampNtz(row.get_timestamp_ntz(*pos, *precision)?)
             }
             InnerFieldGetter::TimestampLtz { pos, precision } => {
-                Datum::TimestampLtz(row.get_timestamp_ltz(*pos, *precision))
+                Datum::TimestampLtz(row.get_timestamp_ltz(*pos, *precision)?)
             } //TODO Array, Map, Row
-        }
+        })
     }
 
     pub fn pos(&self) -> usize {
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 276dcca38e..8fb777d257 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -54,67 +54,69 @@ impl<'a> BinaryRow<'a> {
     }
 }
 
-// TODO make functions return Result<?> for better error handling
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+
 pub trait InternalRow: Send + Sync {
     /// Returns the number of fields in this row
     fn get_field_count(&self) -> usize;
 
     /// Returns true if the element is null at the given position
-    fn is_null_at(&self, pos: usize) -> bool;
+    fn is_null_at(&self, pos: usize) -> Result<bool>;
 
     /// Returns the boolean value at the given position
-    fn get_boolean(&self, pos: usize) -> bool;
+    fn get_boolean(&self, pos: usize) -> Result<bool>;
 
     /// Returns the byte value at the given position
-    fn get_byte(&self, pos: usize) -> i8;
+    fn get_byte(&self, pos: usize) -> Result<i8>;
 
     /// Returns the short value at the given position
-    fn get_short(&self, pos: usize) -> i16;
+    fn get_short(&self, pos: usize) -> Result<i16>;
 
     /// Returns the integer value at the given position
-    fn get_int(&self, pos: usize) -> i32;
+    fn get_int(&self, pos: usize) -> Result<i32>;
 
     /// Returns the long value at the given position
-    fn get_long(&self, pos: usize) -> i64;
+    fn get_long(&self, pos: usize) -> Result<i64>;
 
     /// Returns the float value at the given position
-    fn get_float(&self, pos: usize) -> f32;
+    fn get_float(&self, pos: usize) -> Result<f32>;
 
     /// Returns the double value at the given position
-    fn get_double(&self, pos: usize) -> f64;
+    fn get_double(&self, pos: usize) -> Result<f64>;
 
     /// Returns the string value at the given position with fixed length
-    fn get_char(&self, pos: usize, length: usize) -> &str;
+    fn get_char(&self, pos: usize, length: usize) -> Result<&str>;
 
     /// Returns the string value at the given position
-    fn get_string(&self, pos: usize) -> &str;
+    fn get_string(&self, pos: usize) -> Result<&str>;
 
     /// Returns the decimal value at the given position
-    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Decimal;
+    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Result<Decimal>;
 
     /// Returns the date value at the given position (date as days since epoch)
-    fn get_date(&self, pos: usize) -> datum::Date;
+    fn get_date(&self, pos: usize) -> Result<Date>;
 
     /// Returns the time value at the given position (time as milliseconds since midnight)
-    fn get_time(&self, pos: usize) -> datum::Time;
+    fn get_time(&self, pos: usize) -> Result<Time>;
 
     /// Returns the timestamp value at the given position (timestamp without timezone)
     ///
     /// The precision is required to determine whether the timestamp value was stored
     /// in a compact representation (precision <= 3) or with nanosecond precision.
-    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> datum::TimestampNtz;
+    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> Result<TimestampNtz>;
 
     /// Returns the timestamp value at the given position (timestamp with local timezone)
     ///
     /// The precision is required to determine whether the timestamp value was stored
     /// in a compact representation (precision <= 3) or with nanosecond precision.
-    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> datum::TimestampLtz;
+    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> Result<TimestampLtz>;
 
     /// Returns the binary value at the given position with fixed length
-    fn get_binary(&self, pos: usize, length: usize) -> &[u8];
+    fn get_binary(&self, pos: usize, length: usize) -> Result<&[u8]>;
 
     /// Returns the binary value at the given position
-    fn get_bytes(&self, pos: usize) -> &[u8];
+    fn get_bytes(&self, pos: usize) -> Result<&[u8]>;
 
     /// Returns encoded bytes if already encoded
     fn as_encoded_bytes(&self, _write_format: WriteFormat) -> Option<&[u8]> {
@@ -127,98 +129,149 @@ pub struct GenericRow<'a> {
     pub values: Vec<Datum<'a>>,
 }
 
+impl<'a> GenericRow<'a> {
+    fn get_value(&self, pos: usize) -> Result<&Datum<'a>> {
+        self.values.get(pos).ok_or_else(|| IllegalArgument {
+            message: format!(
+                "position {pos} out of bounds (row has {} fields)",
+                self.values.len()
+            ),
+        })
+    }
+
+    fn try_convert<T: TryFrom<&'a Datum<'a>>>(
+        &'a self,
+        pos: usize,
+        expected_type: &str,
+    ) -> Result<T> {
+        let datum = self.get_value(pos)?;
+        T::try_from(datum).map_err(|_| IllegalArgument {
+            message: format!(
+                "type mismatch at position {pos}: expected {expected_type}, got {datum:?}"
+            ),
+        })
+    }
+}
+
 impl<'a> InternalRow for GenericRow<'a> {
     fn get_field_count(&self) -> usize {
         self.values.len()
     }
 
-    fn is_null_at(&self, pos: usize) -> bool {
-        self.values
-            .get(pos)
-            .expect("position out of bounds")
-            .is_null()
+    fn is_null_at(&self, pos: usize) -> Result<bool> {
+        Ok(self.get_value(pos)?.is_null())
     }
 
-    fn get_boolean(&self, pos: usize) -> bool {
-        self.values.get(pos).unwrap().try_into().unwrap()
+    fn get_boolean(&self, pos: usize) -> Result<bool> {
+        self.try_convert(pos, "Boolean")
     }
 
-    fn get_byte(&self, pos: usize) -> i8 {
-        self.values.get(pos).unwrap().try_into().unwrap()
+    fn get_byte(&self, pos: usize) -> Result<i8> {
+        self.try_convert(pos, "TinyInt")
     }
 
-    fn get_short(&self, pos: usize) -> i16 {
-        self.values.get(pos).unwrap().try_into().unwrap()
+    fn get_short(&self, pos: usize) -> Result<i16> {
+        self.try_convert(pos, "SmallInt")
     }
 
-    fn get_int(&self, pos: usize) -> i32 {
-        self.values.get(pos).unwrap().try_into().unwrap()
+    fn get_int(&self, pos: usize) -> Result<i32> {
+        self.try_convert(pos, "Int")
     }
 
-    fn get_long(&self, _pos: usize) -> i64 {
-        self.values.get(_pos).unwrap().try_into().unwrap()
+    fn get_long(&self, pos: usize) -> Result<i64> {
+        self.try_convert(pos, "BigInt")
     }
 
-    fn get_float(&self, pos: usize) -> f32 {
-        self.values.get(pos).unwrap().try_into().unwrap()
+    fn get_float(&self, pos: usize) -> Result<f32> {
+        self.try_convert(pos, "Float")
     }
 
-    fn get_double(&self, pos: usize) -> f64 {
-        self.values.get(pos).unwrap().try_into().unwrap()
+    fn get_double(&self, pos: usize) -> Result<f64> {
+        self.try_convert(pos, "Double")
     }
 
-    fn get_char(&self, pos: usize, _length: usize) -> &str {
+    fn get_char(&self, pos: usize, _length: usize) -> Result<&str> {
         // don't check length, following java client
         self.get_string(pos)
     }
 
-    fn get_string(&self, pos: usize) -> &str {
-        self.values.get(pos).unwrap().try_into().unwrap()
+    fn get_string(&self, pos: usize) -> Result<&str> {
+        self.try_convert(pos, "String")
     }
 
-    fn get_decimal(&self, pos: usize, _precision: usize, _scale: usize) -> Decimal {
-        match self.values.get(pos).unwrap() {
-            Datum::Decimal(d) => d.clone(),
-            other => panic!("Expected Decimal at pos {pos:?}, got {other:?}"),
+    fn get_decimal(&self, pos: usize, _precision: usize, _scale: usize) -> Result<Decimal> {
+        match self.get_value(pos)? {
+            Datum::Decimal(d) => Ok(d.clone()),
+            other => Err(IllegalArgument {
+                message: format!(
+                    "type mismatch at position {pos}: expected Decimal, got {other:?}"
+                ),
+            }),
         }
     }
 
-    fn get_date(&self, pos: usize) -> datum::Date {
-        match self.values.get(pos).unwrap() {
-            Datum::Date(d) => *d,
-            Datum::Int32(i) => datum::Date::new(*i),
-            other => panic!("Expected Date or Int32 at pos {pos:?}, got {other:?}"),
+    fn get_date(&self, pos: usize) -> Result<Date> {
+        match self.get_value(pos)? {
+            Datum::Date(d) => Ok(*d),
+            Datum::Int32(i) => Ok(Date::new(*i)),
+            other => Err(IllegalArgument {
+                message: format!(
+                    "type mismatch at position {pos}: expected Date or Int32, got {other:?}"
+                ),
+            }),
         }
     }
 
-    fn get_time(&self, pos: usize) -> datum::Time {
-        match self.values.get(pos).unwrap() {
-            Datum::Time(t) => *t,
-            Datum::Int32(i) => datum::Time::new(*i),
-            other => panic!("Expected Time or Int32 at pos {pos:?}, got {other:?}"),
+    fn get_time(&self, pos: usize) -> Result<Time> {
+        match self.get_value(pos)? {
+            Datum::Time(t) => Ok(*t),
+            Datum::Int32(i) => Ok(Time::new(*i)),
+            other => Err(IllegalArgument {
+                message: format!(
+                    "type mismatch at position {pos}: expected Time or Int32, got {other:?}"
+                ),
+            }),
         }
     }
 
-    fn get_timestamp_ntz(&self, pos: usize, _precision: u32) -> datum::TimestampNtz {
-        match self.values.get(pos).unwrap() {
-            Datum::TimestampNtz(t) => *t,
-            other => panic!("Expected TimestampNtz at pos {pos:?}, got {other:?}"),
+    fn get_timestamp_ntz(&self, pos: usize, _precision: u32) -> Result<TimestampNtz> {
+        match self.get_value(pos)? {
+            Datum::TimestampNtz(t) => Ok(*t),
+            other => Err(IllegalArgument {
+                message: format!(
+                    "type mismatch at position {pos}: expected TimestampNtz, got {other:?}"
+                ),
+            }),
         }
     }
 
-    fn get_timestamp_ltz(&self, pos: usize, _precision: u32) -> datum::TimestampLtz {
-        match self.values.get(pos).unwrap() {
-            Datum::TimestampLtz(t) => *t,
-            other => panic!("Expected TimestampLtz at pos {pos:?}, got {other:?}"),
+    fn get_timestamp_ltz(&self, pos: usize, _precision: u32) -> Result<TimestampLtz> {
+        match self.get_value(pos)? {
+            Datum::TimestampLtz(t) => Ok(*t),
+            other => Err(IllegalArgument {
+                message: format!(
+                    "type mismatch at position {pos}: expected TimestampLtz, got {other:?}"
+                ),
+            }),
         }
     }
 
-    fn get_binary(&self, pos: usize, _length: usize) -> &[u8] {
-        self.values.get(pos).unwrap().as_blob()
+    fn get_binary(&self, pos: usize, _length: usize) -> Result<&[u8]> {
+        match self.get_value(pos)? {
+            Datum::Blob(b) => Ok(b.as_ref()),
+            other => Err(IllegalArgument {
+                message: format!("type mismatch at position {pos}: expected Binary, got {other:?}"),
+            }),
+        }
     }
 
-    fn get_bytes(&self, pos: usize) -> &[u8] {
-        self.values.get(pos).unwrap().as_blob()
+    fn get_bytes(&self, pos: usize) -> Result<&[u8]> {
+        match self.get_value(pos)? {
+            Datum::Blob(b) => Ok(b.as_ref()),
+            other => Err(IllegalArgument {
+                message: format!("type mismatch at position {pos}: expected Bytes, got {other:?}"),
+            }),
+        }
     }
 }
 
@@ -268,17 +321,27 @@ mod tests {
         row.set_field(0, Datum::Null);
         row.set_field(1, 42_i32);
 
-        assert!(row.is_null_at(0));
-        assert!(!row.is_null_at(1));
+        assert!(row.is_null_at(0).unwrap());
+        assert!(!row.is_null_at(1).unwrap());
+    }
+
+    #[test]
+    fn is_null_at_out_of_bounds_returns_error() {
+        let row = GenericRow::from_data(vec![42_i32]);
+        let err = row.is_null_at(5).unwrap_err();
+        assert!(
+            err.to_string().contains("out of bounds"),
+            "Expected out of bounds error, got: {err}"
+        );
     }
 
     #[test]
     fn new_initializes_nulls() {
         let row = GenericRow::new(3);
         assert_eq!(row.get_field_count(), 3);
-        assert!(row.is_null_at(0));
-        assert!(row.is_null_at(1));
-        assert!(row.is_null_at(2));
+        assert!(row.is_null_at(0).unwrap());
+        assert!(row.is_null_at(1).unwrap());
+        assert!(row.is_null_at(2).unwrap());
     }
 
     #[test]
@@ -288,8 +351,28 @@ mod tests {
         row.set_field(0, 123_i32);
         // Fields 1 and 2 remain null
         assert_eq!(row.get_field_count(), 3);
-        assert_eq!(row.get_int(0), 123);
-        assert!(row.is_null_at(1));
-        assert!(row.is_null_at(2));
+        assert_eq!(row.get_int(0).unwrap(), 123);
+        assert!(row.is_null_at(1).unwrap());
+        assert!(row.is_null_at(2).unwrap());
+    }
+
+    #[test]
+    fn type_mismatch_returns_error() {
+        let row = GenericRow::from_data(vec![Datum::Int64(999)]);
+        let err = row.get_string(0).unwrap_err();
+        assert!(
+            err.to_string().contains("type mismatch"),
+            "Expected type mismatch error, got: {err}"
+        );
+    }
+
+    #[test]
+    fn out_of_bounds_returns_error() {
+        let row = GenericRow::from_data(vec![42_i32]);
+        let err = row.get_int(5).unwrap_err();
+        assert!(
+            err.to_string().contains("out of bounds"),
+            "Expected out of bounds error, got: {err}"
+        );
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/row_decoder.rs b/fluss-rust/crates/fluss/src/row/row_decoder.rs
index 9f9b4217a2..aea8c86e94 100644
--- a/fluss-rust/crates/fluss/src/row/row_decoder.rs
+++ b/fluss-rust/crates/fluss/src/row/row_decoder.rs
@@ -112,8 +112,8 @@ mod tests {
 
         // Verify
         assert_eq!(row.get_field_count(), 2);
-        assert_eq!(row.get_int(0), 42);
-        assert_eq!(row.get_string(1), "hello");
+        assert_eq!(row.get_int(0).unwrap(), 42);
+        assert_eq!(row.get_string(1).unwrap(), "hello");
     }
 
     #[test]
@@ -131,7 +131,7 @@ mod tests {
         let row = decoder.decode(&data);
 
         // Verify
-        assert_eq!(row.get_int(0), 100);
-        assert_eq!(row.get_string(1), "world");
+        assert_eq!(row.get_int(0).unwrap(), 100);
+        assert_eq!(row.get_string(1).unwrap(), "world");
     }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index ab5f5b6f32..c101a18941 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -64,7 +64,7 @@ mod kv_table_test {
         let cluster = get_fluss_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().await.unwrap();
 
         let table_path = TablePath::new("fluss", "test_upsert_and_lookup");
 
@@ -83,10 +83,7 @@ mod kv_table_test {
 
         create_table(&admin, &table_path, &table_descriptor).await;
 
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
+        let table = connection.get_table(&table_path).await.unwrap();
 
         let table_upsert = table.new_upsert().expect("Failed to create upsert");
         let upsert_writer = table_upsert
@@ -118,14 +115,11 @@ mod kv_table_test {
                 .lookup(&make_key(*id))
                 .await
                 .expect("Failed to lookup");
-            let row = result
-                .get_single_row()
-                .expect("Failed to get row")
-                .expect("Row should exist");
+            let row = result.get_single_row().unwrap().expect("Row should exist");
 
-            assert_eq!(row.get_int(0), *id, "id mismatch");
-            assert_eq!(row.get_string(1), *expected_name, "name mismatch");
-            assert_eq!(row.get_long(2), *expected_age, "age mismatch");
+            assert_eq!(row.get_int(0).unwrap(), *id, "id mismatch");
+            assert_eq!(row.get_string(1).unwrap(), *expected_name, "name mismatch");
+            assert_eq!(row.get_long(2).unwrap(), *expected_age, "age mismatch");
         }
 
         // Update the record with new age (await acknowledgment)
@@ -144,18 +138,15 @@ mod kv_table_test {
             .lookup(&make_key(1))
             .await
             .expect("Failed to lookup after update");
-        let found_row = result
-            .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
+        let found_row = result.get_single_row().unwrap().expect("Row should exist");
         assert_eq!(
-            found_row.get_long(2),
-            updated_row.get_long(2),
+            found_row.get_long(2).unwrap(),
+            updated_row.get_long(2).unwrap(),
             "Age should be updated"
         );
         assert_eq!(
-            found_row.get_string(1),
-            updated_row.get_string(1),
+            found_row.get_string(1).unwrap(),
+            updated_row.get_string(1).unwrap(),
             "Name should remain unchanged"
         );
 
@@ -174,10 +165,7 @@ mod kv_table_test {
             .await
             .expect("Failed to lookup deleted record");
         assert!(
-            result
-                .get_single_row()
-                .expect("Failed to get row")
-                .is_none(),
+            result.get_single_row().unwrap().is_none(),
             "Record 1 should not exist after delete"
         );
 
@@ -188,10 +176,7 @@ mod kv_table_test {
                 .await
                 .expect("Failed to lookup");
             assert!(
-                result
-                    .get_single_row()
-                    .expect("Failed to get row")
-                    .is_some(),
+                result.get_single_row().unwrap().is_some(),
                 "Record {} should still exist after deleting record 1",
                 i
             );
@@ -203,10 +188,7 @@ mod kv_table_test {
             .await
             .expect("Failed to lookup non-existent key");
         assert!(
-            result
-                .get_single_row()
-                .expect("Failed to get row")
-                .is_none(),
+            result.get_single_row().unwrap().is_none(),
             "Non-existent key should return None"
         );
 
@@ -221,7 +203,7 @@ mod kv_table_test {
         let cluster = get_fluss_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().await.unwrap();
 
         let table_path = TablePath::new("fluss", "test_composite_pk");
 
@@ -240,10 +222,7 @@ mod kv_table_test {
 
         create_table(&admin, &table_path, &table_descriptor).await;
 
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
+        let table = connection.get_table(&table_path).await.unwrap();
 
         let table_upsert = table.new_upsert().expect("Failed to create upsert");
         let upsert_writer = table_upsert
@@ -279,22 +258,24 @@ mod kv_table_test {
         key.set_field(0, "US");
         key.set_field(1, 1);
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
-        let row = result
-            .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
-        assert_eq!(row.get_long(2), 100, "Score for (US, 1) should be 100");
+        let row = result.get_single_row().unwrap().expect("Row should exist");
+        assert_eq!(
+            row.get_long(2).unwrap(),
+            100,
+            "Score for (US, 1) should be 100"
+        );
 
         // Lookup (EU, 2) - should return score 250
         let mut key = GenericRow::new(3);
         key.set_field(0, "EU");
         key.set_field(1, 2);
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
-        let row = result
-            .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
-        assert_eq!(row.get_long(2), 250, "Score for (EU, 2) should be 250");
+        let row = result.get_single_row().unwrap().expect("Row should exist");
+        assert_eq!(
+            row.get_long(2).unwrap(),
+            250,
+            "Score for (EU, 2) should be 250"
+        );
 
         // Update (US, 1) score (await acknowledgment)
         let mut update_row = GenericRow::new(3);
@@ -312,13 +293,10 @@ mod kv_table_test {
         key.set_field(0, "US");
         key.set_field(1, 1);
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
-        let row = result
-            .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
+        let row = result.get_single_row().unwrap().expect("Row should exist");
         assert_eq!(
-            row.get_long(2),
-            update_row.get_long(2),
+            row.get_long(2).unwrap(),
+            update_row.get_long(2).unwrap(),
             "Row score should be updated"
         );
 
@@ -393,10 +371,10 @@ mod kv_table_test {
             .expect("Failed to get row")
             .expect("Row should exist");
 
-        assert_eq!(found_row.get_int(0), 1);
-        assert_eq!(found_row.get_string(1), "Verso");
-        assert_eq!(found_row.get_long(2), 32i64);
-        assert_eq!(found_row.get_long(3), 6942i64);
+        assert_eq!(found_row.get_int(0).unwrap(), 1);
+        assert_eq!(found_row.get_string(1).unwrap(), "Verso");
+        assert_eq!(found_row.get_long(2).unwrap(), 32i64);
+        assert_eq!(found_row.get_long(3).unwrap(), 6942i64);
 
         // Create partial update writer to update only score column
         let partial_upsert = table_upsert
@@ -428,14 +406,22 @@ mod kv_table_test {
             .expect("Failed to get row")
             .expect("Row should exist");
 
-        assert_eq!(found_row.get_int(0), 1, "id should remain 1");
+        assert_eq!(found_row.get_int(0).unwrap(), 1, "id should remain 1");
         assert_eq!(
-            found_row.get_string(1),
+            found_row.get_string(1).unwrap(),
             "Verso",
             "name should remain unchanged"
         );
-        assert_eq!(found_row.get_long(2), 32, "age should remain unchanged");
-        assert_eq!(found_row.get_long(3), 420, "score should be updated to 420");
+        assert_eq!(
+            found_row.get_long(2).unwrap(),
+            32,
+            "age should remain unchanged"
+        );
+        assert_eq!(
+            found_row.get_long(3).unwrap(),
+            420,
+            "score should be updated to 420"
+        );
 
         admin
             .drop_table(&table_path, false)
@@ -524,10 +510,10 @@ mod kv_table_test {
                 .expect("Failed to get row")
                 .expect("Row should exist");
 
-            assert_eq!(row.get_string(0), *region, "region mismatch");
-            assert_eq!(row.get_int(1), *user_id, "user_id mismatch");
-            assert_eq!(row.get_string(2), *expected_name, "name mismatch");
-            assert_eq!(row.get_long(3), *expected_score, "score mismatch");
+            assert_eq!(row.get_string(0).unwrap(), *region, "region mismatch");
+            assert_eq!(row.get_int(1).unwrap(), *user_id, "user_id mismatch");
+            assert_eq!(row.get_string(2).unwrap(), *expected_name, "name mismatch");
+            assert_eq!(row.get_long(3).unwrap(), *expected_score, "score mismatch");
         }
 
         // Test update within a partition (await acknowledgment)
@@ -551,8 +537,8 @@ mod kv_table_test {
             .get_single_row()
             .expect("Failed to get row")
             .expect("Row should exist");
-        assert_eq!(row.get_string(2), "Gustave Updated");
-        assert_eq!(row.get_long(3), 999);
+        assert_eq!(row.get_string(2).unwrap(), "Gustave Updated");
+        assert_eq!(row.get_long(3).unwrap(), 999);
 
         // Lookup in non-existent partition should return empty result
         let mut non_existent_key = GenericRow::new(4);
@@ -602,7 +588,7 @@ mod kv_table_test {
             .get_single_row()
             .expect("Failed to get row")
             .expect("Row should exist");
-        assert_eq!(row.get_string(2), "Maelle");
+        assert_eq!(row.get_string(2).unwrap(), "Maelle");
 
         admin
             .drop_table(&table_path, false)
@@ -732,62 +718,88 @@ mod kv_table_test {
             .expect("Row should exist");
 
         // Verify all datatypes
-        assert_eq!(found_row.get_int(0), pk_int, "pk_int mismatch");
+        assert_eq!(found_row.get_int(0).unwrap(), pk_int, "pk_int mismatch");
         assert_eq!(
-            found_row.get_boolean(1),
+            found_row.get_boolean(1).unwrap(),
             col_boolean,
             "col_boolean mismatch"
         );
-        assert_eq!(found_row.get_byte(2), col_tinyint, "col_tinyint mismatch");
         assert_eq!(
-            found_row.get_short(3),
+            found_row.get_byte(2).unwrap(),
+            col_tinyint,
+            "col_tinyint mismatch"
+        );
+        assert_eq!(
+            found_row.get_short(3).unwrap(),
             col_smallint,
             "col_smallint mismatch"
         );
-        assert_eq!(found_row.get_int(4), col_int, "col_int mismatch");
-        assert_eq!(found_row.get_long(5), col_bigint, "col_bigint mismatch");
+        assert_eq!(found_row.get_int(4).unwrap(), col_int, "col_int mismatch");
+        assert_eq!(
+            found_row.get_long(5).unwrap(),
+            col_bigint,
+            "col_bigint mismatch"
+        );
         assert!(
-            (found_row.get_float(6) - col_float).abs() < f32::EPSILON,
+            (found_row.get_float(6).unwrap() - col_float).abs() < f32::EPSILON,
             "col_float mismatch: expected {}, got {}",
             col_float,
-            found_row.get_float(6)
+            found_row.get_float(6).unwrap()
         );
         assert!(
-            (found_row.get_double(7) - col_double).abs() < f64::EPSILON,
+            (found_row.get_double(7).unwrap() - col_double).abs() < f64::EPSILON,
             "col_double mismatch: expected {}, got {}",
             col_double,
-            found_row.get_double(7)
+            found_row.get_double(7).unwrap()
+        );
+        assert_eq!(
+            found_row.get_char(8, 10).unwrap(),
+            col_char,
+            "col_char mismatch"
+        );
+        assert_eq!(
+            found_row.get_string(9).unwrap(),
+            col_string,
+            "col_string mismatch"
         );
-        assert_eq!(found_row.get_char(8, 10), col_char, "col_char mismatch");
-        assert_eq!(found_row.get_string(9), col_string, "col_string mismatch");
         assert_eq!(
-            found_row.get_decimal(10, 10, 2),
+            found_row.get_decimal(10, 10, 2).unwrap(),
             col_decimal,
             "col_decimal mismatch"
         );
         assert_eq!(
-            found_row.get_date(11).get_inner(),
+            found_row.get_date(11).unwrap().get_inner(),
             col_date.get_inner(),
             "col_date mismatch"
         );
         assert_eq!(
-            found_row.get_time(12).get_inner(),
+            found_row.get_time(12).unwrap().get_inner(),
             col_time.get_inner(),
             "col_time mismatch"
         );
         assert_eq!(
-            found_row.get_timestamp_ntz(13, 6).get_millisecond(),
+            found_row
+                .get_timestamp_ntz(13, 6)
+                .unwrap()
+                .get_millisecond(),
             col_timestamp.get_millisecond(),
             "col_timestamp mismatch"
         );
         assert_eq!(
-            found_row.get_timestamp_ltz(14, 6).get_epoch_millisecond(),
+            found_row
+                .get_timestamp_ltz(14, 6)
+                .unwrap()
+                .get_epoch_millisecond(),
             col_timestamp_ltz.get_epoch_millisecond(),
             "col_timestamp_ltz mismatch"
         );
-        assert_eq!(found_row.get_bytes(15), col_bytes, "col_bytes mismatch");
         assert_eq!(
-            found_row.get_binary(16, 20),
+            found_row.get_bytes(15).unwrap(),
+            col_bytes,
+            "col_bytes mismatch"
+        );
+        assert_eq!(
+            found_row.get_binary(16, 20).unwrap(),
             col_binary,
             "col_binary mismatch"
         );
@@ -830,29 +842,75 @@ mod kv_table_test {
             .expect("Row should exist");
 
         // Verify all nullable columns are null
-        assert_eq!(found_row_nulls.get_int(0), pk_int_2, "pk_int mismatch");
-        assert!(found_row_nulls.is_null_at(1), "col_boolean should be null");
-        assert!(found_row_nulls.is_null_at(2), "col_tinyint should be null");
-        assert!(found_row_nulls.is_null_at(3), "col_smallint should be null");
-        assert!(found_row_nulls.is_null_at(4), "col_int should be null");
-        assert!(found_row_nulls.is_null_at(5), "col_bigint should be null");
-        assert!(found_row_nulls.is_null_at(6), "col_float should be null");
-        assert!(found_row_nulls.is_null_at(7), "col_double should be null");
-        assert!(found_row_nulls.is_null_at(8), "col_char should be null");
-        assert!(found_row_nulls.is_null_at(9), "col_string should be null");
-        assert!(found_row_nulls.is_null_at(10), "col_decimal should be null");
-        assert!(found_row_nulls.is_null_at(11), "col_date should be null");
-        assert!(found_row_nulls.is_null_at(12), "col_time should be null");
+        assert_eq!(
+            found_row_nulls.get_int(0).unwrap(),
+            pk_int_2,
+            "pk_int mismatch"
+        );
+        assert!(
+            found_row_nulls.is_null_at(1).unwrap(),
+            "col_boolean should be null"
+        );
         assert!(
-            found_row_nulls.is_null_at(13),
+            found_row_nulls.is_null_at(2).unwrap(),
+            "col_tinyint should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(3).unwrap(),
+            "col_smallint should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(4).unwrap(),
+            "col_int should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(5).unwrap(),
+            "col_bigint should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(6).unwrap(),
+            "col_float should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(7).unwrap(),
+            "col_double should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(8).unwrap(),
+            "col_char should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(9).unwrap(),
+            "col_string should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(10).unwrap(),
+            "col_decimal should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(11).unwrap(),
+            "col_date should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(12).unwrap(),
+            "col_time should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(13).unwrap(),
             "col_timestamp should be null"
         );
         assert!(
-            found_row_nulls.is_null_at(14),
+            found_row_nulls.is_null_at(14).unwrap(),
             "col_timestamp_ltz should be null"
         );
-        assert!(found_row_nulls.is_null_at(15), "col_bytes should be null");
-        assert!(found_row_nulls.is_null_at(16), "col_binary should be null");
+        assert!(
+            found_row_nulls.is_null_at(15).unwrap(),
+            "col_bytes should be null"
+        );
+        assert!(
+            found_row_nulls.is_null_at(16).unwrap(),
+            "col_binary should be null"
+        );
 
         admin
             .drop_table(&table_path, false)
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index eac72e5c78..779ffdd319 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -138,7 +138,10 @@ mod table_test {
                 .expect("Failed to poll records");
             for rec in scan_records {
                 let row = rec.row();
-                collected.push((row.get_int(0), row.get_string(1).to_string()));
+                collected.push((
+                    row.get_int(0).unwrap(),
+                    row.get_string(1).unwrap().to_string(),
+                ));
             }
         }
 
@@ -362,13 +365,13 @@ mod table_test {
             let row = record.row();
             // col_b is now at index 0, col_c is at index 1
             assert_eq!(
-                row.get_string(0),
+                row.get_string(0).unwrap(),
                 expected_col_b[i],
                 "col_b mismatch at index {}",
                 i
             );
             assert_eq!(
-                row.get_int(1),
+                row.get_int(1).unwrap(),
                 expected_col_c[i],
                 "col_c mismatch at index {}",
                 i
@@ -394,13 +397,13 @@ mod table_test {
             let row = record.row();
             // col_b is now at index 0, col_c is at index 1
             assert_eq!(
-                row.get_string(0),
+                row.get_string(0).unwrap(),
                 expected_col_b[i],
                 "col_b mismatch at index {}",
                 i
             );
             assert_eq!(
-                row.get_int(1),
+                row.get_int(1).unwrap(),
                 expected_col_a[i],
                 "col_c mismatch at index {}",
                 i
@@ -777,81 +780,103 @@ mod table_test {
         assert_eq!(records.len(), 2, "Expected 2 records");
 
         let found_row = records[0].row();
-        assert_eq!(found_row.get_byte(0), col_tinyint, "col_tinyint mismatch");
         assert_eq!(
-            found_row.get_short(1),
+            found_row.get_byte(0).unwrap(),
+            col_tinyint,
+            "col_tinyint mismatch"
+        );
+        assert_eq!(
+            found_row.get_short(1).unwrap(),
             col_smallint,
             "col_smallint mismatch"
         );
-        assert_eq!(found_row.get_int(2), col_int, "col_int mismatch");
-        assert_eq!(found_row.get_long(3), col_bigint, "col_bigint mismatch");
+        assert_eq!(found_row.get_int(2).unwrap(), col_int, "col_int mismatch");
+        assert_eq!(
+            found_row.get_long(3).unwrap(),
+            col_bigint,
+            "col_bigint mismatch"
+        );
         assert!(
-            (found_row.get_float(4) - col_float).abs() < f32::EPSILON,
+            (found_row.get_float(4).unwrap() - col_float).abs() < f32::EPSILON,
             "col_float mismatch: expected {}, got {}",
             col_float,
-            found_row.get_float(4)
+            found_row.get_float(4).unwrap()
         );
         assert!(
-            (found_row.get_double(5) - col_double).abs() < f64::EPSILON,
+            (found_row.get_double(5).unwrap() - col_double).abs() < f64::EPSILON,
             "col_double mismatch: expected {}, got {}",
             col_double,
-            found_row.get_double(5)
+            found_row.get_double(5).unwrap()
         );
         assert_eq!(
-            found_row.get_boolean(6),
+            found_row.get_boolean(6).unwrap(),
             col_boolean,
             "col_boolean mismatch"
         );
-        assert_eq!(found_row.get_char(7, 10), col_char, "col_char mismatch");
-        assert_eq!(found_row.get_string(8), col_string, "col_string mismatch");
         assert_eq!(
-            found_row.get_decimal(9, 10, 2),
+            found_row.get_char(7, 10).unwrap(),
+            col_char,
+            "col_char mismatch"
+        );
+        assert_eq!(
+            found_row.get_string(8).unwrap(),
+            col_string,
+            "col_string mismatch"
+        );
+        assert_eq!(
+            found_row.get_decimal(9, 10, 2).unwrap(),
             col_decimal,
             "col_decimal mismatch"
         );
         assert_eq!(
-            found_row.get_date(10).get_inner(),
+            found_row.get_date(10).unwrap().get_inner(),
             col_date.get_inner(),
             "col_date mismatch"
         );
 
         assert_eq!(
-            found_row.get_time(11).get_inner(),
+            found_row.get_time(11).unwrap().get_inner(),
             col_time_s.get_inner(),
             "col_time_s mismatch"
         );
 
         assert_eq!(
-            found_row.get_time(12).get_inner(),
+            found_row.get_time(12).unwrap().get_inner(),
             col_time_ms.get_inner(),
             "col_time_ms mismatch"
         );
 
         assert_eq!(
-            found_row.get_time(13).get_inner(),
+            found_row.get_time(13).unwrap().get_inner(),
             col_time_us.get_inner(),
             "col_time_us mismatch"
         );
 
         assert_eq!(
-            found_row.get_time(14).get_inner(),
+            found_row.get_time(14).unwrap().get_inner(),
             col_time_ns.get_inner(),
             "col_time_ns mismatch"
         );
 
         assert_eq!(
-            found_row.get_timestamp_ntz(15, 0).get_millisecond(),
+            found_row
+                .get_timestamp_ntz(15, 0)
+                .unwrap()
+                .get_millisecond(),
             col_timestamp_s.get_millisecond(),
             "col_timestamp_s mismatch"
         );
 
         assert_eq!(
-            found_row.get_timestamp_ntz(16, 3).get_millisecond(),
+            found_row
+                .get_timestamp_ntz(16, 3)
+                .unwrap()
+                .get_millisecond(),
             col_timestamp_ms.get_millisecond(),
             "col_timestamp_ms mismatch"
         );
 
-        let read_ts_us = found_row.get_timestamp_ntz(17, 6);
+        let read_ts_us = found_row.get_timestamp_ntz(17, 6).unwrap();
         assert_eq!(
             read_ts_us.get_millisecond(),
             col_timestamp_us.get_millisecond(),
@@ -863,7 +888,7 @@ mod table_test {
             "col_timestamp_us nanos mismatch"
         );
 
-        let read_ts_ns = found_row.get_timestamp_ntz(18, 9);
+        let read_ts_ns = found_row.get_timestamp_ntz(18, 9).unwrap();
         assert_eq!(
             read_ts_ns.get_millisecond(),
             col_timestamp_ns.get_millisecond(),
@@ -876,18 +901,24 @@ mod table_test {
         );
 
         assert_eq!(
-            found_row.get_timestamp_ltz(19, 0).get_epoch_millisecond(),
+            found_row
+                .get_timestamp_ltz(19, 0)
+                .unwrap()
+                .get_epoch_millisecond(),
             col_timestamp_ltz_s.get_epoch_millisecond(),
             "col_timestamp_ltz_s mismatch"
         );
 
         assert_eq!(
-            found_row.get_timestamp_ltz(20, 3).get_epoch_millisecond(),
+            found_row
+                .get_timestamp_ltz(20, 3)
+                .unwrap()
+                .get_epoch_millisecond(),
             col_timestamp_ltz_ms.get_epoch_millisecond(),
             "col_timestamp_ltz_ms mismatch"
         );
 
-        let read_ts_ltz_us = found_row.get_timestamp_ltz(21, 6);
+        let read_ts_ltz_us = found_row.get_timestamp_ltz(21, 6).unwrap();
         assert_eq!(
             read_ts_ltz_us.get_epoch_millisecond(),
             col_timestamp_ltz_us.get_epoch_millisecond(),
@@ -899,7 +930,7 @@ mod table_test {
             "col_timestamp_ltz_us nanos mismatch"
         );
 
-        let read_ts_ltz_ns = found_row.get_timestamp_ltz(22, 9);
+        let read_ts_ltz_ns = found_row.get_timestamp_ltz(22, 9).unwrap();
         assert_eq!(
             read_ts_ltz_ns.get_epoch_millisecond(),
             col_timestamp_ltz_ns.get_epoch_millisecond(),
@@ -910,15 +941,19 @@ mod table_test {
             col_timestamp_ltz_ns.get_nano_of_millisecond(),
             "col_timestamp_ltz_ns nanos mismatch"
         );
-        assert_eq!(found_row.get_bytes(23), col_bytes, "col_bytes mismatch");
         assert_eq!(
-            found_row.get_binary(24, 4),
+            found_row.get_bytes(23).unwrap(),
+            col_bytes,
+            "col_bytes mismatch"
+        );
+        assert_eq!(
+            found_row.get_binary(24, 4).unwrap(),
             col_binary,
             "col_binary mismatch"
         );
 
         // Verify timestamps before Unix epoch (negative timestamps)
-        let read_ts_us_neg = found_row.get_timestamp_ntz(25, 6);
+        let read_ts_us_neg = found_row.get_timestamp_ntz(25, 6).unwrap();
         assert_eq!(
             read_ts_us_neg.get_millisecond(),
             col_timestamp_us_neg.get_millisecond(),
@@ -930,7 +965,7 @@ mod table_test {
             "col_timestamp_us_neg nanos mismatch"
         );
 
-        let read_ts_ns_neg = found_row.get_timestamp_ntz(26, 9);
+        let read_ts_ns_neg = found_row.get_timestamp_ntz(26, 9).unwrap();
         assert_eq!(
             read_ts_ns_neg.get_millisecond(),
             col_timestamp_ns_neg.get_millisecond(),
@@ -942,7 +977,7 @@ mod table_test {
             "col_timestamp_ns_neg nanos mismatch"
         );
 
-        let read_ts_ltz_us_neg = found_row.get_timestamp_ltz(27, 6);
+        let read_ts_ltz_us_neg = found_row.get_timestamp_ltz(27, 6).unwrap();
         assert_eq!(
             read_ts_ltz_us_neg.get_epoch_millisecond(),
             col_timestamp_ltz_us_neg.get_epoch_millisecond(),
@@ -954,7 +989,7 @@ mod table_test {
             "col_timestamp_ltz_us_neg nanos mismatch"
         );
 
-        let read_ts_ltz_ns_neg = found_row.get_timestamp_ltz(28, 9);
+        let read_ts_ltz_ns_neg = found_row.get_timestamp_ltz(28, 9).unwrap();
         assert_eq!(
             read_ts_ltz_ns_neg.get_epoch_millisecond(),
             col_timestamp_ltz_ns_neg.get_epoch_millisecond(),
@@ -969,7 +1004,11 @@ mod table_test {
         // Verify row with all nulls (record index 1)
         let found_row_nulls = records[1].row();
         for i in 0..field_count {
-            assert!(found_row_nulls.is_null_at(i), "column {} should be null", i);
+            assert!(
+                found_row_nulls.is_null_at(i).unwrap(),
+                "column {} should be null",
+                i
+            );
         }
 
         admin
@@ -1140,9 +1179,9 @@ mod table_test {
             for rec in records {
                 let row = rec.row();
                 collected_records.push((
-                    row.get_int(0),
-                    row.get_string(1).to_string(),
-                    row.get_long(2),
+                    row.get_int(0).unwrap(),
+                    row.get_string(1).unwrap().to_string(),
+                    row.get_long(2).unwrap(),
                 ));
             }
         }
@@ -1196,9 +1235,9 @@ mod table_test {
             for rec in records {
                 let row = rec.row();
                 records_after_unsubscribe.push((
-                    row.get_int(0),
-                    row.get_string(1).to_string(),
-                    row.get_long(2),
+                    row.get_int(0).unwrap(),
+                    row.get_string(1).unwrap().to_string(),
+                    row.get_long(2).unwrap(),
                 ));
             }
         }
@@ -1248,9 +1287,9 @@ mod table_test {
             for rec in records {
                 let row = rec.row();
                 batch_collected.push((
-                    row.get_int(0),
-                    row.get_string(1).to_string(),
-                    row.get_long(2),
+                    row.get_int(0).unwrap(),
+                    row.get_string(1).unwrap().to_string(),
+                    row.get_long(2).unwrap(),
                 ));
             }
         }
@@ -1272,4 +1311,73 @@ mod table_test {
             .await
             .expect("Failed to drop table");
     }
+
+    #[tokio::test]
+    async fn undersized_row_returns_error() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().await.expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_log_undersized_row");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("col_bool", DataTypes::boolean())
+                    .column("col_int", DataTypes::int())
+                    .column("col_string", DataTypes::string())
+                    .column("col_bigint", DataTypes::bigint())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create table append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        // Undersized row: a GenericRow with only 2 fields appended to the 4-column table
+        let mut row = fluss::row::GenericRow::new(2);
+        row.set_field(0, true);
+        row.set_field(1, 42_i32);
+
+        let result = append_writer.append(&row);
+        assert!(result.is_err(), "Undersized row should be rejected");
+        let err_msg = result.unwrap_err().to_string();
+        assert!(
+            err_msg.contains("Expected: 4") && err_msg.contains("Actual: 2"),
+            "Error should mention field count mismatch, got: {err_msg}"
+        );
+
+        // Correct column count but wrong types:
+        // Schema is (Boolean, Int, String, BigInt) but we put Int64 where String is expected.
+        // append() must report this as an Err instead of panicking.
+        let row_wrong_types = fluss::row::GenericRow::from_data(vec![
+            fluss::row::Datum::Bool(true),
+            fluss::row::Datum::Int32(42),
+            fluss::row::Datum::Int64(999), // wrong: String column
+            fluss::row::Datum::Int64(100),
+        ]);
+
+        let result = append_writer.append(&row_wrong_types);
+        assert!(
+            result.is_err(),
+            "Row with mismatched types should be rejected, not panic"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index 210dfc4e5f..fcd67738ab 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -192,8 +192,18 @@ mod table_remote_scan_test {
             let row = record.row();
             let expected_c1 = i as i32;
             let expected_c2 = format!("v{}", i);
-            assert_eq!(row.get_int(1), expected_c1, "c1 mismatch at index {}", i);
-            assert_eq!(row.get_string(0), expected_c2, "c2 mismatch at index {}", i);
+            assert_eq!(
+                row.get_int(1).unwrap(),
+                expected_c1,
+                "c1 mismatch at index {}",
+                i
+            );
+            assert_eq!(
+                row.get_string(0).unwrap(),
+                expected_c2,
+                "c2 mismatch at index {}",
+                i
+            );
         }
     }
 

From 7eb86a70dbb298b904a3874f655d36236ed6868d Mon Sep 17 00:00:00 2001
From: Prajwal banakar <prajwal.banakara@gmail.com>
Date: Fri, 27 Feb 2026 09:28:50 +0530
Subject: [PATCH 170/287] chore: make batch timeout configurable (#371)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |  1 +
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |  1 +
 fluss-rust/bindings/cpp/src/lib.rs            |  2 ++
 fluss-rust/bindings/python/src/config.rs      | 17 +++++++++++++++++
 .../fluss/src/client/write/accumulator.rs     |  3 ++-
 fluss-rust/crates/fluss/src/config.rs         |  7 +++++++
 .../user-guide/cpp/example/configuration.md   |  1 +
 .../python/example/configuration.md           | 19 ++++++++++---------
 .../user-guide/rust/example/configuration.md  |  1 +
 9 files changed, 42 insertions(+), 10 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index f17cafc1aa..0f980b7316 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -987,6 +987,7 @@ struct Configuration {
     size_t remote_file_download_thread_num{3};
     // Maximum number of records returned in a single call to Poll() for LogScanner
     size_t scanner_log_max_poll_records{500};
+    int64_t writer_batch_timeout_ms{100};
 };
 
 class Connection {
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index a2e7fa2616..e37634350c 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -55,6 +55,7 @@ inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi_config.scanner_remote_log_prefetch_num = config.scanner_remote_log_prefetch_num;
     ffi_config.remote_file_download_thread_num = config.remote_file_download_thread_num;
     ffi_config.scanner_log_max_poll_records = config.scanner_log_max_poll_records;
+    ffi_config.writer_batch_timeout_ms = config.writer_batch_timeout_ms;
     return ffi_config;
 }
 
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 32dbf7d030..ea1307e2d8 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -47,6 +47,7 @@ mod ffi {
         scanner_remote_log_prefetch_num: usize,
         remote_file_download_thread_num: usize,
         scanner_log_max_poll_records: usize,
+        writer_batch_timeout_ms: i64,
     }
 
     struct FfiResult {
@@ -623,6 +624,7 @@ fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
         writer_acks: config.writer_acks.to_string(),
         writer_retries: config.writer_retries,
         writer_batch_size: config.writer_batch_size,
+        writer_batch_timeout_ms: config.writer_batch_timeout_ms,
         writer_bucket_no_key_assigner: assigner_type,
         scanner_remote_log_prefetch_num: config.scanner_remote_log_prefetch_num,
         remote_file_download_thread_num: config.remote_file_download_thread_num,
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index 75056a5226..5b7f2d37cd 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -60,6 +60,11 @@ impl Config {
                             FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
                         })?;
                     }
+                    "writer.batch-timeout-ms" => {
+                        config.writer_batch_timeout_ms = value.parse::<i64>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
+                        })?;
+                    }
                     "scanner.remote-log.prefetch-num" => {
                         config.scanner_remote_log_prefetch_num =
                             value.parse::<usize>().map_err(|e| {
@@ -200,6 +205,18 @@ impl Config {
     fn set_scanner_log_max_poll_records(&mut self, num: usize) {
         self.inner.scanner_log_max_poll_records = num;
     }
+
+    /// Get the writer batch timeout in milliseconds (the `writer.batch-timeout-ms` option)
+    #[getter]
+    fn writer_batch_timeout_ms(&self) -> i64 {
+        self.inner.writer_batch_timeout_ms
+    }
+
+    /// Set the writer batch timeout in milliseconds (the `writer.batch-timeout-ms` option)
+    #[setter]
+    fn set_writer_batch_timeout_ms(&mut self, timeout: i64) {
+        self.inner.writer_batch_timeout_ms = timeout;
+    }
 }
 
 impl Config {
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 2c36452470..0cf501cb45 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -50,11 +50,12 @@ pub struct RecordAccumulator {
 
 impl RecordAccumulator {
     pub fn new(config: Config) -> Self {
+        let batch_timeout_ms = config.writer_batch_timeout_ms;
         RecordAccumulator {
             config,
             write_batches: Default::default(),
             incomplete_batches: Default::default(),
-            batch_timeout_ms: 500,
+            batch_timeout_ms,
             closed: Default::default(),
             flushes_in_progress: Default::default(),
             appends_in_progress: Default::default(),
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 6ff4327f46..302649327c 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -26,6 +26,7 @@ const DEFAULT_RETRIES: i32 = i32::MAX;
 const DEFAULT_PREFETCH_NUM: usize = 4;
 const DEFAULT_DOWNLOAD_THREADS: usize = 3;
 const DEFAULT_MAX_POLL_RECORDS: usize = 500;
+const DEFAULT_WRITER_BATCH_TIMEOUT_MS: i64 = 100;
 
 const DEFAULT_ACKS: &str = "all";
 
@@ -84,6 +85,11 @@ pub struct Config {
     /// Default: 500 (matching Java CLIENT_SCANNER_LOG_MAX_POLL_RECORDS)
     #[arg(long, default_value_t = DEFAULT_MAX_POLL_RECORDS)]
     pub scanner_log_max_poll_records: usize,
+
+    /// The maximum time to wait for a batch to be completed in milliseconds.
+    /// Default: 100 (matching Java CLIENT_WRITER_BATCH_TIMEOUT)
+    #[arg(long, default_value_t = DEFAULT_WRITER_BATCH_TIMEOUT_MS)]
+    pub writer_batch_timeout_ms: i64,
 }
 
 impl Default for Config {
@@ -98,6 +104,7 @@ impl Default for Config {
             scanner_remote_log_prefetch_num: DEFAULT_PREFETCH_NUM,
             remote_file_download_thread_num: DEFAULT_DOWNLOAD_THREADS,
             scanner_log_max_poll_records: DEFAULT_MAX_POLL_RECORDS,
+            writer_batch_timeout_ms: DEFAULT_WRITER_BATCH_TIMEOUT_MS,
         }
     }
 }
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
index 715e3c63fd..d73661aea1 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
@@ -30,6 +30,7 @@ config.writer_request_max_size = 10 * 1024 * 1024;     // Max request size (10 M
 config.writer_acks = "all";                      // Wait for all replicas
 config.writer_retries = std::numeric_limits<int32_t>::max();  // Retry on failure
 config.writer_batch_size = 2 * 1024 * 1024;     // Batch size (2 MB)
+config.writer_batch_timeout_ms = 100;           // Max time to wait for a batch to fill
 config.writer_bucket_no_key_assigner = "sticky"; // "sticky" or "round_robin"
 config.scanner_remote_log_prefetch_num = 4;      // Remote log prefetch count
 config.remote_file_download_thread_num = 3;  // Download threads
diff --git a/fluss-rust/website/docs/user-guide/python/example/configuration.md b/fluss-rust/website/docs/user-guide/python/example/configuration.md
index 466bf0dd38..71e71994ea 100644
--- a/fluss-rust/website/docs/user-guide/python/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/python/example/configuration.md
@@ -23,15 +23,16 @@ with await fluss.FlussConnection.create(config) as conn:
 
 | Key                                | Description                                                                          | Default            |
 |------------------------------------|--------------------------------------------------------------------------------------|--------------------|
-| `bootstrap.servers`               | Coordinator server address                                                            | `127.0.0.1:9123`   |
-| `writer.request-max-size`         | Maximum request size in bytes                                                         | `10485760` (10 MB) |
-| `writer.acks`                     | Acknowledgment setting (`all` waits for all replicas)                                 | `all`              |
-| `writer.retries`                  | Number of retries on failure                                                          | `2147483647`       |
-| `writer.batch-size`               | Batch size for writes in bytes                                                        | `2097152` (2 MB)   |
-| `writer.bucket.no-key-assigner`   | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin`  | `sticky`           |
-| `scanner.remote-log.prefetch-num` | Number of remote log segments to prefetch                                             | `4`                |
-| `remote-file.download-thread-num` | Number of threads for remote log downloads                                            | `3`                |
-| `scanner.log.max-poll-records`    | Max records returned in a single poll()                                               | `500`              |
+| `bootstrap.servers`               | Coordinator server address                                                           | `127.0.0.1:9123`   |
+| `writer.request-max-size`         | Maximum request size in bytes                                                        | `10485760` (10 MB) |
+| `writer.acks`                     | Acknowledgment setting (`all` waits for all replicas)                                | `all`              |
+| `writer.retries`                  | Number of retries on failure                                                         | `2147483647`       |
+| `writer.batch-size`               | Batch size for writes in bytes                                                       | `2097152` (2 MB)   |
+| `writer.bucket.no-key-assigner`   | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`           |
+| `scanner.remote-log.prefetch-num` | Number of remote log segments to prefetch                                            | `4`                |
+| `remote-file.download-thread-num` | Number of threads for remote log downloads                                           | `3`                |
+| `scanner.log.max-poll-records`    | Max records returned in a single poll()                                              | `500`              |
+| `writer.batch-timeout-ms`         | The maximum time to wait for a writer batch to fill up before sending.               | `100`              |
 
 Remember to close the connection when done:
 
diff --git a/fluss-rust/website/docs/user-guide/rust/example/configuration.md b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
index 92b9bf2f1d..7d7cc9397b 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
@@ -25,3 +25,4 @@ let conn = FlussConnection::new(config).await?;
 | `writer_retries`                | Number of retries on failure                                                         | `i32::MAX`       |
 | `writer_batch_size`             | Batch size for writes                                                                | 2 MB             |
 | `writer_bucket_no_key_assigner` | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`         |
+| `writer_batch_timeout_ms`       | The maximum time to wait for a writer batch to fill up before sending.               | `100`            |

From bb5bdf39fb6eee4288b3cb8dd7cc46faab96e5ca Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Fri, 27 Feb 2026 22:16:55 +0800
Subject: [PATCH 171/287] perf: introduce streaming download for file download
 (#381)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |   2 +
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |   1 +
 fluss-rust/bindings/cpp/src/lib.rs            |   6 +-
 fluss-rust/bindings/python/fluss/__init__.pyi |   4 +
 fluss-rust/bindings/python/src/config.rs      |  20 ++++
 .../fluss/src/client/table/remote_log.rs      | 103 +++++++++++-------
 .../crates/fluss/src/client/table/scanner.rs  |   1 +
 fluss-rust/crates/fluss/src/config.rs         |   7 ++
 .../user-guide/cpp/example/configuration.md   |   2 +
 .../python/example/configuration.md           |  25 +++--
 .../user-guide/rust/example/configuration.md  |   6 +-
 11 files changed, 121 insertions(+), 56 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 0f980b7316..0a62af9151 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -985,6 +985,8 @@ struct Configuration {
     size_t scanner_remote_log_prefetch_num{4};
     // Number of threads for downloading remote log data
     size_t remote_file_download_thread_num{3};
+    // Remote log read concurrency within one file (streaming read path)
+    size_t scanner_remote_log_read_concurrency{4};
     // Maximum number of records returned in a single call to Poll() for LogScanner
     size_t scanner_log_max_poll_records{500};
     int64_t writer_batch_timeout_ms{100};
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index e37634350c..9020027731 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -54,6 +54,7 @@ inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi_config.writer_bucket_no_key_assigner = rust::String(config.writer_bucket_no_key_assigner);
     ffi_config.scanner_remote_log_prefetch_num = config.scanner_remote_log_prefetch_num;
     ffi_config.remote_file_download_thread_num = config.remote_file_download_thread_num;
+    ffi_config.scanner_remote_log_read_concurrency = config.scanner_remote_log_read_concurrency;
     ffi_config.scanner_log_max_poll_records = config.scanner_log_max_poll_records;
     ffi_config.writer_batch_timeout_ms = config.writer_batch_timeout_ms;
     return ffi_config;
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index ea1307e2d8..9b01d32218 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -46,6 +46,7 @@ mod ffi {
         writer_bucket_no_key_assigner: String,
         scanner_remote_log_prefetch_num: usize,
         remote_file_download_thread_num: usize,
+        scanner_remote_log_read_concurrency: usize,
         scanner_log_max_poll_records: usize,
         writer_batch_timeout_ms: i64,
     }
@@ -618,7 +619,7 @@ fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
             ));
         }
     };
-    let config = fluss::config::Config {
+    let config_core = fluss::config::Config {
         bootstrap_servers: config.bootstrap_servers.to_string(),
         writer_request_max_size: config.writer_request_max_size,
         writer_acks: config.writer_acks.to_string(),
@@ -628,10 +629,11 @@ fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
         writer_bucket_no_key_assigner: assigner_type,
         scanner_remote_log_prefetch_num: config.scanner_remote_log_prefetch_num,
         remote_file_download_thread_num: config.remote_file_download_thread_num,
+        scanner_remote_log_read_concurrency: config.scanner_remote_log_read_concurrency,
         scanner_log_max_poll_records: config.scanner_log_max_poll_records,
     };
 
-    let conn = RUNTIME.block_on(async { fcore::client::FlussConnection::new(config).await });
+    let conn = RUNTIME.block_on(async { fcore::client::FlussConnection::new(config_core).await });
 
     match conn {
         Ok(c) => {
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 6f9ae0b35d..514d011ac7 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -162,6 +162,10 @@ class Config:
     @remote_file_download_thread_num.setter
     def remote_file_download_thread_num(self, num: int) -> None: ...
     @property
+    def scanner_remote_log_read_concurrency(self) -> int: ...
+    @scanner_remote_log_read_concurrency.setter
+    def scanner_remote_log_read_concurrency(self, num: int) -> None: ...
+    @property
     def scanner_log_max_poll_records(self) -> int: ...
     @scanner_log_max_poll_records.setter
     def scanner_log_max_poll_records(self, num: int) -> None: ...
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index 5b7f2d37cd..9c0059e098 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -81,6 +81,14 @@ impl Config {
                                 ))
                             })?;
                     }
+                    "scanner.remote-log.read-concurrency" => {
+                        config.scanner_remote_log_read_concurrency =
+                            value.parse::<usize>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
+                    }
                     "scanner.log.max-poll-records" => {
                         config.scanner_log_max_poll_records =
                             value.parse::<usize>().map_err(|e| {
@@ -194,6 +202,18 @@ impl Config {
         self.inner.remote_file_download_thread_num = num;
     }
 
+    /// Get the scanner remote log read concurrency
+    #[getter]
+    fn scanner_remote_log_read_concurrency(&self) -> usize {
+        self.inner.scanner_remote_log_read_concurrency
+    }
+
+    /// Set the scanner remote log read concurrency
+    #[setter]
+    fn set_scanner_remote_log_read_concurrency(&mut self, num: usize) {
+        self.inner.scanner_remote_log_read_concurrency = num;
+    }
+
     /// Get the scanner log max poll records
     #[getter]
     fn scanner_log_max_poll_records(&self) -> usize {
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index 02820d93c3..6bc955125f 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -19,9 +19,10 @@ use crate::error::{Error, Result};
 use crate::io::{FileIO, Storage};
 use crate::metadata::TableBucket;
 use crate::proto::{PbRemoteLogFetchInfo, PbRemoteLogSegment};
+use futures::TryStreamExt;
 use parking_lot::Mutex;
 use std::{
-    cmp::{Ordering, Reverse, min},
+    cmp::{Ordering, Reverse},
     collections::{BinaryHeap, HashMap},
     future::Future,
     io, mem,
@@ -293,6 +294,7 @@ enum DownloadResult {
 struct ProductionFetcher {
     credentials_rx: CredentialsReceiver,
     local_log_dir: Arc<TempDir>,
+    remote_log_read_concurrency: usize,
 }
 
 impl RemoteLogFetcher for ProductionFetcher {
@@ -302,6 +304,7 @@ impl RemoteLogFetcher for ProductionFetcher {
     ) -> Pin<Box<dyn Future<Output = Result<FetchResult>> + Send>> {
         let mut credentials_rx = self.credentials_rx.clone();
         let local_log_dir = self.local_log_dir.clone();
+        let remote_log_read_concurrency = self.remote_log_read_concurrency;
 
         // Clone data needed for async operation to avoid lifetime issues
         let segment = request.segment.clone();
@@ -361,6 +364,7 @@ impl RemoteLogFetcher for ProductionFetcher {
                 &remote_path,
                 &local_file_path,
                 &remote_fs_props,
+                remote_log_read_concurrency,
             )
             .await?;
 
@@ -768,11 +772,13 @@ impl RemoteLogDownloader {
         local_log_dir: TempDir,
         max_prefetch_segments: usize,
         max_concurrent_downloads: usize,
+        remote_log_read_concurrency: usize,
         credentials_rx: CredentialsReceiver,
     ) -> Result<Self> {
         let fetcher = Arc::new(ProductionFetcher {
             credentials_rx,
             local_log_dir: Arc::new(local_log_dir),
+            remote_log_read_concurrency: remote_log_read_concurrency.max(1),
         });
 
         Self::new_with_fetcher(fetcher, max_prefetch_segments, max_concurrent_downloads)
@@ -848,12 +854,13 @@ impl Drop for RemoteLogDownloader {
 }
 
 impl RemoteLogDownloader {
-    /// Download a file from remote storage to local using streaming read/write
+    /// Download a file from remote storage to local using streaming read/write.
     async fn download_file(
         remote_log_tablet_dir: &str,
         remote_path: &str,
         local_path: &Path,
         remote_fs_props: &HashMap<String, String>,
+        remote_log_read_concurrency: usize,
     ) -> Result<PathBuf> {
         // Handle both URL (e.g., "s3://bucket/path") and local file paths
         // If the path doesn't contain "://", treat it as a local file path
@@ -886,56 +893,70 @@ impl RemoteLogDownloader {
 
         // Timeout for remote storage operations (30 seconds)
         const REMOTE_OP_TIMEOUT: Duration = Duration::from_secs(30);
+        const CHUNK_SIZE: usize = 8 * 1024 * 1024; // 8MiB
+
+        Self::download_file_streaming(
+            &op,
+            relative_path,
+            remote_path,
+            local_path,
+            CHUNK_SIZE,
+            remote_log_read_concurrency,
+            REMOTE_OP_TIMEOUT,
+        )
+        .await?;
 
-        // Get file metadata to know the size with timeout
-        let meta = op.stat(relative_path).await?;
-        let file_size = meta.content_length();
+        Ok(local_path.to_path_buf())
+    }
 
-        // Create local file for writing
+    async fn download_file_streaming(
+        op: &opendal::Operator,
+        relative_path: &str,
+        remote_path: &str,
+        local_path: &Path,
+        chunk_size: usize,
+        streaming_read_concurrency: usize,
+        remote_op_timeout: Duration,
+    ) -> Result<()> {
         let mut local_file = tokio::fs::File::create(local_path).await?;
 
-        // Stream data from remote to local file in chunks
-        // opendal::Reader::read accepts a range, so we read in chunks
-        const CHUNK_SIZE: u64 = 8 * 1024 * 1024; // 8MB chunks for efficient reading
-        let mut offset = 0u64;
-        let mut chunk_count = 0u64;
-        let total_chunks = file_size.div_ceil(CHUNK_SIZE);
+        let reader_future = op
+            .reader_with(relative_path)
+            .chunk(chunk_size)
+            .concurrent(streaming_read_concurrency);
+        let reader = tokio::time::timeout(remote_op_timeout, reader_future)
+            .await
+            .map_err(|e| Error::IoUnexpectedError {
+                message: format!("Timeout creating streaming reader for {remote_path}: {e}."),
+                source: io::ErrorKind::TimedOut.into(),
+            })??;
+
+        let mut stream = tokio::time::timeout(remote_op_timeout, reader.into_bytes_stream(..))
+            .await
+            .map_err(|e| Error::IoUnexpectedError {
+                message: format!("Timeout creating streaming bytes stream for {remote_path}: {e}."),
+                source: io::ErrorKind::TimedOut.into(),
+            })??;
 
-        while offset < file_size {
-            let end = min(offset + CHUNK_SIZE, file_size);
-            let range = offset..end;
+        let mut chunk_count = 0u64;
+        while let Some(chunk) = tokio::time::timeout(remote_op_timeout, stream.try_next())
+            .await
+            .map_err(|e| Error::IoUnexpectedError {
+                message: format!(
+                    "Timeout streaming chunk from remote storage: {remote_path}, exception: {e}."
+                ),
+                source: io::ErrorKind::TimedOut.into(),
+            })??
+        {
             chunk_count += 1;
-
             if chunk_count <= 3 || chunk_count % 10 == 0 {
-                log::debug!(
-                    "Remote log download: reading chunk {chunk_count}/{total_chunks} (offset {offset})"
-                );
+                log::debug!("Remote log streaming download: chunk #{chunk_count} ({remote_path})");
             }
-
-            // Read chunk from remote storage with timeout
-            let read_future = op.read_with(relative_path).range(range.clone());
-            let chunk = tokio::time::timeout(REMOTE_OP_TIMEOUT, read_future)
-                .await
-                .map_err(|e| {
-                    Error::IoUnexpectedError {
-                        message: format!(
-                            "Timeout reading chunk from remote storage: {remote_path} at offset {offset}, exception: {e}."
-                        ),
-                        source: io::ErrorKind::TimedOut.into(),
-                    }
-                })??;
-            let bytes = chunk.to_bytes();
-
-            // Write chunk to local file
-            local_file.write_all(&bytes).await?;
-
-            offset = end;
+            local_file.write_all(&chunk).await?;
         }
 
-        // Ensure all data is flushed to disk
         local_file.sync_all().await?;
-
-        Ok(local_path.to_path_buf())
+        Ok(())
     }
 }
 
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 3ec9106d66..e837ba76c3 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -677,6 +677,7 @@ impl LogFetcher {
             tmp_dir,
             config.scanner_remote_log_prefetch_num,
             config.remote_file_download_thread_num,
+            config.scanner_remote_log_read_concurrency,
             credentials_rx,
         )?);
 
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 302649327c..a0d7e70716 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -25,6 +25,7 @@ const DEFAULT_WRITER_BATCH_SIZE: i32 = 2 * 1024 * 1024;
 const DEFAULT_RETRIES: i32 = i32::MAX;
 const DEFAULT_PREFETCH_NUM: usize = 4;
 const DEFAULT_DOWNLOAD_THREADS: usize = 3;
+const DEFAULT_SCANNER_REMOTE_LOG_READ_CONCURRENCY: usize = 4;
 const DEFAULT_MAX_POLL_RECORDS: usize = 500;
 const DEFAULT_WRITER_BATCH_TIMEOUT_MS: i64 = 100;
 
@@ -81,6 +82,11 @@ pub struct Config {
     #[arg(long, default_value_t = DEFAULT_DOWNLOAD_THREADS)]
     pub remote_file_download_thread_num: usize,
 
+    /// Intra-file remote log read concurrency for each remote segment download.
+    /// Download path always uses streaming reader.
+    #[arg(long, default_value_t = DEFAULT_SCANNER_REMOTE_LOG_READ_CONCURRENCY)]
+    pub scanner_remote_log_read_concurrency: usize,
+
     /// Maximum number of records returned in a single call to poll() for LogScanner.
     /// Default: 500 (matching Java CLIENT_SCANNER_LOG_MAX_POLL_RECORDS)
     #[arg(long, default_value_t = DEFAULT_MAX_POLL_RECORDS)]
@@ -103,6 +109,7 @@ impl Default for Config {
             writer_bucket_no_key_assigner: NoKeyAssigner::Sticky,
             scanner_remote_log_prefetch_num: DEFAULT_PREFETCH_NUM,
             remote_file_download_thread_num: DEFAULT_DOWNLOAD_THREADS,
+            scanner_remote_log_read_concurrency: DEFAULT_SCANNER_REMOTE_LOG_READ_CONCURRENCY,
             scanner_log_max_poll_records: DEFAULT_MAX_POLL_RECORDS,
             writer_batch_timeout_ms: DEFAULT_WRITER_BATCH_TIMEOUT_MS,
         }
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
index d73661aea1..2245ee1bf1 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
@@ -34,4 +34,6 @@ config.writer_batch_timeout_ms = 100;           // Max time to wait for a batch
 config.writer_bucket_no_key_assigner = "sticky"; // "sticky" or "round_robin"
 config.scanner_remote_log_prefetch_num = 4;      // Remote log prefetch count
 config.remote_file_download_thread_num = 3;  // Download threads
+config.scanner_remote_log_read_concurrency = 4;   // In-file remote log read concurrency
+config.scanner_log_max_poll_records = 500;        // Max records returned per poll()
 ```
diff --git a/fluss-rust/website/docs/user-guide/python/example/configuration.md b/fluss-rust/website/docs/user-guide/python/example/configuration.md
index 71e71994ea..39c53be4ea 100644
--- a/fluss-rust/website/docs/user-guide/python/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/python/example/configuration.md
@@ -21,18 +21,19 @@ with await fluss.FlussConnection.create(config) as conn:
 
 ## Connection Configurations
 
-| Key                                | Description                                                                          | Default            |
-|------------------------------------|--------------------------------------------------------------------------------------|--------------------|
-| `bootstrap.servers`               | Coordinator server address                                                           | `127.0.0.1:9123`   |
-| `writer.request-max-size`         | Maximum request size in bytes                                                        | `10485760` (10 MB) |
-| `writer.acks`                     | Acknowledgment setting (`all` waits for all replicas)                                | `all`              |
-| `writer.retries`                  | Number of retries on failure                                                         | `2147483647`       |
-| `writer.batch-size`               | Batch size for writes in bytes                                                       | `2097152` (2 MB)   |
-| `writer.bucket.no-key-assigner`   | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`           |
-| `scanner.remote-log.prefetch-num` | Number of remote log segments to prefetch                                            | `4`                |
-| `remote-file.download-thread-num` | Number of threads for remote log downloads                                           | `3`                |
-| `scanner.log.max-poll-records`    | Max records returned in a single poll()                                              | `500`              |
-| `writer.batch-timeout-ms`         | The maximum time to wait for a writer batch to fill up before sending.               | `100`              |
+| Key                                   | Description                                                                           | Default            |
+|---------------------------------------|---------------------------------------------------------------------------------------|--------------------|
+| `bootstrap.servers`                   | Coordinator server address                                                            | `127.0.0.1:9123`   |
+| `writer.request-max-size`             | Maximum request size in bytes                                                         | `10485760` (10 MB) |
+| `writer.acks`                         | Acknowledgment setting (`all` waits for all replicas)                                 | `all`              |
+| `writer.retries`                      | Number of retries on failure                                                          | `2147483647`       |
+| `writer.batch-size`                   | Batch size for writes in bytes                                                        | `2097152` (2 MB)   |
+| `writer.batch-timeout-ms`             | The maximum time to wait for a writer batch to fill up before sending.               | `100`              |
+| `writer.bucket.no-key-assigner`       | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`           |
+| `scanner.remote-log.prefetch-num`     | Number of remote log segments to prefetch                                             | `4`                |
+| `remote-file.download-thread-num`     | Number of threads for remote log downloads                                            | `3`                |
+| `scanner.remote-log.read-concurrency` | Streaming read concurrency within a remote log file                                   | `4`                |
+| `scanner.log.max-poll-records`        | Max records returned in a single poll()                                               | `500`              |
 
 Remember to close the connection when done:
 
diff --git a/fluss-rust/website/docs/user-guide/rust/example/configuration.md b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
index 7d7cc9397b..a2f52dc1f0 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
@@ -24,5 +24,9 @@ let conn = FlussConnection::new(config).await?;
 | `writer_acks`                   | Acknowledgment setting (`all` waits for all replicas)                                | `all`            |
 | `writer_retries`                | Number of retries on failure                                                         | `i32::MAX`       |
 | `writer_batch_size`             | Batch size for writes                                                                | 2 MB             |
-| `writer_bucket_no_key_assigner` | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`         |
 | `writer_batch_timeout_ms`       | The maximum time to wait for a writer batch to fill up before sending.               | `100`            |
+| `writer_bucket_no_key_assigner` | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`         |
+| `scanner_remote_log_prefetch_num` | Number of remote log segments to prefetch                                           | `4`              |
+| `remote_file_download_thread_num` | Number of concurrent remote log file downloads                                      | `3`              |
+| `scanner_remote_log_read_concurrency` | Streaming read concurrency within a remote log file                           | `4`              |
+| `scanner_log_max_poll_records`  | Maximum records returned in a single `poll()`                                       | `500`            |

From 39bc2094aa6f6c59de0f22b030e0ad52796df7cf Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sat, 28 Feb 2026 05:11:59 +0100
Subject: [PATCH 172/287] feat: Add get_server_nodes to Admin (#363)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |  10 ++
 fluss-rust/bindings/cpp/src/admin.cpp         |  18 +++
 fluss-rust/bindings/cpp/src/lib.rs            |  41 +++++++
 fluss-rust/bindings/cpp/test/test_admin.cpp   |  25 ++++
 fluss-rust/bindings/python/fluss/__init__.pyi |  32 +++++
 fluss-rust/bindings/python/src/admin.rs       |  81 +++++++++++++
 fluss-rust/bindings/python/src/lib.rs         |   1 +
 fluss-rust/bindings/python/test/test_admin.py |  17 +++
 fluss-rust/crates/fluss/src/client/admin.rs   |   8 ++
 .../crates/fluss/src/client/metadata.rs       |   2 +-
 .../crates/fluss/src/cluster/cluster.rs       | 112 ++++++++++++++++++
 fluss-rust/crates/fluss/src/cluster/mod.rs    |  24 +++-
 fluss-rust/crates/fluss/src/lib.rs            |   1 +
 .../crates/fluss/src/rpc/server_connection.rs |   2 +-
 .../crates/fluss/tests/integration/admin.rs   |  43 +++++++
 .../docs/user-guide/cpp/api-reference.md      |  16 +++
 .../docs/user-guide/python/api-reference.md   |  11 ++
 .../docs/user-guide/rust/api-reference.md     |  16 +++
 18 files changed, 457 insertions(+), 3 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 0a62af9151..cb060282f4 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -881,6 +881,14 @@ struct PartitionInfo {
     std::string partition_name;
 };
 
+struct ServerNode {
+    int32_t id;
+    std::string host;
+    uint32_t port;
+    std::string server_type;
+    std::string uid;
+};
+
 /// Descriptor for create_database (optional). Leave comment and properties empty for default.
 struct DatabaseDescriptor {
     std::string comment;
@@ -1073,6 +1081,8 @@ class Admin {
 
     Result TableExists(const TablePath& table_path, bool& out);
 
+    Result GetServerNodes(std::vector<ServerNode>& out);
+
    private:
     Result DoListOffsets(const TablePath& table_path, const std::vector<int32_t>& bucket_ids,
                          const OffsetSpec& offset_spec, std::unordered_map<int32_t, int64_t>& out,
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index 8deb182dcd..49300c156b 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -346,4 +346,22 @@ Result Admin::TableExists(const TablePath& table_path, bool& out) {
     return result;
 }
 
+Result Admin::GetServerNodes(std::vector<ServerNode>& out) {
+    if (!Available()) {
+        return utils::make_client_error("Admin not available");
+    }
+
+    auto ffi_result = admin_->get_server_nodes();
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out.clear();
+        out.reserve(ffi_result.server_nodes.size());
+        for (const auto& node : ffi_result.server_nodes) {
+            out.push_back({node.node_id, std::string(node.host), node.port,
+                           std::string(node.server_type), std::string(node.uid)});
+        }
+    }
+    return result;
+}
+
 }  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 9b01d32218..d26af6a87d 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -229,6 +229,19 @@ mod ffi {
         value: bool,
     }
 
+    struct FfiServerNode {
+        node_id: i32,
+        host: String,
+        port: u32,
+        server_type: String,
+        uid: String,
+    }
+
+    struct FfiServerNodesResult {
+        result: FfiResult,
+        server_nodes: Vec<FfiServerNode>,
+    }
+
     extern "Rust" {
         type Connection;
         type Admin;
@@ -319,6 +332,7 @@ mod ffi {
         fn get_database_info(self: &Admin, database_name: &str) -> FfiDatabaseInfoResult;
         fn list_tables(self: &Admin, database_name: &str) -> FfiListTablesResult;
         fn table_exists(self: &Admin, table_path: &FfiTablePath) -> FfiBoolResult;
+        fn get_server_nodes(self: &Admin) -> FfiServerNodesResult;
 
         // Table
         unsafe fn delete_table(table: *mut Table);
@@ -1104,6 +1118,33 @@ impl Admin {
             },
         }
     }
+
+    fn get_server_nodes(&self) -> ffi::FfiServerNodesResult {
+        let result = RUNTIME.block_on(async { self.inner.get_server_nodes().await });
+
+        match result {
+            Ok(nodes) => {
+                let server_nodes: Vec<ffi::FfiServerNode> = nodes
+                    .into_iter()
+                    .map(|node| ffi::FfiServerNode {
+                        node_id: node.id(),
+                        host: node.host().to_string(),
+                        port: node.port(),
+                        server_type: node.server_type().to_string(),
+                        uid: node.uid().to_string(),
+                    })
+                    .collect();
+                ffi::FfiServerNodesResult {
+                    result: ok_result(),
+                    server_nodes,
+                }
+            }
+            Err(e) => ffi::FfiServerNodesResult {
+                result: err_from_core_error(&e),
+                server_nodes: vec![],
+            },
+        }
+    }
 }
 
 // Table implementation
diff --git a/fluss-rust/bindings/cpp/test/test_admin.cpp b/fluss-rust/bindings/cpp/test/test_admin.cpp
index b6bb25b789..99f93fcf1e 100644
--- a/fluss-rust/bindings/cpp/test/test_admin.cpp
+++ b/fluss-rust/bindings/cpp/test/test_admin.cpp
@@ -285,6 +285,31 @@ TEST_F(AdminTest, ErrorTableAlreadyExist) {
     ASSERT_OK(adm.DropDatabase(db_name, true, true));
 }
 
+TEST_F(AdminTest, GetServerNodes) {
+    auto& adm = admin();
+
+    std::vector<fluss::ServerNode> nodes;
+    ASSERT_OK(adm.GetServerNodes(nodes));
+
+    ASSERT_GT(nodes.size(), 0u) << "Expected at least one server node";
+
+    bool has_coordinator = false;
+    bool has_tablet = false;
+    for (const auto& node : nodes) {
+        EXPECT_FALSE(node.host.empty()) << "Server node host should not be empty";
+        EXPECT_GT(node.port, 0u) << "Server node port should be > 0";
+        EXPECT_FALSE(node.uid.empty()) << "Server node uid should not be empty";
+
+        if (node.server_type == "CoordinatorServer") {
+            has_coordinator = true;
+        } else if (node.server_type == "TabletServer") {
+            has_tablet = true;
+        }
+    }
+    EXPECT_TRUE(has_coordinator) << "Expected a coordinator server node";
+    EXPECT_TRUE(has_tablet) << "Expected at least one tablet server node";
+}
+
 TEST_F(AdminTest, ErrorTableNotExist) {
     auto& adm = admin();
 
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 514d011ac7..4c2142d7b0 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -185,6 +185,31 @@ class FlussConnection:
     ) -> bool: ...
     def __repr__(self) -> str: ...
 
+class ServerNode:
+    """Information about a server node in the Fluss cluster."""
+
+    @property
+    def id(self) -> int:
+        """The server node ID."""
+        ...
+    @property
+    def host(self) -> str:
+        """The hostname of the server."""
+        ...
+    @property
+    def port(self) -> int:
+        """The port number of the server."""
+        ...
+    @property
+    def server_type(self) -> str:
+        """The type of server ('CoordinatorServer' or 'TabletServer')."""
+        ...
+    @property
+    def uid(self) -> str:
+        """The unique identifier of the server (e.g. 'cs-0', 'ts-1')."""
+        ...
+    def __repr__(self) -> str: ...
+
 class FlussAdmin:
     async def create_database(
         self,
@@ -307,6 +332,13 @@ class FlussAdmin:
             List of PartitionInfo objects
         """
         ...
+    async def get_server_nodes(self) -> List[ServerNode]:
+        """Get all alive server nodes in the cluster.
+
+        Returns:
+            List of ServerNode objects (coordinator and tablet servers)
+        """
+        ...
     def __repr__(self) -> str: ...
 
 
diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
index 30db37506b..703b13347b 100644
--- a/fluss-rust/bindings/python/src/admin.rs
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -501,6 +501,30 @@ impl FlussAdmin {
         })
     }
 
+    /// Get all alive server nodes in the cluster.
+    ///
+    /// Returns:
+    ///     List[ServerNode]: List of server nodes (coordinator and tablet servers)
+    pub fn get_server_nodes<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let admin = self.__admin.clone();
+
+        future_into_py(py, async move {
+            let nodes = admin
+                .get_server_nodes()
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))?;
+
+            Python::attach(|py| {
+                let py_list = pyo3::types::PyList::empty(py);
+                for node in nodes {
+                    let py_node = ServerNode::from_core(node);
+                    py_list.append(Py::new(py, py_node)?)?;
+                }
+                Ok(py_list.unbind())
+            })
+        })
+    }
+
     fn __repr__(&self) -> String {
         "FlussAdmin()".to_string()
     }
@@ -552,3 +576,60 @@ impl PartitionInfo {
         }
     }
 }
+
+/// Information about a server node in the Fluss cluster
+#[pyclass]
+pub struct ServerNode {
+    id: i32,
+    host: String,
+    port: u32,
+    server_type: String,
+    uid: String,
+}
+
+#[pymethods]
+impl ServerNode {
+    #[getter]
+    fn id(&self) -> i32 {
+        self.id
+    }
+
+    #[getter]
+    fn host(&self) -> &str {
+        &self.host
+    }
+
+    #[getter]
+    fn port(&self) -> u32 {
+        self.port
+    }
+
+    #[getter]
+    fn server_type(&self) -> &str {
+        &self.server_type
+    }
+
+    #[getter]
+    fn uid(&self) -> &str {
+        &self.uid
+    }
+
+    fn __repr__(&self) -> String {
+        format!(
+            "ServerNode(id={}, host='{}', port={}, server_type='{}')",
+            self.id, self.host, self.port, self.server_type
+        )
+    }
+}
+
+impl ServerNode {
+    pub fn from_core(node: fcore::ServerNode) -> Self {
+        Self {
+            id: node.id(),
+            host: node.host().to_string(),
+            port: node.port(),
+            server_type: node.server_type().to_string(),
+            uid: node.uid().to_string(),
+        }
+    }
+}
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index ebc0d54cc3..6890e08879 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -125,6 +125,7 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<ScanRecords>()?;
     m.add_class::<RecordBatch>()?;
     m.add_class::<PartitionInfo>()?;
+    m.add_class::<ServerNode>()?;
     m.add_class::<OffsetSpec>()?;
     m.add_class::<WriteResultHandle>()?;
     m.add_class::<DatabaseDescriptor>()?;
diff --git a/fluss-rust/bindings/python/test/test_admin.py b/fluss-rust/bindings/python/test/test_admin.py
index f203400f89..e2f43431d5 100644
--- a/fluss-rust/bindings/python/test/test_admin.py
+++ b/fluss-rust/bindings/python/test/test_admin.py
@@ -272,6 +272,23 @@ async def test_error_table_not_exist(admin):
     await admin.drop_table(table_path, ignore_if_not_exists=True)
 
 
+async def test_get_server_nodes(admin):
+    """Test get_server_nodes returns coordinator and tablet servers."""
+    nodes = await admin.get_server_nodes()
+
+    assert len(nodes) > 0, "Expected at least one server node"
+
+    server_types = [n.server_type for n in nodes]
+    assert "CoordinatorServer" in server_types, "Expected a coordinator server"
+    assert "TabletServer" in server_types, "Expected at least one tablet server"
+
+    for node in nodes:
+        assert node.host, "Server node host should not be empty"
+        assert node.port > 0, "Server node port should be > 0"
+        assert node.uid, "Server node uid should not be empty"
+        assert repr(node).startswith("ServerNode(")
+
+
 async def test_error_table_not_partitioned(admin):
     """Test error when calling partition operations on non-partitioned table."""
     db_name = "py_test_error_not_partitioned_db"
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 3012f85c9a..7a79e5ed99 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 use crate::client::metadata::Metadata;
+use crate::cluster::ServerNode;
 use crate::metadata::{
     DatabaseDescriptor, DatabaseInfo, JsonSerde, LakeSnapshot, PartitionInfo, PartitionSpec,
     PhysicalTablePath, TableBucket, TableDescriptor, TableInfo, TablePath,
@@ -267,6 +268,13 @@ impl FlussAdmin {
         ))
     }
 
+    /// Get all alive server nodes in the cluster, including the coordinator
+    /// and all tablet servers. Refreshes cluster metadata before returning.
+    pub async fn get_server_nodes(&self) -> Result<Vec<ServerNode>> {
+        self.metadata.reinit_cluster().await?;
+        Ok(self.metadata.get_cluster().get_server_nodes())
+    }
+
     /// Get the latest lake snapshot for a table
     pub async fn get_latest_lake_snapshot(&self, table_path: &TablePath) -> Result<LakeSnapshot> {
         let response = self
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index 3d8e77b2eb..8581464733 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -89,7 +89,7 @@ impl Metadata {
         Cluster::from_metadata_response(response, None)
     }
 
-    async fn reinit_cluster(&self) -> Result<()> {
+    pub(crate) async fn reinit_cluster(&self) -> Result<()> {
         let cluster = Self::init_cluster(&self.bootstrap, self.connections.clone()).await?;
         *self.cluster.write() = cluster.into();
         Ok(())
diff --git a/fluss-rust/crates/fluss/src/cluster/cluster.rs b/fluss-rust/crates/fluss/src/cluster/cluster.rs
index 5b1e08365c..d5518709ec 100644
--- a/fluss-rust/crates/fluss/src/cluster/cluster.rs
+++ b/fluss-rust/crates/fluss/src/cluster/cluster.rs
@@ -369,6 +369,15 @@ impl Cluster {
             .unwrap_or(&EMPTY)
     }
 
+    pub fn get_server_nodes(&self) -> Vec<ServerNode> {
+        let mut nodes = Vec::new();
+        if let Some(coordinator) = &self.coordinator_server {
+            nodes.push(coordinator.clone());
+        }
+        nodes.extend(self.alive_tablet_servers.iter().cloned());
+        nodes
+    }
+
     pub fn get_one_available_server(&self) -> Option<&ServerNode> {
         if self.alive_tablet_servers.is_empty() {
             return None;
@@ -427,3 +436,106 @@ fn get_bucket_locations(
     }
     bucket_locations
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    fn make_coordinator() -> ServerNode {
+        ServerNode::new(
+            0,
+            "coord-host".to_string(),
+            9123,
+            ServerType::CoordinatorServer,
+        )
+    }
+
+    fn make_tablet_servers() -> HashMap<i32, ServerNode> {
+        let mut servers = HashMap::new();
+        servers.insert(
+            1,
+            ServerNode::new(1, "ts1-host".to_string(), 9124, ServerType::TabletServer),
+        );
+        servers.insert(
+            2,
+            ServerNode::new(2, "ts2-host".to_string(), 9125, ServerType::TabletServer),
+        );
+        servers
+    }
+
+    #[test]
+    fn test_server_node_getters() {
+        let node = ServerNode::new(5, "myhost".to_string(), 8080, ServerType::TabletServer);
+        assert_eq!(node.id(), 5);
+        assert_eq!(node.host(), "myhost");
+        assert_eq!(node.port(), 8080);
+        assert_eq!(node.server_type(), &ServerType::TabletServer);
+        assert_eq!(node.uid(), "ts-5");
+        assert_eq!(node.url(), "myhost:8080");
+    }
+
+    #[test]
+    fn test_server_type_display() {
+        assert_eq!(ServerType::TabletServer.to_string(), "TabletServer");
+        assert_eq!(
+            ServerType::CoordinatorServer.to_string(),
+            "CoordinatorServer"
+        );
+    }
+
+    #[test]
+    fn test_get_server_nodes_with_coordinator_and_tablets() {
+        let cluster = Cluster::new(
+            Some(make_coordinator()),
+            make_tablet_servers(),
+            HashMap::new(),
+            HashMap::new(),
+            HashMap::new(),
+            HashMap::new(),
+            HashMap::new(),
+        );
+
+        let nodes = cluster.get_server_nodes();
+        assert_eq!(nodes.len(), 3);
+
+        let coordinator_count = nodes
+            .iter()
+            .filter(|n| *n.server_type() == ServerType::CoordinatorServer)
+            .count();
+        assert_eq!(coordinator_count, 1);
+
+        let tablet_count = nodes
+            .iter()
+            .filter(|n| *n.server_type() == ServerType::TabletServer)
+            .count();
+        assert_eq!(tablet_count, 2);
+    }
+
+    #[test]
+    fn test_get_server_nodes_no_coordinator() {
+        let cluster = Cluster::new(
+            None,
+            make_tablet_servers(),
+            HashMap::new(),
+            HashMap::new(),
+            HashMap::new(),
+            HashMap::new(),
+            HashMap::new(),
+        );
+
+        let nodes = cluster.get_server_nodes();
+        assert_eq!(nodes.len(), 2);
+        assert!(
+            nodes
+                .iter()
+                .all(|n| *n.server_type() == ServerType::TabletServer)
+        );
+    }
+
+    #[test]
+    fn test_get_server_nodes_empty_cluster() {
+        let cluster = Cluster::default();
+        let nodes = cluster.get_server_nodes();
+        assert!(nodes.is_empty());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/cluster/mod.rs b/fluss-rust/crates/fluss/src/cluster/mod.rs
index 58e80c00b0..8b825eee20 100644
--- a/fluss-rust/crates/fluss/src/cluster/mod.rs
+++ b/fluss-rust/crates/fluss/src/cluster/mod.rs
@@ -17,6 +17,7 @@
 
 use crate::BucketId;
 use crate::metadata::{PhysicalTablePath, TableBucket};
+use std::fmt;
 use std::sync::Arc;
 
 #[allow(clippy::module_inception)]
@@ -47,7 +48,7 @@ impl ServerNode {
         }
     }
 
-    pub fn uid(&self) -> &String {
+    pub fn uid(&self) -> &str {
         &self.uid
     }
 
@@ -58,6 +59,18 @@ impl ServerNode {
     pub fn id(&self) -> i32 {
         self.id
     }
+
+    pub fn host(&self) -> &str {
+        &self.host
+    }
+
+    pub fn port(&self) -> u32 {
+        self.port
+    }
+
+    pub fn server_type(&self) -> &ServerType {
+        &self.server_type
+    }
 }
 
 #[derive(Debug, Clone, PartialEq, Eq, Hash)]
@@ -66,6 +79,15 @@ pub enum ServerType {
     CoordinatorServer,
 }
 
+impl fmt::Display for ServerType {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        match self {
+            ServerType::TabletServer => write!(f, "TabletServer"),
+            ServerType::CoordinatorServer => write!(f, "CoordinatorServer"),
+        }
+    }
+}
+
 #[derive(Debug, Clone)]
 pub struct BucketLocation {
     pub table_bucket: TableBucket,
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index f079db2808..689c37ca06 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -22,6 +22,7 @@ pub mod row;
 pub mod rpc;
 
 mod cluster;
+pub use cluster::{ServerNode, ServerType};
 
 pub mod config;
 pub mod error;
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index c8fe9ae393..a345c2fdc5 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -84,7 +84,7 @@ impl RpcClient {
                 }
             }
 
-            connections.insert(server_id.clone(), new_server.clone());
+            connections.insert(server_id.to_owned(), new_server.clone());
         }
         Ok(new_server)
     }
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index c0745dc6a1..350292316f 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -519,6 +519,49 @@ mod admin_test {
             .expect("drop_table with ignore_if_not_exists should succeed");
     }
 
+    #[tokio::test]
+    async fn test_get_server_nodes() {
+        let cluster = get_fluss_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().await.unwrap();
+
+        let nodes = admin
+            .get_server_nodes()
+            .await
+            .expect("should get server nodes");
+
+        assert!(
+            !nodes.is_empty(),
+            "Expected at least one server node in the cluster"
+        );
+
+        let has_coordinator = nodes
+            .iter()
+            .any(|n| *n.server_type() == fluss::ServerType::CoordinatorServer);
+        assert!(has_coordinator, "Expected a coordinator server node");
+
+        let tablet_count = nodes
+            .iter()
+            .filter(|n| *n.server_type() == fluss::ServerType::TabletServer)
+            .count();
+        assert!(
+            tablet_count >= 1,
+            "Expected at least one tablet server node"
+        );
+
+        for node in &nodes {
+            assert!(
+                !node.host().is_empty(),
+                "Server node host should not be empty"
+            );
+            assert!(node.port() > 0, "Server node port should be > 0");
+            assert!(
+                !node.uid().is_empty(),
+                "Server node uid should not be empty"
+            );
+        }
+    }
+
     #[tokio::test]
     async fn test_error_table_not_partitioned() {
         let cluster = get_fluss_cluster();
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index 30d89a9c23..489f13a17b 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -78,6 +78,22 @@ Complete API reference for the Fluss C++ client.
 |-----------------------------------------------------------------------------|------------------------------|
 | `GetLatestLakeSnapshot(const TablePath& path, LakeSnapshot& out) -> Result` | Get the latest lake snapshot |
 
+### Cluster Operations
+
+| Method                                                    | Description                                               |
+|-----------------------------------------------------------|-----------------------------------------------------------|
+| `GetServerNodes(std::vector<ServerNode>& out) -> Result`  | Get all alive server nodes (coordinator + tablet servers) |
+
+## `ServerNode`
+
+| Field         | Type          | Description                                              |
+|---------------|---------------|----------------------------------------------------------|
+| `id`          | `int32_t`     | Server node ID                                           |
+| `host`        | `std::string` | Hostname of the server                                   |
+| `port`        | `uint32_t`    | Port number                                              |
+| `server_type` | `std::string` | Server type (`"CoordinatorServer"` or `"TabletServer"`)  |
+| `uid`         | `std::string` | Unique identifier (e.g. `"cs-0"`, `"ts-1"`)             |
+
 ## `Table`
 
 | Method                        | Description                              |
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index fa62fd9a7e..1c97066c0f 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -50,6 +50,17 @@ Supports `with` statement (context manager).
 | `await drop_partition(table_path, partition_spec, ignore_if_not_exists=False)`                                        | Drop a partition                      |
 | `await list_partition_infos(table_path) -> list[PartitionInfo]`                                                       | List partitions                       |
 | `await get_latest_lake_snapshot(table_path) -> LakeSnapshot`                                                          | Get latest lake snapshot              |
+| `await get_server_nodes() -> list[ServerNode]`                                                                        | Get all alive server nodes            |
+
+## `ServerNode`
+
+| Property                 | Description                                                |
+|--------------------------|------------------------------------------------------------|
+| `.id -> int`             | Server node ID                                             |
+| `.host -> str`           | Hostname of the server                                     |
+| `.port -> int`           | Port number                                                |
+| `.server_type -> str`    | Server type (`"CoordinatorServer"` or `"TabletServer"`)    |
+| `.uid -> str`            | Unique identifier (e.g. `"cs-0"`, `"ts-1"`)               |
 
 ## `FlussTable`
 
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index a38cd7d034..2d149aac5a 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -71,6 +71,22 @@ Complete API reference for the Fluss Rust client.
 |--------------------------------------------------------------------------------------------|------------------------------|
 | `async fn get_latest_lake_snapshot(&self, table_path: &TablePath) -> Result<LakeSnapshot>` | Get the latest lake snapshot |
 
+### Cluster Operations
+
+| Method                                                        | Description                                                |
+|---------------------------------------------------------------|------------------------------------------------------------|
+| `async fn get_server_nodes(&self) -> Result<Vec<ServerNode>>` | Get all alive server nodes (coordinator + tablet servers)  |
+
+## `ServerNode`
+
+| Method                            | Description                                          |
+|-----------------------------------|------------------------------------------------------|
+| `fn id(&self) -> i32`            | Server node ID                                       |
+| `fn host(&self) -> &str`         | Hostname of the server                               |
+| `fn port(&self) -> u32`          | Port number                                          |
+| `fn server_type(&self) -> &ServerType` | Server type (`CoordinatorServer` or `TabletServer`) |
+| `fn uid(&self) -> &str`          | Unique identifier (e.g. `"cs-0"`, `"ts-1"`)         |
+
 ## `FlussTable<'a>`
 
 | Method                                        | Description                             |

From 1f4ff05eb3f9c424ef429745fc78b1991a58b607 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 28 Feb 2026 11:40:02 +0000
Subject: [PATCH 173/287] feat: support sasl/plain auth (#375)

---
 .../.github/workflows/build_and_test_rust.yml |   2 +-
 fluss-rust/bindings/cpp/include/fluss.hpp     |  10 +
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |   5 +
 fluss-rust/bindings/cpp/src/lib.rs            |  13 +
 .../bindings/cpp/test/test_sasl_auth.cpp      | 125 ++++++++
 fluss-rust/bindings/cpp/test/test_utils.h     | 151 +++++----
 fluss-rust/bindings/python/src/config.rs      |  77 +++++
 fluss-rust/bindings/python/test/conftest.py   |  57 +++-
 .../bindings/python/test/test_sasl_auth.py    | 108 +++++++
 .../crates/fluss/src/client/connection.rs     |  18 +-
 fluss-rust/crates/fluss/src/config.rs         | 166 +++++++++-
 .../crates/fluss/src/proto/fluss_api.proto    |  11 +-
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |   4 +
 .../fluss/src/rpc/message/authenticate.rs     |  86 ++++++
 .../crates/fluss/src/rpc/message/mod.rs       |   2 +
 .../crates/fluss/src/rpc/server_connection.rs | 107 ++++++-
 .../crates/fluss/tests/integration/admin.rs   |  52 +---
 .../fluss/tests/integration/fluss_cluster.rs  | 290 +++++++++++++++---
 .../fluss/tests/integration/kv_table.rs       |  43 +--
 .../fluss/tests/integration/log_table.rs      | 107 +++----
 .../fluss/tests/integration/sasl_auth.rs      | 149 +++++++++
 .../tests/integration/table_remote_scan.rs    |  95 +-----
 .../crates/fluss/tests/integration/utils.rs   | 141 +++++----
 fluss-rust/crates/fluss/tests/test_fluss.rs   |   1 +
 .../docs/user-guide/cpp/error-handling.md     |  21 ++
 .../user-guide/cpp/example/configuration.md   |  39 ++-
 .../docs/user-guide/python/error-handling.md  |  19 ++
 .../python/example/configuration.md           |  26 +-
 .../docs/user-guide/rust/error-handling.md    |  19 ++
 .../user-guide/rust/example/configuration.md  |  46 ++-
 30 files changed, 1560 insertions(+), 430 deletions(-)
 create mode 100644 fluss-rust/bindings/cpp/test/test_sasl_auth.cpp
 create mode 100644 fluss-rust/bindings/python/test/test_sasl_auth.py
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/authenticate.rs
 create mode 100644 fluss-rust/crates/fluss/tests/integration/sasl_auth.rs

diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
index c9e05b7428..1bf7bc58fc 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -79,7 +79,7 @@ jobs:
       - name: Integration Test (Linux only)
         if: runner.os == 'Linux'
         run: |
-          RUST_TEST_THREADS=1 cargo test --features integration_tests --all-targets --workspace --exclude fluss_python --exclude fluss-cpp -- --nocapture
+          cargo test --features integration_tests --all-targets --workspace --exclude fluss_python --exclude fluss-cpp
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index cb060282f4..b507da7229 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -998,6 +998,16 @@ struct Configuration {
     // Maximum number of records returned in a single call to Poll() for LogScanner
     size_t scanner_log_max_poll_records{500};
     int64_t writer_batch_timeout_ms{100};
+    // Connect timeout in milliseconds for TCP transport connect
+    uint64_t connect_timeout_ms{120000};
+    // Security protocol: "PLAINTEXT" (default, no auth) or "sasl" (SASL auth)
+    std::string security_protocol{"PLAINTEXT"};
+    // SASL mechanism (only "PLAIN" is supported)
+    std::string security_sasl_mechanism{"PLAIN"};
+    // SASL username (required when security_protocol is "sasl")
+    std::string security_sasl_username;
+    // SASL password (required when security_protocol is "sasl")
+    std::string security_sasl_password;
 };
 
 class Connection {
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 9020027731..3375761460 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -57,6 +57,11 @@ inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi_config.scanner_remote_log_read_concurrency = config.scanner_remote_log_read_concurrency;
     ffi_config.scanner_log_max_poll_records = config.scanner_log_max_poll_records;
     ffi_config.writer_batch_timeout_ms = config.writer_batch_timeout_ms;
+    ffi_config.connect_timeout_ms = config.connect_timeout_ms;
+    ffi_config.security_protocol = rust::String(config.security_protocol);
+    ffi_config.security_sasl_mechanism = rust::String(config.security_sasl_mechanism);
+    ffi_config.security_sasl_username = rust::String(config.security_sasl_username);
+    ffi_config.security_sasl_password = rust::String(config.security_sasl_password);
     return ffi_config;
 }
 
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index d26af6a87d..c310fc838e 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -49,6 +49,11 @@ mod ffi {
         scanner_remote_log_read_concurrency: usize,
         scanner_log_max_poll_records: usize,
         writer_batch_timeout_ms: i64,
+        connect_timeout_ms: u64,
+        security_protocol: String,
+        security_sasl_mechanism: String,
+        security_sasl_username: String,
+        security_sasl_password: String,
     }
 
     struct FfiResult {
@@ -258,6 +263,9 @@ mod ffi {
         type LookupResultInner;
 
         // Connection
+        // TODO: all Result<*mut T> methods lose server error codes (mapped to CLIENT_ERROR).
+        // Fix by introducing some struct like { result: FfiResult, ptr: i64 } to preserve error
+        // codes from the server, matching how Rust and Python bindings handle errors.
         fn new_connection(config: &FfiConfig) -> Result<*mut Connection>;
         unsafe fn delete_connection(conn: *mut Connection);
         fn get_admin(self: &Connection) -> Result<*mut Admin>;
@@ -645,6 +653,11 @@ fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
         remote_file_download_thread_num: config.remote_file_download_thread_num,
         scanner_remote_log_read_concurrency: config.scanner_remote_log_read_concurrency,
         scanner_log_max_poll_records: config.scanner_log_max_poll_records,
+        connect_timeout_ms: config.connect_timeout_ms,
+        security_protocol: config.security_protocol.to_string(),
+        security_sasl_mechanism: config.security_sasl_mechanism.to_string(),
+        security_sasl_username: config.security_sasl_username.to_string(),
+        security_sasl_password: config.security_sasl_password.to_string(),
     };
 
     let conn = RUNTIME.block_on(async { fcore::client::FlussConnection::new(config_core).await });
diff --git a/fluss-rust/bindings/cpp/test/test_sasl_auth.cpp b/fluss-rust/bindings/cpp/test/test_sasl_auth.cpp
new file mode 100644
index 0000000000..2208db3019
--- /dev/null
+++ b/fluss-rust/bindings/cpp/test/test_sasl_auth.cpp
@@ -0,0 +1,125 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include <gtest/gtest.h>
+
+#include "test_utils.h"
+
+class SaslAuthTest : public ::testing::Test {
+   protected:
+    const std::string& sasl_servers() {
+        return fluss_test::FlussTestEnvironment::Instance()->GetSaslBootstrapServers();
+    }
+    const std::string& plaintext_servers() {
+        return fluss_test::FlussTestEnvironment::Instance()->GetBootstrapServers();
+    }
+};
+
+TEST_F(SaslAuthTest, SaslConnectWithValidCredentials) {
+    fluss::Configuration config;
+    config.bootstrap_servers = sasl_servers();
+    config.security_protocol = "sasl";
+    config.security_sasl_mechanism = "PLAIN";
+    config.security_sasl_username = "admin";
+    config.security_sasl_password = "admin-secret";
+
+    fluss::Connection conn;
+    ASSERT_OK(fluss::Connection::Create(config, conn));
+
+    fluss::Admin admin;
+    ASSERT_OK(conn.GetAdmin(admin));
+
+    // Perform a basic operation to confirm the connection is fully functional
+    std::string db_name = "cpp_sasl_test_valid_db";
+    fluss::DatabaseDescriptor descriptor;
+    descriptor.comment = "created via SASL auth";
+    ASSERT_OK(admin.CreateDatabase(db_name, descriptor, true));
+
+    bool exists = false;
+    ASSERT_OK(admin.DatabaseExists(db_name, exists));
+    ASSERT_TRUE(exists);
+
+    ASSERT_OK(admin.DropDatabase(db_name, true, true));
+}
+
+TEST_F(SaslAuthTest, SaslConnectWithSecondUser) {
+    fluss::Configuration config;
+    config.bootstrap_servers = sasl_servers();
+    config.security_protocol = "sasl";
+    config.security_sasl_mechanism = "PLAIN";
+    config.security_sasl_username = "alice";
+    config.security_sasl_password = "alice-secret";
+
+    fluss::Connection conn;
+    ASSERT_OK(fluss::Connection::Create(config, conn));
+
+    fluss::Admin admin;
+    ASSERT_OK(conn.GetAdmin(admin));
+
+    // Basic operation to confirm functional connection
+    bool exists = false;
+    ASSERT_OK(admin.DatabaseExists("some_nonexistent_db_alice", exists));
+    ASSERT_FALSE(exists);
+}
+
+TEST_F(SaslAuthTest, SaslConnectWithWrongPassword) {
+    fluss::Configuration config;
+    config.bootstrap_servers = sasl_servers();
+    config.security_protocol = "sasl";
+    config.security_sasl_mechanism = "PLAIN";
+    config.security_sasl_username = "admin";
+    config.security_sasl_password = "wrong-password";
+
+    fluss::Connection conn;
+    auto result = fluss::Connection::Create(config, conn);
+    ASSERT_FALSE(result.Ok());
+    // TODO: error_code is CLIENT_ERROR (-2) because CXX Result<*mut T> loses the server
+    // error code. Should be AUTHENTICATE_EXCEPTION (46) once fixed.
+    EXPECT_NE(result.error_message.find("Authentication failed"), std::string::npos)
+        << "Expected 'Authentication failed' in: " << result.error_message;
+}
+
+TEST_F(SaslAuthTest, SaslConnectWithUnknownUser) {
+    fluss::Configuration config;
+    config.bootstrap_servers = sasl_servers();
+    config.security_protocol = "sasl";
+    config.security_sasl_mechanism = "PLAIN";
+    config.security_sasl_username = "nonexistent_user";
+    config.security_sasl_password = "some-password";
+
+    fluss::Connection conn;
+    auto result = fluss::Connection::Create(config, conn);
+    ASSERT_FALSE(result.Ok());
+    // TODO: same as above — should check error_code == AUTHENTICATE_EXCEPTION once fixed.
+    EXPECT_NE(result.error_message.find("Authentication failed"), std::string::npos)
+        << "Expected 'Authentication failed' in: " << result.error_message;
+}
+
+TEST_F(SaslAuthTest, SaslClientToPlaintextServer) {
+    fluss::Configuration config;
+    config.bootstrap_servers = plaintext_servers();
+    config.security_protocol = "sasl";
+    config.security_sasl_mechanism = "PLAIN";
+    config.security_sasl_username = "admin";
+    config.security_sasl_password = "admin-secret";
+
+    fluss::Connection conn;
+    auto result = fluss::Connection::Create(config, conn);
+    ASSERT_FALSE(result.Ok()) << "SASL client connecting to plaintext server should fail";
+}
diff --git a/fluss-rust/bindings/cpp/test/test_utils.h b/fluss-rust/bindings/cpp/test/test_utils.h
index bae523775f..98d119a5d3 100644
--- a/fluss-rust/bindings/cpp/test/test_utils.h
+++ b/fluss-rust/bindings/cpp/test/test_utils.h
@@ -49,23 +49,46 @@
 
 namespace fluss_test {
 
-static constexpr const char* kFlussVersion = "0.7.0";
+static constexpr const char* kFlussImage = "apache/fluss";
+static constexpr const char* kFlussVersion = "0.8.0-incubating";
 static constexpr const char* kNetworkName = "fluss-cpp-test-network";
 static constexpr const char* kZookeeperName = "zookeeper-cpp-test";
 static constexpr const char* kCoordinatorName = "coordinator-server-cpp-test";
 static constexpr const char* kTabletServerName = "tablet-server-cpp-test";
 static constexpr int kCoordinatorPort = 9123;
 static constexpr int kTabletServerPort = 9124;
+static constexpr int kPlainClientPort = 9223;
+static constexpr int kPlainClientTabletPort = 9224;
 
 /// Execute a shell command and return its exit code.
-inline int RunCommand(const std::string& cmd) {
-    return system(cmd.c_str());
+inline int RunCommand(const std::string& cmd) { return system(cmd.c_str()); }
+
+/// Join property lines with the escaped newline separator used by `printf` in docker commands.
+inline std::string JoinProps(const std::vector<std::string>& lines) {
+    std::string result;
+    for (size_t i = 0; i < lines.size(); ++i) {
+        if (i > 0) result += "\\n";
+        result += lines[i];
+    }
+    return result;
+}
+
+/// Build a `docker run` command with FLUSS_PROPERTIES.
+inline std::string DockerRunCmd(const std::string& name, const std::string& props,
+                                const std::vector<std::string>& port_mappings,
+                                const std::string& server_type) {
+    std::string cmd = "docker run -d --rm --name " + name + " --network " + kNetworkName;
+    for (const auto& pm : port_mappings) {
+        cmd += " -p " + pm;
+    }
+    cmd += " -e FLUSS_PROPERTIES=\"$(printf '" + props + "')\"";
+    cmd += " " + std::string(kFlussImage) + ":" + kFlussVersion + " " + server_type;
+    return cmd;
 }
 
 /// Wait until a TCP port is accepting connections, or timeout.
 inline bool WaitForPort(const std::string& host, int port, int timeout_seconds = 60) {
-    auto deadline =
-        std::chrono::steady_clock::now() + std::chrono::seconds(timeout_seconds);
+    auto deadline = std::chrono::steady_clock::now() + std::chrono::seconds(timeout_seconds);
 
     while (std::chrono::steady_clock::now() < deadline) {
         int sock = socket(AF_INET, SOCK_STREAM, 0);
@@ -114,10 +137,8 @@ class FlussTestCluster {
         RunCommand(std::string("docker network create ") + kNetworkName + " 2>/dev/null || true");
 
         // Start ZooKeeper
-        std::string zk_cmd = std::string("docker run -d --rm") +
-                              " --name " + kZookeeperName +
-                              " --network " + kNetworkName +
-                              " zookeeper:3.9.2";
+        std::string zk_cmd = std::string("docker run -d --rm") + " --name " + kZookeeperName +
+                             " --network " + kNetworkName + " zookeeper:3.9.2";
         if (RunCommand(zk_cmd) != 0) {
             std::cerr << "Failed to start ZooKeeper" << std::endl;
             return false;
@@ -126,23 +147,29 @@ class FlussTestCluster {
         // Wait for ZooKeeper to be ready before starting Fluss servers
         std::this_thread::sleep_for(std::chrono::seconds(5));
 
-        // Start Coordinator Server
-        std::string coord_props =
-            "zookeeper.address: " + std::string(kZookeeperName) + ":2181\\n"
-            "bind.listeners: INTERNAL://" + std::string(kCoordinatorName) + ":0, CLIENT://" +
-            std::string(kCoordinatorName) + ":9123\\n"
-            "advertised.listeners: CLIENT://localhost:9123\\n"
-            "internal.listener.name: INTERNAL\\n"
-            "netty.server.num-network-threads: 1\\n"
-            "netty.server.num-worker-threads: 3";
-
-        std::string coord_cmd = std::string("docker run -d --rm") +
-                                " --name " + kCoordinatorName +
-                                " --network " + kNetworkName +
-                                " -p 9123:9123" +
-                                " -e FLUSS_PROPERTIES=\"$(printf '" + coord_props + "')\"" +
-                                " fluss/fluss:" + kFlussVersion +
-                                " coordinatorServer";
+        // Start Coordinator Server with dual listeners:
+        // CLIENT=SASL on 9123, PLAIN_CLIENT=plaintext on 9223.
+        std::string sasl_jaas =
+            "org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required"
+            " user_admin=\"admin-secret\" user_alice=\"alice-secret\";";
+
+        std::string coord = std::string(kCoordinatorName);
+        std::string zk = std::string(kZookeeperName);
+        std::string coord_props = JoinProps({
+            "zookeeper.address: " + zk + ":2181",
+            "bind.listeners: INTERNAL://" + coord + ":0, CLIENT://" + coord +
+                ":9123, PLAIN_CLIENT://" + coord + ":9223",
+            "advertised.listeners: CLIENT://localhost:9123, PLAIN_CLIENT://localhost:9223",
+            "internal.listener.name: INTERNAL",
+            "security.protocol.map: CLIENT:sasl",
+            "security.sasl.enabled.mechanisms: plain",
+            "security.sasl.plain.jaas.config: " + sasl_jaas,
+            "netty.server.num-network-threads: 1",
+            "netty.server.num-worker-threads: 3",
+        });
+
+        std::string coord_cmd = DockerRunCmd(kCoordinatorName, coord_props,
+                                             {"9123:9123", "9223:9223"}, "coordinatorServer");
         if (RunCommand(coord_cmd) != 0) {
             std::cerr << "Failed to start Coordinator Server" << std::endl;
             Stop();
@@ -156,24 +183,27 @@ class FlussTestCluster {
             return false;
         }
 
-        // Start Tablet Server
-        std::string ts_props =
-            "zookeeper.address: " + std::string(kZookeeperName) + ":2181\\n"
-            "bind.listeners: INTERNAL://" + std::string(kTabletServerName) + ":0, CLIENT://" +
-            std::string(kTabletServerName) + ":9123\\n"
-            "advertised.listeners: CLIENT://localhost:" + std::to_string(kTabletServerPort) + "\\n"
-            "internal.listener.name: INTERNAL\\n"
-            "tablet-server.id: 0\\n"
-            "netty.server.num-network-threads: 1\\n"
-            "netty.server.num-worker-threads: 3";
-
-        std::string ts_cmd = std::string("docker run -d --rm") +
-                             " --name " + kTabletServerName +
-                             " --network " + kNetworkName +
-                             " -p " + std::to_string(kTabletServerPort) + ":9123" +
-                             " -e FLUSS_PROPERTIES=\"$(printf '" + ts_props + "')\"" +
-                             " fluss/fluss:" + kFlussVersion +
-                             " tabletServer";
+        // Start Tablet Server (dual listeners: CLIENT=SASL on 9123, PLAIN_CLIENT=plaintext on 9223)
+        std::string ts = std::string(kTabletServerName);
+        std::string ts_props = JoinProps({
+            "zookeeper.address: " + zk + ":2181",
+            "bind.listeners: INTERNAL://" + ts + ":0, CLIENT://" + ts + ":9123, PLAIN_CLIENT://" +
+                ts + ":9223",
+            "advertised.listeners: CLIENT://localhost:" + std::to_string(kTabletServerPort) +
+                ", PLAIN_CLIENT://localhost:" + std::to_string(kPlainClientTabletPort),
+            "internal.listener.name: INTERNAL",
+            "security.protocol.map: CLIENT:sasl",
+            "security.sasl.enabled.mechanisms: plain",
+            "security.sasl.plain.jaas.config: " + sasl_jaas,
+            "tablet-server.id: 0",
+            "netty.server.num-network-threads: 1",
+            "netty.server.num-worker-threads: 3",
+        });
+
+        std::string ts_cmd = DockerRunCmd(kTabletServerName, ts_props,
+                                          {std::to_string(kTabletServerPort) + ":9123",
+                                           std::to_string(kPlainClientTabletPort) + ":9223"},
+                                          "tabletServer");
         if (RunCommand(ts_cmd) != 0) {
             std::cerr << "Failed to start Tablet Server" << std::endl;
             Stop();
@@ -187,7 +217,20 @@ class FlussTestCluster {
             return false;
         }
 
-        bootstrap_servers_ = "127.0.0.1:9123";
+        // Wait for plaintext listeners
+        if (!WaitForPort("127.0.0.1", kPlainClientPort)) {
+            std::cerr << "Coordinator plaintext listener did not become ready" << std::endl;
+            Stop();
+            return false;
+        }
+        if (!WaitForPort("127.0.0.1", kPlainClientTabletPort)) {
+            std::cerr << "Tablet Server plaintext listener did not become ready" << std::endl;
+            Stop();
+            return false;
+        }
+
+        bootstrap_servers_ = "127.0.0.1:" + std::to_string(kPlainClientPort);
+        sasl_bootstrap_servers_ = "127.0.0.1:" + std::to_string(kCoordinatorPort);
         std::cout << "Fluss cluster started successfully." << std::endl;
         return true;
     }
@@ -204,9 +247,11 @@ class FlussTestCluster {
     }
 
     const std::string& GetBootstrapServers() const { return bootstrap_servers_; }
+    const std::string& GetSaslBootstrapServers() const { return sasl_bootstrap_servers_; }
 
    private:
     std::string bootstrap_servers_;
+    std::string sasl_bootstrap_servers_;
     bool external_cluster_{false};
 };
 
@@ -230,8 +275,7 @@ class FlussTestEnvironment : public ::testing::Environment {
         fluss::Configuration config;
         config.bootstrap_servers = cluster_.GetBootstrapServers();
 
-        auto deadline =
-            std::chrono::steady_clock::now() + std::chrono::seconds(60);
+        auto deadline = std::chrono::steady_clock::now() + std::chrono::seconds(60);
         while (std::chrono::steady_clock::now() < deadline) {
             auto result = fluss::Connection::Create(config, connection_);
             if (result.Ok()) {
@@ -247,13 +291,12 @@ class FlussTestEnvironment : public ::testing::Environment {
         GTEST_SKIP() << "Fluss cluster did not become ready within timeout.";
     }
 
-    void TearDown() override {
-        cluster_.Stop();
-    }
+    void TearDown() override { cluster_.Stop(); }
 
     fluss::Connection& GetConnection() { return connection_; }
     fluss::Admin& GetAdmin() { return admin_; }
     const std::string& GetBootstrapServers() { return cluster_.GetBootstrapServers(); }
+    const std::string& GetSaslBootstrapServers() { return cluster_.GetSaslBootstrapServers(); }
 
    private:
     FlussTestEnvironment() = default;
@@ -286,8 +329,8 @@ inline void CreatePartitions(fluss::Admin& admin, const fluss::TablePath& path,
 /// Poll a LogScanner for ScanRecords until `expected_count` items are collected or timeout.
 /// `extract_fn` is called for each ScanRecord and should return a value of type T.
 template <typename T, typename ExtractFn>
-void PollRecords(fluss::LogScanner& scanner, size_t expected_count,
-                 ExtractFn extract_fn, std::vector<T>& out) {
+void PollRecords(fluss::LogScanner& scanner, size_t expected_count, ExtractFn extract_fn,
+                 std::vector<T>& out) {
     auto deadline = std::chrono::steady_clock::now() + std::chrono::seconds(10);
     while (out.size() < expected_count && std::chrono::steady_clock::now() < deadline) {
         fluss::ScanRecords records;
@@ -301,8 +344,8 @@ void PollRecords(fluss::LogScanner& scanner, size_t expected_count,
 /// Poll a LogScanner for ArrowRecordBatches until `expected_count` items are collected or timeout.
 /// `extract_fn` is called with the full ArrowRecordBatches and should return a std::vector<T>.
 template <typename T, typename ExtractFn>
-void PollRecordBatches(fluss::LogScanner& scanner, size_t expected_count,
-                       ExtractFn extract_fn, std::vector<T>& out) {
+void PollRecordBatches(fluss::LogScanner& scanner, size_t expected_count, ExtractFn extract_fn,
+                       std::vector<T>& out) {
     auto deadline = std::chrono::steady_clock::now() + std::chrono::seconds(10);
     while (out.size() < expected_count && std::chrono::steady_clock::now() < deadline) {
         fluss::ArrowRecordBatches batches;
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index 9c0059e098..4582d43d49 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -108,6 +108,23 @@ impl Config {
                             }
                         };
                     }
+                    "connect-timeout" => {
+                        config.connect_timeout_ms = value.parse::<u64>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
+                        })?;
+                    }
+                    "security.protocol" => {
+                        config.security_protocol = value;
+                    }
+                    "security.sasl.mechanism" => {
+                        config.security_sasl_mechanism = value;
+                    }
+                    "security.sasl.username" => {
+                        config.security_sasl_username = value;
+                    }
+                    "security.sasl.password" => {
+                        config.security_sasl_password = value;
+                    }
                     _ => {
                         return Err(FlussError::new_err(format!("Unknown property: {key}")));
                     }
@@ -237,6 +254,66 @@ impl Config {
     fn set_writer_batch_timeout_ms(&mut self, timeout: i64) {
         self.inner.writer_batch_timeout_ms = timeout;
     }
+
+    /// Get the connect timeout in milliseconds
+    #[getter]
+    fn connect_timeout_ms(&self) -> u64 {
+        self.inner.connect_timeout_ms
+    }
+
+    /// Set the connect timeout in milliseconds
+    #[setter]
+    fn set_connect_timeout_ms(&mut self, timeout: u64) {
+        self.inner.connect_timeout_ms = timeout;
+    }
+
+    /// Get the security protocol
+    #[getter]
+    fn security_protocol(&self) -> String {
+        self.inner.security_protocol.clone()
+    }
+
+    /// Set the security protocol
+    #[setter]
+    fn set_security_protocol(&mut self, protocol: String) {
+        self.inner.security_protocol = protocol;
+    }
+
+    /// Get the SASL mechanism
+    #[getter]
+    fn security_sasl_mechanism(&self) -> String {
+        self.inner.security_sasl_mechanism.clone()
+    }
+
+    /// Set the SASL mechanism
+    #[setter]
+    fn set_security_sasl_mechanism(&mut self, mechanism: String) {
+        self.inner.security_sasl_mechanism = mechanism;
+    }
+
+    /// Get the SASL username
+    #[getter]
+    fn security_sasl_username(&self) -> String {
+        self.inner.security_sasl_username.clone()
+    }
+
+    /// Set the SASL username
+    #[setter]
+    fn set_security_sasl_username(&mut self, username: String) {
+        self.inner.security_sasl_username = username;
+    }
+
+    /// Get the SASL password
+    #[getter]
+    fn security_sasl_password(&self) -> String {
+        self.inner.security_sasl_password.clone()
+    }
+
+    /// Set the SASL password
+    #[setter]
+    fn set_security_sasl_password(&mut self, password: String) {
+        self.inner.security_sasl_password = password;
+    }
 }
 
 impl Config {
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
index fbd7396ee8..0a969e8462 100644
--- a/fluss-rust/bindings/python/test/conftest.py
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -33,7 +33,8 @@
 
 import fluss
 
-FLUSS_VERSION = "0.7.0"
+FLUSS_IMAGE = "apache/fluss"
+FLUSS_VERSION = "0.8.0-incubating"
 BOOTSTRAP_SERVERS_ENV = os.environ.get("FLUSS_BOOTSTRAP_SERVERS")
 
 
@@ -53,7 +54,7 @@ def _wait_for_port(host, port, timeout=60):
 def fluss_cluster():
     """Start a Fluss cluster using testcontainers, or use an existing one."""
     if BOOTSTRAP_SERVERS_ENV:
-        yield BOOTSTRAP_SERVERS_ENV
+        yield (BOOTSTRAP_SERVERS_ENV, BOOTSTRAP_SERVERS_ENV)
         return
 
     from testcontainers.core.container import DockerContainer
@@ -68,20 +69,30 @@ def fluss_cluster():
         .with_name("zookeeper-python-test")
     )
 
+    sasl_jaas = (
+        "org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required"
+        ' user_admin="admin-secret" user_alice="alice-secret";'
+    )
     coordinator_props = "\n".join([
         "zookeeper.address: zookeeper-python-test:2181",
         "bind.listeners: INTERNAL://coordinator-server-python-test:0,"
-        " CLIENT://coordinator-server-python-test:9123",
-        "advertised.listeners: CLIENT://localhost:9123",
+        " CLIENT://coordinator-server-python-test:9123,"
+        " PLAIN_CLIENT://coordinator-server-python-test:9223",
+        "advertised.listeners: CLIENT://localhost:9123,"
+        " PLAIN_CLIENT://localhost:9223",
         "internal.listener.name: INTERNAL",
+        "security.protocol.map: CLIENT:sasl",
+        "security.sasl.enabled.mechanisms: plain",
+        f"security.sasl.plain.jaas.config: {sasl_jaas}",
         "netty.server.num-network-threads: 1",
         "netty.server.num-worker-threads: 3",
     ])
     coordinator = (
-        DockerContainer(f"fluss/fluss:{FLUSS_VERSION}")
+        DockerContainer(f"{FLUSS_IMAGE}:{FLUSS_VERSION}")
         .with_network(network)
         .with_name("coordinator-server-python-test")
         .with_bind_ports(9123, 9123)
+        .with_bind_ports(9223, 9223)
         .with_command("coordinatorServer")
         .with_env("FLUSS_PROPERTIES", coordinator_props)
     )
@@ -89,18 +100,24 @@ def fluss_cluster():
     tablet_props = "\n".join([
         "zookeeper.address: zookeeper-python-test:2181",
         "bind.listeners: INTERNAL://tablet-server-python-test:0,"
-        " CLIENT://tablet-server-python-test:9123",
-        "advertised.listeners: CLIENT://localhost:9124",
+        " CLIENT://tablet-server-python-test:9123,"
+        " PLAIN_CLIENT://tablet-server-python-test:9223",
+        "advertised.listeners: CLIENT://localhost:9124,"
+        " PLAIN_CLIENT://localhost:9224",
         "internal.listener.name: INTERNAL",
+        "security.protocol.map: CLIENT:sasl",
+        "security.sasl.enabled.mechanisms: plain",
+        f"security.sasl.plain.jaas.config: {sasl_jaas}",
         "tablet-server.id: 0",
         "netty.server.num-network-threads: 1",
         "netty.server.num-worker-threads: 3",
     ])
     tablet_server = (
-        DockerContainer(f"fluss/fluss:{FLUSS_VERSION}")
+        DockerContainer(f"{FLUSS_IMAGE}:{FLUSS_VERSION}")
         .with_network(network)
         .with_name("tablet-server-python-test")
         .with_bind_ports(9123, 9124)
+        .with_bind_ports(9223, 9224)
         .with_command("tabletServer")
         .with_env("FLUSS_PROPERTIES", tablet_props)
     )
@@ -111,10 +128,13 @@ def fluss_cluster():
 
     _wait_for_port("localhost", 9123)
     _wait_for_port("localhost", 9124)
+    _wait_for_port("localhost", 9223)
+    _wait_for_port("localhost", 9224)
     # Extra wait for cluster to fully initialize
     time.sleep(10)
 
-    yield "127.0.0.1:9123"
+    # (plaintext_bootstrap, sasl_bootstrap)
+    yield ("127.0.0.1:9223", "127.0.0.1:9123")
 
     tablet_server.stop()
     coordinator.stop()
@@ -124,13 +144,28 @@ def fluss_cluster():
 
 @pytest_asyncio.fixture(scope="session")
 async def connection(fluss_cluster):
-    """Session-scoped connection to the Fluss cluster."""
-    config = fluss.Config({"bootstrap.servers": fluss_cluster})
+    """Session-scoped connection to the Fluss cluster (plaintext)."""
+    plaintext_addr, _sasl_addr = fluss_cluster
+    config = fluss.Config({"bootstrap.servers": plaintext_addr})
     conn = await fluss.FlussConnection.create(config)
     yield conn
     conn.close()
 
 
+@pytest.fixture(scope="session")
+def sasl_bootstrap_servers(fluss_cluster):
+    """Bootstrap servers for the SASL listener."""
+    _plaintext_addr, sasl_addr = fluss_cluster
+    return sasl_addr
+
+
+@pytest.fixture(scope="session")
+def plaintext_bootstrap_servers(fluss_cluster):
+    """Bootstrap servers for the plaintext (non-SASL) listener."""
+    plaintext_addr, _sasl_addr = fluss_cluster
+    return plaintext_addr
+
+
 @pytest_asyncio.fixture(scope="session")
 async def admin(connection):
     """Session-scoped admin client."""
diff --git a/fluss-rust/bindings/python/test/test_sasl_auth.py b/fluss-rust/bindings/python/test/test_sasl_auth.py
new file mode 100644
index 0000000000..30fce4ce6d
--- /dev/null
+++ b/fluss-rust/bindings/python/test/test_sasl_auth.py
@@ -0,0 +1,108 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Integration tests for SASL/PLAIN authentication.
+
+Mirrors the Rust integration tests in crates/fluss/tests/integration/sasl_auth.rs.
+"""
+
+import pytest
+
+import fluss
+
+
+async def test_sasl_connect_with_valid_credentials(sasl_bootstrap_servers):
+    """Verify that a client with correct SASL credentials can connect and perform operations."""
+    config = fluss.Config({
+        "bootstrap.servers": sasl_bootstrap_servers,
+        "security.protocol": "sasl",
+        "security.sasl.mechanism": "PLAIN",
+        "security.sasl.username": "admin",
+        "security.sasl.password": "admin-secret",
+    })
+    conn = await fluss.FlussConnection.create(config)
+    admin = await conn.get_admin()
+
+    db_name = "py_sasl_test_valid_db"
+    db_descriptor = fluss.DatabaseDescriptor(comment="created via SASL auth")
+    await admin.create_database(db_name, db_descriptor, ignore_if_exists=True)
+
+    assert await admin.database_exists(db_name)
+
+    # Cleanup
+    await admin.drop_database(db_name, ignore_if_not_exists=True, cascade=True)
+    conn.close()
+
+
+async def test_sasl_connect_with_second_user(sasl_bootstrap_servers):
+    """Verify that a second user can also authenticate successfully."""
+    config = fluss.Config({
+        "bootstrap.servers": sasl_bootstrap_servers,
+        "security.protocol": "sasl",
+        "security.sasl.mechanism": "PLAIN",
+        "security.sasl.username": "alice",
+        "security.sasl.password": "alice-secret",
+    })
+    conn = await fluss.FlussConnection.create(config)
+    admin = await conn.get_admin()
+
+    # Basic operation to confirm functional connection
+    assert not await admin.database_exists("some_nonexistent_db_alice")
+    conn.close()
+
+
+async def test_sasl_connect_with_wrong_password(sasl_bootstrap_servers):
+    """Verify that wrong credentials are rejected with AUTHENTICATE_EXCEPTION."""
+    config = fluss.Config({
+        "bootstrap.servers": sasl_bootstrap_servers,
+        "security.protocol": "sasl",
+        "security.sasl.mechanism": "PLAIN",
+        "security.sasl.username": "admin",
+        "security.sasl.password": "wrong-password",
+    })
+    with pytest.raises(fluss.FlussError) as exc_info:
+        await fluss.FlussConnection.create(config)
+
+    assert exc_info.value.error_code == fluss.ErrorCode.AUTHENTICATE_EXCEPTION
+
+
+async def test_sasl_connect_with_unknown_user(sasl_bootstrap_servers):
+    """Verify that a nonexistent user is rejected with AUTHENTICATE_EXCEPTION."""
+    config = fluss.Config({
+        "bootstrap.servers": sasl_bootstrap_servers,
+        "security.protocol": "sasl",
+        "security.sasl.mechanism": "PLAIN",
+        "security.sasl.username": "nonexistent_user",
+        "security.sasl.password": "some-password",
+    })
+    with pytest.raises(fluss.FlussError) as exc_info:
+        await fluss.FlussConnection.create(config)
+
+    assert exc_info.value.error_code == fluss.ErrorCode.AUTHENTICATE_EXCEPTION
+
+
+async def test_sasl_client_to_plaintext_server(plaintext_bootstrap_servers):
+    """Verify that a SASL-configured client fails when connecting to a plaintext server."""
+    config = fluss.Config({
+        "bootstrap.servers": plaintext_bootstrap_servers,
+        "security.protocol": "sasl",
+        "security.sasl.mechanism": "PLAIN",
+        "security.sasl.username": "admin",
+        "security.sasl.password": "admin-secret",
+    })
+    with pytest.raises(fluss.FlussError):
+        await fluss.FlussConnection.create(config)
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index a17e57fb5f..703b588647 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -23,6 +23,7 @@ use crate::config::Config;
 use crate::rpc::RpcClient;
 use parking_lot::RwLock;
 use std::sync::Arc;
+use std::time::Duration;
 
 use crate::error::{Error, FlussError, Result};
 use crate::metadata::TablePath;
@@ -36,7 +37,22 @@ pub struct FlussConnection {
 
 impl FlussConnection {
     pub async fn new(arg: Config) -> Result<Self> {
-        let connections = Arc::new(RpcClient::new());
+        arg.validate_security()
+            .map_err(|msg| Error::IllegalArgument { message: msg })?;
+
+        let timeout = Duration::from_millis(arg.connect_timeout_ms);
+        let connections = if arg.is_sasl_enabled() {
+            Arc::new(
+                RpcClient::new()
+                    .with_sasl(
+                        arg.security_sasl_username.clone(),
+                        arg.security_sasl_password.clone(),
+                    )
+                    .with_timeout(timeout),
+            )
+        } else {
+            Arc::new(RpcClient::new().with_timeout(timeout))
+        };
         let metadata = Metadata::new(arg.bootstrap_servers.as_str(), connections.clone()).await?;
 
         Ok(FlussConnection {
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index a0d7e70716..438c948307 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -30,6 +30,9 @@ const DEFAULT_MAX_POLL_RECORDS: usize = 500;
 const DEFAULT_WRITER_BATCH_TIMEOUT_MS: i64 = 100;
 
 const DEFAULT_ACKS: &str = "all";
+const DEFAULT_CONNECT_TIMEOUT_MS: u64 = 120_000;
+const DEFAULT_SECURITY_PROTOCOL: &str = "PLAINTEXT";
+const DEFAULT_SASL_MECHANISM: &str = "PLAIN";
 
 /// Bucket assigner strategy for tables without bucket keys.
 /// Matches Java `client.writer.bucket.no-key-assigner`.
@@ -51,7 +54,7 @@ impl fmt::Display for NoKeyAssigner {
     }
 }
 
-#[derive(Parser, Debug, Clone, Deserialize, Serialize)]
+#[derive(Parser, Clone, Deserialize, Serialize)]
 #[command(author, version, about, long_about = None)]
 pub struct Config {
     #[arg(long, default_value_t = String::from(DEFAULT_BOOTSTRAP_SERVER))]
@@ -96,6 +99,58 @@ pub struct Config {
     /// Default: 100 (matching Java CLIENT_WRITER_BATCH_TIMEOUT)
     #[arg(long, default_value_t = DEFAULT_WRITER_BATCH_TIMEOUT_MS)]
     pub writer_batch_timeout_ms: i64,
+
+    /// Connect timeout in milliseconds for TCP transport connect.
+    /// Default: 120000 (120 seconds).
+    #[arg(long, default_value_t = DEFAULT_CONNECT_TIMEOUT_MS)]
+    pub connect_timeout_ms: u64,
+
+    #[arg(long, default_value_t = String::from(DEFAULT_SECURITY_PROTOCOL))]
+    pub security_protocol: String,
+
+    #[arg(long, default_value_t = String::from(DEFAULT_SASL_MECHANISM))]
+    pub security_sasl_mechanism: String,
+
+    #[arg(long, default_value_t = String::new())]
+    pub security_sasl_username: String,
+
+    #[arg(long, default_value_t = String::new())]
+    #[serde(skip_serializing, default)] // never written out, so it must default on read
+    pub security_sasl_password: String,
+}
+
+impl std::fmt::Debug for Config {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.debug_struct("Config") // NOTE(review): omits scanner_remote_log_read_concurrency
+            .field("bootstrap_servers", &self.bootstrap_servers)
+            .field("writer_request_max_size", &self.writer_request_max_size)
+            .field("writer_acks", &self.writer_acks)
+            .field("writer_retries", &self.writer_retries)
+            .field("writer_batch_size", &self.writer_batch_size)
+            .field(
+                "writer_bucket_no_key_assigner",
+                &self.writer_bucket_no_key_assigner,
+            )
+            .field(
+                "scanner_remote_log_prefetch_num",
+                &self.scanner_remote_log_prefetch_num,
+            )
+            .field(
+                "remote_file_download_thread_num",
+                &self.remote_file_download_thread_num,
+            )
+            .field(
+                "scanner_log_max_poll_records",
+                &self.scanner_log_max_poll_records,
+            )
+            .field("writer_batch_timeout_ms", &self.writer_batch_timeout_ms)
+            .field("connect_timeout_ms", &self.connect_timeout_ms)
+            .field("security_protocol", &self.security_protocol)
+            .field("security_sasl_mechanism", &self.security_sasl_mechanism)
+            .field("security_sasl_username", &self.security_sasl_username)
+            .field("security_sasl_password", &"[REDACTED]") // never print the real secret
+            .finish()
+    }
 }
 
 impl Default for Config {
@@ -112,6 +167,115 @@ impl Default for Config {
             scanner_remote_log_read_concurrency: DEFAULT_SCANNER_REMOTE_LOG_READ_CONCURRENCY,
             scanner_log_max_poll_records: DEFAULT_MAX_POLL_RECORDS,
             writer_batch_timeout_ms: DEFAULT_WRITER_BATCH_TIMEOUT_MS,
+            connect_timeout_ms: DEFAULT_CONNECT_TIMEOUT_MS,
+            security_protocol: String::from(DEFAULT_SECURITY_PROTOCOL),
+            security_sasl_mechanism: String::from(DEFAULT_SASL_MECHANISM),
+            security_sasl_username: String::new(),
+            security_sasl_password: String::new(),
+        }
+    }
+}
+
+impl Config {
+    /// Returns true when `security_protocol` equals `"sasl"`, compared ASCII
+    /// case-insensitively; every other value is treated as "no SASL".
+    /// Mirrors Java's `SaslAuthenticationPlugin`, which registers as `"sasl"`.
+    pub fn is_sasl_enabled(&self) -> bool {
+        self.security_protocol.eq_ignore_ascii_case("sasl")
+    }
+
+    /// Validates the security settings. Anything other than SASL passes
+    /// unchecked; with SASL the mechanism must be `PLAIN` (case-insensitive)
+    /// and username and password must both be non-empty, else `Err(message)`.
+    pub fn validate_security(&self) -> Result<(), String> {
+        if !self.is_sasl_enabled() {
+            return Ok(()); // the SASL fields are ignored for non-SASL protocols
+        }
+        if !self.security_sasl_mechanism.eq_ignore_ascii_case("PLAIN") {
+            return Err(format!(
+                "Unsupported SASL mechanism: '{}'. Only 'PLAIN' is supported.",
+                self.security_sasl_mechanism
+            ));
+        }
+        if self.security_sasl_username.is_empty() {
+            return Err(
+                "security_sasl_username must be set when security_protocol is 'sasl'".to_string(),
+            );
         }
+        if self.security_sasl_password.is_empty() {
+            return Err(
+                "security_sasl_password must be set when security_protocol is 'sasl'".to_string(),
+            );
+        }
+        Ok(())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_default_is_not_sasl() {
+        let config = Config::default(); // security_protocol defaults to "PLAINTEXT"
+        assert!(!config.is_sasl_enabled());
+        assert!(config.validate_security().is_ok());
+    }
+
+    #[test]
+    fn test_sasl_enabled_valid() {
+        let config = Config {
+            security_protocol: "sasl".to_string(),
+            security_sasl_mechanism: "PLAIN".to_string(),
+            security_sasl_username: "admin".to_string(),
+            security_sasl_password: "secret".to_string(),
+            ..Config::default()
+        };
+        assert!(config.is_sasl_enabled());
+        assert!(config.validate_security().is_ok());
+    }
+
+    #[test]
+    fn test_sasl_enabled_case_insensitive() {
+        let config = Config {
+            security_protocol: "SASL".to_string(), // upper-case on purpose
+            security_sasl_username: "admin".to_string(),
+            security_sasl_password: "secret".to_string(),
+            ..Config::default()
+        };
+        assert!(config.is_sasl_enabled());
+        assert!(config.validate_security().is_ok());
+    }
+
+    #[test]
+    fn test_sasl_missing_username() {
+        let config = Config {
+            security_protocol: "sasl".to_string(),
+            security_sasl_password: "secret".to_string(), // username stays empty
+            ..Config::default()
+        };
+        assert!(config.validate_security().is_err());
+    }
+
+    #[test]
+    fn test_sasl_missing_password() {
+        let config = Config {
+            security_protocol: "sasl".to_string(),
+            security_sasl_username: "admin".to_string(), // password stays empty
+            ..Config::default()
+        };
+        assert!(config.validate_security().is_err());
+    }
+
+    #[test]
+    fn test_sasl_unsupported_mechanism() {
+        let config = Config {
+            security_protocol: "sasl".to_string(),
+            security_sasl_mechanism: "SCRAM-SHA-256".to_string(), // only PLAIN is accepted
+            security_sasl_username: "admin".to_string(),
+            security_sasl_password: "secret".to_string(),
+            ..Config::default()
+        };
+        assert!(config.validate_security().is_err());
     }
 }
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index eca4cf3846..1c7ee7eb8f 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -408,4 +408,13 @@ message DropPartitionRequest {
   required bool ignore_if_not_exists = 3;
 }
 
-message DropPartitionResponse {}
\ No newline at end of file
+message DropPartitionResponse {}
+
+message AuthenticateRequest {
+  required string protocol = 1; // mechanism name; the Rust client sends "PLAIN"
+  required bytes token = 2; // mechanism-specific payload (PLAIN: \0user\0password)
+}
+
+message AuthenticateResponse {
+  optional bytes challenge = 1; // when present, the client treats it as a further auth round
+}
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index f6009c071e..4231fb03b3 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -40,6 +40,7 @@ pub enum ApiKey {
     GetLatestLakeSnapshot,
     CreatePartition,
     DropPartition,
+    Authenticate,
     Unknown(i16),
 }
 
@@ -67,6 +68,7 @@ impl From<i16> for ApiKey {
             1035 => ApiKey::GetDatabaseInfo,
             1036 => ApiKey::CreatePartition,
             1037 => ApiKey::DropPartition,
+            1038 => ApiKey::Authenticate,
             _ => Unknown(key),
         }
     }
@@ -96,6 +98,7 @@ impl From<ApiKey> for i16 {
             ApiKey::GetDatabaseInfo => 1035,
             ApiKey::CreatePartition => 1036,
             ApiKey::DropPartition => 1037,
+            ApiKey::Authenticate => 1038,
             Unknown(x) => x,
         }
     }
@@ -129,6 +132,7 @@ mod tests {
             (1035, ApiKey::GetDatabaseInfo),
             (1036, ApiKey::CreatePartition),
             (1037, ApiKey::DropPartition),
+            (1038, ApiKey::Authenticate),
         ];
 
         for (raw, key) in cases {
diff --git a/fluss-rust/crates/fluss/src/rpc/message/authenticate.rs b/fluss-rust/crates/fluss/src/rpc/message/authenticate.rs
new file mode 100644
index 0000000000..1292cdc919
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/authenticate.rs
@@ -0,0 +1,86 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::{AuthenticateRequest as ProtoAuthenticateRequest, AuthenticateResponse};
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug, Clone)] // NOTE(review): derived Debug likely prints `token`, incl. the password
+pub struct AuthenticateRequest {
+    pub inner_request: ProtoAuthenticateRequest, // protobuf body: protocol + token
+}
+
+impl AuthenticateRequest {
+    /// Build the initial SASL/PLAIN authenticate request (protocol `"PLAIN"`).
+    /// Token layout: `\0<username>\0<password>`, the raw UTF-8 bytes of each.
+    pub fn new_plain(username: &str, password: &str) -> Self {
+        let mut token = Vec::with_capacity(1 + username.len() + 1 + password.len());
+        token.push(0u8); // nothing before the first NUL: empty authzid (RFC 4616)
+        token.extend_from_slice(username.as_bytes());
+        token.push(0u8); // separator between username and password
+        token.extend_from_slice(password.as_bytes());
+
+        Self {
+            inner_request: ProtoAuthenticateRequest {
+                protocol: "PLAIN".to_string(),
+                token,
+            },
+        }
+    }
+
+    /// Build a follow-up request for `protocol` whose token is `challenge`, verbatim.
+    pub fn from_challenge(protocol: &str, challenge: Vec<u8>) -> Self {
+        Self {
+            inner_request: ProtoAuthenticateRequest {
+                protocol: protocol.to_string(),
+                token: challenge,
+            },
+        }
+    }
+}
+
+impl RequestBody for AuthenticateRequest {
+    type ResponseBody = AuthenticateResponse;
+    const API_KEY: ApiKey = ApiKey::Authenticate; // 1038 on the wire (see api_key.rs)
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(AuthenticateRequest);
+impl_read_version_type!(AuthenticateResponse);
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_new_plain_token_format() {
+        let req = AuthenticateRequest::new_plain("admin", "secret");
+        assert_eq!(req.inner_request.protocol, "PLAIN");
+        assert_eq!(req.inner_request.token, b"\0admin\0secret"); // NUL, user, NUL, password
+    }
+
+    #[test]
+    fn test_new_plain_empty_credentials() {
+        let req = AuthenticateRequest::new_plain("", "");
+        assert_eq!(req.inner_request.token, b"\0\0"); // only the two NUL separators remain
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index addb97a15f..9ad4545fb9 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -20,6 +20,7 @@ use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::{ReadError, WriteError};
 use bytes::{Buf, BufMut};
 
+mod authenticate;
 mod create_database;
 mod create_partition;
 mod create_table;
@@ -44,6 +45,7 @@ mod table_exists;
 mod update_metadata;
 
 pub use crate::rpc::RpcError;
+pub use authenticate::*;
 pub use create_database::*;
 pub use create_partition::*;
 pub use create_table::*;
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index a345c2fdc5..13c5d9ca09 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -29,6 +29,7 @@ use futures::future::BoxFuture;
 use log::warn;
 use parking_lot::{Mutex, RwLock};
 use std::collections::HashMap;
+use std::fmt;
 use std::io::Cursor;
 use std::ops::DerefMut;
 use std::sync::Arc;
@@ -44,12 +45,34 @@ pub type MessengerTransport = ServerConnectionInner<BufStream<Transport>>;
 
 pub type ServerConnection = Arc<MessengerTransport>;
 
+// Matches Java's ExponentialBackoff(100ms initial, 2x multiplier, 5000ms max, 0.2 jitter).
+const AUTH_INITIAL_BACKOFF_MS: f64 = 100.0;
+const AUTH_MAX_BACKOFF_MS: f64 = 5000.0;
+const AUTH_BACKOFF_MULTIPLIER: f64 = 2.0;
+const AUTH_JITTER: f64 = 0.2;
+
+#[derive(Clone)] // Debug is hand-written for this type so the password is redacted
+pub struct SaslConfig {
+    pub username: String,
+    pub password: String, // kept in clear text; sent inside the PLAIN token
+}
+
+impl fmt::Debug for SaslConfig {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        f.debug_struct("SaslConfig")
+            .field("username", &self.username)
+            .field("password", &"[REDACTED]") // fixed placeholder instead of the secret
+            .finish()
+    }
+}
+
 #[derive(Debug, Default)]
 pub struct RpcClient {
     connections: RwLock<HashMap<String, ServerConnection>>,
     client_id: Arc<str>,
     timeout: Option<Duration>,
     max_message_size: usize,
+    sasl_config: Option<SaslConfig>, // Some => connect() authenticates each new connection
 }
 
 impl RpcClient {
@@ -59,13 +82,24 @@ impl RpcClient {
             client_id: Arc::from(""),
             timeout: None,
             max_message_size: usize::MAX,
+            sasl_config: None,
         }
     }
 
+    pub fn with_timeout(mut self, timeout: Duration) -> Self {
+        let _previous = self.timeout.replace(timeout); // later handed to Transport::connect
+        self
+    }
+
+    pub fn with_sasl(mut self, username: String, password: String) -> Self {
+        let _previous = self.sasl_config.replace(SaslConfig { username, password });
+        self // connect() authenticates whenever sasl_config is Some
+    }
+
     pub async fn get_connection(
         &self,
         server_node: &ServerNode,
-    ) -> Result<ServerConnection, RpcError> {
+    ) -> Result<ServerConnection, Error> {
         let server_id = server_node.uid();
         {
             let connections = self.connections.read();
@@ -89,7 +123,7 @@ impl RpcClient {
         Ok(new_server)
     }
 
-    async fn connect(&self, server_node: &ServerNode) -> Result<ServerConnection, RpcError> {
+    async fn connect(&self, server_node: &ServerNode) -> Result<ServerConnection, Error> {
         let url = server_node.url();
         let transport = Transport::connect(&url, self.timeout)
             .await
@@ -100,7 +134,74 @@ impl RpcClient {
             self.max_message_size,
             self.client_id.clone(),
         );
-        Ok(ServerConnection::new(messenger))
+        let connection = ServerConnection::new(messenger);
+
+        if let Some(ref sasl) = self.sasl_config {
+            Self::authenticate(&connection, &sasl.username, &sasl.password).await?;
+        }
+
+        Ok(connection)
+    }
+
+    /// Perform the SASL/PLAIN authentication handshake on `connection`.
+    ///
+    /// A `RetriableAuthenticateException` response is retried without limit,
+    /// sleeping with jittered exponential backoff (100ms doubling up to 5s).
+    /// Every other error (wrong password, unknown user, request failure) is
+    /// returned unchanged; a challenge is answered once and not re-checked.
+    async fn authenticate(
+        connection: &ServerConnection,
+        username: &str,
+        password: &str,
+    ) -> Result<(), Error> {
+        use crate::rpc::fluss_api_error::FlussError;
+        use crate::rpc::message::AuthenticateRequest;
+        use rand::Rng;
+
+        let initial_request = AuthenticateRequest::new_plain(username, password);
+        let mut retry_count: u32 = 0;
+
+        loop {
+            let request = initial_request.clone();
+            let result = connection.request(request).await;
+
+            match result {
+                Ok(response) => {
+                    // A challenge means the server wants another round; PLAIN is
+                    // not expected to send one. NOTE(review): the challenge bytes are
+                    // echoed back unchanged as the token; confirm against the Java client.
+                    if let Some(challenge) = response.challenge {
+                        let challenge_req = AuthenticateRequest::from_challenge("PLAIN", challenge);
+                        connection.request(challenge_req).await?;
+                    }
+                    return Ok(());
+                }
+                Err(Error::FlussAPIError { ref api_error })
+                    if FlussError::for_code(api_error.code)
+                        == FlussError::RetriableAuthenticateException =>
+                {
+                    retry_count += 1;
+                    // Cap the exponent (not the product), like Java's
+                    // ExponentialBackoff.expMax, so the jitter still spreads delays
+                    // around AUTH_MAX_BACKOFF_MS once the cap has been reached.
+                    let exp_max = (AUTH_MAX_BACKOFF_MS / AUTH_INITIAL_BACKOFF_MS).log2();
+                    let exp = ((retry_count as f64) - 1.0).min(exp_max);
+                    let term = AUTH_INITIAL_BACKOFF_MS * AUTH_BACKOFF_MULTIPLIER.powf(exp);
+                    let jitter_factor =
+                        1.0 - AUTH_JITTER + rand::rng().random::<f64>() * (2.0 * AUTH_JITTER);
+                    let backoff_ms = (term * jitter_factor) as u64;
+                    log::warn!(
+                        "SASL authentication retriable failure (attempt {retry_count}), \
+                         retrying in {backoff_ms}ms: {}",
+                        api_error.message
+                    );
+                    tokio::time::sleep(Duration::from_millis(backoff_ms)).await;
+                }
+                // Anything else, server-side auth errors included, ends the
+                // handshake and is handed to the caller exactly as received.
+                Err(e) => return Err(e),
+            }
+        }
     }
 }
 
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index 350292316f..5bbdaf01dc 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -15,49 +15,19 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::integration::fluss_cluster::FlussTestingCluster;
-use parking_lot::RwLock;
-
-use std::sync::Arc;
-use std::sync::LazyLock;
-
-#[cfg(test)]
-use test_env_helpers::*;
-
-// Module-level shared cluster instance (only for this test file)
-static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>> =
-    LazyLock::new(|| Arc::new(RwLock::new(None)));
-
 #[cfg(test)]
-#[before_all]
-#[after_all]
 mod admin_test {
-    use super::SHARED_FLUSS_CLUSTER;
-    use crate::integration::fluss_cluster::FlussTestingCluster;
-    use crate::integration::utils::{get_cluster, start_cluster, stop_cluster};
+    use crate::integration::utils::get_shared_cluster;
     use fluss::error::FlussError;
     use fluss::metadata::{
         DataTypes, DatabaseDescriptorBuilder, KvFormat, LogFormat, PartitionSpec, Schema,
         TableDescriptor, TablePath,
     };
     use std::collections::HashMap;
-    use std::sync::Arc;
-
-    fn before_all() {
-        start_cluster("test-admin", SHARED_FLUSS_CLUSTER.clone());
-    }
-
-    fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
-        get_cluster(&SHARED_FLUSS_CLUSTER)
-    }
-
-    fn after_all() {
-        stop_cluster(SHARED_FLUSS_CLUSTER.clone());
-    }
 
     #[tokio::test]
     async fn test_create_database() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("should get admin");
@@ -97,13 +67,11 @@ mod admin_test {
 
         // database shouldn't exist now
         assert!(!admin.database_exists(db_name).await.unwrap());
-
-        // Note: We don't stop the shared cluster here as it's used by other tests
     }
 
     #[tokio::test]
     async fn test_create_table() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection
             .get_admin()
@@ -232,7 +200,7 @@ mod admin_test {
 
     #[tokio::test]
     async fn test_partition_apis() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection
             .get_admin()
@@ -371,7 +339,7 @@ mod admin_test {
 
     #[tokio::test]
     async fn test_fluss_error_response() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection
             .get_admin()
@@ -405,7 +373,7 @@ mod admin_test {
 
     #[tokio::test]
     async fn test_error_database_not_exist() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().await.unwrap();
 
@@ -424,7 +392,7 @@ mod admin_test {
 
     #[tokio::test]
     async fn test_error_database_already_exist() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().await.unwrap();
 
@@ -454,7 +422,7 @@ mod admin_test {
 
     #[tokio::test]
     async fn test_error_table_already_exist() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().await.unwrap();
 
@@ -502,7 +470,7 @@ mod admin_test {
 
     #[tokio::test]
     async fn test_error_table_not_exist() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().await.unwrap();
 
@@ -564,7 +532,7 @@ mod admin_test {
 
     #[tokio::test]
     async fn test_error_table_not_partitioned() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().await.unwrap();
 
diff --git a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
index e4dcad9fd9..a2e9157954 100644
--- a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
+++ b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
@@ -25,7 +25,8 @@ use testcontainers::core::ContainerPort;
 use testcontainers::runners::AsyncRunner;
 use testcontainers::{ContainerAsync, GenericImage, ImageExt};
 
-const FLUSS_VERSION: &str = "0.7.0";
+const FLUSS_VERSION: &str = "0.8.0-incubating";
+const FLUSS_IMAGE: &str = "apache/fluss";
 
 pub struct FlussTestingClusterBuilder {
     number_of_tablet_servers: i32,
@@ -33,9 +34,20 @@ pub struct FlussTestingClusterBuilder {
     cluster_conf: HashMap<String, String>,
     testing_name: String,
     remote_data_dir: Option<std::path::PathBuf>,
+    sasl_enabled: bool,
+    sasl_users: Vec<(String, String)>,
+    /// Host port for the coordinator server (default 9123).
+    coordinator_host_port: u16,
+    /// Host port for the plaintext (PLAIN_CLIENT) listener.
+    /// When set together with `sasl_enabled`, the cluster exposes two listeners:
+    /// CLIENT (SASL) on `coordinator_host_port` and PLAIN_CLIENT on this port.
+    plain_client_port: Option<u16>,
+    image: String,
+    image_tag: String,
 }
 
 impl FlussTestingClusterBuilder {
+    #[allow(dead_code)]
     pub fn new(testing_name: impl Into<String>) -> Self {
         Self::new_with_cluster_conf(testing_name.into(), &HashMap::default())
     }
@@ -47,6 +59,18 @@ impl FlussTestingClusterBuilder {
         self
     }
 
+    /// Enable SASL/PLAIN authentication on the cluster with dual listeners.
+    /// `users` holds `(username, password)` pairs. Besides the CLIENT (SASL)
+    /// listener this reserves a PLAIN_CLIENT (plaintext) listener 100 ports above
+    /// `coordinator_host_port`, so both kinds of client can reach one cluster.
+    /// NOTE: `build()` only injects the SASL server config when `users` is non-empty.
+    pub fn with_sasl(mut self, users: Vec<(String, String)>) -> Self {
+        self.sasl_enabled = true;
+        self.sasl_users = users;
+        self.plain_client_port = Some(self.coordinator_host_port + 100); // plaintext port
+        self
+    }
+
     pub fn new_with_cluster_conf(
         testing_name: impl Into<String>,
         conf: &HashMap<String, String>,
@@ -68,6 +92,12 @@ impl FlussTestingClusterBuilder {
             network: "fluss-cluster-network",
             testing_name: testing_name.into(),
             remote_data_dir: None,
+            sasl_enabled: false,
+            sasl_users: Vec::new(),
+            coordinator_host_port: 9123,
+            plain_client_port: None,
+            image: FLUSS_IMAGE.to_string(),
+            image_tag: FLUSS_VERSION.to_string(),
         }
     }
 
@@ -84,6 +114,43 @@ impl FlussTestingClusterBuilder {
     }
 
     pub async fn build(&mut self) -> FlussTestingCluster {
+        // Remove stale containers from previous runs (if any) so we can reuse names.
+        let stale_containers: Vec<String> = std::iter::once(self.zookeeper_container_name())
+            .chain(std::iter::once(self.coordinator_server_container_name()))
+            .chain(
+                (0..self.number_of_tablet_servers).map(|id| self.tablet_server_container_name(id)),
+            )
+            .collect();
+        for name in &stale_containers {
+            let _ = std::process::Command::new("docker")
+                .args(["rm", "-f", name])
+                .output();
+        }
+
+        // Inject SASL server-side configuration into cluster_conf
+        if self.sasl_enabled && !self.sasl_users.is_empty() {
+            self.cluster_conf.insert(
+                "security.protocol.map".to_string(),
+                "CLIENT:sasl".to_string(),
+            );
+            self.cluster_conf.insert(
+                "security.sasl.enabled.mechanisms".to_string(),
+                "plain".to_string(),
+            );
+            // Build JAAS config: user_<name>="<password>" for each user
+            let user_entries: Vec<String> = self
+                .sasl_users
+                .iter()
+                .map(|(u, p)| format!("user_{}=\"{}\"", u, p))
+                .collect();
+            let jaas_config = format!(
+                "org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required {};",
+                user_entries.join(" ")
+            );
+            self.cluster_conf
+                .insert("security.sasl.plain.jaas.config".to_string(), jaas_config);
+        }
+
         let zookeeper = Arc::new(
             GenericImage::new("zookeeper", "3.9.2")
                 .with_network(self.network)
@@ -103,64 +170,122 @@ impl FlussTestingClusterBuilder {
             );
         }
 
+        // When dual listeners are configured, bootstrap_servers points to the plaintext
+        // listener and sasl_bootstrap_servers points to the SASL listener.
+        let (bootstrap_servers, sasl_bootstrap_servers) =
+            if let Some(plain_port) = self.plain_client_port {
+                (
+                    format!("127.0.0.1:{}", plain_port),
+                    Some(format!("127.0.0.1:{}", self.coordinator_host_port)),
+                )
+            } else {
+                (format!("127.0.0.1:{}", self.coordinator_host_port), None)
+            };
+
         FlussTestingCluster {
             zookeeper,
             coordinator_server,
             tablet_servers,
-            bootstrap_servers: "127.0.0.1:9123".to_string(),
+            bootstrap_servers,
+            sasl_bootstrap_servers,
             remote_data_dir: self.remote_data_dir.clone(),
+            sasl_users: self.sasl_users.clone(),
+            container_names: stale_containers,
         }
     }
 
     async fn start_coordinator_server(&mut self) -> ContainerAsync<GenericImage> {
+        let port = self.coordinator_host_port;
+        let container_name = self.coordinator_server_container_name();
         let mut coordinator_confs = HashMap::new();
         coordinator_confs.insert(
             "zookeeper.address",
             format!("{}:2181", self.zookeeper_container_name()),
         );
-        coordinator_confs.insert(
-            "bind.listeners",
-            format!(
-                "INTERNAL://{}:0, CLIENT://{}:9123",
-                self.coordinator_server_container_name(),
-                self.coordinator_server_container_name()
-            ),
-        );
-        coordinator_confs.insert(
-            "advertised.listeners",
-            "CLIENT://localhost:9123".to_string(),
-        );
+
+        if let Some(plain_port) = self.plain_client_port {
+            // Dual listeners: CLIENT (SASL) + PLAIN_CLIENT (plaintext)
+            coordinator_confs.insert(
+                "bind.listeners",
+                format!(
+                    "INTERNAL://{}:0, CLIENT://{}:{}, PLAIN_CLIENT://{}:{}",
+                    container_name, container_name, port, container_name, plain_port
+                ),
+            );
+            coordinator_confs.insert(
+                "advertised.listeners",
+                format!(
+                    "CLIENT://localhost:{}, PLAIN_CLIENT://localhost:{}",
+                    port, plain_port
+                ),
+            );
+        } else {
+            coordinator_confs.insert(
+                "bind.listeners",
+                format!(
+                    "INTERNAL://{}:0, CLIENT://{}:{}",
+                    container_name, container_name, port
+                ),
+            );
+            coordinator_confs.insert(
+                "advertised.listeners",
+                format!("CLIENT://localhost:{}", port),
+            );
+        }
+
         coordinator_confs.insert("internal.listener.name", "INTERNAL".to_string());
-        GenericImage::new("fluss/fluss", FLUSS_VERSION)
+
+        let mut image = GenericImage::new(&self.image, &self.image_tag)
             .with_container_name(self.coordinator_server_container_name())
-            .with_mapped_port(9123, ContainerPort::Tcp(9123))
+            .with_mapped_port(port, ContainerPort::Tcp(port))
             .with_network(self.network)
             .with_cmd(vec!["coordinatorServer"])
             .with_env_var(
                 "FLUSS_PROPERTIES",
                 self.to_fluss_properties_with(coordinator_confs),
-            )
-            .start()
-            .await
-            .unwrap()
+            );
+
+        if let Some(plain_port) = self.plain_client_port {
+            image = image.with_mapped_port(plain_port, ContainerPort::Tcp(plain_port));
+        }
+
+        image.start().await.unwrap()
     }
 
     async fn start_tablet_server(&self, server_id: i32) -> ContainerAsync<GenericImage> {
+        let port = self.coordinator_host_port;
+        let container_name = self.tablet_server_container_name(server_id);
         let mut tablet_server_confs = HashMap::new();
-        let bind_listeners = format!(
-            "INTERNAL://{}:0, CLIENT://{}:9123",
-            self.tablet_server_container_name(server_id),
-            self.tablet_server_container_name(server_id),
-        );
-        let expose_host_port = 9124 + server_id;
-        let advertised_listeners = format!("CLIENT://localhost:{}", expose_host_port);
+        let expose_host_port = (port as i32) + 1 + server_id;
         let tablet_server_id = format!("{}", server_id);
+
+        if let Some(plain_port) = self.plain_client_port {
+            // Dual listeners: CLIENT (SASL) + PLAIN_CLIENT (plaintext)
+            let bind_listeners = format!(
+                "INTERNAL://{}:0, CLIENT://{}:{}, PLAIN_CLIENT://{}:{}",
+                container_name, container_name, port, container_name, plain_port,
+            );
+            let plain_expose_host_port = (plain_port as i32) + 1 + server_id;
+            let advertised_listeners = format!(
+                "CLIENT://localhost:{}, PLAIN_CLIENT://localhost:{}",
+                expose_host_port, plain_expose_host_port
+            );
+            tablet_server_confs.insert("bind.listeners", bind_listeners);
+            tablet_server_confs.insert("advertised.listeners", advertised_listeners);
+        } else {
+            let bind_listeners = format!(
+                "INTERNAL://{}:0, CLIENT://{}:{}",
+                container_name, container_name, port,
+            );
+            let advertised_listeners = format!("CLIENT://localhost:{}", expose_host_port);
+            tablet_server_confs.insert("bind.listeners", bind_listeners);
+            tablet_server_confs.insert("advertised.listeners", advertised_listeners);
+        }
+
         tablet_server_confs.insert(
             "zookeeper.address",
             format!("{}:2181", self.zookeeper_container_name()),
         );
-        tablet_server_confs.insert("bind.listeners", bind_listeners);
-        tablet_server_confs.insert("advertised.listeners", advertised_listeners);
         tablet_server_confs.insert("internal.listener.name", "INTERNAL".to_string());
         tablet_server_confs.insert("tablet-server.id", tablet_server_id);
 
@@ -172,9 +297,9 @@ impl FlussTestingClusterBuilder {
                 remote_data_dir.to_string_lossy().to_string(),
             );
         }
-        let mut image = GenericImage::new("fluss/fluss", FLUSS_VERSION)
+        let mut image = GenericImage::new(&self.image, &self.image_tag)
             .with_cmd(vec!["tabletServer"])
-            .with_mapped_port(expose_host_port as u16, ContainerPort::Tcp(9123))
+            .with_mapped_port(expose_host_port as u16, ContainerPort::Tcp(port))
             .with_network(self.network)
             .with_container_name(self.tablet_server_container_name(server_id))
             .with_env_var(
@@ -182,6 +307,15 @@ impl FlussTestingClusterBuilder {
                 self.to_fluss_properties_with(tablet_server_confs),
             );
 
+        // Add port mapping for plaintext listener
+        if let Some(plain_port) = self.plain_client_port {
+            let plain_expose_host_port = (plain_port as i32) + 1 + server_id;
+            image = image.with_mapped_port(
+                plain_expose_host_port as u16,
+                ContainerPort::Tcp(plain_port),
+            );
+        }
+
         // Add volume mount if remote_data_dir is provided
         if let Some(ref remote_data_dir) = self.remote_data_dir {
             use testcontainers::core::Mount;
@@ -210,35 +344,45 @@ impl FlussTestingClusterBuilder {
 
 /// Provides an easy way to launch a Fluss cluster with coordinator and tablet servers.
 #[derive(Clone)]
+#[allow(dead_code)] // Fields held for RAII (keeping Docker containers alive).
 pub struct FlussTestingCluster {
     zookeeper: Arc<ContainerAsync<GenericImage>>,
     coordinator_server: Arc<ContainerAsync<GenericImage>>,
     tablet_servers: HashMap<i32, Arc<ContainerAsync<GenericImage>>>,
+    /// Bootstrap servers for plaintext connections.
+    /// When dual listeners are configured, this points to the PLAIN_CLIENT listener.
     bootstrap_servers: String,
+    /// Bootstrap servers for SASL connections (only set when dual listeners are configured).
+    sasl_bootstrap_servers: Option<String>,
     remote_data_dir: Option<std::path::PathBuf>,
+    sasl_users: Vec<(String, String)>,
+    container_names: Vec<String>,
 }
 
 impl FlussTestingCluster {
-    pub async fn stop(&self) {
-        for tablet_server in self.tablet_servers.values() {
-            tablet_server.stop().await.unwrap()
+    /// Best-effort synchronous teardown: runs `docker rm -f` for each name in `container_names`
+    /// and deletes the remote data directory, ignoring errors. Usable without async (e.g. atexit).
+    #[allow(dead_code)]
+    pub fn stop(&self) {
+        for name in &self.container_names {
+            let _ = std::process::Command::new("docker")
+                .args(["rm", "-f", name])
+                .output();
         }
-        self.coordinator_server.stop().await.unwrap();
-        self.zookeeper.stop().await.unwrap();
-        if let Some(remote_data_dir) = &self.remote_data_dir {
-            // Try to clean up the remote data directory, but don't fail if it can't be deleted.
-            // This can happen in CI environments or if Docker containers are still using the directory.
-            // The directory will be cleaned up by the CI system or OS eventually.
-            if let Err(e) = tokio::fs::remove_dir_all(remote_data_dir).await {
-                eprintln!(
-                    "Warning: Failed to delete remote data directory: {:?}, error: {:?}. \
-                     This is non-fatal and the directory may be cleaned up later.",
-                    remote_data_dir, e
-                );
-            }
+        if let Some(ref dir) = self.remote_data_dir {
+            let _ = std::fs::remove_dir_all(dir);
         }
     }
 
+    pub fn sasl_users(&self) -> &[(String, String)] {
+        &self.sasl_users
+    }
+
+    /// Returns the plaintext (non-SASL) bootstrap servers address.
+    pub fn plaintext_bootstrap_servers(&self) -> &str {
+        &self.bootstrap_servers
+    }
+
     pub async fn get_fluss_connection(&self) -> FlussConnection {
         let config = Config {
             writer_acks: "all".to_string(),
@@ -246,6 +390,58 @@ impl FlussTestingCluster {
             ..Default::default()
         };
 
+        self.connect_with_retry(config).await
+    }
+
+    /// Connect with SASL/PLAIN credentials.
+    /// Uses `sasl_bootstrap_servers` when dual listeners are configured.
+    pub async fn get_fluss_connection_with_sasl(
+        &self,
+        username: &str,
+        password: &str,
+    ) -> FlussConnection {
+        let bootstrap = self
+            .sasl_bootstrap_servers
+            .clone()
+            .unwrap_or_else(|| self.bootstrap_servers.clone());
+        let config = Config {
+            writer_acks: "all".to_string(),
+            bootstrap_servers: bootstrap,
+            security_protocol: "sasl".to_string(),
+            security_sasl_mechanism: "PLAIN".to_string(),
+            security_sasl_username: username.to_string(),
+            security_sasl_password: password.to_string(),
+            ..Default::default()
+        };
+
+        self.connect_with_retry(config).await
+    }
+
+    /// Try to connect with SASL/PLAIN credentials, returning the error on failure.
+    /// Uses `sasl_bootstrap_servers` when dual listeners are configured.
+    pub async fn try_fluss_connection_with_sasl(
+        &self,
+        username: &str,
+        password: &str,
+    ) -> fluss::error::Result<FlussConnection> {
+        let bootstrap = self
+            .sasl_bootstrap_servers
+            .clone()
+            .unwrap_or_else(|| self.bootstrap_servers.clone());
+        let config = Config {
+            writer_acks: "all".to_string(),
+            bootstrap_servers: bootstrap,
+            security_protocol: "sasl".to_string(),
+            security_sasl_mechanism: "PLAIN".to_string(),
+            security_sasl_username: username.to_string(),
+            security_sasl_password: password.to_string(),
+            ..Default::default()
+        };
+
+        FlussConnection::new(config).await
+    }
+
+    async fn connect_with_retry(&self, config: Config) -> FlussConnection {
         // Retry mechanism: retry for up to 1 minute
         let max_retries = 60; // 60 retry attempts
         let retry_interval = Duration::from_secs(1); // 1 second interval between retries
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index c101a18941..f0e0c5793d 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -16,42 +16,11 @@
  * limitations under the License.
  */
 
-use parking_lot::RwLock;
-use std::sync::Arc;
-use std::sync::LazyLock;
-
-use crate::integration::fluss_cluster::FlussTestingCluster;
 #[cfg(test)]
-use test_env_helpers::*;
-
-// Module-level shared cluster instance (only for this test file)
-static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>> =
-    LazyLock::new(|| Arc::new(RwLock::new(None)));
-
-#[cfg(test)]
-#[before_all]
-#[after_all]
 mod kv_table_test {
-    use super::SHARED_FLUSS_CLUSTER;
-    use crate::integration::fluss_cluster::FlussTestingCluster;
-    use crate::integration::utils::{
-        create_partitions, create_table, get_cluster, start_cluster, stop_cluster,
-    };
+    use crate::integration::utils::{create_partitions, create_table, get_shared_cluster};
     use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
     use fluss::row::{GenericRow, InternalRow};
-    use std::sync::Arc;
-
-    fn before_all() {
-        start_cluster("test_kv_table", SHARED_FLUSS_CLUSTER.clone());
-    }
-
-    fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
-        get_cluster(&SHARED_FLUSS_CLUSTER)
-    }
-
-    fn after_all() {
-        stop_cluster(SHARED_FLUSS_CLUSTER.clone());
-    }
 
     fn make_key(id: i32) -> GenericRow<'static> {
         let mut row = GenericRow::new(3);
@@ -61,7 +30,7 @@ mod kv_table_test {
 
     #[tokio::test]
     async fn upsert_delete_and_lookup() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.unwrap();
@@ -200,7 +169,7 @@ mod kv_table_test {
 
     #[tokio::test]
     async fn composite_primary_keys() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.unwrap();
@@ -310,7 +279,7 @@ mod kv_table_test {
     async fn partial_update() {
         use fluss::row::Datum;
 
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
@@ -431,7 +400,7 @@ mod kv_table_test {
 
     #[tokio::test]
     async fn partitioned_table_upsert_and_lookup() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
@@ -601,7 +570,7 @@ mod kv_table_test {
     async fn all_supported_datatypes() {
         use fluss::row::{Date, Datum, Decimal, Time, TimestampLtz, TimestampNtz};
 
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 779ffdd319..4aa88ac4e0 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -16,55 +16,21 @@
  * limitations under the License.
  */
 
-use parking_lot::RwLock;
-use std::sync::Arc;
-use std::sync::LazyLock;
-
-use crate::integration::fluss_cluster::FlussTestingCluster;
-#[cfg(test)]
-use test_env_helpers::*;
-
-// Module-level shared cluster instance (only for this test file)
-static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>> =
-    LazyLock::new(|| Arc::new(RwLock::new(None)));
-
 #[cfg(test)]
-#[before_all]
-#[after_all]
 mod table_test {
-    use super::SHARED_FLUSS_CLUSTER;
-    use crate::integration::fluss_cluster::FlussTestingCluster;
-    use crate::integration::utils::{
-        create_partitions, create_table, get_cluster, start_cluster, stop_cluster,
-    };
+    use crate::integration::utils::{create_partitions, create_table, get_shared_cluster};
     use arrow::array::record_batch;
     use fluss::client::{EARLIEST_OFFSET, FlussTable, TableScan};
     use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
     use fluss::record::ScanRecord;
     use fluss::row::InternalRow;
     use fluss::rpc::message::OffsetSpec;
-    use jiff::Timestamp;
     use std::collections::HashMap;
-    use std::sync::Arc;
-    use std::sync::atomic::AtomicUsize;
-    use std::sync::atomic::Ordering;
     use std::time::Duration;
 
-    fn before_all() {
-        start_cluster("test_table", SHARED_FLUSS_CLUSTER.clone());
-    }
-
-    fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
-        get_cluster(&SHARED_FLUSS_CLUSTER)
-    }
-
-    fn after_all() {
-        stop_cluster(SHARED_FLUSS_CLUSTER.clone());
-    }
-
     #[tokio::test]
     async fn append_record_batch_and_scan() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
@@ -174,7 +140,7 @@ mod table_test {
 
     #[tokio::test]
     async fn list_offsets() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
@@ -221,8 +187,6 @@ mod table_test {
             "Latest offset should be 0 for empty table"
         );
 
-        let before_append_ms = Timestamp::now().as_millisecond();
-
         // Append some records
         let append_writer = connection
             .get_table(&table_path)
@@ -247,8 +211,6 @@ mod table_test {
 
         tokio::time::sleep(tokio::time::Duration::from_secs(1)).await;
 
-        let after_append_ms = Timestamp::now().as_millisecond();
-
         // Test latest offset after appending (should be 3)
         let latest_offsets_after = admin
             .list_offsets(&table_path, &[0], OffsetSpec::Latest)
@@ -273,34 +235,65 @@ mod table_test {
             "Earliest offset should still be 0"
         );
 
-        // Test list_offsets_by_timestamp
+        // Scan records back to get server-assigned timestamps (avoids host/container
+        // clock skew issues that make host-based timestamps unreliable).
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let log_scanner = table
+            .new_scan()
+            .create_log_scanner()
+            .expect("Failed to create log scanner");
+        log_scanner
+            .subscribe(0, EARLIEST_OFFSET)
+            .await
+            .expect("Failed to subscribe");
+
+        let mut record_timestamps: Vec<i64> = Vec::new();
+        let scan_start = std::time::Instant::now();
+        while record_timestamps.len() < 3 && scan_start.elapsed() < Duration::from_secs(10) {
+            let scan_records = log_scanner
+                .poll(Duration::from_millis(500))
+                .await
+                .expect("Failed to poll records");
+            for rec in scan_records {
+                record_timestamps.push(rec.timestamp());
+            }
+        }
+        assert_eq!(record_timestamps.len(), 3, "Expected 3 record timestamps");
+
+        let min_ts = *record_timestamps.iter().min().unwrap();
+        let max_ts = *record_timestamps.iter().max().unwrap();
 
-        let timestamp_offsets = admin
-            .list_offsets(&table_path, &[0], OffsetSpec::Timestamp(before_append_ms))
+        // Timestamp before all records should resolve to offset 0
+        let before_offsets = admin
+            .list_offsets(&table_path, &[0], OffsetSpec::Timestamp(min_ts - 1))
             .await
-            .expect("Failed to list offsets by timestamp");
+            .expect("Failed to list offsets by timestamp (before)");
 
         assert_eq!(
-            timestamp_offsets.get(&0),
+            before_offsets.get(&0),
             Some(&0),
-            "Timestamp before append should resolve to offset 0 (start of new data)"
+            "Timestamp before first record should resolve to offset 0"
         );
 
-        let timestamp_offsets = admin
-            .list_offsets(&table_path, &[0], OffsetSpec::Timestamp(after_append_ms))
+        // Timestamp after all records should resolve to offset 3
+        let after_offsets = admin
+            .list_offsets(&table_path, &[0], OffsetSpec::Timestamp(max_ts + 1))
             .await
-            .expect("Failed to list offsets by timestamp");
+            .expect("Failed to list offsets by timestamp (after)");
 
         assert_eq!(
-            timestamp_offsets.get(&0),
+            after_offsets.get(&0),
             Some(&3),
-            "Timestamp after append should resolve to offset 0 (no newer records)"
+            "Timestamp after last record should resolve to offset 3"
         );
     }
 
     #[tokio::test]
     async fn test_project() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
@@ -456,7 +449,7 @@ mod table_test {
 
     #[tokio::test]
     async fn test_poll_batches() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
@@ -588,7 +581,7 @@ mod table_test {
     async fn all_supported_datatypes() {
         use fluss::row::{Date, Datum, Decimal, GenericRow, Time, TimestampLtz, TimestampNtz};
 
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
@@ -1019,7 +1012,7 @@ mod table_test {
 
     #[tokio::test]
     async fn partitioned_table_append_scan() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
@@ -1314,7 +1307,7 @@ mod table_test {
 
     #[tokio::test]
     async fn undersized_row_returns_error() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
diff --git a/fluss-rust/crates/fluss/tests/integration/sasl_auth.rs b/fluss-rust/crates/fluss/tests/integration/sasl_auth.rs
new file mode 100644
index 0000000000..878c9830ac
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/sasl_auth.rs
@@ -0,0 +1,149 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#[cfg(test)]
+mod sasl_auth_test {
+    use crate::integration::utils::get_shared_cluster;
+    use fluss::client::FlussConnection;
+    use fluss::config::Config;
+    use fluss::error::FlussError;
+    use fluss::metadata::DatabaseDescriptorBuilder;
+
+    const SASL_USERNAME: &str = "admin";
+    const SASL_PASSWORD: &str = "admin-secret";
+
+    /// Verify that a client with correct SASL credentials can connect and perform operations.
+    #[tokio::test]
+    async fn test_sasl_connect_with_valid_credentials() {
+        let cluster = get_shared_cluster();
+        let connection = cluster
+            .get_fluss_connection_with_sasl(SASL_USERNAME, SASL_PASSWORD)
+            .await;
+
+        let admin = connection
+            .get_admin()
+            .await
+            .expect("Should get admin with valid SASL credentials");
+
+        // Perform a basic operation to confirm the connection is fully functional
+        let db_name = "sasl_test_valid_db";
+        let descriptor = DatabaseDescriptorBuilder::default()
+            .comment("created via SASL auth")
+            .build();
+
+        admin
+            .create_database(db_name, Some(&descriptor), true)
+            .await
+            .expect("Should create database with SASL auth");
+
+        assert!(admin.database_exists(db_name).await.unwrap());
+
+        // Cleanup
+        admin
+            .drop_database(db_name, true, true)
+            .await
+            .expect("Should drop database");
+    }
+
+    /// Verify that a second user can also authenticate successfully.
+    #[tokio::test]
+    async fn test_sasl_connect_with_second_user() {
+        let cluster = get_shared_cluster();
+        let connection = cluster
+            .get_fluss_connection_with_sasl("alice", "alice-secret")
+            .await;
+
+        let admin = connection
+            .get_admin()
+            .await
+            .expect("Should get admin with alice credentials");
+
+        // Basic operation to confirm functional connection
+        assert!(
+            admin
+                .database_exists("some_nonexistent_db_alice")
+                .await
+                .is_ok()
+        );
+    }
+
+    /// Verify that wrong credentials are rejected with a typed AuthenticateException error.
+    #[tokio::test]
+    async fn test_sasl_connect_with_wrong_password() {
+        let cluster = get_shared_cluster();
+        let result = cluster
+            .try_fluss_connection_with_sasl(SASL_USERNAME, "wrong-password")
+            .await;
+
+        let err = match result {
+            Err(e) => e,
+            Ok(_) => panic!("Connection with wrong password should fail"),
+        };
+
+        // The server error code must be preserved (not wrapped in a generic string).
+        // Code 46 = AuthenticateException — this is what C++ and Python bindings
+        // use to distinguish auth failures from network errors.
+        assert_eq!(
+            err.api_error(),
+            Some(FlussError::AuthenticateException),
+            "Wrong password should produce AuthenticateException, got: {err}"
+        );
+    }
+
+    /// Verify that a SASL-configured client fails when connecting to a plaintext server.
+    #[tokio::test]
+    async fn test_sasl_client_to_plaintext_server() {
+        let cluster = get_shared_cluster();
+        let plaintext_addr = cluster.plaintext_bootstrap_servers().to_string();
+
+        let config = Config {
+            writer_acks: "all".to_string(),
+            bootstrap_servers: plaintext_addr,
+            security_protocol: "sasl".to_string(),
+            security_sasl_mechanism: "PLAIN".to_string(),
+            security_sasl_username: SASL_USERNAME.to_string(),
+            security_sasl_password: SASL_PASSWORD.to_string(),
+            ..Default::default()
+        };
+
+        let result = FlussConnection::new(config).await;
+        assert!(
+            result.is_err(),
+            "SASL client connecting to plaintext server should fail"
+        );
+    }
+
+    /// Verify that a nonexistent user is rejected with a typed error.
+    #[tokio::test]
+    async fn test_sasl_connect_with_unknown_user() {
+        let cluster = get_shared_cluster();
+        let result = cluster
+            .try_fluss_connection_with_sasl("nonexistent_user", "some-password")
+            .await;
+
+        let err = match result {
+            Err(e) => e,
+            Ok(_) => panic!("Connection with unknown user should fail"),
+        };
+
+        assert_eq!(
+            err.api_error(),
+            Some(FlussError::AuthenticateException),
+            "Unknown user should produce AuthenticateException, got: {err}"
+        );
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index fcd67738ab..52b8974e95 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -15,107 +15,22 @@
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */
-use crate::integration::fluss_cluster::FlussTestingCluster;
-use parking_lot::RwLock;
-use std::sync::Arc;
-use std::sync::LazyLock;
 
 #[cfg(test)]
-use test_env_helpers::*;
-
-// Module-level shared cluster instance (only for this test file)
-static SHARED_FLUSS_CLUSTER: LazyLock<Arc<RwLock<Option<FlussTestingCluster>>>> =
-    LazyLock::new(|| Arc::new(RwLock::new(None)));
-
-#[cfg(test)]
-#[before_all]
-#[after_all]
 mod table_remote_scan_test {
-    use super::SHARED_FLUSS_CLUSTER;
-    use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
-    use crate::integration::utils::{
-        create_table, get_cluster, stop_cluster, wait_for_cluster_ready,
-    };
+    use crate::integration::utils::{create_table, get_shared_cluster};
     use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
     use fluss::row::{GenericRow, InternalRow};
-    use std::collections::HashMap;
-    use std::sync::Arc;
-    use std::sync::atomic::AtomicUsize;
-    use std::thread;
     use std::time::Duration;
-    use uuid::Uuid;
-    fn before_all() {
-        // Create a new tokio runtime in a separate thread
-        let cluster_lock = SHARED_FLUSS_CLUSTER.clone();
-        thread::spawn(move || {
-            let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
-            rt.block_on(async {
-                // Create a temporary directory for remote data that can be accessed from both
-                // container and host. Use a fixed path so it's the same in container and host.
-                // On macOS, Docker Desktop may have issues with /tmp, so we use a path in the
-                // current working directory or user's home directory which Docker can access.
-                let temp_dir = std::env::current_dir()
-                    .unwrap_or_else(|_| std::path::PathBuf::from("."))
-                    .join("target")
-                    .join(format!("test-remote-data-{}", Uuid::new_v4()));
-
-                // Remove existing directory if it exists to start fresh
-                let _ = std::fs::remove_dir_all(&temp_dir);
-                std::fs::create_dir_all(&temp_dir)
-                    .expect("Failed to create temporary directory for remote data");
-                println!("temp_dir: {:?}", temp_dir);
-
-                // Verify directory was created and is accessible
-                if !temp_dir.exists() {
-                    panic!("Remote data directory was not created: {:?}", temp_dir);
-                }
-
-                // Get absolute path for Docker mount
-                let temp_dir = temp_dir
-                    .canonicalize()
-                    .expect("Failed to canonicalize remote data directory path");
-
-                let mut cluster_conf = HashMap::new();
-                // set to a small size to make data can be tiered to remote
-                cluster_conf.insert("log.segment.file-size".to_string(), "120b".to_string());
-                cluster_conf.insert(
-                    "remote.log.task-interval-duration".to_string(),
-                    "1s".to_string(),
-                );
-                // remote.data.dir uses the same path in container and host
-                cluster_conf.insert(
-                    "remote.data.dir".to_string(),
-                    temp_dir.to_string_lossy().to_string(),
-                );
-
-                let cluster = FlussTestingClusterBuilder::new_with_cluster_conf(
-                    "test_table_remote",
-                    &cluster_conf,
-                )
-                .with_remote_data_dir(temp_dir)
-                .build()
-                .await;
-                wait_for_cluster_ready(&cluster).await;
-                let mut guard = cluster_lock.write();
-                *guard = Some(cluster);
-            });
-        })
-        .join()
-        .expect("Failed to create cluster");
-    }
-
-    fn after_all() {
-        stop_cluster(SHARED_FLUSS_CLUSTER.clone());
-    }
 
     #[tokio::test]
     async fn test_scan_remote_log() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
         let admin = connection.get_admin().await.expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss", "test_append_record_batch_and_scan");
+        let table_path = TablePath::new("fluss", "test_scan_remote_log");
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
@@ -206,8 +121,4 @@ mod table_remote_scan_test {
             );
         }
     }
-
-    fn get_fluss_cluster() -> Arc<FlussTestingCluster> {
-        get_cluster(&SHARED_FLUSS_CLUSTER)
-    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index ae61d3ad68..b53abc8609 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -18,20 +18,97 @@
 use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
 use fluss::client::FlussAdmin;
 use fluss::metadata::{PartitionSpec, TableDescriptor, TablePath};
-use parking_lot::RwLock;
 use std::collections::HashMap;
 use std::sync::Arc;
+use std::sync::LazyLock;
 use std::time::Duration;
 
-/// Polls the cluster until CoordinatorEventProcessor is initialized and tablet server is available.
-/// Times out after 20 seconds.
-pub async fn wait_for_cluster_ready(cluster: &FlussTestingCluster) {
-    let timeout = Duration::from_secs(20);
+extern "C" fn cleanup_on_exit() {
+    SHARED_CLUSTER.stop();
+}
+
+/// Shared cluster with dual listeners: PLAIN_CLIENT (plaintext) on port 9223
+/// and CLIENT (SASL) on port 9123. Includes remote storage config so
+/// table_remote_scan can also use this cluster.
+static SHARED_CLUSTER: LazyLock<FlussTestingCluster> = LazyLock::new(|| {
+    std::thread::spawn(|| {
+        let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
+        rt.block_on(async {
+            let temp_dir = std::env::current_dir()
+                .unwrap_or_else(|_| std::path::PathBuf::from("."))
+                .join("target")
+                .join(format!("test-remote-data-{}", uuid::Uuid::new_v4()));
+            let _ = std::fs::remove_dir_all(&temp_dir);
+            std::fs::create_dir_all(&temp_dir)
+                .expect("Failed to create temporary directory for remote data");
+            let temp_dir = temp_dir
+                .canonicalize()
+                .expect("Failed to canonicalize remote data directory path");
+
+            let mut cluster_conf = HashMap::new();
+            cluster_conf.insert("log.segment.file-size".to_string(), "120b".to_string());
+            cluster_conf.insert(
+                "remote.log.task-interval-duration".to_string(),
+                "1s".to_string(),
+            );
+
+            let cluster =
+                FlussTestingClusterBuilder::new_with_cluster_conf("shared-test", &cluster_conf)
+                    .with_sasl(vec![
+                        ("admin".to_string(), "admin-secret".to_string()),
+                        ("alice".to_string(), "alice-secret".to_string()),
+                    ])
+                    .with_remote_data_dir(temp_dir)
+                    .build()
+                    .await;
+            wait_for_cluster_ready_with_sasl(&cluster).await;
+
+            // Register cleanup so containers are removed on process exit.
+            unsafe {
+                unsafe extern "C" {
+                    fn atexit(f: extern "C" fn()) -> std::os::raw::c_int;
+                }
+                atexit(cleanup_on_exit);
+            }
+
+            cluster
+        })
+    })
+    .join()
+    .expect("Failed to initialize shared cluster")
+});
+
+/// Returns a new `Arc` holding a clone of the lazily initialized shared test cluster.
+pub fn get_shared_cluster() -> Arc<FlussTestingCluster> {
+    Arc::new(SHARED_CLUSTER.clone())
+}
+
+pub async fn create_table(
+    admin: &FlussAdmin,
+    table_path: &TablePath,
+    table_descriptor: &TableDescriptor,
+) {
+    admin
+        .create_table(table_path, table_descriptor, false)
+        .await
+        .expect("Failed to create table");
+}
+
+/// Polls the cluster over SASL (first configured user) until it is ready; panics after a 30s timeout.
+pub async fn wait_for_cluster_ready_with_sasl(cluster: &FlussTestingCluster) {
+    let timeout = Duration::from_secs(30);
     let poll_interval = Duration::from_millis(500);
     let start = std::time::Instant::now();
 
+    let (username, password) = cluster
+        .sasl_users()
+        .first()
+        .expect("SASL cluster must have at least one user");
+
     loop {
-        let connection = cluster.get_fluss_connection().await;
+        let connection = cluster
+            .get_fluss_connection_with_sasl(username, password)
+            .await;
         if connection.get_admin().await.is_ok()
             && connection
                 .get_metadata()
@@ -44,7 +121,7 @@ pub async fn wait_for_cluster_ready(cluster: &FlussTestingCluster) {
 
         if start.elapsed() >= timeout {
             panic!(
-                "Server readiness check timed out after {} seconds. \
+                "SASL server readiness check timed out after {} seconds. \
                  CoordinatorEventProcessor may not be initialized or TabletServer may not be available.",
                 timeout.as_secs()
             );
@@ -54,56 +131,6 @@ pub async fn wait_for_cluster_ready(cluster: &FlussTestingCluster) {
     }
 }
 
-pub async fn create_table(
-    admin: &FlussAdmin,
-    table_path: &TablePath,
-    table_descriptor: &TableDescriptor,
-) {
-    admin
-        .create_table(&table_path, &table_descriptor, false)
-        .await
-        .expect("Failed to create table");
-}
-
-pub fn start_cluster(name: &str, cluster_lock: Arc<RwLock<Option<FlussTestingCluster>>>) {
-    let name = name.to_string();
-    std::thread::spawn(move || {
-        let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
-        rt.block_on(async {
-            let cluster = FlussTestingClusterBuilder::new(&name).build().await;
-            wait_for_cluster_ready(&cluster).await;
-            let mut guard = cluster_lock.write();
-            *guard = Some(cluster);
-        });
-    })
-    .join()
-    .expect("Failed to create cluster");
-}
-
-pub fn stop_cluster(cluster_lock: Arc<RwLock<Option<FlussTestingCluster>>>) {
-    std::thread::spawn(move || {
-        let rt = tokio::runtime::Runtime::new().expect("Failed to create runtime");
-        rt.block_on(async {
-            let mut guard = cluster_lock.write();
-            if let Some(cluster) = guard.take() {
-                cluster.stop().await;
-            }
-        });
-    })
-    .join()
-    .expect("Failed to cleanup cluster");
-}
-
-pub fn get_cluster(cluster_lock: &RwLock<Option<FlussTestingCluster>>) -> Arc<FlussTestingCluster> {
-    let guard = cluster_lock.read();
-    Arc::new(
-        guard
-            .as_ref()
-            .expect("Fluss cluster not initialized. Make sure before_all() was called.")
-            .clone(),
-    )
-}
-
 /// Creates partitions for a partitioned table.
 ///
 /// # Arguments
diff --git a/fluss-rust/crates/fluss/tests/test_fluss.rs b/fluss-rust/crates/fluss/tests/test_fluss.rs
index a6cc27a952..967564693e 100644
--- a/fluss-rust/crates/fluss/tests/test_fluss.rs
+++ b/fluss-rust/crates/fluss/tests/test_fluss.rs
@@ -24,6 +24,7 @@ mod integration {
     mod fluss_cluster;
     mod kv_table;
     mod log_table;
+    mod sasl_auth;
 
     mod utils;
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/error-handling.md b/fluss-rust/website/docs/user-guide/cpp/error-handling.md
index 76b03e3e97..3ded0c2d17 100644
--- a/fluss-rust/website/docs/user-guide/cpp/error-handling.md
+++ b/fluss-rust/website/docs/user-guide/cpp/error-handling.md
@@ -94,6 +94,7 @@ if (!result.Ok()) {
 | `ErrorCode::PARTITION_ALREADY_EXISTS`         | 42   | Partition already exists            |
 | `ErrorCode::PARTITION_SPEC_INVALID_EXCEPTION` | 43   | Invalid partition spec              |
 | `ErrorCode::LEADER_NOT_AVAILABLE_EXCEPTION`   | 44   | No leader available for partition   |
+| `ErrorCode::AUTHENTICATE_EXCEPTION`           | 46   | Authentication failed (bad credentials) |
 
 See `fluss::ErrorCode` in `fluss.hpp` for the full list of named constants.
 
@@ -147,6 +148,26 @@ if (!result.Ok()) {
 }
 ```
 
+### Authentication Failed
+
+SASL credentials are incorrect or the user does not exist:
+
+```cpp
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+config.security_protocol = "sasl";
+config.security_sasl_username = "admin";
+config.security_sasl_password = "wrong-password";
+
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
+if (!result.Ok()) {
+    if (result.error_code == fluss::ErrorCode::AUTHENTICATE_EXCEPTION) {
+        std::cerr << "Authentication failed: " << result.error_message << std::endl;
+    }
+}
+```
+
 ### Schema Mismatch
 
 Using incorrect types or column indices when writing:
diff --git a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
index 2245ee1bf1..f4b6309b8b 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
@@ -25,15 +25,32 @@ All fields have sensible defaults. Only `bootstrap_servers` typically needs to b
 
 ```cpp
 fluss::Configuration config;
-config.bootstrap_servers = "127.0.0.1:9123";    // Coordinator address
-config.writer_request_max_size = 10 * 1024 * 1024;     // Max request size (10 MB)
-config.writer_acks = "all";                      // Wait for all replicas
-config.writer_retries = std::numeric_limits<int32_t>::max();  // Retry on failure
-config.writer_batch_size = 2 * 1024 * 1024;     // Batch size (2 MB)
-config.writer_batch_timeout_ms = 100;           // Max time to wait for a batch to fill
-config.writer_bucket_no_key_assigner = "sticky"; // "sticky" or "round_robin"
-config.scanner_remote_log_prefetch_num = 4;      // Remote log prefetch count
-config.remote_file_download_thread_num = 3;  // Download threads
-config.scanner_remote_log_read_concurrency = 4;   // In-file remote log read concurrency
-config.scanner_log_max_poll_records = 500;        // Max records returned per poll()
+config.bootstrap_servers = "127.0.0.1:9123";                  // Coordinator address
+config.writer_request_max_size = 10 * 1024 * 1024;            // Max request size (10 MB)
+config.writer_acks = "all";                                    // Wait for all replicas
+config.writer_retries = std::numeric_limits<int32_t>::max();   // Retry on failure
+config.writer_batch_size = 2 * 1024 * 1024;                   // Batch size (2 MB)
+config.writer_batch_timeout_ms = 100;                          // Max time to wait for a batch to fill
+config.writer_bucket_no_key_assigner = "sticky";               // "sticky" or "round_robin"
+config.scanner_remote_log_prefetch_num = 4;                    // Remote log prefetch count
+config.remote_file_download_thread_num = 3;                    // Download threads
+config.scanner_remote_log_read_concurrency = 4;                // In-file remote log read concurrency
+config.scanner_log_max_poll_records = 500;                     // Max records per poll
+config.connect_timeout_ms = 120000;                            // TCP connect timeout (ms)
+```
+
+## SASL Authentication
+
+To connect to a Fluss cluster with SASL/PLAIN authentication enabled:
+
+```cpp
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+config.security_protocol = "sasl";
+config.security_sasl_mechanism = "PLAIN";
+config.security_sasl_username = "admin";
+config.security_sasl_password = "admin-secret";
+
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
 ```
diff --git a/fluss-rust/website/docs/user-guide/python/error-handling.md b/fluss-rust/website/docs/user-guide/python/error-handling.md
index 9fa482190a..50a9e46be0 100644
--- a/fluss-rust/website/docs/user-guide/python/error-handling.md
+++ b/fluss-rust/website/docs/user-guide/python/error-handling.md
@@ -53,6 +53,7 @@ except fluss.FlussError as e:
 | `ErrorCode.PARTITION_ALREADY_EXISTS`         | 42   | Partition already exists            |
 | `ErrorCode.PARTITION_SPEC_INVALID_EXCEPTION` | 43   | Invalid partition spec              |
 | `ErrorCode.LEADER_NOT_AVAILABLE_EXCEPTION`   | 44   | No leader available for partition   |
+| `ErrorCode.AUTHENTICATE_EXCEPTION`           | 46   | Authentication failed (bad credentials) |
 
 See `fluss.ErrorCode` for the full list of named constants.
 
@@ -95,6 +96,24 @@ except fluss.FlussError as e:
         print("Partition does not exist, create it first")
 ```
 
+### Authentication Failed
+
+SASL credentials are incorrect or the user does not exist.
+
+```python
+try:
+    config = fluss.Config({
+        "bootstrap.servers": "127.0.0.1:9123",
+        "security.protocol": "sasl",
+        "security.sasl.username": "admin",
+        "security.sasl.password": "wrong-password",
+    })
+    conn = await fluss.FlussConnection.create(config)
+except fluss.FlussError as e:
+    if e.error_code == fluss.ErrorCode.AUTHENTICATE_EXCEPTION:
+        print(f"Authentication failed: {e.message}")
+```
+
 ### Schema Mismatch
 
 Row data doesn't match the table schema.
diff --git a/fluss-rust/website/docs/user-guide/python/example/configuration.md b/fluss-rust/website/docs/user-guide/python/example/configuration.md
index 39c53be4ea..90b1249ca4 100644
--- a/fluss-rust/website/docs/user-guide/python/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/python/example/configuration.md
@@ -28,12 +28,34 @@ with await fluss.FlussConnection.create(config) as conn:
 | `writer.acks`                         | Acknowledgment setting (`all` waits for all replicas)                                 | `all`              |
 | `writer.retries`                      | Number of retries on failure                                                          | `2147483647`       |
 | `writer.batch-size`                   | Batch size for writes in bytes                                                        | `2097152` (2 MB)   |
-| `writer.batch-timeout-ms`             | The maximum time to wait for a writer batch to fill up before sending.               | `100`              |
-| `writer.bucket.no-key-assigner`       | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`           |
+| `writer.batch-timeout-ms`             | The maximum time to wait for a writer batch to fill up before sending.                | `100`              |
+| `writer.bucket.no-key-assigner`       | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin`  | `sticky`           |
 | `scanner.remote-log.prefetch-num`     | Number of remote log segments to prefetch                                             | `4`                |
 | `remote-file.download-thread-num`     | Number of threads for remote log downloads                                            | `3`                |
 | `scanner.remote-log.read-concurrency` | Streaming read concurrency within a remote log file                                   | `4`                |
 | `scanner.log.max-poll-records`        | Max records returned in a single poll()                                               | `500`              |
+| `connect-timeout`                     | TCP connect timeout in milliseconds                                                   | `120000`           |
+| `security.protocol`                   | `PLAINTEXT` (default) or `sasl` for SASL auth                                        | `PLAINTEXT`        |
+| `security.sasl.mechanism`             | SASL mechanism (only `PLAIN` is supported)                                            | `PLAIN`            |
+| `security.sasl.username`              | SASL username (required when protocol is `sasl`)                                      | (empty)            |
+| `security.sasl.password`              | SASL password (required when protocol is `sasl`)                                      | (empty)            |
+
+## SASL Authentication
+
+To connect to a Fluss cluster with SASL/PLAIN authentication enabled:
+
+```python
+config = fluss.Config({
+    "bootstrap.servers": "127.0.0.1:9123",
+    "security.protocol": "sasl",
+    "security.sasl.mechanism": "PLAIN",
+    "security.sasl.username": "admin",
+    "security.sasl.password": "admin-secret",
+})
+conn = await fluss.FlussConnection.create(config)
+```
+
+## Connection Lifecycle
 
 Remember to close the connection when done:
 
diff --git a/fluss-rust/website/docs/user-guide/rust/error-handling.md b/fluss-rust/website/docs/user-guide/rust/error-handling.md
index 35ede6c85c..964f81f206 100644
--- a/fluss-rust/website/docs/user-guide/rust/error-handling.md
+++ b/fluss-rust/website/docs/user-guide/rust/error-handling.md
@@ -71,6 +71,9 @@ match result {
     Err(ref e) if e.api_error() == Some(FlussError::LeaderNotAvailableException) => {
         eprintln!("Leader not available: {}", e);
     }
+    Err(ref e) if e.api_error() == Some(FlussError::AuthenticateException) => {
+        eprintln!("Authentication failed: {}", e);
+    }
     _ => {}
 }
 ```
@@ -133,6 +136,22 @@ match result {
 }
 ```
 
+### Authentication Failed
+
+SASL credentials are incorrect or the user does not exist.
+
+```rust
+use fluss::error::{Error, FlussError};
+
+let result = FlussConnection::new(config).await;
+match result {
+    Err(ref e) if e.api_error() == Some(FlussError::AuthenticateException) => {
+        eprintln!("Authentication failed: {}", e);
+    }
+    _ => {}
+}
+```
+
 ### Schema Mismatch
 
 Row data does not match the expected table schema.
diff --git a/fluss-rust/website/docs/user-guide/rust/example/configuration.md b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
index a2f52dc1f0..f6340c976d 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
@@ -17,16 +17,36 @@ let conn = FlussConnection::new(config).await?;
 
 ## Connection Configurations
 
-| Option                          | Description                                                                          | Default          |
-|---------------------------------|--------------------------------------------------------------------------------------|------------------|
-| `bootstrap_servers`             | Coordinator server address                                                           | `127.0.0.1:9123` |
-| `writer_request_max_size`       | Maximum request size in bytes                                                        | 10 MB            |
-| `writer_acks`                   | Acknowledgment setting (`all` waits for all replicas)                                | `all`            |
-| `writer_retries`                | Number of retries on failure                                                         | `i32::MAX`       |
-| `writer_batch_size`             | Batch size for writes                                                                | 2 MB             |
-| `writer_batch_timeout_ms`       | The maximum time to wait for a writer batch to fill up before sending.               | `100`            |
-| `writer_bucket_no_key_assigner` | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`         |
-| `scanner_remote_log_prefetch_num` | Number of remote log segments to prefetch                                           | `4`              |
-| `remote_file_download_thread_num` | Number of concurrent remote log file downloads                                      | `3`              |
-| `scanner_remote_log_read_concurrency` | Streaming read concurrency within a remote log file                           | `4`              |
-| `scanner_log_max_poll_records`  | Maximum records returned in a single `poll()`                                       | `500`            |
+| Option                                | Description                                                                          | Default          |
+|---------------------------------------|--------------------------------------------------------------------------------------|------------------|
+| `bootstrap_servers`                   | Coordinator server address                                                           | `127.0.0.1:9123` |
+| `writer_request_max_size`             | Maximum request size in bytes                                                        | 10 MB            |
+| `writer_acks`                         | Acknowledgment setting (`all` waits for all replicas)                                | `all`            |
+| `writer_retries`                      | Number of retries on failure                                                         | `i32::MAX`       |
+| `writer_batch_size`                   | Batch size for writes                                                                | 2 MB             |
+| `writer_batch_timeout_ms`             | The maximum time to wait for a writer batch to fill up before sending.               | `100`            |
+| `writer_bucket_no_key_assigner`       | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`         |
+| `scanner_remote_log_prefetch_num`     | Number of remote log segments to prefetch                                            | `4`              |
+| `remote_file_download_thread_num`     | Number of concurrent remote log file downloads                                       | `3`              |
+| `scanner_remote_log_read_concurrency` | Streaming read concurrency within a remote log file                                  | `4`              |
+| `scanner_log_max_poll_records`        | Maximum records returned in a single `poll()`                                        | `500`            |
+| `connect_timeout_ms`                  | TCP connect timeout in milliseconds                                                  | `120000`         |
+| `security_protocol`                   | `PLAINTEXT` (default) or `sasl` for SASL auth                                       | `PLAINTEXT`      |
+| `security_sasl_mechanism`             | SASL mechanism (only `PLAIN` is supported)                                           | `PLAIN`          |
+| `security_sasl_username`              | SASL username (required when protocol is `sasl`)                                     | (empty)          |
+| `security_sasl_password`              | SASL password (required when protocol is `sasl`)                                     | (empty)          |
+
+## SASL Authentication
+
+To connect to a Fluss cluster with SASL/PLAIN authentication enabled:
+
+```rust
+let mut config = Config::default();
+config.bootstrap_servers = "127.0.0.1:9123".to_string();
+config.security_protocol = "sasl".to_string();
+config.security_sasl_mechanism = "PLAIN".to_string();
+config.security_sasl_username = "admin".to_string();
+config.security_sasl_password = "admin-secret".to_string();
+
+let conn = FlussConnection::new(config).await?;
+```

From 99d6621359e261b7844952074fda1f7fbaa667fe Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 28 Feb 2026 12:51:09 +0000
Subject: [PATCH 174/287] chore:fix test_get_server_nodes to use shared cluster
 (#392)

---
 fluss-rust/crates/fluss/tests/integration/admin.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index 5bbdaf01dc..c64770468b 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -489,7 +489,7 @@ mod admin_test {
 
     #[tokio::test]
     async fn test_get_server_nodes() {
-        let cluster = get_fluss_cluster();
+        let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().await.unwrap();
 

From e3e9e4e1e0f913b59d99d0a142c73c657f6e4d13 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sun, 1 Mar 2026 04:03:03 +0000
Subject: [PATCH 175/287] [doc] Update API Ref following SASL / NoKeyAssigner
 (#396)

---
 .../docs/user-guide/cpp/api-reference.md      | 28 ++++++++++-------
 .../docs/user-guide/python/api-reference.md   | 30 ++++++++++++-------
 .../docs/user-guide/rust/api-reference.md     | 28 ++++++++++-------
 3 files changed, 55 insertions(+), 31 deletions(-)

diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index 489f13a17b..debd311d40 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -15,16 +15,24 @@ Complete API reference for the Fluss C++ client.
 
 ## `Configuration`
 
-| Field                             | Type          | Default              | Description                                                     |
-|-----------------------------------|---------------|----------------------|-----------------------------------------------------------------|
-| `bootstrap_servers`               | `std::string` | `"127.0.0.1:9123"`   | Coordinator server address                                      |
-| `writer_request_max_size`         | `int32_t`     | `10485760` (10 MB)   | Maximum request size in bytes                                   |
-| `writer_acks`                     | `std::string` | `"all"`              | Acknowledgment setting (`"all"`, `"0"`, `"1"`, or `"-1"`)       |
-| `writer_retries`                  | `int32_t`     | `INT32_MAX`          | Number of retries on failure                                    |
-| `writer_batch_size`               | `int32_t`     | `2097152` (2 MB)     | Batch size for writes in bytes                                  |
-| `scanner_remote_log_prefetch_num` | `size_t`      | `4`                  | Number of remote log segments to prefetch                       |
-| `remote_file_download_thread_num` | `size_t`      | `3`                  | Number of threads for remote log downloads                      |
-| `scanner_log_max_poll_records`    | `size_t`      | `500`                | Maximum number of records returned in a single Poll()           |
+| Field                                 | Type          | Default              | Description                                                                              |
+|---------------------------------------|---------------|----------------------|------------------------------------------------------------------------------------------|
+| `bootstrap_servers`                   | `std::string` | `"127.0.0.1:9123"`   | Coordinator server address                                                               |
+| `writer_request_max_size`             | `int32_t`     | `10485760` (10 MB)   | Maximum request size in bytes                                                            |
+| `writer_acks`                         | `std::string` | `"all"`              | Acknowledgment setting (`"all"`, `"0"`, `"1"`, or `"-1"`)                                |
+| `writer_retries`                      | `int32_t`     | `INT32_MAX`          | Number of retries on failure                                                             |
+| `writer_batch_size`                   | `int32_t`     | `2097152` (2 MB)     | Batch size for writes in bytes                                                           |
+| `writer_batch_timeout_ms`             | `int64_t`     | `100`                | Maximum time in ms to wait for a writer batch to fill up before sending                  |
+| `writer_bucket_no_key_assigner`       | `std::string` | `"sticky"`           | Bucket assignment strategy for tables without bucket keys: `"sticky"` or `"round_robin"` |
+| `scanner_remote_log_prefetch_num`     | `size_t`      | `4`                  | Number of remote log segments to prefetch                                                |
+| `remote_file_download_thread_num`     | `size_t`      | `3`                  | Number of threads for remote log downloads                                               |
+| `scanner_remote_log_read_concurrency` | `size_t`      | `4`                  | Streaming read concurrency within a remote log file                                      |
+| `scanner_log_max_poll_records`        | `size_t`      | `500`                | Maximum number of records returned in a single Poll()                                    |
+| `connect_timeout_ms`                  | `uint64_t`    | `120000`             | TCP connect timeout in milliseconds                                                      |
+| `security_protocol`                   | `std::string` | `"PLAINTEXT"`        | `"PLAINTEXT"` (default) or `"sasl"` for SASL auth                                        |
+| `security_sasl_mechanism`             | `std::string` | `"PLAIN"`            | SASL mechanism (only `"PLAIN"` is supported)                                             |
+| `security_sasl_username`              | `std::string` | (empty)              | SASL username (required when protocol is `"sasl"`)                                       |
+| `security_sasl_password`              | `std::string` | (empty)              | SASL password (required when protocol is `"sasl"`)                                       |
 
 ## `Connection`
 
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index 1c97066c0f..8f7ab61bbd 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -7,17 +7,25 @@ Complete API reference for the Fluss Python client.
 
 ## `Config`
 
-| Method / Property                  | Description                                               |
-|------------------------------------|-----------------------------------------------------------|
-| `Config(properties: dict = None)`  | Create config from a dict of key-value pairs              |
-| `bootstrap_servers`                | Get/set coordinator server address                        |
-| `writer_request_max_size`          | Get/set max request size in bytes                         |
-| `writer_acks`                      | Get/set acknowledgment setting (`"all"` for all replicas) |
-| `writer_retries`                   | Get/set number of retries on failure                      |
-| `writer_batch_size`                | Get/set write batch size in bytes                         |
-| `scanner_remote_log_prefetch_num`  | Get/set number of remote log segments to prefetch         |
-| `remote_file_download_thread_num`  | Get/set number of threads for remote log downloads        |
-| `scanner_log_max_poll_records`     | Get/set max number of records returned in a single poll() |
+| Method / Property                     | Description                                                                             |
+|---------------------------------------|-----------------------------------------------------------------------------------------|
+| `Config(properties: dict = None)`     | Create config from a dict of key-value pairs                                            |
+| `bootstrap_servers`                   | Get/set coordinator server address                                                      |
+| `writer_request_max_size`             | Get/set max request size in bytes                                                       |
+| `writer_acks`                         | Get/set acknowledgment setting (`"all"` for all replicas)                               |
+| `writer_retries`                      | Get/set number of retries on failure                                                    |
+| `writer_batch_size`                   | Get/set write batch size in bytes                                                       |
+| `writer_batch_timeout_ms`             | Get/set max time in ms to wait for a writer batch to fill up before sending             |
+| `writer.bucket.no-key-assigner`       | Bucket assignment strategy (`"sticky"` or `"round_robin"`); set via `Config(dict)` only |
+| `scanner_remote_log_prefetch_num`     | Get/set number of remote log segments to prefetch                                       |
+| `remote_file_download_thread_num`     | Get/set number of threads for remote log downloads                                      |
+| `scanner_remote_log_read_concurrency` | Get/set streaming read concurrency within a remote log file                             |
+| `scanner_log_max_poll_records`        | Get/set max number of records returned in a single poll()                               |
+| `connect_timeout_ms`                  | Get/set TCP connect timeout in milliseconds                                             |
+| `security_protocol`                   | Get/set security protocol (`"PLAINTEXT"` or `"sasl"`)                                   |
+| `security_sasl_mechanism`             | Get/set SASL mechanism (only `"PLAIN"` is supported)                                    |
+| `security_sasl_username`              | Get/set SASL username (required when protocol is `"sasl"`)                              |
+| `security_sasl_password`              | Get/set SASL password (required when protocol is `"sasl"`)                              |
 
 ## `FlussConnection`
 
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 2d149aac5a..3d72f555c6 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -7,16 +7,24 @@ Complete API reference for the Fluss Rust client.
 
 ## `Config`
 
-| Field                             | Type     | Default            | Description                                             |
-|-----------------------------------|----------|--------------------|---------------------------------------------------------|
-| `bootstrap_servers`               | `String` | `"127.0.0.1:9123"` | Coordinator server address                              |
-| `writer_request_max_size`         | `i32`    | `10485760` (10 MB) | Maximum request size in bytes                           |
-| `writer_acks`                     | `String` | `"all"`            | Acknowledgment setting (`"all"` waits for all replicas) |
-| `writer_retries`                  | `i32`    | `i32::MAX`         | Number of retries on failure                            |
-| `writer_batch_size`               | `i32`    | `2097152` (2 MB)   | Batch size for writes in bytes                          |
-| `scanner_remote_log_prefetch_num` | `usize`  | `4`                | Number of remote log segments to prefetch               |
-| `remote_file_download_thread_num` | `usize`  | `3`                | Number of threads for remote log downloads              |
-| `scanner_log_max_poll_records`    | `usize`  | `500`              | Maximum number of records returned in a single poll()   |
+| Field                                 | Type            | Default            | Description                                                                          |
+|---------------------------------------|-----------------|--------------------|--------------------------------------------------------------------------------------|
+| `bootstrap_servers`                   | `String`        | `"127.0.0.1:9123"` | Coordinator server address                                                           |
+| `writer_request_max_size`             | `i32`           | `10485760` (10 MB) | Maximum request size in bytes                                                        |
+| `writer_acks`                         | `String`        | `"all"`            | Acknowledgment setting (`"all"` waits for all replicas)                              |
+| `writer_retries`                      | `i32`           | `i32::MAX`         | Number of retries on failure                                                         |
+| `writer_batch_size`                   | `i32`           | `2097152` (2 MB)   | Batch size for writes in bytes                                                       |
+| `writer_batch_timeout_ms`             | `i64`           | `100`              | Maximum time in ms to wait for a writer batch to fill up before sending              |
+| `writer_bucket_no_key_assigner`       | `NoKeyAssigner` | `sticky`           | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` |
+| `scanner_remote_log_prefetch_num`     | `usize`         | `4`                | Number of remote log segments to prefetch                                            |
+| `remote_file_download_thread_num`     | `usize`         | `3`                | Number of threads for remote log downloads                                           |
+| `scanner_remote_log_read_concurrency` | `usize`         | `4`                | Streaming read concurrency within a remote log file                                  |
+| `scanner_log_max_poll_records`        | `usize`         | `500`              | Maximum number of records returned in a single poll()                                |
+| `connect_timeout_ms`                  | `u64`           | `120000`           | TCP connect timeout in milliseconds                                                  |
+| `security_protocol`                   | `String`        | `"PLAINTEXT"`      | `PLAINTEXT` (default) or `sasl` for SASL auth                                        |
+| `security_sasl_mechanism`             | `String`        | `"PLAIN"`          | SASL mechanism (only `PLAIN` is supported)                                           |
+| `security_sasl_username`              | `String`        | (empty)            | SASL username (required when protocol is `sasl`)                                     |
+| `security_sasl_password`              | `String`        | (empty)            | SASL password (required when protocol is `sasl`)                                     |
 
 ## `FlussConnection`
 

From 7bb905d1fb1735bbe099e4c4467159396ed44112 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sun, 1 Mar 2026 04:03:40 +0000
Subject: [PATCH 176/287] [doc] Update doc after rust / c++ panic fixes (#395)

---
 .../docs/user-guide/rust/api-reference.md     | 37 ++++++++++---------
 .../docs/user-guide/rust/data-types.md        | 14 +++----
 .../docs/user-guide/rust/example/index.md     |  2 +-
 .../user-guide/rust/example/log-tables.md     | 10 ++---
 .../rust/example/partitioned-tables.md        |  2 +-
 .../rust/example/primary-key-tables.md        |  6 +--
 6 files changed, 36 insertions(+), 35 deletions(-)

diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 3d72f555c6..d539a860ca 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -383,24 +383,25 @@ Implements the `InternalRow` trait (see below).
 
 ## `InternalRow` trait
 
-| Method                                                                         |  Description                            |
-|--------------------------------------------------------------------------------|-----------------------------------------|
-| `fn get_boolean(&self, idx: usize) -> bool`                                    | Get boolean value                       |
-| `fn get_byte(&self, idx: usize) -> i8`                                         | Get tinyint value                       |
-| `fn get_short(&self, idx: usize) -> i16`                                       | Get smallint value                      |
-| `fn get_int(&self, idx: usize) -> i32`                                         | Get int value                           |
-| `fn get_long(&self, idx: usize) -> i64`                                        | Get bigint value                        |
-| `fn get_float(&self, idx: usize) -> f32`                                       | Get float value                         |
-| `fn get_double(&self, idx: usize) -> f64`                                      | Get double value                        |
-| `fn get_string(&self, idx: usize) -> &str`                                     | Get string value                        |
-| `fn get_decimal(&self, idx: usize, precision: usize, scale: usize) -> Decimal` | Get decimal value                       |
-| `fn get_date(&self, idx: usize) -> Date`                                       | Get date value                          |
-| `fn get_time(&self, idx: usize) -> Time`                                       | Get time value                          |
-| `fn get_timestamp_ntz(&self, idx: usize, precision: u32) -> TimestampNtz`      | Get timestamp value                     |
-| `fn get_timestamp_ltz(&self, idx: usize, precision: u32) -> TimestampLtz`      | Get timestamp with local timezone value |
-| `fn get_bytes(&self, idx: usize) -> &[u8]`                                     | Get bytes value                         |
-| `fn get_binary(&self, idx: usize, length: usize) -> &[u8]`                     | Get fixed-length binary value           |
-| `fn get_char(&self, idx: usize, length: usize) -> &str`                        | Get fixed-length char value             |
+| Method                                                                                 | Description                             |
+|----------------------------------------------------------------------------------------|-----------------------------------------|
+| `fn is_null_at(&self, idx: usize) -> Result<bool>`                                     | Check if a field is null                |
+| `fn get_boolean(&self, idx: usize) -> Result<bool>`                                    | Get boolean value                       |
+| `fn get_byte(&self, idx: usize) -> Result<i8>`                                         | Get tinyint value                       |
+| `fn get_short(&self, idx: usize) -> Result<i16>`                                       | Get smallint value                      |
+| `fn get_int(&self, idx: usize) -> Result<i32>`                                         | Get int value                           |
+| `fn get_long(&self, idx: usize) -> Result<i64>`                                        | Get bigint value                        |
+| `fn get_float(&self, idx: usize) -> Result<f32>`                                       | Get float value                         |
+| `fn get_double(&self, idx: usize) -> Result<f64>`                                      | Get double value                        |
+| `fn get_string(&self, idx: usize) -> Result<&str>`                                     | Get string value                        |
+| `fn get_decimal(&self, idx: usize, precision: usize, scale: usize) -> Result<Decimal>` | Get decimal value                       |
+| `fn get_date(&self, idx: usize) -> Result<Date>`                                       | Get date value                          |
+| `fn get_time(&self, idx: usize) -> Result<Time>`                                       | Get time value                          |
+| `fn get_timestamp_ntz(&self, idx: usize, precision: u32) -> Result<TimestampNtz>`      | Get timestamp without timezone value    |
+| `fn get_timestamp_ltz(&self, idx: usize, precision: u32) -> Result<TimestampLtz>`      | Get timestamp with local timezone value |
+| `fn get_bytes(&self, idx: usize) -> Result<&[u8]>`                                     | Get bytes value                         |
+| `fn get_binary(&self, idx: usize, length: usize) -> Result<&[u8]>`                     | Get fixed-length binary value           |
+| `fn get_char(&self, idx: usize, length: usize) -> Result<&str>`                        | Get fixed-length char value             |
 
 ## `ChangeType`
 
diff --git a/fluss-rust/website/docs/user-guide/rust/data-types.md b/fluss-rust/website/docs/user-guide/rust/data-types.md
index fe050bfc3c..143fe3457e 100644
--- a/fluss-rust/website/docs/user-guide/rust/data-types.md
+++ b/fluss-rust/website/docs/user-guide/rust/data-types.md
@@ -67,14 +67,14 @@ use fluss::row::InternalRow;
 for record in scan_records {
     let row = record.row();
 
-    if row.is_null_at(0) {
+    if row.is_null_at(0)? {
         // field is null
     }
-    let id: i32 = row.get_int(0);
-    let name: &str = row.get_string(1);
-    let score: f32 = row.get_float(2);
-    let date: Date = row.get_date(3);
-    let ts: TimestampNtz = row.get_timestamp_ntz(4, 6);
-    let decimal: Decimal = row.get_decimal(5, 10, 2);
+    let id: i32 = row.get_int(0)?;
+    let name: &str = row.get_string(1)?;
+    let score: f32 = row.get_float(2)?;
+    let date: Date = row.get_date(3)?;
+    let ts: TimestampNtz = row.get_timestamp_ntz(4, 6)?;
+    let decimal: Decimal = row.get_decimal(5, 10, 2)?;
 }
 ```
diff --git a/fluss-rust/website/docs/user-guide/rust/example/index.md b/fluss-rust/website/docs/user-guide/rust/example/index.md
index dcee87b0f6..e35c8dc3f3 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/index.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/index.md
@@ -48,7 +48,7 @@ async fn main() -> Result<()> {
     let records = scanner.poll(Duration::from_secs(5)).await?;
     for record in records {
         let row = record.row();
-        println!("id={}, name={}", row.get_int(0), row.get_string(1));
+        println!("id={}, name={}", row.get_int(0)?, row.get_string(1)?);
     }
 
     Ok(())
diff --git a/fluss-rust/website/docs/user-guide/rust/example/log-tables.md b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
index f5a4d0e25e..7c01cf1ccd 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
@@ -70,8 +70,8 @@ for (bucket, bucket_records) in records.records_by_buckets() {
         let row = record.row();
         println!(
             "  event_id={}, event_type={} @ offset={}",
-            row.get_int(0),
-            row.get_string(1),
+            row.get_int(0)?,
+            row.get_string(1)?,
             record.offset()
         );
     }
@@ -82,9 +82,9 @@ for record in records {
     let row = record.row();
     println!(
         "event_id={}, event_type={}, timestamp={} @ offset={}",
-        row.get_int(0),
-        row.get_string(1),
-        row.get_long(2),
+        row.get_int(0)?,
+        row.get_string(1)?,
+        row.get_long(2)?,
         record.offset()
     );
 }
diff --git a/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md b/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
index 3edf4d88ce..40bd4d60c2 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
@@ -208,7 +208,7 @@ key.set_field(2, 1i64);    // zone (partition column)
 
 let result = lookuper.lookup(&key).await?;
 if let Some(row) = result.get_single_row()? {
-    println!("Found: score={}", row.get_long(3));
+    println!("Found: score={}", row.get_long(3)?);
 }
 ```
 
diff --git a/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
index 5b299cca3a..9e819796ce 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
@@ -104,9 +104,9 @@ let result = lookuper.lookup(&key).await?;
 if let Some(row) = result.get_single_row()? {
     println!(
         "Found: id={}, name={}, age={}",
-        row.get_int(0),
-        row.get_string(1),
-        row.get_long(2)
+        row.get_int(0)?,
+        row.get_string(1)?,
+        row.get_long(2)?
     );
 } else {
     println!("Record not found");

From c100ee375c79427935009293baa6a82e2eb4337a Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sun, 1 Mar 2026 11:29:21 +0100
Subject: [PATCH 177/287] chore: Add missing python type stubs (#400)

---
 fluss-rust/bindings/python/fluss/__init__.pyi | 29 ++++++++++++++++---
 1 file changed, 25 insertions(+), 4 deletions(-)

diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 4c2142d7b0..c387d7340e 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -169,6 +169,30 @@ class Config:
     def scanner_log_max_poll_records(self) -> int: ...
     @scanner_log_max_poll_records.setter
     def scanner_log_max_poll_records(self, num: int) -> None: ...
+    @property
+    def writer_batch_timeout_ms(self) -> int: ...
+    @writer_batch_timeout_ms.setter
+    def writer_batch_timeout_ms(self, timeout: int) -> None: ...
+    @property
+    def connect_timeout_ms(self) -> int: ...
+    @connect_timeout_ms.setter
+    def connect_timeout_ms(self, timeout: int) -> None: ...
+    @property
+    def security_protocol(self) -> str: ...
+    @security_protocol.setter
+    def security_protocol(self, protocol: str) -> None: ...
+    @property
+    def security_sasl_mechanism(self) -> str: ...
+    @security_sasl_mechanism.setter
+    def security_sasl_mechanism(self, mechanism: str) -> None: ...
+    @property
+    def security_sasl_username(self) -> str: ...
+    @security_sasl_username.setter
+    def security_sasl_username(self, username: str) -> None: ...
+    @property
+    def security_sasl_password(self) -> str: ...
+    @security_sasl_password.setter
+    def security_sasl_password(self, password: str) -> None: ...
 
 class FlussConnection:
     @staticmethod
@@ -837,10 +861,6 @@ class TableBucket:
     def __str__(self) -> str: ...
     def __repr__(self) -> str: ...
 
-class TableDistribution:
-    def bucket_keys(self) -> List[str]: ...
-    def bucket_count(self) -> Optional[int]: ...
-
 class PartitionInfo:
     """Information about a partition."""
 
@@ -864,6 +884,7 @@ class ErrorCode:
     """
 
     CLIENT_ERROR: int
+    NONE: int
     UNKNOWN_SERVER_ERROR: int
     NETWORK_EXCEPTION: int
     UNSUPPORTED_VERSION: int

From 20072070ac80348942a3cdf903455295050c4567 Mon Sep 17 00:00:00 2001
From: AlexZhao <zhaohaidao2008@hotmail.com>
Date: Mon, 2 Mar 2026 10:38:07 +0800
Subject: [PATCH 178/287] docs: add cpp build guides with examples (#376)

---
 fluss-rust/MODULE.bazel                       |  65 ++++
 fluss-rust/bindings/cpp/.gitignore            |  10 +
 fluss-rust/bindings/cpp/BUILD.bazel           |  46 ++-
 fluss-rust/bindings/cpp/CMakeLists.txt        | 141 ++++++-
 fluss-rust/bindings/cpp/bazel/cpp/BUILD.bazel |  26 ++
 fluss-rust/bindings/cpp/bazel/cpp/deps.bzl    | 349 ++++++++++++++++++
 .../bazel-consumer/build/BUILD.bazel}         |  12 +-
 .../bazel-consumer/build/MODULE.bazel         |  39 ++
 .../cpp/examples/bazel-consumer/build/main.cc |  28 ++
 .../bazel-consumer/system/BUILD.bazel         |  25 ++
 .../bazel-consumer/system/MODULE.bazel        |  44 +++
 .../examples/bazel-consumer/system/main.cc    |  27 ++
 .../bindings/cpp/scripts/ensure_protoc.sh     | 277 ++++++++++++++
 fluss-rust/docs/cpp-bazel-usage.md            | 291 +++++++++++++++
 fluss-rust/docs/cpp-cmake-usage.md            | 129 +++++++
 15 files changed, 1486 insertions(+), 23 deletions(-)
 create mode 100644 fluss-rust/MODULE.bazel
 create mode 100644 fluss-rust/bindings/cpp/bazel/cpp/BUILD.bazel
 create mode 100644 fluss-rust/bindings/cpp/bazel/cpp/deps.bzl
 rename fluss-rust/bindings/cpp/{MODULE.bazel => examples/bazel-consumer/build/BUILD.bazel} (80%)
 create mode 100644 fluss-rust/bindings/cpp/examples/bazel-consumer/build/MODULE.bazel
 create mode 100644 fluss-rust/bindings/cpp/examples/bazel-consumer/build/main.cc
 create mode 100644 fluss-rust/bindings/cpp/examples/bazel-consumer/system/BUILD.bazel
 create mode 100644 fluss-rust/bindings/cpp/examples/bazel-consumer/system/MODULE.bazel
 create mode 100644 fluss-rust/bindings/cpp/examples/bazel-consumer/system/main.cc
 create mode 100755 fluss-rust/bindings/cpp/scripts/ensure_protoc.sh
 create mode 100644 fluss-rust/docs/cpp-bazel-usage.md
 create mode 100644 fluss-rust/docs/cpp-cmake-usage.md

diff --git a/fluss-rust/MODULE.bazel b/fluss-rust/MODULE.bazel
new file mode 100644
index 0000000000..f0e6025073
--- /dev/null
+++ b/fluss-rust/MODULE.bazel
@@ -0,0 +1,65 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+# Required at repository root for root module mode (`bazel_dep(name = "fluss-cpp", ...)`).
+# Consumer examples use `local_path_override(..., path = "/path/to/fluss-rust")`, so
+# Bazel resolves the module from the repository root. This also matches the Rust
+# workspace layout used by `bindings/cpp` during cargo-based Bazel/CMake builds.
+# `0.0.0` is a local-development placeholder in this repository branch.
+# Consumers should depend on a published release version.
+module(
+    name = "fluss-cpp",
+    version = "0.0.0",
+)
+
+bazel_dep(name = "rules_cc", version = "0.0.17")
+bazel_dep(name = "platforms", version = "0.0.10")
+bazel_dep(name = "rules_foreign_cc", version = "0.15.1")
+bazel_dep(name = "rules_python", version = "1.2.0")
+
+python = use_extension("@rules_python//python/extensions:python.bzl", "python")
+python.toolchain(python_version = "3.12")
+use_repo(python, "python_3_12")
+
+foreign_cc_tools = use_extension("@rules_foreign_cc//foreign_cc:extensions.bzl", "tools")
+use_repo(
+    foreign_cc_tools,
+    "cmake_3.31.8_toolchains",
+    "cmake_src",
+    "ninja_1.13.0_toolchains",
+    "ninja_build_src",
+    "rules_foreign_cc_framework_toolchains",
+)
+
+register_toolchains(
+    "@rules_foreign_cc_framework_toolchains//:all",
+    "@cmake_3.31.8_toolchains//:all",
+    "@ninja_1.13.0_toolchains//:all",
+    "@python_3_12//:all",
+    "@rules_foreign_cc//toolchains:all",
+)
+
+cpp_sdk = use_extension("//bindings/cpp/bazel/cpp:deps.bzl", "cpp_sdk")
+cpp_sdk.config(
+    mode = "build",
+    arrow_cpp_version = "19.0.1",
+    protobuf_version = "3.25.5",
+    ep_cmake_ranlib = "/usr/bin/ranlib",
+    ep_cmake_ar = "/usr/bin/ar",
+    ep_cmake_nm = "/usr/bin/nm",
+)
+use_repo(cpp_sdk, "apache_arrow_cpp")
diff --git a/fluss-rust/bindings/cpp/.gitignore b/fluss-rust/bindings/cpp/.gitignore
index da15a58b53..1f1632b95c 100644
--- a/fluss-rust/bindings/cpp/.gitignore
+++ b/fluss-rust/bindings/cpp/.gitignore
@@ -15,3 +15,13 @@ bazel-testlogs
 bazel-cpp
 bazel-*
 MODULE.bazel.lock
+
+# Keep versioned Bazel consumer examples (name starts with bazel-).
+!examples/bazel-consumer/
+!examples/bazel-consumer/**
+# `build/` is ignored globally above; keep this fixture path visible.
+!examples/bazel-consumer/build/
+!examples/bazel-consumer/build/**
+examples/bazel-consumer/**/MODULE.bazel.lock
+examples/bazel-consumer/**/bazel-*
+examples/bazel-consumer/**/tmp.log
diff --git a/fluss-rust/bindings/cpp/BUILD.bazel b/fluss-rust/bindings/cpp/BUILD.bazel
index 0ae2ce329b..d247baf18c 100644
--- a/fluss-rust/bindings/cpp/BUILD.bazel
+++ b/fluss-rust/bindings/cpp/BUILD.bazel
@@ -17,7 +17,7 @@
 
 licenses(["notice"])
 
-load("@rules_cc//cc:defs.bzl", "cc_library", "cc_binary")
+load("@rules_cc//cc:defs.bzl", "cc_binary", "cc_import", "cc_library")
 
 config_setting(
     name = "debug_mode",
@@ -34,6 +34,37 @@ config_setting(
     values = {"compilation_mode": "opt"},
 )
 
+_PROTOC_SETUP_SNIPPET = """
+        set -e
+        if [ -n "$${CARGO:-}" ]; then
+            if [ ! -x "$$CARGO" ]; then
+                echo "Error: CARGO is set but not executable: $$CARGO" >&2
+                exit 1
+            fi
+            CARGO_BIN="$$CARGO"
+        else
+            CARGO_BIN=$$(command -v cargo || true)
+            if [ -z "$$CARGO_BIN" ]; then
+                echo "Error: cargo not found in PATH and CARGO is not set" >&2
+                exit 1
+            fi
+        fi
+        if [ -n "$${PROTOC:-}" ]; then
+            if [ ! -x "$$PROTOC" ]; then
+                echo "Error: PROTOC is set but not executable: $$PROTOC" >&2
+                exit 1
+            fi
+            export PROTOC
+        else
+            PROTOC_BIN=$$(command -v protoc || true)
+            if [ -z "$$PROTOC_BIN" ]; then
+                echo "Error: protoc not found in PATH and PROTOC is not set" >&2
+                exit 1
+            fi
+            export PROTOC="$$PROTOC_BIN"
+        fi
+"""  # Shell prelude prepended to the cargo genrule cmds: sets CARGO_BIN (from $CARGO or PATH) and exports PROTOC, exiting 1 if either tool is missing.
+
 genrule(
     name = "cargo_build_debug",
     srcs = glob([
@@ -47,8 +78,7 @@ genrule(
         "src/lib.rs_debug.h",
         "cxxbridge/rust/cxx_debug.h",
     ],
-    cmd = """
-        set -e
+    cmd = _PROTOC_SETUP_SNIPPET + """
         EXECROOT=$$(pwd)
         OUTPUT_LIB=$(location rust_lib_debug.a)
         OUTPUT_CC=$(location rust_bridge_cc_debug.cc)
@@ -66,7 +96,7 @@ genrule(
             exit 1
         fi
         cd $$WORKSPACE_ROOT
-        cargo build --manifest-path $$CARGO_DIR/Cargo.toml
+        "$$CARGO_BIN" build --manifest-path $$CARGO_DIR/Cargo.toml
         CARGO_TARGET_DIR=$$WORKSPACE_ROOT/target
         # cxxbridge uses the Cargo package name (with hyphen): fluss-cpp
         RUST_BRIDGE_DIR=$$CARGO_TARGET_DIR/cxxbridge/fluss-cpp/src
@@ -114,8 +144,7 @@ genrule(
         "src/lib.rs_release.h",
         "cxxbridge/rust/cxx_release.h",
     ],
-    cmd = """
-        set -e
+    cmd = _PROTOC_SETUP_SNIPPET + """
         EXECROOT=$$(pwd)
         OUTPUT_LIB=$(location rust_lib_release.a)
         OUTPUT_CC=$(location rust_bridge_cc_release.cc)
@@ -133,7 +162,7 @@ genrule(
             exit 1
         fi
         cd $$WORKSPACE_ROOT
-        cargo build --release --manifest-path $$CARGO_DIR/Cargo.toml
+        "$$CARGO_BIN" build --release --manifest-path $$CARGO_DIR/Cargo.toml
         CARGO_TARGET_DIR=$$WORKSPACE_ROOT/target
         # cxxbridge uses the Cargo package name (with hyphen): fluss-cpp
         RUST_BRIDGE_DIR=$$CARGO_TARGET_DIR/cxxbridge/fluss-cpp/src
@@ -252,7 +281,6 @@ cc_library(
         "src/admin.cpp",
         "src/connection.cpp",
         "src/table.cpp",
-        ":rust_bridge_cc_unified",
     ],
     hdrs = [
         "include/fluss.hpp",
@@ -303,6 +331,7 @@ cc_library(
     }),
     deps = [
         ":rust_lib",
+        "//bindings/cpp/bazel/cpp:arrow_cpp_dep",
     ],
     visibility = ["//visibility:public"],
 )
@@ -405,4 +434,3 @@ cc_binary(
     }),
     visibility = ["//visibility:public"],
 )
-
diff --git a/fluss-rust/bindings/cpp/CMakeLists.txt b/fluss-rust/bindings/cpp/CMakeLists.txt
index 6bd9fc79aa..0cedf68249 100644
--- a/fluss-rust/bindings/cpp/CMakeLists.txt
+++ b/fluss-rust/bindings/cpp/CMakeLists.txt
@@ -27,9 +27,21 @@ include(FetchContent)
 set(FLUSS_GOOGLETEST_VERSION 1.15.2 CACHE STRING "version of GoogleTest")
 set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
 
-find_package(Threads REQUIRED)
+set(FLUSS_CPP_DEP_MODE "system" CACHE STRING "Dependency provisioning mode for fluss-cpp (system|build)")
+set_property(CACHE FLUSS_CPP_DEP_MODE PROPERTY STRINGS system build)
+set(FLUSS_CPP_ARROW_VERSION "19.0.1" CACHE STRING "Arrow C++ version baseline for fluss-cpp")
+set(FLUSS_CPP_PROTOBUF_VERSION "3.25.5" CACHE STRING "Protobuf/protoc version baseline for fluss-cpp")
+set(FLUSS_CPP_ARROW_SYSTEM_ROOT "" CACHE PATH "Optional Arrow installation prefix for system mode")
+set(FLUSS_CPP_ARROW_SOURCE_URL
+    "https://github.com/apache/arrow/archive/refs/tags/apache-arrow-19.0.1.tar.gz"
+    CACHE STRING
+    "Arrow source archive URL used in build mode")
+set(FLUSS_CPP_ARROW_SOURCE_SHA256
+    "4c898504958841cc86b6f8710ecb2919f96b5e10fa8989ac10ac4fca8362d86a"
+    CACHE STRING
+    "SHA256 for the Arrow source archive used in build mode")
 
-find_package(Arrow REQUIRED)
+find_package(Threads REQUIRED)
 
 if (NOT CMAKE_BUILD_TYPE)
     set(CMAKE_BUILD_TYPE Release)
@@ -47,11 +59,117 @@ if (FLUSS_DEV)
     set(FLUSS_ENABLE_TESTING ON)
 endif()
 
+if (NOT FLUSS_CPP_DEP_MODE STREQUAL "system" AND NOT FLUSS_CPP_DEP_MODE STREQUAL "build")
+    message(FATAL_ERROR "Unsupported FLUSS_CPP_DEP_MODE='${FLUSS_CPP_DEP_MODE}'. Expected 'system' or 'build'.")
+endif()
+
+find_program(FLUSS_PROTOC_EXECUTABLE NAMES protoc)
+if (NOT FLUSS_PROTOC_EXECUTABLE)
+    message(FATAL_ERROR "protoc not found. Install protoc or set it in PATH. (Fluss baseline: ${FLUSS_CPP_PROTOBUF_VERSION})")
+endif()
+
+if (DEFINED ENV{CARGO} AND NOT "$ENV{CARGO}" STREQUAL "" AND EXISTS "$ENV{CARGO}")  # An explicit $CARGO that exists on disk wins.
+    set(FLUSS_CARGO_EXECUTABLE "$ENV{CARGO}")
+else()
+    if (DEFINED ENV{CARGO} AND NOT "$ENV{CARGO}" STREQUAL "")  # $CARGO is set but the path is missing: reuse its directory as a search hint.
+        get_filename_component(_FLUSS_CARGO_HINT_DIR "$ENV{CARGO}" DIRECTORY)
+    endif()
+    find_program(FLUSS_CARGO_EXECUTABLE NAMES cargo HINTS "${_FLUSS_CARGO_HINT_DIR}")  # Falls back to the normal find_program search when no hint is set.
+endif()
+if (NOT FLUSS_CARGO_EXECUTABLE)  # Abort at configure time instead of failing later inside the cargo_build target.
+    message(FATAL_ERROR "cargo not found. Install Rust toolchain or set CARGO/PATH.")
+endif()
+
+execute_process(
+    COMMAND ${FLUSS_PROTOC_EXECUTABLE} --version
+    OUTPUT_VARIABLE FLUSS_PROTOC_VERSION_OUTPUT
+    OUTPUT_STRIP_TRAILING_WHITESPACE
+    ERROR_QUIET
+)
+# protoc >= 22 prints two components ("libprotoc 25.5"), older releases three ("libprotoc 3.21.12"); accept both.
+string(REGEX MATCH "[0-9]+\\.[0-9]+(\\.[0-9]+)?" FLUSS_PROTOC_VERSION "${FLUSS_PROTOC_VERSION_OUTPUT}")
+# Drop the legacy "3." major prefix on both sides so that 3.25.5 and 25.5 compare as the same release.
+string(REGEX REPLACE "^3\\." "" FLUSS_PROTOC_VERSION_NORM "${FLUSS_PROTOC_VERSION}")
+string(REGEX REPLACE "^3\\." "" FLUSS_CPP_PROTOBUF_VERSION_NORM "${FLUSS_CPP_PROTOBUF_VERSION}")
+if (FLUSS_PROTOC_VERSION AND
+    NOT FLUSS_PROTOC_VERSION VERSION_EQUAL FLUSS_CPP_PROTOBUF_VERSION AND
+    NOT FLUSS_PROTOC_VERSION_NORM VERSION_EQUAL FLUSS_CPP_PROTOBUF_VERSION_NORM)
+    message(WARNING
+        "protoc version (${FLUSS_PROTOC_VERSION}) does not match Fluss baseline "
+        "(${FLUSS_CPP_PROTOBUF_VERSION}). Build may still work, but this is outside the tested baseline.")
+endif()
+
+message(STATUS "Fluss C++ dependency mode: ${FLUSS_CPP_DEP_MODE}")
+message(STATUS "Fluss C++ protoc executable: ${FLUSS_PROTOC_EXECUTABLE} (${FLUSS_PROTOC_VERSION_OUTPUT})")
+message(STATUS "Fluss C++ cargo executable: ${FLUSS_CARGO_EXECUTABLE}")
+
+if (FLUSS_CPP_DEP_MODE STREQUAL "system")
+    if (FLUSS_CPP_ARROW_SYSTEM_ROOT)
+        list(APPEND CMAKE_PREFIX_PATH "${FLUSS_CPP_ARROW_SYSTEM_ROOT}")
+        set(Arrow_ROOT "${FLUSS_CPP_ARROW_SYSTEM_ROOT}")
+    endif()
+
+    find_package(Arrow REQUIRED)
+
+    if (DEFINED Arrow_VERSION AND Arrow_VERSION AND NOT Arrow_VERSION VERSION_EQUAL FLUSS_CPP_ARROW_VERSION)
+        message(WARNING
+            "Arrow version (${Arrow_VERSION}) does not match Fluss baseline "
+            "(${FLUSS_CPP_ARROW_VERSION}). Build may still work, but this is outside the tested baseline.")
+    endif()
+else()
+    # Build mode: provision Arrow C++ from source in-tree.
+    set(ARROW_BUILD_SHARED ON CACHE BOOL "" FORCE)
+    set(ARROW_BUILD_STATIC OFF CACHE BOOL "" FORCE)
+    set(ARROW_BUILD_TESTS OFF CACHE BOOL "" FORCE)
+    set(ARROW_BUILD_EXAMPLES OFF CACHE BOOL "" FORCE)
+    set(ARROW_BUILD_BENCHMARKS OFF CACHE BOOL "" FORCE)
+    set(ARROW_BUILD_INTEGRATION OFF CACHE BOOL "" FORCE)
+    set(ARROW_BUILD_UTILITIES OFF CACHE BOOL "" FORCE)
+    set(ARROW_COMPUTE OFF CACHE BOOL "" FORCE)
+    set(ARROW_CSV OFF CACHE BOOL "" FORCE)
+    set(ARROW_DATASET OFF CACHE BOOL "" FORCE)
+    set(ARROW_FILESYSTEM OFF CACHE BOOL "" FORCE)
+    set(ARROW_JSON OFF CACHE BOOL "" FORCE)
+    set(ARROW_PARQUET OFF CACHE BOOL "" FORCE)
+    set(ARROW_IPC ON CACHE BOOL "" FORCE)
+    # Reduce third-party sub-build complexity in build mode.
+    set(ARROW_JEMALLOC OFF CACHE BOOL "" FORCE)
+    set(ARROW_MIMALLOC OFF CACHE BOOL "" FORCE)
+    set(ARROW_DEPENDENCY_SOURCE BUNDLED CACHE STRING "" FORCE)
+    set(ARROW_SIMD_LEVEL NONE CACHE STRING "" FORCE)
+    set(ARROW_RUNTIME_SIMD_LEVEL NONE CACHE STRING "" FORCE)
+
+    FetchContent_Declare(
+        apache_arrow_src
+        URL ${FLUSS_CPP_ARROW_SOURCE_URL}
+        URL_HASH SHA256=${FLUSS_CPP_ARROW_SOURCE_SHA256}
+        SOURCE_SUBDIR cpp
+    )
+    FetchContent_MakeAvailable(apache_arrow_src)
+    set(FLUSS_CPP_ARROW_EXTRA_INCLUDE_DIRS
+        "${apache_arrow_src_SOURCE_DIR}/cpp/src"
+        "${apache_arrow_src_BINARY_DIR}/src")
+
+    if (TARGET arrow_shared AND NOT TARGET Arrow::arrow_shared)
+        add_library(Arrow::arrow_shared ALIAS arrow_shared)
+    endif()
+    if (NOT TARGET Arrow::arrow_shared)
+        message(FATAL_ERROR "Arrow build mode did not produce target Arrow::arrow_shared (or arrow_shared).")
+    endif()
+endif()
+
 # Get cargo target dir
-execute_process(COMMAND cargo locate-project --workspace --message-format plain
-    OUTPUT_VARIABLE CARGO_TARGET_DIR
+execute_process(COMMAND ${FLUSS_CARGO_EXECUTABLE} locate-project --workspace --message-format plain
+    OUTPUT_VARIABLE CARGO_MANIFEST_PATH
+    OUTPUT_STRIP_TRAILING_WHITESPACE
     WORKING_DIRECTORY ${PROJECT_SOURCE_DIR})
-string(REGEX REPLACE "/Cargo.toml\n$" "/target" CARGO_TARGET_DIR "${CARGO_TARGET_DIR}")
+if (NOT CARGO_MANIFEST_PATH)
+    message(FATAL_ERROR
+        "Failed to resolve Cargo workspace target dir via '${FLUSS_CARGO_EXECUTABLE} locate-project'. "
+        "Check Rust toolchain installation and PATH/CARGO.")
+endif()
+get_filename_component(CARGO_WORKSPACE_DIR "${CARGO_MANIFEST_PATH}" DIRECTORY)
+set(CARGO_TARGET_DIR "${CARGO_WORKSPACE_DIR}/target")
 
 set(CARGO_MANIFEST ${PROJECT_SOURCE_DIR}/Cargo.toml)
 set(RUST_SOURCE_FILE ${PROJECT_SOURCE_DIR}/src/lib.rs)
@@ -77,7 +195,7 @@ if (NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
 endif()
 
 add_custom_target(cargo_build
-    COMMAND cargo build --manifest-path ${CARGO_MANIFEST} ${CARGO_BUILD_FLAGS}
+    COMMAND ${CMAKE_COMMAND} -E env PROTOC=${FLUSS_PROTOC_EXECUTABLE} ${FLUSS_CARGO_EXECUTABLE} build --manifest-path ${CARGO_MANIFEST} ${CARGO_BUILD_FLAGS}
     BYPRODUCTS ${RUST_BRIDGE_CPP} ${RUST_LIB} ${RUST_HEADER_FILE}
     DEPENDS ${RUST_SOURCE_FILE}
     USES_TERMINAL
@@ -88,6 +206,9 @@ add_library(fluss_cpp STATIC ${CPP_SOURCE_FILE} ${RUST_BRIDGE_CPP})
 target_sources(fluss_cpp PUBLIC ${CPP_HEADER_FILE})
 target_sources(fluss_cpp PRIVATE ${RUST_HEADER_FILE})
 target_include_directories(fluss_cpp PUBLIC ${CPP_INCLUDE_DIR})
+if (FLUSS_CPP_ARROW_EXTRA_INCLUDE_DIRS)
+    target_include_directories(fluss_cpp PUBLIC ${FLUSS_CPP_ARROW_EXTRA_INCLUDE_DIRS})
+endif()
 target_link_libraries(fluss_cpp PUBLIC ${RUST_LIB})
 target_link_libraries(fluss_cpp PRIVATE ${CMAKE_DL_LIBS} Threads::Threads)
 target_link_libraries(fluss_cpp PUBLIC Arrow::arrow_shared)
@@ -114,9 +235,11 @@ target_link_libraries(fluss_cpp_kv_example PRIVATE Arrow::arrow_shared)
 target_compile_definitions(fluss_cpp_kv_example PRIVATE ARROW_FOUND)
 target_include_directories(fluss_cpp_kv_example PUBLIC ${CPP_INCLUDE_DIR})
 
-set_target_properties(fluss_cpp
-    PROPERTIES ADDITIONAL_CLEAN_FILES ${CARGO_TARGET_DIR}
-)
+if (CARGO_TARGET_DIR)
+    set_target_properties(fluss_cpp
+        PROPERTIES ADDITIONAL_CLEAN_FILES "${CARGO_TARGET_DIR}"
+    )
+endif()
 add_dependencies(fluss_cpp cargo_build)
 
 if (FLUSS_ENABLE_ADDRESS_SANITIZER)
diff --git a/fluss-rust/bindings/cpp/bazel/cpp/BUILD.bazel b/fluss-rust/bindings/cpp/bazel/cpp/BUILD.bazel
new file mode 100644
index 0000000000..e4b730dc9b
--- /dev/null
+++ b/fluss-rust/bindings/cpp/bazel/cpp/BUILD.bazel
@@ -0,0 +1,26 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+package(default_visibility = ["//visibility:public"])
+
+# Stable indirection target for the Arrow C++ dependency. The implementation
+# repo name can change across modes (registry/build/system) without touching
+# bindings/cpp/BUILD.bazel.
+alias(
+    name = "arrow_cpp_dep",
+    actual = "@apache_arrow_cpp//:arrow_cpp",
+)
diff --git a/fluss-rust/bindings/cpp/bazel/cpp/deps.bzl b/fluss-rust/bindings/cpp/bazel/cpp/deps.bzl
new file mode 100644
index 0000000000..6dd5e1b635
--- /dev/null
+++ b/fluss-rust/bindings/cpp/bazel/cpp/deps.bzl
@@ -0,0 +1,349 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Bzlmod extension for fluss C++ SDK dependency provisioning."""
+
+load("@bazel_tools//tools/build_defs/repo:http.bzl", "http_archive")
+
+_ARROW_BUILD_FILE_TEMPLATE = """
+load("@rules_foreign_cc//foreign_cc:defs.bzl", "cmake")
+
+package(default_visibility = ["//visibility:public"])
+
+filegroup(
+    name = "all_srcs",
+    srcs = glob(
+        ["**"],
+        exclude = [
+            "**/BUILD",
+            "**/BUILD.bazel",
+        ],
+    ),
+)
+
+cmake(
+    name = "arrow_cpp",
+    lib_source = ":all_srcs",
+    working_directory = "cpp",
+    generate_args = ["-GUnix Makefiles"],
+    cache_entries = {
+        "CMAKE_BUILD_TYPE": "Release",
+        "CMAKE_INSTALL_LIBDIR": "lib",
+        "CMAKE_POSITION_INDEPENDENT_CODE": "ON",
+        "ARROW_BUILD_SHARED": "ON",
+        "ARROW_BUILD_STATIC": "OFF",
+        "ARROW_BUILD_TESTS": "OFF",
+        "ARROW_BUILD_EXAMPLES": "OFF",
+        "ARROW_BUILD_BENCHMARKS": "OFF",
+        "ARROW_BUILD_INTEGRATION": "OFF",
+        "ARROW_BUILD_UTILITIES": "OFF",
+        "ARROW_COMPUTE": "OFF",
+        "ARROW_CSV": "OFF",
+        "ARROW_DATASET": "OFF",
+        "ARROW_FILESYSTEM": "OFF",
+        "ARROW_JSON": "OFF",
+        "ARROW_PARQUET": "OFF",
+        "ARROW_IPC": "ON",
+        "ARROW_JEMALLOC": "OFF",
+        "ARROW_MIMALLOC": "OFF",
+        "ARROW_SIMD_LEVEL": "NONE",
+        "ARROW_RUNTIME_SIMD_LEVEL": "NONE",
+        "ARROW_DEPENDENCY_SOURCE": "BUNDLED",
+        # Temporary workarounds for older images / Bazel sandbox toolchain detection.
+        "EP_CMAKE_RANLIB": "__EP_CMAKE_RANLIB__",
+        "EP_CMAKE_AR": "__EP_CMAKE_AR__",
+        "EP_CMAKE_NM": "__EP_CMAKE_NM__",
+    },
+    out_include_dir = "include",
+    out_lib_dir = "lib",
+    out_shared_libs = select({
+        "@platforms//os:macos": [
+            "libarrow.dylib",
+            "libarrow.1900.dylib",
+        ],
+        "//conditions:default": [
+            "libarrow.so",
+            "libarrow.so.1900",
+            "libarrow.so.1900.1.0",
+        ],
+    }),
+)
+"""
+
+_ARROW_PATCH_CMDS = [  # Rewrites the ARROW_CXX_COMPILER_FLAGS define in config.h.cmake to an empty string.
+    "sed -i.bak 's|#define ARROW_CXX_COMPILER_FLAGS \"@CMAKE_CXX_FLAGS@\"|#define ARROW_CXX_COMPILER_FLAGS \"\"|' cpp/src/arrow/util/config.h.cmake && rm -f cpp/src/arrow/util/config.h.cmake.bak",
+]  # NOTE(review): presumably keeps build-specific compiler flags out of the generated header; confirm.
+
+_SYSTEM_ARROW_BUILD_FILE_TEMPLATE = """
+load("@rules_cc//cc:defs.bzl", "cc_import", "cc_library")
+
+package(default_visibility = ["//visibility:public"])
+
+cc_import(
+    name = "arrow_shared_import",
+    shared_library = "__SYSTEM_ARROW_SHARED_LIBRARY__",
+)
+
+filegroup(
+    name = "arrow_runtime_libs",
+    srcs = [
+__SYSTEM_ARROW_RUNTIME_SRCS__
+    ],
+)
+
+cc_library(
+    name = "arrow_cpp",
+    hdrs = [
+__SYSTEM_ARROW_HDRS__
+    ],
+    includes = ["__SYSTEM_ARROW_INCLUDE_DIR__"],
+    data = [":arrow_runtime_libs"],
+    deps = [":arrow_shared_import"],
+)
+"""
+
+_ARROW_BUILD_VERSIONS = {
+    "19.0.1": {
+        "urls": ["https://github.com/apache/arrow/archive/refs/tags/apache-arrow-19.0.1.tar.gz"],
+        "strip_prefix": "arrow-apache-arrow-19.0.1",
+        "integrity": "sha256-TImFBJWIQcyGtvhxDsspGflrXhD6iYmsEKxPyoNi2Go=",
+    },
+}
+
+_config_tag = tag_class(attrs = {  # Attributes accepted by cpp_sdk.config(...).
+    "mode": attr.string(default = "build"),  # "build", "system" or "registry"; dispatched in _cpp_sdk_impl
+    "arrow_cpp_version": attr.string(default = "19.0.1"),  # build mode: key into _ARROW_BUILD_VERSIONS
+    "protobuf_version": attr.string(default = "3.25.5"),  # NOTE(review): declared but never read in this file
+    "ep_cmake_ranlib": attr.string(default = "ranlib"),  # build mode: value substituted for EP_CMAKE_RANLIB
+    "ep_cmake_ar": attr.string(default = "ar"),  # build mode: value substituted for EP_CMAKE_AR
+    "ep_cmake_nm": attr.string(default = "nm"),  # build mode: value substituted for EP_CMAKE_NM
+    "system_arrow_prefix": attr.string(default = "/usr"),  # system mode: root that the paths below are relative to
+    "system_arrow_include_dir": attr.string(default = "include"),  # system mode: headers are taken from <include_dir>/arrow
+    "system_arrow_shared_library": attr.string(default = "lib/x86_64-linux-gnu/libarrow.so"),  # system mode: library to import
+    "system_arrow_runtime_glob": attr.string(default = "lib/x86_64-linux-gnu/libarrow.so*"),  # system mode: directory + basename prefix
+})
+
+def _render_arrow_build_file(tag):
+    """Fills the binutils placeholders of the build-mode Arrow BUILD template.
+
+    Each __EP_CMAKE_*__ marker is replaced with the matching ep_cmake_* value
+    read from the given cpp_sdk.config tag.
+    """
+    rendered = _ARROW_BUILD_FILE_TEMPLATE
+    rendered = rendered.replace("__EP_CMAKE_RANLIB__", tag.ep_cmake_ranlib)
+    rendered = rendered.replace("__EP_CMAKE_AR__", tag.ep_cmake_ar)
+    rendered = rendered.replace("__EP_CMAKE_NM__", tag.ep_cmake_nm)
+    return rendered
+
+def _render_system_arrow_build_file(tag, shared_library_override = None):
+    """Renders the system-mode BUILD template with sysroot-relative library and include paths."""
+    # `tag` may expose system_arrow_* attributes (config tag) or the plain
+    # shared_library/include_dir attributes; a non-empty override wins for the library.
+    shared_library = shared_library_override
+    if not shared_library:
+        shared_library = tag.system_arrow_shared_library if hasattr(tag, "system_arrow_shared_library") else tag.shared_library
+    include_dir = tag.system_arrow_include_dir if hasattr(tag, "system_arrow_include_dir") else tag.include_dir
+    rendered = _SYSTEM_ARROW_BUILD_FILE_TEMPLATE.replace("__SYSTEM_ARROW_SHARED_LIBRARY__", "sysroot/" + shared_library)
+    return rendered.replace("__SYSTEM_ARROW_INCLUDE_DIR__", "sysroot/" + include_dir)
+
+def _starlark_string_list(items):
+    """Formats items as indented, quoted, comma-terminated lines (empty string for no items)."""
+    quoted = ['        "%s",' % entry for entry in items] if items else []
+    return "\n".join(quoted)
+
+def _list_files(repo_ctx, base_dir, suffixes):
+    """Lists regular files and symlinks below a directory, filtered by suffix.
+
+    Args:
+        repo_ctx: repository context used to run /usr/bin/find.
+        base_dir: directory that find searches.
+        suffixes: a path is kept when it ends with any of these strings.
+
+    Returns:
+        The matching paths, sorted, exactly as printed by find.
+    """
+    find_cmd = ["/usr/bin/find", base_dir, "(", "-type", "f", "-o", "-type", "l", ")"]
+    listing = repo_ctx.execute(find_cmd)
+    if listing.return_code != 0:
+        fail("failed to enumerate files under %s: %s" % (base_dir, listing.stderr))
+
+    matches = []
+    for path in listing.stdout.splitlines():
+        if any([path.endswith(suffix) for suffix in suffixes]):
+            matches.append(path)
+    return sorted(matches)
+
+def _copy_file_to_sysroot(repo_ctx, prefix, rel_path):
+    """Copies prefix/rel_path to sysroot/rel_path, creating the parent directory first."""
+    if rel_path.startswith("/"):
+        fail("expected relative path under prefix, got absolute path: %s" % rel_path)
+    source = prefix + "/" + rel_path
+    target = "sysroot/" + rel_path
+    target_dir = target.rsplit("/", 1)[0]  # target always contains the "sysroot/" separator
+    made = repo_ctx.execute(["/bin/mkdir", "-p", target_dir])
+    if made.return_code != 0:
+        fail("failed to create directory %s: %s" % (target_dir, made.stderr))
+    copied = repo_ctx.execute(["/bin/cp", "-L", source, target])  # -L copies link targets, keeping sysroot self-contained
+    if copied.return_code != 0:
+        fail("failed to copy %s to %s: %s" % (source, target, copied.stderr))
+
+def _system_arrow_repo_impl(repo_ctx):
+    """Copies Arrow headers and runtime libraries from a host prefix into sysroot/ and writes BUILD.bazel."""
+    prefix = repo_ctx.attr.prefix.rstrip("/")
+    include_dir = repo_ctx.attr.include_dir
+    shared_library = repo_ctx.attr.shared_library
+    runtime_glob = repo_ctx.attr.runtime_glob
+    mkdir_res = repo_ctx.execute(["/bin/mkdir", "-p", "sysroot"])
+    if mkdir_res.return_code != 0:
+        fail("failed to create sysroot directory: %s" % mkdir_res.stderr)
+
+    include_dir_for_scan = include_dir  # headers: only <prefix>/<include_dir>/arrow is scanned
+    if include_dir_for_scan.endswith("/"):
+        include_dir_for_scan = include_dir_for_scan[:-1]
+    header_root = prefix + "/" + include_dir_for_scan + "/arrow"
+    headers = _list_files(repo_ctx, header_root, [".h", ".hpp"])
+    header_srcs_rel = []  # paths relative to prefix (inputs of the copy step)
+    header_srcs = []  # the same paths under sysroot/ (labels in the generated BUILD file)
+    for h in headers:
+        if not h.startswith(prefix + "/"):
+            fail("header path %s is outside prefix %s" % (h, prefix))
+        rel = h[len(prefix) + 1:]
+        header_srcs_rel.append(rel)
+        header_srcs.append("sysroot/" + rel)
+
+    runtime_dir = runtime_glob.rsplit("/", 1)[0]  # NOTE: runtime_glob must contain a "/"; [1] below fails otherwise
+    runtime_prefix = runtime_glob.rsplit("/", 1)[1].replace("*", "")  # the glob is reduced to a basename prefix
+    runtime_files = _list_files(repo_ctx, prefix + "/" + runtime_dir, [""])  # "" suffix keeps every listed file
+    runtime_srcs_rel = []
+    runtime_srcs = []
+    for f in runtime_files:
+        rel = f[len(prefix) + 1:] if f.startswith(prefix + "/") else None
+        if rel == None:
+            continue
+        if rel.startswith(runtime_dir + "/") and rel.rsplit("/", 1)[1].startswith(runtime_prefix):
+            runtime_srcs_rel.append(rel)
+            runtime_srcs.append("sysroot/" + rel)
+    runtime_srcs_rel = sorted(runtime_srcs_rel)
+    runtime_srcs = sorted(runtime_srcs)
+
+    # Prefer a versioned soname file as the imported shared library so Bazel
+    # runfiles contain the exact filename required by the runtime loader.
+    shared_import_rel = "sysroot/" + shared_library
+    shared_basename = shared_library.rsplit("/", 1)[1]  # NOTE: shared_library must contain a "/" as well
+    soname_candidates = []
+    for rel in runtime_srcs_rel:
+        base = rel.rsplit("/", 1)[1]
+        if base == shared_basename:
+            continue
+        if base.startswith(shared_basename + "."):
+            soname_candidates.append("sysroot/" + rel)
+    if soname_candidates:
+        # Prefer shortest suffix first (e.g. libarrow.so.1900 before
+        # libarrow.so.1900.1.0) to match ELF SONAME naming when available.
+        soname_candidates = sorted(soname_candidates, key = lambda s: (len(s), s))
+        shared_import_rel = soname_candidates[0]
+
+    # Copy only required Arrow artifacts instead of mirroring the full system prefix.
+    copy_rel_paths = {}  # dict used as a set so each path is copied once
+    for rel in header_srcs_rel + runtime_srcs_rel + [shared_library]:
+        copy_rel_paths[rel] = True
+    for rel in sorted(copy_rel_paths.keys()):
+        _copy_file_to_sysroot(repo_ctx, prefix, rel)
+
+    build_file = _render_system_arrow_build_file(repo_ctx.attr, shared_library_override = shared_import_rel[len("sysroot/"):]).replace(
+        "__SYSTEM_ARROW_HDRS__",
+        _starlark_string_list(header_srcs),
+    ).replace(
+        "__SYSTEM_ARROW_RUNTIME_SRCS__",
+        _starlark_string_list(runtime_srcs),
+    )
+    repo_ctx.file("BUILD.bazel", build_file)
+
+_system_arrow_repository = repository_rule(  # Exposes a host Arrow install; implemented by _system_arrow_repo_impl.
+    implementation = _system_arrow_repo_impl,
+    attrs = {
+        "prefix": attr.string(mandatory = True),  # root directory; trailing "/" is stripped by the implementation
+        "include_dir": attr.string(mandatory = True),  # relative to prefix
+        "shared_library": attr.string(mandatory = True),  # relative to prefix
+        "runtime_glob": attr.string(mandatory = True),  # relative to prefix; only a trailing-* prefix match is applied
+    },
+    local = True,  # NOTE(review): marks the rule as reading the local system; confirm the refetch semantics
+)
+
+def _select_config(ctx):
+    """Returns the root module's cpp_sdk.config tag, else the single dependency default, else None."""
+    root_tags = []
+    dep_tags = []
+    dep_owners = {}
+    for mod in ctx.modules:
+        for tag in mod.tags.config:
+            if getattr(mod, "is_root", False):
+                root_tags.append(tag)
+            else:
+                dep_tags.append(tag)
+                dep_owners[mod.name] = True
+    if len(root_tags) > 1:
+        fail("cpp_sdk.config may only be declared once in the root module")
+    if root_tags:
+        return root_tags[0]
+    # Dependency defaults only matter when the root module does not override
+    # them, so conflicts between dependencies are checked after the root tag;
+    # defaults from one module are tolerated and its first tag is used.
+    if len(dep_owners) > 1:
+        fail("multiple dependency defaults for cpp_sdk.config without root override")
+    return dep_tags[0] if dep_tags else None
+
+def _cpp_sdk_impl(ctx):
+    """Module extension body: defines @apache_arrow_cpp for the selected mode.
+
+    - registry (or no config tag): defines nothing.
+    - system: wraps a preinstalled Arrow via _system_arrow_repository.
+    - build: downloads a pinned Arrow source archive built with rules_foreign_cc.
+    """
+    tag = _select_config(ctx)
+    if tag == None or tag.mode == "registry":
+        return
+    if tag.mode == "system":
+        _system_arrow_repository(
+            name = "apache_arrow_cpp",
+            prefix = tag.system_arrow_prefix,
+            include_dir = tag.system_arrow_include_dir,
+            shared_library = tag.system_arrow_shared_library,
+            runtime_glob = tag.system_arrow_runtime_glob,
+        )
+        return
+    if tag.mode != "build":
+        fail("unsupported cpp_sdk mode: %s" % tag.mode)
+
+    pinned = _ARROW_BUILD_VERSIONS.get(tag.arrow_cpp_version)
+    if pinned == None:
+        fail("unsupported arrow_cpp_version for build mode: %s" % tag.arrow_cpp_version)
+    http_archive(
+        name = "apache_arrow_cpp",
+        urls = pinned["urls"],
+        strip_prefix = pinned["strip_prefix"],
+        integrity = pinned["integrity"],
+        patch_cmds = _ARROW_PATCH_CMDS,
+        build_file_content = _render_arrow_build_file(tag),
+    )
+
+cpp_sdk = module_extension(
+    implementation = _cpp_sdk_impl,
+    tag_classes = {
+        "config": _config_tag,
+    },
+)
diff --git a/fluss-rust/bindings/cpp/MODULE.bazel b/fluss-rust/bindings/cpp/examples/bazel-consumer/build/BUILD.bazel
similarity index 80%
rename from fluss-rust/bindings/cpp/MODULE.bazel
rename to fluss-rust/bindings/cpp/examples/bazel-consumer/build/BUILD.bazel
index f75d3e6f69..afd35edd7e 100644
--- a/fluss-rust/bindings/cpp/MODULE.bazel
+++ b/fluss-rust/bindings/cpp/examples/bazel-consumer/build/BUILD.bazel
@@ -15,9 +15,11 @@
 # specific language governing permissions and limitations
 # under the License.
 
-module(
-    name = "fluss_cpp",
-)
+load("@rules_cc//cc:defs.bzl", "cc_binary")
 
-bazel_dep(name = "rules_cc", version = "0.0.17")
-bazel_dep(name = "platforms", version = "0.0.10")
+cc_binary(
+    name = "consumer_build",
+    srcs = ["main.cc"],
+    copts = ["-std=c++17"],
+    deps = ["@fluss-cpp//bindings/cpp:fluss_cpp"],
+)
diff --git a/fluss-rust/bindings/cpp/examples/bazel-consumer/build/MODULE.bazel b/fluss-rust/bindings/cpp/examples/bazel-consumer/build/MODULE.bazel
new file mode 100644
index 0000000000..f31165c1cd
--- /dev/null
+++ b/fluss-rust/bindings/cpp/examples/bazel-consumer/build/MODULE.bazel
@@ -0,0 +1,39 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+module(name = "fluss_cpp_consumer_build")
+
+bazel_dep(name = "rules_cc", version = "0.2.14")
+bazel_dep(name = "fluss-cpp", version = "0.1.0")
+
+# Local override for repository-local validation only.
+local_path_override(
+    module_name = "fluss-cpp",
+    # Repository root path (the directory containing `bindings/cpp`).
+    path = "../../../../../",
+)
+
+fluss_cpp = use_extension("@fluss-cpp//bindings/cpp/bazel/cpp:deps.bzl", "cpp_sdk")
+fluss_cpp.config(
+    mode = "build",
+    protobuf_version = "3.25.5",
+    arrow_cpp_version = "19.0.1",
+    ep_cmake_ranlib = "/usr/bin/ranlib",
+    ep_cmake_ar = "/usr/bin/ar",
+    ep_cmake_nm = "/usr/bin/nm",
+)
+use_repo(fluss_cpp, "apache_arrow_cpp")
diff --git a/fluss-rust/bindings/cpp/examples/bazel-consumer/build/main.cc b/fluss-rust/bindings/cpp/examples/bazel-consumer/build/main.cc
new file mode 100644
index 0000000000..87e5b6820f
--- /dev/null
+++ b/fluss-rust/bindings/cpp/examples/bazel-consumer/build/main.cc
@@ -0,0 +1,28 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#include "fluss.hpp"
+
+#include <iostream>
+
+// Smoke test for the build-mode example: constructs a TablePath and prints it.
+int main() {
+    fluss::TablePath table_path("demo_db", "demo_table");
+    std::cout << "Bazel build-mode dependency example ready: "
+              << table_path.ToString() << std::endl;
+    return 0;
+}
diff --git a/fluss-rust/bindings/cpp/examples/bazel-consumer/system/BUILD.bazel b/fluss-rust/bindings/cpp/examples/bazel-consumer/system/BUILD.bazel
new file mode 100644
index 0000000000..2f24e6dec7
--- /dev/null
+++ b/fluss-rust/bindings/cpp/examples/bazel-consumer/system/BUILD.bazel
@@ -0,0 +1,25 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+load("@rules_cc//cc:defs.bzl", "cc_binary")
+
+cc_binary(
+    name = "consumer_system",
+    srcs = ["main.cc"],
+    copts = ["-std=c++17"],
+    deps = ["@fluss-cpp//bindings/cpp:fluss_cpp"],
+)
diff --git a/fluss-rust/bindings/cpp/examples/bazel-consumer/system/MODULE.bazel b/fluss-rust/bindings/cpp/examples/bazel-consumer/system/MODULE.bazel
new file mode 100644
index 0000000000..2a4d6a6584
--- /dev/null
+++ b/fluss-rust/bindings/cpp/examples/bazel-consumer/system/MODULE.bazel
@@ -0,0 +1,44 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+module(name = "fluss_cpp_consumer_system")
+
+bazel_dep(name = "rules_cc", version = "0.2.14")
+bazel_dep(name = "fluss-cpp", version = "0.1.0")
+
+# Repository-local example path (repository root containing `bindings/cpp`).
+# If you copy this example out of tree, replace this with an absolute path
+# (for example: /path/to/fluss-rust).
+local_path_override(
+    module_name = "fluss-cpp",
+    path = "../../../../../",
+)
+
+# Intended interface for preinstalled protoc + Arrow C++ environments.
+fluss_cpp = use_extension("@fluss-cpp//bindings/cpp/bazel/cpp:deps.bzl", "cpp_sdk")
+fluss_cpp.config(
+    mode = "system",
+    protobuf_version = "3.25.5",
+    arrow_cpp_version = "19.0.1",
+    # Adjust these paths for your environment.
+    # Ubuntu 22.04 (apt / custom package) commonly uses lib/x86_64-linux-gnu.
+    system_arrow_prefix = "/usr",
+    system_arrow_include_dir = "include",
+    system_arrow_shared_library = "lib/x86_64-linux-gnu/libarrow.so",
+    system_arrow_runtime_glob = "lib/x86_64-linux-gnu/libarrow.so*",
+)
+use_repo(fluss_cpp, "apache_arrow_cpp")
diff --git a/fluss-rust/bindings/cpp/examples/bazel-consumer/system/main.cc b/fluss-rust/bindings/cpp/examples/bazel-consumer/system/main.cc
new file mode 100644
index 0000000000..b1f0b70b84
--- /dev/null
+++ b/fluss-rust/bindings/cpp/examples/bazel-consumer/system/main.cc
@@ -0,0 +1,27 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+#include "fluss.hpp"
+
+#include <iostream>
+
+int main() {  // Smoke test for the system-mode example: constructs a TablePath and prints it.
+    fluss::TablePath table_path("demo_db", "demo_table");
+    std::cout << "Bazel system-mode dependency example ready: "
+              << table_path.ToString() << std::endl;
+    return 0;
+}
diff --git a/fluss-rust/bindings/cpp/scripts/ensure_protoc.sh b/fluss-rust/bindings/cpp/scripts/ensure_protoc.sh
new file mode 100755
index 0000000000..3210bcc7a5
--- /dev/null
+++ b/fluss-rust/bindings/cpp/scripts/ensure_protoc.sh
@@ -0,0 +1,277 @@
+#!/bin/bash
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+set -euo pipefail
+
+PROTOBUF_BASELINE_VERSION="${PROTOBUF_BASELINE_VERSION:-3.25.5}"
+if [[ -n "${XDG_CACHE_HOME:-}" ]]; then
+  _PROTOC_DEFAULT_CACHE_BASE="${XDG_CACHE_HOME}"
+elif [[ -n "${HOME:-}" ]]; then
+  _PROTOC_DEFAULT_CACHE_BASE="${HOME}/.cache"
+else
+  _PROTOC_DEFAULT_CACHE_BASE="/tmp"
+fi
+
+_PROTOC_UNAME_S="$(uname -s | tr '[:upper:]' '[:lower:]')"
+case "${_PROTOC_UNAME_S}" in
+  linux*)
+    _PROTOC_DEFAULT_OS="linux"
+    ;;
+  darwin*)
+    _PROTOC_DEFAULT_OS="osx"
+    ;;
+  *)
+    echo "ERROR: unsupported host OS '${_PROTOC_UNAME_S}'. Please set PROTOC_OS explicitly." >&2
+    exit 1
+    ;;
+esac
+
+_PROTOC_UNAME_M="$(uname -m)"
+case "${_PROTOC_UNAME_M}" in
+  x86_64|amd64)
+    _PROTOC_DEFAULT_ARCH="x86_64"
+    ;;
+  aarch64|arm64)
+    _PROTOC_DEFAULT_ARCH="aarch_64"
+    ;;
+  *)
+    echo "ERROR: unsupported host arch '${_PROTOC_UNAME_M}'. Please set PROTOC_ARCH explicitly." >&2
+    exit 1
+    ;;
+esac
+
+PROTOC_INSTALL_ROOT="${PROTOC_INSTALL_ROOT:-${_PROTOC_DEFAULT_CACHE_BASE}/fluss-cpp-tools}"
+PROTOC_OS="${PROTOC_OS:-${_PROTOC_DEFAULT_OS}}"
+PROTOC_ARCH="${PROTOC_ARCH:-${_PROTOC_DEFAULT_ARCH}}"
+PROTOC_FORCE_INSTALL="${PROTOC_FORCE_INSTALL:-0}"
+PROTOC_PRINT_PATH_ONLY="${PROTOC_PRINT_PATH_ONLY:-0}"
+PROTOC_ALLOW_INSECURE_DOWNLOAD="${PROTOC_ALLOW_INSECURE_DOWNLOAD:-0}"
+PROTOC_SKIP_CHECKSUM_VERIFY="${PROTOC_SKIP_CHECKSUM_VERIFY:-0}"
+
+# Print command-line help; the heredoc is quoted, so it is emitted verbatim.
+usage() {
+  cat <<'EOF'
+Usage: bindings/cpp/scripts/ensure_protoc.sh [--print-path]
+
+Ensures a protoc binary matching the configured protobuf baseline is available.
+Installs into a local cache directory (default: $XDG_CACHE_HOME/fluss-cpp-tools
+or $HOME/.cache/fluss-cpp-tools) and prints the protoc path on stdout.
+
+Env vars:
+  PROTOBUF_BASELINE_VERSION  Baseline protobuf version (default: 3.25.5)
+  PROTOC_INSTALL_ROOT        Local cache root (default: XDG/HOME cache dir)
+  PROTOC_OS                 protoc package OS (default: auto-detect host: linux/osx)
+  PROTOC_ARCH               protoc package arch (default: auto-detect host: x86_64/aarch_64)
+  PROTOC_FORCE_INSTALL      1 to force re-download
+  PROTOC_ALLOW_INSECURE_DOWNLOAD
+                            1 to disable TLS verification (not recommended)
+  PROTOC_SKIP_CHECKSUM_VERIFY
+                            1 to skip pinned archive checksum verification
+  BAZEL_PROXY_URL           Optional proxy (sets curl/wget proxy envs if present)
+EOF
+}
+
+for arg in "$@"; do  # Parse command-line flags; anything unrecognised is an error.
+  case "$arg" in
+    --print-path)
+      PROTOC_PRINT_PATH_ONLY=1  # Flag is recorded, but the script prints only the protoc path either way.
+      ;;
+    -h|--help)
+      usage
+      exit 0
+      ;;
+    *)
+      echo "Unknown argument: $arg" >&2
+      usage >&2
+      exit 1
+      ;;
+  esac
+done
+
+setup_proxy_env() {
+  if [[ -n "${BAZEL_PROXY_URL:-}" ]]; then
+    export http_proxy="${http_proxy:-$BAZEL_PROXY_URL}"
+    export https_proxy="${https_proxy:-$BAZEL_PROXY_URL}"
+    export HTTP_PROXY="${HTTP_PROXY:-$http_proxy}"
+    export HTTPS_PROXY="${HTTPS_PROXY:-$https_proxy}"
+  fi
+}
+
+# Map a protobuf version to the tag used by protoc release archives: 3.X.Y is
+# shortened to X.Y when X >= 21 (for example 3.25.5 -> 25.5). Any other
+# version string is echoed unchanged.
+normalize_version_for_protoc_release() {
+  local version="$1"
+  local release="$version"
+  if [[ "$version" =~ ^3\.([0-9]+\.[0-9]+)$ ]]; then
+    local short="${BASH_REMATCH[1]}"
+    if [[ "${short%%.*}" -ge 21 ]]; then
+      release="$short"
+    fi
+  fi
+  echo "$release"
+}
+
+version_matches_baseline() {
+  local actual="$1"
+  local baseline="$2"
+  local actual_norm baseline_norm
+  actual_norm="$(normalize_version_for_protoc_release "$actual")"
+  baseline_norm="$(normalize_version_for_protoc_release "$baseline")"
+  [[ "$actual" == "$baseline" || "$actual_norm" == "$baseline_norm" ]]
+}
+
+# Print the pinned SHA-256 for the protoc archive identified by release
+# version, OS and arch. Returns 1 without output when that combination has
+# no pinned checksum.
+lookup_protoc_archive_sha256() {
+  local release_version="$1"
+  local os="$2"
+  local arch="$3"
+  local key="${release_version}:${os}:${arch}"
+  local pinned=""
+
+  case "${key}" in
+    25.5:linux:aarch_64) pinned="dc715bb5aab2ebf9653d7d3efbe55e01a035e45c26f391ff6d9b7923e22914b7" ;;
+    25.5:linux:x86_64) pinned="e1ed237a17b2e851cf9662cb5ad02b46e70ff8e060e05984725bc4b4228c6b28" ;;
+    25.5:osx:aarch_64) pinned="781a6fc4c265034872cadc65e63dd3c0fc49245b70917821b60e2d457a6876ab" ;;
+    25.5:osx:x86_64) pinned="c5447e4f0d5caffb18d9ff21eae7bc7faf2bb2000083d6f49e5b6000b30fceae" ;;
+    *)
+      return 1
+      ;;
+  esac
+
+  echo "${pinned}"
+}
+
+# Compare the SHA-256 of a file with the expected hex digest. Uses sha256sum or,
+# failing that, shasum; returns 1 with a message on stderr if neither tool is
+# available or the digests differ.
+verify_download_sha256() {
+  local file="$1" expected="$2" actual=""
+  if command -v sha256sum >/dev/null 2>&1; then
+    actual="$(sha256sum "$file" | awk '{print $1}')"
+  elif command -v shasum >/dev/null 2>&1; then
+    actual="$(shasum -a 256 "$file" | awk '{print $1}')"
+  else
+    echo "ERROR: neither sha256sum nor shasum is available for checksum verification." >&2
+    return 1
+  fi
+  [[ "$actual" == "$expected" ]] && return 0
+  echo "ERROR: protoc archive checksum mismatch." >&2
+  echo "  expected: $expected" >&2
+  echo "  actual:   $actual" >&2
+  return 1
+}
+
+# Fetch url into out with curl, else wget. wget_args may be empty, so it uses the
+# ${arr[@]+...} guard: plain "${arr[@]}" aborts under `set -u` on bash < 4.4.
+download_file() {
+  local url="$1" out="$2"
+  if command -v curl >/dev/null 2>&1; then
+    local curl_args=(-fL)
+    if [[ "${PROTOC_ALLOW_INSECURE_DOWNLOAD}" == "1" ]]; then
+      curl_args+=(-k)
+    fi
+    curl "${curl_args[@]}" "$url" -o "$out"
+    return 0
+  fi
+
+  if command -v wget >/dev/null 2>&1; then
+    local wget_args=()
+    if [[ -n "${https_proxy:-}" || -n "${http_proxy:-}" ]]; then
+      wget_args+=(-e use_proxy=yes)
+      if [[ -n "${https_proxy:-}" ]]; then
+        wget_args+=(-e "https_proxy=${https_proxy}")
+      fi
+      if [[ -n "${http_proxy:-}" ]]; then
+        wget_args+=(-e "http_proxy=${http_proxy}")
+      fi
+    fi
+    if [[ "${PROTOC_ALLOW_INSECURE_DOWNLOAD}" == "1" ]]; then
+      wget_args+=(--no-check-certificate)
+    fi
+    wget ${wget_args[@]+"${wget_args[@]}"} -O "$out" "$url"
+    return 0
+  fi
+
+  echo "ERROR: neither curl nor wget is available for downloading protoc." >&2
+  return 1
+}
+
+# Exit with an error unless unzip, needed to unpack the archive, is installed.
+ensure_zip_tools() {
+  command -v unzip >/dev/null 2>&1 && return 0
+  echo "ERROR: unzip not found." >&2
+  exit 1
+}
+
+setup_proxy_env
+ensure_zip_tools
+
+if command -v protoc >/dev/null 2>&1; then
+  existing_out="$(protoc --version 2>/dev/null || true)"
+  if [[ "$existing_out" =~ ([0-9]+\.[0-9]+\.[0-9]+) ]]; then
+    existing_ver="${BASH_REMATCH[1]}"
+    if version_matches_baseline "$existing_ver" "$PROTOBUF_BASELINE_VERSION"; then
+      command -v protoc
+      exit 0
+    fi
+  fi
+fi
+
+PROTOC_RELEASE_VERSION="$(normalize_version_for_protoc_release "$PROTOBUF_BASELINE_VERSION")"
+PROTOC_ARCHIVE="protoc-${PROTOC_RELEASE_VERSION}-${PROTOC_OS}-${PROTOC_ARCH}.zip"
+PROTOC_URL="https://github.com/protocolbuffers/protobuf/releases/download/v${PROTOC_RELEASE_VERSION}/${PROTOC_ARCHIVE}"
+PROTOC_PREFIX="${PROTOC_INSTALL_ROOT}/protoc-${PROTOC_RELEASE_VERSION}-${PROTOC_OS}-${PROTOC_ARCH}"
+PROTOC_BIN="${PROTOC_PREFIX}/bin/protoc"
+
+if [[ "${PROTOC_FORCE_INSTALL}" != "1" && -x "${PROTOC_BIN}" ]]; then
+  if [[ "${PROTOC_PRINT_PATH_ONLY}" == "1" ]]; then
+    echo "${PROTOC_BIN}"
+  else
+    echo "${PROTOC_BIN}"
+  fi
+  exit 0
+fi
+
+mkdir -p "${PROTOC_INSTALL_ROOT}"
+tmpdir="$(mktemp -d "${PROTOC_INSTALL_ROOT}/.protoc-download.XXXXXX")"
+trap 'rm -rf "${tmpdir}"' EXIT
+
+archive_path="${tmpdir}/${PROTOC_ARCHIVE}"
+download_file "${PROTOC_URL}" "${archive_path}"
+if [[ "${PROTOC_SKIP_CHECKSUM_VERIFY}" != "1" ]]; then
+  if expected_sha256="$(lookup_protoc_archive_sha256 "${PROTOC_RELEASE_VERSION}" "${PROTOC_OS}" "${PROTOC_ARCH}")"; then
+    verify_download_sha256 "${archive_path}" "${expected_sha256}"
+  else
+    echo "ERROR: no pinned checksum for protoc archive ${PROTOC_ARCHIVE}. Set PROTOC_SKIP_CHECKSUM_VERIFY=1 to bypass." >&2
+    exit 1
+  fi
+fi
+
+extract_dir="${tmpdir}/extract"
+mkdir -p "${extract_dir}"
+unzip -q "${archive_path}" -d "${extract_dir}"
+
+rm -rf "${PROTOC_PREFIX}"
+mkdir -p "${PROTOC_PREFIX}"
+cp -a "${extract_dir}/." "${PROTOC_PREFIX}/"
+chmod +x "${PROTOC_BIN}"
+
+echo "${PROTOC_BIN}"
diff --git a/fluss-rust/docs/cpp-bazel-usage.md b/fluss-rust/docs/cpp-bazel-usage.md
new file mode 100644
index 0000000000..61d861edcc
--- /dev/null
+++ b/fluss-rust/docs/cpp-bazel-usage.md
@@ -0,0 +1,291 @@
+# Fluss C++ Bazel Usage Guide (System / Build Modes)
+
+This guide is for:
+
+- C++ application teams consuming Fluss C++ bindings via Bazel
+- Maintainers evolving the Bazel integration
+
+For the CMake flow with the same `system` / `build` dependency modes, see
+`docs/cpp-cmake-usage.md`.
+
+Current simplification scope:
+
+- Keep only two dependency modes in the mainline guidance:
+  - `system`
+  - `build`
+- The strict internal-registry-only module flow is deferred and is not part of the mainline path
+
+## Scope
+
+- Dependency model: **root module mode**
+- Consumer dependency target: `@fluss-cpp//bindings/cpp:fluss_cpp`
+- Root `MODULE.bazel` is required for root module mode.
+- Build systems covered by this document: **Bazel**
+- Dependency modes covered by this document: **system/build**
+
+Version baseline references currently used by examples:
+
+- `protobuf/protoc`: `3.25.5`
+- `arrow-cpp`: `19.0.1`
+
+## Common Consumer `BUILD.bazel`
+
+Both modes use the same dependency target:
+
+```starlark
+load("@rules_cc//cc:defs.bzl", "cc_binary")
+
+cc_binary(
+    name = "fluss_reader",
+    srcs = ["reader.cc"],
+    deps = ["@fluss-cpp//bindings/cpp:fluss_cpp"],
+)
+```
+
+## Mode 1: `system` (Recommended in preinstalled environments)
+
+Use this mode when your environment already provides:
+
+- `protoc`
+- Arrow C++ (headers + shared libraries)
+
+### Consumer `MODULE.bazel` (pattern)
+
+```starlark
+module(name = "my_cpp_app")
+
+bazel_dep(name = "rules_cc", version = "0.2.14")
+bazel_dep(name = "fluss-cpp", version = "<released-version>")
+
+fluss_cpp = use_extension("@fluss-cpp//bindings/cpp/bazel/cpp:deps.bzl", "cpp_sdk")
+fluss_cpp.config(
+    mode = "system",
+    protobuf_version = "3.25.5",
+    arrow_cpp_version = "19.0.1",
+    # Adjust Arrow paths for your environment
+    system_arrow_prefix = "/usr",
+    system_arrow_include_dir = "include",
+    system_arrow_shared_library = "lib/x86_64-linux-gnu/libarrow.so",
+    system_arrow_runtime_glob = "lib/x86_64-linux-gnu/libarrow.so*",
+)
+use_repo(fluss_cpp, "apache_arrow_cpp")
+```
+
+### Build and run (consumer workspace pattern)
+
+Run from your consumer workspace root (the directory containing
+`MODULE.bazel` and your top-level `BUILD.bazel`).
+
+```bash
+PROTOC_BIN="$(command -v protoc)"
+CARGO_BIN="$(command -v cargo)"
+bazel run \
+  --action_env=PROTOC="$PROTOC_BIN" \
+  --action_env=CARGO="$CARGO_BIN" \
+  --action_env=PATH="$(dirname "$CARGO_BIN"):$PATH" \
+  //:fluss_reader
+```
+
+### Runnable example
+
+- `bindings/cpp/examples/bazel-consumer/system`
+
+```bash
+cd bindings/cpp/examples/bazel-consumer/system
+PROTOC_BIN="$(command -v protoc)"
+CARGO_BIN="$(command -v cargo)"
+bazel run \
+  --action_env=PROTOC="$PROTOC_BIN" \
+  --action_env=CARGO="$CARGO_BIN" \
+  --action_env=PATH="$(dirname "$CARGO_BIN"):$PATH" \
+  //:consumer_system
+```
+
+## Mode 2: `build` (No internal registry / no preinstalled Arrow)
+
+Use this mode when Arrow C++ is not preinstalled and you want Bazel to
+provision it from source.
+
+### Consumer `MODULE.bazel` (pattern)
+
+```starlark
+module(name = "my_cpp_app")
+
+bazel_dep(name = "rules_cc", version = "0.2.14")
+bazel_dep(name = "fluss-cpp", version = "<released-version>")
+
+fluss_cpp = use_extension("@fluss-cpp//bindings/cpp/bazel/cpp:deps.bzl", "cpp_sdk")
+fluss_cpp.config(
+    mode = "build",
+    protobuf_version = "3.25.5",
+    arrow_cpp_version = "19.0.1",
+)
+use_repo(fluss_cpp, "apache_arrow_cpp")
+```
+
+Notes:
+
+- `build` mode in the core Bazel integration still uses `PROTOC` (env / PATH).
+- To auto-download a pinned `protoc` for `build` mode, use
+  `bindings/cpp/scripts/ensure_protoc.sh` and pass the result via `--action_env=PROTOC=...`.
+- `ensure_protoc.sh` auto-detects host OS/arch (`linux`/`osx`, `x86_64`/`aarch_64`).
+- Some environments may require `ep_cmake_ar/ranlib/nm` overrides.
+
+### Build and run (consumer workspace pattern, with auto-downloaded `protoc`)
+
+Resolve `protoc` from the `fluss-rust` repository root (or adjust the script path
+if you copied it elsewhere), then run Bazel from your consumer workspace root.
+
+```bash
+PROTOC_BIN="$(bash bindings/cpp/scripts/ensure_protoc.sh --print-path)"
+```
+
+```bash
+bazel run --action_env=PROTOC="$PROTOC_BIN" //:fluss_reader
+```
+
+If `cargo` is not on Bazel action `PATH`, also pass:
+
+```bash
+CARGO_BIN="$(command -v cargo)"
+bazel run \
+  --action_env=PROTOC="$PROTOC_BIN" \
+  --action_env=CARGO="$CARGO_BIN" \
+  --action_env=PATH="$(dirname "$CARGO_BIN"):$PATH" \
+  //:fluss_reader
+```
+
+### Runnable example
+
+- `bindings/cpp/examples/bazel-consumer/build`
+
+```bash
+cd bindings/cpp/examples/bazel-consumer/build
+PROTOC_BIN="$(bash ../../../scripts/ensure_protoc.sh --print-path)"
+CARGO_BIN="$(command -v cargo)"
+bazel run \
+  --action_env=PROTOC="$PROTOC_BIN" \
+  --action_env=CARGO="$CARGO_BIN" \
+  --action_env=PATH="$(dirname "$CARGO_BIN"):$PATH" \
+  //:consumer_build
+```
+
+## Local Development Override (Optional)
+
+For repository-local validation only:
+
+```starlark
+local_path_override(
+    module_name = "fluss-cpp",
+    path = "/path/to/fluss-rust",
+)
+```
+
+Do not keep local overrides in long-lived branches.
+
+Repository-local examples in this repo use `version = "0.1.0"` together with
+`local_path_override(...)` for local validation before publishing to the Bazel
+registry.
+
+## Repository-local Validation (Direct Commands)
+
+These commands validate the repository examples directly.
+If your environment requires a proxy for Bazel external downloads, export it
+before running (replace the placeholder URL with your actual proxy):
+
+```bash
+export BAZEL_PROXY_URL="http://proxy.example.com:3128"
+export http_proxy="$BAZEL_PROXY_URL"
+export https_proxy="$BAZEL_PROXY_URL"
+export HTTP_PROXY="$http_proxy"
+export HTTPS_PROXY="$https_proxy"
+unset all_proxy ALL_PROXY
+```
+
+### Validate `build` example
+
+```bash
+cd bindings/cpp/examples/bazel-consumer/build
+PROTOC_BIN="$(bash ../../../scripts/ensure_protoc.sh --print-path)"
+CARGO_BIN="$(command -v cargo)"
+bazel --ignore_all_rc_files run \
+  --registry=https://bcr.bazel.build \
+  --lockfile_mode=off \
+  --repo_env=http_proxy="${http_proxy:-}" \
+  --repo_env=https_proxy="${https_proxy:-}" \
+  --repo_env=HTTP_PROXY="${HTTP_PROXY:-}" \
+  --repo_env=HTTPS_PROXY="${HTTPS_PROXY:-}" \
+  --action_env=http_proxy="${http_proxy:-}" \
+  --action_env=https_proxy="${https_proxy:-}" \
+  --action_env=HTTP_PROXY="${HTTP_PROXY:-}" \
+  --action_env=HTTPS_PROXY="${HTTPS_PROXY:-}" \
+  --action_env=all_proxy= \
+  --action_env=ALL_PROXY= \
+  --action_env=PROTOC="$PROTOC_BIN" \
+  --action_env=CARGO="$CARGO_BIN" \
+  --action_env=PATH="$(dirname "$CARGO_BIN"):$PATH" \
+  --strategy=CcCmakeMakeRule=local \
+  --strategy=BootstrapGNUMake=local \
+  --strategy=BootstrapPkgConfig=local \
+  //:consumer_build
+```
+
+### Validate `system` example (using a local Arrow prefix)
+
+The `system` example defaults to `/usr`. If your Arrow prefix is elsewhere
+(for example a locally built prefix), copy the example to a temp directory and
+patch `MODULE.bazel` before running:
+
+```bash
+tmp_dir="$(mktemp -d /tmp/fluss-bazel-system-doc.XXXXXX)"
+FLUSS_RUST_ROOT="$(pwd)"
+cp -a bindings/cpp/examples/bazel-consumer/system/. "$tmp_dir/"
+sed -i \
+  -e "s|path = \"../../../../../\"|path = \"$FLUSS_RUST_ROOT\"|" \
+  -e 's|system_arrow_prefix = "/usr"|system_arrow_prefix = "/tmp/fluss-system-arrow-19.0.1"|' \
+  -e 's|system_arrow_shared_library = "lib/x86_64-linux-gnu/libarrow.so"|system_arrow_shared_library = "lib/libarrow.so"|' \
+  -e 's|system_arrow_runtime_glob = "lib/x86_64-linux-gnu/libarrow.so\*"|system_arrow_runtime_glob = "lib/libarrow.so*"|' \
+  "$tmp_dir/MODULE.bazel"
+cd "$tmp_dir"
+PROTOC_BIN="$(command -v protoc)"
+CARGO_BIN="$(command -v cargo)"
+bazel --ignore_all_rc_files run \
+  --registry=https://bcr.bazel.build \
+  --lockfile_mode=off \
+  --repo_env=http_proxy="${http_proxy:-}" \
+  --repo_env=https_proxy="${https_proxy:-}" \
+  --repo_env=HTTP_PROXY="${HTTP_PROXY:-}" \
+  --repo_env=HTTPS_PROXY="${HTTPS_PROXY:-}" \
+  --action_env=http_proxy="${http_proxy:-}" \
+  --action_env=https_proxy="${https_proxy:-}" \
+  --action_env=HTTP_PROXY="${HTTP_PROXY:-}" \
+  --action_env=HTTPS_PROXY="${HTTPS_PROXY:-}" \
+  --action_env=all_proxy= \
+  --action_env=ALL_PROXY= \
+  --action_env=PROTOC="$PROTOC_BIN" \
+  --action_env=CARGO="$CARGO_BIN" \
+  --action_env=PATH="$(dirname "$CARGO_BIN"):$PATH" \
+  //:consumer_system
+```
+
+On macOS (BSD `sed`), replace `sed -i` with `sed -i ''` in the patch step above.
+
+## Upgrade Procedure
+
+1. Update `bazel_dep(name = "fluss-cpp", version = "...")`
+2. Update mode version settings if needed (`protobuf_version`, `arrow_cpp_version`)
+3. Run `bazel mod tidy`
+4. Commit `MODULE.bazel` and `MODULE.bazel.lock`
+5. Run build + tests
+6. Verify dependency graph:
+
+```bash
+bazel mod graph | rg "fluss-cpp@"
+```
+
+## Examples
+
+Mainline examples:
+
+- `bindings/cpp/examples/bazel-consumer/build`
+- `bindings/cpp/examples/bazel-consumer/system`
diff --git a/fluss-rust/docs/cpp-cmake-usage.md b/fluss-rust/docs/cpp-cmake-usage.md
new file mode 100644
index 0000000000..3002d1c4b4
--- /dev/null
+++ b/fluss-rust/docs/cpp-cmake-usage.md
@@ -0,0 +1,129 @@
+# Fluss C++ CMake Usage Guide (System / Build Modes)
+
+## Audience
+
+- C++ application teams building `bindings/cpp` with CMake
+- Maintainers evolving Fluss C++ dependency provisioning
+
+## Scope
+
+- Build system covered by this document: **CMake**
+- Dependency modes covered by this document: **system/build**
+
+Current tested baselines:
+
+- `protoc`: `3.25.5`
+- `arrow-cpp`: `19.0.1`
+
+Notes:
+
+- CMake currently warns (does not fail) when local `protoc`/Arrow versions differ from the baselines.
+- `protoc` is required because Rust `prost-build` runs during the C++ build.
+
+## Common Prerequisites
+
+- Rust toolchain (`cargo` in `PATH`, or set `CARGO=/path/to/cargo`)
+- `protoc` in `PATH` (required for `system` mode; `build` mode can auto-download via `bindings/cpp/scripts/ensure_protoc.sh`)
+- C++17 compiler
+- CMake 3.22+
+
+Examples below use `bindings/cpp` as the source directory.
+
+## Mode 1: `system`
+
+Use this mode when the environment already provides Arrow C++.
+
+### Configure
+
+```bash
+cmake -S bindings/cpp -B /tmp/fluss-cpp-cmake-system \
+  -DFLUSS_CPP_DEP_MODE=system \
+  -DFLUSS_CPP_ARROW_SYSTEM_ROOT=/path/to/arrow/prefix
+```
+
+Typical prefixes:
+
+- Ubuntu package install: `/usr`
+- Custom install prefix: `/usr/local` or `/opt/arrow`
+
+### Build
+
+```bash
+cmake --build /tmp/fluss-cpp-cmake-system --target fluss_cpp -j
+```
+
+## Mode 2: `build`
+
+Use this mode when Arrow C++ is not preinstalled and CMake should fetch/build it.
+
+### Configure (with auto-downloaded `protoc`)
+
+```bash
+PROTOC_BIN="$(bash bindings/cpp/scripts/ensure_protoc.sh --print-path)"
+export PATH="$(dirname "$PROTOC_BIN"):$PATH"
+```
+
+Then configure:
+
+```bash
+cmake -S bindings/cpp -B /tmp/fluss-cpp-cmake-build \
+  -DFLUSS_CPP_DEP_MODE=build
+```
+
+Optional overrides:
+
+- `-DFLUSS_CPP_ARROW_VERSION=19.0.1`
+- `-DFLUSS_CPP_ARROW_SOURCE_URL=...` (internal mirror or pinned archive)
+- `-DFLUSS_CPP_PROTOBUF_VERSION=3.25.5` (baseline warning only)
+
+If your environment needs a proxy for CMake/FetchContent downloads, export standard proxy vars before configure/build:
+
+```bash
+export http_proxy=http://host:port
+export https_proxy=http://host:port
+export HTTP_PROXY="$http_proxy"
+export HTTPS_PROXY="$https_proxy"
+```
+
+### Build
+
+```bash
+cmake --build /tmp/fluss-cpp-cmake-build --target fluss_cpp -j
+```
+
+This mode is slower on first build because it compiles Arrow C++ from source.
+
+## Repository-local Validation (Direct Commands)
+
+### Validate `system` mode
+
+```bash
+PROTOC_BIN="$(bash bindings/cpp/scripts/ensure_protoc.sh --print-path)"
+export PATH="$(dirname "$PROTOC_BIN"):$PATH"
+cmake -S bindings/cpp -B /tmp/fluss-cpp-cmake-system \
+  -DFLUSS_CPP_DEP_MODE=system \
+  -DFLUSS_CPP_ARROW_SYSTEM_ROOT=/tmp/fluss-system-arrow-19.0.1
+cmake --build /tmp/fluss-cpp-cmake-system --target fluss_cpp -j
+```
+
+### Validate `build` mode
+
+```bash
+PROTOC_BIN="$(bash bindings/cpp/scripts/ensure_protoc.sh --print-path)"
+export PATH="$(dirname "$PROTOC_BIN"):$PATH"
+cmake -S bindings/cpp -B /tmp/fluss-cpp-cmake-build \
+  -DFLUSS_CPP_DEP_MODE=build
+cmake --build /tmp/fluss-cpp-cmake-build --target fluss_cpp -j
+```
+
+## Troubleshooting
+
+- `cargo not found`
+  - Install Rust toolchain or set `CARGO=/path/to/cargo`.
+- `protoc not found`
+  - Install `protoc` and ensure it is in `PATH`.
+  - For `build` mode, use `bindings/cpp/scripts/ensure_protoc.sh` and prepend the returned path to `PATH`.
+- `arrow/c/bridge.h` not found (build mode)
+  - Reconfigure after updating to the latest `bindings/cpp/CMakeLists.txt`; build mode now adds Arrow source/build include dirs explicitly.
+- Long first build in `build` mode
+  - Expected. Arrow C++ source build dominates wall time.

From 316d1a0524ba883de1a2fc2d7ed50f6218a87373 Mon Sep 17 00:00:00 2001
From: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
Date: Mon, 2 Mar 2026 10:43:45 +0800
Subject: [PATCH 179/287] chore: update dependency list for release 0.1.0

---
 fluss-rust/.licenserc.yaml                    |   1 +
 fluss-rust/DEPENDENCIES.rust.tsv              | 330 ++++++++++++++++++
 fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv | 317 +++++++++++++++++
 .../bindings/python/DEPENDENCIES.rust.tsv     | 317 +++++++++++++++++
 .../crates/examples/DEPENDENCIES.rust.tsv     | 306 ++++++++++++++++
 fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv | 305 ++++++++++++++++
 6 files changed, 1576 insertions(+)
 create mode 100644 fluss-rust/DEPENDENCIES.rust.tsv
 create mode 100644 fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv
 create mode 100644 fluss-rust/bindings/python/DEPENDENCIES.rust.tsv
 create mode 100644 fluss-rust/crates/examples/DEPENDENCIES.rust.tsv
 create mode 100644 fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv

diff --git a/fluss-rust/.licenserc.yaml b/fluss-rust/.licenserc.yaml
index d323856373..a5b1f76ca8 100644
--- a/fluss-rust/.licenserc.yaml
+++ b/fluss-rust/.licenserc.yaml
@@ -28,4 +28,5 @@ header:
     - 'bindings/python/fluss/py.typed'
     - 'website/**'
     - '**/*.md'
+    - '**/DEPENDENCIES.*.tsv'
   comment: on-failure
diff --git a/fluss-rust/DEPENDENCIES.rust.tsv b/fluss-rust/DEPENDENCIES.rust.tsv
new file mode 100644
index 0000000000..be7d2c8ee1
--- /dev/null
+++ b/fluss-rust/DEPENDENCIES.rust.tsv
@@ -0,0 +1,330 @@
+crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense	Zlib
+ahash@0.8.12	X									X			
+aho-corasick@1.1.3										X		X	
+android-tzdata@0.1.1	X									X			
+android_system_properties@0.1.5	X									X			
+anstream@0.6.20	X									X			
+anstyle@1.0.11	X									X			
+anstyle-parse@0.2.7	X									X			
+anstyle-query@1.1.4	X									X			
+anstyle-wincon@3.0.10	X									X			
+anyhow@1.0.100	X									X			
+arrow@57.1.0	X												
+arrow-arith@57.1.0	X												
+arrow-array@57.1.0	X												
+arrow-buffer@57.1.0	X												
+arrow-cast@57.1.0	X												
+arrow-csv@57.1.0	X												
+arrow-data@57.1.0	X												
+arrow-ipc@57.1.0	X												
+arrow-json@57.1.0	X												
+arrow-ord@57.1.0	X												
+arrow-pyarrow@57.1.0	X												
+arrow-row@57.1.0	X												
+arrow-schema@57.1.0	X												
+arrow-select@57.1.0	X												
+arrow-string@57.1.0	X												
+async-trait@0.1.89	X									X			
+atoi@2.0.0										X			
+atomic-waker@1.1.2	X									X			
+autocfg@1.5.0	X									X			
+backon@1.6.0	X												
+base64@0.22.1	X									X			
+bigdecimal@0.4.10	X									X			
+bitflags@2.9.3	X									X			
+bitvec@1.0.1										X			
+block-buffer@0.10.4	X									X			
+bumpalo@3.19.0	X									X			
+byteorder@1.5.0										X		X	
+bytes@1.11.1										X			
+cc@1.2.34	X									X			
+cfg-if@1.0.3	X									X			
+chrono@0.4.41	X									X			
+clap@4.5.45	X									X			
+clap_builder@4.5.44	X									X			
+clap_derive@4.5.45	X									X			
+clap_lex@0.7.5	X									X			
+codespan-reporting@0.13.1	X												
+colorchoice@1.0.4	X									X			
+const-oid@0.9.6	X									X			
+const-random@0.1.18	X									X			
+const-random-macro@0.1.16	X									X			
+core-foundation-sys@0.8.7	X									X			
+cpufeatures@0.2.17	X									X			
+crc32c@0.6.8	X									X			
+crossbeam-utils@0.8.21	X									X			
+crunchy@0.2.4										X			
+crypto-common@0.1.7	X									X			
+csv@1.3.1										X		X	
+csv-core@0.1.12										X		X	
+cxx@1.0.190	X									X			
+cxx-build@1.0.190	X									X			
+cxxbridge-flags@1.0.190	X									X			
+cxxbridge-macro@1.0.190	X									X			
+dashmap@6.1.0										X			
+delegate@0.13.5	X									X			
+digest@0.10.7	X									X			
+displaydoc@0.2.5	X									X			
+either@1.15.0	X									X			
+equivalent@1.0.2	X									X			
+errno@0.3.13	X									X			
+fastrand@2.3.0	X									X			
+fixedbitset@0.5.7	X									X			
+flatbuffers@25.2.10	X												
+fluss-cpp@0.1.0	X												
+fluss-examples@0.1.0	X												
+fluss-rs@0.1.0	X												
+fluss_python@0.1.0	X												
+fnv@1.0.7	X									X			
+foldhash@0.2.0													X
+form_urlencoded@1.2.2	X									X			
+funty@2.0.0										X			
+futures@0.3.31	X									X			
+futures-channel@0.3.31	X									X			
+futures-core@0.3.31	X									X			
+futures-executor@0.3.31	X									X			
+futures-io@0.3.31	X									X			
+futures-macro@0.3.31	X									X			
+futures-sink@0.3.31	X									X			
+futures-task@0.3.31	X									X			
+futures-util@0.3.31	X									X			
+generic-array@0.14.7										X			
+getrandom@0.2.16	X									X			
+getrandom@0.3.3	X									X			
+gloo-timers@0.3.0	X									X			
+h2@0.4.12										X			
+half@2.6.0	X									X			
+hashbrown@0.14.5	X									X			
+hashbrown@0.15.5	X									X			
+hashbrown@0.16.1	X									X			
+heck@0.5.0	X									X			
+hex@0.4.3	X									X			
+hmac@0.12.1	X									X			
+home@0.5.11	X									X			
+http@1.3.1	X									X			
+http-body@1.0.1										X			
+http-body-util@0.1.3										X			
+httparse@1.10.1	X									X			
+httpdate@1.0.3	X									X			
+hyper@1.7.0										X			
+hyper-rustls@0.27.7	X							X		X			
+hyper-util@0.1.17										X			
+iana-time-zone@0.1.63	X									X			
+iana-time-zone-haiku@0.1.2	X									X			
+icu_collections@2.0.0											X		
+icu_locale_core@2.0.0											X		
+icu_normalizer@2.0.0											X		
+icu_normalizer_data@2.0.0											X		
+icu_properties@2.0.1											X		
+icu_properties_data@2.0.1											X		
+icu_provider@2.0.0											X		
+idna@1.1.0	X									X			
+idna_adapter@1.2.1	X									X			
+indexmap@2.11.0	X									X			
+indoc@2.0.6	X									X			
+ipnet@2.11.0	X									X			
+iri-string@0.7.9	X									X			
+is_terminal_polyfill@1.70.1	X									X			
+itertools@0.14.0	X									X			
+itoa@1.0.15	X									X			
+jiff@0.2.16										X		X	
+jiff-tzdb@0.1.5										X		X	
+jiff-tzdb-platform@0.1.3										X		X	
+jobserver@0.1.34	X									X			
+js-sys@0.3.77	X									X			
+lexical-core@1.0.5	X									X			
+lexical-parse-float@1.0.5	X									X			
+lexical-parse-integer@1.0.5	X									X			
+lexical-util@1.0.6	X									X			
+lexical-write-float@1.0.5	X									X			
+lexical-write-integer@1.0.5	X									X			
+libc@0.2.175	X									X			
+libm@0.2.15										X			
+link-cplusplus@1.0.12	X									X			
+linked-hash-map@0.5.6	X									X			
+linux-raw-sys@0.9.4	X	X								X			
+litemap@0.8.0											X		
+lock_api@0.4.13	X									X			
+log@0.4.27	X									X			
+lz4_flex@0.12.0										X			
+md-5@0.10.6	X									X			
+memchr@2.7.5										X		X	
+memoffset@0.9.1										X			
+mio@1.0.4										X			
+multimap@0.10.1	X									X			
+num-bigint@0.4.6	X									X			
+num-complex@0.4.6	X									X			
+num-integer@0.1.46	X									X			
+num-traits@0.2.19	X									X			
+once_cell@1.21.3	X									X			
+once_cell_polyfill@1.70.1	X									X			
+opendal@0.55.0	X												
+ordered-float@5.1.0										X			
+parking_lot@0.12.4	X									X			
+parking_lot_core@0.9.11	X									X			
+parse-display@0.10.0	X									X			
+parse-display-derive@0.10.0	X									X			
+percent-encoding@2.3.2	X									X			
+petgraph@0.7.1	X									X			
+pin-project-lite@0.2.16	X									X			
+pin-utils@0.1.0	X									X			
+pkg-config@0.3.32	X									X			
+portable-atomic@1.11.1	X									X			
+portable-atomic-util@0.2.4	X									X			
+potential_utf@0.1.3											X		
+ppv-lite86@0.2.21	X									X			
+prettyplease@0.2.37	X									X			
+proc-macro2@1.0.101	X									X			
+prost@0.14.1	X												
+prost-build@0.14.1	X												
+prost-derive@0.14.1	X												
+prost-types@0.14.1	X												
+pyo3@0.26.0	X									X			
+pyo3-async-runtimes@0.26.0	X												
+pyo3-build-config@0.26.0	X									X			
+pyo3-ffi@0.26.0	X									X			
+pyo3-macros@0.26.0	X									X			
+pyo3-macros-backend@0.26.0	X									X			
+quick-xml@0.37.5										X			
+quick-xml@0.38.4										X			
+quote@1.0.40	X									X			
+r-efi@5.3.0	X								X	X			
+radium@0.7.0										X			
+rand@0.8.5	X									X			
+rand@0.9.2	X									X			
+rand_chacha@0.3.1	X									X			
+rand_chacha@0.9.0	X									X			
+rand_core@0.6.4	X									X			
+rand_core@0.9.3	X									X			
+redox_syscall@0.5.17										X			
+regex@1.11.2	X									X			
+regex-automata@0.4.10	X									X			
+regex-syntax@0.8.6	X									X			
+reqsign@0.16.5	X												
+reqwest@0.12.25	X									X			
+ring@0.17.14	X							X					
+rustc_version@0.4.1	X									X			
+rustix@1.0.8	X	X								X			
+rustls@0.23.32	X							X		X			
+rustls-pki-types@1.12.0	X									X			
+rustls-webpki@0.103.7								X					
+rustversion@1.0.22	X									X			
+ryu@1.0.20	X				X								
+scopeguard@1.2.0	X									X			
+scratch@1.0.9	X									X			
+semver@1.0.26	X									X			
+serde@1.0.228	X									X			
+serde_core@1.0.228	X									X			
+serde_derive@1.0.228	X									X			
+serde_json@1.0.143	X									X			
+serde_urlencoded@0.7.1	X									X			
+sha1@0.10.6	X									X			
+sha2@0.10.9	X									X			
+shlex@1.3.0	X									X			
+signal-hook-registry@1.4.6	X									X			
+simdutf8@0.1.5	X									X			
+slab@0.4.11										X			
+smallvec@1.15.1	X									X			
+snafu@0.8.9	X									X			
+snafu-derive@0.8.9	X									X			
+socket2@0.6.0	X									X			
+stable_deref_trait@1.2.1	X									X			
+static_assertions@1.1.0	X									X			
+strsim@0.11.1										X			
+structmeta@0.3.0	X									X			
+structmeta-derive@0.3.0	X									X			
+strum@0.26.3										X			
+strum_macros@0.26.4										X			
+subtle@2.6.1				X									
+syn@2.0.106	X									X			
+sync_wrapper@1.0.2	X												
+synstructure@0.13.2										X			
+tap@1.0.1										X			
+target-lexicon@0.13.3		X											
+tempfile@3.23.0	X									X			
+termcolor@1.4.1										X		X	
+thiserror@1.0.69	X									X			
+thiserror-impl@1.0.69	X									X			
+tiny-keccak@2.0.2						X							
+tinystr@0.8.1											X		
+tokio@1.48.0										X			
+tokio-macros@2.6.0										X			
+tokio-rustls@0.26.4	X									X			
+tokio-util@0.7.16										X			
+tower@0.5.2										X			
+tower-http@0.6.8										X			
+tower-layer@0.3.3										X			
+tower-service@0.3.3										X			
+tracing@0.1.41										X			
+tracing-attributes@0.1.30										X			
+tracing-core@0.1.34										X			
+try-lock@0.2.5										X			
+twox-hash@2.1.2										X			
+typenum@1.19.0	X									X			
+unicode-ident@1.0.18	X									X	X		
+unicode-width@0.2.2	X									X			
+unindent@0.2.4	X									X			
+untrusted@0.9.0								X					
+url@2.5.7	X									X			
+utf8_iter@1.0.4	X									X			
+utf8parse@0.2.2	X									X			
+uuid@1.18.0	X									X			
+value-bag@1.12.0	X									X			
+version_check@0.9.5	X									X			
+want@0.3.1										X			
+wasi@0.11.1+wasi-snapshot-preview1	X	X								X			
+wasi@0.14.2+wasi-0.2.4	X	X								X			
+wasm-bindgen@0.2.100	X									X			
+wasm-bindgen-backend@0.2.100	X									X			
+wasm-bindgen-futures@0.4.50	X									X			
+wasm-bindgen-macro@0.2.100	X									X			
+wasm-bindgen-macro-support@0.2.100	X									X			
+wasm-bindgen-shared@0.2.100	X									X			
+wasm-streams@0.4.2	X									X			
+web-sys@0.3.77	X									X			
+webpki-roots@1.0.3							X						
+winapi-util@0.1.11										X		X	
+windows-core@0.61.2	X									X			
+windows-implement@0.60.0	X									X			
+windows-interface@0.59.1	X									X			
+windows-link@0.1.3	X									X			
+windows-link@0.2.1	X									X			
+windows-result@0.3.4	X									X			
+windows-strings@0.4.2	X									X			
+windows-sys@0.52.0	X									X			
+windows-sys@0.59.0	X									X			
+windows-sys@0.60.2	X									X			
+windows-sys@0.61.2	X									X			
+windows-targets@0.52.6	X									X			
+windows-targets@0.53.3	X									X			
+windows_aarch64_gnullvm@0.52.6	X									X			
+windows_aarch64_gnullvm@0.53.0	X									X			
+windows_aarch64_msvc@0.52.6	X									X			
+windows_aarch64_msvc@0.53.0	X									X			
+windows_i686_gnu@0.52.6	X									X			
+windows_i686_gnu@0.53.0	X									X			
+windows_i686_gnullvm@0.52.6	X									X			
+windows_i686_gnullvm@0.53.0	X									X			
+windows_i686_msvc@0.52.6	X									X			
+windows_i686_msvc@0.53.0	X									X			
+windows_x86_64_gnu@0.52.6	X									X			
+windows_x86_64_gnu@0.53.0	X									X			
+windows_x86_64_gnullvm@0.52.6	X									X			
+windows_x86_64_gnullvm@0.53.0	X									X			
+windows_x86_64_msvc@0.52.6	X									X			
+windows_x86_64_msvc@0.53.0	X									X			
+wit-bindgen-rt@0.39.0	X	X								X			
+writeable@0.6.1											X		
+wyz@0.5.1										X			
+yoke@0.8.0											X		
+yoke-derive@0.8.0											X		
+zerocopy@0.8.26	X		X							X			
+zerofrom@0.1.6											X		
+zerofrom-derive@0.1.6											X		
+zeroize@1.8.2	X									X			
+zerotrie@0.2.2											X		
+zerovec@0.11.4											X		
+zerovec-derive@0.11.1											X		
+zstd@0.13.3										X			
+zstd-safe@7.2.4	X									X			
+zstd-sys@2.0.16+zstd.1.5.7	X									X			
diff --git a/fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv b/fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv
new file mode 100644
index 0000000000..b2324052e7
--- /dev/null
+++ b/fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv
@@ -0,0 +1,317 @@
+crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense	Zlib
+ahash@0.8.12	X									X			
+aho-corasick@1.1.3										X		X	
+android-tzdata@0.1.1	X									X			
+android_system_properties@0.1.5	X									X			
+anstream@0.6.20	X									X			
+anstyle@1.0.11	X									X			
+anstyle-parse@0.2.7	X									X			
+anstyle-query@1.1.4	X									X			
+anstyle-wincon@3.0.10	X									X			
+anyhow@1.0.100	X									X			
+arrow@57.1.0	X												
+arrow-arith@57.1.0	X												
+arrow-array@57.1.0	X												
+arrow-buffer@57.1.0	X												
+arrow-cast@57.1.0	X												
+arrow-csv@57.1.0	X												
+arrow-data@57.1.0	X												
+arrow-ipc@57.1.0	X												
+arrow-json@57.1.0	X												
+arrow-ord@57.1.0	X												
+arrow-row@57.1.0	X												
+arrow-schema@57.1.0	X												
+arrow-select@57.1.0	X												
+arrow-string@57.1.0	X												
+async-trait@0.1.89	X									X			
+atoi@2.0.0										X			
+atomic-waker@1.1.2	X									X			
+autocfg@1.5.0	X									X			
+backon@1.6.0	X												
+base64@0.22.1	X									X			
+bigdecimal@0.4.10	X									X			
+bitflags@2.9.3	X									X			
+bitvec@1.0.1										X			
+block-buffer@0.10.4	X									X			
+bumpalo@3.19.0	X									X			
+byteorder@1.5.0										X		X	
+bytes@1.11.1										X			
+cc@1.2.34	X									X			
+cfg-if@1.0.3	X									X			
+chrono@0.4.41	X									X			
+clap@4.5.45	X									X			
+clap_builder@4.5.44	X									X			
+clap_derive@4.5.45	X									X			
+clap_lex@0.7.5	X									X			
+codespan-reporting@0.13.1	X												
+colorchoice@1.0.4	X									X			
+const-oid@0.9.6	X									X			
+const-random@0.1.18	X									X			
+const-random-macro@0.1.16	X									X			
+core-foundation-sys@0.8.7	X									X			
+cpufeatures@0.2.17	X									X			
+crc32c@0.6.8	X									X			
+crossbeam-utils@0.8.21	X									X			
+crunchy@0.2.4										X			
+crypto-common@0.1.7	X									X			
+csv@1.3.1										X		X	
+csv-core@0.1.12										X		X	
+cxx@1.0.190	X									X			
+cxx-build@1.0.190	X									X			
+cxxbridge-flags@1.0.190	X									X			
+cxxbridge-macro@1.0.190	X									X			
+dashmap@6.1.0										X			
+delegate@0.13.5	X									X			
+digest@0.10.7	X									X			
+displaydoc@0.2.5	X									X			
+either@1.15.0	X									X			
+equivalent@1.0.2	X									X			
+errno@0.3.13	X									X			
+fastrand@2.3.0	X									X			
+fixedbitset@0.5.7	X									X			
+flatbuffers@25.2.10	X												
+fluss-cpp@0.1.0	X												
+fluss-rs@0.1.0	X												
+fnv@1.0.7	X									X			
+foldhash@0.2.0													X
+form_urlencoded@1.2.2	X									X			
+funty@2.0.0										X			
+futures@0.3.31	X									X			
+futures-channel@0.3.31	X									X			
+futures-core@0.3.31	X									X			
+futures-executor@0.3.31	X									X			
+futures-io@0.3.31	X									X			
+futures-macro@0.3.31	X									X			
+futures-sink@0.3.31	X									X			
+futures-task@0.3.31	X									X			
+futures-util@0.3.31	X									X			
+generic-array@0.14.7										X			
+getrandom@0.2.16	X									X			
+getrandom@0.3.3	X									X			
+gloo-timers@0.3.0	X									X			
+h2@0.4.12										X			
+half@2.6.0	X									X			
+hashbrown@0.14.5	X									X			
+hashbrown@0.15.5	X									X			
+hashbrown@0.16.1	X									X			
+heck@0.5.0	X									X			
+hex@0.4.3	X									X			
+hmac@0.12.1	X									X			
+home@0.5.11	X									X			
+http@1.3.1	X									X			
+http-body@1.0.1										X			
+http-body-util@0.1.3										X			
+httparse@1.10.1	X									X			
+httpdate@1.0.3	X									X			
+hyper@1.7.0										X			
+hyper-rustls@0.27.7	X							X		X			
+hyper-util@0.1.17										X			
+iana-time-zone@0.1.63	X									X			
+iana-time-zone-haiku@0.1.2	X									X			
+icu_collections@2.0.0											X		
+icu_locale_core@2.0.0											X		
+icu_normalizer@2.0.0											X		
+icu_normalizer_data@2.0.0											X		
+icu_properties@2.0.1											X		
+icu_properties_data@2.0.1											X		
+icu_provider@2.0.0											X		
+idna@1.1.0	X									X			
+idna_adapter@1.2.1	X									X			
+indexmap@2.11.0	X									X			
+ipnet@2.11.0	X									X			
+iri-string@0.7.9	X									X			
+is_terminal_polyfill@1.70.1	X									X			
+itertools@0.14.0	X									X			
+itoa@1.0.15	X									X			
+jiff@0.2.16										X		X	
+jiff-tzdb@0.1.5										X		X	
+jiff-tzdb-platform@0.1.3										X		X	
+jobserver@0.1.34	X									X			
+js-sys@0.3.77	X									X			
+lexical-core@1.0.5	X									X			
+lexical-parse-float@1.0.5	X									X			
+lexical-parse-integer@1.0.5	X									X			
+lexical-util@1.0.6	X									X			
+lexical-write-float@1.0.5	X									X			
+lexical-write-integer@1.0.5	X									X			
+libc@0.2.175	X									X			
+libm@0.2.15										X			
+link-cplusplus@1.0.12	X									X			
+linked-hash-map@0.5.6	X									X			
+linux-raw-sys@0.9.4	X	X								X			
+litemap@0.8.0											X		
+lock_api@0.4.13	X									X			
+log@0.4.27	X									X			
+lz4_flex@0.12.0										X			
+md-5@0.10.6	X									X			
+memchr@2.7.5										X		X	
+mio@1.0.4										X			
+multimap@0.10.1	X									X			
+num-bigint@0.4.6	X									X			
+num-complex@0.4.6	X									X			
+num-integer@0.1.46	X									X			
+num-traits@0.2.19	X									X			
+once_cell@1.21.3	X									X			
+once_cell_polyfill@1.70.1	X									X			
+opendal@0.55.0	X												
+ordered-float@5.1.0										X			
+parking_lot@0.12.4	X									X			
+parking_lot_core@0.9.11	X									X			
+parse-display@0.10.0	X									X			
+parse-display-derive@0.10.0	X									X			
+percent-encoding@2.3.2	X									X			
+petgraph@0.7.1	X									X			
+pin-project-lite@0.2.16	X									X			
+pin-utils@0.1.0	X									X			
+pkg-config@0.3.32	X									X			
+portable-atomic@1.11.1	X									X			
+portable-atomic-util@0.2.4	X									X			
+potential_utf@0.1.3											X		
+ppv-lite86@0.2.21	X									X			
+prettyplease@0.2.37	X									X			
+proc-macro2@1.0.101	X									X			
+prost@0.14.1	X												
+prost-build@0.14.1	X												
+prost-derive@0.14.1	X												
+prost-types@0.14.1	X												
+quick-xml@0.37.5										X			
+quick-xml@0.38.4										X			
+quote@1.0.40	X									X			
+r-efi@5.3.0	X								X	X			
+radium@0.7.0										X			
+rand@0.8.5	X									X			
+rand@0.9.2	X									X			
+rand_chacha@0.3.1	X									X			
+rand_chacha@0.9.0	X									X			
+rand_core@0.6.4	X									X			
+rand_core@0.9.3	X									X			
+redox_syscall@0.5.17										X			
+regex@1.11.2	X									X			
+regex-automata@0.4.10	X									X			
+regex-syntax@0.8.6	X									X			
+reqsign@0.16.5	X												
+reqwest@0.12.25	X									X			
+ring@0.17.14	X							X					
+rustc_version@0.4.1	X									X			
+rustix@1.0.8	X	X								X			
+rustls@0.23.32	X							X		X			
+rustls-pki-types@1.12.0	X									X			
+rustls-webpki@0.103.7								X					
+rustversion@1.0.22	X									X			
+ryu@1.0.20	X				X								
+scopeguard@1.2.0	X									X			
+scratch@1.0.9	X									X			
+semver@1.0.26	X									X			
+serde@1.0.228	X									X			
+serde_core@1.0.228	X									X			
+serde_derive@1.0.228	X									X			
+serde_json@1.0.143	X									X			
+serde_urlencoded@0.7.1	X									X			
+sha1@0.10.6	X									X			
+sha2@0.10.9	X									X			
+shlex@1.3.0	X									X			
+signal-hook-registry@1.4.6	X									X			
+simdutf8@0.1.5	X									X			
+slab@0.4.11										X			
+smallvec@1.15.1	X									X			
+snafu@0.8.9	X									X			
+snafu-derive@0.8.9	X									X			
+socket2@0.6.0	X									X			
+stable_deref_trait@1.2.1	X									X			
+static_assertions@1.1.0	X									X			
+strsim@0.11.1										X			
+structmeta@0.3.0	X									X			
+structmeta-derive@0.3.0	X									X			
+strum@0.26.3										X			
+strum_macros@0.26.4										X			
+subtle@2.6.1				X									
+syn@2.0.106	X									X			
+sync_wrapper@1.0.2	X												
+synstructure@0.13.2										X			
+tap@1.0.1										X			
+tempfile@3.23.0	X									X			
+termcolor@1.4.1										X		X	
+thiserror@1.0.69	X									X			
+thiserror-impl@1.0.69	X									X			
+tiny-keccak@2.0.2						X							
+tinystr@0.8.1											X		
+tokio@1.48.0										X			
+tokio-macros@2.6.0										X			
+tokio-rustls@0.26.4	X									X			
+tokio-util@0.7.16										X			
+tower@0.5.2										X			
+tower-http@0.6.8										X			
+tower-layer@0.3.3										X			
+tower-service@0.3.3										X			
+tracing@0.1.41										X			
+tracing-attributes@0.1.30										X			
+tracing-core@0.1.34										X			
+try-lock@0.2.5										X			
+twox-hash@2.1.2										X			
+typenum@1.19.0	X									X			
+unicode-ident@1.0.18	X									X	X		
+unicode-width@0.2.2	X									X			
+untrusted@0.9.0								X					
+url@2.5.7	X									X			
+utf8_iter@1.0.4	X									X			
+utf8parse@0.2.2	X									X			
+uuid@1.18.0	X									X			
+value-bag@1.12.0	X									X			
+version_check@0.9.5	X									X			
+want@0.3.1										X			
+wasi@0.11.1+wasi-snapshot-preview1	X	X								X			
+wasi@0.14.2+wasi-0.2.4	X	X								X			
+wasm-bindgen@0.2.100	X									X			
+wasm-bindgen-backend@0.2.100	X									X			
+wasm-bindgen-futures@0.4.50	X									X			
+wasm-bindgen-macro@0.2.100	X									X			
+wasm-bindgen-macro-support@0.2.100	X									X			
+wasm-bindgen-shared@0.2.100	X									X			
+wasm-streams@0.4.2	X									X			
+web-sys@0.3.77	X									X			
+webpki-roots@1.0.3							X						
+winapi-util@0.1.11										X		X	
+windows-core@0.61.2	X									X			
+windows-implement@0.60.0	X									X			
+windows-interface@0.59.1	X									X			
+windows-link@0.1.3	X									X			
+windows-link@0.2.1	X									X			
+windows-result@0.3.4	X									X			
+windows-strings@0.4.2	X									X			
+windows-sys@0.52.0	X									X			
+windows-sys@0.59.0	X									X			
+windows-sys@0.60.2	X									X			
+windows-sys@0.61.2	X									X			
+windows-targets@0.52.6	X									X			
+windows-targets@0.53.3	X									X			
+windows_aarch64_gnullvm@0.52.6	X									X			
+windows_aarch64_gnullvm@0.53.0	X									X			
+windows_aarch64_msvc@0.52.6	X									X			
+windows_aarch64_msvc@0.53.0	X									X			
+windows_i686_gnu@0.52.6	X									X			
+windows_i686_gnu@0.53.0	X									X			
+windows_i686_gnullvm@0.52.6	X									X			
+windows_i686_gnullvm@0.53.0	X									X			
+windows_i686_msvc@0.52.6	X									X			
+windows_i686_msvc@0.53.0	X									X			
+windows_x86_64_gnu@0.52.6	X									X			
+windows_x86_64_gnu@0.53.0	X									X			
+windows_x86_64_gnullvm@0.52.6	X									X			
+windows_x86_64_gnullvm@0.53.0	X									X			
+windows_x86_64_msvc@0.52.6	X									X			
+windows_x86_64_msvc@0.53.0	X									X			
+wit-bindgen-rt@0.39.0	X	X								X			
+writeable@0.6.1											X		
+wyz@0.5.1										X			
+yoke@0.8.0											X		
+yoke-derive@0.8.0											X		
+zerocopy@0.8.26	X		X							X			
+zerofrom@0.1.6											X		
+zerofrom-derive@0.1.6											X		
+zeroize@1.8.2	X									X			
+zerotrie@0.2.2											X		
+zerovec@0.11.4											X		
+zerovec-derive@0.11.1											X		
+zstd@0.13.3										X			
+zstd-safe@7.2.4	X									X			
+zstd-sys@2.0.16+zstd.1.5.7	X									X			
diff --git a/fluss-rust/bindings/python/DEPENDENCIES.rust.tsv b/fluss-rust/bindings/python/DEPENDENCIES.rust.tsv
new file mode 100644
index 0000000000..8bd8368c12
--- /dev/null
+++ b/fluss-rust/bindings/python/DEPENDENCIES.rust.tsv
@@ -0,0 +1,317 @@
+crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense
+ahash@0.8.12	X									X		
+aho-corasick@1.1.3										X		X
+android-tzdata@0.1.1	X									X		
+android_system_properties@0.1.5	X									X		
+anstream@0.6.20	X									X		
+anstyle@1.0.11	X									X		
+anstyle-parse@0.2.7	X									X		
+anstyle-query@1.1.4	X									X		
+anstyle-wincon@3.0.10	X									X		
+anyhow@1.0.100	X									X		
+arrow@57.1.0	X											
+arrow-arith@57.1.0	X											
+arrow-array@57.1.0	X											
+arrow-buffer@57.1.0	X											
+arrow-cast@57.1.0	X											
+arrow-csv@57.1.0	X											
+arrow-data@57.1.0	X											
+arrow-ipc@57.1.0	X											
+arrow-json@57.1.0	X											
+arrow-ord@57.1.0	X											
+arrow-pyarrow@57.1.0	X											
+arrow-row@57.1.0	X											
+arrow-schema@57.1.0	X											
+arrow-select@57.1.0	X											
+arrow-string@57.1.0	X											
+async-trait@0.1.89	X									X		
+atoi@2.0.0										X		
+atomic-waker@1.1.2	X									X		
+autocfg@1.5.0	X									X		
+backon@1.6.0	X											
+base64@0.22.1	X									X		
+bigdecimal@0.4.10	X									X		
+bitflags@2.9.3	X									X		
+bitvec@1.0.1										X		
+block-buffer@0.10.4	X									X		
+bumpalo@3.19.0	X									X		
+byteorder@1.5.0										X		X
+bytes@1.11.1										X		
+cc@1.2.34	X									X		
+cfg-if@1.0.3	X									X		
+chrono@0.4.41	X									X		
+clap@4.5.45	X									X		
+clap_builder@4.5.44	X									X		
+clap_derive@4.5.45	X									X		
+clap_lex@0.7.5	X									X		
+colorchoice@1.0.4	X									X		
+const-oid@0.9.6	X									X		
+const-random@0.1.18	X									X		
+const-random-macro@0.1.16	X									X		
+core-foundation-sys@0.8.7	X									X		
+cpufeatures@0.2.17	X									X		
+crc32c@0.6.8	X									X		
+crossbeam-utils@0.8.21	X									X		
+crunchy@0.2.4										X		
+crypto-common@0.1.7	X									X		
+csv@1.3.1										X		X
+csv-core@0.1.12										X		X
+dashmap@6.1.0										X		
+delegate@0.13.5	X									X		
+digest@0.10.7	X									X		
+displaydoc@0.2.5	X									X		
+either@1.15.0	X									X		
+equivalent@1.0.2	X									X		
+errno@0.3.13	X									X		
+fastrand@2.3.0	X									X		
+fixedbitset@0.5.7	X									X		
+flatbuffers@25.2.10	X											
+fluss-rs@0.1.0	X											
+fluss_python@0.1.0	X											
+fnv@1.0.7	X									X		
+form_urlencoded@1.2.2	X									X		
+funty@2.0.0										X		
+futures@0.3.31	X									X		
+futures-channel@0.3.31	X									X		
+futures-core@0.3.31	X									X		
+futures-executor@0.3.31	X									X		
+futures-io@0.3.31	X									X		
+futures-macro@0.3.31	X									X		
+futures-sink@0.3.31	X									X		
+futures-task@0.3.31	X									X		
+futures-util@0.3.31	X									X		
+generic-array@0.14.7										X		
+getrandom@0.2.16	X									X		
+getrandom@0.3.3	X									X		
+gloo-timers@0.3.0	X									X		
+h2@0.4.12										X		
+half@2.6.0	X									X		
+hashbrown@0.14.5	X									X		
+hashbrown@0.15.5	X									X		
+hashbrown@0.16.1	X									X		
+heck@0.5.0	X									X		
+hex@0.4.3	X									X		
+hmac@0.12.1	X									X		
+home@0.5.11	X									X		
+http@1.3.1	X									X		
+http-body@1.0.1										X		
+http-body-util@0.1.3										X		
+httparse@1.10.1	X									X		
+httpdate@1.0.3	X									X		
+hyper@1.7.0										X		
+hyper-rustls@0.27.7	X							X		X		
+hyper-util@0.1.17										X		
+iana-time-zone@0.1.63	X									X		
+iana-time-zone-haiku@0.1.2	X									X		
+icu_collections@2.0.0											X	
+icu_locale_core@2.0.0											X	
+icu_normalizer@2.0.0											X	
+icu_normalizer_data@2.0.0											X	
+icu_properties@2.0.1											X	
+icu_properties_data@2.0.1											X	
+icu_provider@2.0.0											X	
+idna@1.1.0	X									X		
+idna_adapter@1.2.1	X									X		
+indexmap@2.11.0	X									X		
+indoc@2.0.6	X									X		
+ipnet@2.11.0	X									X		
+iri-string@0.7.9	X									X		
+is_terminal_polyfill@1.70.1	X									X		
+itertools@0.14.0	X									X		
+itoa@1.0.15	X									X		
+jiff@0.2.16										X		X
+jiff-tzdb@0.1.5										X		X
+jiff-tzdb-platform@0.1.3										X		X
+jobserver@0.1.34	X									X		
+js-sys@0.3.77	X									X		
+lexical-core@1.0.5	X									X		
+lexical-parse-float@1.0.5	X									X		
+lexical-parse-integer@1.0.5	X									X		
+lexical-util@1.0.6	X									X		
+lexical-write-float@1.0.5	X									X		
+lexical-write-integer@1.0.5	X									X		
+libc@0.2.175	X									X		
+libm@0.2.15										X		
+linked-hash-map@0.5.6	X									X		
+linux-raw-sys@0.9.4	X	X								X		
+litemap@0.8.0											X	
+lock_api@0.4.13	X									X		
+log@0.4.27	X									X		
+lz4_flex@0.12.0										X		
+md-5@0.10.6	X									X		
+memchr@2.7.5										X		X
+memoffset@0.9.1										X		
+mio@1.0.4										X		
+multimap@0.10.1	X									X		
+num-bigint@0.4.6	X									X		
+num-complex@0.4.6	X									X		
+num-integer@0.1.46	X									X		
+num-traits@0.2.19	X									X		
+once_cell@1.21.3	X									X		
+once_cell_polyfill@1.70.1	X									X		
+opendal@0.55.0	X											
+ordered-float@5.1.0										X		
+parking_lot@0.12.4	X									X		
+parking_lot_core@0.9.11	X									X		
+parse-display@0.10.0	X									X		
+parse-display-derive@0.10.0	X									X		
+percent-encoding@2.3.2	X									X		
+petgraph@0.7.1	X									X		
+pin-project-lite@0.2.16	X									X		
+pin-utils@0.1.0	X									X		
+pkg-config@0.3.32	X									X		
+portable-atomic@1.11.1	X									X		
+portable-atomic-util@0.2.4	X									X		
+potential_utf@0.1.3											X	
+ppv-lite86@0.2.21	X									X		
+prettyplease@0.2.37	X									X		
+proc-macro2@1.0.101	X									X		
+prost@0.14.1	X											
+prost-build@0.14.1	X											
+prost-derive@0.14.1	X											
+prost-types@0.14.1	X											
+pyo3@0.26.0	X									X		
+pyo3-async-runtimes@0.26.0	X											
+pyo3-build-config@0.26.0	X									X		
+pyo3-ffi@0.26.0	X									X		
+pyo3-macros@0.26.0	X									X		
+pyo3-macros-backend@0.26.0	X									X		
+quick-xml@0.37.5										X		
+quick-xml@0.38.4										X		
+quote@1.0.40	X									X		
+r-efi@5.3.0	X								X	X		
+radium@0.7.0										X		
+rand@0.8.5	X									X		
+rand@0.9.2	X									X		
+rand_chacha@0.3.1	X									X		
+rand_chacha@0.9.0	X									X		
+rand_core@0.6.4	X									X		
+rand_core@0.9.3	X									X		
+redox_syscall@0.5.17										X		
+regex@1.11.2	X									X		
+regex-automata@0.4.10	X									X		
+regex-syntax@0.8.6	X									X		
+reqsign@0.16.5	X											
+reqwest@0.12.25	X									X		
+ring@0.17.14	X							X				
+rustc_version@0.4.1	X									X		
+rustix@1.0.8	X	X								X		
+rustls@0.23.32	X							X		X		
+rustls-pki-types@1.12.0	X									X		
+rustls-webpki@0.103.7								X				
+rustversion@1.0.22	X									X		
+ryu@1.0.20	X				X							
+scopeguard@1.2.0	X									X		
+semver@1.0.26	X									X		
+serde@1.0.228	X									X		
+serde_core@1.0.228	X									X		
+serde_derive@1.0.228	X									X		
+serde_json@1.0.143	X									X		
+serde_urlencoded@0.7.1	X									X		
+sha1@0.10.6	X									X		
+sha2@0.10.9	X									X		
+shlex@1.3.0	X									X		
+signal-hook-registry@1.4.6	X									X		
+simdutf8@0.1.5	X									X		
+slab@0.4.11										X		
+smallvec@1.15.1	X									X		
+snafu@0.8.9	X									X		
+snafu-derive@0.8.9	X									X		
+socket2@0.6.0	X									X		
+stable_deref_trait@1.2.1	X									X		
+static_assertions@1.1.0	X									X		
+strsim@0.11.1										X		
+structmeta@0.3.0	X									X		
+structmeta-derive@0.3.0	X									X		
+strum@0.26.3										X		
+strum_macros@0.26.4										X		
+subtle@2.6.1				X								
+syn@2.0.106	X									X		
+sync_wrapper@1.0.2	X											
+synstructure@0.13.2										X		
+tap@1.0.1										X		
+target-lexicon@0.13.3		X										
+tempfile@3.23.0	X									X		
+thiserror@1.0.69	X									X		
+thiserror-impl@1.0.69	X									X		
+tiny-keccak@2.0.2						X						
+tinystr@0.8.1											X	
+tokio@1.48.0										X		
+tokio-macros@2.6.0										X		
+tokio-rustls@0.26.4	X									X		
+tokio-util@0.7.16										X		
+tower@0.5.2										X		
+tower-http@0.6.8										X		
+tower-layer@0.3.3										X		
+tower-service@0.3.3										X		
+tracing@0.1.41										X		
+tracing-attributes@0.1.30										X		
+tracing-core@0.1.34										X		
+try-lock@0.2.5										X		
+twox-hash@2.1.2										X		
+typenum@1.19.0	X									X		
+unicode-ident@1.0.18	X									X	X	
+unindent@0.2.4	X									X		
+untrusted@0.9.0								X				
+url@2.5.7	X									X		
+utf8_iter@1.0.4	X									X		
+utf8parse@0.2.2	X									X		
+uuid@1.18.0	X									X		
+value-bag@1.12.0	X									X		
+version_check@0.9.5	X									X		
+want@0.3.1										X		
+wasi@0.11.1+wasi-snapshot-preview1	X	X								X		
+wasi@0.14.2+wasi-0.2.4	X	X								X		
+wasm-bindgen@0.2.100	X									X		
+wasm-bindgen-backend@0.2.100	X									X		
+wasm-bindgen-futures@0.4.50	X									X		
+wasm-bindgen-macro@0.2.100	X									X		
+wasm-bindgen-macro-support@0.2.100	X									X		
+wasm-bindgen-shared@0.2.100	X									X		
+wasm-streams@0.4.2	X									X		
+web-sys@0.3.77	X									X		
+webpki-roots@1.0.3							X					
+windows-core@0.61.2	X									X		
+windows-implement@0.60.0	X									X		
+windows-interface@0.59.1	X									X		
+windows-link@0.1.3	X									X		
+windows-link@0.2.1	X									X		
+windows-result@0.3.4	X									X		
+windows-strings@0.4.2	X									X		
+windows-sys@0.52.0	X									X		
+windows-sys@0.59.0	X									X		
+windows-sys@0.60.2	X									X		
+windows-sys@0.61.2	X									X		
+windows-targets@0.52.6	X									X		
+windows-targets@0.53.3	X									X		
+windows_aarch64_gnullvm@0.52.6	X									X		
+windows_aarch64_gnullvm@0.53.0	X									X		
+windows_aarch64_msvc@0.52.6	X									X		
+windows_aarch64_msvc@0.53.0	X									X		
+windows_i686_gnu@0.52.6	X									X		
+windows_i686_gnu@0.53.0	X									X		
+windows_i686_gnullvm@0.52.6	X									X		
+windows_i686_gnullvm@0.53.0	X									X		
+windows_i686_msvc@0.52.6	X									X		
+windows_i686_msvc@0.53.0	X									X		
+windows_x86_64_gnu@0.52.6	X									X		
+windows_x86_64_gnu@0.53.0	X									X		
+windows_x86_64_gnullvm@0.52.6	X									X		
+windows_x86_64_gnullvm@0.53.0	X									X		
+windows_x86_64_msvc@0.52.6	X									X		
+windows_x86_64_msvc@0.53.0	X									X		
+wit-bindgen-rt@0.39.0	X	X								X		
+writeable@0.6.1											X	
+wyz@0.5.1										X		
+yoke@0.8.0											X	
+yoke-derive@0.8.0											X	
+zerocopy@0.8.26	X		X							X		
+zerofrom@0.1.6											X	
+zerofrom-derive@0.1.6											X	
+zeroize@1.8.2	X									X		
+zerotrie@0.2.2											X	
+zerovec@0.11.4											X	
+zerovec-derive@0.11.1											X	
+zstd@0.13.3										X		
+zstd-safe@7.2.4	X									X		
+zstd-sys@2.0.16+zstd.1.5.7	X									X		
diff --git a/fluss-rust/crates/examples/DEPENDENCIES.rust.tsv b/fluss-rust/crates/examples/DEPENDENCIES.rust.tsv
new file mode 100644
index 0000000000..6b30630eff
--- /dev/null
+++ b/fluss-rust/crates/examples/DEPENDENCIES.rust.tsv
@@ -0,0 +1,306 @@
+crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense
+ahash@0.8.12	X									X		
+aho-corasick@1.1.3										X		X
+android-tzdata@0.1.1	X									X		
+android_system_properties@0.1.5	X									X		
+anstream@0.6.20	X									X		
+anstyle@1.0.11	X									X		
+anstyle-parse@0.2.7	X									X		
+anstyle-query@1.1.4	X									X		
+anstyle-wincon@3.0.10	X									X		
+anyhow@1.0.100	X									X		
+arrow@57.1.0	X											
+arrow-arith@57.1.0	X											
+arrow-array@57.1.0	X											
+arrow-buffer@57.1.0	X											
+arrow-cast@57.1.0	X											
+arrow-csv@57.1.0	X											
+arrow-data@57.1.0	X											
+arrow-ipc@57.1.0	X											
+arrow-json@57.1.0	X											
+arrow-ord@57.1.0	X											
+arrow-row@57.1.0	X											
+arrow-schema@57.1.0	X											
+arrow-select@57.1.0	X											
+arrow-string@57.1.0	X											
+async-trait@0.1.89	X									X		
+atoi@2.0.0										X		
+atomic-waker@1.1.2	X									X		
+autocfg@1.5.0	X									X		
+backon@1.6.0	X											
+base64@0.22.1	X									X		
+bigdecimal@0.4.10	X									X		
+bitflags@2.9.3	X									X		
+bitvec@1.0.1										X		
+block-buffer@0.10.4	X									X		
+bumpalo@3.19.0	X									X		
+byteorder@1.5.0										X		X
+bytes@1.11.1										X		
+cc@1.2.34	X									X		
+cfg-if@1.0.3	X									X		
+chrono@0.4.41	X									X		
+clap@4.5.45	X									X		
+clap_builder@4.5.44	X									X		
+clap_derive@4.5.45	X									X		
+clap_lex@0.7.5	X									X		
+colorchoice@1.0.4	X									X		
+const-oid@0.9.6	X									X		
+const-random@0.1.18	X									X		
+const-random-macro@0.1.16	X									X		
+core-foundation-sys@0.8.7	X									X		
+cpufeatures@0.2.17	X									X		
+crc32c@0.6.8	X									X		
+crossbeam-utils@0.8.21	X									X		
+crunchy@0.2.4										X		
+crypto-common@0.1.7	X									X		
+csv@1.3.1										X		X
+csv-core@0.1.12										X		X
+dashmap@6.1.0										X		
+delegate@0.13.5	X									X		
+digest@0.10.7	X									X		
+displaydoc@0.2.5	X									X		
+either@1.15.0	X									X		
+equivalent@1.0.2	X									X		
+errno@0.3.13	X									X		
+fastrand@2.3.0	X									X		
+fixedbitset@0.5.7	X									X		
+flatbuffers@25.2.10	X											
+fluss-examples@0.1.0	X											
+fluss-rs@0.1.0	X											
+fnv@1.0.7	X									X		
+form_urlencoded@1.2.2	X									X		
+funty@2.0.0										X		
+futures@0.3.31	X									X		
+futures-channel@0.3.31	X									X		
+futures-core@0.3.31	X									X		
+futures-executor@0.3.31	X									X		
+futures-io@0.3.31	X									X		
+futures-macro@0.3.31	X									X		
+futures-sink@0.3.31	X									X		
+futures-task@0.3.31	X									X		
+futures-util@0.3.31	X									X		
+generic-array@0.14.7										X		
+getrandom@0.2.16	X									X		
+getrandom@0.3.3	X									X		
+gloo-timers@0.3.0	X									X		
+h2@0.4.12										X		
+half@2.6.0	X									X		
+hashbrown@0.14.5	X									X		
+hashbrown@0.15.5	X									X		
+hashbrown@0.16.1	X									X		
+heck@0.5.0	X									X		
+hex@0.4.3	X									X		
+hmac@0.12.1	X									X		
+home@0.5.11	X									X		
+http@1.3.1	X									X		
+http-body@1.0.1										X		
+http-body-util@0.1.3										X		
+httparse@1.10.1	X									X		
+httpdate@1.0.3	X									X		
+hyper@1.7.0										X		
+hyper-rustls@0.27.7	X							X		X		
+hyper-util@0.1.17										X		
+iana-time-zone@0.1.63	X									X		
+iana-time-zone-haiku@0.1.2	X									X		
+icu_collections@2.0.0											X	
+icu_locale_core@2.0.0											X	
+icu_normalizer@2.0.0											X	
+icu_normalizer_data@2.0.0											X	
+icu_properties@2.0.1											X	
+icu_properties_data@2.0.1											X	
+icu_provider@2.0.0											X	
+idna@1.1.0	X									X		
+idna_adapter@1.2.1	X									X		
+indexmap@2.11.0	X									X		
+ipnet@2.11.0	X									X		
+iri-string@0.7.9	X									X		
+is_terminal_polyfill@1.70.1	X									X		
+itertools@0.14.0	X									X		
+itoa@1.0.15	X									X		
+jiff@0.2.16										X		X
+jiff-tzdb@0.1.5										X		X
+jiff-tzdb-platform@0.1.3										X		X
+jobserver@0.1.34	X									X		
+js-sys@0.3.77	X									X		
+lexical-core@1.0.5	X									X		
+lexical-parse-float@1.0.5	X									X		
+lexical-parse-integer@1.0.5	X									X		
+lexical-util@1.0.6	X									X		
+lexical-write-float@1.0.5	X									X		
+lexical-write-integer@1.0.5	X									X		
+libc@0.2.175	X									X		
+libm@0.2.15										X		
+linked-hash-map@0.5.6	X									X		
+linux-raw-sys@0.9.4	X	X								X		
+litemap@0.8.0											X	
+lock_api@0.4.13	X									X		
+log@0.4.27	X									X		
+lz4_flex@0.12.0										X		
+md-5@0.10.6	X									X		
+memchr@2.7.5										X		X
+mio@1.0.4										X		
+multimap@0.10.1	X									X		
+num-bigint@0.4.6	X									X		
+num-complex@0.4.6	X									X		
+num-integer@0.1.46	X									X		
+num-traits@0.2.19	X									X		
+once_cell@1.21.3	X									X		
+once_cell_polyfill@1.70.1	X									X		
+opendal@0.55.0	X											
+ordered-float@5.1.0										X		
+parking_lot@0.12.4	X									X		
+parking_lot_core@0.9.11	X									X		
+parse-display@0.10.0	X									X		
+parse-display-derive@0.10.0	X									X		
+percent-encoding@2.3.2	X									X		
+petgraph@0.7.1	X									X		
+pin-project-lite@0.2.16	X									X		
+pin-utils@0.1.0	X									X		
+pkg-config@0.3.32	X									X		
+portable-atomic@1.11.1	X									X		
+portable-atomic-util@0.2.4	X									X		
+potential_utf@0.1.3											X	
+ppv-lite86@0.2.21	X									X		
+prettyplease@0.2.37	X									X		
+proc-macro2@1.0.101	X									X		
+prost@0.14.1	X											
+prost-build@0.14.1	X											
+prost-derive@0.14.1	X											
+prost-types@0.14.1	X											
+quick-xml@0.37.5										X		
+quick-xml@0.38.4										X		
+quote@1.0.40	X									X		
+r-efi@5.3.0	X								X	X		
+radium@0.7.0										X		
+rand@0.8.5	X									X		
+rand@0.9.2	X									X		
+rand_chacha@0.3.1	X									X		
+rand_chacha@0.9.0	X									X		
+rand_core@0.6.4	X									X		
+rand_core@0.9.3	X									X		
+redox_syscall@0.5.17										X		
+regex@1.11.2	X									X		
+regex-automata@0.4.10	X									X		
+regex-syntax@0.8.6	X									X		
+reqsign@0.16.5	X											
+reqwest@0.12.25	X									X		
+ring@0.17.14	X							X				
+rustc_version@0.4.1	X									X		
+rustix@1.0.8	X	X								X		
+rustls@0.23.32	X							X		X		
+rustls-pki-types@1.12.0	X									X		
+rustls-webpki@0.103.7								X				
+rustversion@1.0.22	X									X		
+ryu@1.0.20	X				X							
+scopeguard@1.2.0	X									X		
+semver@1.0.26	X									X		
+serde@1.0.228	X									X		
+serde_core@1.0.228	X									X		
+serde_derive@1.0.228	X									X		
+serde_json@1.0.143	X									X		
+serde_urlencoded@0.7.1	X									X		
+sha1@0.10.6	X									X		
+sha2@0.10.9	X									X		
+shlex@1.3.0	X									X		
+signal-hook-registry@1.4.6	X									X		
+simdutf8@0.1.5	X									X		
+slab@0.4.11										X		
+smallvec@1.15.1	X									X		
+snafu@0.8.9	X									X		
+snafu-derive@0.8.9	X									X		
+socket2@0.6.0	X									X		
+stable_deref_trait@1.2.1	X									X		
+static_assertions@1.1.0	X									X		
+strsim@0.11.1										X		
+structmeta@0.3.0	X									X		
+structmeta-derive@0.3.0	X									X		
+strum@0.26.3										X		
+strum_macros@0.26.4										X		
+subtle@2.6.1				X								
+syn@2.0.106	X									X		
+sync_wrapper@1.0.2	X											
+synstructure@0.13.2										X		
+tap@1.0.1										X		
+tempfile@3.23.0	X									X		
+thiserror@1.0.69	X									X		
+thiserror-impl@1.0.69	X									X		
+tiny-keccak@2.0.2						X						
+tinystr@0.8.1											X	
+tokio@1.48.0										X		
+tokio-macros@2.6.0										X		
+tokio-rustls@0.26.4	X									X		
+tokio-util@0.7.16										X		
+tower@0.5.2										X		
+tower-http@0.6.8										X		
+tower-layer@0.3.3										X		
+tower-service@0.3.3										X		
+tracing@0.1.41										X		
+tracing-attributes@0.1.30										X		
+tracing-core@0.1.34										X		
+try-lock@0.2.5										X		
+twox-hash@2.1.2										X		
+typenum@1.19.0	X									X		
+unicode-ident@1.0.18	X									X	X	
+untrusted@0.9.0								X				
+url@2.5.7	X									X		
+utf8_iter@1.0.4	X									X		
+utf8parse@0.2.2	X									X		
+uuid@1.18.0	X									X		
+value-bag@1.12.0	X									X		
+version_check@0.9.5	X									X		
+want@0.3.1										X		
+wasi@0.11.1+wasi-snapshot-preview1	X	X								X		
+wasi@0.14.2+wasi-0.2.4	X	X								X		
+wasm-bindgen@0.2.100	X									X		
+wasm-bindgen-backend@0.2.100	X									X		
+wasm-bindgen-futures@0.4.50	X									X		
+wasm-bindgen-macro@0.2.100	X									X		
+wasm-bindgen-macro-support@0.2.100	X									X		
+wasm-bindgen-shared@0.2.100	X									X		
+wasm-streams@0.4.2	X									X		
+web-sys@0.3.77	X									X		
+webpki-roots@1.0.3							X					
+windows-core@0.61.2	X									X		
+windows-implement@0.60.0	X									X		
+windows-interface@0.59.1	X									X		
+windows-link@0.1.3	X									X		
+windows-link@0.2.1	X									X		
+windows-result@0.3.4	X									X		
+windows-strings@0.4.2	X									X		
+windows-sys@0.52.0	X									X		
+windows-sys@0.59.0	X									X		
+windows-sys@0.60.2	X									X		
+windows-sys@0.61.2	X									X		
+windows-targets@0.52.6	X									X		
+windows-targets@0.53.3	X									X		
+windows_aarch64_gnullvm@0.52.6	X									X		
+windows_aarch64_gnullvm@0.53.0	X									X		
+windows_aarch64_msvc@0.52.6	X									X		
+windows_aarch64_msvc@0.53.0	X									X		
+windows_i686_gnu@0.52.6	X									X		
+windows_i686_gnu@0.53.0	X									X		
+windows_i686_gnullvm@0.52.6	X									X		
+windows_i686_gnullvm@0.53.0	X									X		
+windows_i686_msvc@0.52.6	X									X		
+windows_i686_msvc@0.53.0	X									X		
+windows_x86_64_gnu@0.52.6	X									X		
+windows_x86_64_gnu@0.53.0	X									X		
+windows_x86_64_gnullvm@0.52.6	X									X		
+windows_x86_64_gnullvm@0.53.0	X									X		
+windows_x86_64_msvc@0.52.6	X									X		
+windows_x86_64_msvc@0.53.0	X									X		
+wit-bindgen-rt@0.39.0	X	X								X		
+writeable@0.6.1											X	
+wyz@0.5.1										X		
+yoke@0.8.0											X	
+yoke-derive@0.8.0											X	
+zerocopy@0.8.26	X		X							X		
+zerofrom@0.1.6											X	
+zerofrom-derive@0.1.6											X	
+zeroize@1.8.2	X									X		
+zerotrie@0.2.2											X	
+zerovec@0.11.4											X	
+zerovec-derive@0.11.1											X	
+zstd@0.13.3										X		
+zstd-safe@7.2.4	X									X		
+zstd-sys@2.0.16+zstd.1.5.7	X									X		
diff --git a/fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv b/fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv
new file mode 100644
index 0000000000..29cbe1e8c2
--- /dev/null
+++ b/fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv
@@ -0,0 +1,305 @@
+crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense
+ahash@0.8.12	X									X		
+aho-corasick@1.1.3										X		X
+android-tzdata@0.1.1	X									X		
+android_system_properties@0.1.5	X									X		
+anstream@0.6.20	X									X		
+anstyle@1.0.11	X									X		
+anstyle-parse@0.2.7	X									X		
+anstyle-query@1.1.4	X									X		
+anstyle-wincon@3.0.10	X									X		
+anyhow@1.0.100	X									X		
+arrow@57.1.0	X											
+arrow-arith@57.1.0	X											
+arrow-array@57.1.0	X											
+arrow-buffer@57.1.0	X											
+arrow-cast@57.1.0	X											
+arrow-csv@57.1.0	X											
+arrow-data@57.1.0	X											
+arrow-ipc@57.1.0	X											
+arrow-json@57.1.0	X											
+arrow-ord@57.1.0	X											
+arrow-row@57.1.0	X											
+arrow-schema@57.1.0	X											
+arrow-select@57.1.0	X											
+arrow-string@57.1.0	X											
+async-trait@0.1.89	X									X		
+atoi@2.0.0										X		
+atomic-waker@1.1.2	X									X		
+autocfg@1.5.0	X									X		
+backon@1.6.0	X											
+base64@0.22.1	X									X		
+bigdecimal@0.4.10	X									X		
+bitflags@2.9.3	X									X		
+bitvec@1.0.1										X		
+block-buffer@0.10.4	X									X		
+bumpalo@3.19.0	X									X		
+byteorder@1.5.0										X		X
+bytes@1.11.1										X		
+cc@1.2.34	X									X		
+cfg-if@1.0.3	X									X		
+chrono@0.4.41	X									X		
+clap@4.5.45	X									X		
+clap_builder@4.5.44	X									X		
+clap_derive@4.5.45	X									X		
+clap_lex@0.7.5	X									X		
+colorchoice@1.0.4	X									X		
+const-oid@0.9.6	X									X		
+const-random@0.1.18	X									X		
+const-random-macro@0.1.16	X									X		
+core-foundation-sys@0.8.7	X									X		
+cpufeatures@0.2.17	X									X		
+crc32c@0.6.8	X									X		
+crossbeam-utils@0.8.21	X									X		
+crunchy@0.2.4										X		
+crypto-common@0.1.7	X									X		
+csv@1.3.1										X		X
+csv-core@0.1.12										X		X
+dashmap@6.1.0										X		
+delegate@0.13.5	X									X		
+digest@0.10.7	X									X		
+displaydoc@0.2.5	X									X		
+either@1.15.0	X									X		
+equivalent@1.0.2	X									X		
+errno@0.3.13	X									X		
+fastrand@2.3.0	X									X		
+fixedbitset@0.5.7	X									X		
+flatbuffers@25.2.10	X											
+fluss-rs@0.1.0	X											
+fnv@1.0.7	X									X		
+form_urlencoded@1.2.2	X									X		
+funty@2.0.0										X		
+futures@0.3.31	X									X		
+futures-channel@0.3.31	X									X		
+futures-core@0.3.31	X									X		
+futures-executor@0.3.31	X									X		
+futures-io@0.3.31	X									X		
+futures-macro@0.3.31	X									X		
+futures-sink@0.3.31	X									X		
+futures-task@0.3.31	X									X		
+futures-util@0.3.31	X									X		
+generic-array@0.14.7										X		
+getrandom@0.2.16	X									X		
+getrandom@0.3.3	X									X		
+gloo-timers@0.3.0	X									X		
+h2@0.4.12										X		
+half@2.6.0	X									X		
+hashbrown@0.14.5	X									X		
+hashbrown@0.15.5	X									X		
+hashbrown@0.16.1	X									X		
+heck@0.5.0	X									X		
+hex@0.4.3	X									X		
+hmac@0.12.1	X									X		
+home@0.5.11	X									X		
+http@1.3.1	X									X		
+http-body@1.0.1										X		
+http-body-util@0.1.3										X		
+httparse@1.10.1	X									X		
+httpdate@1.0.3	X									X		
+hyper@1.7.0										X		
+hyper-rustls@0.27.7	X							X		X		
+hyper-util@0.1.17										X		
+iana-time-zone@0.1.63	X									X		
+iana-time-zone-haiku@0.1.2	X									X		
+icu_collections@2.0.0											X	
+icu_locale_core@2.0.0											X	
+icu_normalizer@2.0.0											X	
+icu_normalizer_data@2.0.0											X	
+icu_properties@2.0.1											X	
+icu_properties_data@2.0.1											X	
+icu_provider@2.0.0											X	
+idna@1.1.0	X									X		
+idna_adapter@1.2.1	X									X		
+indexmap@2.11.0	X									X		
+ipnet@2.11.0	X									X		
+iri-string@0.7.9	X									X		
+is_terminal_polyfill@1.70.1	X									X		
+itertools@0.14.0	X									X		
+itoa@1.0.15	X									X		
+jiff@0.2.16										X		X
+jiff-tzdb@0.1.5										X		X
+jiff-tzdb-platform@0.1.3										X		X
+jobserver@0.1.34	X									X		
+js-sys@0.3.77	X									X		
+lexical-core@1.0.5	X									X		
+lexical-parse-float@1.0.5	X									X		
+lexical-parse-integer@1.0.5	X									X		
+lexical-util@1.0.6	X									X		
+lexical-write-float@1.0.5	X									X		
+lexical-write-integer@1.0.5	X									X		
+libc@0.2.175	X									X		
+libm@0.2.15										X		
+linked-hash-map@0.5.6	X									X		
+linux-raw-sys@0.9.4	X	X								X		
+litemap@0.8.0											X	
+lock_api@0.4.13	X									X		
+log@0.4.27	X									X		
+lz4_flex@0.12.0										X		
+md-5@0.10.6	X									X		
+memchr@2.7.5										X		X
+mio@1.0.4										X		
+multimap@0.10.1	X									X		
+num-bigint@0.4.6	X									X		
+num-complex@0.4.6	X									X		
+num-integer@0.1.46	X									X		
+num-traits@0.2.19	X									X		
+once_cell@1.21.3	X									X		
+once_cell_polyfill@1.70.1	X									X		
+opendal@0.55.0	X											
+ordered-float@5.1.0										X		
+parking_lot@0.12.4	X									X		
+parking_lot_core@0.9.11	X									X		
+parse-display@0.10.0	X									X		
+parse-display-derive@0.10.0	X									X		
+percent-encoding@2.3.2	X									X		
+petgraph@0.7.1	X									X		
+pin-project-lite@0.2.16	X									X		
+pin-utils@0.1.0	X									X		
+pkg-config@0.3.32	X									X		
+portable-atomic@1.11.1	X									X		
+portable-atomic-util@0.2.4	X									X		
+potential_utf@0.1.3											X	
+ppv-lite86@0.2.21	X									X		
+prettyplease@0.2.37	X									X		
+proc-macro2@1.0.101	X									X		
+prost@0.14.1	X											
+prost-build@0.14.1	X											
+prost-derive@0.14.1	X											
+prost-types@0.14.1	X											
+quick-xml@0.37.5										X		
+quick-xml@0.38.4										X		
+quote@1.0.40	X									X		
+r-efi@5.3.0	X								X	X		
+radium@0.7.0										X		
+rand@0.8.5	X									X		
+rand@0.9.2	X									X		
+rand_chacha@0.3.1	X									X		
+rand_chacha@0.9.0	X									X		
+rand_core@0.6.4	X									X		
+rand_core@0.9.3	X									X		
+redox_syscall@0.5.17										X		
+regex@1.11.2	X									X		
+regex-automata@0.4.10	X									X		
+regex-syntax@0.8.6	X									X		
+reqsign@0.16.5	X											
+reqwest@0.12.25	X									X		
+ring@0.17.14	X							X				
+rustc_version@0.4.1	X									X		
+rustix@1.0.8	X	X								X		
+rustls@0.23.32	X							X		X		
+rustls-pki-types@1.12.0	X									X		
+rustls-webpki@0.103.7								X				
+rustversion@1.0.22	X									X		
+ryu@1.0.20	X				X							
+scopeguard@1.2.0	X									X		
+semver@1.0.26	X									X		
+serde@1.0.228	X									X		
+serde_core@1.0.228	X									X		
+serde_derive@1.0.228	X									X		
+serde_json@1.0.143	X									X		
+serde_urlencoded@0.7.1	X									X		
+sha1@0.10.6	X									X		
+sha2@0.10.9	X									X		
+shlex@1.3.0	X									X		
+signal-hook-registry@1.4.6	X									X		
+simdutf8@0.1.5	X									X		
+slab@0.4.11										X		
+smallvec@1.15.1	X									X		
+snafu@0.8.9	X									X		
+snafu-derive@0.8.9	X									X		
+socket2@0.6.0	X									X		
+stable_deref_trait@1.2.1	X									X		
+static_assertions@1.1.0	X									X		
+strsim@0.11.1										X		
+structmeta@0.3.0	X									X		
+structmeta-derive@0.3.0	X									X		
+strum@0.26.3										X		
+strum_macros@0.26.4										X		
+subtle@2.6.1				X								
+syn@2.0.106	X									X		
+sync_wrapper@1.0.2	X											
+synstructure@0.13.2										X		
+tap@1.0.1										X		
+tempfile@3.23.0	X									X		
+thiserror@1.0.69	X									X		
+thiserror-impl@1.0.69	X									X		
+tiny-keccak@2.0.2						X						
+tinystr@0.8.1											X	
+tokio@1.48.0										X		
+tokio-macros@2.6.0										X		
+tokio-rustls@0.26.4	X									X		
+tokio-util@0.7.16										X		
+tower@0.5.2										X		
+tower-http@0.6.8										X		
+tower-layer@0.3.3										X		
+tower-service@0.3.3										X		
+tracing@0.1.41										X		
+tracing-attributes@0.1.30										X		
+tracing-core@0.1.34										X		
+try-lock@0.2.5										X		
+twox-hash@2.1.2										X		
+typenum@1.19.0	X									X		
+unicode-ident@1.0.18	X									X	X	
+untrusted@0.9.0								X				
+url@2.5.7	X									X		
+utf8_iter@1.0.4	X									X		
+utf8parse@0.2.2	X									X		
+uuid@1.18.0	X									X		
+value-bag@1.12.0	X									X		
+version_check@0.9.5	X									X		
+want@0.3.1										X		
+wasi@0.11.1+wasi-snapshot-preview1	X	X								X		
+wasi@0.14.2+wasi-0.2.4	X	X								X		
+wasm-bindgen@0.2.100	X									X		
+wasm-bindgen-backend@0.2.100	X									X		
+wasm-bindgen-futures@0.4.50	X									X		
+wasm-bindgen-macro@0.2.100	X									X		
+wasm-bindgen-macro-support@0.2.100	X									X		
+wasm-bindgen-shared@0.2.100	X									X		
+wasm-streams@0.4.2	X									X		
+web-sys@0.3.77	X									X		
+webpki-roots@1.0.3							X					
+windows-core@0.61.2	X									X		
+windows-implement@0.60.0	X									X		
+windows-interface@0.59.1	X									X		
+windows-link@0.1.3	X									X		
+windows-link@0.2.1	X									X		
+windows-result@0.3.4	X									X		
+windows-strings@0.4.2	X									X		
+windows-sys@0.52.0	X									X		
+windows-sys@0.59.0	X									X		
+windows-sys@0.60.2	X									X		
+windows-sys@0.61.2	X									X		
+windows-targets@0.52.6	X									X		
+windows-targets@0.53.3	X									X		
+windows_aarch64_gnullvm@0.52.6	X									X		
+windows_aarch64_gnullvm@0.53.0	X									X		
+windows_aarch64_msvc@0.52.6	X									X		
+windows_aarch64_msvc@0.53.0	X									X		
+windows_i686_gnu@0.52.6	X									X		
+windows_i686_gnu@0.53.0	X									X		
+windows_i686_gnullvm@0.52.6	X									X		
+windows_i686_gnullvm@0.53.0	X									X		
+windows_i686_msvc@0.52.6	X									X		
+windows_i686_msvc@0.53.0	X									X		
+windows_x86_64_gnu@0.52.6	X									X		
+windows_x86_64_gnu@0.53.0	X									X		
+windows_x86_64_gnullvm@0.52.6	X									X		
+windows_x86_64_gnullvm@0.53.0	X									X		
+windows_x86_64_msvc@0.52.6	X									X		
+windows_x86_64_msvc@0.53.0	X									X		
+wit-bindgen-rt@0.39.0	X	X								X		
+writeable@0.6.1											X	
+wyz@0.5.1										X		
+yoke@0.8.0											X	
+yoke-derive@0.8.0											X	
+zerocopy@0.8.26	X		X							X		
+zerofrom@0.1.6											X	
+zerofrom-derive@0.1.6											X	
+zeroize@1.8.2	X									X		
+zerotrie@0.2.2											X	
+zerovec@0.11.4											X	
+zerovec-derive@0.11.1											X	
+zstd@0.13.3										X		
+zstd-safe@7.2.4	X									X		
+zstd-sys@2.0.16+zstd.1.5.7	X									X		

From eb60036076ed93487be05442f14099baf025a337 Mon Sep 17 00:00:00 2001
From: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
Date: Mon, 2 Mar 2026 10:57:07 +0800
Subject: [PATCH 180/287] Bump version to 0.2.0

---
 fluss-rust/Cargo.toml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 77d714006a..584897789c 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -24,7 +24,7 @@ homepage = "https://fluss.apache.org/"
 license = "Apache-2.0"
 repository = "https://github.com/apache/fluss-rust"
 rust-version = "1.85"
-version = "0.1.0"
+version = "0.2.0"
 keywords = ["fluss", "streaming-storage", "datalake"]
 
 [workspace]
@@ -32,7 +32,7 @@ resolver = "2"
 members = ["crates/fluss", "crates/examples", "bindings/python", "bindings/cpp"]
 
 [workspace.dependencies]
-fluss = { package = "fluss-rs", version = "0.1.0", path = "crates/fluss", features = ["storage-all"] }
+fluss = { package = "fluss-rs", version = "0.2.0", path = "crates/fluss", features = ["storage-all"] }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
 arrow = { version = "57.0.0", features = ["ipc_compression"] }

From 0ea4e071d4d90b740356267a382cc79156ef6edc Mon Sep 17 00:00:00 2001
From: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
Date: Mon, 2 Mar 2026 11:26:39 +0800
Subject: [PATCH 181/287] ci: update verify tag version

---
 .../actions/verify-tag-version/action.yml      | 18 +++++++++++-------
 1 file changed, 11 insertions(+), 7 deletions(-)

diff --git a/fluss-rust/.github/actions/verify-tag-version/action.yml b/fluss-rust/.github/actions/verify-tag-version/action.yml
index ad16b4f979..1b34bdba03 100644
--- a/fluss-rust/.github/actions/verify-tag-version/action.yml
+++ b/fluss-rust/.github/actions/verify-tag-version/action.yml
@@ -26,12 +26,16 @@ runs:
   using: 'composite'
   steps:
     - run: |
-        TAG_VERSION="${GITHUB_REF#refs/tags/v}"
-        CRATE_VERSION=$(sed -n '/^\[workspace.package\]/,/^\[/p' Cargo.toml | grep '^\s*version\s*=' | head -1 | sed -E 's/.*"([^"]+)".*/\1/')
-        base() { echo "$1" | sed -E 's/-rc(\.[0-9]+|[0-9]+)$//'; }
-        if [ "$(base "$TAG_VERSION")" != "$(base "$CRATE_VERSION")" ]; then
-          echo "::error::Tag version ($TAG_VERSION) does not match Cargo.toml version ($CRATE_VERSION). Run scripts/bump-version.sh before tagging, or tag the version that is in Cargo.toml."
-          exit 1
-        fi
         echo "Tag and crate version match: $TAG_VERSION"
       shell: bash
+# Commented out for 0.1.0-incubating-rc0; restore this step once the incubating suffix is no longer needed
+#    - run: |
+#        TAG_VERSION="${GITHUB_REF#refs/tags/v}"
+#        CRATE_VERSION=$(sed -n '/^\[workspace.package\]/,/^\[/p' Cargo.toml | grep '^\s*version\s*=' | head -1 | sed -E 's/.*"([^"]+)".*/\1/')
+#        base() { echo "$1" | sed -E 's/-rc(\.[0-9]+|[0-9]+)$//'; }
+#        if [ "$(base "$TAG_VERSION")" != "$(base "$CRATE_VERSION")" ]; then
+#          echo "::error::Tag version ($TAG_VERSION) does not match Cargo.toml version ($CRATE_VERSION). Run scripts/bump-version.sh before tagging, or tag the version that is in Cargo.toml."
+#          exit 1
+#        fi
+#        echo "Tag and crate version match: $TAG_VERSION"
+#      shell: bash

From 7818f020e93cfb8dba3265a04f75ed6112bca288 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Tue, 3 Mar 2026 16:00:51 +0800
Subject: [PATCH 182/287] chore: update rust docs (#416)

---
 fluss-rust/crates/fluss/src/error.rs          |  2 +-
 fluss-rust/crates/fluss/src/lib.rs            | 87 +++++++++++++++++++
 .../crates/fluss/src/record/kv/kv_record.rs   |  2 +-
 fluss-rust/crates/fluss/src/row/binary/mod.rs |  2 +-
 fluss-rust/crates/fluss/src/row/encode/mod.rs |  6 +-
 5 files changed, 93 insertions(+), 6 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index 59524a6387..5cf0d4b847 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -33,7 +33,7 @@ pub enum Error {
     )]
     UnexpectedError {
         message: String,
-        /// see https://github.com/shepmaster/snafu/issues/446
+        /// see <https://github.com/shepmaster/snafu/issues/446>
         #[snafu(source(from(Box<dyn std::error::Error + Send + Sync + 'static>, Some)))]
         source: Option<Box<dyn std::error::Error + Send + Sync + 'static>>,
     },
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index 689c37ca06..cd060c8e45 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -15,6 +15,93 @@
 // specific language governing permissions and limitations
 // under the License.
 
+//! Apache Fluss (Incubating) Official Rust Client
+//!
+//! Official Rust client library for [Apache Fluss (Incubating)](https://fluss.apache.org/).
+//! It supports **primary key (KV) tables** (upsert + lookup) and **log tables** (append + scan).
+//!
+//! # Examples
+//!
+//! ## Primary key table and log table
+//!
+//! Connect to a cluster, create a KV table (upsert and lookup), then a log table (append and scan):
+//!
+//! ```rust,no_run
+//! use fluss::client::EARLIEST_OFFSET;
+//! use fluss::client::FlussConnection;
+//! use fluss::config::Config;
+//! use fluss::error::Result;
+//! use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+//! use fluss::row::{GenericRow, InternalRow};
+//! use std::time::Duration;
+//!
+//! #[tokio::main]
+//! async fn main() -> Result<()> {
+//!     let mut config = Config::default();
+//!     config.bootstrap_servers = "127.0.0.1:9123".to_string();
+//!     let connection = FlussConnection::new(config).await?;
+//!     let admin = connection.get_admin().await?;
+//!
+//!     // ---- Primary key (KV) table: upsert and lookup ----
+//!     let kv_path = TablePath::new("fluss", "users");
+//!     let mut kv_schema = Schema::builder()
+//!         .column("id", DataTypes::int())
+//!         .column("name", DataTypes::string())
+//!         .column("age", DataTypes::bigint())
+//!         .primary_key(vec!["id"]);
+//!     let kv_descriptor = TableDescriptor::builder()
+//!         .schema(kv_schema.build()?)
+//!         .build()?;
+//!     admin.create_table(&kv_path, &kv_descriptor, false).await?;
+//!
+//!     let kv_table = connection.get_table(&kv_path).await?;
+//!     let upsert_writer = kv_table.new_upsert()?.create_writer()?;
+//!     let mut row = GenericRow::new(3);
+//!     row.set_field(0, 1i32);
+//!     row.set_field(1, "Alice");
+//!     row.set_field(2, 30i64);
+//!     upsert_writer.upsert(&row)?;
+//!     upsert_writer.flush().await?;
+//!
+//!     let mut lookuper = kv_table.new_lookup()?.create_lookuper()?;
+//!     let mut key = GenericRow::new(1);
+//!     key.set_field(0, 1i32);
+//!     let result = lookuper.lookup(&key).await?;
+//!     if let Some(r) = result.get_single_row()? {
+//!         println!("KV lookup: id={}, name={}, age={}",
+//!                  r.get_int(0)?, r.get_string(1)?, r.get_long(2)?);
+//!     }
+//!
+//!     // ---- Log table: append and scan ----
+//!     let log_path = TablePath::new("fluss", "events");
+//!     let mut log_schema_builder = Schema::builder()
+//!         .column("ts", DataTypes::bigint())
+//!         .column("message", DataTypes::string());
+//!     let log_descriptor = TableDescriptor::builder()
+//!         .schema(log_schema_builder.build()?)
+//!         .build()?;
+//!     admin.create_table(&log_path, &log_descriptor, false).await?;
+//!
+//!     let log_table = connection.get_table(&log_path).await?;
+//!     let append_writer = log_table.new_append()?.create_writer()?;
+//!     let mut event = GenericRow::new(2);
+//!     event.set_field(0, 1700000000i64);
+//!     event.set_field(1, "hello");
+//!     append_writer.append(&event)?;
+//!     append_writer.flush().await?;
+//!
+//!     let scanner = log_table.new_scan().create_log_scanner()?;
+//!     scanner.subscribe(0, EARLIEST_OFFSET).await?;
+//!     let scan_records = scanner.poll(Duration::from_secs(1)).await?;
+//!     for record in scan_records {
+//!         let r = record.row();
+//!         println!("Log scan: ts={}, message={}", r.get_long(0)?, r.get_string(1)?);
+//!     }
+//!
+//!     Ok(())
+//! }
+//! ```
+
 pub mod client;
 pub mod metadata;
 pub mod record;
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
index a9c45d6971..ed67aa0e24 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record.rs
@@ -50,7 +50,7 @@ pub const LENGTH_LENGTH: usize = 4;
 /// use the `row()` method with a RowDecoder (typically obtained from the iterator).
 ///
 /// Reference implementation:
-/// https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/record/KvRecord.java
+/// <https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/record/KvRecord.java>
 #[derive(Debug, Clone)]
 pub struct KvRecord {
     key: Bytes,
diff --git a/fluss-rust/crates/fluss/src/row/binary/mod.rs b/fluss-rust/crates/fluss/src/row/binary/mod.rs
index c31cbd59c1..2a88ee1753 100644
--- a/fluss-rust/crates/fluss/src/row/binary/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/mod.rs
@@ -19,7 +19,7 @@ mod binary_writer;
 
 pub use binary_writer::*;
 
-/// The binary row format types, it indicates the generated [`BinaryRow`] type by the [`BinaryWriter`]
+/// The binary row format type; it indicates the type of row generated by the [`BinaryWriter`].
 #[allow(dead_code)]
 pub enum BinaryRowFormat {
     Compacted,
diff --git a/fluss-rust/crates/fluss/src/row/encode/mod.rs b/fluss-rust/crates/fluss/src/row/encode/mod.rs
index 1ce7aef75c..16a540ebf8 100644
--- a/fluss-rust/crates/fluss/src/row/encode/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/mod.rs
@@ -64,12 +64,12 @@ impl KeyEncoderFactory {
     }
 }
 
-/// An encoder to write [`BinaryRow`]. It's used to write row
-/// multi-times one by one. When writing a new row:
+/// An encoder to write binary row data. It's used to write rows
+/// one by one. When writing a new row:
 ///
 /// 1. call method [`RowEncoder::start_new_row()`] to start the writing.
 /// 2. call method [`RowEncoder::encode_field()`] to write the row's field.
-/// 3. call method [`RowEncoder::finishRow()`] to finish the writing and get the written row.
+/// 3. call method [`RowEncoder::finish_row()`] to finish the writing and get the written row.
 #[allow(dead_code)]
 pub trait RowEncoder: Send + Sync {
     /// Start to write a new row.

From 1fefc8da9633497d4c5ad035eef035e121276e47 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Tue, 3 Mar 2026 11:19:58 +0000
Subject: [PATCH 183/287] chore: error handling fix CPP, for pointer returning
 methods (#409)

---
 fluss-rust/bindings/cpp/src/connection.cpp    |  40 +--
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |   8 +
 fluss-rust/bindings/cpp/src/lib.rs            | 298 ++++++++++--------
 fluss-rust/bindings/cpp/src/table.cpp         | 107 +++----
 .../bindings/cpp/test/test_sasl_auth.cpp      |   5 +-
 5 files changed, 243 insertions(+), 215 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/connection.cpp b/fluss-rust/bindings/cpp/src/connection.cpp
index dcf85783d9..6cd73017f5 100644
--- a/fluss-rust/bindings/cpp/src/connection.cpp
+++ b/fluss-rust/bindings/cpp/src/connection.cpp
@@ -47,15 +47,13 @@ Connection& Connection::operator=(Connection&& other) noexcept {
 }
 
 Result Connection::Create(const Configuration& config, Connection& out) {
-    try {
-        auto ffi_config = utils::to_ffi_config(config);
-        out.conn_ = ffi::new_connection(ffi_config);
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
-    } catch (const std::exception& e) {
-        return utils::make_client_error(e.what());
+    auto ffi_config = utils::to_ffi_config(config);
+    auto ffi_result = ffi::new_connection(ffi_config);
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out.conn_ = utils::ptr_from_ffi<ffi::Connection>(ffi_result);
     }
+    return result;
 }
 
 bool Connection::Available() const { return conn_ != nullptr; }
@@ -65,14 +63,12 @@ Result Connection::GetAdmin(Admin& out) {
         return utils::make_client_error("Connection not available");
     }
 
-    try {
-        out.admin_ = conn_->get_admin();
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
-    } catch (const std::exception& e) {
-        return utils::make_client_error(e.what());
+    auto ffi_result = conn_->get_admin();
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out.admin_ = utils::ptr_from_ffi<ffi::Admin>(ffi_result);
     }
+    return result;
 }
 
 Result Connection::GetTable(const TablePath& table_path, Table& out) {
@@ -80,15 +76,13 @@ Result Connection::GetTable(const TablePath& table_path, Table& out) {
         return utils::make_client_error("Connection not available");
     }
 
-    try {
-        auto ffi_path = utils::to_ffi_table_path(table_path);
-        out.table_ = conn_->get_table(ffi_path);
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
-    } catch (const std::exception& e) {
-        return utils::make_client_error(e.what());
+    auto ffi_path = utils::to_ffi_table_path(table_path);
+    auto ffi_result = conn_->get_table(ffi_path);
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out.table_ = utils::ptr_from_ffi<ffi::Table>(ffi_result);
     }
+    return result;
 }
 
 }  // namespace fluss
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 3375761460..93a60bf6e9 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -19,6 +19,8 @@
 
 #pragma once
 
+#include <cassert>
+
 #include "fluss.hpp"
 #include "lib.rs.h"
 
@@ -37,6 +39,12 @@ inline Result from_ffi_result(const ffi::FfiResult& ffi_result) {
     return Result{ffi_result.error_code, std::string(ffi_result.error_message)};
 }
 
+template <typename T>
+inline T* ptr_from_ffi(const ffi::FfiPtrResult& r) {
+    assert(r.ptr != 0 && "ptr_from_ffi: null pointer in FfiPtrResult");
+    return reinterpret_cast<T*>(r.ptr);
+}
+
 inline ffi::FfiTablePath to_ffi_table_path(const TablePath& path) {
     ffi::FfiTablePath ffi_path;
     ffi_path.database_name = rust::String(path.database_name);
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index c310fc838e..366a19831e 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -247,6 +247,11 @@ mod ffi {
         server_nodes: Vec<FfiServerNode>,
     }
 
+    struct FfiPtrResult {
+        result: FfiResult,
+        ptr: usize,
+    }
+
     extern "Rust" {
         type Connection;
         type Admin;
@@ -263,13 +268,10 @@ mod ffi {
         type LookupResultInner;
 
         // Connection
-        // TODO: all Result<*mut T> methods lose server error codes (mapped to CLIENT_ERROR).
-        // Fix by introducing  some struct like { result: FfiResult, ptr: i64 } to preserve error
-        // codes from the server, matching how Rust and Python bindings handle errors.
-        fn new_connection(config: &FfiConfig) -> Result<*mut Connection>;
+        fn new_connection(config: &FfiConfig) -> FfiPtrResult;
         unsafe fn delete_connection(conn: *mut Connection);
-        fn get_admin(self: &Connection) -> Result<*mut Admin>;
-        fn get_table(self: &Connection, table_path: &FfiTablePath) -> Result<*mut Table>;
+        fn get_admin(self: &Connection) -> FfiPtrResult;
+        fn get_table(self: &Connection, table_path: &FfiTablePath) -> FfiPtrResult;
 
         // Admin
         unsafe fn delete_admin(admin: *mut Admin);
@@ -344,20 +346,13 @@ mod ffi {
 
         // Table
         unsafe fn delete_table(table: *mut Table);
-        fn new_append_writer(self: &Table) -> Result<*mut AppendWriter>;
-        fn create_scanner(
-            self: &Table,
-            column_indices: Vec<usize>,
-            batch: bool,
-        ) -> Result<*mut LogScanner>;
+        fn new_append_writer(self: &Table) -> FfiPtrResult;
+        fn create_scanner(self: &Table, column_indices: Vec<usize>, batch: bool) -> FfiPtrResult;
         fn get_table_info_from_table(self: &Table) -> FfiTableInfo;
         fn get_table_path(self: &Table) -> FfiTablePath;
         fn has_primary_key(self: &Table) -> bool;
-        fn create_upsert_writer(
-            self: &Table,
-            column_indices: Vec<usize>,
-        ) -> Result<*mut UpsertWriter>;
-        fn new_lookuper(self: &Table) -> Result<*mut Lookuper>;
+        fn create_upsert_writer(self: &Table, column_indices: Vec<usize>) -> FfiPtrResult;
+        fn new_lookuper(self: &Table) -> FfiPtrResult;
 
         // GenericRowInner — opaque row for writes
         fn new_generic_row(field_count: usize) -> Box<GenericRowInner>;
@@ -378,21 +373,22 @@ mod ffi {
 
         // AppendWriter
         unsafe fn delete_append_writer(writer: *mut AppendWriter);
-        fn append(self: &mut AppendWriter, row: &GenericRowInner) -> Result<Box<WriteResult>>;
+        fn append(self: &mut AppendWriter, row: &GenericRowInner) -> FfiPtrResult;
         fn append_arrow_batch(
             self: &mut AppendWriter,
             array_ptr: usize,
             schema_ptr: usize,
-        ) -> Result<Box<WriteResult>>;
+        ) -> FfiPtrResult;
         fn flush(self: &mut AppendWriter) -> FfiResult;
 
-        // WriteResult — dropped automatically via rust::Box, or call wait() for ack
+        // WriteResult
+        unsafe fn delete_write_result(wr: *mut WriteResult);
         fn wait(self: &mut WriteResult) -> FfiResult;
 
         // UpsertWriter
         unsafe fn delete_upsert_writer(writer: *mut UpsertWriter);
-        fn upsert(self: &mut UpsertWriter, row: &GenericRowInner) -> Result<Box<WriteResult>>;
-        fn delete_row(self: &mut UpsertWriter, row: &GenericRowInner) -> Result<Box<WriteResult>>;
+        fn upsert(self: &mut UpsertWriter, row: &GenericRowInner) -> FfiPtrResult;
+        fn delete_row(self: &mut UpsertWriter, row: &GenericRowInner) -> FfiPtrResult;
         fn upsert_flush(self: &mut UpsertWriter) -> FfiResult;
 
         // Lookuper
@@ -630,13 +626,34 @@ fn err_from_core_error(e: &fcore::error::Error) -> ffi::FfiResult {
     }
 }
 
+fn ok_ptr(ptr: usize) -> ffi::FfiPtrResult {
+    ffi::FfiPtrResult {
+        result: ok_result(),
+        ptr,
+    }
+}
+
+fn client_err_ptr(msg: String) -> ffi::FfiPtrResult {
+    ffi::FfiPtrResult {
+        result: client_err(msg),
+        ptr: 0usize,
+    }
+}
+
+fn err_ptr_from_core(e: &fcore::error::Error) -> ffi::FfiPtrResult {
+    ffi::FfiPtrResult {
+        result: err_from_core_error(e),
+        ptr: 0usize,
+    }
+}
+
 // Connection implementation
-fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
+fn new_connection(config: &ffi::FfiConfig) -> ffi::FfiPtrResult {
     let assigner_type = match config.writer_bucket_no_key_assigner.as_str() {
         "round_robin" => fluss::config::NoKeyAssigner::RoundRobin,
         "sticky" => fluss::config::NoKeyAssigner::Sticky,
         other => {
-            return Err(format!(
+            return client_err_ptr(format!(
                 "Unknown bucket assigner type: '{other}', expected 'sticky' or 'round_robin'"
             ));
         }
@@ -664,10 +681,10 @@ fn new_connection(config: &ffi::FfiConfig) -> Result<*mut Connection, String> {
 
     match conn {
         Ok(c) => {
-            let conn = Box::into_raw(Box::new(Connection { inner: Arc::new(c) }));
-            Ok(conn)
+            let ptr = Box::into_raw(Box::new(Connection { inner: Arc::new(c) }));
+            ok_ptr(ptr as usize)
         }
-        Err(e) => Err(format!("Failed to connect: {e}")),
+        Err(e) => err_ptr_from_core(&e),
     }
 }
 
@@ -680,19 +697,19 @@ unsafe fn delete_connection(conn: *mut Connection) {
 }
 
 impl Connection {
-    fn get_admin(&self) -> Result<*mut Admin, String> {
+    fn get_admin(&self) -> ffi::FfiPtrResult {
         let admin_result = RUNTIME.block_on(async { self.inner.get_admin().await });
 
         match admin_result {
             Ok(admin) => {
-                let admin = Box::into_raw(Box::new(Admin { inner: admin }));
-                Ok(admin)
+                let ptr = Box::into_raw(Box::new(Admin { inner: admin }));
+                ok_ptr(ptr as usize)
             }
-            Err(e) => Err(format!("Failed to get admin: {e}")),
+            Err(e) => err_ptr_from_core(&e),
         }
     }
 
-    fn get_table(&self, table_path: &ffi::FfiTablePath) -> Result<*mut Table, String> {
+    fn get_table(&self, table_path: &ffi::FfiTablePath) -> ffi::FfiPtrResult {
         let path = fcore::metadata::TablePath::new(
             table_path.database_name.clone(),
             table_path.table_name.clone(),
@@ -702,16 +719,16 @@ impl Connection {
 
         match table_result {
             Ok(t) => {
-                let table = Box::into_raw(Box::new(Table {
+                let ptr = Box::into_raw(Box::new(Table {
                     connection: self.inner.clone(),
                     metadata: t.metadata().clone(),
                     table_info: t.get_table_info().clone(),
                     table_path: t.table_path().clone(),
                     has_pk: t.has_primary_key(),
                 }));
-                Ok(table)
+                ok_ptr(ptr as usize)
             }
-            Err(e) => Err(format!("Failed to get table: {e}")),
+            Err(e) => err_ptr_from_core(&e),
         }
     }
 }
@@ -1196,29 +1213,27 @@ impl Table {
             .collect()
     }
 
-    fn new_append_writer(&self) -> Result<*mut AppendWriter, String> {
+    fn new_append_writer(&self) -> ffi::FfiPtrResult {
         let _enter = RUNTIME.enter();
 
-        let table_append = self
-            .fluss_table()
-            .new_append()
-            .map_err(|e| format!("Failed to create append: {e}"))?;
+        let table_append = match self.fluss_table().new_append() {
+            Ok(a) => a,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
-        let writer = table_append
-            .create_writer()
-            .map_err(|e| format!("Failed to create writer: {e}"))?;
+        let writer = match table_append.create_writer() {
+            Ok(w) => w,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
-        Ok(Box::into_raw(Box::new(AppendWriter {
+        let ptr = Box::into_raw(Box::new(AppendWriter {
             inner: writer,
             table_info: self.table_info.clone(),
-        })))
+        }));
+        ok_ptr(ptr as usize)
     }
 
-    fn create_scanner(
-        &self,
-        column_indices: Vec<usize>,
-        batch: bool,
-    ) -> Result<*mut LogScanner, String> {
+    fn create_scanner(&self, column_indices: Vec<usize>, batch: bool) -> ffi::FfiPtrResult {
         RUNTIME.block_on(async {
             let fluss_table = self.fluss_table();
             let scan = fluss_table.new_scan();
@@ -1226,29 +1241,34 @@ impl Table {
             let (projected_columns, scan) = if column_indices.is_empty() {
                 (self.table_info.get_schema().columns().to_vec(), scan)
             } else {
-                let cols = self.resolve_projected_columns(&column_indices)?;
-                let scan = scan
-                    .project(&column_indices)
-                    .map_err(|e| format!("Failed to project columns: {e}"))?;
+                let cols = match self.resolve_projected_columns(&column_indices) {
+                    Ok(c) => c,
+                    Err(e) => return client_err_ptr(e),
+                };
+                let scan = match scan.project(&column_indices) {
+                    Ok(s) => s,
+                    Err(e) => return err_ptr_from_core(&e),
+                };
                 (cols, scan)
             };
 
             let scanner = if batch {
-                let s = scan
-                    .create_record_batch_log_scanner()
-                    .map_err(|e| format!("Failed to create record batch log scanner: {e}"))?;
-                ScannerKind::Batch(s)
+                match scan.create_record_batch_log_scanner() {
+                    Ok(s) => ScannerKind::Batch(s),
+                    Err(e) => return err_ptr_from_core(&e),
+                }
             } else {
-                let s = scan
-                    .create_log_scanner()
-                    .map_err(|e| format!("Failed to create log scanner: {e}"))?;
-                ScannerKind::Record(s)
+                match scan.create_log_scanner() {
+                    Ok(s) => ScannerKind::Record(s),
+                    Err(e) => return err_ptr_from_core(&e),
+                }
             };
 
-            Ok(Box::into_raw(Box::new(LogScanner {
+            let ptr = Box::into_raw(Box::new(LogScanner {
                 scanner,
                 projected_columns,
-            })))
+            }));
+            ok_ptr(ptr as usize)
         })
     }
 
@@ -1267,51 +1287,53 @@ impl Table {
         self.has_pk
     }
 
-    fn create_upsert_writer(
-        &self,
-        column_indices: Vec<usize>,
-    ) -> Result<*mut UpsertWriter, String> {
+    fn create_upsert_writer(&self, column_indices: Vec<usize>) -> ffi::FfiPtrResult {
         let _enter = RUNTIME.enter();
 
-        let table_upsert = self
-            .fluss_table()
-            .new_upsert()
-            .map_err(|e| format!("Failed to create upsert: {e}"))?;
+        let table_upsert = match self.fluss_table().new_upsert() {
+            Ok(u) => u,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
         let table_upsert = if column_indices.is_empty() {
             table_upsert
         } else {
-            table_upsert
-                .partial_update(Some(column_indices))
-                .map_err(|e| format!("Failed to set partial update columns: {e}"))?
+            match table_upsert.partial_update(Some(column_indices)) {
+                Ok(u) => u,
+                Err(e) => return err_ptr_from_core(&e),
+            }
         };
 
-        let writer = table_upsert
-            .create_writer()
-            .map_err(|e| format!("Failed to create upsert writer: {e}"))?;
+        let writer = match table_upsert.create_writer() {
+            Ok(w) => w,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
-        Ok(Box::into_raw(Box::new(UpsertWriter {
+        let ptr = Box::into_raw(Box::new(UpsertWriter {
             inner: writer,
             table_info: self.table_info.clone(),
-        })))
+        }));
+        ok_ptr(ptr as usize)
     }
 
-    fn new_lookuper(&self) -> Result<*mut Lookuper, String> {
+    fn new_lookuper(&self) -> ffi::FfiPtrResult {
         let _enter = RUNTIME.enter();
 
-        let table_lookup = self
-            .fluss_table()
-            .new_lookup()
-            .map_err(|e| format!("Failed to create lookup: {e}"))?;
+        let table_lookup = match self.fluss_table().new_lookup() {
+            Ok(l) => l,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
-        let lookuper = table_lookup
-            .create_lookuper()
-            .map_err(|e| format!("Failed to create lookuper: {e}"))?;
+        let lookuper = match table_lookup.create_lookuper() {
+            Ok(l) => l,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
-        Ok(Box::into_raw(Box::new(Lookuper {
+        let ptr = Box::into_raw(Box::new(Lookuper {
             inner: lookuper,
             table_info: self.table_info.clone(),
-        })))
+        }));
+        ok_ptr(ptr as usize)
     }
 }
 
@@ -1325,26 +1347,25 @@ unsafe fn delete_append_writer(writer: *mut AppendWriter) {
 }
 
 impl AppendWriter {
-    fn append(&mut self, row: &GenericRowInner) -> Result<Box<WriteResult>, String> {
+    fn append(&mut self, row: &GenericRowInner) -> ffi::FfiPtrResult {
         let schema = self.table_info.get_schema();
-        let generic_row =
-            types::resolve_row_types(&row.row, Some(schema)).map_err(|e| e.to_string())?;
+        let generic_row = match types::resolve_row_types(&row.row, Some(schema)) {
+            Ok(r) => r,
+            Err(e) => return client_err_ptr(e.to_string()),
+        };
 
-        let result_future = self
-            .inner
-            .append(&generic_row)
-            .map_err(|e| format!("Failed to append: {e}"))?;
+        let result_future = match self.inner.append(&generic_row) {
+            Ok(f) => f,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
-        Ok(Box::new(WriteResult {
+        let ptr = Box::into_raw(Box::new(WriteResult {
             inner: Some(result_future),
-        }))
+        }));
+        ok_ptr(ptr as usize)
     }
 
-    fn append_arrow_batch(
-        &mut self,
-        array_ptr: usize,
-        schema_ptr: usize,
-    ) -> Result<Box<WriteResult>, String> {
+    fn append_arrow_batch(&mut self, array_ptr: usize, schema_ptr: usize) -> ffi::FfiPtrResult {
         use arrow::ffi::{FFI_ArrowArray, FFI_ArrowSchema};
 
         // Safety: C++ allocates these via `new ArrowArray/ArrowSchema` after a
@@ -1355,22 +1376,25 @@ impl AppendWriter {
 
         // Safety: `from_ffi` requires that the array and schema conform to the
         // Arrow C Data Interface, which is guaranteed by C++'s ExportRecordBatch.
-        let array_data = unsafe { arrow::ffi::from_ffi(ffi_array, &ffi_schema) }
-            .map_err(|e| format!("Failed to import Arrow batch: {e}"))?;
+        let array_data = match unsafe { arrow::ffi::from_ffi(ffi_array, &ffi_schema) } {
+            Ok(d) => d,
+            Err(e) => return client_err_ptr(format!("Failed to import Arrow batch: {e}")),
+        };
         // ffi_array is consumed by from_ffi; ffi_schema is dropped here (Box goes out of scope)
 
         // Reconstruct RecordBatch from the imported StructArray data
         let struct_array = arrow::array::StructArray::from(array_data);
         let batch = arrow::record_batch::RecordBatch::from(struct_array);
 
-        let result_future = self
-            .inner
-            .append_arrow_batch(batch)
-            .map_err(|e| format!("Failed to append Arrow batch: {e}"))?;
+        let result_future = match self.inner.append_arrow_batch(batch) {
+            Ok(f) => f,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
-        Ok(Box::new(WriteResult {
+        let ptr = Box::into_raw(Box::new(WriteResult {
             inner: Some(result_future),
-        }))
+        }));
+        ok_ptr(ptr as usize)
     }
 
     fn flush(&mut self) -> ffi::FfiResult {
@@ -1383,6 +1407,14 @@ impl AppendWriter {
     }
 }
 
+unsafe fn delete_write_result(wr: *mut WriteResult) {
+    if !wr.is_null() {
+        unsafe {
+            drop(Box::from_raw(wr));
+        }
+    }
+}
+
 impl WriteResult {
     fn wait(&mut self) -> ffi::FfiResult {
         if let Some(future) = self.inner.take() {
@@ -1417,36 +1449,42 @@ impl UpsertWriter {
         row
     }
 
-    fn upsert(&mut self, row: &GenericRowInner) -> Result<Box<WriteResult>, String> {
+    fn upsert(&mut self, row: &GenericRowInner) -> ffi::FfiPtrResult {
         let schema = self.table_info.get_schema();
-        let generic_row =
-            types::resolve_row_types(&row.row, Some(schema)).map_err(|e| e.to_string())?;
+        let generic_row = match types::resolve_row_types(&row.row, Some(schema)) {
+            Ok(r) => r,
+            Err(e) => return client_err_ptr(e.to_string()),
+        };
         let generic_row = self.pad_row(generic_row);
 
-        let result_future = self
-            .inner
-            .upsert(&generic_row)
-            .map_err(|e| format!("Failed to upsert: {e}"))?;
+        let result_future = match self.inner.upsert(&generic_row) {
+            Ok(f) => f,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
-        Ok(Box::new(WriteResult {
+        let ptr = Box::into_raw(Box::new(WriteResult {
             inner: Some(result_future),
-        }))
+        }));
+        ok_ptr(ptr as usize)
     }
 
-    fn delete_row(&mut self, row: &GenericRowInner) -> Result<Box<WriteResult>, String> {
+    fn delete_row(&mut self, row: &GenericRowInner) -> ffi::FfiPtrResult {
         let schema = self.table_info.get_schema();
-        let generic_row =
-            types::resolve_row_types(&row.row, Some(schema)).map_err(|e| e.to_string())?;
+        let generic_row = match types::resolve_row_types(&row.row, Some(schema)) {
+            Ok(r) => r,
+            Err(e) => return client_err_ptr(e.to_string()),
+        };
         let generic_row = self.pad_row(generic_row);
 
-        let result_future = self
-            .inner
-            .delete(&generic_row)
-            .map_err(|e| format!("Failed to delete: {e}"))?;
+        let result_future = match self.inner.delete(&generic_row) {
+            Ok(f) => f,
+            Err(e) => return err_ptr_from_core(&e),
+        };
 
-        Ok(Box::new(WriteResult {
+        let ptr = Box::into_raw(Box::new(WriteResult {
             inner: Some(result_future),
-        }))
+        }));
+        ok_ptr(ptr as usize)
     }
 
     fn upsert_flush(&mut self) -> ffi::FfiResult {
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index b0b7029d22..c49a64433b 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -578,14 +578,12 @@ Result TableAppend::CreateWriter(AppendWriter& out) {
         return utils::make_client_error("Table not available");
     }
 
-    try {
-        out = AppendWriter(table_->new_append_writer());
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
-    } catch (const std::exception& e) {
-        return utils::make_client_error(e.what());
+    auto ffi_result = table_->new_append_writer();
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out = AppendWriter(utils::ptr_from_ffi<ffi::AppendWriter>(ffi_result));
     }
+    return result;
 }
 
 // ============================================================================
@@ -645,11 +643,14 @@ Result TableUpsert::CreateWriter(UpsertWriter& out) {
         for (size_t idx : resolved_indices) {
             rust_indices.push_back(idx);
         }
-        out = UpsertWriter(table_->create_upsert_writer(std::move(rust_indices)));
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
+        auto ffi_result = table_->create_upsert_writer(std::move(rust_indices));
+        auto result = utils::from_ffi_result(ffi_result.result);
+        if (result.Ok()) {
+            out = UpsertWriter(utils::ptr_from_ffi<ffi::UpsertWriter>(ffi_result));
+        }
+        return result;
     } catch (const std::exception& e) {
+        // ResolveNameProjection() may throw
         return utils::make_client_error(e.what());
     }
 }
@@ -665,14 +666,12 @@ Result TableLookup::CreateLookuper(Lookuper& out) {
         return utils::make_client_error("Table not available");
     }
 
-    try {
-        out = Lookuper(table_->new_lookuper());
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
-    } catch (const std::exception& e) {
-        return utils::make_client_error(e.what());
+    auto ffi_result = table_->new_lookuper();
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out = Lookuper(utils::ptr_from_ffi<ffi::Lookuper>(ffi_result));
     }
+    return result;
 }
 
 // ============================================================================
@@ -731,11 +730,14 @@ Result TableScan::DoCreateScanner(LogScanner& out, bool is_record_batch) {
         for (size_t idx : resolved_indices) {
             rust_indices.push_back(idx);
         }
-        out.scanner_ = table_->create_scanner(std::move(rust_indices), is_record_batch);
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
+        auto ffi_result = table_->create_scanner(std::move(rust_indices), is_record_batch);
+        auto result = utils::from_ffi_result(ffi_result.result);
+        if (result.Ok()) {
+            out.scanner_ = utils::ptr_from_ffi<ffi::LogScanner>(ffi_result);
+        }
+        return result;
     } catch (const std::exception& e) {
+        // ResolveNameProjection() may throw
         return utils::make_client_error(e.what());
     }
 }
@@ -752,8 +754,7 @@ WriteResult::~WriteResult() noexcept { Destroy(); }
 
 void WriteResult::Destroy() noexcept {
     if (inner_) {
-        // Reconstruct the rust::Box to let Rust drop the value
-        rust::Box<ffi::WriteResult>::from_raw(inner_);
+        ffi::delete_write_result(inner_);
         inner_ = nullptr;
     }
 }
@@ -827,15 +828,12 @@ Result AppendWriter::Append(const GenericRow& row, WriteResult& out) {
         return utils::make_client_error("GenericRow not available");
     }
 
-    try {
-        auto rust_box = writer_->append(*row.inner_);
-        out = WriteResult(rust_box.into_raw());
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
-    } catch (const std::exception& e) {
-        return utils::make_client_error(e.what());
+    auto ffi_result = writer_->append(*row.inner_);
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out = WriteResult(utils::ptr_from_ffi<ffi::WriteResult>(ffi_result));
     }
+    return result;
 }
 
 Result AppendWriter::AppendArrowBatch(const std::shared_ptr<arrow::RecordBatch>& batch) {
@@ -864,19 +862,16 @@ Result AppendWriter::AppendArrowBatch(const std::shared_ptr<arrow::RecordBatch>&
     auto* array_heap = new ArrowArray(std::move(c_array));
     auto* schema_heap = new ArrowSchema(std::move(c_schema));
 
-    try {
-        // Rust takes ownership of both pointers immediately via Box::from_raw(),
-        // so after this call (success or exception) C++ must NOT free them.
-        auto result_box = writer_->append_arrow_batch(reinterpret_cast<size_t>(array_heap),
-                                                      reinterpret_cast<size_t>(schema_heap));
+    // Rust takes ownership of both pointers immediately via Box::from_raw(),
+    // so after this call C++ must NOT free them.
+    auto ffi_result = writer_->append_arrow_batch(reinterpret_cast<size_t>(array_heap),
+                                                  reinterpret_cast<size_t>(schema_heap));
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
         out.Destroy();
-        out.inner_ = result_box.into_raw();
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(std::string(e.what()));
-    } catch (const std::exception& e) {
-        return utils::make_client_error(std::string(e.what()));
+        out.inner_ = utils::ptr_from_ffi<ffi::WriteResult>(ffi_result);
     }
+    return result;
 }
 
 Result AppendWriter::Flush() {
@@ -933,15 +928,12 @@ Result UpsertWriter::Upsert(const GenericRow& row, WriteResult& out) {
         return utils::make_client_error("GenericRow not available");
     }
 
-    try {
-        auto rust_box = writer_->upsert(*row.inner_);
-        out = WriteResult(rust_box.into_raw());
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
-    } catch (const std::exception& e) {
-        return utils::make_client_error(e.what());
+    auto ffi_result = writer_->upsert(*row.inner_);
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out = WriteResult(utils::ptr_from_ffi<ffi::WriteResult>(ffi_result));
     }
+    return result;
 }
 
 Result UpsertWriter::Delete(const GenericRow& row) {
@@ -957,15 +949,12 @@ Result UpsertWriter::Delete(const GenericRow& row, WriteResult& out) {
         return utils::make_client_error("GenericRow not available");
     }
 
-    try {
-        auto rust_box = writer_->delete_row(*row.inner_);
-        out = WriteResult(rust_box.into_raw());
-        return utils::make_ok();
-    } catch (const rust::Error& e) {
-        return utils::make_client_error(e.what());
-    } catch (const std::exception& e) {
-        return utils::make_client_error(e.what());
+    auto ffi_result = writer_->delete_row(*row.inner_);
+    auto result = utils::from_ffi_result(ffi_result.result);
+    if (result.Ok()) {
+        out = WriteResult(utils::ptr_from_ffi<ffi::WriteResult>(ffi_result));
     }
+    return result;
 }
 
 Result UpsertWriter::Flush() {
diff --git a/fluss-rust/bindings/cpp/test/test_sasl_auth.cpp b/fluss-rust/bindings/cpp/test/test_sasl_auth.cpp
index 2208db3019..5a52a1ab79 100644
--- a/fluss-rust/bindings/cpp/test/test_sasl_auth.cpp
+++ b/fluss-rust/bindings/cpp/test/test_sasl_auth.cpp
@@ -89,8 +89,7 @@ TEST_F(SaslAuthTest, SaslConnectWithWrongPassword) {
     fluss::Connection conn;
     auto result = fluss::Connection::Create(config, conn);
     ASSERT_FALSE(result.Ok());
-    // TODO: error_code is CLIENT_ERROR (-2) because CXX Result<*mut T> loses the server
-    // error code. Should be AUTHENTICATE_EXCEPTION (46) once fixed
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::AUTHENTICATE_EXCEPTION);
     EXPECT_NE(result.error_message.find("Authentication failed"), std::string::npos)
         << "Expected 'Authentication failed' in: " << result.error_message;
 }
@@ -106,7 +105,7 @@ TEST_F(SaslAuthTest, SaslConnectWithUnknownUser) {
     fluss::Connection conn;
     auto result = fluss::Connection::Create(config, conn);
     ASSERT_FALSE(result.Ok());
-    // TODO: same as above — should check error_code == AUTHENTICATE_EXCEPTION once fixed.
+    EXPECT_EQ(result.error_code, fluss::ErrorCode::AUTHENTICATE_EXCEPTION);
     EXPECT_NE(result.error_message.find("Authentication failed"), std::string::npos)
         << "Expected 'Authentication failed' in: " << result.error_message;
 }

From 0e86cc37e2872810ef136df9488e4813ecfe69be Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Tue, 3 Mar 2026 20:02:30 +0800
Subject: [PATCH 184/287] ci: fix ci build wheel issue for python (#419)

---
 .../.github/workflows/release_python.yml      | 20 ++++++++++++++++++-
 fluss-rust/bindings/python/Cargo.toml         |  2 +-
 2 files changed, 20 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/.github/workflows/release_python.yml b/fluss-rust/.github/workflows/release_python.yml
index d7bd04ccb7..323838d54c 100644
--- a/fluss-rust/.github/workflows/release_python.yml
+++ b/fluss-rust/.github/workflows/release_python.yml
@@ -94,9 +94,10 @@ jobs:
 
       - name: Install protoc (Windows)
         if: runner.os == 'Windows'
-        run: choco install protobuf -y
+        run: choco install protoc -y
         shell: pwsh
 
+      # Install protoc in manylinux container (x86_64/aarch64); script shared via YAML anchor
       - uses: PyO3/maturin-action@v1
         with:
           working-directory: bindings/python
@@ -104,6 +105,20 @@ jobs:
           command: build
           args: --release -o dist -i python3.9
           manylinux: ${{ matrix.manylinux || 'auto' }}
+          before-script-linux: &protoc-install |
+            set -e
+            ARCH=$(uname -m)
+            case "$ARCH" in
+              x86_64)  ZIP=protoc-27.1-linux-x86_64.zip ;;
+              aarch64) ZIP=protoc-27.1-linux-aarch_64.zip ;;
+              *) echo "Unsupported arch $ARCH"; exit 1 ;;
+            esac
+            curl -sLO "https://github.com/protocolbuffers/protobuf/releases/download/v27.1/${ZIP}"
+            python3 -c "import zipfile; zipfile.ZipFile('${ZIP}').extractall('/tmp/protoc_install')"
+            chmod +x /tmp/protoc_install/bin/protoc
+            rm -f "${ZIP}"
+            export PATH="/tmp/protoc_install/bin:$PATH"
+            export PROTOC=/tmp/protoc_install/bin/protoc
       - uses: PyO3/maturin-action@v1
         with:
           working-directory: bindings/python
@@ -111,6 +126,7 @@ jobs:
           command: build
           args: --release -o dist -i python3.10
           manylinux: ${{ matrix.manylinux || 'auto' }}
+          before-script-linux: *protoc-install
       - uses: PyO3/maturin-action@v1
         with:
           working-directory: bindings/python
@@ -118,6 +134,7 @@ jobs:
           command: build
           args: --release -o dist -i python3.11
           manylinux: ${{ matrix.manylinux || 'auto' }}
+          before-script-linux: *protoc-install
       - uses: PyO3/maturin-action@v1
         with:
           working-directory: bindings/python
@@ -125,6 +142,7 @@ jobs:
           command: build
           args: --release -o dist -i python3.12
           manylinux: ${{ matrix.manylinux || 'auto' }}
+          before-script-linux: *protoc-install
 
       - name: Upload wheels
         uses: actions/upload-artifact@v4
diff --git a/fluss-rust/bindings/python/Cargo.toml b/fluss-rust/bindings/python/Cargo.toml
index 9cf20e3d7b..30ac0469bc 100644
--- a/fluss-rust/bindings/python/Cargo.toml
+++ b/fluss-rust/bindings/python/Cargo.toml
@@ -27,7 +27,7 @@ name = "fluss"
 crate-type = ["cdylib"]
 
 [dependencies]
-pyo3 = { version = "0.26.0", features = ["extension-module"] }
+pyo3 = { version = "0.26.0", features = ["extension-module", "generate-import-lib"] }
 fluss = { workspace = true, features = ["storage-all"] }
 tokio = { workspace = true }
 arrow = { workspace = true }

From b9944eb31a126ba08c2926f54eca5fe6ff5f8462 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Tue, 3 Mar 2026 13:35:16 +0000
Subject: [PATCH 185/287] chore: fix mut schema builder public api (#420)

---
 fluss-rust/crates/examples/Cargo.toml         | 2 +-
 fluss-rust/crates/fluss/src/metadata/table.rs | 6 +++---
 fluss-rust/crates/fluss/src/test_utils.rs     | 2 +-
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/fluss-rust/crates/examples/Cargo.toml b/fluss-rust/crates/examples/Cargo.toml
index cce6faf258..26251cc721 100644
--- a/fluss-rust/crates/examples/Cargo.toml
+++ b/fluss-rust/crates/examples/Cargo.toml
@@ -37,4 +37,4 @@ path = "src/example_kv_table.rs"
 
 [[example]]
 name = "example-partitioned-upsert-lookup"
-path = "src/example_partitioned_kv_table.rs"
\ No newline at end of file
+path = "src/example_partitioned_kv_table.rs"
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index 7f0d2e2a27..dba9a5230d 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -234,8 +234,8 @@ impl SchemaBuilder {
         Ok(self)
     }
 
-    pub fn build(&mut self) -> Result<Schema> {
-        let columns = Self::normalize_columns(&mut self.columns, self.primary_key.as_ref())?;
+    pub fn build(&self) -> Result<Schema> {
+        let columns = Self::normalize_columns(&self.columns, self.primary_key.as_ref())?;
 
         let column_names: HashSet<_> = columns.iter().map(|c| &c.name).collect();
         for auto_inc_col in &self.auto_increment_col_names {
@@ -266,7 +266,7 @@ impl SchemaBuilder {
     }
 
     fn normalize_columns(
-        columns: &mut [Column],
+        columns: &[Column],
         primary_key: Option<&PrimaryKey>,
     ) -> Result<Vec<Column>> {
         let names: Vec<_> = columns.iter().map(|c| &c.name).collect();
diff --git a/fluss-rust/crates/fluss/src/test_utils.rs b/fluss-rust/crates/fluss/src/test_utils.rs
index 752d42244e..47bb2ea81e 100644
--- a/fluss-rust/crates/fluss/src/test_utils.rs
+++ b/fluss-rust/crates/fluss/src/test_utils.rs
@@ -25,7 +25,7 @@ use std::sync::Arc;
 
 pub(crate) fn build_table_info(table_path: TablePath, table_id: i64, buckets: i32) -> TableInfo {
     let row_type = DataTypes::row(vec![DataField::new("id", DataTypes::int(), None)]);
-    let mut schema_builder = Schema::builder().with_row_type(&row_type);
+    let schema_builder = Schema::builder().with_row_type(&row_type);
     let schema = schema_builder.build().expect("schema build");
     let table_descriptor = TableDescriptor::builder()
         .schema(schema)

From 2f0f517d96cfd87d4705eeb6bef0d41e9dfd07f1 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Wed, 4 Mar 2026 02:08:25 +0000
Subject: [PATCH 186/287] [doc] Setup workflow for doc publish (#414)

---
 fluss-rust/.asf.yaml                          |  4 +-
 .../workflows/deploy_documentation.yml        | 81 +++++++++++++++++++
 fluss-rust/website/docusaurus.config.ts       | 23 +++++-
 fluss-rust/website/package.json               |  1 +
 fluss-rust/website/static/CNAME               |  1 +
 fluss-rust/website/static/manifest.json       | 17 ++++
 6 files changed, 124 insertions(+), 3 deletions(-)
 create mode 100644 fluss-rust/.github/workflows/deploy_documentation.yml
 create mode 100644 fluss-rust/website/static/CNAME
 create mode 100644 fluss-rust/website/static/manifest.json

diff --git a/fluss-rust/.asf.yaml b/fluss-rust/.asf.yaml
index b71e0264e3..929cc9fd7c 100644
--- a/fluss-rust/.asf.yaml
+++ b/fluss-rust/.asf.yaml
@@ -19,7 +19,9 @@
 
 github:
   description: "Rust Client for Apache Fluss (Incubating)"
-  homepage: https://fluss.apache.org/
+  homepage: https://clients.fluss.apache.org/
+  ghp_branch: gh-pages
+  ghp_path: /
   features:
     issues: true
     projects: false
diff --git a/fluss-rust/.github/workflows/deploy_documentation.yml b/fluss-rust/.github/workflows/deploy_documentation.yml
new file mode 100644
index 0000000000..05d8f1c1b8
--- /dev/null
+++ b/fluss-rust/.github/workflows/deploy_documentation.yml
@@ -0,0 +1,81 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+name: Deploy Documentation
+
+on:
+  workflow_dispatch:
+
+permissions:
+  contents: write
+
+jobs:
+  deploy:
+    runs-on: ubuntu-latest
+    defaults:
+      run:
+        working-directory: ./website
+    steps:
+      - uses: actions/checkout@v6
+        with:
+          fetch-depth: 0
+
+      - uses: actions/setup-node@v6
+        with:
+          node-version: 24
+
+      - name: Install dependencies
+        run: npm install
+
+      - name: Build website
+        run: npm run build
+
+      - name: Deploy to gh-pages branch
+        working-directory: .
+        env:
+          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+        run: |
+          git config user.name "github-actions[bot]"
+          git config user.email "github-actions[bot]@users.noreply.github.com"
+
+          # Create a temporary directory with the built site
+          TMPDIR=$(mktemp -d)
+          cp -r website/build/* "$TMPDIR"
+
+          # Switch to the gh-pages branch (create orphan if it doesn't exist)
+          if git ls-remote --exit-code origin gh-pages; then
+            git fetch origin gh-pages
+            git checkout gh-pages
+          else
+            git checkout --orphan gh-pages
+            git rm -rf .
+          fi
+
+          # Replace contents with the new build
+          git rm -rf . || true
+          git clean -fdx
+          cp -r "$TMPDIR"/* .
+          rm -rf "$TMPDIR"
+
+          # Commit and push
+          git add -A
+          if git diff --cached --quiet; then
+            echo "No changes to deploy."
+          else
+            git commit -m "Deploy website from ${GITHUB_SHA::8}"
+            git push origin gh-pages
+          fi
diff --git a/fluss-rust/website/docusaurus.config.ts b/fluss-rust/website/docusaurus.config.ts
index 0d974e95df..8c2e173d3b 100644
--- a/fluss-rust/website/docusaurus.config.ts
+++ b/fluss-rust/website/docusaurus.config.ts
@@ -7,8 +7,8 @@ const config: Config = {
   tagline: 'Rust, Python, and C++ clients for Apache Fluss',
   favicon: 'img/logo/fluss_favicon.svg',
 
-  url: 'https://fluss.apache.org/',
-  baseUrl: '/fluss-rust/',
+  url: 'https://clients.fluss.apache.org',
+  baseUrl: '/',
 
   organizationName: 'apache',
   projectName: 'fluss-rust',
@@ -20,6 +20,25 @@ const config: Config = {
     locales: ['en'],
   },
 
+  plugins: [
+    [
+      '@docusaurus/plugin-pwa',
+      {
+        debug: false,
+        offlineModeActivationStrategies: [
+          'appInstalled',
+          'standalone',
+          'queryString',
+        ],
+        pwaHead: [
+          { tagName: 'link', rel: 'icon', href: '/img/logo/fluss_favicon.svg' },
+          { tagName: 'link', rel: 'manifest', href: '/manifest.json' },
+          { tagName: 'meta', name: 'theme-color', content: '#0071e3' },
+        ],
+      },
+    ],
+  ],
+
   presets: [
     [
       'classic',
diff --git a/fluss-rust/website/package.json b/fluss-rust/website/package.json
index 644a705184..75f1499fb4 100644
--- a/fluss-rust/website/package.json
+++ b/fluss-rust/website/package.json
@@ -12,6 +12,7 @@
   },
   "dependencies": {
     "@docusaurus/core": "^3.9.2",
+    "@docusaurus/plugin-pwa": "^3.9.2",
     "@docusaurus/preset-classic": "^3.9.2",
     "@mdx-js/react": "^3.0.0",
     "clsx": "^2.0.0",
diff --git a/fluss-rust/website/static/CNAME b/fluss-rust/website/static/CNAME
new file mode 100644
index 0000000000..6298936bc4
--- /dev/null
+++ b/fluss-rust/website/static/CNAME
@@ -0,0 +1 @@
+clients.fluss.apache.org
diff --git a/fluss-rust/website/static/manifest.json b/fluss-rust/website/static/manifest.json
new file mode 100644
index 0000000000..7cd3b569db
--- /dev/null
+++ b/fluss-rust/website/static/manifest.json
@@ -0,0 +1,17 @@
+{
+  "short_name": "Fluss Clients",
+  "name": "Apache Fluss Clients: Rust, Python, and C++",
+  "description": "Rust, Python, and C++ clients for Apache Fluss",
+  "start_url": "/",
+  "scope": "/",
+  "display": "standalone",
+  "background_color": "#000000",
+  "theme_color": "#0071e3",
+  "icons": [
+    {
+      "src": "img/logo/svg/colored_logo.svg",
+      "sizes": "any",
+      "type": "image/svg+xml"
+    }
+  ]
+}

From 8ba7762784d3333cb1ffb753f5cacd6b9a811fb2 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Wed, 4 Mar 2026 10:58:24 +0800
Subject: [PATCH 187/287] doc: update create a release doc (#421)

---
 .../website/docs/release/create-release.md      | 17 +++++++++--------
 1 file changed, 9 insertions(+), 8 deletions(-)

diff --git a/fluss-rust/website/docs/release/create-release.md b/fluss-rust/website/docs/release/create-release.md
index fc936f9a61..ba9c8752a1 100644
--- a/fluss-rust/website/docs/release/create-release.md
+++ b/fluss-rust/website/docs/release/create-release.md
@@ -77,12 +77,13 @@ cd fluss-rust
 Set these once and use them in all following commands. (Bash syntax.)
 
 ```bash
-export RELEASE_VERSION="0.1.0"
-export RELEASE_TAG="v${RELEASE_VERSION}"
-export SVN_RELEASE_DIR="fluss-rust-${RELEASE_VERSION}"
+RELEASE_VERSION="0.1.0"
+SHORT_RELEASE_VERSION="0.1"
+RELEASE_TAG="v${RELEASE_VERSION}"
+SVN_RELEASE_DIR="fluss-rust-${RELEASE_VERSION}"
 # Only set if there is a previous release (for compare link in DISCUSS / release notes)
-export LAST_VERSION="0.0.9"
-export NEXT_VERSION="0.2.0"
+LAST_VERSION="0.0.9"
+NEXT_VERSION="0.2.0"
 ```
 
 For the **first release** there is no previous version; leave `LAST_VERSION` unset or omit it when using the compare link in the DISCUSS thread and release notes.
@@ -122,8 +123,8 @@ From `main`, create a release branch. All release artifacts will be built from t
 ```bash
 git checkout main
 git pull
-git checkout -b release-${RELEASE_VERSION}
-git push origin release-${RELEASE_VERSION}
+git checkout -b release-${SHORT_RELEASE_VERSION}
+git push origin release-${SHORT_RELEASE_VERSION}
 ```
 
 Do **not** create or push the release/RC tag yet; that happens in [Build a release candidate](#build-a-release-candidate) after the source artifacts are staged.
@@ -184,7 +185,7 @@ For a **direct release** (no RC), skip these and use `RELEASE_TAG` and `SVN_RELE
 Check out the release branch at the commit you want to release, create the signed tag, then push it. Use `RC_TAG` for a release candidate or `RELEASE_TAG` for a direct release. Pushing the tag triggers GitHub Actions (for an RC tag, fluss-python is published to TestPyPI).
 
 ```bash
-git checkout release-${RELEASE_VERSION}
+git checkout release-${SHORT_RELEASE_VERSION}
 git pull
 git tag -s $RC_TAG -m "${RC_TAG}"
 git push origin $RC_TAG

From b953ab193cb62456794e3bcd9b571f47375d618b Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Thu, 5 Mar 2026 04:47:25 +0100
Subject: [PATCH 188/287] feat: Add getter/setter property for
 writer_bucket_no_key_assigner config in python (#397)

---
 fluss-rust/bindings/cpp/src/lib.rs            | 14 ++++----
 fluss-rust/bindings/python/fluss/__init__.pyi |  4 +++
 fluss-rust/bindings/python/src/config.rs      | 33 ++++++++++++++-----
 fluss-rust/crates/fluss/src/config.rs         | 18 ++++------
 4 files changed, 41 insertions(+), 28 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 366a19831e..36b9c51694 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -649,14 +649,12 @@ fn err_ptr_from_core(e: &fcore::error::Error) -> ffi::FfiPtrResult {
 
 // Connection implementation
 fn new_connection(config: &ffi::FfiConfig) -> ffi::FfiPtrResult {
-    let assigner_type = match config.writer_bucket_no_key_assigner.as_str() {
-        "round_robin" => fluss::config::NoKeyAssigner::RoundRobin,
-        "sticky" => fluss::config::NoKeyAssigner::Sticky,
-        other => {
-            return client_err_ptr(format!(
-                "Unknown bucket assigner type: '{other}', expected 'sticky' or 'round_robin'"
-            ));
-        }
+    let assigner_raw = config.writer_bucket_no_key_assigner.as_str();
+    let assigner_type = match assigner_raw.parse::<fluss::config::NoKeyAssigner>() {
+        Ok(v) => v,
+        Err(e) => {
+            return client_err_ptr(format!("Invalid bucket assigner type '{assigner_raw}': {e}"));
+        }
     };
     let config_core = fluss::config::Config {
         bootstrap_servers: config.bootstrap_servers.to_string(),
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index c387d7340e..417ac9b2e9 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -154,6 +154,10 @@ class Config:
     @writer_batch_size.setter
     def writer_batch_size(self, size: int) -> None: ...
     @property
+    def writer_bucket_no_key_assigner(self) -> str: ...
+    @writer_bucket_no_key_assigner.setter
+    def writer_bucket_no_key_assigner(self, value: str) -> None: ...
+    @property
     def scanner_remote_log_prefetch_num(self) -> int: ...
     @scanner_remote_log_prefetch_num.setter
     def scanner_remote_log_prefetch_num(self, num: int) -> None: ...
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index 4582d43d49..f99f9c63f8 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -98,15 +98,12 @@ impl Config {
                             })?;
                     }
                     "writer.bucket.no-key-assigner" => {
-                        config.writer_bucket_no_key_assigner = match value.as_str() {
-                            "round_robin" => fcore::config::NoKeyAssigner::RoundRobin,
-                            "sticky" => fcore::config::NoKeyAssigner::Sticky,
-                            other => {
-                                return Err(FlussError::new_err(format!(
-                                    "Unknown bucket assigner type: {other}, expected 'sticky' or 'round_robin'"
-                                )));
-                            }
-                        };
+                        config.writer_bucket_no_key_assigner =
+                            value.parse::<fcore::config::NoKeyAssigner>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
                     }
                     "connect-timeout" => {
                         config.connect_timeout_ms = value.parse::<u64>().map_err(|e| {
@@ -255,6 +252,24 @@ impl Config {
         self.inner.writer_batch_timeout_ms = timeout;
     }
 
+    /// Get the bucket assignment strategy for tables without bucket keys
+    #[getter]
+    fn writer_bucket_no_key_assigner(&self) -> String {
+        self.inner.writer_bucket_no_key_assigner.to_string()
+    }
+
+    /// Set the bucket assignment strategy for tables without bucket keys
+    #[setter]
+    fn set_writer_bucket_no_key_assigner(&mut self, value: String) -> PyResult<()> {
+        self.inner.writer_bucket_no_key_assigner =
+            value.parse::<fcore::config::NoKeyAssigner>().map_err(|e| {
+                FlussError::new_err(format!(
+                    "Invalid value '{value}' for 'writer.bucket.no-key-assigner': {e}"
+                ))
+            })?;
+        Ok(())
+    }
+
     /// Get the connect timeout in milliseconds
     #[getter]
     fn connect_timeout_ms(&self) -> u64 {
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 438c948307..08ffbfae77 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -17,7 +17,7 @@
 
 use clap::{Parser, ValueEnum};
 use serde::{Deserialize, Serialize};
-use std::fmt;
+use strum_macros::{Display, EnumString};
 
 const DEFAULT_BOOTSTRAP_SERVER: &str = "127.0.0.1:9123";
 const DEFAULT_REQUEST_MAX_SIZE: i32 = 10 * 1024 * 1024;
@@ -36,24 +36,20 @@ const DEFAULT_SASL_MECHANISM: &str = "PLAIN";
 
 /// Bucket assigner strategy for tables without bucket keys.
 /// Matches Java `client.writer.bucket.no-key-assigner`.
-#[derive(Debug, Clone, Copy, PartialEq, Eq, ValueEnum, Deserialize, Serialize)]
+#[derive(
+    Debug, Clone, Copy, PartialEq, Eq, ValueEnum, Deserialize, Serialize, EnumString, Display,
+)]
 #[serde(rename_all = "snake_case")]
+#[strum(ascii_case_insensitive)]
 pub enum NoKeyAssigner {
     /// Sticks to one bucket until the batch is full, then switches.
+    #[strum(serialize = "sticky")]
     Sticky,
     /// Assigns each record to the next bucket in a rotating sequence.
+    #[strum(serialize = "round_robin")]
     RoundRobin,
 }
 
-impl fmt::Display for NoKeyAssigner {
-    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
-        match self {
-            NoKeyAssigner::Sticky => write!(f, "sticky"),
-            NoKeyAssigner::RoundRobin => write!(f, "round_robin"),
-        }
-    }
-}
-
 #[derive(Parser, Clone, Deserialize, Serialize)]
 #[command(author, version, about, long_about = None)]
 pub struct Config {

From 8fdccce0d25c6af1e09c8218c1a138f05c355fe4 Mon Sep 17 00:00:00 2001
From: aicontentcreate2023-star <aicontentcreate2023@gmail.com>
Date: Thu, 5 Mar 2026 12:00:37 +0800
Subject: [PATCH 189/287] chore: update testing fluss image to 0.9.0 (#426)

---
 fluss-rust/bindings/cpp/test/test_utils.h                  | 2 +-
 fluss-rust/bindings/python/test/conftest.py                | 2 +-
 fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs | 2 +-
 3 files changed, 3 insertions(+), 3 deletions(-)

diff --git a/fluss-rust/bindings/cpp/test/test_utils.h b/fluss-rust/bindings/cpp/test/test_utils.h
index 98d119a5d3..05c32cf21b 100644
--- a/fluss-rust/bindings/cpp/test/test_utils.h
+++ b/fluss-rust/bindings/cpp/test/test_utils.h
@@ -50,7 +50,7 @@
 namespace fluss_test {
 
 static constexpr const char* kFlussImage = "apache/fluss";
-static constexpr const char* kFlussVersion = "0.8.0-incubating";
+static constexpr const char* kFlussVersion = "0.9.0-incubating";
 static constexpr const char* kNetworkName = "fluss-cpp-test-network";
 static constexpr const char* kZookeeperName = "zookeeper-cpp-test";
 static constexpr const char* kCoordinatorName = "coordinator-server-cpp-test";
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
index 0a969e8462..bb8d18b9cd 100644
--- a/fluss-rust/bindings/python/test/conftest.py
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -34,7 +34,7 @@
 import fluss
 
 FLUSS_IMAGE = "apache/fluss"
-FLUSS_VERSION = "0.8.0-incubating"
+FLUSS_VERSION = "0.9.0-incubating"
 BOOTSTRAP_SERVERS_ENV = os.environ.get("FLUSS_BOOTSTRAP_SERVERS")
 
 
diff --git a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
index a2e9157954..5dc3e33e22 100644
--- a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
+++ b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
@@ -25,7 +25,7 @@ use testcontainers::core::ContainerPort;
 use testcontainers::runners::AsyncRunner;
 use testcontainers::{ContainerAsync, GenericImage, ImageExt};
 
-const FLUSS_VERSION: &str = "0.8.0-incubating";
+const FLUSS_VERSION: &str = "0.9.0-incubating";
 const FLUSS_IMAGE: &str = "apache/fluss";
 
 pub struct FlussTestingClusterBuilder {

From f2b7d7fa6e98af749869ba7acb7cf12ebdedb5fc Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sat, 7 Mar 2026 02:19:21 +0100
Subject: [PATCH 190/287] chore: Remove config duplication in examples (#427)

---
 .../user-guide/cpp/example/configuration.md   | 16 +-------
 .../docs/user-guide/python/api-reference.md   | 38 +++++++++----------
 .../python/example/configuration.md           | 21 ++--------
 .../user-guide/rust/example/configuration.md  | 19 +---------
 4 files changed, 24 insertions(+), 70 deletions(-)

diff --git a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
index f4b6309b8b..38202618c9 100644
--- a/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/cpp/example/configuration.md
@@ -23,21 +23,7 @@ if (!result.Ok()) {
 
 All fields have sensible defaults. Only `bootstrap_servers` typically needs to be set.
 
-```cpp
-fluss::Configuration config;
-config.bootstrap_servers = "127.0.0.1:9123";                  // Coordinator address
-config.writer_request_max_size = 10 * 1024 * 1024;            // Max request size (10 MB)
-config.writer_acks = "all";                                    // Wait for all replicas
-config.writer_retries = std::numeric_limits<int32_t>::max();   // Retry on failure
-config.writer_batch_size = 2 * 1024 * 1024;                   // Batch size (2 MB)
-config.writer_batch_timeout_ms = 100;                          // Max time to wait for a batch to fill
-config.writer_bucket_no_key_assigner = "sticky";               // "sticky" or "round_robin"
-config.scanner_remote_log_prefetch_num = 4;                    // Remote log prefetch count
-config.remote_file_download_thread_num = 3;                    // Download threads
-config.scanner_remote_log_read_concurrency = 4;                // In-file remote log read concurrency
-config.scanner_log_max_poll_records = 500;                     // Max records per poll
-config.connect_timeout_ms = 120000;                            // TCP connect timeout (ms)
-```
+See the [`Configuration`](../api-reference.md#configuration) section in the API Reference for the full list of configuration fields, types, and defaults.
 
 ## SASL Authentication
 
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index 8f7ab61bbd..e9113b6974 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -7,25 +7,25 @@ Complete API reference for the Fluss Python client.
 
 ## `Config`
 
-| Method / Property                     | Description                                                                             |
-|---------------------------------------|-----------------------------------------------------------------------------------------|
-| `Config(properties: dict = None)`     | Create config from a dict of key-value pairs                                            |
-| `bootstrap_servers`                   | Get/set coordinator server address                                                      |
-| `writer_request_max_size`             | Get/set max request size in bytes                                                       |
-| `writer_acks`                         | Get/set acknowledgment setting (`"all"` for all replicas)                               |
-| `writer_retries`                      | Get/set number of retries on failure                                                    |
-| `writer_batch_size`                   | Get/set write batch size in bytes                                                       |
-| `writer_batch_timeout_ms`             | Get/set max time in ms to wait for a writer batch to fill up before sending             |
-| `writer.bucket.no-key-assigner`       | Bucket assignment strategy (`"sticky"` or `"round_robin"`); set via `Config(dict)` only |
-| `scanner_remote_log_prefetch_num`     | Get/set number of remote log segments to prefetch                                       |
-| `remote_file_download_thread_num`     | Get/set number of threads for remote log downloads                                      |
-| `scanner_remote_log_read_concurrency` | Get/set streaming read concurrency within a remote log file                             |
-| `scanner_log_max_poll_records`        | Get/set max number of records returned in a single poll()                               |
-| `connect_timeout_ms`                  | Get/set TCP connect timeout in milliseconds                                             |
-| `security_protocol`                   | Get/set security protocol (`"PLAINTEXT"` or `"sasl"`)                                   |
-| `security_sasl_mechanism`             | Get/set SASL mechanism (only `"PLAIN"` is supported)                                    |
-| `security_sasl_username`              | Get/set SASL username (required when protocol is `"sasl"`)                              |
-| `security_sasl_password`              | Get/set SASL password (required when protocol is `"sasl"`)                              |
+| Method / Property                     | Config Key                            | Description                                                                             |
+|---------------------------------------|---------------------------------------|-----------------------------------------------------------------------------------------|
+| `Config(properties: dict = None)`     |                                       | Create config from a dict of key-value pairs                                            |
+| `bootstrap_servers`                   | `bootstrap.servers`                   | Get/set coordinator server address                                                      |
+| `writer_request_max_size`             | `writer.request-max-size`             | Get/set max request size in bytes                                                       |
+| `writer_acks`                         | `writer.acks`                         | Get/set acknowledgment setting (`"all"` for all replicas)                               |
+| `writer_retries`                      | `writer.retries`                      | Get/set number of retries on failure                                                    |
+| `writer_batch_size`                   | `writer.batch-size`                   | Get/set write batch size in bytes                                                       |
+| `writer_batch_timeout_ms`             | `writer.batch-timeout-ms`             | Get/set max time in ms to wait for a writer batch to fill up before sending             |
+| `writer_bucket_no_key_assigner`       | `writer.bucket.no-key-assigner`       | Get/set bucket assignment strategy (`"sticky"` or `"round_robin"`)                      |
+| `scanner_remote_log_prefetch_num`     | `scanner.remote-log.prefetch-num`     | Get/set number of remote log segments to prefetch                                       |
+| `remote_file_download_thread_num`     | `remote-file.download-thread-num`     | Get/set number of threads for remote log downloads                                      |
+| `scanner_remote_log_read_concurrency` | `scanner.remote-log.read-concurrency` | Get/set streaming read concurrency within a remote log file                             |
+| `scanner_log_max_poll_records`        | `scanner.log.max-poll-records`        | Get/set max number of records returned in a single poll()                               |
+| `connect_timeout_ms`                  | `connect-timeout`                     | Get/set TCP connect timeout in milliseconds                                             |
+| `security_protocol`                   | `security.protocol`                   | Get/set security protocol (`"PLAINTEXT"` or `"sasl"`)                                   |
+| `security_sasl_mechanism`             | `security.sasl.mechanism`             | Get/set SASL mechanism (only `"PLAIN"` is supported)                                    |
+| `security_sasl_username`              | `security.sasl.username`              | Get/set SASL username (required when protocol is `"sasl"`)                              |
+| `security_sasl_password`              | `security.sasl.password`              | Get/set SASL password (required when protocol is `"sasl"`)                              |
 
 ## `FlussConnection`
 
diff --git a/fluss-rust/website/docs/user-guide/python/example/configuration.md b/fluss-rust/website/docs/user-guide/python/example/configuration.md
index 90b1249ca4..995a81cc33 100644
--- a/fluss-rust/website/docs/user-guide/python/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/python/example/configuration.md
@@ -21,24 +21,9 @@ with await fluss.FlussConnection.create(config) as conn:
 
 ## Connection Configurations
 
-| Key                                   | Description                                                                           | Default            |
-|---------------------------------------|---------------------------------------------------------------------------------------|--------------------|
-| `bootstrap.servers`                   | Coordinator server address                                                            | `127.0.0.1:9123`   |
-| `writer.request-max-size`             | Maximum request size in bytes                                                         | `10485760` (10 MB) |
-| `writer.acks`                         | Acknowledgment setting (`all` waits for all replicas)                                 | `all`              |
-| `writer.retries`                      | Number of retries on failure                                                          | `2147483647`       |
-| `writer.batch-size`                   | Batch size for writes in bytes                                                        | `2097152` (2 MB)   |
-| `writer.batch-timeout-ms`             | The maximum time to wait for a writer batch to fill up before sending.                | `100`              |
-| `writer.bucket.no-key-assigner`       | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin`  | `sticky`           |
-| `scanner.remote-log.prefetch-num`     | Number of remote log segments to prefetch                                             | `4`                |
-| `remote-file.download-thread-num`     | Number of threads for remote log downloads                                            | `3`                |
-| `scanner.remote-log.read-concurrency` | Streaming read concurrency within a remote log file                                   | `4`                |
-| `scanner.log.max-poll-records`        | Max records returned in a single poll()                                               | `500`              |
-| `connect-timeout`                     | TCP connect timeout in milliseconds                                                   | `120000`           |
-| `security.protocol`                   | `PLAINTEXT` (default) or `sasl` for SASL auth                                        | `PLAINTEXT`        |
-| `security.sasl.mechanism`             | SASL mechanism (only `PLAIN` is supported)                                            | `PLAIN`            |
-| `security.sasl.username`              | SASL username (required when protocol is `sasl`)                                      | (empty)            |
-| `security.sasl.password`              | SASL password (required when protocol is `sasl`)                                      | (empty)            |
+Configuration options can be set either via dict keys in the `Config()` constructor, or via Python property setters.
+
+See the [`Config`](../api-reference.md#config) section in the API Reference for the full list of options, their config keys, and descriptions.
 
 ## SASL Authentication
 
diff --git a/fluss-rust/website/docs/user-guide/rust/example/configuration.md b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
index f6340c976d..eba38d85f2 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/configuration.md
@@ -17,24 +17,7 @@ let conn = FlussConnection::new(config).await?;
 
 ## Connection Configurations
 
-| Option                                | Description                                                                          | Default          |
-|---------------------------------------|--------------------------------------------------------------------------------------|------------------|
-| `bootstrap_servers`                   | Coordinator server address                                                           | `127.0.0.1:9123` |
-| `writer_request_max_size`             | Maximum request size in bytes                                                        | 10 MB            |
-| `writer_acks`                         | Acknowledgment setting (`all` waits for all replicas)                                | `all`            |
-| `writer_retries`                      | Number of retries on failure                                                         | `i32::MAX`       |
-| `writer_batch_size`                   | Batch size for writes                                                                | 2 MB             |
-| `writer_batch_timeout_ms`             | The maximum time to wait for a writer batch to fill up before sending.               | `100`            |
-| `writer_bucket_no_key_assigner`       | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` | `sticky`         |
-| `scanner_remote_log_prefetch_num`     | Number of remote log segments to prefetch                                            | `4`              |
-| `remote_file_download_thread_num`     | Number of concurrent remote log file downloads                                       | `3`              |
-| `scanner_remote_log_read_concurrency` | Streaming read concurrency within a remote log file                                  | `4`              |
-| `scanner_log_max_poll_records`        | Maximum records returned in a single `poll()`                                        | `500`            |
-| `connect_timeout_ms`                  | TCP connect timeout in milliseconds                                                  | 120000           |
-| `security_protocol`                   | `PLAINTEXT` (default) or `sasl` for SASL auth                                       | `PLAINTEXT`      |
-| `security_sasl_mechanism`             | SASL mechanism (only `PLAIN` is supported)                                           | `PLAIN`          |
-| `security_sasl_username`              | SASL username (required when protocol is `sasl`)                                     | (empty)          |
-| `security_sasl_password`              | SASL password (required when protocol is `sasl`)                                     | (empty)          |
+See the [`Config`](../api-reference.md#config) section in the API Reference for the full list of configuration options, types, and defaults.
 
 ## SASL Authentication
 

From 3ddbebeffd6e6aa38bc5b374efc16dd57ba238b8 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 8 Mar 2026 09:43:34 +0000
Subject: [PATCH 191/287] ci: parallelize cpp integration tests (#434)

---
 .../.github/workflows/build_and_test_cpp.yml  |   4 +-
 fluss-rust/bindings/cpp/CMakeLists.txt        |  15 ++-
 fluss-rust/bindings/cpp/test/test_main.cpp    |  10 ++
 fluss-rust/bindings/cpp/test/test_utils.h     | 102 +++++++++++-------
 4 files changed, 90 insertions(+), 41 deletions(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
index 5cdd14d7e4..1931983d4e 100644
--- a/fluss-rust/.github/workflows/build_and_test_cpp.yml
+++ b/fluss-rust/.github/workflows/build_and_test_cpp.yml
@@ -70,9 +70,9 @@ jobs:
           cmake -B build -DFLUSS_ENABLE_TESTING=ON -DCMAKE_BUILD_TYPE=Debug
           cmake --build build --parallel
 
-      - name: Run C++ integration tests
+      - name: Run C++ integration tests (parallel)
         working-directory: bindings/cpp
-        run: cd build && ctest --output-on-failure --timeout 300
+        run: cd build && ctest -j$(nproc) --output-on-failure --timeout 300
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
diff --git a/fluss-rust/bindings/cpp/CMakeLists.txt b/fluss-rust/bindings/cpp/CMakeLists.txt
index 0cedf68249..ac93611685 100644
--- a/fluss-rust/bindings/cpp/CMakeLists.txt
+++ b/fluss-rust/bindings/cpp/CMakeLists.txt
@@ -256,6 +256,7 @@ if (FLUSS_ENABLE_TESTING)
     FetchContent_MakeAvailable(googletest)
 
     enable_testing()
+    include(GoogleTest)
 
     file(GLOB TEST_SOURCE_FILES "test/*.cpp")
     add_executable(fluss_cpp_test ${TEST_SOURCE_FILES})
@@ -267,5 +268,17 @@ if (FLUSS_ENABLE_TESTING)
         ${PROJECT_SOURCE_DIR}/test
     )
 
-    add_test(NAME fluss_cpp_integration_tests COMMAND fluss_cpp_test)
+    # Individual tests for parallel execution via ctest -j.
+    gtest_discover_tests(fluss_cpp_test
+        PROPERTIES
+            TIMEOUT 120
+            FIXTURES_REQUIRED fluss_cluster
+    )
+
+    # Cleanup: stop Docker containers after all tests finish.
+    # Mirrors Python's pytest_unconfigure and Rust's atexit cleanup.
+    add_test(NAME fluss_cluster_cleanup COMMAND fluss_cpp_test --cleanup)
+    set_tests_properties(fluss_cluster_cleanup PROPERTIES
+        FIXTURES_CLEANUP fluss_cluster
+    )
 endif()
diff --git a/fluss-rust/bindings/cpp/test/test_main.cpp b/fluss-rust/bindings/cpp/test/test_main.cpp
index 8c2e2d966f..7b132d2c37 100644
--- a/fluss-rust/bindings/cpp/test/test_main.cpp
+++ b/fluss-rust/bindings/cpp/test/test_main.cpp
@@ -22,6 +22,16 @@
 #include "test_utils.h"
 
 int main(int argc, char** argv) {
+    // --cleanup: stop Docker containers and exit (used by ctest FIXTURES_CLEANUP).
+    for (int i = 1; i < argc; ++i) {
+        if (std::string(argv[i]) == "--cleanup") {
+            const char* env = std::getenv("FLUSS_BOOTSTRAP_SERVERS");
+            if (env && std::strlen(env) > 0) return 0;
+            fluss_test::FlussTestCluster::StopAll();
+            return 0;
+        }
+    }
+
     ::testing::InitGoogleTest(&argc, argv);
 
     // Register the global test environment (manages the Fluss cluster lifecycle).
diff --git a/fluss-rust/bindings/cpp/test/test_utils.h b/fluss-rust/bindings/cpp/test/test_utils.h
index 05c32cf21b..f5b4971654 100644
--- a/fluss-rust/bindings/cpp/test/test_utils.h
+++ b/fluss-rust/bindings/cpp/test/test_utils.h
@@ -126,29 +126,42 @@ class FlussTestCluster {
         const char* env_servers = std::getenv("FLUSS_BOOTSTRAP_SERVERS");
         if (env_servers && std::strlen(env_servers) > 0) {
             bootstrap_servers_ = env_servers;
+            const char* env_sasl = std::getenv("FLUSS_SASL_BOOTSTRAP_SERVERS");
+            if (env_sasl && std::strlen(env_sasl) > 0) {
+                sasl_bootstrap_servers_ = env_sasl;
+            }
             external_cluster_ = true;
             std::cout << "Using external cluster: " << bootstrap_servers_ << std::endl;
             return true;
         }
 
+        // Reuse cluster started by another parallel test process or previous run.
+        if (WaitForPort("127.0.0.1", kPlainClientPort, /*timeout_seconds=*/1)) {
+            SetBootstrapServers();
+            external_cluster_ = true;
+            return true;
+        }
+
         std::cout << "Starting Fluss cluster via Docker..." << std::endl;
 
-        // Create network
+        // Remove stopped (not running) containers from previous runs.
+        RunCommand(std::string("docker rm ") + kTabletServerName + " 2>/dev/null || true");
+        RunCommand(std::string("docker rm ") + kCoordinatorName + " 2>/dev/null || true");
+        RunCommand(std::string("docker rm ") + kZookeeperName + " 2>/dev/null || true");
+        RunCommand(std::string("docker network rm ") + kNetworkName + " 2>/dev/null || true");
+
         RunCommand(std::string("docker network create ") + kNetworkName + " 2>/dev/null || true");
 
-        // Start ZooKeeper
         std::string zk_cmd = std::string("docker run -d --rm") + " --name " + kZookeeperName +
                              " --network " + kNetworkName + " zookeeper:3.9.2";
         if (RunCommand(zk_cmd) != 0) {
-            std::cerr << "Failed to start ZooKeeper" << std::endl;
-            return false;
+            return WaitForCluster();
         }
 
-        // Wait for ZooKeeper to be ready before starting Fluss servers
+        // Wait for ZooKeeper to be ready
         std::this_thread::sleep_for(std::chrono::seconds(5));
 
-        // Start Coordinator Server (dual listeners: CLIENT=SASL on 9123, PLAIN_CLIENT=plaintext on
-        // 9223)
+        // Coordinator Server (dual listeners: SASL on 9123, plaintext on 9223)
         std::string sasl_jaas =
             "org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required"
             " user_admin=\"admin-secret\" user_alice=\"alice-secret\";";
@@ -171,19 +184,15 @@ class FlussTestCluster {
         std::string coord_cmd = DockerRunCmd(kCoordinatorName, coord_props,
                                              {"9123:9123", "9223:9223"}, "coordinatorServer");
         if (RunCommand(coord_cmd) != 0) {
-            std::cerr << "Failed to start Coordinator Server" << std::endl;
-            Stop();
-            return false;
+            return WaitForCluster();
         }
 
-        // Wait for coordinator to be ready
         if (!WaitForPort("127.0.0.1", kCoordinatorPort)) {
             std::cerr << "Coordinator Server did not become ready" << std::endl;
-            Stop();
             return false;
         }
 
-        // Start Tablet Server (dual listeners: CLIENT=SASL on 9123, PLAIN_CLIENT=plaintext on 9223)
+        // Tablet Server (dual listeners: SASL on 9124, plaintext on 9224)
         std::string ts = std::string(kTabletServerName);
         std::string ts_props = JoinProps({
             "zookeeper.address: " + zk + ":2181",
@@ -205,43 +214,33 @@ class FlussTestCluster {
                                            std::to_string(kPlainClientTabletPort) + ":9223"},
                                           "tabletServer");
         if (RunCommand(ts_cmd) != 0) {
-            std::cerr << "Failed to start Tablet Server" << std::endl;
-            Stop();
-            return false;
+            return WaitForCluster();
         }
 
-        // Wait for tablet server to be ready
-        if (!WaitForPort("127.0.0.1", kTabletServerPort)) {
-            std::cerr << "Tablet Server did not become ready" << std::endl;
-            Stop();
-            return false;
-        }
-
-        // Wait for plaintext listeners
-        if (!WaitForPort("127.0.0.1", kPlainClientPort)) {
-            std::cerr << "Coordinator plaintext listener did not become ready" << std::endl;
-            Stop();
-            return false;
-        }
-        if (!WaitForPort("127.0.0.1", kPlainClientTabletPort)) {
-            std::cerr << "Tablet Server plaintext listener did not become ready" << std::endl;
-            Stop();
+        if (!WaitForPort("127.0.0.1", kTabletServerPort) ||
+            !WaitForPort("127.0.0.1", kPlainClientPort) ||
+            !WaitForPort("127.0.0.1", kPlainClientTabletPort)) {
+            std::cerr << "Cluster listeners did not become ready" << std::endl;
             return false;
         }
 
-        bootstrap_servers_ = "127.0.0.1:" + std::to_string(kPlainClientPort);
-        sasl_bootstrap_servers_ = "127.0.0.1:" + std::to_string(kCoordinatorPort);
+        SetBootstrapServers();
         std::cout << "Fluss cluster started successfully." << std::endl;
         return true;
     }
 
     void Stop() {
         if (external_cluster_) return;
+        StopAll();
+    }
 
+    /// Unconditionally stop and remove all cluster containers and the network.
+    /// Used by the --cleanup flag from ctest FIXTURES_CLEANUP.
+    static void StopAll() {
         std::cout << "Stopping Fluss cluster..." << std::endl;
-        RunCommand(std::string("docker stop ") + kTabletServerName + " 2>/dev/null || true");
-        RunCommand(std::string("docker stop ") + kCoordinatorName + " 2>/dev/null || true");
-        RunCommand(std::string("docker stop ") + kZookeeperName + " 2>/dev/null || true");
+        RunCommand(std::string("docker rm -f ") + kTabletServerName + " 2>/dev/null || true");
+        RunCommand(std::string("docker rm -f ") + kCoordinatorName + " 2>/dev/null || true");
+        RunCommand(std::string("docker rm -f ") + kZookeeperName + " 2>/dev/null || true");
         RunCommand(std::string("docker network rm ") + kNetworkName + " 2>/dev/null || true");
         std::cout << "Fluss cluster stopped." << std::endl;
     }
@@ -250,6 +249,32 @@ class FlussTestCluster {
     const std::string& GetSaslBootstrapServers() const { return sasl_bootstrap_servers_; }
 
    private:
+    void SetBootstrapServers() {
+        bootstrap_servers_ = "127.0.0.1:" + std::to_string(kPlainClientPort);
+        sasl_bootstrap_servers_ = "127.0.0.1:" + std::to_string(kCoordinatorPort);
+    }
+
+    /// Wait for a cluster being started by another process.
+    /// Fails fast if no containers exist (real Docker failure vs race).
+    bool WaitForCluster() {
+        if (RunCommand(std::string("docker inspect ") + kZookeeperName + " >/dev/null 2>&1") != 0) {
+            std::cerr << "Failed to start cluster (docker error)" << std::endl;
+            return false;
+        }
+        std::cout << "Waiting for cluster started by another process..." << std::endl;
+        if (!WaitForPort("127.0.0.1", kPlainClientPort) ||
+            !WaitForPort("127.0.0.1", kPlainClientTabletPort) ||
+            !WaitForPort("127.0.0.1", kCoordinatorPort) ||
+            !WaitForPort("127.0.0.1", kTabletServerPort)) {
+            std::cerr << "Cluster did not become ready" << std::endl;
+            return false;
+        }
+        SetBootstrapServers();
+        external_cluster_ = true;
+        std::cout << "Cluster ready." << std::endl;
+        return true;
+    }
+
     std::string bootstrap_servers_;
     std::string sasl_bootstrap_servers_;
     bool external_cluster_{false};
@@ -291,7 +316,8 @@ class FlussTestEnvironment : public ::testing::Environment {
         GTEST_SKIP() << "Fluss cluster did not become ready within timeout.";
     }
 
-    void TearDown() override { cluster_.Stop(); }
+    // Cluster stays alive for parallel processes and subsequent runs.
+    void TearDown() override {}
 
     fluss::Connection& GetConnection() { return connection_; }
     fluss::Admin& GetAdmin() { return admin_; }

From 036fac02b7710aba952ebe0945b5c7f6cb8c6c5e Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 8 Mar 2026 09:51:04 +0000
Subject: [PATCH 192/287] chore: pre-size Arrow builders and recommend jemalloc
 for write path (#430)

---
 fluss-rust/crates/examples/Cargo.toml         |  4 +
 .../crates/examples/src/example_table.rs      |  4 +
 fluss-rust/crates/fluss/Cargo.toml            |  1 -
 fluss-rust/crates/fluss/src/lib.rs            | 19 ++++
 fluss-rust/crates/fluss/src/record/arrow.rs   | 96 ++++++++++++-------
 5 files changed, 88 insertions(+), 36 deletions(-)

diff --git a/fluss-rust/crates/examples/Cargo.toml b/fluss-rust/crates/examples/Cargo.toml
index 26251cc721..b9187395a4 100644
--- a/fluss-rust/crates/examples/Cargo.toml
+++ b/fluss-rust/crates/examples/Cargo.toml
@@ -27,6 +27,10 @@ version = { workspace = true }
 fluss = { workspace = true, features = ["storage-all"] }
 tokio = { workspace = true }
 clap = { workspace = true }
+
+[target.'cfg(not(target_env = "msvc"))'.dependencies]
+tikv-jemallocator = "0.6"
+
 [[example]]
 name = "example-table"
 path = "src/example_table.rs"
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index e4ad1fbdfc..49f0ab4c6f 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -15,6 +15,10 @@
 // specific language governing permissions and limitations
 // under the License.
 
+#[cfg(not(target_env = "msvc"))]
+#[global_allocator]
+static GLOBAL: tikv_jemallocator::Jemalloc = tikv_jemallocator::Jemalloc;
+
 mod example_kv_table;
 mod example_partitioned_kv_table;
 
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index db1348a086..c0ba6f8dc8 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -80,6 +80,5 @@ jiff = { workspace = true, features = ["js"] }
 testcontainers = "0.25.0"
 test-env-helpers = "0.2.2"
 
-
 [build-dependencies]
 prost-build = { version = "0.14" }
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index cd060c8e45..13e85981c0 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -101,6 +101,25 @@
 //!     Ok(())
 //! }
 //! ```
+//!
+//! # Performance
+//!
+//! For production deployments on Linux, we recommend using
+//! [jemalloc](https://crates.io/crates/tikv-jemallocator) as the global allocator.
+//! The default glibc allocator (ptmalloc2) can cause RSS bloat and fragmentation under
+//! sustained write loads due to repeated same-size alloc/free cycles in Arrow batch building.
+//! jemalloc's thread-local size-class bins handle this pattern efficiently.
+//!
+//! ```toml
+//! [target.'cfg(not(target_env = "msvc"))'.dependencies]
+//! tikv-jemallocator = "0.6"
+//! ```
+//!
+//! ```rust,ignore
+//! #[cfg(not(target_env = "msvc"))]
+//! #[global_allocator]
+//! static GLOBAL: tikv_jemallocator::Jemalloc = tikv_jemallocator::Jemalloc;
+//! ```
 
 pub mod client;
 pub mod metadata;
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index ea27836e52..7fd16194f7 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -151,8 +151,13 @@ pub const NO_BATCH_SEQUENCE: i32 = -1;
 
 pub const BUILDER_DEFAULT_OFFSET: i64 = 0;
 
+// TODO: Switch to byte-size-based is_full() like Java's ArrowWriter instead of a hard record cap.
 pub const DEFAULT_MAX_RECORD: i32 = 256;
 
+/// Estimated average byte size for variable-width columns (Utf8, Binary).
+/// Used to pre-allocate data buffers and avoid reallocations during batch building.
+const VARIABLE_WIDTH_AVG_BYTES: usize = 64;
+
 pub struct MemoryLogRecordsArrowBuilder {
     base_log_offset: i64,
     schema_id: i32,
@@ -236,11 +241,12 @@ pub struct RowAppendRecordBatchBuilder {
 
 impl RowAppendRecordBatchBuilder {
     pub fn new(row_type: &RowType) -> Result<Self> {
+        let capacity = DEFAULT_MAX_RECORD as usize;
         let schema_ref = to_arrow_schema(row_type)?;
         let builders: Result<Vec<_>> = schema_ref
             .fields()
             .iter()
-            .map(|field| Self::create_builder(field.data_type()))
+            .map(|field| Self::create_builder(field.data_type(), capacity))
             .collect();
         let field_getters = FieldGetter::create_field_getters(row_type);
         Ok(Self {
@@ -251,26 +257,41 @@ impl RowAppendRecordBatchBuilder {
         })
     }
 
-    fn create_builder(data_type: &arrow_schema::DataType) -> Result<Box<dyn ArrayBuilder>> {
+    fn create_builder(
+        data_type: &arrow_schema::DataType,
+        capacity: usize,
+    ) -> Result<Box<dyn ArrayBuilder>> {
         match data_type {
-            arrow_schema::DataType::Int8 => Ok(Box::new(Int8Builder::new())),
-            arrow_schema::DataType::Int16 => Ok(Box::new(Int16Builder::new())),
-            arrow_schema::DataType::Int32 => Ok(Box::new(Int32Builder::new())),
-            arrow_schema::DataType::Int64 => Ok(Box::new(Int64Builder::new())),
-            arrow_schema::DataType::UInt8 => Ok(Box::new(UInt8Builder::new())),
-            arrow_schema::DataType::UInt16 => Ok(Box::new(UInt16Builder::new())),
-            arrow_schema::DataType::UInt32 => Ok(Box::new(UInt32Builder::new())),
-            arrow_schema::DataType::UInt64 => Ok(Box::new(UInt64Builder::new())),
-            arrow_schema::DataType::Float32 => Ok(Box::new(Float32Builder::new())),
-            arrow_schema::DataType::Float64 => Ok(Box::new(Float64Builder::new())),
-            arrow_schema::DataType::Boolean => Ok(Box::new(BooleanBuilder::new())),
-            arrow_schema::DataType::Utf8 => Ok(Box::new(StringBuilder::new())),
-            arrow_schema::DataType::Binary => Ok(Box::new(BinaryBuilder::new())),
-            arrow_schema::DataType::FixedSizeBinary(size) => {
-                Ok(Box::new(FixedSizeBinaryBuilder::new(*size)))
+            arrow_schema::DataType::Int8 => Ok(Box::new(Int8Builder::with_capacity(capacity))),
+            arrow_schema::DataType::Int16 => Ok(Box::new(Int16Builder::with_capacity(capacity))),
+            arrow_schema::DataType::Int32 => Ok(Box::new(Int32Builder::with_capacity(capacity))),
+            arrow_schema::DataType::Int64 => Ok(Box::new(Int64Builder::with_capacity(capacity))),
+            arrow_schema::DataType::UInt8 => Ok(Box::new(UInt8Builder::with_capacity(capacity))),
+            arrow_schema::DataType::UInt16 => Ok(Box::new(UInt16Builder::with_capacity(capacity))),
+            arrow_schema::DataType::UInt32 => Ok(Box::new(UInt32Builder::with_capacity(capacity))),
+            arrow_schema::DataType::UInt64 => Ok(Box::new(UInt64Builder::with_capacity(capacity))),
+            arrow_schema::DataType::Float32 => {
+                Ok(Box::new(Float32Builder::with_capacity(capacity)))
+            }
+            arrow_schema::DataType::Float64 => {
+                Ok(Box::new(Float64Builder::with_capacity(capacity)))
+            }
+            arrow_schema::DataType::Boolean => {
+                Ok(Box::new(BooleanBuilder::with_capacity(capacity)))
             }
+            arrow_schema::DataType::Utf8 => Ok(Box::new(StringBuilder::with_capacity(
+                capacity,
+                capacity * VARIABLE_WIDTH_AVG_BYTES,
+            ))),
+            arrow_schema::DataType::Binary => Ok(Box::new(BinaryBuilder::with_capacity(
+                capacity,
+                capacity * VARIABLE_WIDTH_AVG_BYTES,
+            ))),
+            arrow_schema::DataType::FixedSizeBinary(size) => Ok(Box::new(
+                FixedSizeBinaryBuilder::with_capacity(capacity, *size),
+            )),
             arrow_schema::DataType::Decimal128(precision, scale) => {
-                let builder = Decimal128Builder::new()
+                let builder = Decimal128Builder::with_capacity(capacity)
                     .with_precision_and_scale(*precision, *scale)
                     .map_err(|e| Error::IllegalArgument {
                         message: format!(
@@ -279,11 +300,13 @@ impl RowAppendRecordBatchBuilder {
                     })?;
                 Ok(Box::new(builder))
             }
-            arrow_schema::DataType::Date32 => Ok(Box::new(Date32Builder::new())),
+            arrow_schema::DataType::Date32 => Ok(Box::new(Date32Builder::with_capacity(capacity))),
             arrow_schema::DataType::Time32(unit) => match unit {
-                arrow_schema::TimeUnit::Second => Ok(Box::new(Time32SecondBuilder::new())),
+                arrow_schema::TimeUnit::Second => {
+                    Ok(Box::new(Time32SecondBuilder::with_capacity(capacity)))
+                }
                 arrow_schema::TimeUnit::Millisecond => {
-                    Ok(Box::new(Time32MillisecondBuilder::new()))
+                    Ok(Box::new(Time32MillisecondBuilder::with_capacity(capacity)))
                 }
                 _ => Err(Error::IllegalArgument {
                     message: format!(
@@ -293,9 +316,11 @@ impl RowAppendRecordBatchBuilder {
             },
             arrow_schema::DataType::Time64(unit) => match unit {
                 arrow_schema::TimeUnit::Microsecond => {
-                    Ok(Box::new(Time64MicrosecondBuilder::new()))
+                    Ok(Box::new(Time64MicrosecondBuilder::with_capacity(capacity)))
+                }
+                arrow_schema::TimeUnit::Nanosecond => {
+                    Ok(Box::new(Time64NanosecondBuilder::with_capacity(capacity)))
                 }
-                arrow_schema::TimeUnit::Nanosecond => Ok(Box::new(Time64NanosecondBuilder::new())),
                 _ => Err(Error::IllegalArgument {
                     message: format!(
                         "Time64 only supports Microsecond and Nanosecond units, got: {unit:?}"
@@ -303,17 +328,17 @@ impl RowAppendRecordBatchBuilder {
                 }),
             },
             arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Second, _) => {
-                Ok(Box::new(TimestampSecondBuilder::new()))
-            }
-            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Millisecond, _) => {
-                Ok(Box::new(TimestampMillisecondBuilder::new()))
-            }
-            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Microsecond, _) => {
-                Ok(Box::new(TimestampMicrosecondBuilder::new()))
-            }
-            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, _) => {
-                Ok(Box::new(TimestampNanosecondBuilder::new()))
+                Ok(Box::new(TimestampSecondBuilder::with_capacity(capacity)))
             }
+            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Millisecond, _) => Ok(
+                Box::new(TimestampMillisecondBuilder::with_capacity(capacity)),
+            ),
+            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Microsecond, _) => Ok(
+                Box::new(TimestampMicrosecondBuilder::with_capacity(capacity)),
+            ),
+            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, _) => Ok(
+                Box::new(TimestampNanosecondBuilder::with_capacity(capacity)),
+            ),
             dt => Err(Error::IllegalArgument {
                 message: format!("Unsupported data type: {dt:?}"),
             }),
@@ -1701,7 +1726,8 @@ mod tests {
 
         // Test valid builder creation with precision=10, scale=2
         let mut builder =
-            RowAppendRecordBatchBuilder::create_builder(&ArrowDataType::Decimal128(10, 2)).unwrap();
+            RowAppendRecordBatchBuilder::create_builder(&ArrowDataType::Decimal128(10, 2), 256)
+                .unwrap();
         let decimal_builder = builder
             .as_any_mut()
             .downcast_mut::<Decimal128Builder>()
@@ -1712,7 +1738,7 @@ mod tests {
 
         // Test error case: invalid precision/scale
         let result =
-            RowAppendRecordBatchBuilder::create_builder(&ArrowDataType::Decimal128(100, 50));
+            RowAppendRecordBatchBuilder::create_builder(&ArrowDataType::Decimal128(100, 50), 256);
         assert!(result.is_err());
     }
 

From e3316f6a12e823db881c2de5c80bb286a8706fda Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 8 Mar 2026 10:37:15 +0000
Subject: [PATCH 193/287] ci: parallelize python integration tests (#435)

---
 .../workflows/build_and_test_python.yml       |   4 +-
 fluss-rust/.gitignore                         |   2 +
 fluss-rust/bindings/python/pyproject.toml     |   1 +
 fluss-rust/bindings/python/test/conftest.py   | 218 +++++++++++++-----
 4 files changed, 170 insertions(+), 55 deletions(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index efb5caabdd..39dfa98047 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -73,9 +73,9 @@ jobs:
           uv sync --extra dev
           uv run maturin develop
 
-      - name: Run Python integration tests
+      - name: Run Python integration tests (parallel)
         working-directory: bindings/python
-        run: uv run pytest test/ -v
+        run: uv run pytest test/ -v -n auto
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
diff --git a/fluss-rust/.gitignore b/fluss-rust/.gitignore
index f251aab32d..5d11a1c080 100644
--- a/fluss-rust/.gitignore
+++ b/fluss-rust/.gitignore
@@ -25,6 +25,8 @@ __pycache__/
 *.py[cod]
 *$py.class
 *.so
+*.dylib
+*.dSYM/
 *.egg-info/
 dist/
 build/
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index f5b0b68d62..63af88e4ed 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -50,6 +50,7 @@ dev = [
     "mypy>=1.17.1",
     "pytest>=8.3.5",
     "pytest-asyncio>=0.25.3",
+    "pytest-xdist>=3.5.0",
     "ruff>=0.9.10",
     "maturin>=1.8.2",
     "testcontainers>=4.0.0",
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
index bb8d18b9cd..0e4cfe41b7 100644
--- a/fluss-rust/bindings/python/test/conftest.py
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -20,14 +20,27 @@
 If FLUSS_BOOTSTRAP_SERVERS is set, tests connect to an existing cluster.
 Otherwise, a Fluss cluster is started automatically via testcontainers.
 
+The first pytest-xdist worker to run starts the cluster; other workers
+detect it via port check and reuse it (matching the C++ test pattern).
+Containers are cleaned up after all workers finish via pytest_unconfigure.
+
 Run with:
-    uv run maturin develop && uv run pytest test/ -v
+    uv run maturin develop && uv run pytest test/ -v -n auto
 """
 
+import asyncio
 import os
 import socket
+import subprocess
 import time
 
+# Disable testcontainers Ryuk reaper for xdist runs — it would kill
+# containers when the first worker exits, while others are still running.
+# We handle cleanup ourselves in pytest_unconfigure.
+# In single-process mode, keep Ryuk as a safety net for hard crashes.
+if "PYTEST_XDIST_WORKER" in os.environ:
+    os.environ.setdefault("TESTCONTAINERS_RYUK_DISABLED", "true")
+
 import pytest
 import pytest_asyncio
 
@@ -37,6 +50,20 @@
 FLUSS_VERSION = "0.9.0-incubating"
 BOOTSTRAP_SERVERS_ENV = os.environ.get("FLUSS_BOOTSTRAP_SERVERS")
 
+# Container / network names
+NETWORK_NAME = "fluss-python-test-network"
+ZOOKEEPER_NAME = "zookeeper-python-test"
+COORDINATOR_NAME = "coordinator-server-python-test"
+TABLET_SERVER_NAME = "tablet-server-python-test"
+
+# Fixed host ports (must match across workers)
+COORDINATOR_PORT = 9123
+TABLET_SERVER_PORT = 9124
+PLAIN_CLIENT_PORT = 9223
+PLAIN_CLIENT_TABLET_PORT = 9224
+
+ALL_PORTS = [COORDINATOR_PORT, TABLET_SERVER_PORT, PLAIN_CLIENT_PORT, PLAIN_CLIENT_TABLET_PORT]
+
 
 def _wait_for_port(host, port, timeout=60):
     """Wait for a TCP port to become available."""
@@ -44,40 +71,56 @@ def _wait_for_port(host, port, timeout=60):
     while time.time() - start < timeout:
         try:
             with socket.create_connection((host, port), timeout=1):
-                return
+                return True
         except (ConnectionRefusedError, TimeoutError, OSError):
             time.sleep(1)
-    raise TimeoutError(f"Port {port} on {host} not available after {timeout}s")
+    return False
 
 
-@pytest.fixture(scope="session")
-def fluss_cluster():
-    """Start a Fluss cluster using testcontainers, or use an existing one."""
-    if BOOTSTRAP_SERVERS_ENV:
-        yield (BOOTSTRAP_SERVERS_ENV, BOOTSTRAP_SERVERS_ENV)
+def _all_ports_ready(timeout=60):
+    """Wait for all cluster ports to become available."""
+    deadline = time.time() + timeout
+    for port in ALL_PORTS:
+        remaining = deadline - time.time()
+        if remaining <= 0 or not _wait_for_port("localhost", port, timeout=remaining):
+            return False
+    return True
+
+
+def _run_cmd(cmd):
+    """Run a command (list form), return exit code."""
+    return subprocess.run(cmd, capture_output=True).returncode
+
+
+def _start_cluster():
+    """Start the Fluss Docker cluster via testcontainers.
+
+    If another worker already started the cluster (detected via port check),
+    reuse it. If container creation fails (name conflict from a racing worker),
+    wait for the other worker's cluster to become ready.
+    """
+    # Reuse cluster started by another parallel worker or previous run.
+    if _wait_for_port("localhost", PLAIN_CLIENT_PORT, timeout=1):
+        print("Reusing existing cluster via port check.")
         return
 
     from testcontainers.core.container import DockerContainer
-    from testcontainers.core.network import Network
 
-    network = Network()
-    network.create()
+    print("Starting Fluss cluster via testcontainers...")
 
-    zookeeper = (
-        DockerContainer("zookeeper:3.9.2")
-        .with_network(network)
-        .with_name("zookeeper-python-test")
-    )
+    # Create a named network via Docker CLI (idempotent, avoids orphaned
+    # random-named networks when multiple xdist workers race).
+    _run_cmd(["docker", "network", "create", NETWORK_NAME])
 
     sasl_jaas = (
         "org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required"
         ' user_admin="admin-secret" user_alice="alice-secret";'
     )
     coordinator_props = "\n".join([
-        "zookeeper.address: zookeeper-python-test:2181",
-        "bind.listeners: INTERNAL://coordinator-server-python-test:0,"
-        " CLIENT://coordinator-server-python-test:9123,"
-        " PLAIN_CLIENT://coordinator-server-python-test:9223",
+        f"zookeeper.address: {ZOOKEEPER_NAME}:2181",
+        f"bind.listeners: INTERNAL://{COORDINATOR_NAME}:0,"
+        f" CLIENT://{COORDINATOR_NAME}:9123,"
+        f" PLAIN_CLIENT://{COORDINATOR_NAME}:9223",
         "advertised.listeners: CLIENT://localhost:9123,"
         " PLAIN_CLIENT://localhost:9223",
         "internal.listener.name: INTERNAL",
@@ -87,21 +130,11 @@ def fluss_cluster():
         "netty.server.num-network-threads: 1",
         "netty.server.num-worker-threads: 3",
     ])
-    coordinator = (
-        DockerContainer(f"{FLUSS_IMAGE}:{FLUSS_VERSION}")
-        .with_network(network)
-        .with_name("coordinator-server-python-test")
-        .with_bind_ports(9123, 9123)
-        .with_bind_ports(9223, 9223)
-        .with_command("coordinatorServer")
-        .with_env("FLUSS_PROPERTIES", coordinator_props)
-    )
-
     tablet_props = "\n".join([
-        "zookeeper.address: zookeeper-python-test:2181",
-        "bind.listeners: INTERNAL://tablet-server-python-test:0,"
-        " CLIENT://tablet-server-python-test:9123,"
-        " PLAIN_CLIENT://tablet-server-python-test:9223",
+        f"zookeeper.address: {ZOOKEEPER_NAME}:2181",
+        f"bind.listeners: INTERNAL://{TABLET_SERVER_NAME}:0,"
+        f" CLIENT://{TABLET_SERVER_NAME}:9123,"
+        f" PLAIN_CLIENT://{TABLET_SERVER_NAME}:9223",
         "advertised.listeners: CLIENT://localhost:9124,"
         " PLAIN_CLIENT://localhost:9224",
         "internal.listener.name: INTERNAL",
@@ -112,42 +145,121 @@ def fluss_cluster():
         "netty.server.num-network-threads: 1",
         "netty.server.num-worker-threads: 3",
     ])
+
+    zookeeper = (
+        DockerContainer("zookeeper:3.9.2")
+        .with_kwargs(network=NETWORK_NAME)
+        .with_name(ZOOKEEPER_NAME)
+    )
+    coordinator = (
+        DockerContainer(f"{FLUSS_IMAGE}:{FLUSS_VERSION}")
+        .with_kwargs(network=NETWORK_NAME)
+        .with_name(COORDINATOR_NAME)
+        .with_bind_ports(9123, 9123)
+        .with_bind_ports(9223, 9223)
+        .with_command("coordinatorServer")
+        .with_env("FLUSS_PROPERTIES", coordinator_props)
+    )
     tablet_server = (
         DockerContainer(f"{FLUSS_IMAGE}:{FLUSS_VERSION}")
-        .with_network(network)
-        .with_name("tablet-server-python-test")
+        .with_kwargs(network=NETWORK_NAME)
+        .with_name(TABLET_SERVER_NAME)
         .with_bind_ports(9123, 9124)
         .with_bind_ports(9223, 9224)
         .with_command("tabletServer")
         .with_env("FLUSS_PROPERTIES", tablet_props)
     )
 
-    zookeeper.start()
-    coordinator.start()
-    tablet_server.start()
+    try:
+        zookeeper.start()
+        coordinator.start()
+        tablet_server.start()
+    except Exception as e:
+        # Another worker may have started containers with the same names.
+        # Wait for the cluster to become ready instead of failing.
+        print(f"Container start failed ({e}), waiting for cluster from another worker...")
+        if _all_ports_ready():
+            return
+        raise
 
-    _wait_for_port("localhost", 9123)
-    _wait_for_port("localhost", 9124)
-    _wait_for_port("localhost", 9223)
-    _wait_for_port("localhost", 9224)
-    # Extra wait for cluster to fully initialize
-    time.sleep(10)
+    if not _all_ports_ready():
+        raise RuntimeError("Cluster listeners did not become ready")
 
-    # (plaintext_bootstrap, sasl_bootstrap)
-    yield ("127.0.0.1:9223", "127.0.0.1:9123")
+    print("Fluss cluster started successfully.")
+
+
+def _stop_cluster():
+    """Stop and remove the Fluss Docker cluster containers."""
+    for name in [TABLET_SERVER_NAME, COORDINATOR_NAME, ZOOKEEPER_NAME]:
+        subprocess.run(["docker", "rm", "-f", name], capture_output=True)
+    subprocess.run(["docker", "network", "rm", NETWORK_NAME], capture_output=True)
+
+
+async def _connect_with_retry(bootstrap_servers, timeout=60):
+    """Connect to the Fluss cluster with retries until it's fully ready.
+
+    Waits until both the coordinator and at least one tablet server are
+    available, matching the Rust wait_for_cluster_ready pattern.
+    """
+    config = fluss.Config({"bootstrap.servers": bootstrap_servers})
+    start = time.time()
+    last_err = None
+    while time.time() - start < timeout:
+        conn = None
+        try:
+            conn = await fluss.FlussConnection.create(config)
+            admin = await conn.get_admin()
+            nodes = await admin.get_server_nodes()
+            if any(n.server_type == "TabletServer" for n in nodes):
+                return conn
+            last_err = RuntimeError("No TabletServer available yet")
+        except Exception as e:
+            last_err = e
+        if conn is not None:
+            conn.close()
+        await asyncio.sleep(1)
+    raise RuntimeError(
+        f"Could not connect to cluster after {timeout}s: {last_err}"
+    )
 
-    tablet_server.stop()
-    coordinator.stop()
-    zookeeper.stop()
-    network.remove()
+
+def pytest_unconfigure(config):
+    """Clean up Docker containers after all xdist workers finish.
+
+    Runs once on the controller process (or the single process when
+    not using xdist). Workers are identified by the 'workerinput' attr.
+    """
+    if BOOTSTRAP_SERVERS_ENV:
+        return
+    if hasattr(config, "workerinput"):
+        return  # This is a worker, skip
+    _stop_cluster()
+
+
+@pytest.fixture(scope="session")
+def fluss_cluster():
+    """Start a Fluss cluster using testcontainers, or use an existing one."""
+    if BOOTSTRAP_SERVERS_ENV:
+        sasl_env = os.environ.get(
+            "FLUSS_SASL_BOOTSTRAP_SERVERS", BOOTSTRAP_SERVERS_ENV
+        )
+        yield (BOOTSTRAP_SERVERS_ENV, sasl_env)
+        return
+
+    _start_cluster()
+
+    # (plaintext_bootstrap, sasl_bootstrap)
+    yield (
+        f"127.0.0.1:{PLAIN_CLIENT_PORT}",
+        f"127.0.0.1:{COORDINATOR_PORT}",
+    )
 
 
 @pytest_asyncio.fixture(scope="session")
 async def connection(fluss_cluster):
     """Session-scoped connection to the Fluss cluster (plaintext)."""
     plaintext_addr, _sasl_addr = fluss_cluster
-    config = fluss.Config({"bootstrap.servers": plaintext_addr})
-    conn = await fluss.FlussConnection.create(config)
+    conn = await _connect_with_retry(plaintext_addr)
     yield conn
     conn.close()
 

From 1bf6d96b4b52d91438b14b46bb76e010c76fa41a Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Mon, 9 Mar 2026 02:43:03 +0100
Subject: [PATCH 194/287] ci: check tablet server availability (#437)

---
 fluss-rust/bindings/cpp/test/test_utils.h | 13 +++++++++++--
 1 file changed, 11 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/bindings/cpp/test/test_utils.h b/fluss-rust/bindings/cpp/test/test_utils.h
index f5b4971654..17a1da7684 100644
--- a/fluss-rust/bindings/cpp/test/test_utils.h
+++ b/fluss-rust/bindings/cpp/test/test_utils.h
@@ -306,8 +306,17 @@ class FlussTestEnvironment : public ::testing::Environment {
             if (result.Ok()) {
                 auto admin_result = connection_.GetAdmin(admin_);
                 if (admin_result.Ok()) {
-                    std::cout << "Connected to Fluss cluster." << std::endl;
-                    return;
+                    // Only report ready once GetServerNodes lists at least one TabletServer.
+                    std::vector<fluss::ServerNode> nodes;
+                    auto nodes_result = admin_.GetServerNodes(nodes);
+                    if (nodes_result.Ok() &&
+                        std::any_of(nodes.begin(), nodes.end(),
+                                    [](const fluss::ServerNode& n) {
+                                        return n.server_type == "TabletServer";
+                                    })) {
+                        std::cout << "Connected to Fluss cluster." << std::endl;
+                        return;
+                    }
                 }
             }
             std::cout << "Waiting for Fluss cluster to be ready..." << std::endl;

From 89e77ba058bb250973bfc6d70d78a4b835f9fa9b Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Wed, 11 Mar 2026 13:23:26 +0000
Subject: [PATCH 195/287] chore: refactor to typed Column Writers (#440)

---
 fluss-rust/crates/fluss/src/record/arrow.rs   | 169 +---
 .../crates/fluss/src/row/column_writer.rs     | 771 ++++++++++++++++++
 fluss-rust/crates/fluss/src/row/datum.rs      |  79 +-
 fluss-rust/crates/fluss/src/row/mod.rs        |   3 +-
 4 files changed, 848 insertions(+), 174 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/row/column_writer.rs

diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 7fd16194f7..a0dfc84a84 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -20,16 +20,9 @@ use crate::compression::ArrowCompressionInfo;
 use crate::error::{Error, Result};
 use crate::metadata::{DataType, RowType};
 use crate::record::{ChangeType, ScanRecord};
-use crate::row::field_getter::FieldGetter;
+use crate::row::column_writer::ColumnWriter;
 use crate::row::{ColumnarRow, InternalRow};
-use arrow::array::{
-    ArrayBuilder, ArrayRef, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
-    FixedSizeBinaryBuilder, Float32Builder, Float64Builder, Int8Builder, Int16Builder,
-    Int32Builder, Int64Builder, StringBuilder, Time32MillisecondBuilder, Time32SecondBuilder,
-    Time64MicrosecondBuilder, Time64NanosecondBuilder, TimestampMicrosecondBuilder,
-    TimestampMillisecondBuilder, TimestampNanosecondBuilder, TimestampSecondBuilder, UInt8Builder,
-    UInt16Builder, UInt32Builder, UInt64Builder,
-};
+use arrow::array::{ArrayBuilder, ArrayRef};
 use arrow::{
     array::RecordBatch,
     buffer::Buffer,
@@ -154,10 +147,6 @@ pub const BUILDER_DEFAULT_OFFSET: i64 = 0;
 // TODO: Switch to byte-size-based is_full() like Java's ArrowWriter instead of a hard record cap.
 pub const DEFAULT_MAX_RECORD: i32 = 256;
 
-/// Estimated average byte size for variable-width columns (Utf8, Binary).
-/// Used to pre-allocate data buffers and avoid reallocations during batch building.
-const VARIABLE_WIDTH_AVG_BYTES: usize = 64;
-
 pub struct MemoryLogRecordsArrowBuilder {
     base_log_offset: i64,
     schema_id: i32,
@@ -234,8 +223,7 @@ impl ArrowRecordBatchInnerBuilder for PrebuiltRecordBatchBuilder {
 
 pub struct RowAppendRecordBatchBuilder {
     table_schema: SchemaRef,
-    arrow_column_builders: Vec<Box<dyn ArrayBuilder>>,
-    field_getters: Box<[FieldGetter]>,
+    column_writers: Vec<ColumnWriter>,
     records_count: i32,
 }
 
@@ -243,117 +231,31 @@ impl RowAppendRecordBatchBuilder {
     pub fn new(row_type: &RowType) -> Result<Self> {
         let capacity = DEFAULT_MAX_RECORD as usize;
         let schema_ref = to_arrow_schema(row_type)?;
-        let builders: Result<Vec<_>> = schema_ref
+        let writers: Result<Vec<_>> = row_type
             .fields()
             .iter()
-            .map(|field| Self::create_builder(field.data_type(), capacity))
+            .enumerate()
+            .map(|(pos, field)| {
+                let arrow_type = schema_ref.field(pos).data_type();
+                ColumnWriter::create(field.data_type(), arrow_type, pos, capacity)
+            })
             .collect();
-        let field_getters = FieldGetter::create_field_getters(row_type);
         Ok(Self {
             table_schema: schema_ref.clone(),
-            arrow_column_builders: builders?,
-            field_getters,
+            column_writers: writers?,
             records_count: 0,
         })
     }
-
-    fn create_builder(
-        data_type: &arrow_schema::DataType,
-        capacity: usize,
-    ) -> Result<Box<dyn ArrayBuilder>> {
-        match data_type {
-            arrow_schema::DataType::Int8 => Ok(Box::new(Int8Builder::with_capacity(capacity))),
-            arrow_schema::DataType::Int16 => Ok(Box::new(Int16Builder::with_capacity(capacity))),
-            arrow_schema::DataType::Int32 => Ok(Box::new(Int32Builder::with_capacity(capacity))),
-            arrow_schema::DataType::Int64 => Ok(Box::new(Int64Builder::with_capacity(capacity))),
-            arrow_schema::DataType::UInt8 => Ok(Box::new(UInt8Builder::with_capacity(capacity))),
-            arrow_schema::DataType::UInt16 => Ok(Box::new(UInt16Builder::with_capacity(capacity))),
-            arrow_schema::DataType::UInt32 => Ok(Box::new(UInt32Builder::with_capacity(capacity))),
-            arrow_schema::DataType::UInt64 => Ok(Box::new(UInt64Builder::with_capacity(capacity))),
-            arrow_schema::DataType::Float32 => {
-                Ok(Box::new(Float32Builder::with_capacity(capacity)))
-            }
-            arrow_schema::DataType::Float64 => {
-                Ok(Box::new(Float64Builder::with_capacity(capacity)))
-            }
-            arrow_schema::DataType::Boolean => {
-                Ok(Box::new(BooleanBuilder::with_capacity(capacity)))
-            }
-            arrow_schema::DataType::Utf8 => Ok(Box::new(StringBuilder::with_capacity(
-                capacity,
-                capacity * VARIABLE_WIDTH_AVG_BYTES,
-            ))),
-            arrow_schema::DataType::Binary => Ok(Box::new(BinaryBuilder::with_capacity(
-                capacity,
-                capacity * VARIABLE_WIDTH_AVG_BYTES,
-            ))),
-            arrow_schema::DataType::FixedSizeBinary(size) => Ok(Box::new(
-                FixedSizeBinaryBuilder::with_capacity(capacity, *size),
-            )),
-            arrow_schema::DataType::Decimal128(precision, scale) => {
-                let builder = Decimal128Builder::with_capacity(capacity)
-                    .with_precision_and_scale(*precision, *scale)
-                    .map_err(|e| Error::IllegalArgument {
-                        message: format!(
-                            "Invalid decimal precision {precision} or scale {scale}: {e}"
-                        ),
-                    })?;
-                Ok(Box::new(builder))
-            }
-            arrow_schema::DataType::Date32 => Ok(Box::new(Date32Builder::with_capacity(capacity))),
-            arrow_schema::DataType::Time32(unit) => match unit {
-                arrow_schema::TimeUnit::Second => {
-                    Ok(Box::new(Time32SecondBuilder::with_capacity(capacity)))
-                }
-                arrow_schema::TimeUnit::Millisecond => {
-                    Ok(Box::new(Time32MillisecondBuilder::with_capacity(capacity)))
-                }
-                _ => Err(Error::IllegalArgument {
-                    message: format!(
-                        "Time32 only supports Second and Millisecond units, got: {unit:?}"
-                    ),
-                }),
-            },
-            arrow_schema::DataType::Time64(unit) => match unit {
-                arrow_schema::TimeUnit::Microsecond => {
-                    Ok(Box::new(Time64MicrosecondBuilder::with_capacity(capacity)))
-                }
-                arrow_schema::TimeUnit::Nanosecond => {
-                    Ok(Box::new(Time64NanosecondBuilder::with_capacity(capacity)))
-                }
-                _ => Err(Error::IllegalArgument {
-                    message: format!(
-                        "Time64 only supports Microsecond and Nanosecond units, got: {unit:?}"
-                    ),
-                }),
-            },
-            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Second, _) => {
-                Ok(Box::new(TimestampSecondBuilder::with_capacity(capacity)))
-            }
-            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Millisecond, _) => Ok(
-                Box::new(TimestampMillisecondBuilder::with_capacity(capacity)),
-            ),
-            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Microsecond, _) => Ok(
-                Box::new(TimestampMicrosecondBuilder::with_capacity(capacity)),
-            ),
-            arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, _) => Ok(
-                Box::new(TimestampNanosecondBuilder::with_capacity(capacity)),
-            ),
-            dt => Err(Error::IllegalArgument {
-                message: format!("Unsupported data type: {dt:?}"),
-            }),
-        }
-    }
 }
 
 impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
     fn build_arrow_record_batch(&mut self) -> Result<Arc<RecordBatch>> {
         let arrays: Result<Vec<ArrayRef>> = self
-            .arrow_column_builders
+            .column_writers
             .iter_mut()
             .enumerate()
-            .map(|(idx, b)| {
-                let array = b.finish();
+            .map(|(idx, writer)| {
+                let array = writer.finish();
                 let expected_type = self.table_schema.field(idx).data_type();
 
                 // Validate array type matches schema
@@ -379,17 +281,8 @@ impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
     }
 
     fn append(&mut self, row: &dyn InternalRow) -> Result<bool> {
-        for (idx, getter) in self.field_getters.iter().enumerate() {
-            let datum = getter.get_field(row)?;
-            let field_type = self.table_schema.field(idx).data_type();
-            let builder =
-                self.arrow_column_builders
-                    .get_mut(idx)
-                    .ok_or_else(|| Error::UnexpectedError {
-                        message: format!("Column builder at index {idx} not found."),
-                        source: None,
-                    })?;
-            datum.append_to(builder, field_type)?;
+        for writer in &mut self.column_writers {
+            writer.write_field(row)?;
         }
         self.records_count += 1;
         Ok(true)
@@ -415,9 +308,9 @@ impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
         // Returns the uncompressed Arrow array memory size (same as Java's arrowWriter.estimatedSizeInBytes()).
         // Note: This is the size before compression. After build(), the actual size may be smaller
         // if compression is enabled.
-        self.arrow_column_builders
+        self.column_writers
             .iter()
-            .map(|builder| builder.finish_cloned().get_array_memory_size())
+            .map(|writer| writer.finish_cloned().get_array_memory_size())
             .sum()
     }
 }
@@ -1722,23 +1615,27 @@ mod tests {
 
     #[test]
     fn test_temporal_and_decimal_builder_validation() {
+        use crate::row::column_writer::ColumnWriter;
         use arrow::array::Array;
 
         // Test valid builder creation with precision=10, scale=2
-        let mut builder =
-            RowAppendRecordBatchBuilder::create_builder(&ArrowDataType::Decimal128(10, 2), 256)
-                .unwrap();
-        let decimal_builder = builder
-            .as_any_mut()
-            .downcast_mut::<Decimal128Builder>()
-            .expect("Expected Decimal128Builder");
-        // Verify precision and scale
-        let array = decimal_builder.finish();
+        let mut writer = ColumnWriter::create(
+            &DataTypes::decimal(10, 2),
+            &ArrowDataType::Decimal128(10, 2),
+            0,
+            256,
+        )
+        .unwrap();
+        let array = writer.finish();
         assert_eq!(array.data_type(), &ArrowDataType::Decimal128(10, 2));
 
-        // Test error case: invalid precision/scale
-        let result =
-            RowAppendRecordBatchBuilder::create_builder(&ArrowDataType::Decimal128(100, 50), 256);
+        // Test error case: invalid Arrow precision/scale (exceeds Arrow's limit)
+        let result = ColumnWriter::create(
+            &DataTypes::decimal(10, 2),
+            &ArrowDataType::Decimal128(100, 50),
+            0,
+            256,
+        );
         assert!(result.is_err());
     }
 
diff --git a/fluss-rust/crates/fluss/src/row/column_writer.rs b/fluss-rust/crates/fluss/src/row/column_writer.rs
new file mode 100644
index 0000000000..34dd0f5cc3
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/column_writer.rs
@@ -0,0 +1,771 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Typed column writers that write directly from [`InternalRow`] to concrete
+//! Arrow builders, bypassing the intermediate [`Datum`] enum and runtime
+//! `downcast_mut` dispatch.
+
+use crate::error::Error::RowConvertError;
+use crate::error::{Error, Result};
+use crate::metadata::DataType;
+use crate::row::InternalRow;
+use crate::row::datum::{
+    MICROS_PER_MILLI, MILLIS_PER_SECOND, NANOS_PER_MILLI, append_decimal_to_builder,
+    millis_nanos_to_micros, millis_nanos_to_nanos,
+};
+use arrow::array::{
+    ArrayBuilder, ArrayRef, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
+    FixedSizeBinaryBuilder, Float32Builder, Float64Builder, Int8Builder, Int16Builder,
+    Int32Builder, Int64Builder, StringBuilder, Time32MillisecondBuilder, Time32SecondBuilder,
+    Time64MicrosecondBuilder, Time64NanosecondBuilder, TimestampMicrosecondBuilder,
+    TimestampMillisecondBuilder, TimestampNanosecondBuilder, TimestampSecondBuilder,
+};
+use arrow_schema::DataType as ArrowDataType;
+
+/// Estimated average byte size for variable-width columns (Utf8, Binary).
+/// Used to pre-allocate data buffers and avoid reallocations during batch building.
+const VARIABLE_WIDTH_AVG_BYTES: usize = 64;
+
+/// A typed column writer that reads one column from an [`InternalRow`] and
+/// appends directly to a concrete Arrow builder — no intermediate [`Datum`],
+/// no `as_any_mut().downcast_mut()`.
+pub struct ColumnWriter {
+    pos: usize,
+    nullable: bool,
+    inner: TypedWriter,
+}
+
+enum TypedWriter {
+    Bool(BooleanBuilder),
+    Int8(Int8Builder),
+    Int16(Int16Builder),
+    Int32(Int32Builder),
+    Int64(Int64Builder),
+    Float32(Float32Builder),
+    Float64(Float64Builder),
+    Char {
+        len: usize,
+        builder: StringBuilder,
+    },
+    String(StringBuilder),
+    Bytes(BinaryBuilder),
+    Binary {
+        len: usize,
+        builder: FixedSizeBinaryBuilder,
+    },
+    Decimal128 {
+        src_precision: usize,
+        src_scale: usize,
+        target_precision: u32,
+        target_scale: i64,
+        builder: Decimal128Builder,
+    },
+    Date32(Date32Builder),
+    Time32Second(Time32SecondBuilder),
+    Time32Millisecond(Time32MillisecondBuilder),
+    Time64Microsecond(Time64MicrosecondBuilder),
+    Time64Nanosecond(Time64NanosecondBuilder),
+    TimestampNtzSecond {
+        precision: u32,
+        builder: TimestampSecondBuilder,
+    },
+    TimestampNtzMillisecond {
+        precision: u32,
+        builder: TimestampMillisecondBuilder,
+    },
+    TimestampNtzMicrosecond {
+        precision: u32,
+        builder: TimestampMicrosecondBuilder,
+    },
+    TimestampNtzNanosecond {
+        precision: u32,
+        builder: TimestampNanosecondBuilder,
+    },
+    TimestampLtzSecond {
+        precision: u32,
+        builder: TimestampSecondBuilder,
+    },
+    TimestampLtzMillisecond {
+        precision: u32,
+        builder: TimestampMillisecondBuilder,
+    },
+    TimestampLtzMicrosecond {
+        precision: u32,
+        builder: TimestampMicrosecondBuilder,
+    },
+    TimestampLtzNanosecond {
+        precision: u32,
+        builder: TimestampNanosecondBuilder,
+    },
+}
+
+/// Dispatch to the inner builder across all `TypedWriter` variants.
+/// Exhaustive matching ensures new variants won't compile without an arm.
+macro_rules! with_builder {
+    ($self:expr, $b:ident => $body:expr) => {
+        match $self {
+            TypedWriter::Bool($b) => $body,
+            TypedWriter::Int8($b) => $body,
+            TypedWriter::Int16($b) => $body,
+            TypedWriter::Int32($b) => $body,
+            TypedWriter::Int64($b) => $body,
+            TypedWriter::Float32($b) => $body,
+            TypedWriter::Float64($b) => $body,
+            TypedWriter::Char { builder: $b, .. } => $body,
+            TypedWriter::String($b) => $body,
+            TypedWriter::Bytes($b) => $body,
+            TypedWriter::Binary { builder: $b, .. } => $body,
+            TypedWriter::Decimal128 { builder: $b, .. } => $body,
+            TypedWriter::Date32($b) => $body,
+            TypedWriter::Time32Second($b) => $body,
+            TypedWriter::Time32Millisecond($b) => $body,
+            TypedWriter::Time64Microsecond($b) => $body,
+            TypedWriter::Time64Nanosecond($b) => $body,
+            TypedWriter::TimestampNtzSecond { builder: $b, .. } => $body,
+            TypedWriter::TimestampNtzMillisecond { builder: $b, .. } => $body,
+            TypedWriter::TimestampNtzMicrosecond { builder: $b, .. } => $body,
+            TypedWriter::TimestampNtzNanosecond { builder: $b, .. } => $body,
+            TypedWriter::TimestampLtzSecond { builder: $b, .. } => $body,
+            TypedWriter::TimestampLtzMillisecond { builder: $b, .. } => $body,
+            TypedWriter::TimestampLtzMicrosecond { builder: $b, .. } => $body,
+            TypedWriter::TimestampLtzNanosecond { builder: $b, .. } => $body,
+        }
+    };
+}
+
+impl ColumnWriter {
+    /// Create a column writer for the given Fluss `DataType` and Arrow
+    /// `ArrowDataType` at position `pos` with the given pre-allocation
+    /// `capacity`.
+    pub fn create(
+        fluss_type: &DataType,
+        arrow_type: &ArrowDataType,
+        pos: usize,
+        capacity: usize,
+    ) -> Result<Self> {
+        let nullable = fluss_type.is_nullable();
+
+        let inner = match fluss_type {
+            DataType::Boolean(_) => TypedWriter::Bool(BooleanBuilder::with_capacity(capacity)),
+            DataType::TinyInt(_) => TypedWriter::Int8(Int8Builder::with_capacity(capacity)),
+            DataType::SmallInt(_) => TypedWriter::Int16(Int16Builder::with_capacity(capacity)),
+            DataType::Int(_) => TypedWriter::Int32(Int32Builder::with_capacity(capacity)),
+            DataType::BigInt(_) => TypedWriter::Int64(Int64Builder::with_capacity(capacity)),
+            DataType::Float(_) => TypedWriter::Float32(Float32Builder::with_capacity(capacity)),
+            DataType::Double(_) => TypedWriter::Float64(Float64Builder::with_capacity(capacity)),
+            DataType::Char(t) => TypedWriter::Char {
+                len: t.length() as usize,
+                builder: StringBuilder::with_capacity(
+                    capacity,
+                    capacity.saturating_mul(VARIABLE_WIDTH_AVG_BYTES),
+                ),
+            },
+            DataType::String(_) => TypedWriter::String(StringBuilder::with_capacity(
+                capacity,
+                capacity.saturating_mul(VARIABLE_WIDTH_AVG_BYTES),
+            )),
+            DataType::Bytes(_) => TypedWriter::Bytes(BinaryBuilder::with_capacity(
+                capacity,
+                capacity.saturating_mul(VARIABLE_WIDTH_AVG_BYTES),
+            )),
+            DataType::Binary(t) => {
+                let arrow_len: i32 = t.length().try_into().map_err(|_| Error::IllegalArgument {
+                    message: format!(
+                        "Binary length {} exceeds Arrow's maximum (i32::MAX)",
+                        t.length()
+                    ),
+                })?;
+                TypedWriter::Binary {
+                    len: t.length(),
+                    builder: FixedSizeBinaryBuilder::with_capacity(capacity, arrow_len),
+                }
+            }
+            DataType::Decimal(dt) => {
+                let (target_p, target_s) = match arrow_type {
+                    ArrowDataType::Decimal128(p, s) => (*p, *s),
+                    _ => {
+                        return Err(Error::IllegalArgument {
+                            message: format!(
+                                "Expected Decimal128 Arrow type for Decimal, got: {arrow_type:?}"
+                            ),
+                        });
+                    }
+                };
+                if target_s < 0 {
+                    return Err(Error::IllegalArgument {
+                        message: format!("Negative decimal scale {target_s} is not supported"),
+                    });
+                }
+                let builder = Decimal128Builder::with_capacity(capacity)
+                    .with_precision_and_scale(target_p, target_s)
+                    .map_err(|e| Error::IllegalArgument {
+                        message: format!(
+                            "Invalid decimal precision {target_p} or scale {target_s}: {e}"
+                        ),
+                    })?;
+                TypedWriter::Decimal128 {
+                    src_precision: dt.precision() as usize,
+                    src_scale: dt.scale() as usize,
+                    target_precision: target_p as u32,
+                    target_scale: target_s as i64,
+                    builder,
+                }
+            }
+            DataType::Date(_) => TypedWriter::Date32(Date32Builder::with_capacity(capacity)),
+            DataType::Time(_) => match arrow_type {
+                ArrowDataType::Time32(arrow_schema::TimeUnit::Second) => {
+                    TypedWriter::Time32Second(Time32SecondBuilder::with_capacity(capacity))
+                }
+                ArrowDataType::Time32(arrow_schema::TimeUnit::Millisecond) => {
+                    TypedWriter::Time32Millisecond(Time32MillisecondBuilder::with_capacity(
+                        capacity,
+                    ))
+                }
+                ArrowDataType::Time64(arrow_schema::TimeUnit::Microsecond) => {
+                    TypedWriter::Time64Microsecond(Time64MicrosecondBuilder::with_capacity(
+                        capacity,
+                    ))
+                }
+                ArrowDataType::Time64(arrow_schema::TimeUnit::Nanosecond) => {
+                    TypedWriter::Time64Nanosecond(Time64NanosecondBuilder::with_capacity(capacity))
+                }
+                _ => {
+                    return Err(Error::IllegalArgument {
+                        message: format!("Unsupported Arrow type for Time: {arrow_type:?}"),
+                    });
+                }
+            },
+            DataType::Timestamp(t) => {
+                let precision = t.precision();
+                match arrow_type {
+                    ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, _) => {
+                        TypedWriter::TimestampNtzSecond {
+                            precision,
+                            builder: TimestampSecondBuilder::with_capacity(capacity),
+                        }
+                    }
+                    ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, _) => {
+                        TypedWriter::TimestampNtzMillisecond {
+                            precision,
+                            builder: TimestampMillisecondBuilder::with_capacity(capacity),
+                        }
+                    }
+                    ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, _) => {
+                        TypedWriter::TimestampNtzMicrosecond {
+                            precision,
+                            builder: TimestampMicrosecondBuilder::with_capacity(capacity),
+                        }
+                    }
+                    ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, _) => {
+                        TypedWriter::TimestampNtzNanosecond {
+                            precision,
+                            builder: TimestampNanosecondBuilder::with_capacity(capacity),
+                        }
+                    }
+                    _ => {
+                        return Err(Error::IllegalArgument {
+                            message: format!(
+                                "Unsupported Arrow type for Timestamp: {arrow_type:?}"
+                            ),
+                        });
+                    }
+                }
+            }
+            DataType::TimestampLTz(t) => {
+                let precision = t.precision();
+                match arrow_type {
+                    ArrowDataType::Timestamp(arrow_schema::TimeUnit::Second, _) => {
+                        TypedWriter::TimestampLtzSecond {
+                            precision,
+                            builder: TimestampSecondBuilder::with_capacity(capacity),
+                        }
+                    }
+                    ArrowDataType::Timestamp(arrow_schema::TimeUnit::Millisecond, _) => {
+                        TypedWriter::TimestampLtzMillisecond {
+                            precision,
+                            builder: TimestampMillisecondBuilder::with_capacity(capacity),
+                        }
+                    }
+                    ArrowDataType::Timestamp(arrow_schema::TimeUnit::Microsecond, _) => {
+                        TypedWriter::TimestampLtzMicrosecond {
+                            precision,
+                            builder: TimestampMicrosecondBuilder::with_capacity(capacity),
+                        }
+                    }
+                    ArrowDataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, _) => {
+                        TypedWriter::TimestampLtzNanosecond {
+                            precision,
+                            builder: TimestampNanosecondBuilder::with_capacity(capacity),
+                        }
+                    }
+                    _ => {
+                        return Err(Error::IllegalArgument {
+                            message: format!(
+                                "Unsupported Arrow type for TimestampLTz: {arrow_type:?}"
+                            ),
+                        });
+                    }
+                }
+            }
+            _ => {
+                return Err(Error::IllegalArgument {
+                    message: format!("Unsupported Fluss DataType: {fluss_type:?}"),
+                });
+            }
+        };
+
+        Ok(Self {
+            pos,
+            nullable,
+            inner,
+        })
+    }
+
+    /// Read one value from `row` at this writer's column position and append it
+    /// directly to the concrete Arrow builder.
+    #[inline]
+    pub fn write_field(&mut self, row: &dyn InternalRow) -> Result<()> {
+        if self.nullable && row.is_null_at(self.pos)? {
+            self.append_null();
+            return Ok(());
+        }
+        self.write_non_null(row)
+    }
+
+    /// Finish the builder, producing the final Arrow array.
+    pub fn finish(&mut self) -> ArrayRef {
+        self.as_builder_mut().finish()
+    }
+
+    /// Clone-finish the builder for size estimation (does not reset the builder).
+    pub fn finish_cloned(&self) -> ArrayRef {
+        self.as_builder_ref().finish_cloned()
+    }
+
+    fn append_null(&mut self) {
+        with_builder!(&mut self.inner, b => b.append_null());
+    }
+
+    /// Returns a trait-object reference to the inner builder.
+    /// Used for type-agnostic operations (`finish`, `finish_cloned`).
+    fn as_builder_mut(&mut self) -> &mut dyn ArrayBuilder {
+        with_builder!(&mut self.inner, b => b)
+    }
+
+    fn as_builder_ref(&self) -> &dyn ArrayBuilder {
+        with_builder!(&self.inner, b => b)
+    }
+
+    #[inline]
+    fn write_non_null(&mut self, row: &dyn InternalRow) -> Result<()> {
+        let pos = self.pos;
+
+        match &mut self.inner {
+            TypedWriter::Bool(b) => {
+                b.append_value(row.get_boolean(pos)?);
+                Ok(())
+            }
+            TypedWriter::Int8(b) => {
+                b.append_value(row.get_byte(pos)?);
+                Ok(())
+            }
+            TypedWriter::Int16(b) => {
+                b.append_value(row.get_short(pos)?);
+                Ok(())
+            }
+            TypedWriter::Int32(b) => {
+                b.append_value(row.get_int(pos)?);
+                Ok(())
+            }
+            TypedWriter::Int64(b) => {
+                b.append_value(row.get_long(pos)?);
+                Ok(())
+            }
+            TypedWriter::Float32(b) => {
+                b.append_value(row.get_float(pos)?);
+                Ok(())
+            }
+            TypedWriter::Float64(b) => {
+                b.append_value(row.get_double(pos)?);
+                Ok(())
+            }
+            TypedWriter::Char { len, builder } => {
+                let v = row.get_char(pos, *len)?;
+                builder.append_value(v);
+                Ok(())
+            }
+            TypedWriter::String(b) => {
+                let v = row.get_string(pos)?;
+                b.append_value(v);
+                Ok(())
+            }
+            TypedWriter::Bytes(b) => {
+                let v = row.get_bytes(pos)?;
+                b.append_value(v);
+                Ok(())
+            }
+            TypedWriter::Binary { len, builder } => {
+                let v = row.get_binary(pos, *len)?;
+                builder.append_value(v).map_err(|e| RowConvertError {
+                    message: format!("Failed to append binary value: {e}"),
+                })?;
+                Ok(())
+            }
+            TypedWriter::Decimal128 {
+                src_precision,
+                src_scale,
+                target_precision,
+                target_scale,
+                builder,
+            } => {
+                let decimal = row.get_decimal(pos, *src_precision, *src_scale)?;
+                append_decimal_to_builder(&decimal, *target_precision, *target_scale, builder)
+            }
+            TypedWriter::Date32(b) => {
+                let date = row.get_date(pos)?;
+                b.append_value(date.get_inner());
+                Ok(())
+            }
+            TypedWriter::Time32Second(b) => {
+                let millis = row.get_time(pos)?.get_inner();
+                if millis % MILLIS_PER_SECOND as i32 != 0 {
+                    return Err(RowConvertError {
+                        message: format!(
+                            "Time value {millis} ms has sub-second precision but schema expects seconds only"
+                        ),
+                    });
+                }
+                b.append_value(millis / MILLIS_PER_SECOND as i32);
+                Ok(())
+            }
+            TypedWriter::Time32Millisecond(b) => {
+                b.append_value(row.get_time(pos)?.get_inner());
+                Ok(())
+            }
+            TypedWriter::Time64Microsecond(b) => {
+                let millis = row.get_time(pos)?.get_inner();
+                let micros = (millis as i64)
+                    .checked_mul(MICROS_PER_MILLI)
+                    .ok_or_else(|| RowConvertError {
+                        message: format!(
+                            "Time value {millis} ms overflows when converting to microseconds"
+                        ),
+                    })?;
+                b.append_value(micros);
+                Ok(())
+            }
+            TypedWriter::Time64Nanosecond(b) => {
+                let millis = row.get_time(pos)?.get_inner();
+                let nanos = (millis as i64)
+                    .checked_mul(NANOS_PER_MILLI)
+                    .ok_or_else(|| RowConvertError {
+                        message: format!(
+                            "Time value {millis} ms overflows when converting to nanoseconds"
+                        ),
+                    })?;
+                b.append_value(nanos);
+                Ok(())
+            }
+            // --- TimestampNtz variants ---
+            TypedWriter::TimestampNtzSecond {
+                precision, builder, ..
+            } => {
+                let ts = row.get_timestamp_ntz(pos, *precision)?;
+                builder.append_value(ts.get_millisecond() / MILLIS_PER_SECOND);
+                Ok(())
+            }
+            TypedWriter::TimestampNtzMillisecond {
+                precision, builder, ..
+            } => {
+                let ts = row.get_timestamp_ntz(pos, *precision)?;
+                builder.append_value(ts.get_millisecond());
+                Ok(())
+            }
+            TypedWriter::TimestampNtzMicrosecond {
+                precision, builder, ..
+            } => {
+                let ts = row.get_timestamp_ntz(pos, *precision)?;
+                builder.append_value(millis_nanos_to_micros(
+                    ts.get_millisecond(),
+                    ts.get_nano_of_millisecond(),
+                )?);
+                Ok(())
+            }
+            TypedWriter::TimestampNtzNanosecond {
+                precision, builder, ..
+            } => {
+                let ts = row.get_timestamp_ntz(pos, *precision)?;
+                builder.append_value(millis_nanos_to_nanos(
+                    ts.get_millisecond(),
+                    ts.get_nano_of_millisecond(),
+                )?);
+                Ok(())
+            }
+            // --- TimestampLtz variants ---
+            TypedWriter::TimestampLtzSecond {
+                precision, builder, ..
+            } => {
+                let ts = row.get_timestamp_ltz(pos, *precision)?;
+                builder.append_value(ts.get_epoch_millisecond() / MILLIS_PER_SECOND);
+                Ok(())
+            }
+            TypedWriter::TimestampLtzMillisecond {
+                precision, builder, ..
+            } => {
+                let ts = row.get_timestamp_ltz(pos, *precision)?;
+                builder.append_value(ts.get_epoch_millisecond());
+                Ok(())
+            }
+            TypedWriter::TimestampLtzMicrosecond {
+                precision, builder, ..
+            } => {
+                let ts = row.get_timestamp_ltz(pos, *precision)?;
+                builder.append_value(millis_nanos_to_micros(
+                    ts.get_epoch_millisecond(),
+                    ts.get_nano_of_millisecond(),
+                )?);
+                Ok(())
+            }
+            TypedWriter::TimestampLtzNanosecond {
+                precision, builder, ..
+            } => {
+                let ts = row.get_timestamp_ltz(pos, *precision)?;
+                builder.append_value(millis_nanos_to_nanos(
+                    ts.get_epoch_millisecond(),
+                    ts.get_nano_of_millisecond(),
+                )?);
+                Ok(())
+            }
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::DataTypes;
+    use crate::record::to_arrow_type;
+    use crate::row::{Date, Datum, GenericRow, Time, TimestampLtz, TimestampNtz};
+    use arrow::array::*;
+    use bigdecimal::BigDecimal;
+    use std::str::FromStr;
+
+    /// Helper: create a ColumnWriter from a Fluss DataType, deriving the Arrow type automatically.
+    fn writer_for(fluss_type: &DataType, capacity: usize) -> ColumnWriter {
+        let arrow_type = to_arrow_type(fluss_type).unwrap();
+        ColumnWriter::create(fluss_type, &arrow_type, 0, capacity).unwrap()
+    }
+
+    /// Helper: write a single datum and return the finished array.
+    fn write_one(fluss_type: &DataType, datum: Datum) -> ArrayRef {
+        let mut w = writer_for(fluss_type, 4);
+        w.write_field(&GenericRow::from_data(vec![datum])).unwrap();
+        w.finish()
+    }
+
+    #[test]
+    fn write_all_scalar_types() {
+        // Boolean
+        let arr = write_one(&DataTypes::boolean(), Datum::Bool(true));
+        assert!(
+            arr.as_any()
+                .downcast_ref::<BooleanArray>()
+                .unwrap()
+                .value(0)
+        );
+
+        // Integer types
+        let arr = write_one(&DataTypes::tinyint(), Datum::Int8(42));
+        assert_eq!(
+            arr.as_any().downcast_ref::<Int8Array>().unwrap().value(0),
+            42
+        );
+
+        let arr = write_one(&DataTypes::smallint(), Datum::Int16(1000));
+        assert_eq!(
+            arr.as_any().downcast_ref::<Int16Array>().unwrap().value(0),
+            1000
+        );
+
+        let arr = write_one(&DataTypes::int(), Datum::Int32(100_000));
+        assert_eq!(
+            arr.as_any().downcast_ref::<Int32Array>().unwrap().value(0),
+            100_000
+        );
+
+        let arr = write_one(&DataTypes::bigint(), Datum::Int64(9_000_000_000));
+        assert_eq!(
+            arr.as_any().downcast_ref::<Int64Array>().unwrap().value(0),
+            9_000_000_000
+        );
+
+        // Float types
+        let arr = write_one(&DataTypes::float(), Datum::Float32(1.5.into()));
+        assert!(
+            (arr.as_any()
+                .downcast_ref::<Float32Array>()
+                .unwrap()
+                .value(0)
+                - 1.5)
+                .abs()
+                < 0.001
+        );
+
+        let arr = write_one(&DataTypes::double(), Datum::Float64(1.125.into()));
+        assert!(
+            (arr.as_any()
+                .downcast_ref::<Float64Array>()
+                .unwrap()
+                .value(0)
+                - 1.125)
+                .abs()
+                < 0.001
+        );
+
+        // String / Char
+        let arr = write_one(&DataTypes::string(), Datum::String("hello".into()));
+        assert_eq!(
+            arr.as_any().downcast_ref::<StringArray>().unwrap().value(0),
+            "hello"
+        );
+
+        let arr = write_one(&DataTypes::char(10), Datum::String("world".into()));
+        assert_eq!(
+            arr.as_any().downcast_ref::<StringArray>().unwrap().value(0),
+            "world"
+        );
+
+        // Bytes / Binary
+        let arr = write_one(&DataTypes::bytes(), Datum::Blob(vec![1, 2, 3].into()));
+        assert_eq!(
+            arr.as_any().downcast_ref::<BinaryArray>().unwrap().value(0),
+            &[1, 2, 3]
+        );
+
+        let arr = write_one(
+            &DataTypes::binary(4),
+            Datum::Blob(vec![10, 20, 30, 40].into()),
+        );
+        assert_eq!(
+            arr.as_any()
+                .downcast_ref::<FixedSizeBinaryArray>()
+                .unwrap()
+                .value(0),
+            &[10, 20, 30, 40]
+        );
+
+        // Date
+        let arr = write_one(&DataTypes::date(), Datum::Date(Date::new(19000)));
+        assert_eq!(
+            arr.as_any().downcast_ref::<Date32Array>().unwrap().value(0),
+            19000
+        );
+
+        // Time (precision 3 → Millisecond)
+        let arr = write_one(
+            &DataTypes::time_with_precision(3),
+            Datum::Time(Time::new(45_000)),
+        );
+        assert_eq!(
+            arr.as_any()
+                .downcast_ref::<Time32MillisecondArray>()
+                .unwrap()
+                .value(0),
+            45_000
+        );
+
+        // Decimal
+        let decimal =
+            crate::row::Decimal::from_big_decimal(BigDecimal::from_str("123.45").unwrap(), 10, 2)
+                .unwrap();
+        let arr = write_one(&DataTypes::decimal(10, 2), Datum::Decimal(decimal));
+        assert_eq!(
+            arr.as_any()
+                .downcast_ref::<Decimal128Array>()
+                .unwrap()
+                .value(0),
+            12345
+        );
+
+        // Timestamp NTZ (precision 3 → Millisecond)
+        let arr = write_one(
+            &DataTypes::timestamp_with_precision(3),
+            Datum::TimestampNtz(TimestampNtz::new(1_700_000_000_000)),
+        );
+        assert_eq!(
+            arr.as_any()
+                .downcast_ref::<TimestampMillisecondArray>()
+                .unwrap()
+                .value(0),
+            1_700_000_000_000
+        );
+
+        // Timestamp LTZ (precision 3 → Millisecond)
+        let arr = write_one(
+            &DataTypes::timestamp_ltz_with_precision(3),
+            Datum::TimestampLtz(TimestampLtz::new(1_700_000_000_000)),
+        );
+        assert_eq!(
+            arr.as_any()
+                .downcast_ref::<TimestampMillisecondArray>()
+                .unwrap()
+                .value(0),
+            1_700_000_000_000
+        );
+    }
+
+    #[test]
+    fn write_null_and_multiple_rows() {
+        // Null
+        let arr = write_one(&DataTypes::int(), Datum::Null);
+        assert!(arr.is_null(0));
+
+        // Multiple rows
+        let mut w = writer_for(&DataTypes::int(), 8);
+        for val in [10, 20, 30] {
+            w.write_field(&GenericRow::from_data(vec![val])).unwrap();
+        }
+        let arr = w.finish();
+        let int_arr = arr.as_any().downcast_ref::<Int32Array>().unwrap();
+        assert_eq!(int_arr.len(), 3);
+        assert_eq!(int_arr.value(0), 10);
+        assert_eq!(int_arr.value(1), 20);
+        assert_eq!(int_arr.value(2), 30);
+
+        // finish_cloned does not reset
+        let mut w = writer_for(&DataTypes::int(), 4);
+        w.write_field(&GenericRow::from_data(vec![42_i32])).unwrap();
+        assert_eq!(w.finish_cloned().len(), 1);
+        w.write_field(&GenericRow::from_data(vec![99_i32])).unwrap();
+        let int_arr = w
+            .finish()
+            .as_any()
+            .downcast_ref::<Int32Array>()
+            .unwrap()
+            .clone();
+        assert_eq!((int_arr.value(0), int_arr.value(1)), (42, 99));
+    }
+
+    #[test]
+    fn unsupported_type_returns_error() {
+        let fluss_type = DataTypes::array(DataTypes::int());
+        let arrow_type = ArrowDataType::List(arrow_schema::FieldRef::new(
+            arrow_schema::Field::new("item", ArrowDataType::Int32, true),
+        ));
+        assert!(ColumnWriter::create(&fluss_type, &arrow_type, 0, 4).is_err());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index b370fb1d89..9b2e80a641 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -397,13 +397,13 @@ pub trait ToArrow {
 }
 
 // Time unit conversion constants
-const MILLIS_PER_SECOND: i64 = 1_000;
-const MICROS_PER_MILLI: i64 = 1_000;
-const NANOS_PER_MILLI: i64 = 1_000_000;
+pub(crate) const MILLIS_PER_SECOND: i64 = 1_000;
+pub(crate) const MICROS_PER_MILLI: i64 = 1_000;
+pub(crate) const NANOS_PER_MILLI: i64 = 1_000_000;
 
 /// Converts milliseconds and nanoseconds-within-millisecond to total microseconds.
 /// Returns an error if the conversion would overflow.
-fn millis_nanos_to_micros(millis: i64, nanos: i32) -> Result<i64> {
+pub(crate) fn millis_nanos_to_micros(millis: i64, nanos: i32) -> Result<i64> {
     let millis_micros = millis
         .checked_mul(MICROS_PER_MILLI)
         .ok_or_else(|| RowConvertError {
@@ -423,7 +423,7 @@ fn millis_nanos_to_micros(millis: i64, nanos: i32) -> Result<i64> {
 
 /// Converts milliseconds and nanoseconds-within-millisecond to total nanoseconds.
 /// Returns an error if the conversion would overflow.
-fn millis_nanos_to_nanos(millis: i64, nanos: i32) -> Result<i64> {
+pub(crate) fn millis_nanos_to_nanos(millis: i64, nanos: i32) -> Result<i64> {
     let millis_nanos = millis
         .checked_mul(NANOS_PER_MILLI)
         .ok_or_else(|| RowConvertError {
@@ -440,6 +440,42 @@ fn millis_nanos_to_nanos(millis: i64, nanos: i32) -> Result<i64> {
         })
 }
 
+/// Rescales a [`Decimal`] to the given Arrow target precision/scale and appends
+/// the resulting i128 to the builder.
+pub(crate) fn append_decimal_to_builder(
+    decimal: &Decimal,
+    target_precision: u32,
+    target_scale: i64,
+    builder: &mut Decimal128Builder,
+) -> Result<()> {
+    use bigdecimal::RoundingMode;
+
+    let bd = decimal.to_big_decimal();
+    let rescaled = bd.with_scale_round(target_scale, RoundingMode::HalfUp);
+    let (unscaled, _) = rescaled.as_bigint_and_exponent();
+
+    let actual_precision = Decimal::compute_precision(&unscaled);
+    if actual_precision > target_precision as usize {
+        return Err(RowConvertError {
+            message: format!(
+                "Decimal precision overflow: value has {actual_precision} digits but Arrow expects {target_precision} (value: {rescaled})"
+            ),
+        });
+    }
+
+    let i128_val: i128 = match unscaled.try_into() {
+        Ok(v) => v,
+        Err(_) => {
+            return Err(RowConvertError {
+                message: format!("Decimal value exceeds i128 range: {rescaled}"),
+            });
+        }
+    };
+
+    builder.append_value(i128_val);
+    Ok(())
+}
+
 trait AppendResult {
     fn into_append_result(self) -> Result<()>;
 }
@@ -539,45 +575,14 @@ impl Datum<'_> {
                     }
                 };
 
-                // Validate scale is non-negative (Fluss doesn't support negative scales)
                 if s < 0 {
                     return Err(RowConvertError {
                         message: format!("Negative decimal scale {s} is not supported"),
                     });
                 }
 
-                let target_precision = p as u32;
-                let target_scale = s as i64; // Safe now: 0..127 → 0i64..127i64
-
                 if let Some(b) = builder.as_any_mut().downcast_mut::<Decimal128Builder>() {
-                    use bigdecimal::RoundingMode;
-
-                    // Rescale the decimal to match Arrow's target scale
-                    let bd = decimal.to_big_decimal();
-                    let rescaled = bd.with_scale_round(target_scale, RoundingMode::HalfUp);
-                    let (unscaled, _) = rescaled.as_bigint_and_exponent();
-
-                    // Validate precision
-                    let actual_precision = Decimal::compute_precision(&unscaled);
-                    if actual_precision > target_precision as usize {
-                        return Err(RowConvertError {
-                            message: format!(
-                                "Decimal precision overflow: value has {actual_precision} digits but Arrow expects {target_precision} (value: {rescaled})"
-                            ),
-                        });
-                    }
-
-                    // Convert to i128 for Arrow
-                    let i128_val: i128 = match unscaled.try_into() {
-                        Ok(v) => v,
-                        Err(_) => {
-                            return Err(RowConvertError {
-                                message: format!("Decimal value exceeds i128 range: {rescaled}"),
-                            });
-                        }
-                    };
-
-                    b.append_value(i128_val);
+                    append_decimal_to_builder(decimal, p as u32, s as i64, b)?;
                     return Ok(());
                 }
 
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 8fb777d257..ef99ba297a 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -17,10 +17,11 @@
 
 mod column;
 
-mod datum;
+pub(crate) mod datum;
 mod decimal;
 
 pub mod binary;
+pub(crate) mod column_writer;
 pub mod compacted;
 pub mod encode;
 pub mod field_getter;

From 520c842b4c6610e7f2988d440526486af45b0901 Mon Sep 17 00:00:00 2001
From: XiaoHongbo <1346652787@qq.com>
Date: Wed, 11 Mar 2026 22:12:26 +0800
Subject: [PATCH 196/287] feat(python): add get_primary_keys() method to Schema
 class  (#436)

---------

Co-authored-by: xiaohongbo <xiaohongbo.xhb@alibaba-inc.com>
---
 fluss-rust/bindings/python/fluss/__init__.pyi |  1 +
 fluss-rust/bindings/python/src/metadata.rs    |  8 +++-
 fluss-rust/bindings/python/test/test_admin.py |  1 +
 .../bindings/python/test/test_schema.py       | 37 +++++++++++++++++++
 .../docs/user-guide/python/api-reference.md   |  2 +
 5 files changed, 48 insertions(+), 1 deletion(-)
 create mode 100644 fluss-rust/bindings/python/test/test_schema.py

diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 417ac9b2e9..e06e932756 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -775,6 +775,7 @@ class Schema:
     def get_column_names(self) -> List[str]: ...
     def get_column_types(self) -> List[str]: ...
     def get_columns(self) -> List[Tuple[str, str]]: ...
+    def get_primary_keys(self) -> List[str]: ...
     def __str__(self) -> str: ...
 
 class TableDescriptor:
diff --git a/fluss-rust/bindings/python/src/metadata.rs b/fluss-rust/bindings/python/src/metadata.rs
index d6b122d27b..02ef121dda 100644
--- a/fluss-rust/bindings/python/src/metadata.rs
+++ b/fluss-rust/bindings/python/src/metadata.rs
@@ -220,7 +220,13 @@ impl Schema {
             .collect()
     }
 
-    // TODO: support primaryKey
+    /// Get primary key column names, returns empty list if no primary key is defined
+    fn get_primary_keys(&self) -> Vec<String> {
+        self.__schema
+            .primary_key()
+            .map(|pk| pk.column_names().to_vec())
+            .unwrap_or_default()
+    }
 
     fn __str__(&self) -> String {
         format!("Schema: columns={:?}", self.get_columns())
diff --git a/fluss-rust/bindings/python/test/test_admin.py b/fluss-rust/bindings/python/test/test_admin.py
index e2f43431d5..646248d8d4 100644
--- a/fluss-rust/bindings/python/test/test_admin.py
+++ b/fluss-rust/bindings/python/test/test_admin.py
@@ -82,6 +82,7 @@ async def test_create_table(admin):
         ),
         primary_keys=["id"],
     )
+    assert schema.get_primary_keys() == ["id"]
 
     table_descriptor = fluss.TableDescriptor(
         schema,
diff --git a/fluss-rust/bindings/python/test/test_schema.py b/fluss-rust/bindings/python/test/test_schema.py
new file mode 100644
index 0000000000..a72d933453
--- /dev/null
+++ b/fluss-rust/bindings/python/test/test_schema.py
@@ -0,0 +1,37 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+"""Unit tests for Schema (no cluster required)."""
+
+import pyarrow as pa
+
+import fluss
+
+
+def test_get_primary_keys():
+    fields = pa.schema([
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+    ])
+
+    schema_with_pk = fluss.Schema(fields, primary_keys=["id"])
+    assert schema_with_pk.get_primary_keys() == ["id"]
+
+    schema_without_pk = fluss.Schema(fields)
+    assert schema_without_pk.get_primary_keys() == []
+
+
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index e9113b6974..fef10a8c5c 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -241,6 +241,8 @@ for record in scan_records:
 | `Schema(schema: pa.Schema, primary_keys=None)` | Create from PyArrow schema |
 | `.get_column_names() -> list[str]`             | Get column names           |
 | `.get_column_types() -> list[str]`             | Get column type names      |
+| `.get_columns() -> list[tuple[str, str]]`      | Get `(name, type)` pairs   |
+| `.get_primary_keys() -> list[str]`             | Get primary key columns    |
 
 ## `TableDescriptor`
 

From 0fe3978a6d14ab0b920eb74d741730690bc7fb4e Mon Sep 17 00:00:00 2001
From: Aryamaan Singh <71913204+toxicteddy00077@users.noreply.github.com>
Date: Wed, 11 Mar 2026 21:03:11 +0530
Subject: [PATCH 197/287] chore: added is_retriable() to FlussError (#422)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     | 15 ++++
 fluss-rust/bindings/python/fluss/__init__.pyi |  2 +
 fluss-rust/bindings/python/src/error.rs       | 10 +++
 fluss-rust/crates/fluss/src/error.rs          | 11 +++
 .../crates/fluss/src/rpc/fluss_api_error.rs   | 77 +++++++++++++++++++
 .../docs/user-guide/cpp/error-handling.md     | 47 +++++++++++
 .../docs/user-guide/python/error-handling.md  | 40 ++++++++++
 .../docs/user-guide/rust/error-handling.md    | 42 ++++++++++
 8 files changed, 244 insertions(+)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index b507da7229..d0da6173c8 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -180,6 +180,18 @@ struct ErrorCode {
     static constexpr int INVALID_ALTER_TABLE_EXCEPTION = 56;
     /// Deletion operations are disabled on this table.
     static constexpr int DELETION_DISABLED_EXCEPTION = 57;
+
+    /// Returns true if retrying the request may succeed. Mirrors Java's RetriableException hierarchy.
+    static constexpr bool IsRetriable(int32_t code) {
+        return code == NETWORK_EXCEPTION || code == CORRUPT_MESSAGE ||
+               code == SCHEMA_NOT_EXIST || code == LOG_STORAGE_EXCEPTION ||
+               code == KV_STORAGE_EXCEPTION || code == NOT_LEADER_OR_FOLLOWER ||
+               code == CORRUPT_RECORD_EXCEPTION ||
+               code == UNKNOWN_TABLE_OR_BUCKET_EXCEPTION || code == REQUEST_TIME_OUT ||
+               code == STORAGE_EXCEPTION ||
+               code == NOT_ENOUGH_REPLICAS_AFTER_APPEND_EXCEPTION ||
+               code == NOT_ENOUGH_REPLICAS_EXCEPTION || code == LEADER_NOT_AVAILABLE_EXCEPTION;
+    }
 };
 
 struct Date {
@@ -326,6 +338,9 @@ struct Result {
     std::string error_message;
 
     bool Ok() const { return error_code == 0; }
+
+    /// Returns true if retrying the request may succeed. Client-side errors always return false.
+    bool IsRetriable() const { return ErrorCode::IsRetriable(error_code); }
 };
 
 struct TablePath {
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index e06e932756..63be0e2cc6 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -837,6 +837,8 @@ class FlussError(Exception):
     error_code: int
     def __init__(self, message: str, error_code: int = -2) -> None: ...
     def __str__(self) -> str: ...
+    @property
+    def is_retriable(self) -> bool: ...
 
 class LakeSnapshot:
     def __init__(self, snapshot_id: int) -> None: ...
diff --git a/fluss-rust/bindings/python/src/error.rs b/fluss-rust/bindings/python/src/error.rs
index 606b9f4fd3..10c6cfa0ec 100644
--- a/fluss-rust/bindings/python/src/error.rs
+++ b/fluss-rust/bindings/python/src/error.rs
@@ -51,6 +51,16 @@ impl FlussError {
             format!("FlussError: {}", self.message)
         }
     }
+
+    /// Returns ``True`` if retrying the request may succeed. Client-side errors always return ``False``.
+    #[getter]
+    fn is_retriable(&self) -> bool {
+        use fluss::rpc::FlussError as CoreFlussError;
+        if self.error_code == CLIENT_ERROR_CODE {
+            return false;
+        }
+        CoreFlussError::for_code(self.error_code).is_retriable()
+    }
 }
 
 impl FlussError {
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index 5cf0d4b847..d56432c517 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -165,6 +165,17 @@ impl Error {
             None
         }
     }
+
+    /// Returns `true` if retrying the request may succeed.
+    /// [`Error::RpcError`] is always retriable; [`Error::FlussAPIError`] delegates to
+    /// [`ApiError::is_retriable`]; all other variants are not.
+    pub fn is_retriable(&self) -> bool {
+        match self {
+            Error::RpcError { .. } => true,
+            Error::FlussAPIError { api_error } => api_error.is_retriable(),
+            _ => false,
+        }
+    }
 }
 
 impl From<ArrowError> for Error {
diff --git a/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs b/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
index a501b9974e..95a39c6945 100644
--- a/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
+++ b/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
@@ -39,6 +39,13 @@ impl Display for ApiError {
     }
 }
 
+impl ApiError {
+    /// Returns `true` if retrying the request may succeed. Delegates to [`FlussError::is_retriable`].
+    pub fn is_retriable(&self) -> bool {
+        FlussError::for_code(self.code).is_retriable()
+    }
+}
+
 /// Fluss protocol errors. These errors are part of the client-server protocol.
 /// The error codes cannot be changed, but the names can be.
 ///
@@ -172,6 +179,25 @@ impl FlussError {
         *self as i32
     }
 
+    pub fn is_retriable(&self) -> bool {
+        matches!(
+            self,
+            FlussError::NetworkException
+                | FlussError::CorruptMessage
+                | FlussError::SchemaNotExist
+                | FlussError::LogStorageException
+                | FlussError::KvStorageException
+                | FlussError::NotLeaderOrFollower
+                | FlussError::CorruptRecordException
+                | FlussError::UnknownTableOrBucketException
+                | FlussError::RequestTimeOut
+                | FlussError::StorageException
+                | FlussError::NotEnoughReplicasAfterAppendException
+                | FlussError::NotEnoughReplicasException
+                | FlussError::LeaderNotAvailableException
+        )
+    }
+
     /// Returns a friendly description of the error.
     pub fn message(&self) -> &'static str {
         match self {
@@ -403,4 +429,55 @@ mod tests {
         let fluss_error = FlussError::from(api_error);
         assert_eq!(fluss_error, FlussError::TableNotExist);
     }
+
+    #[test]
+    fn is_retriable_known_retriable_errors() {
+        let retriable = [
+            FlussError::NetworkException,
+            FlussError::CorruptMessage,
+            FlussError::SchemaNotExist,
+            FlussError::LogStorageException,
+            FlussError::KvStorageException,
+            FlussError::NotLeaderOrFollower,
+            FlussError::CorruptRecordException,
+            FlussError::UnknownTableOrBucketException,
+            FlussError::RequestTimeOut,
+            FlussError::StorageException,
+            FlussError::NotEnoughReplicasAfterAppendException,
+            FlussError::NotEnoughReplicasException,
+            FlussError::LeaderNotAvailableException,
+        ];
+        for err in &retriable {
+            assert!(err.is_retriable(), "{err:?} should be retriable");
+        }
+    }
+
+    #[test]
+    fn is_retriable_known_non_retriable_errors() {
+        let non_retriable = [
+            FlussError::UnknownServerError,
+            FlussError::None,
+            FlussError::TableNotExist,
+            FlussError::AuthenticateException,
+            FlussError::AuthorizationException,
+            FlussError::RecordTooLargeException,
+            FlussError::DeletionDisabledException,
+            FlussError::InvalidCoordinatorException,
+            FlussError::FencedLeaderEpochException,
+            FlussError::FencedTieringEpochException,
+            FlussError::RetriableAuthenticateException,
+        ];
+        for err in &non_retriable {
+            assert!(!err.is_retriable(), "{err:?} should not be retriable");
+        }
+    }
+
+    #[test]
+    fn api_error_is_retriable_delegates_to_fluss_error() {
+        let retriable_api = FlussError::RequestTimeOut.to_api_error(None);
+        assert!(retriable_api.is_retriable());
+
+        let permanent_api = FlussError::TableNotExist.to_api_error(None);
+        assert!(!permanent_api.is_retriable());
+    }
 }
diff --git a/fluss-rust/website/docs/user-guide/cpp/error-handling.md b/fluss-rust/website/docs/user-guide/cpp/error-handling.md
index 3ded0c2d17..7447a264c7 100644
--- a/fluss-rust/website/docs/user-guide/cpp/error-handling.md
+++ b/fluss-rust/website/docs/user-guide/cpp/error-handling.md
@@ -98,6 +98,53 @@ if (!result.Ok()) {
 
 See `fluss::ErrorCode` in `fluss.hpp` for the full list of named constants.
 
+## Retry Logic
+
+Some errors are transient: the server may be temporarily unavailable, mid-election, or under load. Use `IsRetriable()` to decide whether to retry an operation rather than treating the error as permanent.
+
+`Result::IsRetriable()` is a member function available directly on the result of an operation:
+
+```cpp
+fluss::Result result = writer.Append(row);
+if (!result.Ok()) {
+    if (result.IsRetriable()) {
+        // Transient failure — safe to retry 
+    } else {
+        // Permanent failure — log and abort
+        std::cerr << "Fatal error (code " << result.error_code
+                  << "): " << result.error_message << std::endl;
+    }
+}
+```
+
+`Result::IsRetriable()` delegates to `ErrorCode::IsRetriable()`, so you can also call it directly on the code:
+
+```cpp
+if (fluss::ErrorCode::IsRetriable(result.error_code)) {
+    // retry
+}
+```
+
+### Retriable Error Codes
+
+| Constant                                                    | Code | Reason                                    |
+|-------------------------------------------------------------|------|-------------------------------------------|
+| `ErrorCode::NETWORK_EXCEPTION`                          | 1    | Server disconnected                       |
+| `ErrorCode::CORRUPT_MESSAGE`                            | 3    | CRC or size error                         |
+| `ErrorCode::SCHEMA_NOT_EXIST`                           | 9    | Schema may not exist                      |
+| `ErrorCode::LOG_STORAGE_EXCEPTION`                      | 10   | Transient log storage error               |
+| `ErrorCode::KV_STORAGE_EXCEPTION`                       | 11   | Transient KV storage error                |
+| `ErrorCode::NOT_LEADER_OR_FOLLOWER`                     | 12   | Leader election in progress               |
+| `ErrorCode::CORRUPT_RECORD_EXCEPTION`                   | 14   | Corrupt record                            |
+| `ErrorCode::UNKNOWN_TABLE_OR_BUCKET_EXCEPTION`          | 21   | Metadata not yet available                |
+| `ErrorCode::REQUEST_TIME_OUT`                           | 25   | Request timed out                         |
+| `ErrorCode::STORAGE_EXCEPTION`                          | 26   | Transient storage error                   |
+| `ErrorCode::NOT_ENOUGH_REPLICAS_AFTER_APPEND_EXCEPTION` | 28   | Wrote to server but with low ISR size     |
+| `ErrorCode::NOT_ENOUGH_REPLICAS_EXCEPTION`              | 29   | Low ISR size at write time                |
+| `ErrorCode::LEADER_NOT_AVAILABLE_EXCEPTION`             | 44   | No leader available for partition         |
+
+Client-side errors (`ErrorCode::CLIENT_ERROR`, code -2) always return `false` from `IsRetriable()`.
+
 ## Common Error Scenarios
 
 ### Connection Refused
diff --git a/fluss-rust/website/docs/user-guide/python/error-handling.md b/fluss-rust/website/docs/user-guide/python/error-handling.md
index 50a9e46be0..5bef366516 100644
--- a/fluss-rust/website/docs/user-guide/python/error-handling.md
+++ b/fluss-rust/website/docs/user-guide/python/error-handling.md
@@ -57,6 +57,46 @@ except fluss.FlussError as e:
 
 See `fluss.ErrorCode` for the full list of named constants.
 
+## Retry Logic
+
+Some errors are transient: the server may be temporarily unavailable, mid-election, or under load. Check `is_retriable` to decide whether to retry an operation instead of treating the error as permanent.
+
+`FlussError.is_retriable` is a property available directly on the exception:
+
+```python
+import fluss
+
+try:
+    await writer.append(row)
+except fluss.FlussError as e:
+    if e.is_retriable:
+        # Transient failure — safe to retry
+        pass
+    else:
+        # Permanent failure — log and abort
+        print(f"Fatal error (code {e.error_code}): {e.message}")
+```
+
+### Retriable Error Codes
+
+| Constant                                                     | Code | Reason                                    |
+|--------------------------------------------------------------|------|-------------------------------------------|
+| `ErrorCode.NETWORK_EXCEPTION`                               | 1    | Server disconnected                       |
+| `ErrorCode.CORRUPT_MESSAGE`                                 | 3    | CRC or size error                         |
+| `ErrorCode.SCHEMA_NOT_EXIST`                                | 9    | Schema may not exist                      |
+| `ErrorCode.LOG_STORAGE_EXCEPTION`                           | 10   | Transient log storage error               |
+| `ErrorCode.KV_STORAGE_EXCEPTION`                            | 11   | Transient KV storage error                |
+| `ErrorCode.NOT_LEADER_OR_FOLLOWER`                          | 12   | Leader election in progress               |
+| `ErrorCode.CORRUPT_RECORD_EXCEPTION`                        | 14   | Corrupt record                            |
+| `ErrorCode.UNKNOWN_TABLE_OR_BUCKET_EXCEPTION`               | 21   | Metadata not yet available                |
+| `ErrorCode.REQUEST_TIME_OUT`                                | 25   | Request timed out                         |
+| `ErrorCode.STORAGE_EXCEPTION`                               | 26   | Transient storage error                   |
+| `ErrorCode.NOT_ENOUGH_REPLICAS_AFTER_APPEND_EXCEPTION`      | 28   | Wrote to server but with low ISR size     |
+| `ErrorCode.NOT_ENOUGH_REPLICAS_EXCEPTION`                   | 29   | Low ISR size at write time                |
+| `ErrorCode.LEADER_NOT_AVAILABLE_EXCEPTION`                  | 44   | No leader available for partition         |
+
+Client-side errors (`ErrorCode.CLIENT_ERROR`, code -2) always return `False` from `is_retriable`.
+
 ## Common Error Scenarios
 
 ### Connection Refused
diff --git a/fluss-rust/website/docs/user-guide/rust/error-handling.md b/fluss-rust/website/docs/user-guide/rust/error-handling.md
index 964f81f206..b7e4b45436 100644
--- a/fluss-rust/website/docs/user-guide/rust/error-handling.md
+++ b/fluss-rust/website/docs/user-guide/rust/error-handling.md
@@ -78,6 +78,48 @@ match result {
 }
 ```
 
+## Retry Logic
+
+Some errors are transient: the server may be temporarily unavailable, mid-election, or under load. Call `is_retriable()` to decide whether to retry an operation instead of treating the error as permanent.
+
+`Error::is_retriable()` is available directly on any `Error` value. `RpcError` is always retriable; `FlussAPIError` delegates to the server error code; all other variants return `false`.
+
+```rust
+use fluss::error::Error;
+
+match writer.append(&row) {
+    Ok(_) => {}
+    Err(ref e) if e.is_retriable() => {
+        // Transient failure — safe to retry
+    }
+    Err(e) => {
+        // Permanent failure — log and abort
+        eprintln!("Fatal error: {}", e);
+    }
+}
+```
+
+### Retriable Variants
+
+| Variant / Error                              | Code | Reason                                    |
+|----------------------------------------------|------|-------------------------------------------|
+| `Error::RpcError`                            | —    | Network-level failure, always retriable   |
+| `FlussError::NetworkException`               | 1    | Server disconnected                       |
+| `FlussError::CorruptMessage`                 | 3    | CRC or size error                         |
+| `FlussError::SchemaNotExist`                 | 9    | Schema may not exist                      |
+| `FlussError::LogStorageException`            | 10   | Transient log storage error               |
+| `FlussError::KvStorageException`             | 11   | Transient KV storage error                |
+| `FlussError::NotLeaderOrFollower`            | 12   | Leader election in progress               |
+| `FlussError::CorruptRecordException`         | 14   | Corrupt record                            |
+| `FlussError::UnknownTableOrBucketException`  | 21   | Metadata not yet available                |
+| `FlussError::RequestTimeOut`                 | 25   | Request timed out                         |
+| `FlussError::StorageException`               | 26   | Transient storage error                   |
+| `FlussError::NotEnoughReplicasAfterAppendException` | 28 | Wrote to server but with low ISR size |
+| `FlussError::NotEnoughReplicasException`     | 29   | Low ISR size at write time                |
+| `FlussError::LeaderNotAvailableException`    | 44   | No leader available for partition         |
+
+All other `Error` variants (e.g. `RowConvertError`, `IllegalArgument`, `UnsupportedOperation`) always return `false` from `is_retriable()`.
+
 ## Common Error Scenarios
 
 ### Connection Refused

From 45be5c1adce42b2fcd218555dd20b5e501d2912a Mon Sep 17 00:00:00 2001
From: Prajwal banakar <prajwal.banakara@gmail.com>
Date: Thu, 12 Mar 2026 07:37:20 +0530
Subject: [PATCH 198/287] feat: allow configuring scanner fetch parameters
 (#417)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |  8 ++
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |  4 +
 fluss-rust/bindings/cpp/src/lib.rs            |  8 ++
 fluss-rust/bindings/python/fluss/__init__.pyi | 16 +++
 fluss-rust/bindings/python/src/config.rs      | 74 ++++++++++++++
 .../crates/fluss/src/client/connection.rs     |  2 +
 .../crates/fluss/src/client/table/scanner.rs  | 87 ++++++++++++-----
 fluss-rust/crates/fluss/src/config.rs         | 97 +++++++++++++++++++
 .../docs/user-guide/cpp/api-reference.md      |  4 +
 .../docs/user-guide/python/api-reference.md   |  4 +
 .../docs/user-guide/rust/api-reference.md     |  4 +
 11 files changed, 286 insertions(+), 22 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index d0da6173c8..79561a127f 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -1012,6 +1012,14 @@ struct Configuration {
     size_t scanner_remote_log_read_concurrency{4};
     // Maximum number of records returned in a single call to Poll() for LogScanner
     size_t scanner_log_max_poll_records{500};
+    // Maximum bytes per fetch response for LogScanner (16 MB)
+    int32_t scanner_log_fetch_max_bytes{16 * 1024 * 1024};
+    // Minimum bytes to accumulate before server returns a fetch response
+    int32_t scanner_log_fetch_min_bytes{1};
+    // Maximum time (ms) the server may wait to satisfy min bytes
+    int32_t scanner_log_fetch_wait_max_time_ms{500};
+    // Maximum bytes per fetch response per bucket for LogScanner (1 MB)
+    int32_t scanner_log_fetch_max_bytes_for_bucket{1024 * 1024};
     int64_t writer_batch_timeout_ms{100};
     // Connect timeout in milliseconds for TCP transport connect
     uint64_t connect_timeout_ms{120000};
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 93a60bf6e9..754ed0fd8f 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -64,6 +64,10 @@ inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi_config.remote_file_download_thread_num = config.remote_file_download_thread_num;
     ffi_config.scanner_remote_log_read_concurrency = config.scanner_remote_log_read_concurrency;
     ffi_config.scanner_log_max_poll_records = config.scanner_log_max_poll_records;
+    ffi_config.scanner_log_fetch_max_bytes = config.scanner_log_fetch_max_bytes;
+    ffi_config.scanner_log_fetch_min_bytes = config.scanner_log_fetch_min_bytes;
+    ffi_config.scanner_log_fetch_wait_max_time_ms = config.scanner_log_fetch_wait_max_time_ms;
+    ffi_config.scanner_log_fetch_max_bytes_for_bucket = config.scanner_log_fetch_max_bytes_for_bucket;
     ffi_config.writer_batch_timeout_ms = config.writer_batch_timeout_ms;
     ffi_config.connect_timeout_ms = config.connect_timeout_ms;
     ffi_config.security_protocol = rust::String(config.security_protocol);
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 36b9c51694..8d5153e6da 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -48,6 +48,10 @@ mod ffi {
         remote_file_download_thread_num: usize,
         scanner_remote_log_read_concurrency: usize,
         scanner_log_max_poll_records: usize,
+        scanner_log_fetch_max_bytes: i32,
+        scanner_log_fetch_min_bytes: i32,
+        scanner_log_fetch_wait_max_time_ms: i32,
+        scanner_log_fetch_max_bytes_for_bucket: i32,
         writer_batch_timeout_ms: i64,
         connect_timeout_ms: u64,
         security_protocol: String,
@@ -668,6 +672,10 @@ fn new_connection(config: &ffi::FfiConfig) -> ffi::FfiPtrResult {
         remote_file_download_thread_num: config.remote_file_download_thread_num,
         scanner_remote_log_read_concurrency: config.scanner_remote_log_read_concurrency,
         scanner_log_max_poll_records: config.scanner_log_max_poll_records,
+        scanner_log_fetch_max_bytes: config.scanner_log_fetch_max_bytes,
+        scanner_log_fetch_min_bytes: config.scanner_log_fetch_min_bytes,
+        scanner_log_fetch_wait_max_time_ms: config.scanner_log_fetch_wait_max_time_ms,
+        scanner_log_fetch_max_bytes_for_bucket: config.scanner_log_fetch_max_bytes_for_bucket,
         connect_timeout_ms: config.connect_timeout_ms,
         security_protocol: config.security_protocol.to_string(),
         security_sasl_mechanism: config.security_sasl_mechanism.to_string(),
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 63be0e2cc6..20b259e872 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -174,6 +174,22 @@ class Config:
     @scanner_log_max_poll_records.setter
     def scanner_log_max_poll_records(self, num: int) -> None: ...
     @property
+    def scanner_log_fetch_max_bytes(self) -> int: ...
+    @scanner_log_fetch_max_bytes.setter
+    def scanner_log_fetch_max_bytes(self, bytes: int) -> None: ...
+    @property
+    def scanner_log_fetch_min_bytes(self) -> int: ...
+    @scanner_log_fetch_min_bytes.setter
+    def scanner_log_fetch_min_bytes(self, bytes: int) -> None: ...
+    @property
+    def scanner_log_fetch_wait_max_time_ms(self) -> int: ...
+    @scanner_log_fetch_wait_max_time_ms.setter
+    def scanner_log_fetch_wait_max_time_ms(self, ms: int) -> None: ...
+    @property
+    def scanner_log_fetch_max_bytes_for_bucket(self) -> int: ...
+    @scanner_log_fetch_max_bytes_for_bucket.setter
+    def scanner_log_fetch_max_bytes_for_bucket(self, bytes: int) -> None: ...
+    @property
     def writer_batch_timeout_ms(self) -> int: ...
     @writer_batch_timeout_ms.setter
     def writer_batch_timeout_ms(self, timeout: int) -> None: ...
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index f99f9c63f8..fd3c980ba1 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -97,6 +97,32 @@ impl Config {
                                 ))
                             })?;
                     }
+                    "scanner.log.fetch.max-bytes" => {
+                        config.scanner_log_fetch_max_bytes = value.parse::<i32>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
+                        })?;
+                    }
+                    "scanner.log.fetch.min-bytes" => {
+                        config.scanner_log_fetch_min_bytes = value.parse::<i32>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
+                        })?;
+                    }
+                    "scanner.log.fetch.wait-max-time-ms" => {
+                        config.scanner_log_fetch_wait_max_time_ms =
+                            value.parse::<i32>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
+                    }
+                    "scanner.log.fetch.max-bytes-for-bucket" => {
+                        config.scanner_log_fetch_max_bytes_for_bucket =
+                            value.parse::<i32>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
+                    }
                     "writer.bucket.no-key-assigner" => {
                         config.writer_bucket_no_key_assigner =
                             value.parse::<fcore::config::NoKeyAssigner>().map_err(|e| {
@@ -329,6 +355,54 @@ impl Config {
     fn set_security_sasl_password(&mut self, password: String) {
         self.inner.security_sasl_password = password;
     }
+
+    /// Get the maximum bytes per fetch response for LogScanner
+    #[getter]
+    fn scanner_log_fetch_max_bytes(&self) -> i32 {
+        self.inner.scanner_log_fetch_max_bytes
+    }
+
+    /// Set the maximum bytes per fetch response for LogScanner
+    #[setter]
+    fn set_scanner_log_fetch_max_bytes(&mut self, bytes: i32) {
+        self.inner.scanner_log_fetch_max_bytes = bytes;
+    }
+
+    /// Get the minimum bytes to accumulate before returning a fetch response
+    #[getter]
+    fn scanner_log_fetch_min_bytes(&self) -> i32 {
+        self.inner.scanner_log_fetch_min_bytes
+    }
+
+    /// Set the minimum bytes to accumulate before returning a fetch response
+    #[setter]
+    fn set_scanner_log_fetch_min_bytes(&mut self, bytes: i32) {
+        self.inner.scanner_log_fetch_min_bytes = bytes;
+    }
+
+    /// Get the maximum time (ms) the server may wait to satisfy min-bytes
+    #[getter]
+    fn scanner_log_fetch_wait_max_time_ms(&self) -> i32 {
+        self.inner.scanner_log_fetch_wait_max_time_ms
+    }
+
+    /// Set the maximum time (ms) the server may wait to satisfy min-bytes
+    #[setter]
+    fn set_scanner_log_fetch_wait_max_time_ms(&mut self, ms: i32) {
+        self.inner.scanner_log_fetch_wait_max_time_ms = ms;
+    }
+
+    /// Get the maximum bytes per fetch response per bucket for LogScanner
+    #[getter]
+    fn scanner_log_fetch_max_bytes_for_bucket(&self) -> i32 {
+        self.inner.scanner_log_fetch_max_bytes_for_bucket
+    }
+
+    /// Set the maximum bytes per fetch response per bucket for LogScanner
+    #[setter]
+    fn set_scanner_log_fetch_max_bytes_for_bucket(&mut self, bytes: i32) {
+        self.inner.scanner_log_fetch_max_bytes_for_bucket = bytes;
+    }
 }
 
 impl Config {
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 703b588647..2610f6da0b 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -39,6 +39,8 @@ impl FlussConnection {
     pub async fn new(arg: Config) -> Result<Self> {
         arg.validate_security()
             .map_err(|msg| Error::IllegalArgument { message: msg })?;
+        arg.validate_scanner_fetch()
+            .map_err(|msg| Error::IllegalArgument { message: msg })?;
 
         let timeout = Duration::from_millis(arg.connect_timeout_ms);
         let connections = if arg.is_sasl_enabled() {
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index e837ba76c3..43025393e8 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -15,17 +15,6 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use arrow_schema::SchemaRef;
-use log::{debug, warn};
-use parking_lot::{Mutex, RwLock};
-use std::{
-    collections::{HashMap, HashSet},
-    slice::from_ref,
-    sync::Arc,
-    time::{Duration, Instant},
-};
-use tempfile::TempDir;
-
 use crate::client::connection::FlussConnection;
 use crate::client::credentials::SecurityTokenManager;
 use crate::client::metadata::Metadata;
@@ -44,12 +33,16 @@ use crate::record::{
 use crate::rpc::{RpcClient, RpcError, message};
 use crate::util::FairBucketStatusMap;
 use crate::{PartitionId, TableId};
-
-const LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
-#[allow(dead_code)]
-const LOG_FETCH_MAX_BYTES_FOR_BUCKET: i32 = 1024;
-const LOG_FETCH_MIN_BYTES: i32 = 1;
-const LOG_FETCH_WAIT_MAX_TIME: i32 = 500;
+use arrow_schema::SchemaRef;
+use log::{debug, warn};
+use parking_lot::{Mutex, RwLock};
+use std::{
+    collections::{HashMap, HashSet},
+    slice::from_ref,
+    sync::Arc,
+    time::{Duration, Instant},
+};
+use tempfile::TempDir;
 
 pub struct TableScan<'a> {
     conn: &'a FlussConnection,
@@ -637,6 +630,10 @@ struct LogFetcher {
     log_fetch_buffer: Arc<LogFetchBuffer>,
     nodes_with_pending_fetch_requests: Arc<Mutex<HashSet<i32>>>,
     max_poll_records: usize,
+    fetch_max_bytes: i32,
+    fetch_min_bytes: i32,
+    fetch_wait_max_time_ms: i32,
+    fetch_max_bytes_for_bucket: i32,
 }
 
 struct FetchResponseContext {
@@ -697,6 +694,10 @@ impl LogFetcher {
             log_fetch_buffer,
             nodes_with_pending_fetch_requests: Arc::new(Mutex::new(HashSet::new())),
             max_poll_records: config.scanner_log_max_poll_records,
+            fetch_max_bytes: config.scanner_log_fetch_max_bytes,
+            fetch_min_bytes: config.scanner_log_fetch_min_bytes,
+            fetch_wait_max_time_ms: config.scanner_log_fetch_wait_max_time_ms,
+            fetch_max_bytes_for_bucket: config.scanner_log_fetch_max_bytes_for_bucket,
         })
     }
 
@@ -1479,8 +1480,7 @@ impl LogFetcher {
                             partition_id: bucket.partition_id(),
                             bucket_id: bucket.bucket_id(),
                             fetch_offset: offset,
-                            // 1M
-                            max_fetch_bytes: 1024 * 1024,
+                            max_fetch_bytes: self.fetch_max_bytes_for_bucket,
                         };
 
                         fetch_log_req_for_buckets
@@ -1514,10 +1514,10 @@ impl LogFetcher {
 
                     let fetch_log_request = FetchLogRequest {
                         follower_server_id: -1,
-                        max_bytes: LOG_FETCH_MAX_BYTES,
+                        max_bytes: self.fetch_max_bytes,
                         tables_req: vec![req_for_table],
-                        max_wait_ms: Some(LOG_FETCH_WAIT_MAX_TIME),
-                        min_bytes: Some(LOG_FETCH_MIN_BYTES),
+                        max_wait_ms: Some(self.fetch_wait_max_time_ms),
+                        min_bytes: Some(self.fetch_min_bytes),
                     };
                     (leader_id, fetch_log_request)
                 })
@@ -1990,4 +1990,47 @@ mod tests {
         let result = validate_scan_support(&table_path, &table_info);
         assert!(result.is_ok());
     }
+    #[tokio::test]
+    async fn prepare_fetch_log_requests_uses_configured_fetch_params() -> Result<()> {
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = build_table_info(table_path.clone(), 1, 1);
+        let cluster = build_cluster_arc(&table_path, 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster));
+        let status = Arc::new(LogScannerStatus::new());
+        status.assign_scan_bucket(TableBucket::new(1, 0), 0);
+
+        let config = crate::config::Config {
+            scanner_log_fetch_max_bytes: 1234,
+            scanner_log_fetch_min_bytes: 7,
+            scanner_log_fetch_wait_max_time_ms: 89,
+            scanner_log_fetch_max_bytes_for_bucket: 512,
+            ..crate::config::Config::default()
+        };
+
+        let fetcher = LogFetcher::new(
+            table_info,
+            Arc::new(RpcClient::new()),
+            metadata,
+            status,
+            &config,
+            None,
+        )?;
+
+        let requests = fetcher.prepare_fetch_log_requests().await;
+        // The test cluster is expected to provide a leader for the bucket; rather than
+        // depend on its id, check every request that was built.
+        assert!(!requests.is_empty());
+        for req in requests.values() {
+            assert_eq!(req.max_bytes, 1234);
+            assert_eq!(req.min_bytes, Some(7));
+            assert_eq!(req.max_wait_ms, Some(89));
+
+            for table_req in &req.tables_req {
+                for bucket_req in &table_req.buckets_req {
+                    assert_eq!(bucket_req.max_fetch_bytes, 512);
+                }
+            }
+        }
+        Ok(())
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 08ffbfae77..e85a449250 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -27,7 +27,11 @@ const DEFAULT_PREFETCH_NUM: usize = 4;
 const DEFAULT_DOWNLOAD_THREADS: usize = 3;
 const DEFAULT_SCANNER_REMOTE_LOG_READ_CONCURRENCY: usize = 4;
 const DEFAULT_MAX_POLL_RECORDS: usize = 500;
+const DEFAULT_SCANNER_LOG_FETCH_MAX_BYTES: i32 = 16 * 1024 * 1024;
+const DEFAULT_SCANNER_LOG_FETCH_MIN_BYTES: i32 = 1;
+const DEFAULT_SCANNER_LOG_FETCH_WAIT_MAX_TIME_MS: i32 = 500;
 const DEFAULT_WRITER_BATCH_TIMEOUT_MS: i64 = 100;
+const DEFAULT_SCANNER_LOG_FETCH_MAX_BYTES_FOR_BUCKET: i32 = 1024 * 1024;
 
 const DEFAULT_ACKS: &str = "all";
 const DEFAULT_CONNECT_TIMEOUT_MS: u64 = 120_000;
@@ -91,11 +95,31 @@ pub struct Config {
     #[arg(long, default_value_t = DEFAULT_MAX_POLL_RECORDS)]
     pub scanner_log_max_poll_records: usize,
 
+    /// Maximum bytes per fetch response for LogScanner.
+    /// Default: 16777216 (16MB)
+    #[arg(long, default_value_t = DEFAULT_SCANNER_LOG_FETCH_MAX_BYTES)]
+    pub scanner_log_fetch_max_bytes: i32,
+
+    /// Minimum bytes to accumulate before returning a fetch response.
+    /// Default: 1
+    #[arg(long, default_value_t = DEFAULT_SCANNER_LOG_FETCH_MIN_BYTES)]
+    pub scanner_log_fetch_min_bytes: i32,
+
+    /// Maximum time the server may wait (ms) to satisfy min-bytes.
+    /// Default: 500
+    #[arg(long, default_value_t = DEFAULT_SCANNER_LOG_FETCH_WAIT_MAX_TIME_MS)]
+    pub scanner_log_fetch_wait_max_time_ms: i32,
+
     /// The maximum time to wait for a batch to be completed in milliseconds.
     /// Default: 100 (matching Java CLIENT_WRITER_BATCH_TIMEOUT)
     #[arg(long, default_value_t = DEFAULT_WRITER_BATCH_TIMEOUT_MS)]
     pub writer_batch_timeout_ms: i64,
 
+    /// Maximum bytes per fetch response **per bucket** for LogScanner.
+    /// Default: 1048576 (1MB)
+    #[arg(long, default_value_t = DEFAULT_SCANNER_LOG_FETCH_MAX_BYTES_FOR_BUCKET)]
+    pub scanner_log_fetch_max_bytes_for_bucket: i32,
+
     /// Connect timeout in milliseconds for TCP transport connect.
     /// Default: 120000 (120 seconds).
     #[arg(long, default_value_t = DEFAULT_CONNECT_TIMEOUT_MS)]
@@ -139,6 +163,22 @@ impl std::fmt::Debug for Config {
                 "scanner_log_max_poll_records",
                 &self.scanner_log_max_poll_records,
             )
+            .field(
+                "scanner_log_fetch_max_bytes",
+                &self.scanner_log_fetch_max_bytes,
+            )
+            .field(
+                "scanner_log_fetch_min_bytes",
+                &self.scanner_log_fetch_min_bytes,
+            )
+            .field(
+                "scanner_log_fetch_max_bytes_for_bucket",
+                &self.scanner_log_fetch_max_bytes_for_bucket,
+            )
+            .field(
+                "scanner_log_fetch_wait_max_time_ms",
+                &self.scanner_log_fetch_wait_max_time_ms,
+            )
             .field("writer_batch_timeout_ms", &self.writer_batch_timeout_ms)
             .field("connect_timeout_ms", &self.connect_timeout_ms)
             .field("security_protocol", &self.security_protocol)
@@ -162,6 +202,10 @@ impl Default for Config {
             remote_file_download_thread_num: DEFAULT_DOWNLOAD_THREADS,
             scanner_remote_log_read_concurrency: DEFAULT_SCANNER_REMOTE_LOG_READ_CONCURRENCY,
             scanner_log_max_poll_records: DEFAULT_MAX_POLL_RECORDS,
+            scanner_log_fetch_max_bytes: DEFAULT_SCANNER_LOG_FETCH_MAX_BYTES,
+            scanner_log_fetch_min_bytes: DEFAULT_SCANNER_LOG_FETCH_MIN_BYTES,
+            scanner_log_fetch_wait_max_time_ms: DEFAULT_SCANNER_LOG_FETCH_WAIT_MAX_TIME_MS,
+            scanner_log_fetch_max_bytes_for_bucket: DEFAULT_SCANNER_LOG_FETCH_MAX_BYTES_FOR_BUCKET,
             writer_batch_timeout_ms: DEFAULT_WRITER_BATCH_TIMEOUT_MS,
             connect_timeout_ms: DEFAULT_CONNECT_TIMEOUT_MS,
             security_protocol: String::from(DEFAULT_SECURITY_PROTOCOL),
@@ -205,6 +249,32 @@ impl Config {
         }
         Ok(())
     }
+    pub fn validate_scanner_fetch(&self) -> Result<(), String> {
+        if self.scanner_log_fetch_min_bytes <= 0 {
+            return Err("scanner_log_fetch_min_bytes must be > 0".to_string());
+        }
+        if self.scanner_log_fetch_max_bytes <= 0 {
+            return Err("scanner_log_fetch_max_bytes must be > 0".to_string());
+        }
+        if self.scanner_log_fetch_max_bytes < self.scanner_log_fetch_min_bytes {
+            return Err(
+                "scanner_log_fetch_max_bytes must be >= scanner_log_fetch_min_bytes".to_string(),
+            );
+        }
+        if self.scanner_log_fetch_wait_max_time_ms < 0 {
+            return Err("scanner_log_fetch_wait_max_time_ms must be >= 0".to_string());
+        }
+        if self.scanner_log_fetch_max_bytes_for_bucket <= 0 {
+            return Err("scanner_log_fetch_max_bytes_for_bucket must be > 0".to_string());
+        }
+        if self.scanner_log_fetch_max_bytes_for_bucket > self.scanner_log_fetch_max_bytes {
+            return Err(
+                "scanner_log_fetch_max_bytes_for_bucket must be <= scanner_log_fetch_max_bytes"
+                    .to_string(),
+            );
+        }
+        Ok(())
+    }
 }
 
 #[cfg(test)]
@@ -274,4 +344,31 @@ mod tests {
         };
         assert!(config.validate_security().is_err());
     }
+    #[test]
+    fn test_scanner_fetch_defaults_valid() {
+        let config = Config::default();
+        assert!(config.validate_scanner_fetch().is_ok());
+        assert_eq!(config.scanner_log_fetch_max_bytes, 16 * 1024 * 1024);
+        assert_eq!(config.scanner_log_fetch_min_bytes, 1);
+        assert_eq!(config.scanner_log_fetch_wait_max_time_ms, 500);
+    }
+
+    #[test]
+    fn test_scanner_fetch_invalid_ranges() {
+        let config = Config {
+            scanner_log_fetch_min_bytes: 2,
+            scanner_log_fetch_max_bytes: 1,
+            ..Config::default()
+        };
+        assert!(config.validate_scanner_fetch().is_err());
+    }
+
+    #[test]
+    fn test_scanner_fetch_negative_wait() {
+        let config = Config {
+            scanner_log_fetch_wait_max_time_ms: -1,
+            ..Config::default()
+        };
+        assert!(config.validate_scanner_fetch().is_err());
+    }
 }
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index debd311d40..d14cf16d13 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -28,6 +28,10 @@ Complete API reference for the Fluss C++ client.
 | `remote_file_download_thread_num`     | `size_t`      | `3`                  | Number of threads for remote log downloads                                               |
 | `scanner_remote_log_read_concurrency` | `size_t`      | `4`                  | Streaming read concurrency within a remote log file                                      |
 | `scanner_log_max_poll_records`        | `size_t`      | `500`                | Maximum number of records returned in a single Poll()                                    |
+| `scanner_log_fetch_max_bytes`         | `int32_t`     | `16777216` (16 MB)   | Maximum bytes per fetch response for LogScanner                                          |
+| `scanner_log_fetch_min_bytes`         | `int32_t`     | `1`                  | Minimum bytes the server must accumulate before returning a fetch response               |
+| `scanner_log_fetch_wait_max_time_ms`  | `int32_t`     | `500`                | Maximum time (ms) the server may wait to satisfy min-bytes                               |
+| `scanner_log_fetch_max_bytes_for_bucket`| `int32_t`   | `1048576` (1 MB)     | Maximum bytes per fetch response per bucket for LogScanner                               |
 | `connect_timeout_ms`                  | `uint64_t`    | `120000`             | TCP connect timeout in milliseconds                                                      |
 | `security_protocol`                   | `std::string` | `"PLAINTEXT"`        | `"PLAINTEXT"` (default) or `"sasl"` for SASL auth                                        |
 | `security_sasl_mechanism`             | `std::string` | `"PLAIN"`            | SASL mechanism (only `"PLAIN"` is supported)                                             |
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index fef10a8c5c..a4b594bce3 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -21,6 +21,10 @@ Complete API reference for the Fluss Python client.
 | `remote_file_download_thread_num`     | `remote-file.download-thread-num`     | Get/set number of threads for remote log downloads                                      |
 | `scanner_remote_log_read_concurrency` | `scanner.remote-log.read-concurrency` | Get/set streaming read concurrency within a remote log file                             |
 | `scanner_log_max_poll_records`        | `scanner.log.max-poll-records`        | Get/set max number of records returned in a single poll()                               |
+| `scanner_log_fetch_max_bytes`         | `scanner.log.fetch.max-bytes`         | Get/set maximum bytes per fetch response for LogScanner                                 |
+| `scanner_log_fetch_min_bytes`         | `scanner.log.fetch.min-bytes`         | Get/set minimum bytes the server must accumulate before returning a fetch response      |
+| `scanner_log_fetch_wait_max_time_ms`  | `scanner.log.fetch.wait-max-time-ms`  | Get/set maximum time (ms) the server may wait to satisfy min-bytes                      |
+| `scanner_log_fetch_max_bytes_for_bucket` | `scanner.log.fetch.max-bytes-for-bucket` | Get/set maximum bytes per fetch response per bucket for LogScanner                |
 | `connect_timeout_ms`                  | `connect-timeout`                     | Get/set TCP connect timeout in milliseconds                                             |
 | `security_protocol`                   | `security.protocol`                   | Get/set security protocol (`"PLAINTEXT"` or `"sasl"`)                                   |
 | `security_sasl_mechanism`             | `security.sasl.mechanism`             | Get/set SASL mechanism (only `"PLAIN"` is supported)                                    |
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index d539a860ca..7f4552265f 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -20,6 +20,10 @@ Complete API reference for the Fluss Rust client.
 | `remote_file_download_thread_num`     | `usize`         | `3`                | Number of threads for remote log downloads                                           |
 | `scanner_remote_log_read_concurrency` | `usize`         | `4`                | Streaming read concurrency within a remote log file                                  |
 | `scanner_log_max_poll_records`        | `usize`         | `500`              | Maximum number of records returned in a single poll()                                |
+| `scanner_log_fetch_max_bytes`         | `i32`           | `16777216` (16 MB) | Maximum bytes per fetch response for LogScanner                                      |
+| `scanner_log_fetch_min_bytes`         | `i32`           | `1`                | Minimum bytes the server must accumulate before returning a fetch response           |
+| `scanner_log_fetch_wait_max_time_ms`  | `i32`           | `500`              | Maximum time (ms) the server may wait to satisfy min-bytes                           |
+| `scanner_log_fetch_max_bytes_for_bucket`| `i32`         | `1048576` (1 MB)   | Maximum bytes per fetch response per bucket for LogScanner                           |
 | `connect_timeout_ms`                  | `u64`           | `120000`           | TCP connect timeout in milliseconds                                                  |
 | `security_protocol`                   | `String`        | `"PLAINTEXT"`      | `PLAINTEXT` (default) or `sasl` for SASL auth                                        |
 | `security_sasl_mechanism`             | `String`        | `"PLAIN"`          | SASL mechanism (only `PLAIN` is supported)                                           |

From 7413fce5a0a644aa20040b67a55890d8e4408371 Mon Sep 17 00:00:00 2001
From: Prajwal banakar <prajwal.banakara@gmail.com>
Date: Sun, 15 Mar 2026 07:20:11 +0530
Subject: [PATCH 199/287] [client] Add LookupResult::to_record_batch() (#411)

---
 .../crates/fluss/src/client/table/lookup.rs   | 124 ++++++++++++++++--
 fluss-rust/crates/fluss/src/record/arrow.rs   |   9 ++
 .../docs/user-guide/rust/api-reference.md     |   3 +-
 .../rust/example/primary-key-tables.md        |   8 ++
 4 files changed, 135 insertions(+), 9 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index ce154912e4..3d643ed332 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -20,6 +20,7 @@ use crate::client::metadata::Metadata;
 use crate::client::table::partition_getter::PartitionGetter;
 use crate::error::{Error, Result};
 use crate::metadata::{PhysicalTablePath, RowType, TableBucket, TableInfo, TablePath};
+use crate::record::RowAppendRecordBatchBuilder;
 use crate::record::kv::SCHEMA_ID_LENGTH;
 use crate::row::InternalRow;
 use crate::row::compacted::CompactedRow;
@@ -27,6 +28,7 @@ use crate::row::encode::{KeyEncoder, KeyEncoderFactory};
 use crate::rpc::ApiError;
 use crate::rpc::RpcClient;
 use crate::rpc::message::LookupRequest;
+use arrow::array::RecordBatch;
 use std::sync::Arc;
 
 /// The result of a lookup operation.
@@ -53,6 +55,19 @@ impl LookupResult {
         }
     }
 
+    /// Extracts the row payload by stripping the schema id prefix.
+    fn extract_payload(bytes: &[u8]) -> Result<&[u8]> {
+        bytes
+            .get(SCHEMA_ID_LENGTH..)
+            .ok_or_else(|| Error::RowConvertError {
+                message: format!(
+                    "Row payload too short: {} bytes, need at least {} for schema id",
+                    bytes.len(),
+                    SCHEMA_ID_LENGTH
+                ),
+            })
+    }
+
     /// Returns the only row in the result set as a [`CompactedRow`].
     ///
     /// This method provides a zero-copy view of the row data, which means the returned
@@ -62,14 +77,14 @@ impl LookupResult {
     /// - `Ok(Some(row))`: If exactly one row exists.
     /// - `Ok(None)`: If the result set is empty.
     /// - `Err(Error::UnexpectedError)`: If the result set contains more than one row.
-    ///
+    /// - `Err(Error::RowConvertError)`: If the row payload is too short to contain a schema id.
     pub fn get_single_row(&self) -> Result<Option<CompactedRow<'_>>> {
         match self.rows.len() {
             0 => Ok(None),
-            1 => Ok(Some(CompactedRow::from_bytes(
-                &self.row_type,
-                &self.rows[0][SCHEMA_ID_LENGTH..],
-            ))),
+            1 => {
+                let payload = Self::extract_payload(&self.rows[0])?;
+                Ok(Some(CompactedRow::from_bytes(&self.row_type, payload)))
+            }
             _ => Err(Error::UnexpectedError {
                 message: "LookupResult contains multiple rows, use get_rows() instead".to_string(),
                 source: None,
@@ -77,14 +92,42 @@ impl LookupResult {
         }
     }
 
-    /// Returns all rows as CompactedRows.
-    pub fn get_rows(&self) -> Vec<CompactedRow<'_>> {
+    /// Returns all rows in the result set as [`CompactedRow`]s.
+    ///
+    /// # Returns
+    /// - `Ok(rows)` - All rows in the result set.
+    /// - `Err(Error::RowConvertError)` - If any row payload is too short to contain a schema id.
+    pub fn get_rows(&self) -> Result<Vec<CompactedRow<'_>>> {
         self.rows
             .iter()
             // TODO Add schema id check and fetch when implementing prefix lookup
-            .map(|bytes| CompactedRow::from_bytes(&self.row_type, &bytes[SCHEMA_ID_LENGTH..]))
+            .map(|bytes| {
+                let payload = Self::extract_payload(bytes)?;
+                Ok(CompactedRow::from_bytes(&self.row_type, payload))
+            })
             .collect()
     }
+
+    /// Converts all rows in this result into an Arrow [`RecordBatch`].
+    ///
+    /// This is useful for integration with DataFusion or other Arrow-based tools.
+    ///
+    /// # Returns
+    /// - `Ok(RecordBatch)` - All rows in columnar Arrow format. Returns an empty
+    ///   batch (with the correct schema) if the result set is empty.
+    /// - `Err(Error)` - If a row payload is too short or the Arrow conversion fails.
+    pub fn to_record_batch(&self) -> Result<RecordBatch> {
+        let mut builder = RowAppendRecordBatchBuilder::new(&self.row_type)?;
+
+        for bytes in &self.rows {
+            let payload = Self::extract_payload(bytes)?;
+
+            let row = CompactedRow::from_bytes(&self.row_type, payload);
+            builder.append(&row)?;
+        }
+
+        builder.build_arrow_record_batch().map(Arc::unwrap_or_clone)
+    }
 }
 
 /// Configuration and factory struct for creating lookup operations.
@@ -306,3 +349,68 @@ impl Lookuper {
         &self.table_info
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{DataField, DataTypes};
+    use crate::row::binary::BinaryWriter;
+    use crate::row::compacted::CompactedRowWriter;
+    use arrow::array::Int32Array;
+
+    fn make_row_bytes(schema_id: i16, row_data: &[u8]) -> Vec<u8> {
+        let mut bytes = Vec::with_capacity(SCHEMA_ID_LENGTH + row_data.len());
+        bytes.extend_from_slice(&schema_id.to_le_bytes());
+        bytes.extend_from_slice(row_data);
+        bytes
+    }
+
+    #[test]
+    fn test_to_record_batch_empty() {
+        let row_type = Arc::new(RowType::new(vec![DataField::new(
+            "id",
+            DataTypes::int(),
+            None,
+        )]));
+        let result = LookupResult::empty(row_type);
+        let batch = result.to_record_batch().unwrap();
+        assert_eq!(batch.num_rows(), 0);
+        assert_eq!(batch.num_columns(), 1);
+    }
+
+    #[test]
+    fn test_to_record_batch_with_row() {
+        let row_type = Arc::new(RowType::new(vec![DataField::new(
+            "id",
+            DataTypes::int(),
+            None,
+        )]));
+
+        let mut writer = CompactedRowWriter::new(1);
+        writer.write_int(42);
+        let row_bytes = make_row_bytes(0, writer.buffer());
+
+        let result = LookupResult::new(vec![row_bytes], Arc::clone(&row_type));
+        let batch = result.to_record_batch().unwrap();
+
+        assert_eq!(batch.num_rows(), 1);
+        let col = batch
+            .column(0)
+            .as_any()
+            .downcast_ref::<Int32Array>()
+            .unwrap();
+        assert_eq!(col.value(0), 42);
+    }
+
+    #[test]
+    fn test_to_record_batch_payload_too_short() {
+        let row_type = Arc::new(RowType::new(vec![DataField::new(
+            "id",
+            DataTypes::int(),
+            None,
+        )]));
+        // Only 1 byte — shorter than SCHEMA_ID_LENGTH (2)
+        let result = LookupResult::new(vec![vec![0u8]], Arc::clone(&row_type));
+        assert!(result.to_record_batch().is_err());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index a0dfc84a84..83d102a1e6 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -246,6 +246,15 @@ impl RowAppendRecordBatchBuilder {
             records_count: 0,
         })
     }
+    /// Appends a row to the builder.
+    pub fn append(&mut self, row: &dyn InternalRow) -> Result<bool> {
+        ArrowRecordBatchInnerBuilder::append(self, row)
+    }
+
+    /// Builds the final Arrow RecordBatch.
+    pub fn build_arrow_record_batch(&mut self) -> Result<Arc<RecordBatch>> {
+        ArrowRecordBatchInnerBuilder::build_arrow_record_batch(self)
+    }
 }
 
 impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 7f4552265f..fbe3428c14 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -229,7 +229,8 @@ for record in records {
 | Method                                                         |  Description                     |
 |----------------------------------------------------------------|----------------------------------|
 | `fn get_single_row(&self) -> Result<Option<impl InternalRow>>` | Get a single row from the result |
-| `fn get_rows(&self) -> Vec<impl InternalRow>`                  | Get all rows from the result     |
+| `fn get_rows(&self) -> Result<Vec<impl InternalRow>>`          | Get all rows from the result     |
+| `fn to_record_batch(&self) -> Result<RecordBatch>`             | Convert all rows to an Arrow `RecordBatch` for DataFusion or other Arrow-based tools    |
 
 ## `WriteResultFuture`
 
diff --git a/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
index 9e819796ce..7fe8a553ff 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
@@ -112,3 +112,11 @@ if let Some(row) = result.get_single_row()? {
     println!("Record not found");
 }
 ```
+## Looking Up Records as Arrow RecordBatch
+
+Use `to_record_batch()` to get lookup results in Arrow format, for example when integrating with DataFusion.
+```rust
+let result = lookuper.lookup(&key).await?;
+let batch = result.to_record_batch()?;
+println!("Rows: {}", batch.num_rows());
+```

From ce67b9fadfbc42ca2b0ed023a1864d45ab77128e Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 15 Mar 2026 02:09:48 +0000
Subject: [PATCH 200/287] feat: introduce idempotent writes (#404)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |   8 +
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |   5 +
 fluss-rust/bindings/cpp/src/lib.rs            |   8 +
 fluss-rust/bindings/python/fluss/__init__.pyi |  16 +
 fluss-rust/bindings/python/src/config.rs      |  80 ++
 .../crates/fluss/src/client/connection.rs     |   4 +
 .../fluss/src/client/write/accumulator.rs     | 976 +++++++++++++++++-
 .../crates/fluss/src/client/write/batch.rs    |  54 +-
 .../fluss/src/client/write/broadcast.rs       |  11 +
 .../fluss/src/client/write/idempotence.rs     | 724 +++++++++++++
 .../crates/fluss/src/client/write/mod.rs      |  25 +-
 .../crates/fluss/src/client/write/sender.rs   | 762 ++++++++++++--
 .../fluss/src/client/write/writer_client.rs   | 113 +-
 fluss-rust/crates/fluss/src/config.rs         | 123 +++
 fluss-rust/crates/fluss/src/error.rs          |   9 +
 .../crates/fluss/src/proto/fluss_api.proto    |   9 +
 fluss-rust/crates/fluss/src/record/arrow.rs   |   5 +
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |  49 +-
 .../fluss/src/rpc/message/init_writer.rs      |  50 +
 .../crates/fluss/src/rpc/message/mod.rs       |   2 +
 20 files changed, 2867 insertions(+), 166 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/write/idempotence.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/init_writer.rs

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 79561a127f..768db0f740 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -1021,6 +1021,14 @@ struct Configuration {
     // Maximum bytes per fetch response per bucket for LogScanner (1 MB)
     int32_t scanner_log_fetch_max_bytes_for_bucket{1024 * 1024};
     int64_t writer_batch_timeout_ms{100};
+    // Whether to enable idempotent writes
+    bool writer_enable_idempotence{true};
+    // Maximum number of in-flight requests per bucket for idempotent writes
+    size_t writer_max_inflight_requests_per_bucket{5};
+    // Total memory available for buffering write batches (default 64MB)
+    size_t writer_buffer_memory_size{64 * 1024 * 1024};
+    // Maximum time in milliseconds to block waiting for buffer memory
+    uint64_t writer_buffer_wait_timeout_ms{std::numeric_limits<uint64_t>::max()};
     // Connect timeout in milliseconds for TCP transport connect
     uint64_t connect_timeout_ms{120000};
     // Security protocol: "PLAINTEXT" (default, no auth) or "sasl" (SASL auth)
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 754ed0fd8f..fcd4e1dcae 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -69,6 +69,11 @@ inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi_config.scanner_log_fetch_wait_max_time_ms = config.scanner_log_fetch_wait_max_time_ms;
     ffi_config.scanner_log_fetch_max_bytes_for_bucket = config.scanner_log_fetch_max_bytes_for_bucket;
     ffi_config.writer_batch_timeout_ms = config.writer_batch_timeout_ms;
+    ffi_config.writer_enable_idempotence = config.writer_enable_idempotence;
+    ffi_config.writer_max_inflight_requests_per_bucket =
+        config.writer_max_inflight_requests_per_bucket;
+    ffi_config.writer_buffer_memory_size = config.writer_buffer_memory_size;
+    ffi_config.writer_buffer_wait_timeout_ms = config.writer_buffer_wait_timeout_ms;
     ffi_config.connect_timeout_ms = config.connect_timeout_ms;
     ffi_config.security_protocol = rust::String(config.security_protocol);
     ffi_config.security_sasl_mechanism = rust::String(config.security_sasl_mechanism);
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 8d5153e6da..284eec898f 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -53,6 +53,10 @@ mod ffi {
         scanner_log_fetch_wait_max_time_ms: i32,
         scanner_log_fetch_max_bytes_for_bucket: i32,
         writer_batch_timeout_ms: i64,
+        writer_enable_idempotence: bool,
+        writer_max_inflight_requests_per_bucket: usize,
+        writer_buffer_memory_size: usize,
+        writer_buffer_wait_timeout_ms: u64,
         connect_timeout_ms: u64,
         security_protocol: String,
         security_sasl_mechanism: String,
@@ -676,6 +680,10 @@ fn new_connection(config: &ffi::FfiConfig) -> ffi::FfiPtrResult {
         scanner_log_fetch_min_bytes: config.scanner_log_fetch_min_bytes,
         scanner_log_fetch_wait_max_time_ms: config.scanner_log_fetch_wait_max_time_ms,
         scanner_log_fetch_max_bytes_for_bucket: config.scanner_log_fetch_max_bytes_for_bucket,
+        writer_enable_idempotence: config.writer_enable_idempotence,
+        writer_max_inflight_requests_per_bucket: config.writer_max_inflight_requests_per_bucket,
+        writer_buffer_memory_size: config.writer_buffer_memory_size,
+        writer_buffer_wait_timeout_ms: config.writer_buffer_wait_timeout_ms,
         connect_timeout_ms: config.connect_timeout_ms,
         security_protocol: config.security_protocol.to_string(),
         security_sasl_mechanism: config.security_sasl_mechanism.to_string(),
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 20b259e872..95f30801e9 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -194,6 +194,22 @@ class Config:
     @writer_batch_timeout_ms.setter
     def writer_batch_timeout_ms(self, timeout: int) -> None: ...
     @property
+    def writer_enable_idempotence(self) -> bool: ...
+    @writer_enable_idempotence.setter
+    def writer_enable_idempotence(self, enabled: bool) -> None: ...
+    @property
+    def writer_max_inflight_requests_per_bucket(self) -> int: ...
+    @writer_max_inflight_requests_per_bucket.setter
+    def writer_max_inflight_requests_per_bucket(self, num: int) -> None: ...
+    @property
+    def writer_buffer_memory_size(self) -> int: ...
+    @writer_buffer_memory_size.setter
+    def writer_buffer_memory_size(self, size: int) -> None: ...
+    @property
+    def writer_buffer_wait_timeout_ms(self) -> int: ...
+    @writer_buffer_wait_timeout_ms.setter
+    def writer_buffer_wait_timeout_ms(self, timeout: int) -> None: ...
+    @property
     def connect_timeout_ms(self) -> int: ...
     @connect_timeout_ms.setter
     def connect_timeout_ms(self, timeout: int) -> None: ...
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index fd3c980ba1..65bcc9adfe 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -123,6 +123,38 @@ impl Config {
                                 ))
                             })?;
                     }
+                    "writer.enable-idempotence" => {
+                        config.writer_enable_idempotence = match value.as_str() {
+                            "true" => true,
+                            "false" => false,
+                            other => {
+                                return Err(FlussError::new_err(format!(
+                                    "Invalid value '{other}' for '{key}', expected 'true' or 'false'"
+                                )));
+                            }
+                        };
+                    }
+                    "writer.max-inflight-requests-per-bucket" => {
+                        config.writer_max_inflight_requests_per_bucket =
+                            value.parse::<usize>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
+                    }
+                    "writer.buffer.memory-size" => {
+                        config.writer_buffer_memory_size = value.parse::<usize>().map_err(|e| {
+                            FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
+                        })?;
+                    }
+                    "writer.buffer.wait-timeout-ms" => {
+                        config.writer_buffer_wait_timeout_ms =
+                            value.parse::<u64>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
+                    }
                     "writer.bucket.no-key-assigner" => {
                         config.writer_bucket_no_key_assigner =
                             value.parse::<fcore::config::NoKeyAssigner>().map_err(|e| {
@@ -296,6 +328,54 @@ impl Config {
         Ok(())
     }
 
+    /// Get whether idempotent writes are enabled
+    #[getter]
+    fn writer_enable_idempotence(&self) -> bool {
+        self.inner.writer_enable_idempotence
+    }
+
+    /// Set whether idempotent writes are enabled
+    #[setter]
+    fn set_writer_enable_idempotence(&mut self, enabled: bool) {
+        self.inner.writer_enable_idempotence = enabled;
+    }
+
+    /// Get the max in-flight requests per bucket
+    #[getter]
+    fn writer_max_inflight_requests_per_bucket(&self) -> usize {
+        self.inner.writer_max_inflight_requests_per_bucket
+    }
+
+    /// Set the max in-flight requests per bucket
+    #[setter]
+    fn set_writer_max_inflight_requests_per_bucket(&mut self, num: usize) {
+        self.inner.writer_max_inflight_requests_per_bucket = num;
+    }
+
+    /// Get the writer buffer memory size
+    #[getter]
+    fn writer_buffer_memory_size(&self) -> usize {
+        self.inner.writer_buffer_memory_size
+    }
+
+    /// Set the writer buffer memory size
+    #[setter]
+    fn set_writer_buffer_memory_size(&mut self, size: usize) {
+        self.inner.writer_buffer_memory_size = size;
+    }
+
+    /// Get the writer buffer wait timeout in milliseconds
+    #[getter]
+    fn writer_buffer_wait_timeout_ms(&self) -> u64 {
+        self.inner.writer_buffer_wait_timeout_ms
+    }
+
+    /// Set the writer buffer wait timeout in milliseconds
+    #[setter]
+    fn set_writer_buffer_wait_timeout_ms(&mut self, timeout: u64) {
+        self.inner.writer_buffer_wait_timeout_ms = timeout;
+    }
+
     /// Get the connect timeout in milliseconds
     #[getter]
     fn connect_timeout_ms(&self) -> u64 {
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 2610f6da0b..78e9362b8f 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -28,6 +28,10 @@ use std::time::Duration;
 use crate::error::{Error, FlussError, Result};
 use crate::metadata::TablePath;
 
+// TODO: implement `close(&self, timeout: Duration)` to gracefully shut down the
+// writer client (drain pending batches, then force-close on timeout).
+// Java's FlussConnection.close() calls writerClient.close(Long.MAX_VALUE).
+// WriterClient::close() already exists but is never called from the public API.
 pub struct FlussConnection {
     metadata: Arc<Metadata>,
     network_connects: Arc<RpcClient>,
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 0cf501cb45..53d004012a 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -15,21 +15,150 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::client::broadcast;
+use crate::client::write::IdempotenceManager;
 use crate::client::write::batch::WriteBatch::{ArrowLog, Kv};
 use crate::client::write::batch::{ArrowLogWriteBatch, KvWriteBatch, WriteBatch};
 use crate::client::{LogWriteRecord, Record, ResultHandle, WriteRecord};
 use crate::cluster::{BucketLocation, Cluster, ServerNode};
 use crate::config::Config;
-use crate::error::Result;
+use crate::error::{Error, Result};
 use crate::metadata::{PhysicalTablePath, TableBucket};
+use crate::record::{NO_BATCH_SEQUENCE, NO_WRITER_ID};
 use crate::util::current_time_ms;
 use crate::{BucketId, PartitionId, TableId};
 use dashmap::DashMap;
-use parking_lot::Mutex;
-use parking_lot::RwLock;
+use parking_lot::{Condvar, Mutex, RwLock};
 use std::collections::{HashMap, HashSet, VecDeque};
 use std::sync::Arc;
-use std::sync::atomic::{AtomicI32, AtomicI64, Ordering};
+use std::sync::atomic::{AtomicBool, AtomicI32, AtomicI64, AtomicUsize, Ordering};
+use std::time::{Duration, Instant};
+use tokio::sync::Notify;
+
+/// Byte-counting semaphore that blocks producers when total buffered memory
+/// exceeds the configured limit. Matches Java's `LazyMemorySegmentPool` behavior.
+///
+/// TODO: Replace `notify_all()` with per-waiter FIFO signaling (Java uses per-request
+/// Condition objects in a Deque) to avoid thundering herd under high contention.
+///
+/// TODO: Track actual batch memory usage instead of reserving a fixed `writer_batch_size`
+/// per batch. This over-counts when batches don't fill completely, reducing effective
+/// throughput. Requires tighter coupling with batch internals.
+pub(crate) struct MemoryLimiter {
+    state: Mutex<usize>,
+    cond: Condvar,
+    max_memory: usize,
+    wait_timeout: Duration,
+    closed: AtomicBool,
+    waiting_count: AtomicUsize,
+}
+
+impl MemoryLimiter {
+    pub fn new(max_memory: usize, wait_timeout: Duration) -> Self {
+        Self {
+            state: Mutex::new(0),
+            cond: Condvar::new(),
+            max_memory,
+            wait_timeout,
+            closed: AtomicBool::new(false),
+            waiting_count: AtomicUsize::new(0),
+        }
+    }
+
+    /// Try to acquire `size` bytes. Blocks until memory is available,
+    /// the timeout expires, or the limiter is closed.
+    /// Returns a `MemoryPermit` on success.
+    pub fn acquire(self: &Arc<Self>, size: usize) -> Result<MemoryPermit> {
+        if self.closed.load(Ordering::Acquire) {
+            return Err(Error::WriterClosed {
+                message: "Memory limiter is closed".to_string(),
+            });
+        }
+
+        if size > self.max_memory {
+            return Err(Error::IllegalArgument {
+                message: format!(
+                    "Batch size {} exceeds total buffer memory limit {}",
+                    size, self.max_memory
+                ),
+            });
+        }
+
+        let mut used = self.state.lock();
+        let deadline = Instant::now() + self.wait_timeout;
+        while *used + size > self.max_memory {
+            self.waiting_count.fetch_add(1, Ordering::Relaxed);
+            let result = self.cond.wait_until(&mut used, deadline);
+            self.waiting_count.fetch_sub(1, Ordering::Relaxed);
+
+            if self.closed.load(Ordering::Acquire) {
+                return Err(Error::WriterClosed {
+                    message: "Memory limiter is closed".to_string(),
+                });
+            }
+            if result.timed_out() && *used + size > self.max_memory {
+                return Err(Error::BufferExhausted {
+                    message: format!(
+                        "Failed to allocate {} bytes for write batch within {}ms. \
+                         {} of {} bytes in use, {} threads waiting.",
+                        size,
+                        self.wait_timeout.as_millis(),
+                        *used,
+                        self.max_memory,
+                        self.waiting_count.load(Ordering::Relaxed),
+                    ),
+                });
+            }
+        }
+
+        *used += size;
+        Ok(MemoryPermit {
+            limiter: Arc::clone(self),
+            size,
+        })
+    }
+
+    fn release(&self, size: usize) {
+        let mut used = self.state.lock();
+        *used = used.saturating_sub(size);
+        self.cond.notify_all();
+    }
+
+    /// Returns true if any producers are currently blocked waiting for memory.
+    /// Used by `ready()` to mark all batches as immediately sendable when
+    /// memory is exhausted (matching Java's `exhausted` flag).
+    pub fn has_waiters(&self) -> bool {
+        self.waiting_count.load(Ordering::Relaxed) > 0
+    }
+
+    /// Mark the limiter as closed and wake all blocked producers.
+    fn close(&self) {
+        self.closed.store(true, Ordering::Release);
+        self.cond.notify_all();
+    }
+}
+
+/// RAII guard that releases memory back to the `MemoryLimiter` on drop.
+pub(crate) struct MemoryPermit {
+    limiter: Arc<MemoryLimiter>,
+    size: usize,
+}
+
+impl std::fmt::Debug for MemoryPermit {
+    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+        f.debug_struct("MemoryPermit")
+            .field("size", &self.size)
+            .finish_non_exhaustive()
+    }
+}
+
+impl Drop for MemoryPermit {
+    fn drop(&mut self) {
+        if self.size > 0 {
+            self.limiter.release(self.size);
+        }
+    }
+}
 
 // Type alias to simplify complex nested types
 type BucketBatches = Vec<(BucketId, Arc<Mutex<VecDeque<WriteBatch>>>)>;
@@ -38,19 +167,30 @@ type BucketBatches = Vec<(BucketId, Arc<Mutex<VecDeque<WriteBatch>>>)>;
 pub struct RecordAccumulator {
     config: Config,
     write_batches: DashMap<Arc<PhysicalTablePath>, BucketAndWriteBatches>,
-    // batch_id -> complete callback
-    incomplete_batches: RwLock<HashMap<i64, ResultHandle>>,
+    // batch_id -> (complete callback, memory permit)
+    incomplete_batches: RwLock<HashMap<i64, (ResultHandle, MemoryPermit)>>,
     batch_timeout_ms: i64,
-    closed: bool,
+    closed: AtomicBool,
     flushes_in_progress: AtomicI32,
     appends_in_progress: i32,
     nodes_drain_index: Mutex<HashMap<i32, usize>>,
     batch_id: AtomicI64,
+    idempotence_manager: Arc<IdempotenceManager>,
+    memory_limiter: Arc<MemoryLimiter>,
+    /// Wakes the sender task when new batches are created or existing batches
+    /// become full, so the sender can drain them immediately instead of waiting
+    /// for its next poll cycle. This is the Rust equivalent of Java's
+    /// `Sender.wakeup()` / Kafka's `RecordAccumulator.wakeup()`.
+    sender_wakeup: Notify,
 }
 
 impl RecordAccumulator {
-    pub fn new(config: Config) -> Self {
+    pub fn new(config: Config, idempotence_manager: Arc<IdempotenceManager>) -> Self {
         let batch_timeout_ms = config.writer_batch_timeout_ms;
+        let memory_limiter = Arc::new(MemoryLimiter::new(
+            config.writer_buffer_memory_size,
+            Duration::from_millis(config.writer_buffer_wait_timeout_ms),
+        ));
         RecordAccumulator {
             config,
             write_batches: Default::default(),
@@ -61,6 +201,9 @@ impl RecordAccumulator {
             appends_in_progress: Default::default(),
             nodes_drain_index: Default::default(),
             batch_id: Default::default(),
+            idempotence_manager,
+            memory_limiter,
+            sender_wakeup: Notify::new(),
         }
     }
 
@@ -90,11 +233,9 @@ impl RecordAccumulator {
         cluster: &Cluster,
         record: &WriteRecord,
         dq: &mut VecDeque<WriteBatch>,
+        permit: MemoryPermit,
+        alloc_size: usize,
     ) -> Result<RecordAppendResult> {
-        if let Some(append_result) = self.try_append(record, dq)? {
-            return Ok(append_result);
-        }
-
         let physical_table_path = &record.physical_table_path;
         let table_path = physical_table_path.get_table_path();
         let table_info = cluster.get_table(table_path)?;
@@ -117,8 +258,7 @@ impl RecordAccumulator {
                 self.batch_id.fetch_add(1, Ordering::Relaxed),
                 Arc::clone(physical_table_path),
                 schema_id,
-                // TODO: Decide how to derive write limit in the absence of java's equivalent of PreAllocatedPagedOutputView
-                KvWriteBatch::DEFAULT_WRITE_LIMIT,
+                alloc_size,
                 record.write_format.to_kv_format()?,
                 kv_record.target_columns.clone(),
                 current_time_ms(),
@@ -136,7 +276,7 @@ impl RecordAccumulator {
 
         self.incomplete_batches
             .write()
-            .insert(batch_id, result_handle.clone());
+            .insert(batch_id, (result_handle.clone(), permit));
         Ok(RecordAppendResult::new(
             result_handle,
             dq.len() > 1 || batch_is_closed,
@@ -191,7 +331,24 @@ impl RecordAccumulator {
                 true, false, true,
             ));
         }
-        self.append_new_batch(cluster, record, &mut dq_guard)
+
+        // Drop dq lock before blocking on memory to prevent deadlock:
+        // producer holds dq + blocks on memory, while sender needs dq to drain.
+        drop(dq_guard);
+
+        let batch_size = self.config.writer_batch_size as usize;
+        let record_size = record.estimated_record_size();
+        let alloc_size = batch_size.max(record_size);
+        let permit = self.memory_limiter.acquire(alloc_size)?;
+
+        // Re-acquire dq lock after memory is available
+        let mut dq_guard = dq.lock();
+        // Re-try: another thread may have created a batch while we waited
+        if let Some(append_result) = self.try_append(record, &mut dq_guard)? {
+            return Ok(append_result); // permit drops here, memory released
+        }
+
+        self.append_new_batch(cluster, record, &mut dq_guard, permit, alloc_size)
     }
 
     pub fn ready(&self, cluster: &Arc<Cluster>) -> Result<ReadyCheckResult> {
@@ -215,6 +372,7 @@ impl RecordAccumulator {
         let mut ready_nodes = HashSet::new();
         let mut next_ready_check_delay_ms = self.batch_timeout_ms;
         let mut unknown_leader_tables = HashSet::new();
+        let exhausted = self.memory_limiter.has_waiters();
 
         for (physical_table_path, mut partition_id, bucket_batches) in entries {
             next_ready_check_delay_ms = self.bucket_ready(
@@ -226,6 +384,7 @@ impl RecordAccumulator {
                 &mut unknown_leader_tables,
                 cluster,
                 next_ready_check_delay_ms,
+                exhausted,
             )?
         }
 
@@ -247,6 +406,7 @@ impl RecordAccumulator {
         unknown_leader_tables: &mut HashSet<Arc<PhysicalTablePath>>,
         cluster: &Cluster,
         next_ready_check_delay_ms: i64,
+        exhausted: bool,
     ) -> Result<i64> {
         let mut next_delay = next_ready_check_delay_ms;
 
@@ -284,8 +444,14 @@ impl RecordAccumulator {
             let full = deque_size > 1 || batch.is_closed();
             let table_bucket = cluster.get_table_bucket(physical_table_path, bucket_id)?;
             if let Some(leader) = cluster.leader_for(&table_bucket) {
-                next_delay =
-                    self.batch_ready(leader, waited_time_ms, full, ready_nodes, next_delay);
+                next_delay = self.batch_ready(
+                    leader,
+                    waited_time_ms,
+                    full,
+                    exhausted,
+                    ready_nodes,
+                    next_delay,
+                );
             } else {
                 unknown_leader_tables.insert(Arc::clone(physical_table_path));
             }
@@ -298,12 +464,17 @@ impl RecordAccumulator {
         leader: &ServerNode,
         waited_time_ms: i64,
         full: bool,
+        exhausted: bool,
         ready_nodes: &mut HashSet<ServerNode>,
         next_ready_check_delay_ms: i64,
     ) -> i64 {
         if !ready_nodes.contains(leader) {
             let expired = waited_time_ms >= self.batch_timeout_ms;
-            let sendable = full || expired || self.closed || self.flush_in_progress();
+            let sendable = full
+                || expired
+                || exhausted
+                || self.closed.load(Ordering::Acquire)
+                || self.flush_in_progress();
 
             if sendable {
                 ready_nodes.insert(leader.clone());
@@ -335,6 +506,46 @@ impl RecordAccumulator {
         Ok(batches)
     }
 
+    /// Decides whether draining must skip this bucket for now. Matches Java's
+    /// `shouldStopDrainBatchesForBucket`: returns true when `first` has to stay
+    /// queued, false when it may be drained.
+    fn should_stop_drain_batches_for_bucket(
+        &self,
+        first: &WriteBatch,
+        table_bucket: &TableBucket,
+    ) -> bool {
+        let manager = &self.idempotence_manager;
+
+        // Idempotence disabled: nothing restricts draining.
+        if !manager.is_enabled() {
+            return false;
+        }
+
+        // Idempotence enabled but the writer id is not valid: hold everything.
+        if !manager.is_writer_id_valid() {
+            return true;
+        }
+
+        // No batch in flight for this bucket: any batch may go out.
+        if manager.in_flight_count(table_bucket) == 0 {
+            return false;
+        }
+
+        if first.has_batch_sequence() {
+            // Re-enqueued batch: only the first in-flight batch may be resent.
+            // The check goes by batch_id rather than by sequence: after
+            // handle_failed_batch adjusts InFlightBatch sequences, the sequence
+            // stored in the WriteBatch may be stale (re_enqueue syncs it, but
+            // this is more robust). Java can compare sequences because
+            // resetWriterState mutates the batch directly; Rust uses
+            // lightweight InFlightBatch proxies.
+            !manager.is_first_in_flight_batch(table_bucket, first.batch_id())
+        } else {
+            // Fresh batch: respect max in-flight limit
+            !manager.can_send_more_requests(table_bucket)
+        }
+    }
+
     fn drain_batches_for_one_node(
         &self,
         cluster: &Cluster,
@@ -391,10 +602,41 @@ impl RecordAccumulator {
                             break;
                         }
 
+                        // Improvement: `continue` instead of `break` to skip
+                        // only this bucket, not all buckets for the node.
+                        if self.should_stop_drain_batches_for_bucket(first_batch, &table_bucket) {
+                            if current_index == start {
+                                break;
+                            }
+                            continue;
+                        }
+
                         maybe_batch = Some(batch_lock.pop_front().unwrap());
                     }
                 }
 
+                if let Some(ref mut batch) = maybe_batch {
+                    // Assign writer state to fresh batches (matching Java's drain loop)
+                    let writer_id = if self.idempotence_manager.is_enabled() {
+                        self.idempotence_manager.writer_id()
+                    } else {
+                        NO_WRITER_ID
+                    };
+                    if writer_id != NO_WRITER_ID && !batch.has_batch_sequence() {
+                        self.idempotence_manager
+                            .maybe_update_writer_id(&table_bucket);
+                        let seq = self
+                            .idempotence_manager
+                            .next_sequence_and_increment(&table_bucket);
+                        batch.set_writer_state(writer_id, seq);
+                        self.idempotence_manager.add_in_flight_batch(
+                            &table_bucket,
+                            seq,
+                            batch.batch_id(),
+                        );
+                    }
+                }
+
                 if let Some(mut batch) = maybe_batch {
                     let current_batch_size = batch.estimated_size_in_bytes();
                     size += current_batch_size;
@@ -425,34 +667,160 @@ impl RecordAccumulator {
         self.incomplete_batches.write().remove(&batch_id);
     }
 
-    pub fn re_enqueue(&self, ready_write_batch: ReadyWriteBatch) {
+    /// Puts a batch that must be retried back into its bucket deque.
+    pub fn re_enqueue(&self, mut ready_write_batch: ReadyWriteBatch) {
         ready_write_batch.write_batch.re_enqueued();
+
+        // handle_failed_batch may adjust the sequence tracked by IdempotenceManager
+        // without touching this WriteBatch (Java calls resetWriterState on the batch).
+        // Copy the adjusted value so drain checks and build() see the right sequence.
+        if self.idempotence_manager.is_enabled()
+            && ready_write_batch.write_batch.has_batch_sequence()
+        {
+            let resynced = self
+                .idempotence_manager
+                .get_adjusted_sequence(
+                    &ready_write_batch.table_bucket,
+                    ready_write_batch.write_batch.batch_id(),
+                )
+                .filter(|seq| *seq != ready_write_batch.write_batch.batch_sequence());
+            if let Some(adjusted_seq) = resynced {
+                let writer_id = ready_write_batch.write_batch.writer_id();
+                ready_write_batch
+                    .write_batch
+                    .set_writer_state(writer_id, adjusted_seq);
+            }
+        }
+
+        let deque = self.get_or_create_deque(&ready_write_batch);
+        let mut queued = deque.lock();
+        if !self.idempotence_manager.is_enabled() {
+            queued.push_front(ready_write_batch.write_batch);
+            return;
+        }
+        self.insert_in_sequence_order(&mut queued, ready_write_batch);
+    }
+
+    /// Insert a re-enqueued batch in sequence order. Matches Java's
+    /// `insertInSequenceOrder`: the batch goes to the front when it is the
+    /// first in-flight batch for its bucket, otherwise right after the leading
+    /// run of sequenced batches whose sequence is not greater than its own.
+    ///
+    /// Sequenced (re-enqueued) batches must stay ahead of fresh batches that
+    /// have no sequence yet; otherwise a fresh batch could be drained and
+    /// assigned a later sequence while an earlier retry is still queued.
+    fn insert_in_sequence_order(
+        &self,
+        dq: &mut VecDeque<WriteBatch>,
+        ready_write_batch: ReadyWriteBatch,
+    ) {
+        debug_assert!(
+            ready_write_batch.write_batch.batch_sequence() != NO_BATCH_SEQUENCE,
+            "Re-enqueuing a batch without a sequence (batch_id={})",
+            ready_write_batch.write_batch.batch_id()
+        );
+        debug_assert!(
+            self.idempotence_manager
+                .in_flight_count(&ready_write_batch.table_bucket)
+                > 0,
+            "Re-enqueuing a batch not tracked in in-flight (batch_id={}, bucket={})",
+            ready_write_batch.write_batch.batch_id(),
+            ready_write_batch.table_bucket
+        );
+
+        // An empty deque or the first in-flight batch: it goes to the front.
+        if dq.is_empty()
+            || self.idempotence_manager.is_first_in_flight_batch(
+                &ready_write_batch.table_bucket,
+                ready_write_batch.write_batch.batch_id(),
+            )
+        {
+            dq.push_front(ready_write_batch.write_batch);
+            return;
+        }
+
+        // Stop at the first batch that is either fresh (no sequence) or has a
+        // higher sequence; fall back to the end when every batch precedes it.
+        let batch_seq = ready_write_batch.write_batch.batch_sequence();
+        let insert_pos = dq
+            .iter()
+            .position(|b| !b.has_batch_sequence() || b.batch_sequence() > batch_seq)
+            .unwrap_or(dq.len());
+        dq.insert(insert_pos, ready_write_batch.write_batch);
+    }
+
+    fn get_or_create_deque(
+        &self,
+        ready_write_batch: &ReadyWriteBatch,
+    ) -> Arc<Mutex<VecDeque<WriteBatch>>> {
         let physical_table_path = ready_write_batch.write_batch.physical_table_path();
         let bucket_id = ready_write_batch.table_bucket.bucket_id();
         let table_id = ready_write_batch.table_bucket.table_id();
         let partition_id = ready_write_batch.table_bucket.partition_id();
         let is_partitioned_table = partition_id.is_some();
 
-        let dq = {
-            let mut binding = self
-                .write_batches
-                .entry(Arc::clone(physical_table_path))
-                .or_insert_with(|| BucketAndWriteBatches {
-                    table_id,
-                    is_partitioned_table,
-                    partition_id,
-                    batches: Default::default(),
-                });
-            let bucket_and_batches = binding.value_mut();
-            bucket_and_batches
-                .batches
-                .entry(bucket_id)
-                .or_insert_with(|| Arc::new(Mutex::new(VecDeque::new())))
-                .clone()
-        };
+        let mut binding = self
+            .write_batches
+            .entry(Arc::clone(physical_table_path))
+            .or_insert_with(|| BucketAndWriteBatches {
+                table_id,
+                is_partitioned_table,
+                partition_id,
+                batches: Default::default(),
+            });
+        let bucket_and_batches = binding.value_mut();
+        bucket_and_batches
+            .batches
+            .entry(bucket_id)
+            .or_insert_with(|| Arc::new(Mutex::new(VecDeque::new())))
+            .clone()
+    }
 
-        let mut dq_guard = dq.lock();
-        dq_guard.push_front(ready_write_batch.write_batch);
+    /// Mark the accumulator as closed. All batches become immediately ready
+    /// (sendable) in `batch_ready`, triggering a full drain without waiting
+    /// for `batch_timeout_ms`. Matches Java's `RecordAccumulator.close()`.
+    pub fn close(&self) {
+        self.closed.store(true, Ordering::Release);
+        self.wakeup_sender();
+    }
+
+    pub fn is_closed(&self) -> bool {
+        self.closed.load(Ordering::Acquire)
+    }
+
+    /// Closes the memory limiter and fails every batch that has not completed.
+    pub fn abort_batches(&self, error: broadcast::Error) {
+        self.memory_limiter.close();
+        // First, batches still queued in the deques (never drained).
+        for mut table_entry in self.write_batches.iter_mut() {
+            for (_, deque) in table_entry.value_mut().batches.iter_mut() {
+                let mut queued = deque.lock();
+                for batch in queued.drain(..) {
+                    batch.complete(Err(error.clone()));
+                }
+            }
+        }
+        // Then every handle still registered, which covers batches that were
+        // drained but are still in flight; already-completed handles ignore it.
+        let mut pending = self.incomplete_batches.write();
+        for (handle, _permit) in pending.values() {
+            handle.fail(error.clone());
+        }
+        pending.clear();
+    }
+
+    pub fn has_incomplete(&self) -> bool {
+        !self.incomplete_batches.read().is_empty()
+    }
+
+    /// Wake the sender task so it can drain ready batches immediately.
+    pub fn wakeup_sender(&self) {
+        self.sender_wakeup.notify_one();
+    }
+
+    /// Returns a future that completes when `wakeup_sender()` is called.
+    pub fn notified(&self) -> tokio::sync::futures::Notified<'_> {
+        self.sender_wakeup.notified()
     }
 
     fn get_all_buckets_in_current_node(
@@ -473,18 +841,42 @@ impl RecordAccumulator {
         buckets
     }
 
+    /// Returns true while at least one bucket deque still contains a batch.
+    pub fn has_undrained(&self) -> bool {
+        self.write_batches.iter().any(|table_entry| {
+            table_entry
+                .value()
+                .batches
+                .iter()
+                .any(|(_, batch_deque)| !batch_deque.lock().is_empty())
+        })
+    }
+
+    pub fn get_physical_table_paths_in_batches(&self) -> Vec<Arc<PhysicalTablePath>> {
+        self.write_batches
+            .iter()
+            .map(|entry| Arc::clone(entry.key()))
+            .collect()
+    }
+
     fn flush_in_progress(&self) -> bool {
         self.flushes_in_progress.load(Ordering::SeqCst) > 0
     }
 
     pub fn begin_flush(&self) {
         self.flushes_in_progress.fetch_add(1, Ordering::SeqCst);
+        self.wakeup_sender();
     }
 
     #[allow(unused_must_use)]
     pub async fn await_flush_completion(&self) -> Result<()> {
         // Clone handles before awaiting to avoid holding RwLock read guard across await points
-        let handles: Vec<_> = self.incomplete_batches.read().values().cloned().collect();
+        let handles: Vec<_> = self
+            .incomplete_batches
+            .read()
+            .values()
+            .map(|(h, _)| h.clone())
+            .collect();
 
         // Await on all handles
         let result = async {
@@ -586,10 +978,18 @@ mod tests {
     use crate::test_utils::{build_cluster, build_table_info};
     use std::sync::Arc;
 
+    fn disabled_idempotence() -> Arc<IdempotenceManager> {
+        Arc::new(IdempotenceManager::new(false, 5))
+    }
+
+    fn enabled_idempotence() -> Arc<IdempotenceManager> {
+        Arc::new(IdempotenceManager::new(true, 5))
+    }
+
     #[tokio::test]
     async fn re_enqueue_increments_attempts() -> Result<()> {
         let config = Config::default();
-        let accumulator = RecordAccumulator::new(config);
+        let accumulator = RecordAccumulator::new(config, disabled_idempotence());
         let table_path = TablePath::new("db".to_string(), "tbl".to_string());
         let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
         let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
@@ -623,7 +1023,7 @@ mod tests {
         use std::sync::atomic::Ordering;
 
         let config = Config::default();
-        let accumulator = RecordAccumulator::new(config);
+        let accumulator = RecordAccumulator::new(config, disabled_idempotence());
 
         accumulator.begin_flush();
         assert_eq!(accumulator.flushes_in_progress.load(Ordering::SeqCst), 1);
@@ -633,7 +1033,11 @@ mod tests {
             let broadcast = BroadcastOnce::default();
             let receiver = broadcast.receiver();
             let handle = ResultHandle::new(receiver);
-            accumulator.incomplete_batches.write().insert(1, handle);
+            let permit = accumulator.memory_limiter.acquire(1024).unwrap();
+            accumulator
+                .incomplete_batches
+                .write()
+                .insert(1, (handle, permit));
             // broadcast is dropped here, causing an error
         }
 
@@ -647,4 +1051,490 @@ mod tests {
 
         Ok(())
     }
+
+    fn append_and_drain(
+        accumulator: &RecordAccumulator,
+        cluster: &Arc<crate::cluster::Cluster>,
+        table_path: &TablePath,
+        bucket_id: i32,
+    ) -> Result<ReadyWriteBatch> {
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 2));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let row = GenericRow {
+            values: vec![Datum::Int32(1)],
+        };
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
+        accumulator.append(&record, bucket_id, cluster, false)?;
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        let mut batches = accumulator.drain(cluster.clone(), &nodes, 1024 * 1024)?;
+        let mut drained = batches.remove(&1).expect("drained batches");
+        Ok(drained.pop().expect("batch"))
+    }
+
+    #[test]
+    fn test_should_stop_drain_for_fresh_batch_over_limit() {
+        let idempotence = Arc::new(IdempotenceManager::new(true, 2));
+        idempotence.set_writer_id(42);
+        let config = Config::default();
+        let accumulator = RecordAccumulator::new(config, Arc::clone(&idempotence));
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let cluster = Arc::new(build_cluster(&table_path, 1, 1));
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let row = GenericRow {
+            values: vec![Datum::Int32(1)],
+        };
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
+        accumulator
+            .append(&record, 0, &cluster, false)
+            .expect("append");
+
+        let table_bucket = TableBucket::new(1, 0);
+
+        // Add 2 in-flight batches (reaching the max_in_flight=2)
+        idempotence.add_in_flight_batch(&table_bucket, 0, 100);
+        idempotence.add_in_flight_batch(&table_bucket, 1, 101);
+
+        // Get the front batch from the deque
+        let entry = accumulator
+            .write_batches
+            .get(&PhysicalTablePath::of(Arc::new(table_path)))
+            .unwrap();
+        let dq = entry.batches.get(&0).unwrap();
+        let dq_guard = dq.lock();
+        let first_batch = dq_guard.front().unwrap();
+
+        // Fresh batch (no batch_sequence) with in-flight at limit → should stop
+        assert!(!first_batch.has_batch_sequence());
+        assert!(accumulator.should_stop_drain_batches_for_bucket(first_batch, &table_bucket));
+
+        // Remove one in-flight → under limit → should not stop
+        drop(dq_guard);
+        idempotence.remove_in_flight_batch(&table_bucket, 101);
+        let dq_guard = entry.batches.get(&0).unwrap().lock();
+        let first_batch = dq_guard.front().unwrap();
+        assert!(!accumulator.should_stop_drain_batches_for_bucket(first_batch, &table_bucket));
+    }
+
+    #[test]
+    fn test_should_stop_drain_for_retry_not_first_inflight() {
+        let idempotence = enabled_idempotence();
+        idempotence.set_writer_id(42);
+        let config = Config::default();
+        let accumulator = RecordAccumulator::new(config, Arc::clone(&idempotence));
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let cluster = Arc::new(build_cluster(&table_path, 1, 1));
+
+        // Drain two separate batches to get batch0(seq=0) and batch1(seq=1)
+        let batch0 =
+            append_and_drain(&accumulator, &cluster, &table_path, 0).expect("drain batch0");
+        let batch1 =
+            append_and_drain(&accumulator, &cluster, &table_path, 0).expect("drain batch1");
+
+        assert_eq!(batch0.write_batch.batch_sequence(), 0);
+        assert_eq!(batch1.write_batch.batch_sequence(), 1);
+
+        let batch1_id = batch1.write_batch.batch_id();
+        let table_bucket = batch0.table_bucket.clone();
+
+        // Re-enqueue only batch1 (simulating batch0 still in-flight, batch1 got error)
+        accumulator.re_enqueue(batch1);
+
+        let entry = accumulator
+            .write_batches
+            .get(&PhysicalTablePath::of(Arc::new(table_path)))
+            .unwrap();
+        let dq = entry.batches.get(&0).unwrap();
+        let dq_guard = dq.lock();
+        let first_batch = dq_guard.front().unwrap();
+
+        // Batch1 is re-enqueued with seq=1, but batch0 (seq=0) is the first in-flight.
+        // batch1's batch_id != first in-flight batch_id → should stop.
+        assert!(first_batch.has_batch_sequence());
+        assert_eq!(first_batch.batch_id(), batch1_id);
+        assert!(accumulator.should_stop_drain_batches_for_bucket(first_batch, &table_bucket));
+    }
+
+    #[tokio::test]
+    async fn test_insert_in_sequence_order() -> Result<()> {
+        let idempotence = enabled_idempotence();
+        idempotence.set_writer_id(42);
+        let config = Config::default();
+        let accumulator = RecordAccumulator::new(config, Arc::clone(&idempotence));
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let cluster = Arc::new(build_cluster(&table_path, 1, 2));
+
+        // Create and drain 3 batches to get them with sequences 0, 1, 2
+        let batch0 = append_and_drain(&accumulator, &cluster, &table_path, 0)?;
+        let batch1 = append_and_drain(&accumulator, &cluster, &table_path, 0)?;
+        let batch2 = append_and_drain(&accumulator, &cluster, &table_path, 0)?;
+
+        assert_eq!(batch0.write_batch.batch_sequence(), 0);
+        assert_eq!(batch1.write_batch.batch_sequence(), 1);
+        assert_eq!(batch2.write_batch.batch_sequence(), 2);
+
+        let batch0_id = batch0.write_batch.batch_id();
+        let batch1_id = batch1.write_batch.batch_id();
+        let batch2_id = batch2.write_batch.batch_id();
+        let table_bucket = batch0.table_bucket.clone();
+
+        // Re-enqueue in reverse order: 2, 0, 1
+        // insert_in_sequence_order should sort them as: 0, 1, 2
+        accumulator.re_enqueue(batch2);
+        accumulator.re_enqueue(batch0);
+        accumulator.re_enqueue(batch1);
+
+        // Verify the deque order directly
+        let entry = accumulator
+            .write_batches
+            .get(&PhysicalTablePath::of(Arc::new(table_path)))
+            .unwrap();
+        let dq = entry.batches.get(&0).unwrap();
+        let dq_guard = dq.lock();
+        assert_eq!(dq_guard.len(), 3);
+        // batch0 (seq=0) is the first in-flight, so it should be at front
+        assert_eq!(dq_guard[0].batch_id(), batch0_id);
+        assert_eq!(dq_guard[0].batch_sequence(), 0);
+        assert_eq!(dq_guard[1].batch_id(), batch1_id);
+        assert_eq!(dq_guard[1].batch_sequence(), 1);
+        assert_eq!(dq_guard[2].batch_id(), batch2_id);
+        assert_eq!(dq_guard[2].batch_sequence(), 2);
+        drop(dq_guard);
+
+        // Drain: first in-flight is seq=0, so batch0 passes should_stop check
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        let mut batches = accumulator.drain(cluster.clone(), &nodes, 1024 * 1024)?;
+        let drained = batches.remove(&1).expect("drained batches");
+        assert_eq!(drained.len(), 1);
+        assert_eq!(drained[0].write_batch.batch_sequence(), 0);
+
+        // Complete batch0 so batch1 becomes first in-flight
+        idempotence.handle_completed_batch(&table_bucket, batch0_id, 42);
+
+        let mut batches = accumulator.drain(cluster.clone(), &nodes, 1024 * 1024)?;
+        let drained = batches.remove(&1).expect("drained");
+        assert_eq!(drained[0].write_batch.batch_sequence(), 1);
+
+        idempotence.handle_completed_batch(&table_bucket, batch1_id, 42);
+
+        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024)?;
+        let drained = batches.remove(&1).expect("drained");
+        assert_eq!(drained[0].write_batch.batch_sequence(), 2);
+
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn test_abort_batches() -> Result<()> {
+        let idempotence = disabled_idempotence();
+        let config = Config::default();
+        let accumulator = RecordAccumulator::new(config, Arc::clone(&idempotence));
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let cluster = Arc::new(build_cluster(&table_path, 1, 1));
+        let row = GenericRow {
+            values: vec![Datum::Int32(1)],
+        };
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
+
+        let result = accumulator.append(&record, 0, &cluster, false)?;
+        let handle = result.result_handle.expect("handle");
+        assert!(accumulator.has_incomplete());
+
+        accumulator.abort_batches(broadcast::Error::Client {
+            message: "test abort".to_string(),
+        });
+
+        assert!(!accumulator.has_incomplete());
+        assert!(!accumulator.has_undrained());
+
+        // The handle should receive the error
+        let batch_result = handle.wait().await?;
+        assert!(matches!(
+            batch_result,
+            Err(broadcast::Error::Client { message }) if message == "test abort"
+        ));
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn test_drain_skips_blocked_bucket_continues_others() -> Result<()> {
+        // Use max_in_flight=1 so that one in-flight batch blocks further draining
+        let idempotence = Arc::new(IdempotenceManager::new(true, 1));
+        idempotence.set_writer_id(42);
+        let config = Config::default();
+        let accumulator = RecordAccumulator::new(config, Arc::clone(&idempotence));
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let cluster = Arc::new(build_cluster(&table_path, 1, 2));
+
+        // Append to both buckets
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 2));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let row = GenericRow {
+            values: vec![Datum::Int32(1)],
+        };
+
+        // Append to bucket 0
+        let record =
+            WriteRecord::for_append(table_info.clone(), physical_table_path.clone(), 1, &row);
+        accumulator.append(&record, 0, &cluster, false)?;
+
+        // Append to bucket 1
+        let record =
+            WriteRecord::for_append(table_info.clone(), physical_table_path.clone(), 1, &row);
+        accumulator.append(&record, 1, &cluster, false)?;
+
+        // Drain once — both buckets get batches assigned with sequences
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        let batches = accumulator.drain(cluster.clone(), &nodes, 1024 * 1024)?;
+        let drained = batches.get(&1).expect("drained");
+        // Both buckets should produce batches
+        assert_eq!(drained.len(), 2);
+
+        // Now: both buckets have 1 in-flight each (added during drain).
+        // Append another record to each bucket.
+        let record =
+            WriteRecord::for_append(table_info.clone(), physical_table_path.clone(), 1, &row);
+        accumulator.append(&record, 0, &cluster, false)?;
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
+        accumulator.append(&record, 1, &cluster, false)?;
+
+        // With max_in_flight=1, both buckets are at limit → should_stop returns true
+        // for fresh batches. The drain should skip both (continue, not break).
+        let batches2 = accumulator.drain(cluster.clone(), &nodes, 1024 * 1024)?;
+        // No batches should be drained (both blocked)
+        assert!(
+            batches2.is_empty() || batches2.get(&1).is_none_or(|b| b.is_empty()),
+            "Expected no batches when all buckets are blocked"
+        );
+
+        // Complete the in-flight for bucket 0
+        let bucket0_batch = &drained[0];
+        idempotence.handle_completed_batch(
+            &bucket0_batch.table_bucket,
+            bucket0_batch.write_batch.batch_id(),
+            42,
+        );
+
+        // Now bucket 0 is unblocked but bucket 1 is still blocked
+        let batches3 = accumulator.drain(cluster, &nodes, 1024 * 1024)?;
+        let drained3 = batches3.get(&1).expect("some drained");
+        // Only bucket 0 should produce a batch (continue skipped bucket 1)
+        assert_eq!(drained3.len(), 1);
+        assert_eq!(drained3[0].table_bucket.bucket_id(), 0);
+
+        Ok(())
+    }
+
+    #[test]
+    fn test_memory_limiter_acquire_release() {
+        let limiter = Arc::new(MemoryLimiter::new(1024, Duration::from_secs(1)));
+
+        let permit1 = limiter.acquire(512).unwrap();
+        let permit2 = limiter.acquire(512).unwrap();
+
+        // At capacity — verify used is 1024
+        assert_eq!(*limiter.state.lock(), 1024);
+
+        // Release one permit, verify used drops
+        drop(permit1);
+        assert_eq!(*limiter.state.lock(), 512);
+
+        drop(permit2);
+        assert_eq!(*limiter.state.lock(), 0);
+    }
+
+    #[test]
+    fn test_memory_limiter_oversized_batch_fails_immediately() {
+        let limiter = Arc::new(MemoryLimiter::new(1024, Duration::from_secs(60)));
+
+        let result = limiter.acquire(2048);
+        assert!(matches!(result.unwrap_err(), Error::IllegalArgument { .. }));
+    }
+
+    #[test]
+    fn test_memory_limiter_blocks_then_unblocks() {
+        let limiter = Arc::new(MemoryLimiter::new(1024, Duration::from_secs(5)));
+
+        let permit = limiter.acquire(1024).unwrap();
+        assert_eq!(*limiter.state.lock(), 1024);
+
+        // Spawn a thread that tries to acquire — it should block
+        let limiter2 = Arc::clone(&limiter);
+        let handle = std::thread::spawn(move || limiter2.acquire(512));
+
+        // Give the thread time to block
+        std::thread::sleep(Duration::from_millis(50));
+        // Still at capacity (thread is blocked)
+        assert_eq!(*limiter.state.lock(), 1024);
+
+        // Release the permit — thread should unblock
+        drop(permit);
+
+        let result = handle.join().unwrap();
+        assert!(result.is_ok());
+        let _permit2 = result.unwrap();
+        assert_eq!(*limiter.state.lock(), 512);
+    }
+
+    #[test]
+    fn test_memory_limiter_timeout() {
+        let limiter = Arc::new(MemoryLimiter::new(1024, Duration::from_millis(100)));
+
+        let _permit = limiter.acquire(1024).unwrap();
+
+        // This should timeout
+        let start = Instant::now();
+        let result = limiter.acquire(512);
+        let elapsed = start.elapsed();
+
+        assert!(matches!(result.unwrap_err(), Error::BufferExhausted { .. }));
+        assert!(elapsed >= Duration::from_millis(80)); // allow some timing slack
+    }
+
+    #[test]
+    fn test_memory_limiter_close_fails_immediately() {
+        let limiter = Arc::new(MemoryLimiter::new(1024, Duration::from_secs(60)));
+
+        let _permit = limiter.acquire(512).unwrap();
+
+        limiter.close();
+
+        // New acquire should fail immediately, not block for 60s
+        let start = Instant::now();
+        let result = limiter.acquire(256);
+        let elapsed = start.elapsed();
+
+        assert!(matches!(result.unwrap_err(), Error::WriterClosed { .. }));
+        assert!(elapsed < Duration::from_millis(50));
+    }
+
+    #[test]
+    fn test_memory_limiter_close_unblocks_waiting_threads() {
+        let limiter = Arc::new(MemoryLimiter::new(1024, Duration::from_secs(60)));
+
+        // Fill the limiter completely
+        let _permit = limiter.acquire(1024).unwrap();
+
+        // Spawn a thread that blocks waiting for memory
+        let limiter2 = Arc::clone(&limiter);
+        let handle = std::thread::spawn(move || {
+            let start = Instant::now();
+            let result = limiter2.acquire(512);
+            (result, start.elapsed())
+        });
+
+        // Give the thread time to block
+        std::thread::sleep(Duration::from_millis(50));
+        assert_eq!(limiter.waiting_count.load(Ordering::Relaxed), 1);
+
+        // Close the limiter — should unblock the waiting thread
+        limiter.close();
+
+        let (result, elapsed) = handle.join().unwrap();
+        assert!(matches!(result.unwrap_err(), Error::WriterClosed { .. }));
+        assert!(elapsed < Duration::from_secs(5)); // should not wait the full 60s
+    }
+
+    #[test]
+    fn test_oversized_kv_record_does_not_panic() {
+        use crate::client::write::write_format::WriteFormat;
+        use crate::client::write::{RowBytes, WriteRecord};
+        use bytes::Bytes;
+
+        // Use a tiny batch size so the KV record exceeds it
+        let config = Config {
+            writer_batch_size: 64,
+            writer_buffer_memory_size: 1024 * 1024,
+            ..Config::default()
+        };
+
+        let accumulator = RecordAccumulator::new(config, disabled_idempotence());
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let cluster = Arc::new(build_cluster(&table_path, 1, 1));
+
+        // Create a KV record larger than batch_size (64 bytes)
+        let key = Bytes::from(vec![0u8; 32]);
+        let value = vec![0u8; 256];
+        let record = WriteRecord::for_upsert(
+            table_info,
+            physical_table_path,
+            1,
+            key,
+            None,
+            WriteFormat::CompactedKv,
+            None,
+            Some(RowBytes::Owned(Bytes::from(value))),
+        );
+
+        // This used to panic with "must append to a new batch" because
+        // the KV write limit was hardcoded to DEFAULT_WRITE_LIMIT (256 bytes)
+        // instead of using alloc_size = max(batch_size, record_size).
+        let result = accumulator.append(&record, 0, &cluster, false);
+        assert!(result.is_ok(), "oversized KV record should not panic");
+    }
+
+    #[test]
+    fn test_memory_permit_accounts_for_oversized_record() {
+        use crate::client::write::write_format::WriteFormat;
+        use crate::client::write::{RowBytes, WriteRecord};
+        use bytes::Bytes;
+
+        let config = Config {
+            writer_batch_size: 64,
+            writer_buffer_memory_size: 1024 * 1024,
+            ..Config::default()
+        };
+
+        let accumulator = RecordAccumulator::new(config, disabled_idempotence());
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let cluster = Arc::new(build_cluster(&table_path, 1, 1));
+
+        let key = Bytes::from(vec![0u8; 32]);
+        let value = vec![0u8; 256];
+        let record = WriteRecord::for_upsert(
+            table_info,
+            physical_table_path,
+            1,
+            key,
+            None,
+            WriteFormat::CompactedKv,
+            None,
+            Some(RowBytes::Owned(Bytes::from(value))),
+        );
+
+        // estimated_record_size includes batch header overhead
+        let expected_alloc = record.estimated_record_size();
+        assert!(expected_alloc > 64, "record should exceed batch_size=64");
+
+        accumulator.append(&record, 0, &cluster, false).unwrap();
+
+        // The permit should reserve max(batch_size, estimated_record_size) bytes.
+        let used = *accumulator.memory_limiter.state.lock();
+        assert_eq!(
+            used, expected_alloc,
+            "memory limiter should reserve max(batch_size, estimated_record_size)"
+        );
+    }
+
+    #[tokio::test]
+    async fn test_sender_wakeup_notifies() {
+        let accumulator = RecordAccumulator::new(Config::default(), disabled_idempotence());
+
+        // notified() should complete when wakeup_sender() is called
+        let notified = accumulator.notified();
+        accumulator.wakeup_sender();
+        // If wakeup doesn't work, this would hang forever.
+        tokio::time::timeout(Duration::from_millis(100), notified)
+            .await
+            .expect("notified should complete after wakeup_sender");
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index c765473096..e3cd2ca46d 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -22,6 +22,7 @@ use crate::error::{Error, Result};
 use crate::metadata::{KvFormat, PhysicalTablePath, RowType};
 use crate::record::MemoryLogRecordsArrowBuilder;
 use crate::record::kv::KvRecordBatchBuilder;
+use crate::record::{NO_BATCH_SEQUENCE, NO_WRITER_ID};
 use bytes::Bytes;
 use std::cmp::max;
 use std::sync::Arc;
@@ -35,6 +36,8 @@ pub struct InnerWriteBatch {
     completed: AtomicBool,
     attempts: AtomicI32,
     drained_ms: i64,
+    batch_sequence: i32,
+    writer_id: i64,
 }
 
 impl InnerWriteBatch {
@@ -47,9 +50,23 @@ impl InnerWriteBatch {
             completed: AtomicBool::new(false),
             attempts: AtomicI32::new(0),
             drained_ms: -1,
+            batch_sequence: NO_BATCH_SEQUENCE,
+            writer_id: NO_WRITER_ID,
         }
     }
 
+    pub fn batch_sequence(&self) -> i32 {
+        self.batch_sequence
+    }
+
+    pub fn writer_id(&self) -> i64 {
+        self.writer_id
+    }
+
+    pub fn has_batch_sequence(&self) -> bool {
+        self.batch_sequence != NO_BATCH_SEQUENCE
+    }
+
     fn waited_time_ms(&self, now: i64) -> i64 {
         max(0i64, now - self.create_ms)
     }
@@ -176,6 +193,25 @@ impl WriteBatch {
     pub fn is_done(&self) -> bool {
         self.inner_batch().is_done()
     }
+
+    pub fn batch_sequence(&self) -> i32 {
+        self.inner_batch().batch_sequence()
+    }
+
+    pub fn writer_id(&self) -> i64 {
+        self.inner_batch().writer_id()
+    }
+
+    pub fn has_batch_sequence(&self) -> bool {
+        self.inner_batch().has_batch_sequence()
+    }
+
+    pub fn set_writer_state(&mut self, writer_id: i64, batch_base_sequence: i32) {
+        match self {
+            WriteBatch::ArrowLog(batch) => batch.set_writer_state(writer_id, batch_base_sequence),
+            WriteBatch::Kv(batch) => batch.set_writer_state(writer_id, batch_base_sequence),
+        }
+    }
 }
 
 pub struct ArrowLogWriteBatch {
@@ -226,6 +262,14 @@ impl ArrowLogWriteBatch {
         }
     }
 
+    pub fn set_writer_state(&mut self, writer_id: i64, batch_base_sequence: i32) {
+        self.arrow_builder
+            .set_writer_state(writer_id, batch_base_sequence);
+        self.write_batch.batch_sequence = batch_base_sequence;
+        self.write_batch.writer_id = writer_id;
+        self.built_records = None;
+    }
+
     pub fn build(&mut self) -> Result<Bytes> {
         if let Some(bytes) = &self.built_records {
             return Ok(bytes.clone());
@@ -264,7 +308,6 @@ pub struct KvWriteBatch {
 }
 
 impl KvWriteBatch {
-    pub const DEFAULT_WRITE_LIMIT: usize = 256;
     #[allow(clippy::too_many_arguments)]
     pub fn new(
         batch_id: i64,
@@ -345,6 +388,13 @@ impl KvWriteBatch {
         self.kv_batch_builder.close()
     }
 
+    pub fn set_writer_state(&mut self, writer_id: i64, batch_base_sequence: i32) {
+        self.kv_batch_builder
+            .set_writer_state(writer_id, batch_base_sequence);
+        self.write_batch.batch_sequence = batch_base_sequence;
+        self.write_batch.writer_id = writer_id;
+    }
+
     pub fn target_columns(&self) -> Option<&Arc<Vec<usize>>> {
         self.target_columns.as_ref()
     }
@@ -509,7 +559,7 @@ mod tests {
             1,
             Arc::clone(&physical_path),
             1,
-            KvWriteBatch::DEFAULT_WRITE_LIMIT,
+            256,
             KvFormat::COMPACTED,
             None,
             0,
diff --git a/fluss-rust/crates/fluss/src/client/write/broadcast.rs b/fluss-rust/crates/fluss/src/client/write/broadcast.rs
index ec45776599..9e00403586 100644
--- a/fluss-rust/crates/fluss/src/client/write/broadcast.rs
+++ b/fluss-rust/crates/fluss/src/client/write/broadcast.rs
@@ -58,6 +58,17 @@ impl<T: Clone + Send + Sync> BroadcastOnceReceiver<T> {
 
         self.peek().expect("just got notified")
     }
+
+    /// Force-complete with an error if not already completed.
+    /// Used by `abort_batches` to fail in-flight handles that can't be
+    /// reached through `WriteBatch::complete`.
+    pub(crate) fn fail(&self, error: Error) {
+        let mut data = self.shared.data.write();
+        if data.is_none() {
+            *data = Some(Err(error));
+            self.shared.notify.notify_waiters();
+        }
+    }
 }
 
 #[derive(Debug)]
diff --git a/fluss-rust/crates/fluss/src/client/write/idempotence.rs b/fluss-rust/crates/fluss/src/client/write/idempotence.rs
new file mode 100644
index 0000000000..3c55f6ac5a
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/idempotence.rs
@@ -0,0 +1,724 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::metadata::TableBucket;
+use crate::record::{NO_BATCH_SEQUENCE, NO_WRITER_ID};
+use crate::rpc::FlussError;
+use log::debug;
+use parking_lot::Mutex;
+use std::collections::{HashMap, HashSet};
+use std::sync::atomic::{AtomicI64, Ordering};
+
+struct InFlightBatch {
+    batch_sequence: i32,
+    batch_id: i64,
+}
+
+struct BucketEntry {
+    writer_id: i64,
+    next_sequence: i32,
+    last_acked_sequence: i32,
+    in_flight: Vec<InFlightBatch>,
+    reset_batch_ids: HashSet<i64>,
+}
+
+impl BucketEntry {
+    fn new() -> Self {
+        Self {
+            writer_id: NO_WRITER_ID,
+            next_sequence: 0,
+            last_acked_sequence: -1,
+            in_flight: Vec::new(),
+            reset_batch_ids: HashSet::new(),
+        }
+    }
+}
+
+pub struct IdempotenceManager {
+    writer_id: AtomicI64,
+    bucket_entries: Mutex<HashMap<TableBucket, BucketEntry>>,
+    enabled: bool,
+    max_in_flight_requests_per_bucket: usize,
+}
+
+impl IdempotenceManager {
+    pub fn new(enabled: bool, max_in_flight_requests_per_bucket: usize) -> Self {
+        Self {
+            writer_id: AtomicI64::new(NO_WRITER_ID),
+            bucket_entries: Mutex::new(HashMap::new()),
+            enabled,
+            max_in_flight_requests_per_bucket,
+        }
+    }
+
+    pub fn is_enabled(&self) -> bool {
+        self.enabled
+    }
+
+    pub fn writer_id(&self) -> i64 {
+        self.writer_id.load(Ordering::Acquire)
+    }
+
+    pub fn has_writer_id(&self) -> bool {
+        self.writer_id() != NO_WRITER_ID
+    }
+
+    pub fn is_writer_id_valid(&self) -> bool {
+        self.has_writer_id()
+    }
+
+    pub fn in_flight_count(&self, bucket: &TableBucket) -> usize {
+        let entries = self.bucket_entries.lock();
+        entries.get(bucket).map_or(0, |e| e.in_flight.len())
+    }
+
+    pub fn can_send_more_requests(&self, bucket: &TableBucket) -> bool {
+        self.in_flight_count(bucket) < self.max_in_flight_requests_per_bucket
+    }
+
+    pub fn set_writer_id(&self, id: i64) {
+        self.writer_id.store(id, Ordering::Release);
+    }
+
+    pub fn reset_writer_id(&self) {
+        self.writer_id.store(NO_WRITER_ID, Ordering::Release);
+        self.bucket_entries.lock().clear();
+    }
+
+    pub fn next_sequence_and_increment(&self, bucket: &TableBucket) -> i32 {
+        let mut entries = self.bucket_entries.lock();
+        let entry = entries
+            .entry(bucket.clone())
+            .or_insert_with(BucketEntry::new);
+        let seq = entry.next_sequence;
+        entry.next_sequence += 1;
+        seq
+    }
+
+    pub fn add_in_flight_batch(&self, bucket: &TableBucket, batch_sequence: i32, batch_id: i64) {
+        debug_assert!(
+            batch_sequence != NO_BATCH_SEQUENCE,
+            "Can't track batch for bucket {bucket} when batch sequence is not set"
+        );
+        let mut entries = self.bucket_entries.lock();
+        let entry = entries
+            .entry(bucket.clone())
+            .or_insert_with(BucketEntry::new);
+        // Insert sorted by batch_sequence
+        let pos = entry
+            .in_flight
+            .binary_search_by_key(&batch_sequence, |b| b.batch_sequence)
+            .unwrap_or_else(|e| e);
+        entry.in_flight.insert(
+            pos,
+            InFlightBatch {
+                batch_sequence,
+                batch_id,
+            },
+        );
+    }
+
+    pub fn handle_completed_batch(
+        &self,
+        bucket: &TableBucket,
+        batch_id: i64,
+        batch_writer_id: i64,
+    ) {
+        if batch_writer_id != self.writer_id() {
+            debug!(
+                "Ignoring completed batch for bucket {bucket} with stale writer_id {batch_writer_id} (current: {})",
+                self.writer_id()
+            );
+            return;
+        }
+        let mut entries = self.bucket_entries.lock();
+        if let Some(entry) = entries.get_mut(bucket) {
+            // Find by batch_id to handle the case where the in-flight entry's sequence
+            // was adjusted by a prior handle_failed_batch call.
+            if let Some(pos) = entry.in_flight.iter().position(|b| b.batch_id == batch_id) {
+                let adjusted_seq = entry.in_flight[pos].batch_sequence;
+                entry.in_flight.remove(pos);
+                entry.reset_batch_ids.remove(&batch_id);
+                if adjusted_seq > entry.last_acked_sequence {
+                    entry.last_acked_sequence = adjusted_seq;
+                }
+            }
+        }
+    }
+
+    /// Handle a failed batch. Matches Java's `IdempotenceManager.handleFailedBatch`.
+    ///
+    /// For `OutOfOrderSequenceException` or `UnknownWriterIdException`, resets ALL
+    /// writer state (matching Java: "we cannot make any guarantees about the previously
+    /// committed message").
+    ///
+    /// For other errors, removes the specific in-flight entry by `batch_id` and
+    /// optionally adjusts downstream sequences. `adjust_sequences` should only be true
+    /// when the batch has NOT exhausted its retries.
+    pub fn handle_failed_batch(
+        &self,
+        bucket: &TableBucket,
+        batch_id: i64,
+        batch_writer_id: i64,
+        error: Option<FlussError>,
+        adjust_sequences: bool,
+    ) {
+        if batch_writer_id != self.writer_id() {
+            debug!(
+                "Ignoring failed batch for bucket {bucket} with stale writer_id {batch_writer_id} (current: {})",
+                self.writer_id()
+            );
+            return;
+        }
+
+        let mut entries = self.bucket_entries.lock();
+
+        // Matches Java: OutOfOrderSequence or UnknownWriterId → reset all writer state.
+        // Java's synchronized handleFailedBatch can call synchronized resetWriterId
+        // because Java monitors are reentrant. We inline the reset here to stay in
+        // the same lock scope.
+        if let Some(e) = error {
+            if e == FlussError::OutOfOrderSequenceException
+                || e == FlussError::UnknownWriterIdException
+            {
+                debug!(
+                    "Resetting writer ID due to {e:?} for bucket {bucket} \
+                     (writer_id={batch_writer_id}, batch_id={batch_id})"
+                );
+                self.writer_id.store(NO_WRITER_ID, Ordering::Release);
+                entries.clear();
+                return;
+            }
+        }
+        if let Some(entry) = entries.get_mut(bucket) {
+            // Find and remove by batch_id, capturing the (possibly adjusted) sequence
+            let failed_sequence = entry
+                .in_flight
+                .iter()
+                .position(|b| b.batch_id == batch_id)
+                .map(|pos| {
+                    let seq = entry.in_flight[pos].batch_sequence;
+                    entry.in_flight.remove(pos);
+                    seq
+                });
+            entry.reset_batch_ids.remove(&batch_id);
+            if adjust_sequences {
+                if let Some(failed_seq) = failed_sequence {
+                    // Decrement sequences of in-flight batches that have higher sequences
+                    for b in &mut entry.in_flight {
+                        if b.batch_sequence > failed_seq {
+                            b.batch_sequence -= 1;
+                            debug_assert!(
+                                b.batch_sequence >= 0,
+                                "Batch sequence for batch_id={} went negative: {}",
+                                b.batch_id,
+                                b.batch_sequence
+                            );
+                            entry.reset_batch_ids.insert(b.batch_id);
+                        }
+                    }
+                    // Roll back next_sequence
+                    if entry.next_sequence > failed_seq {
+                        entry.next_sequence -= 1;
+                        debug_assert!(
+                            entry.next_sequence >= 0,
+                            "Next sequence went negative: {}",
+                            entry.next_sequence
+                        );
+                    }
+                }
+            }
+        }
+    }
+
+    #[cfg(test)]
+    pub fn remove_in_flight_batch(&self, bucket: &TableBucket, batch_id: i64) {
+        let mut entries = self.bucket_entries.lock();
+        if let Some(entry) = entries.get_mut(bucket) {
+            entry.in_flight.retain(|b| b.batch_id != batch_id);
+        }
+    }
+
+    /// If the bucket's stored writer_id doesn't match the current writer_id
+    /// and there are no in-flight batches, reset the bucket entry to start
+    /// sequences from 0. Matches Java's `IdempotenceManager.maybeUpdateWriterId`.
+    pub fn maybe_update_writer_id(&self, bucket: &TableBucket) {
+        let current_writer_id = self.writer_id();
+        let mut entries = self.bucket_entries.lock();
+        let entry = entries
+            .entry(bucket.clone())
+            .or_insert_with(BucketEntry::new);
+        if entry.writer_id != current_writer_id && entry.in_flight.is_empty() {
+            entry.writer_id = current_writer_id;
+            entry.next_sequence = 0;
+            entry.last_acked_sequence = -1;
+            debug!(
+                "Writer id of bucket {bucket} set to {current_writer_id}. Reinitialize batch sequence at beginning."
+            );
+        }
+    }
+
+    /// Returns true if the given batch (identified by `batch_id`) is the first
+    /// in-flight batch for its bucket. Uses batch_id rather than batch_sequence
+    /// because sequence adjustment (`handle_failed_batch` with `adjust_sequences`)
+    /// modifies InFlightBatch sequences without updating the actual WriteBatch,
+    /// so batch_sequence on the WriteBatch may be stale.
+    pub fn is_first_in_flight_batch(&self, bucket: &TableBucket, batch_id: i64) -> bool {
+        let entries = self.bucket_entries.lock();
+        entries
+            .get(bucket)
+            .and_then(|e| e.in_flight.first())
+            .is_some_and(|b| b.batch_id == batch_id)
+    }
+
+    /// Returns the current (possibly adjusted) in-flight sequence for a batch.
+    /// Used by `re_enqueue` to sync the WriteBatch's sequence with the adjusted
+    /// InFlightBatch sequence.
+    ///
+    /// Does NOT clear `reset_batch_ids` — the reset marker must survive
+    /// re-enqueue so that `can_retry_for_error` can still see it on subsequent
+    /// retries. It is cleared only on terminal events: `handle_completed_batch`
+    /// or `handle_failed_batch`. This matches Java where `reopened` persists
+    /// across retries and is only cleared in `close()` (resource cleanup).
+    pub fn get_adjusted_sequence(&self, bucket: &TableBucket, batch_id: i64) -> Option<i32> {
+        let entries = self.bucket_entries.lock();
+        let entry = entries.get(bucket)?;
+        entry
+            .in_flight
+            .iter()
+            .find(|b| b.batch_id == batch_id)
+            .map(|b| b.batch_sequence)
+    }
+
+    pub fn is_next_sequence(&self, bucket: &TableBucket, batch_sequence: i32) -> bool {
+        let entries = self.bucket_entries.lock();
+        if let Some(entry) = entries.get(bucket) {
+            entry.last_acked_sequence + 1 == batch_sequence
+        } else {
+            // No entry means sequence 0 is expected (last_acked = -1, so -1 + 1 = 0)
+            batch_sequence == 0
+        }
+    }
+
+    pub fn can_retry_for_error(
+        &self,
+        bucket: &TableBucket,
+        batch_sequence: i32,
+        batch_id: i64,
+        error: FlussError,
+    ) -> bool {
+        if !self.has_writer_id() {
+            return false;
+        }
+        let entries = self.bucket_entries.lock();
+        let entry = entries.get(bucket);
+        let is_reset = entry.is_some_and(|e| e.reset_batch_ids.contains(&batch_id));
+
+        if error == FlussError::OutOfOrderSequenceException {
+            // Inline is_next_sequence logic to avoid double-locking
+            let is_next = entry.map_or(batch_sequence == 0, |e| {
+                e.last_acked_sequence + 1 == batch_sequence
+            });
+            return is_reset || !is_next;
+        }
+        if error == FlussError::UnknownWriterIdException {
+            return is_reset;
+        }
+        false
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    fn test_bucket(bucket_id: i32) -> TableBucket {
+        TableBucket::new(1, bucket_id)
+    }
+
+    /// Setup: 3 in-flight batches (seq 0,1,2 / batch_id 100,101,102) for bucket 0.
+    fn setup_three_in_flight() -> (IdempotenceManager, TableBucket) {
+        let mgr = IdempotenceManager::new(true, 5);
+        mgr.set_writer_id(42);
+        let b0 = test_bucket(0);
+        let _ = mgr.next_sequence_and_increment(&b0); // 0
+        let _ = mgr.next_sequence_and_increment(&b0); // 1
+        let _ = mgr.next_sequence_and_increment(&b0); // 2
+        mgr.add_in_flight_batch(&b0, 0, 100);
+        mgr.add_in_flight_batch(&b0, 1, 101);
+        mgr.add_in_flight_batch(&b0, 2, 102);
+        (mgr, b0)
+    }
+
+    #[test]
+    fn test_handle_completed_batch() {
+        let (mgr, b0) = setup_three_in_flight();
+
+        // Basic: complete middle batch, verify removal and last_acked update
+        mgr.handle_completed_batch(&b0, 101, 42);
+        {
+            let entries = mgr.bucket_entries.lock();
+            let entry = entries.get(&b0).unwrap();
+            assert_eq!(entry.last_acked_sequence, 1);
+            assert_eq!(entry.in_flight.len(), 2);
+            assert_eq!(entry.in_flight[0].batch_sequence, 0);
+            assert_eq!(entry.in_flight[1].batch_sequence, 2);
+        }
+
+        // Adjusted: fail batch_id=101 (seq=1) with adjustment, then complete
+        // batch_id=102 whose seq was adjusted from 2→1. last_acked should use
+        // the adjusted sequence; batch_id=100 (seq=0) stays in flight.
+        let (mgr, b0) = setup_three_in_flight();
+        mgr.handle_failed_batch(&b0, 101, 42, None, true);
+        mgr.handle_completed_batch(&b0, 102, 42);
+        {
+            let entries = mgr.bucket_entries.lock();
+            let entry = entries.get(&b0).unwrap();
+            assert_eq!(entry.last_acked_sequence, 1); // adjusted, not original 2
+            assert_eq!(entry.in_flight.len(), 1);
+            assert_eq!(entry.in_flight[0].batch_id, 100);
+        }
+    }
+
+    #[test]
+    fn test_handle_failed_batch() {
+        // With sequence adjustment
+        let (mgr, b0) = setup_three_in_flight();
+        mgr.handle_failed_batch(&b0, 101, 42, None, true);
+        {
+            let entries = mgr.bucket_entries.lock();
+            let entry = entries.get(&b0).unwrap();
+            assert_eq!(entry.in_flight.len(), 2);
+            assert_eq!(entry.in_flight[0].batch_sequence, 0);
+            assert_eq!(entry.in_flight[1].batch_sequence, 1); // was 2, decremented
+            assert_eq!(entry.next_sequence, 2); // was 3, decremented
+        }
+
+        // Without sequence adjustment (retries exhausted)
+        let (mgr, b0) = setup_three_in_flight();
+        mgr.handle_failed_batch(&b0, 101, 42, None, false);
+        {
+            let entries = mgr.bucket_entries.lock();
+            let entry = entries.get(&b0).unwrap();
+            assert_eq!(entry.in_flight.len(), 2);
+            assert_eq!(entry.in_flight[0].batch_sequence, 0);
+            assert_eq!(entry.in_flight[1].batch_sequence, 2); // NOT decremented
+            assert_eq!(entry.next_sequence, 3); // NOT decremented
+        }
+
+        // OOS / UnknownWriterId errors reset all writer state
+        for error in [
+            FlussError::OutOfOrderSequenceException,
+            FlussError::UnknownWriterIdException,
+        ] {
+            let (mgr, b0) = setup_three_in_flight();
+            mgr.handle_failed_batch(&b0, 100, 42, Some(error), true);
+            assert!(!mgr.has_writer_id());
+            assert!(mgr.bucket_entries.lock().is_empty());
+        }
+    }
+
+    #[test]
+    fn test_can_retry_out_of_order() {
+        let mgr = IdempotenceManager::new(true, 5);
+        let b0 = test_bucket(0);
+
+        // No writer_id → never retriable
+        assert!(!mgr.can_retry_for_error(&b0, 0, 100, FlussError::OutOfOrderSequenceException));
+
+        mgr.set_writer_id(42);
+        mgr.add_in_flight_batch(&b0, 0, 100);
+        mgr.add_in_flight_batch(&b0, 1, 101);
+
+        // seq=0 IS next expected (last_acked=-1+1=0) → genuine violation, NOT retriable
+        assert!(!mgr.can_retry_for_error(&b0, 0, 100, FlussError::OutOfOrderSequenceException));
+        // seq=1 is NOT next expected → retriable
+        assert!(mgr.can_retry_for_error(&b0, 1, 101, FlussError::OutOfOrderSequenceException));
+    }
+
+    #[test]
+    fn test_can_retry_after_sequence_reset() {
+        // OOS: batch whose seq was adjusted to match last_acked+1 is still retriable
+        let (mgr, b0) = setup_three_in_flight();
+        mgr.handle_completed_batch(&b0, 100, 42); // last_acked=0
+        mgr.handle_failed_batch(&b0, 101, 42, None, true); // batch_id=102 adjusted to seq=1
+
+        // seq=1 == last_acked(0)+1, but batch was reset → retriable
+        assert!(mgr.can_retry_for_error(&b0, 1, 102, FlussError::OutOfOrderSequenceException));
+
+        // UnknownWriterId: non-reset → NOT retriable, reset → retriable
+        let (mgr, b0) = setup_three_in_flight();
+        assert!(!mgr.can_retry_for_error(&b0, 0, 100, FlussError::UnknownWriterIdException));
+        mgr.handle_failed_batch(&b0, 101, 42, None, true); // batch_id=102 is reset
+        assert!(mgr.can_retry_for_error(&b0, 1, 102, FlussError::UnknownWriterIdException));
+    }
+
+    #[test]
+    fn test_maybe_update_writer_id() {
+        let mgr = IdempotenceManager::new(true, 5);
+        mgr.set_writer_id(42);
+        let b0 = test_bucket(0);
+
+        mgr.maybe_update_writer_id(&b0);
+        let seq = mgr.next_sequence_and_increment(&b0);
+        mgr.add_in_flight_batch(&b0, seq, 100);
+
+        // With in-flight batches: rotation is deferred
+        mgr.set_writer_id(99);
+        mgr.maybe_update_writer_id(&b0);
+        {
+            let entries = mgr.bucket_entries.lock();
+            let entry = entries.get(&b0).unwrap();
+            assert_eq!(entry.writer_id, 42); // unchanged
+            assert_eq!(entry.next_sequence, 1);
+        }
+
+        // Complete with the current writer_id (99): a completion tagged 42 is ignored as stale
+        mgr.handle_completed_batch(&b0, 100, 99);
+        mgr.maybe_update_writer_id(&b0);
+        {
+            let entries = mgr.bucket_entries.lock();
+            let entry = entries.get(&b0).unwrap();
+            assert_eq!(entry.writer_id, 99);
+            assert_eq!(entry.next_sequence, 0);
+            assert_eq!(entry.last_acked_sequence, -1);
+        }
+    }
+
+    #[test]
+    fn test_is_first_in_flight_batch() {
+        let (mgr, b0) = setup_three_in_flight();
+
+        assert!(mgr.is_first_in_flight_batch(&b0, 100));
+        assert!(!mgr.is_first_in_flight_batch(&b0, 101));
+
+        // After adjustment + completion, batch_id still identifies first correctly
+        mgr.handle_failed_batch(&b0, 101, 42, None, true); // fail batch 101 with sequence adjustment enabled
+        mgr.handle_completed_batch(&b0, 100, 42); // ack batch 100
+        assert!(mgr.is_first_in_flight_batch(&b0, 102)); // 102 is now the head
+        assert!(!mgr.is_first_in_flight_batch(&b0, 100)); // 100 is no longer in flight
+    }
+
+    #[test]
+    fn test_can_send_more_requests() {
+        let mgr = IdempotenceManager::new(true, 2); // the assertions below treat 2 as the in-flight limit
+        let b0 = test_bucket(0);
+
+        assert!(mgr.can_send_more_requests(&b0)); // no entry for the bucket yet
+
+        mgr.add_in_flight_batch(&b0, 0, 100);
+        assert!(mgr.can_send_more_requests(&b0)); // one in flight, below the limit
+
+        mgr.add_in_flight_batch(&b0, 1, 101);
+        assert!(!mgr.can_send_more_requests(&b0)); // at limit
+
+        mgr.remove_in_flight_batch(&b0, 100);
+        assert!(mgr.can_send_more_requests(&b0)); // under limit again
+    }
+
+    #[test]
+    fn test_reset_batch_ids_cleaned_on_complete() {
+        let (mgr, b0) = setup_three_in_flight();
+
+        // Fail batch_id=100 with sequence adjustment → batch_id=101 and 102 marked as reset
+        mgr.handle_failed_batch(&b0, 100, 42, None, true);
+        {
+            let entries = mgr.bucket_entries.lock();
+            let entry = entries.get(&b0).unwrap();
+            assert!(entry.reset_batch_ids.contains(&101));
+            assert!(entry.reset_batch_ids.contains(&102));
+        }
+
+        // Complete batch_id=101 → only that id is cleaned from the reset set
+        mgr.handle_completed_batch(&b0, 101, 42);
+        {
+            let entries = mgr.bucket_entries.lock();
+            let entry = entries.get(&b0).unwrap();
+            assert!(!entry.reset_batch_ids.contains(&101));
+            assert!(entry.reset_batch_ids.contains(&102)); // still there
+        }
+    }
+
+    #[test]
+    fn test_get_adjusted_sequence() {
+        let (mgr, b0) = setup_three_in_flight();
+
+        // No entry for unknown bucket
+        assert_eq!(mgr.get_adjusted_sequence(&test_bucket(9), 100), None);
+
+        // Before adjustment: returns original sequences
+        assert_eq!(mgr.get_adjusted_sequence(&b0, 101), Some(1));
+        assert_eq!(mgr.get_adjusted_sequence(&b0, 999), None); // unknown batch_id in a known bucket
+
+        // After adjustment: returns adjusted sequences
+        mgr.handle_failed_batch(&b0, 100, 42, None, true);
+        assert_eq!(mgr.get_adjusted_sequence(&b0, 100), None); // removed
+        assert_eq!(mgr.get_adjusted_sequence(&b0, 101), Some(0)); // was 1
+        assert_eq!(mgr.get_adjusted_sequence(&b0, 102), Some(1)); // was 2
+
+        // The reset flag is still set after the get_adjusted_sequence calls above
+        // (unlike the old take_ variant). This matches Java where `reopened` persists across retries.
+        {
+            let entries = mgr.bucket_entries.lock();
+            let entry = entries.get(&b0).unwrap();
+            assert!(entry.reset_batch_ids.contains(&101));
+            assert!(entry.reset_batch_ids.contains(&102));
+        }
+    }
+
+    // --- Scenario tests ---
+    // Simulate Sender-level orchestration on IdempotenceManager.
+    // Each test mirrors a Java SenderTest integration test, exercising the same
+    // state transitions that Sender.handle_write_batch_error / complete_batch make.
+    //
+    // Convention: retriable failures make NO IdempotenceManager call (batch stays
+    // in-flight, Sender re-enqueues via accumulator). Non-retriable failures call
+    // handle_failed_batch. Successes call handle_completed_batch.
+
+    #[test]
+    fn scenario_multiple_inflight_retried_in_order() {
+        // Java: testIdempotenceWithMultipleInflightBatchesRetriedInOrder
+        // 3 batches in-flight, batch 0 times out, batches 1+2 get OOS.
+        // All are retriable and must be retried one-at-a-time in sequence order.
+        let (mgr, b0) = setup_three_in_flight();
+
+        // Batch 0 (seq=0) times out → retriable, stays in in-flight (no IdempotenceManager call)
+        // Batch 1 (seq=1) OOS → retriable (not next expected seq)
+        assert!(mgr.can_retry_for_error(&b0, 1, 101, FlussError::OutOfOrderSequenceException));
+        // Batch 2 (seq=2) OOS → retriable
+        assert!(mgr.can_retry_for_error(&b0, 2, 102, FlussError::OutOfOrderSequenceException));
+
+        // Retry phase: only first-in-flight batch should be drained
+        assert!(mgr.is_first_in_flight_batch(&b0, 100));
+        assert!(!mgr.is_first_in_flight_batch(&b0, 101));
+
+        // Retry batch 0 succeeds → last_acked=0
+        mgr.handle_completed_batch(&b0, 100, 42);
+        assert_eq!(last_acked(&mgr, &b0), 0);
+
+        // Batch 1 is now first, retry succeeds → last_acked=1
+        assert!(mgr.is_first_in_flight_batch(&b0, 101));
+        mgr.handle_completed_batch(&b0, 101, 42);
+        assert_eq!(last_acked(&mgr, &b0), 1);
+
+        // Batch 2 is now first, retry succeeds → last_acked=2
+        assert!(mgr.is_first_in_flight_batch(&b0, 102));
+        mgr.handle_completed_batch(&b0, 102, 42);
+        assert_eq!(last_acked(&mgr, &b0), 2);
+    }
+
+    #[test]
+    fn scenario_out_of_order_responses() {
+        // Java: testCorrectHandlingOfOutOfOrderResponses
+        // Server responds to batch 1 (OOS) before batch 0 (timeout).
+        // Both re-enqueued, retried in order.
+        let mgr = IdempotenceManager::new(true, 5);
+        mgr.set_writer_id(42);
+        let b0 = test_bucket(0);
+        let _ = mgr.next_sequence_and_increment(&b0); // advance the counter for batch 100 (seq 0)
+        let _ = mgr.next_sequence_and_increment(&b0); // advance the counter for batch 101 (seq 1)
+        mgr.add_in_flight_batch(&b0, 0, 100);
+        mgr.add_in_flight_batch(&b0, 1, 101);
+
+        // Batch 1 response arrives first: OOS → retriable (seq 1 ≠ next expected 0)
+        assert!(mgr.can_retry_for_error(&b0, 1, 101, FlussError::OutOfOrderSequenceException));
+        // Batch 0 response: timeout → retriable (no IdempotenceManager call)
+
+        // Retry: batch 0 must go first
+        assert!(mgr.is_first_in_flight_batch(&b0, 100));
+        mgr.handle_completed_batch(&b0, 100, 42);
+        assert_eq!(last_acked(&mgr, &b0), 0);
+
+        // Then batch 1
+        assert!(mgr.is_first_in_flight_batch(&b0, 101));
+        mgr.handle_completed_batch(&b0, 101, 42);
+        assert_eq!(last_acked(&mgr, &b0), 1);
+    }
+
+    #[test]
+    fn scenario_second_batch_succeeds_first() {
+        // Java: testCorrectHandlingOfOutOfOrderResponsesWhenSecondSucceeds
+        //       + testCorrectHandlingOfDuplicateSequenceError (same at this level)
+        // Batch 1 succeeds before batch 0. last_acked jumps ahead, then batch 0
+        // completes without regressing last_acked.
+        let mgr = IdempotenceManager::new(true, 5);
+        mgr.set_writer_id(42);
+        let b0 = test_bucket(0);
+        let _ = mgr.next_sequence_and_increment(&b0);
+        let _ = mgr.next_sequence_and_increment(&b0);
+        mgr.add_in_flight_batch(&b0, 0, 100);
+        mgr.add_in_flight_batch(&b0, 1, 101);
+
+        // Batch 1 succeeds first → last_acked jumps to 1
+        mgr.handle_completed_batch(&b0, 101, 42);
+        assert_eq!(last_acked(&mgr, &b0), 1);
+
+        // Batch 0 timeout → retriable → re-enqueued → retry succeeds
+        mgr.handle_completed_batch(&b0, 100, 42);
+        // last_acked stays 1 (0 < 1, higher wins), and no batch remains in flight
+        assert_eq!(last_acked(&mgr, &b0), 1);
+        assert!(
+            mgr.bucket_entries
+                .lock()
+                .get(&b0)
+                .unwrap()
+                .in_flight
+                .is_empty()
+        );
+    }
+
+    #[test]
+    fn scenario_unknown_writer_id_resets_and_restarts() {
+        // Java: testRetryAfterResettingInFlightBatchSequence
+        // Batch 0 times out (retriable), batch 1 gets UnknownWriterId (non-retriable).
+        // UnknownWriterId resets all state. After new writer ID, sequences restart at 0.
+        let mgr = IdempotenceManager::new(true, 5);
+        mgr.set_writer_id(42);
+        let b0 = test_bucket(0);
+        let _ = mgr.next_sequence_and_increment(&b0);
+        let _ = mgr.next_sequence_and_increment(&b0);
+        mgr.add_in_flight_batch(&b0, 0, 100);
+        mgr.add_in_flight_batch(&b0, 1, 101);
+
+        // Batch 0 times out → retriable (stays in in-flight)
+        // Batch 1 UnknownWriterId → NOT retriable (non-reset batch)
+        assert!(!mgr.can_retry_for_error(&b0, 1, 101, FlussError::UnknownWriterIdException));
+
+        // Sender calls fail_batch → handle_failed_batch with error → full reset
+        mgr.handle_failed_batch(
+            &b0,
+            101,
+            42,
+            Some(FlussError::UnknownWriterIdException),
+            true,
+        );
+        assert!(!mgr.has_writer_id()); // writer id was cleared
+        assert!(mgr.bucket_entries.lock().is_empty()); // every per-bucket entry was dropped, including batch 0
+
+        // New writer ID allocated, sequences restart at 0
+        mgr.set_writer_id(99);
+        assert_eq!(mgr.next_sequence_and_increment(&b0), 0);
+    }
+
+    fn last_acked(mgr: &IdempotenceManager, bucket: &TableBucket) -> i32 { // test helper
+        mgr.bucket_entries
+            .lock()
+            .get(bucket)
+            .unwrap() // panics if the bucket has no entry
+            .last_acked_sequence
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index 2c848d3555..bc324e1827 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -17,6 +17,7 @@
 
 mod accumulator;
 mod batch;
+mod idempotence;
 
 use crate::client::broadcast::{self as client_broadcast, BatchWriteResult, BroadcastOnceReceiver};
 use crate::error::Error;
@@ -38,8 +39,9 @@ mod sender;
 mod write_format;
 mod writer_client;
 
+pub(crate) use idempotence::IdempotenceManager;
 pub use write_format::WriteFormat;
-pub use writer_client::WriterClient;
+pub(crate) use writer_client::WriterClient;
 
 #[allow(dead_code)]
 pub struct WriteRecord<'a> {
@@ -59,6 +61,22 @@ impl<'a> WriteRecord<'a> {
     pub fn physical_table_path(&self) -> &Arc<PhysicalTablePath> {
         &self.physical_table_path
     }
+
+    /// Minimum batch capacity needed to fit this record. For KV records this is
+    /// `RECORD_BATCH_HEADER_SIZE` plus `KvRecord::size_of(key, row bytes)`; log records report 0.
+    /// Used to size memory reservations and KV write limits so that oversized records don't panic on append.
+    pub fn estimated_record_size(&self) -> usize {
+        match &self.record {
+            Record::Kv(kv) => {
+                let record_size = crate::record::kv::KvRecord::size_of(
+                    &kv.key,
+                    kv.row_bytes.as_ref().map(|rb| rb.as_slice()), // None when the record carries no row bytes
+                );
+                crate::record::kv::RECORD_BATCH_HEADER_SIZE + record_size
+            }
+            Record::Log(_) => 0, // Arrow batches use record count, not byte size
+        }
+    }
 }
 
 pub enum Record<'a> {
@@ -175,6 +193,11 @@ impl ResultHandle {
         ResultHandle { receiver }
     }
 
+    /// Force-complete with an error if not already completed (delegates to `receiver.fail`).
+    pub(crate) fn fail(&self, error: client_broadcast::Error) {
+        self.receiver.fail(error);
+    }
+
     pub async fn wait(&self) -> Result<BatchWriteResult, Error> {
         self.receiver
             .receive()
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index ac3836aa38..b526e1a96e 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -17,26 +17,43 @@
 
 use crate::client::broadcast;
 use crate::client::metadata::Metadata;
+use crate::client::write::IdempotenceManager;
 use crate::client::write::batch::WriteBatch;
 use crate::client::{ReadyWriteBatch, RecordAccumulator};
 use crate::error::Error::UnexpectedError;
 use crate::error::{FlussError, Result};
 use crate::metadata::{PhysicalTablePath, TableBucket, TablePath};
 use crate::proto::{
-    PbProduceLogRespForBucket, PbPutKvRespForBucket, ProduceLogResponse, PutKvResponse,
+    PbProduceLogRespForBucket, PbPutKvRespForBucket, PbTablePath, ProduceLogResponse, PutKvResponse,
 };
+use crate::record::{NO_BATCH_SEQUENCE, NO_WRITER_ID};
 use crate::rpc::ServerConnection;
-use crate::rpc::message::{ProduceLogRequest, PutKvRequest};
+use crate::rpc::message::{InitWriterRequest, ProduceLogRequest, PutKvRequest};
 use crate::{PartitionId, TableId};
+use futures::StreamExt;
+use futures::stream::FuturesUnordered;
 use log::{debug, warn};
 use parking_lot::Mutex;
 use std::collections::{HashMap, HashSet};
+use std::future::Future;
+use std::pin::Pin;
 use std::sync::Arc;
+use std::sync::atomic::{AtomicBool, Ordering};
 use std::time::Duration;
+use tokio::sync::mpsc;
+
+type SendFuture<'a> = Pin<Box<dyn Future<Output = Result<()>> + Send + 'a>>; // boxed, pinned future yielding Result<()>
+
+/// Result of a synchronous drain: send futures, optional delay (ms), and unknown leader tables.
+type DrainResult<'a> = (
+    Vec<SendFuture<'a>>, // one send future per leader that had batches drained
+    Option<u64>, // next ready-check delay in ms; Some only when no node was ready
+    HashSet<Arc<PhysicalTablePath>>, // tables whose leader is currently unknown
+);
 
 #[allow(dead_code)]
 pub struct Sender {
-    running: bool,
+    running: AtomicBool,
     metadata: Arc<Metadata>,
     accumulator: Arc<RecordAccumulator>,
     in_flight_batches: Mutex<HashMap<TableBucket, Vec<i64>>>,
@@ -44,6 +61,7 @@ pub struct Sender {
     ack: i16,
     max_request_timeout_ms: i32,
     retries: i32,
+    idempotence_manager: Arc<IdempotenceManager>,
 }
 
 impl Sender {
@@ -54,9 +72,10 @@ impl Sender {
         max_request_timeout_ms: i32,
         ack: i16,
         retries: i32,
+        idempotence_manager: Arc<IdempotenceManager>,
     ) -> Self {
         Self {
-            running: true,
+            running: AtomicBool::new(true),
             metadata,
             accumulator,
             in_flight_batches: Default::default(),
@@ -64,60 +83,139 @@ impl Sender {
             ack,
             max_request_timeout_ms,
             retries,
+            idempotence_manager,
         }
     }
 
-    pub async fn run(&self) -> Result<()> {
+    const WRITER_ID_RETRY_TIMES: u32 = 3; // retries allowed after the initial attempt (4 attempts in total)
+    const WRITER_ID_RETRY_INTERVAL_MS: u64 = 100; // backoff base: delay = this * 2^retry_count, i.e. 200/400/800 ms
+
+    async fn maybe_wait_for_writer_id(&self) -> Result<()> {
+        if !self.idempotence_manager.is_enabled() || self.idempotence_manager.has_writer_id() {
+            return Ok(());
+        }
+        let mut retry_count = 0u32;
         loop {
-            if !self.running {
-                return Ok(());
+            match self.try_init_writer_id().await {
+                Ok(()) => return Ok(()),
+                Err(e) => {
+                    // Authorization errors are not transient — fail immediately.
+                    if e.api_error() == Some(FlussError::AuthorizationException) {
+                        return Err(e);
+                    }
+                    if retry_count >= Self::WRITER_ID_RETRY_TIMES {
+                        return Err(e);
+                    }
+                    if e.api_error().is_some_and(Self::is_invalid_metadata_error) {
+                        let physical_paths = self.accumulator.get_physical_table_paths_in_batches();
+                        let physical_refs: HashSet<&Arc<PhysicalTablePath>> =
+                            physical_paths.iter().collect();
+                        if let Err(meta_err) = self
+                            .metadata
+                            .update_tables_metadata(&HashSet::new(), &physical_refs, vec![])
+                            .await
+                        {
+                            warn!("Failed to refresh metadata after writer ID error: {meta_err}");
+                        }
+                    }
+                    retry_count += 1;
+                    let delay_ms = Self::WRITER_ID_RETRY_INTERVAL_MS * 2u64.pow(retry_count);
+                    warn!(
+                        "Failed to allocate writer ID (attempt {retry_count}/{}), retrying in {delay_ms}ms: {e}",
+                        Self::WRITER_ID_RETRY_TIMES,
+                    );
+                    tokio::time::sleep(Duration::from_millis(delay_ms)).await;
+                }
             }
-            self.run_once().await?;
         }
     }
 
-    async fn run_once(&self) -> Result<()> {
+    async fn try_init_writer_id(&self) -> Result<()> {
+        // Deduplicate by (database, table) since multiple physical paths (partitions)
+        // may share the same table. Matches Java's Set<TablePath> dedup.
+        let mut seen = HashSet::new();
+        let table_paths: Vec<PbTablePath> = self
+            .accumulator
+            .get_physical_table_paths_in_batches()
+            .iter()
+            .filter_map(|path| {
+                let key = (
+                    path.get_database_name().to_string(),
+                    path.get_table_name().to_string(),
+                );
+                if seen.insert(key.clone()) {
+                    Some(PbTablePath {
+                        database_name: key.0,
+                        table_name: key.1,
+                    })
+                } else {
+                    None
+                }
+            })
+            .collect();
+        if table_paths.is_empty() {
+            debug!("No table paths in batches, skipping writer ID allocation");
+            return Ok(());
+        }
         let cluster = self.metadata.get_cluster();
-        let ready_check_result = self.accumulator.ready(&cluster)?;
+        let server = cluster.get_one_available_server().ok_or(UnexpectedError {
+            message: "No tablet server available to allocate writer ID".to_string(),
+            source: None,
+        })?;
+        let connection = self.metadata.get_connection(server).await?;
+        let response = connection
+            .request(InitWriterRequest::new(table_paths))
+            .await?;
+        self.idempotence_manager.set_writer_id(response.writer_id);
+        debug!(
+            "Allocated writer ID {} for idempotent writes",
+            response.writer_id
+        );
+        Ok(())
+    }
 
-        // Update metadata if needed
-        if !ready_check_result.unknown_leader_tables.is_empty() {
-            let mut table_paths: HashSet<&TablePath> = HashSet::new();
-            let mut physical_table_paths: HashSet<&Arc<PhysicalTablePath>> = HashSet::new();
+    fn maybe_abort_batches(&self, error: &crate::error::Error) { // aborts pending batches, if any, with a client error
+        if self.accumulator.has_incomplete() {
+            warn!("Aborting write batches due to fatal error: {error}");
+            self.accumulator.abort_batches(broadcast::Error::Client {
+                message: format!("Writer ID allocation failed: {error}"), // NOTE(review): wording assumes the writer-ID failure path is the only caller
+            });
+        }
+    }
 
-            for unknown_paths in ready_check_result.unknown_leader_tables.iter() {
-                if unknown_paths.get_partition_name().is_some() {
-                    physical_table_paths.insert(unknown_paths);
-                } else {
-                    table_paths.insert(unknown_paths.get_table_path());
-                }
+    /// Sequential init + drain + metadata refresh. Used by `run_once` (shutdown)
+    /// where blocking is acceptable. Returns the send futures and an optional delay in ms.
+    async fn prepare_sends(&self) -> Result<(Vec<SendFuture<'_>>, Option<u64>)> {
+        if let Err(e) = self.maybe_wait_for_writer_id().await {
+            warn!("Failed to allocate writer ID after retries: {e}");
+            self.maybe_abort_batches(&e);
+            return Ok((vec![], None)); // the error is not propagated: nothing to send, no delay
+        }
+        let (futures, delay, unknown_leaders) = self.drain_ready_sends()?;
+        if !unknown_leaders.is_empty() {
+            if let Err(e) = self.refresh_unknown_leaders(&unknown_leaders).await {
+                warn!("Metadata refresh for unknown leaders failed: {e}"); // best-effort: the drained sends are still returned
             }
+        }
+        Ok((futures, delay))
+    }
 
-            if let Err(e) = self
-                .metadata
-                .update_tables_metadata(&table_paths, &physical_table_paths, vec![])
-                .await
-            {
-                match e.api_error() {
-                    Some(FlussError::PartitionNotExists) => {
-                        warn!("Partition does not exist during metadata update, continuing: {e}");
-                    }
-                    _ => return Err(e),
-                }
-            }
+    /// Fully synchronous drain: `ready()` → `drain()` → build send futures.
+    /// No async work — safe to call on the hot path without starving
+    /// `pending.next()`. Returns unknown leader tables so the caller can
+    /// schedule a concurrent metadata refresh.
+    fn drain_ready_sends(&self) -> Result<DrainResult<'_>> {
+        let cluster = self.metadata.get_cluster();
+        let ready_check_result = self.accumulator.ready(&cluster)?;
 
-            debug!(
-                "Client update metadata due to unknown leader tables from the batched records: {:?}",
-                ready_check_result.unknown_leader_tables
-            );
-        }
+        let unknown_leaders = ready_check_result.unknown_leader_tables;
 
         if ready_check_result.ready_nodes.is_empty() {
-            tokio::time::sleep(Duration::from_millis(
-                ready_check_result.next_ready_check_delay_ms as u64,
-            ))
-            .await;
-            return Ok(());
+            return Ok((
+                vec![],
+                Some(ready_check_result.next_ready_check_delay_ms as u64),
+                unknown_leaders,
+            ));
         }
 
         let batches = self.accumulator.drain(
@@ -126,11 +224,67 @@ impl Sender {
             self.max_request_size,
         )?;
 
+        let mut futures = Vec::new();
         if !batches.is_empty() {
             self.add_to_inflight_batches(&batches);
-            self.send_write_requests(batches).await?;
+            for (leader_id, leader_batches) in batches {
+                futures.push(
+                    Box::pin(self.send_write_request(leader_id, self.ack, leader_batches))
+                        as SendFuture<'_>,
+                );
+            }
         }
 
+        Ok((futures, None, unknown_leaders))
+    }
+
+    /// Refresh metadata for buckets with unknown leaders. Meant to run as a concurrent
+    /// maintenance task off the response-processing hot path; `prepare_sends` awaits it inline.
+    async fn refresh_unknown_leaders(
+        &self,
+        unknown_leaders: &HashSet<Arc<PhysicalTablePath>>,
+    ) -> Result<()> {
+        let mut table_paths: HashSet<&TablePath> = HashSet::new();
+        let mut physical_table_paths: HashSet<&Arc<PhysicalTablePath>> = HashSet::new();
+
+        for path in unknown_leaders {
+            if path.get_partition_name().is_some() {
+                physical_table_paths.insert(path); // has a partition name: refresh by physical path
+            } else {
+                table_paths.insert(path.get_table_path()); // no partition name: refresh by table path
+            }
+        }
+
+        if let Err(e) = self
+            .metadata
+            .update_tables_metadata(&table_paths, &physical_table_paths, vec![])
+            .await
+        {
+            match e.api_error() {
+                Some(FlussError::PartitionNotExists) => {
+                    warn!("Partition does not exist during metadata update, continuing: {e}"); // tolerated: falls through to Ok(())
+                }
+                _ => return Err(e),
+            }
+        }
+
+        debug!(
+            "Updated metadata for unknown leader tables: {:?}",
+            unknown_leaders
+        );
+        Ok(())
+    }
+
+    /// Blocking version of drain + send, used during shutdown drain: awaits every send before returning.
+    async fn run_once(&self) -> Result<()> {
+        let (futures, delay) = self.prepare_sends().await?;
+        if let Some(ms) = delay {
+            tokio::time::sleep(Duration::from_millis(ms)).await; // no node was ready: wait out the ready-check delay
+            return Ok(());
+        }
+        for result in futures::future::join_all(futures).await {
+            result?; // all sends have finished by now; the first error in order is returned
+        }
         Ok(())
     }
 
@@ -146,17 +300,6 @@ impl Sender {
         }
     }
 
-    async fn send_write_requests(
-        &self,
-        collated: HashMap<i32, Vec<ReadyWriteBatch>>,
-    ) -> Result<()> {
-        for (leader_id, batches) in collated {
-            self.send_write_request(leader_id, self.ack, batches)
-                .await?;
-        }
-        Ok(())
-    }
-
     async fn send_write_request(
         &self,
         destination: i32,
@@ -399,11 +542,40 @@ impl Sender {
         Ok(())
     }
 
+    // TODO: Java has a second overload `completeBatch(batch, bucket, logEndOffset)` used for
+    // KV responses. When callers need write offset info, change BatchWriteResult to carry
+    // optional offset metadata and plumb it through BroadcastOnce → ResultHandle → WriteResultFuture.
     fn complete_batch(&self, ready_write_batch: ReadyWriteBatch) {
+        if self.idempotence_manager.is_enabled()
+            && ready_write_batch.write_batch.batch_sequence() != NO_BATCH_SEQUENCE
+        {
+            self.idempotence_manager.handle_completed_batch(
+                &ready_write_batch.table_bucket,
+                ready_write_batch.write_batch.batch_id(),
+                ready_write_batch.write_batch.writer_id(),
+            );
+        } // batches without a sequence skip the idempotence bookkeeping; state is updated before finish_batch
         self.finish_batch(ready_write_batch, Ok(()));
     }
 
-    fn fail_batch(&self, ready_write_batch: ReadyWriteBatch, error: broadcast::Error) {
+    fn fail_batch(
+        &self,
+        ready_write_batch: ReadyWriteBatch,
+        error: broadcast::Error,
+        fluss_error: Option<FlussError>,
+        adjust_sequences: bool,
+    ) {
+        if self.idempotence_manager.is_enabled()
+            && ready_write_batch.write_batch.batch_sequence() != NO_BATCH_SEQUENCE
+        {
+            self.idempotence_manager.handle_failed_batch(
+                &ready_write_batch.table_bucket,
+                ready_write_batch.write_batch.batch_id(),
+                ready_write_batch.write_batch.writer_id(),
+                fluss_error,
+                adjust_sequences,
+            );
+        }
         self.finish_batch(ready_write_batch, Err(error));
     }
 
@@ -444,11 +616,15 @@ impl Sender {
         message: String,
     ) -> Result<()> {
         for batch in batches {
+            // Local errors (e.g. build failure) — server never saw the batch,
+            // so it's always safe to adjust sequences.
             self.fail_batch(
                 batch,
                 broadcast::Error::Client {
                     message: message.clone(),
                 },
+                None,
+                true,
             );
         }
         Ok(())
@@ -467,6 +643,39 @@ impl Sender {
                 physical_table_path.as_ref(),
                 ready_write_batch.table_bucket.bucket_id()
             );
+
+            // If idempotence is enabled, only retry if the current writer ID still matches
+            // the batch's writer ID. If the writer ID was reset (e.g., by another bucket's
+            // error), fail the batch instead of retrying with stale state.
+            if self.idempotence_manager.is_enabled() {
+                let batch_writer_id = ready_write_batch.write_batch.writer_id();
+                if batch_writer_id != NO_WRITER_ID
+                    && self.idempotence_manager.writer_id() != batch_writer_id
+                {
+                    warn!(
+                        "Writer ID changed from {} to {} since batch was sent, failing instead of retrying",
+                        batch_writer_id,
+                        self.idempotence_manager.writer_id()
+                    );
+                    self.fail_batch(
+                        ready_write_batch,
+                        broadcast::Error::WriteFailed {
+                            code: FlussError::UnknownWriterIdException.code(),
+                            message: format!(
+                                "Attempted to retry sending a batch but the writer id has changed from {} to {}. This batch will be dropped.",
+                                batch_writer_id,
+                                self.idempotence_manager.writer_id()
+                            ),
+                        },
+                        Some(FlussError::UnknownWriterIdException),
+                        false,
+                    );
+                    return Ok(
+                        Self::is_invalid_metadata_error(error).then_some(physical_table_path)
+                    );
+                }
+            }
+
             self.re_enqueue_batch(ready_write_batch);
             return Ok(Self::is_invalid_metadata_error(error).then_some(physical_table_path));
         }
@@ -481,18 +690,25 @@ impl Sender {
             return Ok(None);
         }
 
+        // Generic error path. handle_failed_batch will detect OutOfOrderSequence /
+        // UnknownWriterId and reset all writer state internally (matching Java).
+        // For other errors, only adjust sequences if the batch didn't exhaust its retries.
+        let can_adjust = ready_write_batch.write_batch.attempts() < self.retries;
         self.fail_batch(
             ready_write_batch,
             broadcast::Error::WriteFailed {
                 code: error.code(),
                 message,
             },
+            Some(error),
+            can_adjust,
         );
         Ok(Self::is_invalid_metadata_error(error).then_some(physical_table_path))
     }
 
     fn re_enqueue_batch(&self, ready_write_batch: ReadyWriteBatch) {
         self.remove_from_inflight_batches(&ready_write_batch);
+        // TODO: add retry metrics (Java: writerMetricGroup.recordsRetryTotal().inc(recordCount))
         self.accumulator.re_enqueue(ready_write_batch);
     }
 
@@ -508,9 +724,25 @@ impl Sender {
     }
 
     fn can_retry(&self, ready_write_batch: &ReadyWriteBatch, error: FlussError) -> bool {
-        ready_write_batch.write_batch.attempts() < self.retries
-            && !ready_write_batch.write_batch.is_done()
-            && Self::is_retriable_error(error)
+        if ready_write_batch.write_batch.attempts() >= self.retries
+            || ready_write_batch.write_batch.is_done()
+        {
+            return false;
+        }
+        if Self::is_retriable_error(error) {
+            return true;
+        }
+        // Idempotent-specific retry logic
+        let seq = ready_write_batch.write_batch.batch_sequence();
+        if self.idempotence_manager.is_enabled() && seq != NO_BATCH_SEQUENCE {
+            return self.idempotence_manager.can_retry_for_error(
+                &ready_write_batch.table_bucket,
+                seq,
+                ready_write_batch.write_batch.batch_id(),
+                error,
+            );
+        }
+        false
     }
 
     async fn update_metadata_if_needed(
@@ -561,8 +793,145 @@ impl Sender {
         )
     }
 
-    pub async fn close(&mut self) {
-        self.running = false;
+    /// Event-loop sender: drain batches and fire RPCs into a `FuturesUnordered`,
+    /// then process responses as they arrive. This interleaves drain cycles with
+    /// response handling — when a fast leader responds, we immediately drain and
+    /// send more batches for its buckets while slow leaders are still in-flight.
+    ///
+    /// Slow work (writer-ID init with retry backoff, metadata refresh for
+    /// unknown leaders) runs as concurrent maintenance tasks so it never blocks
+    /// `pending.next()`. The drain path (`drain_ready_sends`) is fully
+    /// synchronous — no `.await` on the hot path. Without this separation,
+    /// backoff sleeps during writer-ID init could stall response processing
+    /// and cause severe backpressure when the accumulator memory budget is full
+    /// (responses not polled → memory not freed → writers block).
+    /// The loop body is a single `tokio::select!` driven by a one-shot `need_drain` tick.
+    ///
+    /// Invariants:
+    /// - `need_drain` is a one-shot "try a drain tick ASAP" flag.
+    /// - Each iteration either performs a sync drain tick (if flagged) or blocks
+    ///   in a single `tokio::select!`.
+    /// - `accumulator.notified()` is always listened to (producer wakeups).
+    /// - The idle timer is only armed when truly idle (no futures in any pool).
+    /// - When writer_id isn't ready, a drain tick is a no-op but the loop stays
+    ///   responsive (notified/init/meta can still wake it).
+    pub async fn run_with_shutdown(&self, mut shutdown_rx: mpsc::Receiver<()>) -> Result<()> {
+        let mut pending: FuturesUnordered<SendFuture<'_>> = FuturesUnordered::new();
+        let mut init_futs: FuturesUnordered<SendFuture<'_>> = FuturesUnordered::new();
+        let mut meta_futs: FuturesUnordered<SendFuture<'_>> = FuturesUnordered::new();
+        let mut pending_unknown: HashSet<Arc<PhysicalTablePath>> = HashSet::new();
+
+        let mut need_drain = true; // drain on first iteration to pick up any pre-existing batches
+        let mut next_delay_ms: u64 = 1;
+
+        loop {
+            // Spawn writer-ID init task if needed and not already running.
+            if init_futs.is_empty()
+                && self.idempotence_manager.is_enabled()
+                && !self.idempotence_manager.has_writer_id()
+                && self.accumulator.has_undrained()
+            {
+                init_futs.push(Box::pin(self.maybe_wait_for_writer_id()));
+            }
+
+            // Spawn metadata refresh if we have accumulated unknown leaders
+            // and no refresh is currently running.
+            if !pending_unknown.is_empty() && meta_futs.is_empty() {
+                let leaders = std::mem::take(&mut pending_unknown);
+                meta_futs.push(Box::pin(async move {
+                    self.refresh_unknown_leaders(&leaders).await
+                }));
+            }
+
+            // Drain tick: synchronous, never blocks response processing.
+            // Clear unconditionally — "need_drain" means "try", not "must succeed".
+            if need_drain {
+                need_drain = false;
+
+                if !self.idempotence_manager.is_enabled()
+                    || self.idempotence_manager.has_writer_id()
+                {
+                    match self.drain_ready_sends() {
+                        Ok((futures, delay, unknown_leaders)) => {
+                            if let Some(d) = delay {
+                                next_delay_ms = d;
+                            }
+                            pending_unknown.extend(unknown_leaders);
+                            for f in futures {
+                                pending.push(f);
+                            }
+                        }
+                        Err(e) => {
+                            warn!("Error in drain cycle: {e}");
+                        }
+                    }
+                }
+            }
+
+            let truly_idle = pending.is_empty() && init_futs.is_empty() && meta_futs.is_empty();
+            debug_assert!(next_delay_ms >= 1);
+
+            // One select to rule them all.
+            tokio::select! {
+                _ = shutdown_rx.recv() => break,
+
+                // Always listen for producer wakeups.
+                _ = self.accumulator.notified() => {
+                    need_drain = true;
+                }
+
+                // Process in-flight send responses.
+                Some(result) = pending.next(), if !pending.is_empty() => {
+                    if let Err(e) = result {
+                        warn!("Uncaught error in send request, continuing: {e}");
+                    }
+                    need_drain = true;
+                }
+
+                // Writer-ID init completed.
+                Some(result) = init_futs.next(), if !init_futs.is_empty() => {
+                    match result {
+                        Ok(()) => need_drain = true,
+                        Err(e) => {
+                            warn!("Failed to allocate writer ID after retries: {e}");
+                            self.maybe_abort_batches(&e);
+                        }
+                    }
+                }
+
+                // Metadata refresh completed — new leaders may now be known.
+                Some(result) = meta_futs.next(), if !meta_futs.is_empty() => {
+                    if let Err(e) = result {
+                        warn!("Metadata refresh for unknown leaders failed: {e}");
+                    }
+                    need_drain = true;
+                }
+
+                // Idle timer: batch timeout / linger expiry.
+                _ = tokio::time::sleep(Duration::from_millis(next_delay_ms)), if truly_idle => {
+                    need_drain = true;
+                }
+            }
+        }
+
+        // Graceful shutdown: drain remaining batches, then wait for all
+        // in-flight sends to complete.
+        while self.accumulator.has_undrained() {
+            if let Err(e) = self.run_once().await {
+                warn!("Error during shutdown drain, continuing: {e}");
+            }
+        }
+        while let Some(result) = pending.next().await {
+            if let Err(e) = result {
+                warn!("Error in send during shutdown, continuing: {e}");
+            }
+        }
+        self.close();
+        Ok(())
+    }
+
+    pub fn close(&self) {
+        self.running.store(false, Ordering::Relaxed);
     }
 }
 
@@ -643,6 +1012,14 @@ mod tests {
     use crate::test_utils::{build_cluster_arc, build_table_info};
     use std::collections::{HashMap, HashSet};
 
+    fn disabled_idempotence() -> Arc<IdempotenceManager> {
+        Arc::new(IdempotenceManager::new(false, 5))
+    }
+
+    fn enabled_idempotence() -> Arc<IdempotenceManager> {
+        Arc::new(IdempotenceManager::new(true, 5))
+    }
+
     fn build_ready_batch(
         accumulator: &RecordAccumulator,
         cluster: Arc<Cluster>,
@@ -669,8 +1046,20 @@ mod tests {
         let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
         let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
         let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
-        let accumulator = Arc::new(RecordAccumulator::new(Config::default()));
-        let sender = Sender::new(metadata, accumulator.clone(), 1024 * 1024, 1000, 1, 1);
+        let idempotence = disabled_idempotence();
+        let accumulator = Arc::new(RecordAccumulator::new(
+            Config::default(),
+            Arc::clone(&idempotence),
+        ));
+        let sender = Sender::new(
+            metadata,
+            accumulator.clone(),
+            1024 * 1024,
+            1000,
+            1,
+            1,
+            idempotence,
+        );
 
         let (batch, _handle) =
             build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path.clone())?;
@@ -699,8 +1088,20 @@ mod tests {
         let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
         let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
         let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
-        let accumulator = Arc::new(RecordAccumulator::new(Config::default()));
-        let sender = Sender::new(metadata, accumulator.clone(), 1024 * 1024, 1000, 1, 0);
+        let idempotence = disabled_idempotence();
+        let accumulator = Arc::new(RecordAccumulator::new(
+            Config::default(),
+            Arc::clone(&idempotence),
+        ));
+        let sender = Sender::new(
+            metadata,
+            accumulator.clone(),
+            1024 * 1024,
+            1000,
+            1,
+            0,
+            idempotence,
+        );
 
         let (batch, handle) = build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path)?;
         sender.handle_write_batch_error(
@@ -723,8 +1124,20 @@ mod tests {
         let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
         let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
         let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
-        let accumulator = Arc::new(RecordAccumulator::new(Config::default()));
-        let sender = Sender::new(metadata, accumulator.clone(), 1024 * 1024, 1000, 1, 0);
+        let idempotence = disabled_idempotence();
+        let accumulator = Arc::new(RecordAccumulator::new(
+            Config::default(),
+            Arc::clone(&idempotence),
+        ));
+        let sender = Sender::new(
+            metadata,
+            accumulator.clone(),
+            1024 * 1024,
+            1000,
+            1,
+            0,
+            idempotence,
+        );
 
         let (batch, handle) = build_ready_batch(accumulator.as_ref(), cluster, table_path)?;
         let request_buckets = vec![batch.table_bucket.clone()];
@@ -748,4 +1161,221 @@ mod tests {
         assert!(matches!(batch_result, Ok(())));
         Ok(())
     }
+
+    #[tokio::test]
+    async fn test_unknown_writer_id_resets() -> Result<()> {
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
+        let idempotence = enabled_idempotence();
+        let accumulator = Arc::new(RecordAccumulator::new(
+            Config::default(),
+            Arc::clone(&idempotence),
+        ));
+        idempotence.set_writer_id(42);
+        let sender = Sender::new(
+            metadata,
+            accumulator.clone(),
+            1024 * 1024,
+            1000,
+            -1,
+            i32::MAX,
+            Arc::clone(&idempotence),
+        );
+
+        // build_ready_batch drains the batch, which assigns seq=0 and adds in-flight
+        let (batch, handle) = build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path)?;
+        assert_eq!(batch.write_batch.batch_sequence(), 0);
+        assert_eq!(batch.write_batch.writer_id(), 42);
+
+        sender.handle_write_batch_error(
+            batch,
+            FlussError::UnknownWriterIdException,
+            "unknown writer".to_string(),
+        )?;
+
+        // Writer ID should be reset
+        assert!(!idempotence.has_writer_id());
+
+        // Batch should be failed (not retried)
+        let batch_result = handle.wait().await?;
+        assert!(matches!(
+            batch_result,
+            Err(broadcast::Error::WriteFailed { code, .. })
+                if code == FlussError::UnknownWriterIdException.code()
+        ));
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn test_out_of_order_sequence_non_retriable_resets() -> Result<()> {
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
+        let idempotence = enabled_idempotence();
+        let accumulator = Arc::new(RecordAccumulator::new(
+            Config::default(),
+            Arc::clone(&idempotence),
+        ));
+        idempotence.set_writer_id(42);
+        // retries=0 means can_retry returns false immediately (attempts >= retries)
+        let sender = Sender::new(
+            metadata,
+            accumulator.clone(),
+            1024 * 1024,
+            1000,
+            -1,
+            0,
+            Arc::clone(&idempotence),
+        );
+
+        // build_ready_batch drains the batch, which assigns seq=0 and adds in-flight
+        let (batch, handle) = build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path)?;
+        assert_eq!(batch.write_batch.batch_sequence(), 0);
+
+        // OutOfOrderSequence with retries exhausted → non-retriable → resets writer ID
+        sender.handle_write_batch_error(
+            batch,
+            FlussError::OutOfOrderSequenceException,
+            "out of order".to_string(),
+        )?;
+
+        // Writer ID should be reset (matching Java behavior)
+        assert!(!idempotence.has_writer_id());
+
+        // Batch should be failed
+        let batch_result = handle.wait().await?;
+        assert!(matches!(
+            batch_result,
+            Err(broadcast::Error::WriteFailed { code, .. })
+                if code == FlussError::OutOfOrderSequenceException.code()
+        ));
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn test_stale_writer_id_prevents_retry() -> Result<()> {
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
+        let metadata = Arc::new(Metadata::new_for_test(cluster.clone()));
+        let idempotence = enabled_idempotence();
+        let accumulator = Arc::new(RecordAccumulator::new(
+            Config::default(),
+            Arc::clone(&idempotence),
+        ));
+        idempotence.set_writer_id(42);
+        let sender = Sender::new(
+            metadata,
+            accumulator.clone(),
+            1024 * 1024,
+            1000,
+            -1,
+            i32::MAX,
+            Arc::clone(&idempotence),
+        );
+
+        // build_ready_batch drains the batch, which assigns seq=0 and adds in-flight
+        let (batch, handle) = build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path)?;
+        assert_eq!(batch.write_batch.writer_id(), 42);
+        let mut inflight = HashMap::new();
+        inflight.insert(1, vec![batch]);
+        sender.add_to_inflight_batches(&inflight);
+        let batch = inflight.remove(&1).unwrap().pop().unwrap();
+
+        // Simulate writer ID reset (e.g., another bucket got UnknownWriterIdException)
+        idempotence.reset_writer_id();
+        idempotence.set_writer_id(99); // new writer ID allocated
+
+        // NetworkException is normally retriable, but writer ID changed
+        sender.handle_write_batch_error(
+            batch,
+            FlussError::NetworkException,
+            "connection reset".to_string(),
+        )?;
+
+        // Batch should be failed (not retried) because writer ID is stale
+        let batch_result = handle.wait().await?;
+        assert!(matches!(
+            batch_result,
+            Err(broadcast::Error::WriteFailed { code, .. })
+                if code == FlussError::UnknownWriterIdException.code()
+        ));
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn test_writer_state_assigned_on_drain() -> Result<()> {
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
+        let idempotence = enabled_idempotence();
+        let accumulator = Arc::new(RecordAccumulator::new(
+            Config::default(),
+            Arc::clone(&idempotence),
+        ));
+        idempotence.set_writer_id(99);
+
+        // Append a record to the accumulator
+        let table_info = Arc::new(build_table_info(table_path.as_ref().clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(table_path));
+        let row = GenericRow {
+            values: vec![Datum::Int32(42)],
+        };
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
+        accumulator.append(&record, 0, &cluster, false)?;
+
+        // Drain the batches — accumulator now assigns writer state during drain
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        let batches = accumulator.drain(cluster, &nodes, 1024 * 1024)?;
+
+        // Verify the batch got writer state assigned by the accumulator
+        let batch_list = batches.values().next().unwrap();
+        let batch = &batch_list[0];
+        assert_eq!(batch.write_batch.batch_sequence(), 0);
+        assert_eq!(batch.write_batch.writer_id(), 99);
+        Ok(())
+    }
+
+    #[tokio::test]
+    async fn test_reenqueued_batch_keeps_sequence_on_redrain() -> Result<()> {
+        let table_path = Arc::new(TablePath::new("db".to_string(), "tbl".to_string()));
+        let cluster = build_cluster_arc(table_path.as_ref(), 1, 1);
+        let idempotence = enabled_idempotence();
+        let accumulator = Arc::new(RecordAccumulator::new(
+            Config::default(),
+            Arc::clone(&idempotence),
+        ));
+        idempotence.set_writer_id(99);
+
+        // build_ready_batch drains the batch, which now assigns writer state
+        // (seq=0) during drain since idempotence is enabled.
+        let (batch, _handle) =
+            build_ready_batch(accumulator.as_ref(), cluster.clone(), table_path)?;
+
+        let writer_id = idempotence.writer_id();
+        assert_eq!(batch.write_batch.batch_sequence(), 0);
+        assert!(batch.write_batch.has_batch_sequence());
+        assert_eq!(batch.write_batch.writer_id(), writer_id);
+
+        // Re-enqueue the batch (simulating a retriable error)
+        accumulator.re_enqueue(batch);
+
+        // Drain again
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        let mut batches = accumulator.drain(cluster, &nodes, 1024 * 1024)?;
+        let batch_list = batches.values_mut().next().unwrap();
+        let ready_batch = &mut batch_list[0];
+
+        // Re-enqueued batch keeps its original sequence
+        assert!(ready_batch.write_batch.has_batch_sequence());
+        assert_eq!(ready_batch.write_batch.writer_id(), writer_id);
+        assert_eq!(ready_batch.write_batch.batch_sequence(), 0);
+        // Only one sequence was allocated (during the first drain)
+        assert_eq!(
+            idempotence.next_sequence_and_increment(&ready_batch.table_bucket),
+            1
+        );
+        Ok(())
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index 23f523c8bf..aee6bcd91d 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -18,6 +18,8 @@
 use crate::BucketId;
 use crate::bucketing::BucketingFunction;
 use crate::client::metadata::Metadata;
+use crate::client::write::IdempotenceManager;
+use crate::client::write::broadcast;
 use crate::client::write::bucket_assigner::{
     BucketAssigner, HashBucketAssigner, RoundRobinBucketAssigner, StickyBucketAssigner,
 };
@@ -29,7 +31,10 @@ use crate::error::{Error, Result};
 use crate::metadata::{PhysicalTablePath, TableInfo};
 use bytes::Bytes;
 use dashmap::DashMap;
+use log::warn;
+use parking_lot::Mutex;
 use std::sync::Arc;
+use std::time::Duration;
 use tokio::sync::mpsc;
 use tokio::task::JoinHandle;
 
@@ -38,46 +43,58 @@ pub struct WriterClient {
     config: Config,
     max_request_size: i32,
     accumulate: Arc<RecordAccumulator>,
-    shutdown_tx: mpsc::Sender<()>,
-    sender_join_handle: JoinHandle<()>,
+    shutdown_tx: Mutex<Option<mpsc::Sender<()>>>,
+    sender_join_handle: Mutex<Option<JoinHandle<()>>>,
     metadata: Arc<Metadata>,
     bucket_assigners: DashMap<Arc<PhysicalTablePath>, Arc<dyn BucketAssigner>>,
+    idempotence_manager: Arc<IdempotenceManager>,
 }
 
 impl WriterClient {
     pub fn new(config: Config, metadata: Arc<Metadata>) -> Result<Self> {
-        let (shutdown_tx, mut shutdown_rx) = mpsc::channel(1);
+        let ack = Self::get_ack(&config)?;
 
-        let accumulator = Arc::new(RecordAccumulator::new(config.clone()));
+        config
+            .validate_idempotence()
+            .map_err(|message| Error::IllegalArgument { message })?;
 
-        let mut sender = Sender::new(
+        let idempotence_manager = Arc::new(IdempotenceManager::new(
+            config.writer_enable_idempotence,
+            config.writer_max_inflight_requests_per_bucket,
+        ));
+
+        let (shutdown_tx, shutdown_rx) = mpsc::channel(1);
+
+        let accumulator = Arc::new(RecordAccumulator::new(
+            config.clone(),
+            Arc::clone(&idempotence_manager),
+        ));
+
+        let sender = Arc::new(Sender::new(
             metadata.clone(),
             accumulator.clone(),
             config.writer_request_max_size,
             30_000,
-            Self::get_ack(&config)?,
+            ack,
             config.writer_retries,
-        );
+            Arc::clone(&idempotence_manager),
+        ));
 
         let join_handle = tokio::spawn(async move {
-            tokio::select! {
-                _ = sender.run() => {
-                    // do-nothing
-                },
-                _ = shutdown_rx.recv() => {
-                    sender.close().await
-                }
+            if let Err(e) = sender.run_with_shutdown(shutdown_rx).await {
+                warn!("Sender loop exited with error: {e}");
             }
         });
 
         Ok(Self {
             max_request_size: config.writer_request_max_size,
             config,
-            shutdown_tx,
-            sender_join_handle: join_handle,
+            shutdown_tx: Mutex::new(Some(shutdown_tx)),
+            sender_join_handle: Mutex::new(Some(join_handle)),
             accumulate: accumulator,
             metadata,
             bucket_assigners: Default::default(),
+            idempotence_manager,
         })
     }
 
@@ -93,6 +110,11 @@ impl WriterClient {
     }
 
     pub fn send(&self, record: &WriteRecord<'_>) -> Result<ResultHandle> {
+        if self.accumulate.is_closed() {
+            return Err(Error::WriterClosed {
+                message: "Cannot send: writer is closed".to_string(),
+            });
+        }
         let physical_table_path = &record.physical_table_path;
         let cluster = self.metadata.get_cluster();
         let bucket_key = record.bucket_key.as_ref();
@@ -115,7 +137,7 @@ impl WriterClient {
         }
 
         if result.batch_is_full || result.new_batch_created {
-            // todo: wakeup
+            self.accumulate.wakeup_sender();
         }
 
         Ok(result.result_handle.expect("result_handle should exist"))
@@ -146,21 +168,48 @@ impl WriterClient {
         Ok((bucket_assigner, bucket_id))
     }
 
-    pub async fn close(self) -> Result<()> {
-        self.shutdown_tx
-            .send(())
-            .await
-            .map_err(|e| Error::UnexpectedError {
-                message: format!("Failed to close write client: {e:?}"),
-                source: None,
-            })?;
-
-        self.sender_join_handle
-            .await
-            .map_err(|e| Error::UnexpectedError {
-                message: format!("Failed to close write client: {e:?}"),
-                source: None,
-            })?;
+    /// Close the writer with a timeout. Matches Java's two-phase shutdown:
+    ///
+    /// 1. **Graceful**: Signal the sender to drain all remaining batches.
+    ///    `accumulator.close()` makes all batches immediately ready (no need
+    ///    to wait for `batch_timeout_ms`).
+    /// 2. **Force** (if timeout exceeded): Abort the sender task and fail
+    ///    all remaining batches with an error.
+    ///
+    /// Idempotent: calling `close` a second time returns `Ok(())` immediately.
+    pub async fn close(&self, timeout: Duration) -> Result<()> {
+        // Take shutdown_tx and join_handle out of their Mutexes.
+        // Second call sees None and returns early.
+        let shutdown_tx = self.shutdown_tx.lock().take();
+        let join_handle = self.sender_join_handle.lock().take();
+
+        let Some(mut join_handle) = join_handle else {
+            return Ok(());
+        };
+
+        // Phase 1: Signal graceful shutdown.
+        // Mark accumulator closed so all batches become immediately sendable.
+        self.accumulate.close();
+        // Drop the shutdown sender — recv() returns None, breaking the sender loop.
+        drop(shutdown_tx);
+
+        // Phase 1 (continued): wait for the graceful drain, bounded by `timeout`.
+        tokio::select! {
+            result = &mut join_handle => {
+                if let Err(e) = result {
+                    warn!("Sender task panicked during shutdown: {e}");
+                }
+            }
+            _ = tokio::time::sleep(timeout) => {
+                // Phase 2: Force close — timeout exceeded.
+                warn!("Graceful shutdown timed out after {timeout:?}, force closing");
+                join_handle.abort();
+                let _ = join_handle.await; // Wait for cancellation to complete
+                self.accumulate.abort_batches(broadcast::Error::Client {
+                    message: "Writer force closed (shutdown timeout exceeded)".to_string(),
+                });
+            }
+        }
         Ok(())
     }
 
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index e85a449250..32db44f6a5 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -32,7 +32,11 @@ const DEFAULT_SCANNER_LOG_FETCH_MIN_BYTES: i32 = 1;
 const DEFAULT_SCANNER_LOG_FETCH_WAIT_MAX_TIME_MS: i32 = 500;
 const DEFAULT_WRITER_BATCH_TIMEOUT_MS: i64 = 100;
 const DEFAULT_SCANNER_LOG_FETCH_MAX_BYTES_FOR_BUCKET: i32 = 1024 * 1024;
+const DEFAULT_WRITER_MAX_INFLIGHT_REQUESTS_PER_BUCKET: usize = 5;
+const DEFAULT_WRITER_BUFFER_MEMORY_SIZE: usize = 64 * 1024 * 1024; // 64MB, matching Java
+const DEFAULT_WRITER_BUFFER_WAIT_TIMEOUT_MS: u64 = u64::MAX;
 
+const MAX_IN_FLIGHT_REQUESTS_PER_BUCKET_FOR_IDEMPOTENCE: usize = 5;
 const DEFAULT_ACKS: &str = "all";
 const DEFAULT_CONNECT_TIMEOUT_MS: u64 = 120_000;
 const DEFAULT_SECURITY_PROTOCOL: &str = "PLAINTEXT";
@@ -120,6 +124,30 @@ pub struct Config {
     #[arg(long, default_value_t = DEFAULT_SCANNER_LOG_FETCH_MAX_BYTES_FOR_BUCKET)]
     pub scanner_log_fetch_max_bytes_for_bucket: i32,
 
+    /// Whether to enable idempotent writes. When enabled, each batch is tagged with
+    /// a server-allocated writer ID and per-bucket sequence number so the server can
+    /// detect and deduplicate retried batches.
+    /// Default: true (matching Java CLIENT_WRITER_ENABLE_IDEMPOTENCE)
+    #[arg(long, default_value_t = true)]
+    pub writer_enable_idempotence: bool,
+
+    /// Maximum number of in-flight requests per bucket for idempotent writes.
+    /// Default: 5 (matching Java client.writer.max-inflight-requests-per-bucket)
+    #[arg(long, default_value_t = DEFAULT_WRITER_MAX_INFLIGHT_REQUESTS_PER_BUCKET)]
+    pub writer_max_inflight_requests_per_bucket: usize,
+
+    /// Total memory available for buffering write batches across all buckets.
+    /// When this limit is reached, `upsert()`/`append()` will block until
+    /// in-flight batches complete and free memory.
+    /// Default: 64MB (matching Java's LazyMemorySegmentPool: 512 pages x 128KB)
+    #[arg(long, default_value_t = DEFAULT_WRITER_BUFFER_MEMORY_SIZE)]
+    pub writer_buffer_memory_size: usize,
+
+    /// Maximum time in milliseconds to block waiting for buffer memory.
+    /// If the timeout is exceeded, the write call returns an error. Default: `u64::MAX` (effectively no timeout).
+    #[arg(long, default_value_t = DEFAULT_WRITER_BUFFER_WAIT_TIMEOUT_MS)]
+    pub writer_buffer_wait_timeout_ms: u64,
+
     /// Connect timeout in milliseconds for TCP transport connect.
     /// Default: 120000 (120 seconds).
     #[arg(long, default_value_t = DEFAULT_CONNECT_TIMEOUT_MS)]
@@ -180,6 +208,16 @@ impl std::fmt::Debug for Config {
                 &self.scanner_log_fetch_wait_max_time_ms,
             )
             .field("writer_batch_timeout_ms", &self.writer_batch_timeout_ms)
+            .field("writer_enable_idempotence", &self.writer_enable_idempotence)
+            .field(
+                "writer_max_inflight_requests_per_bucket",
+                &self.writer_max_inflight_requests_per_bucket,
+            )
+            .field("writer_buffer_memory_size", &self.writer_buffer_memory_size)
+            .field(
+                "writer_buffer_wait_timeout_ms",
+                &self.writer_buffer_wait_timeout_ms,
+            )
             .field("connect_timeout_ms", &self.connect_timeout_ms)
             .field("security_protocol", &self.security_protocol)
             .field("security_sasl_mechanism", &self.security_sasl_mechanism)
@@ -207,6 +245,11 @@ impl Default for Config {
             scanner_log_fetch_wait_max_time_ms: DEFAULT_SCANNER_LOG_FETCH_WAIT_MAX_TIME_MS,
             scanner_log_fetch_max_bytes_for_bucket: DEFAULT_SCANNER_LOG_FETCH_MAX_BYTES_FOR_BUCKET,
             writer_batch_timeout_ms: DEFAULT_WRITER_BATCH_TIMEOUT_MS,
+            writer_enable_idempotence: true,
+            writer_max_inflight_requests_per_bucket:
+                DEFAULT_WRITER_MAX_INFLIGHT_REQUESTS_PER_BUCKET,
+            writer_buffer_memory_size: DEFAULT_WRITER_BUFFER_MEMORY_SIZE,
+            writer_buffer_wait_timeout_ms: DEFAULT_WRITER_BUFFER_WAIT_TIMEOUT_MS,
             connect_timeout_ms: DEFAULT_CONNECT_TIMEOUT_MS,
             security_protocol: String::from(DEFAULT_SECURITY_PROTOCOL),
             security_sasl_mechanism: String::from(DEFAULT_SASL_MECHANISM),
@@ -224,6 +267,38 @@ impl Config {
         self.security_protocol.eq_ignore_ascii_case("sasl")
     }
 
+    /// Validates idempotence configuration. Returns `Ok(())` when the config is
+    /// consistent, or an error message when idempotence is enabled but other
+    /// settings are incompatible.
+    pub fn validate_idempotence(&self) -> Result<(), String> {
+        if !self.writer_enable_idempotence {
+            return Ok(());
+        }
+        let acks_is_all = self.writer_acks.eq_ignore_ascii_case("all") || self.writer_acks == "-1";
+        if !acks_is_all {
+            return Err(format!(
+                "Idempotent writes require acks='all' (-1), but got acks='{}'",
+                self.writer_acks
+            ));
+        }
+        if self.writer_retries <= 0 {
+            return Err(format!(
+                "Idempotent writes require retries > 0, but got retries={}",
+                self.writer_retries
+            ));
+        }
+        if self.writer_max_inflight_requests_per_bucket
+            > MAX_IN_FLIGHT_REQUESTS_PER_BUCKET_FOR_IDEMPOTENCE
+        {
+            return Err(format!(
+                "Idempotent writes require max-inflight-requests-per-bucket <= {}, but got {}",
+                MAX_IN_FLIGHT_REQUESTS_PER_BUCKET_FOR_IDEMPOTENCE,
+                self.writer_max_inflight_requests_per_bucket
+            ));
+        }
+        Ok(())
+    }
+
     /// Validates security configuration. Returns `Ok(())` when the config is
     /// consistent, or an error message when SASL is enabled but the config is
     /// incomplete or uses an unsupported mechanism.
@@ -371,4 +446,52 @@ mod tests {
         };
         assert!(config.validate_scanner_fetch().is_err());
     }
+
+    #[test]
+    fn test_idempotence_default_is_valid() {
+        let config = Config::default();
+        assert!(config.validate_idempotence().is_ok());
+    }
+
+    #[test]
+    fn test_idempotence_disabled_skips_validation() {
+        let config = Config {
+            writer_enable_idempotence: false,
+            writer_acks: "0".to_string(),
+            writer_retries: 0,
+            writer_max_inflight_requests_per_bucket: 100,
+            ..Config::default()
+        };
+        assert!(config.validate_idempotence().is_ok());
+    }
+
+    #[test]
+    fn test_idempotence_requires_acks_all() {
+        let config = Config {
+            writer_enable_idempotence: true,
+            writer_acks: "1".to_string(),
+            ..Config::default()
+        };
+        assert!(config.validate_idempotence().is_err());
+    }
+
+    #[test]
+    fn test_idempotence_requires_retries() {
+        let config = Config {
+            writer_enable_idempotence: true,
+            writer_retries: 0,
+            ..Config::default()
+        };
+        assert!(config.validate_idempotence().is_err());
+    }
+
+    #[test]
+    fn test_idempotence_requires_bounded_inflight() {
+        let config = Config {
+            writer_enable_idempotence: true,
+            writer_max_inflight_requests_per_bucket: 10,
+            ..Config::default()
+        };
+        assert!(config.validate_idempotence().is_err());
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index d56432c517..c2f72a74b0 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -104,6 +104,15 @@ pub enum Error {
     )]
     UnsupportedOperation { message: String },
 
+    #[snafu(visibility(pub(crate)), display("Fluss writer closed: {}.", message))]
+    WriterClosed { message: String },
+
+    #[snafu(
+        visibility(pub(crate)),
+        display("Fluss buffer exhausted: {}.", message)
+    )]
+    BufferExhausted { message: String },
+
     #[snafu(visibility(pub(crate)), display("Fluss API Error: {}.", api_error))]
     FlussAPIError { api_error: ApiError },
 }
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index 1c7ee7eb8f..a733dd7016 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -417,4 +417,13 @@ message AuthenticateRequest {
 
 message AuthenticateResponse {
   optional bytes challenge = 1;
+}
+
+// init writer request and response
+message InitWriterRequest {
+  repeated PbTablePath table_path = 1;
+}
+
+message InitWriterResponse {
+  required int64 writer_id = 1;
 }
\ No newline at end of file
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 83d102a1e6..d8ba6d95c9 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -445,6 +445,11 @@ impl MemoryLogRecordsArrowBuilder {
         Ok(())
     }
 
+    pub fn set_writer_state(&mut self, writer_id: i64, batch_base_sequence: i32) {
+        self.writer_id = writer_id;
+        self.batch_sequence = batch_base_sequence;
+    }
+
     /// Get an estimate of the number of bytes written to the underlying buffer.
     /// This includes the batch header size plus the estimated arrow data size.
     pub fn estimated_size_in_bytes(&self) -> usize {
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index 4231fb03b3..d1b3ea68aa 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -19,28 +19,29 @@ use crate::rpc::api_key::ApiKey::Unknown;
 
 #[derive(Debug, PartialEq, Eq, PartialOrd, Ord, Hash, Clone, Copy)]
 pub enum ApiKey {
-    CreateDatabase,
-    DropDatabase,
-    ListDatabases,
-    DatabaseExists,
-    CreateTable,
-    DropTable,
-    GetTable,
-    ListTables,
-    ListPartitionInfos,
-    TableExists,
-    MetaData,
-    ProduceLog,
-    PutKv,
-    FetchLog,
-    Lookup,
-    ListOffsets,
-    GetFileSystemSecurityToken,
-    GetDatabaseInfo,
-    GetLatestLakeSnapshot,
-    CreatePartition,
-    DropPartition,
-    Authenticate,
+    CreateDatabase,             // 1001
+    DropDatabase,               // 1002
+    ListDatabases,              // 1003
+    DatabaseExists,             // 1004
+    CreateTable,                // 1005
+    DropTable,                  // 1006
+    GetTable,                   // 1007
+    ListTables,                 // 1008
+    ListPartitionInfos,         // 1009
+    TableExists,                // 1010
+    MetaData,                   // 1012
+    ProduceLog,                 // 1014
+    FetchLog,                   // 1015
+    PutKv,                      // 1016
+    Lookup,                     // 1017
+    ListOffsets,                // 1021
+    GetFileSystemSecurityToken, // 1025
+    InitWriter,                 // 1026
+    GetLatestLakeSnapshot,      // 1032
+    GetDatabaseInfo,            // 1035
+    CreatePartition,            // 1036
+    DropPartition,              // 1037
+    Authenticate,               // 1038
     Unknown(i16),
 }
 
@@ -64,11 +65,13 @@ impl From<i16> for ApiKey {
             1017 => ApiKey::Lookup,
             1021 => ApiKey::ListOffsets,
             1025 => ApiKey::GetFileSystemSecurityToken,
+            1026 => ApiKey::InitWriter,
             1032 => ApiKey::GetLatestLakeSnapshot,
             1035 => ApiKey::GetDatabaseInfo,
             1036 => ApiKey::CreatePartition,
             1037 => ApiKey::DropPartition,
             1038 => ApiKey::Authenticate,
+
             _ => Unknown(key),
         }
     }
@@ -94,6 +97,7 @@ impl From<ApiKey> for i16 {
             ApiKey::Lookup => 1017,
             ApiKey::ListOffsets => 1021,
             ApiKey::GetFileSystemSecurityToken => 1025,
+            ApiKey::InitWriter => 1026,
             ApiKey::GetLatestLakeSnapshot => 1032,
             ApiKey::GetDatabaseInfo => 1035,
             ApiKey::CreatePartition => 1036,
@@ -128,6 +132,7 @@ mod tests {
             (1017, ApiKey::Lookup),
             (1021, ApiKey::ListOffsets),
             (1025, ApiKey::GetFileSystemSecurityToken),
+            (1026, ApiKey::InitWriter),
             (1032, ApiKey::GetLatestLakeSnapshot),
             (1035, ApiKey::GetDatabaseInfo),
             (1036, ApiKey::CreatePartition),
diff --git a/fluss-rust/crates/fluss/src/rpc/message/init_writer.rs b/fluss-rust/crates/fluss/src/rpc/message/init_writer.rs
new file mode 100644
index 0000000000..0bbb0dc56a
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/init_writer.rs
@@ -0,0 +1,50 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::{InitWriterResponse, PbTablePath};
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+pub struct InitWriterRequest {
+    pub inner_request: proto::InitWriterRequest,
+}
+
+impl InitWriterRequest {
+    pub fn new(table_paths: Vec<PbTablePath>) -> Self {
+        InitWriterRequest {
+            inner_request: proto::InitWriterRequest {
+                table_path: table_paths,
+            },
+        }
+    }
+}
+
+impl RequestBody for InitWriterRequest {
+    type ResponseBody = InitWriterResponse;
+
+    const API_KEY: ApiKey = ApiKey::InitWriter;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(InitWriterRequest);
+impl_read_version_type!(InitWriterResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 9ad4545fb9..89a8ba14f4 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -34,6 +34,7 @@ mod get_latest_lake_snapshot;
 mod get_security_token;
 mod get_table;
 mod header;
+mod init_writer;
 mod list_databases;
 mod list_offsets;
 mod list_partition_infos;
@@ -59,6 +60,7 @@ pub use get_latest_lake_snapshot::*;
 pub use get_security_token::*;
 pub use get_table::*;
 pub use header::*;
+pub use init_writer::*;
 pub use list_databases::*;
 pub use list_offsets::*;
 pub use list_partition_infos::*;

From 5f1d86ef929ba35998a4495433bdd45a0c1c1732 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Thu, 19 Mar 2026 19:52:55 +0100
Subject: [PATCH 201/287] chore: no-op .asf.yaml change to attempt trigger gh
 page setup

---
 fluss-rust/.asf.yaml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/fluss-rust/.asf.yaml b/fluss-rust/.asf.yaml
index 929cc9fd7c..9f188c7eab 100644
--- a/fluss-rust/.asf.yaml
+++ b/fluss-rust/.asf.yaml
@@ -38,7 +38,6 @@ github:
     squash:  true
     merge:   false
     rebase:  true
-
 notifications:
   commits:      commits@fluss.apache.org
   issues:       issues@fluss.apache.org

From 007244e27c125684ba4a392247e133453db2ab66 Mon Sep 17 00:00:00 2001
From: fluxo <cml@apache.org>
Date: Thu, 19 Mar 2026 12:48:10 -0700
Subject: [PATCH 202/287] troubleshooting test commit

---
 fluss-rust/.asf.yaml | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/fluss-rust/.asf.yaml b/fluss-rust/.asf.yaml
index 9f188c7eab..fae1722d2f 100644
--- a/fluss-rust/.asf.yaml
+++ b/fluss-rust/.asf.yaml
@@ -43,4 +43,5 @@ notifications:
   issues:       issues@fluss.apache.org
   pullrequests: issues@fluss.apache.org
   jobs:         builds@fluss.apache.org
-  discussions:  issues@fluss.apache.org
\ No newline at end of file
+  discussions:  issues@fluss.apache.org
+

From 7d8ab3d82ce108661f6cf0b8705b1dc498ea0cc9 Mon Sep 17 00:00:00 2001
From: fluxo <cml@apache.org>
Date: Thu, 19 Mar 2026 15:06:39 -0700
Subject: [PATCH 203/287] INFRA-27705 - infrastructure test commit

---
 fluss-rust/.asf.yaml | 1 +
 1 file changed, 1 insertion(+)

diff --git a/fluss-rust/.asf.yaml b/fluss-rust/.asf.yaml
index fae1722d2f..bcf432a16d 100644
--- a/fluss-rust/.asf.yaml
+++ b/fluss-rust/.asf.yaml
@@ -34,6 +34,7 @@ github:
     - lakehouse
     - rust
     - python
+    - infra-test
   enabled_merge_buttons:
     squash:  true
     merge:   false

From fd2de539d7a17318ba3941082938608d6f09e900 Mon Sep 17 00:00:00 2001
From: fluxo <cml@apache.org>
Date: Thu, 19 Mar 2026 15:11:19 -0700
Subject: [PATCH 204/287] INFRA-27705 - remove test label

---
 fluss-rust/.asf.yaml | 1 -
 1 file changed, 1 deletion(-)

diff --git a/fluss-rust/.asf.yaml b/fluss-rust/.asf.yaml
index bcf432a16d..fae1722d2f 100644
--- a/fluss-rust/.asf.yaml
+++ b/fluss-rust/.asf.yaml
@@ -34,7 +34,6 @@ github:
     - lakehouse
     - rust
     - python
-    - infra-test
   enabled_merge_buttons:
     squash:  true
     merge:   false

From a106cb6f567b9b644c70da0a381967f0b41e0341 Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 20 Mar 2026 15:54:56 +0800
Subject: [PATCH 205/287] doc: optimize pyfluss description in pypi (#439)

---
 .../.github/workflows/release_python.yml      |   6 -
 fluss-rust/.gitignore                         |   3 +-
 .../bindings/python/GENERATED_README.md       |   1 -
 fluss-rust/bindings/python/PYPI_README.md     |  28 +++++
 fluss-rust/bindings/python/generate_readme.py | 104 ------------------
 fluss-rust/bindings/python/pyproject.toml     |   6 +-
 fluss-rust/justfile                           |   4 -
 7 files changed, 32 insertions(+), 120 deletions(-)
 delete mode 100644 fluss-rust/bindings/python/GENERATED_README.md
 create mode 100644 fluss-rust/bindings/python/PYPI_README.md
 delete mode 100644 fluss-rust/bindings/python/generate_readme.py

diff --git a/fluss-rust/.github/workflows/release_python.yml b/fluss-rust/.github/workflows/release_python.yml
index 323838d54c..7e5794693f 100644
--- a/fluss-rust/.github/workflows/release_python.yml
+++ b/fluss-rust/.github/workflows/release_python.yml
@@ -49,9 +49,6 @@ jobs:
     steps:
       - uses: actions/checkout@v4
 
-      - name: Generate Python README
-        run: python bindings/python/generate_readme.py
-
       - name: Install protoc
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
 
@@ -81,9 +78,6 @@ jobs:
     steps:
       - uses: actions/checkout@v4
 
-      - name: Generate Python README
-        run: python3 bindings/python/generate_readme.py
-
       - name: Install protoc (Linux)
         if: runner.os == 'Linux'
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
diff --git a/fluss-rust/.gitignore b/fluss-rust/.gitignore
index 5d11a1c080..c821382293 100644
--- a/fluss-rust/.gitignore
+++ b/fluss-rust/.gitignore
@@ -20,7 +20,6 @@ Cargo.lock
 .vscode/
 
 # Python
-bindings/python/GENERATED_README.md
 __pycache__/
 *.py[cod]
 *$py.class
@@ -53,4 +52,4 @@ website/package-lock.json
 website/versioned_docs
 website/versioned_sidebars
 website/versions.json
-website/pnpm-lock.yaml
\ No newline at end of file
+website/pnpm-lock.yaml
diff --git a/fluss-rust/bindings/python/GENERATED_README.md b/fluss-rust/bindings/python/GENERATED_README.md
deleted file mode 100644
index 0a011ba6ee..0000000000
--- a/fluss-rust/bindings/python/GENERATED_README.md
+++ /dev/null
@@ -1 +0,0 @@
-This readme can be automatically generated by generate_readme.py.
\ No newline at end of file
diff --git a/fluss-rust/bindings/python/PYPI_README.md b/fluss-rust/bindings/python/PYPI_README.md
new file mode 100644
index 0000000000..ee9796a46c
--- /dev/null
+++ b/fluss-rust/bindings/python/PYPI_README.md
@@ -0,0 +1,28 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements.  See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership.  The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
+
+# Fluss Python Client
+
+PyFluss is a Python library for programmatic access to Apache Fluss (Incubating).
+It provides Python APIs to work with Fluss table metadata and read or write table data.
+
+The documentation is available at <https://clients.fluss.apache.org/>.
+
+## Get in Touch
+
+Join the Fluss community at <https://fluss.apache.org/community/welcome/>.
diff --git a/fluss-rust/bindings/python/generate_readme.py b/fluss-rust/bindings/python/generate_readme.py
deleted file mode 100644
index 206f9e2ab0..0000000000
--- a/fluss-rust/bindings/python/generate_readme.py
+++ /dev/null
@@ -1,104 +0,0 @@
-#!/usr/bin/env python3
-# Licensed to the Apache Software Foundation (ASF) under one or more
-# contributor license agreements.  See the NOTICE file distributed with
-# this work for additional information regarding copyright ownership.
-# The ASF licenses this file to you under the Apache License, Version 2.0
-# (the "License"); you may not use this file except in compliance with
-# the License.  You may obtain a copy of the License at
-#
-#   http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-"""Generate bindings/python/GENERATED_README.md from the website docs.
-
-Usage:
-    python generate_readme.py          # writes GENERATED_README.md
-    python generate_readme.py --check  # exits non-zero if GENERATED_README.md is stale
-"""
-
-from __future__ import annotations
-
-import re
-import sys
-from pathlib import Path
-
-SCRIPT_DIR = Path(__file__).resolve().parent
-DOCS_DIR = SCRIPT_DIR / "../../website/docs/user-guide/python"
-
-LICENSE_HEADER = """\
-<!--
- Licensed to the Apache Software Foundation (ASF) under one
- or more contributor license agreements.  See the NOTICE file
- distributed with this work for additional information
- regarding copyright ownership.  The ASF licenses this file
- to you under the Apache License, Version 2.0 (the
- "License"); you may not use this file except in compliance
- with the License.  You may obtain a copy of the License at
-
-      http://www.apache.org/licenses/LICENSE-2.0
-
- Unless required by applicable law or agreed to in writing, software
- distributed under the License is distributed on an "AS IS" BASIS,
- WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- See the License for the specific language governing permissions and
- limitations under the License.
--->
-"""
-
-# Files in the order they should appear in the README.
-SECTIONS: list[str] = [
-    "installation.md",
-    "example/index.md",
-    "example/configuration.md",
-    "example/admin-operations.md",
-    "example/log-tables.md",
-    "example/primary-key-tables.md",
-    "example/partitioned-tables.md",
-    "error-handling.md",
-    "data-types.md",
-    "api-reference.md",
-]
-
-FRONTMATTER_RE = re.compile(r"^---\n.*?^---\n", re.MULTILINE | re.DOTALL)
-
-
-def strip_frontmatter(text: str) -> str:
-    return FRONTMATTER_RE.sub("", text, count=1)
-
-
-def build_readme() -> str:
-    parts = [LICENSE_HEADER, "# Fluss Python Client\n"]
-
-    for section in SECTIONS:
-        path = DOCS_DIR / section
-        if not path.exists():
-            print(f"warning: {path} not found, skipping", file=sys.stderr)
-            continue
-        content = strip_frontmatter(path.read_text()).strip()
-        parts.append(content)
-
-    return "\n\n".join(parts) + "\n"
-
-
-def main() -> None:
-    readme = build_readme()
-    dest = SCRIPT_DIR / "GENERATED_README.md"
-
-    if "--check" in sys.argv:
-        if not dest.exists() or dest.read_text() != readme:
-            print("GENERATED_README.md is out of date. Run: python generate_readme.py")
-            sys.exit(1)
-        print("GENERATED_README.md is up to date.")
-        return
-
-    dest.write_text(readme)
-    print(f"Wrote {dest}")
-
-
-if __name__ == "__main__":
-    main()
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index 63af88e4ed..1664597b05 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -21,10 +21,10 @@ build-backend = "maturin"
 
 [project]
 name = "pyfluss"
-description = "Apache Fluss (incubating) Python Binding"
+description = "Apache Fluss (incubating) Python client"
 authors = [{name = "Apache Fluss", email = "dev@fluss.apache.org"}]
 license = {text = "Apache-2.0"}
-readme = "GENERATED_README.md"
+readme = "PYPI_README.md"
 requires-python = ">=3.9"
 classifiers = [
     "License :: OSI Approved :: Apache Software License",
@@ -42,7 +42,7 @@ dependencies = [
 ]
 
 [project.urls]
-Homepage = "https://fluss.apache.org/"
+Homepage = "https://clients.fluss.apache.org/"
 Repository = "https://github.com/apache/fluss-rust"
 
 [project.optional-dependencies]
diff --git a/fluss-rust/justfile b/fluss-rust/justfile
index c2a611688b..c4e1a763ac 100644
--- a/fluss-rust/justfile
+++ b/fluss-rust/justfile
@@ -26,7 +26,3 @@ release [version]:
 # Usage: just bump-version <current> <next>   e.g. just bump-version 0.1.0 0.1.1
 bump-version from to:
     ./scripts/bump-version.sh {{from}} {{to}}
-
-# Regenerate bindings/python/GENERATED_README.md from website docs.
-generate-python-readme:
-    python bindings/python/generate_readme.py

From c5cddd9e70199dfdd52680d778e9f48324e59c26 Mon Sep 17 00:00:00 2001
From: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 20 Mar 2026 16:02:48 +0800
Subject: [PATCH 206/287] Revert "Bump version to 0.2.0"

This reverts commit eb60036076ed93487be05442f14099baf025a337.
---
 fluss-rust/Cargo.toml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 584897789c..77d714006a 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -24,7 +24,7 @@ homepage = "https://fluss.apache.org/"
 license = "Apache-2.0"
 repository = "https://github.com/apache/fluss-rust"
 rust-version = "1.85"
-version = "0.2.0"
+version = "0.1.0"
 keywords = ["fluss", "streaming-storage", "datalake"]
 
 [workspace]
@@ -32,7 +32,7 @@ resolver = "2"
 members = ["crates/fluss", "crates/examples", "bindings/python", "bindings/cpp"]
 
 [workspace.dependencies]
-fluss = { package = "fluss-rs", version = "0.2.0", path = "crates/fluss", features = ["storage-all"] }
+fluss = { package = "fluss-rs", version = "0.1.0", path = "crates/fluss", features = ["storage-all"] }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
 arrow = { version = "57.0.0", features = ["ipc_compression"] }

From 7b9a400da59d6fc0018c7ac2a540f17022b68b4b Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 20 Mar 2026 16:20:58 +0800
Subject: [PATCH 207/287] [doc] Update fluss-rust readme markdown (#415)

---
 fluss-rust/Cargo.toml                         |   4 +-
 fluss-rust/bindings/python/pyproject.toml     |   2 +-
 fluss-rust/crates/fluss/Cargo.toml            |   8 +-
 fluss-rust/crates/fluss/README.md             | 110 +++++++++++++++---
 .../docs/user-guide/rust/installation.md      |   4 +-
 5 files changed, 104 insertions(+), 24 deletions(-)

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 77d714006a..cd473e74d9 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -18,9 +18,8 @@
 [workspace.package]
 authors = ["Apache Fluss <dev@fluss.apache.org>"]
 categories = ["api-bindings", "database"]
-description = "The rust implementation of fluss"
 edition = "2024"
-homepage = "https://fluss.apache.org/"
+homepage = "https://clients.fluss.apache.org/"
 license = "Apache-2.0"
 repository = "https://github.com/apache/fluss-rust"
 rust-version = "1.85"
@@ -36,7 +35,6 @@ fluss = { package = "fluss-rs", version = "0.1.0", path = "crates/fluss", featur
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
 arrow = { version = "57.0.0", features = ["ipc_compression"] }
-
 bigdecimal = "0.4"
 serde = { version = "1.0", features = ["derive"] }
 serde_json = "1.0"
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index 1664597b05..ce4c436381 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -42,7 +42,7 @@ dependencies = [
 ]
 
 [project.urls]
-Homepage = "https://clients.fluss.apache.org/"
+Homepage = "https://clients.fluss.apache.org/user-guide/rust/installation/"
 Repository = "https://github.com/apache/fluss-rust"
 
 [project.optional-dependencies]
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index c0ba6f8dc8..7b68e51f4e 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -22,10 +22,12 @@ rust-version = { workspace = true }
 version = { workspace = true }
 name = "fluss-rs"
 authors = { workspace = true }
-description = { workspace = true }
-homepage = { workspace = true }
+description = "The official rust client of Apache Fluss (Incubating)"
+homepage = "https://clients.fluss.apache.org/user-guide/rust/installation/"
 repository = { workspace = true }
 keywords = { workspace = true }
+categories = { workspace = true }
+documentation = "https://docs.rs/fluss-rs"
 
 [lib]
 name = "fluss"
@@ -81,4 +83,4 @@ testcontainers = "0.25.0"
 test-env-helpers = "0.2.2"
 
 [build-dependencies]
-prost-build = { version = "0.14" }
+prost-build = "0.14"
diff --git a/fluss-rust/crates/fluss/README.md b/fluss-rust/crates/fluss/README.md
index aad8de96c1..b37a75df79 100644
--- a/fluss-rust/crates/fluss/README.md
+++ b/fluss-rust/crates/fluss/README.md
@@ -1,25 +1,105 @@
-# Apache Fluss™ Rust Client (Incubating)
+# Apache Fluss (Incubating) Official Rust Client
 
-Rust client library for [Apache Fluss™](https://fluss.apache.org/). This crate provides the core client used by the fluss-rust workspace and by the Python and C++ bindings.
+Official Rust client library for [Apache Fluss (Incubating)](https://fluss.apache.org/).
 
-# Todo: move how to use to the first, and how to build to the last, https://github.com/apache/opendal/blob/main/core/README.md 
-# is a good reference
+[![crates.io](https://img.shields.io/crates/v/fluss-rs.svg)](https://crates.io/crates/fluss-rs)
+[![docs.rs](https://img.shields.io/docsrs/fluss-rs)](https://docs.rs/fluss-rs/)
 
-## Requirements
+## Usage
 
-- Rust (see [rust-toolchain.toml](../../rust-toolchain.toml) at repo root)
-- protobuf (for build)
+The following example shows both **primary key (KV) tables** and **log tables** in one flow: connect, create a KV table (upsert + lookup), then create a log table (append + scan).
 
-## Build
+```rust
+use fluss::client::EARLIEST_OFFSET;
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+use fluss::error::Result;
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+use fluss::row::{GenericRow, InternalRow};
+use std::time::Duration;
 
-From the repository root:
+#[tokio::main]
+async fn main() -> Result<()> {
+    let mut config = Config::default();
+    config.bootstrap_servers = "127.0.0.1:9123".to_string();
+    let connection = FlussConnection::new(config).await?;
+    let admin = connection.get_admin().await?;
 
-```bash
-cargo build -p fluss-rs
+    // ---- Primary key (KV) table: upsert and lookup ----
+    let kv_path = TablePath::new("fluss", "users");
+    let mut kv_schema = Schema::builder()
+        .column("id", DataTypes::int())
+        .column("name", DataTypes::string())
+        .column("age", DataTypes::bigint())
+        .primary_key(vec!["id"]);
+    let kv_descriptor = TableDescriptor::builder()
+        .schema(kv_schema.build()?)
+        .build()?;
+    admin.create_table(&kv_path, &kv_descriptor, false).await?;
+
+    let kv_table = connection.get_table(&kv_path).await?;
+    let upsert_writer = kv_table.new_upsert()?.create_writer()?;
+    let mut row = GenericRow::new(3);
+    row.set_field(0, 1i32);
+    row.set_field(1, "Alice");
+    row.set_field(2, 30i64);
+    upsert_writer.upsert(&row)?;
+    upsert_writer.flush().await?;
+
+    let mut lookuper = kv_table.new_lookup()?.create_lookuper()?;
+    let mut key = GenericRow::new(1);
+    key.set_field(0, 1i32);
+    let result = lookuper.lookup(&key).await?;
+    if let Some(r) = result.get_single_row()? {
+        println!("KV lookup: id={}, name={}, age={}",
+                 r.get_int(0)?, r.get_string(1)?, r.get_long(2)?);
+    }
+
+    // ---- Log table: append and scan ----
+    let log_path = TablePath::new("fluss", "events");
+    let log_schema = Schema::builder()
+        .column("ts", DataTypes::bigint())
+        .column("message", DataTypes::string())
+        .build()?;
+    let log_descriptor = TableDescriptor::builder()
+        .schema(log_schema)
+        .build()?;
+    admin.create_table(&log_path, &log_descriptor, false).await?;
+
+    let log_table = connection.get_table(&log_path).await?;
+    let append_writer = log_table.new_append()?.create_writer()?;
+    let mut event = GenericRow::new(2);
+    event.set_field(0, 1700000000i64);
+    event.set_field(1, "hello");
+    append_writer.append(&event)?;
+    append_writer.flush().await?;
+
+    let scanner = log_table.new_scan().create_log_scanner()?;
+    scanner.subscribe(0, EARLIEST_OFFSET).await?;
+    let scan_records = scanner.poll(Duration::from_secs(1)).await?;
+    for record in scan_records {
+        let r = record.row();
+        println!("Log scan: ts={}, message={}", r.get_long(0)?, r.get_string(1)?);
+    }
+
+    Ok(())
+}
 ```
 
-## Quick start and examples
+## Storage Support
+
+The Fluss client reads remote data by accessing Fluss’s **remote files** (e.g. log segments and snapshots) directly. The following **remote file systems** are supported; enable the matching feature(s) for your deployment:
+
+| Storage Backend | Feature Flag | Status | Description |
+|----------------|--------------|--------|-------------|
+| Local Filesystem | `storage-fs` | ✅ Stable | Local filesystem storage |
+| Amazon S3 | `storage-s3` | ✅ Stable | Amazon S3 storage |
+| Alibaba Cloud OSS | `storage-oss` | ✅ Stable | Alibaba Cloud Object Storage Service |
 
-## TODO
-- [ ] Expand API documentation and usage examples in this README.
-- [ ] Add more examples for table, log scan, and write flows.
+You can enable all storage backends at once using the `storage-all` feature flag.
+
+Example usage in Cargo.toml:
+```toml
+[dependencies]
+fluss-rs = { version = "0.x.x", features = ["storage-s3", "storage-fs"] }
+```
diff --git a/fluss-rust/website/docs/user-guide/rust/installation.md b/fluss-rust/website/docs/user-guide/rust/installation.md
index e698783195..540d4a10a0 100644
--- a/fluss-rust/website/docs/user-guide/rust/installation.md
+++ b/fluss-rust/website/docs/user-guide/rust/installation.md
@@ -7,7 +7,7 @@ The Fluss Rust client is published to [crates.io](https://crates.io/crates/fluss
 
 ```toml
 [dependencies]
-fluss-rs = "0.1"
+fluss-rs = "0.1.0"
 tokio = { version = "1", features = ["full"] }
 ```
 
@@ -16,7 +16,7 @@ tokio = { version = "1", features = ["full"] }
 ```toml
 [dependencies]
 # Default: memory and filesystem storage
-fluss-rs = "0.1"
+fluss-rs = "0.1.0"
 
 # With S3 storage support
 fluss-rs = { version = "0.1", features = ["storage-s3"] }

From 05b73f46fe5fe859b6afbd9c4b01bcaa441418cc Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 21 Mar 2026 03:32:26 +0000
Subject: [PATCH 208/287] chore: Idempotency bug: OOO loop when response is
 lost but subsequent batches succeed (#448)

---
 .../fluss/src/client/write/idempotence.rs     | 43 ++++++++++++++++++
 .../crates/fluss/src/client/write/sender.rs   | 44 ++++++++++++++-----
 2 files changed, 75 insertions(+), 12 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/write/idempotence.rs b/fluss-rust/crates/fluss/src/client/write/idempotence.rs
index 3c55f6ac5a..eeec8761b2 100644
--- a/fluss-rust/crates/fluss/src/client/write/idempotence.rs
+++ b/fluss-rust/crates/fluss/src/client/write/idempotence.rs
@@ -314,6 +314,19 @@ impl IdempotenceManager {
         }
     }
 
+    /// Returns true if the batch has already been committed on the server.
+    ///
+    /// A batch counts as committed when its sequence is less than or equal to the bucket's
+    /// `last_acked_sequence`: a batch with the same or a higher sequence was acknowledged, which
+    /// implies this batch was also written on the server. Returns false when the bucket has no
+    /// entry or `last_acked_sequence` is negative.
+    pub fn is_already_committed(&self, bucket: &TableBucket, batch_sequence: i32) -> bool {
+        let entries = self.bucket_entries.lock();
+        entries
+            .get(bucket)
+            .is_some_and(|e| e.last_acked_sequence >= 0 && batch_sequence <= e.last_acked_sequence)
+    }
+
     pub fn can_retry_for_error(
         &self,
         bucket: &TableBucket,
@@ -530,6 +543,36 @@ mod tests {
         assert!(mgr.can_send_more_requests(&b0)); // under limit again
     }
 
+    #[test]
+    fn test_is_already_committed() {
+        let mgr = IdempotenceManager::new(true, 5);
+        let b0 = test_bucket(0);
+        mgr.set_writer_id(42);
+
+        // No entry yet → not committed
+        assert!(!mgr.is_already_committed(&b0, 0));
+
+        // Initialize bucket and ack seq=0
+        let _ = mgr.next_sequence_and_increment(&b0); // 0
+        mgr.add_in_flight_batch(&b0, 0, 100);
+        mgr.handle_completed_batch(&b0, 100, 42); // last_acked=0
+
+        // seq=0 <= last_acked(0) → committed
+        assert!(mgr.is_already_committed(&b0, 0));
+        // seq=1 > last_acked(0) → not committed
+        assert!(!mgr.is_already_committed(&b0, 1));
+
+        // Ack up to seq=4, then check seq=0 still committed
+        for seq in 1..=4 {
+            let _ = mgr.next_sequence_and_increment(&b0);
+            mgr.add_in_flight_batch(&b0, seq, 100 + seq as i64);
+            mgr.handle_completed_batch(&b0, 100 + seq as i64, 42);
+        }
+        assert!(mgr.is_already_committed(&b0, 0)); // seq=0 <= last_acked(4)
+        assert!(mgr.is_already_committed(&b0, 4)); // seq=4 <= last_acked(4)
+        assert!(!mgr.is_already_committed(&b0, 5)); // seq=5 > last_acked(4)
+    }
+
     #[test]
     fn test_reset_batch_ids_cleaned_on_complete() {
         let (mgr, b0) = setup_three_in_flight();
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index b526e1a96e..dd5370d8ed 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -637,6 +637,35 @@ impl Sender {
         message: String,
     ) -> Result<Option<Arc<PhysicalTablePath>>> {
         let physical_table_path = Arc::clone(ready_write_batch.write_batch.physical_table_path());
+
+        if error == FlussError::DuplicateSequenceException {
+            warn!(
+                "Duplicate sequence for {} on bucket {}: {message}",
+                physical_table_path.as_ref(),
+                ready_write_batch.table_bucket.bucket_id()
+            );
+            self.complete_batch(ready_write_batch);
+            return Ok(None);
+        }
+
+        if error == FlussError::OutOfOrderSequenceException
+            && self.idempotence_manager.is_enabled()
+            && self.idempotence_manager.is_already_committed(
+                &ready_write_batch.table_bucket,
+                ready_write_batch.write_batch.batch_sequence(),
+            )
+        {
+            warn!(
+                "Batch for {} on bucket {} with sequence {} received OutOfOrderSequenceException \
+                 but has already been committed. Treating as success due to lost response.",
+                physical_table_path.as_ref(),
+                ready_write_batch.table_bucket.bucket_id(),
+                ready_write_batch.write_batch.batch_sequence(),
+            );
+            self.complete_batch(ready_write_batch);
+            return Ok(None);
+        }
+
         if self.can_retry(&ready_write_batch, error) {
             warn!(
                 "Retrying write batch for {} on bucket {} after error {error:?}: {message}",
@@ -680,18 +709,9 @@ impl Sender {
             return Ok(Self::is_invalid_metadata_error(error).then_some(physical_table_path));
         }
 
-        if error == FlussError::DuplicateSequenceException {
-            warn!(
-                "Duplicate sequence for {} on bucket {}: {message}",
-                physical_table_path.as_ref(),
-                ready_write_batch.table_bucket.bucket_id()
-            );
-            self.complete_batch(ready_write_batch);
-            return Ok(None);
-        }
-
-        // Generic error path. handle_failed_batch will detect OutOfOrderSequence /
-        // UnknownWriterId and reset all writer state internally (matching Java).
+        // Generic error path. handle_failed_batch will detect remaining
+        // OutOfOrderSequence (not already committed) / UnknownWriterId cases and
+        // reset all writer state internally (matching Java).
         // For other errors, only adjust sequences if the batch didn't exhaust its retries.
         let can_adjust = ready_write_batch.write_batch.attempts() < self.retries;
         self.fail_batch(

From ff98cc7afa8fa25a4e51cbf27818b23a13576dd6 Mon Sep 17 00:00:00 2001
From: Aryamaan Singh <71913204+toxicteddy00077@users.noreply.github.com>
Date: Mon, 23 Mar 2026 07:20:00 +0530
Subject: [PATCH 209/287] chore: added check to get_admin() before creating new
 admin (#369)

---
 fluss-rust/bindings/cpp/src/lib.rs            |  2 +-
 fluss-rust/bindings/cpp/test/test_utils.h     |  1 -
 fluss-rust/bindings/python/src/admin.rs       |  6 +-
 fluss-rust/bindings/python/src/table.rs       |  4 +-
 .../src/example_partitioned_kv_table.rs       | 10 +--
 fluss-rust/crates/fluss/src/client/admin.rs   | 73 +++++++++++--------
 .../crates/fluss/src/client/connection.rs     | 30 ++++++--
 .../crates/fluss/tests/integration/utils.rs   | 11 ++-
 8 files changed, 82 insertions(+), 55 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 284eec898f..82254ea95a 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -556,7 +556,7 @@ pub struct Connection {
 }
 
 pub struct Admin {
-    inner: fcore::client::FlussAdmin,
+    inner: Arc<fcore::client::FlussAdmin>,
 }
 
 pub struct Table {
diff --git a/fluss-rust/bindings/cpp/test/test_utils.h b/fluss-rust/bindings/cpp/test/test_utils.h
index 17a1da7684..1ff7e2810b 100644
--- a/fluss-rust/bindings/cpp/test/test_utils.h
+++ b/fluss-rust/bindings/cpp/test/test_utils.h
@@ -306,7 +306,6 @@ class FlussTestEnvironment : public ::testing::Environment {
             if (result.Ok()) {
                 auto admin_result = connection_.GetAdmin(admin_);
                 if (admin_result.Ok()) {
-                    // check tablet server is available
                     std::vector<fluss::ServerNode> nodes;
                     auto nodes_result = admin_.GetServerNodes(nodes);
                     if (nodes_result.Ok() &&
diff --git a/fluss-rust/bindings/python/src/admin.rs b/fluss-rust/bindings/python/src/admin.rs
index 703b13347b..5f4e45d5b9 100644
--- a/fluss-rust/bindings/python/src/admin.rs
+++ b/fluss-rust/bindings/python/src/admin.rs
@@ -532,10 +532,8 @@ impl FlussAdmin {
 
 impl FlussAdmin {
     // Internal method to create FlussAdmin from core admin
-    pub fn from_core(admin: fcore::client::FlussAdmin) -> Self {
-        Self {
-            __admin: Arc::new(admin),
-        }
+    pub fn from_core(admin: Arc<fcore::client::FlussAdmin>) -> Self {
+        Self { __admin: admin }
     }
 }
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 660cd6be16..8c9ea0e46b 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -1902,7 +1902,7 @@ macro_rules! with_scanner {
 #[pyclass]
 pub struct LogScanner {
     scanner: ScannerKind,
-    admin: fcore::client::FlussAdmin,
+    admin: Arc<fcore::client::FlussAdmin>,
     table_info: fcore::metadata::TableInfo,
     /// The projected Arrow schema to use for empty table creation
     projected_schema: SchemaRef,
@@ -2207,7 +2207,7 @@ impl LogScanner {
 impl LogScanner {
     fn new(
         scanner: ScannerKind,
-        admin: fcore::client::FlussAdmin,
+        admin: Arc<fcore::client::FlussAdmin>,
         table_info: fcore::metadata::TableInfo,
         projected_schema: SchemaRef,
         projected_row_type: fcore::metadata::RowType,
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index 9cd2e7df86..ba49934ee9 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -46,7 +46,7 @@ pub async fn main() -> Result<()> {
 
     let table_path = TablePath::new("fluss", "partitioned_kv_example");
 
-    let mut admin = conn.get_admin().await?;
+    let admin = conn.get_admin().await?;
     admin
         .create_table(&table_path, &table_descriptor, true)
         .await?;
@@ -55,9 +55,9 @@ pub async fn main() -> Result<()> {
         admin.get_table_info(&table_path).await?
     );
 
-    create_partition(&table_path, &mut admin, "APAC", 1).await;
-    create_partition(&table_path, &mut admin, "EMEA", 2).await;
-    create_partition(&table_path, &mut admin, "US", 3).await;
+    create_partition(&table_path, &admin, "APAC", 1).await;
+    create_partition(&table_path, &admin, "EMEA", 2).await;
+    create_partition(&table_path, &admin, "US", 3).await;
 
     let table = conn.get_table(&table_path).await?;
     let table_upsert = table.new_upsert()?;
@@ -129,7 +129,7 @@ pub async fn main() -> Result<()> {
     Ok(())
 }
 
-async fn create_partition(table_path: &TablePath, admin: &mut FlussAdmin, region: &str, zone: i64) {
+async fn create_partition(table_path: &TablePath, admin: &FlussAdmin, region: &str, zone: i64) {
     let mut partition_values = HashMap::new();
     partition_values.insert("region".to_string(), region.to_string());
     partition_values.insert("zone".to_string(), zone.to_string());
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 7a79e5ed99..7f1f64efca 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -38,30 +38,28 @@ use std::sync::Arc;
 use tokio::task::JoinHandle;
 
 pub struct FlussAdmin {
-    admin_gateway: ServerConnection,
-    #[allow(dead_code)]
     metadata: Arc<Metadata>,
-    #[allow(dead_code)]
     rpc_client: Arc<RpcClient>,
 }
 
 impl FlussAdmin {
-    pub async fn new(connections: Arc<RpcClient>, metadata: Arc<Metadata>) -> Result<Self> {
-        let admin_con =
-            connections
-                .get_connection(metadata.get_cluster().get_coordinator_server().ok_or_else(
-                    || Error::UnexpectedError {
-                        message: "Coordinator server not found in cluster metadata".to_string(),
-                        source: None,
-                    },
-                )?)
-                .await?;
-
-        Ok(FlussAdmin {
-            admin_gateway: admin_con,
+    pub fn new(connections: Arc<RpcClient>, metadata: Arc<Metadata>) -> Self {
+        FlussAdmin {
             metadata,
             rpc_client: connections,
-        })
+        }
+    }
+
+    async fn admin_gateway(&self) -> Result<ServerConnection> {
+        let cluster = self.metadata.get_cluster();
+        let coordinator =
+            cluster
+                .get_coordinator_server()
+                .ok_or_else(|| Error::UnexpectedError {
+                    message: "Coordinator server not found in cluster metadata".to_string(),
+                    source: None,
+                })?;
+        self.rpc_client.get_connection(coordinator).await
     }
 
     pub async fn create_database(
@@ -71,7 +69,8 @@ impl FlussAdmin {
         ignore_if_exists: bool,
     ) -> Result<()> {
         let _response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(CreateDatabaseRequest::new(
                 database_name,
                 database_descriptor,
@@ -88,7 +87,8 @@ impl FlussAdmin {
         ignore_if_exists: bool,
     ) -> Result<()> {
         let _response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(CreateTableRequest::new(
                 table_path,
                 table_descriptor,
@@ -104,7 +104,8 @@ impl FlussAdmin {
         ignore_if_not_exists: bool,
     ) -> Result<()> {
         let _response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(DropTableRequest::new(table_path, ignore_if_not_exists))
             .await?;
         Ok(())
@@ -112,7 +113,8 @@ impl FlussAdmin {
 
     pub async fn get_table_info(&self, table_path: &TablePath) -> Result<TableInfo> {
         let response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(GetTableRequest::new(table_path))
             .await?;
 
@@ -144,7 +146,8 @@ impl FlussAdmin {
     /// List all tables in the given database
     pub async fn list_tables(&self, database_name: &str) -> Result<Vec<String>> {
         let response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(ListTablesRequest::new(database_name))
             .await?;
         Ok(response.table_name)
@@ -162,7 +165,8 @@ impl FlussAdmin {
         partial_partition_spec: Option<&PartitionSpec>,
     ) -> Result<Vec<PartitionInfo>> {
         let response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(ListPartitionInfosRequest::new(
                 table_path,
                 partial_partition_spec,
@@ -179,7 +183,8 @@ impl FlussAdmin {
         ignore_if_exists: bool,
     ) -> Result<()> {
         let _response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(CreatePartitionRequest::new(
                 table_path,
                 partition_spec,
@@ -197,7 +202,8 @@ impl FlussAdmin {
         ignore_if_not_exists: bool,
     ) -> Result<()> {
         let _response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(DropPartitionRequest::new(
                 table_path,
                 partition_spec,
@@ -210,7 +216,8 @@ impl FlussAdmin {
     /// Check if a table exists
     pub async fn table_exists(&self, table_path: &TablePath) -> Result<bool> {
         let response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(TableExistsRequest::new(table_path))
             .await?;
         Ok(response.exists)
@@ -224,7 +231,8 @@ impl FlussAdmin {
         cascade: bool,
     ) -> Result<()> {
         let _response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(DropDatabaseRequest::new(
                 database_name,
                 ignore_if_not_exists,
@@ -237,7 +245,8 @@ impl FlussAdmin {
     /// List all databases
     pub async fn list_databases(&self) -> Result<Vec<String>> {
         let response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(ListDatabasesRequest::new())
             .await?;
         Ok(response.database_name)
@@ -246,7 +255,8 @@ impl FlussAdmin {
     /// Check if a database exists
     pub async fn database_exists(&self, database_name: &str) -> Result<bool> {
         let response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(DatabaseExistsRequest::new(database_name))
             .await?;
         Ok(response.exists)
@@ -255,7 +265,7 @@ impl FlussAdmin {
     /// Get database information
     pub async fn get_database_info(&self, database_name: &str) -> Result<DatabaseInfo> {
         let request = GetDatabaseInfoRequest::new(database_name);
-        let response = self.admin_gateway.request(request).await?;
+        let response = self.admin_gateway().await?.request(request).await?;
 
         // Convert proto response to DatabaseInfo
         let database_descriptor = DatabaseDescriptor::from_json_bytes(&response.database_json)?;
@@ -278,7 +288,8 @@ impl FlussAdmin {
     /// Get the latest lake snapshot for a table
     pub async fn get_latest_lake_snapshot(&self, table_path: &TablePath) -> Result<LakeSnapshot> {
         let response = self
-            .admin_gateway
+            .admin_gateway()
+            .await?
             .request(GetLatestLakeSnapshotRequest::new(table_path))
             .await?;
 
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 78e9362b8f..7dc1285f6f 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -20,14 +20,13 @@ use crate::client::admin::FlussAdmin;
 use crate::client::metadata::Metadata;
 use crate::client::table::FlussTable;
 use crate::config::Config;
+use crate::error::{Error, FlussError, Result};
+use crate::metadata::TablePath;
 use crate::rpc::RpcClient;
 use parking_lot::RwLock;
 use std::sync::Arc;
 use std::time::Duration;
 
-use crate::error::{Error, FlussError, Result};
-use crate::metadata::TablePath;
-
 // TODO: implement `close(&self, timeout: Duration)` to gracefully shut down the
 // writer client (drain pending batches, then force-close on timeout).
 // Java's FlussConnection.close() calls writerClient.close(Long.MAX_VALUE).
@@ -37,6 +36,7 @@ pub struct FlussConnection {
     network_connects: Arc<RpcClient>,
     args: Config,
     writer_client: RwLock<Option<Arc<WriterClient>>>,
+    admin_client: RwLock<Option<Arc<FlussAdmin>>>,
 }
 
 impl FlussConnection {
@@ -66,6 +66,7 @@ impl FlussConnection {
             network_connects: connections.clone(),
             args: arg.clone(),
             writer_client: Default::default(),
+            admin_client: RwLock::new(None),
         })
     }
 
@@ -81,8 +82,27 @@ impl FlussConnection {
         &self.args
     }
 
-    pub async fn get_admin(&self) -> Result<FlussAdmin> {
-        FlussAdmin::new(self.network_connects.clone(), self.metadata.clone()).await
+    pub async fn get_admin(&self) -> Result<Arc<FlussAdmin>> {
+        // 1. Fast path: return cached instance if already initialized.
+        if let Some(admin) = self.admin_client.read().as_ref() {
+            return Ok(admin.clone());
+        }
+
+        // 2. Slow path: acquire write lock.
+        let mut admin_guard = self.admin_client.write();
+
+        // 3. Double-check: another thread may have initialized while we waited.
+        if let Some(admin) = admin_guard.as_ref() {
+            return Ok(admin.clone());
+        }
+
+        // 4. Initialize and cache.
+        let admin = Arc::new(FlussAdmin::new(
+            self.network_connects.clone(),
+            self.metadata.clone(),
+        ));
+        *admin_guard = Some(admin.clone());
+        Ok(admin)
     }
 
     pub fn get_or_create_writer_client(&self) -> Result<Arc<WriterClient>> {
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index b53abc8609..970b84ae8e 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -109,12 +109,11 @@ pub async fn wait_for_cluster_ready_with_sasl(cluster: &FlussTestingCluster) {
         let connection = cluster
             .get_fluss_connection_with_sasl(username, password)
             .await;
-        if connection.get_admin().await.is_ok()
-            && connection
-                .get_metadata()
-                .get_cluster()
-                .get_one_available_server()
-                .is_some()
+        if connection
+            .get_metadata()
+            .get_cluster()
+            .get_one_available_server()
+            .is_some()
         {
             return;
         }

From ffa14b2051874514ac24f2704b79d53450736cdd Mon Sep 17 00:00:00 2001
From: yuxia Luo <luoyuxia@alumni.sjtu.edu.cn>
Date: Mon, 23 Mar 2026 10:21:48 +0800
Subject: [PATCH 210/287] chore: make get admin sync (#450)

---
 fluss-rust/bindings/cpp/src/lib.rs            |  2 +-
 fluss-rust/bindings/cpp/src/types.rs          |  2 +-
 fluss-rust/bindings/python/example/example.py |  2 +-
 fluss-rust/bindings/python/fluss/__init__.pyi |  2 +-
 fluss-rust/bindings/python/src/connection.rs  | 18 ++++--------
 fluss-rust/bindings/python/src/table.rs       |  1 -
 fluss-rust/bindings/python/test/conftest.py   |  4 +--
 .../bindings/python/test/test_sasl_auth.py    |  4 +--
 .../crates/examples/src/example_kv_table.rs   |  2 +-
 .../src/example_partitioned_kv_table.rs       |  2 +-
 .../crates/examples/src/example_table.rs      |  2 +-
 fluss-rust/crates/fluss/README.md             |  2 +-
 .../crates/fluss/src/client/connection.rs     |  2 +-
 .../crates/fluss/src/client/table/scanner.rs  |  4 +--
 .../crates/fluss/src/client/write/sender.rs   |  5 +---
 fluss-rust/crates/fluss/src/lib.rs            |  2 +-
 .../fluss/src/metadata/data_lake_format.rs    |  2 +-
 .../crates/fluss/src/metadata/datatype.rs     |  6 ++--
 .../crates/fluss/tests/integration/admin.rs   | 29 +++++++------------
 .../fluss/tests/integration/kv_table.rs       | 10 +++----
 .../fluss/tests/integration/log_table.rs      | 14 ++++-----
 .../fluss/tests/integration/sasl_auth.rs      |  2 --
 .../tests/integration/table_remote_scan.rs    |  2 +-
 .../docs/user-guide/python/api-reference.md   |  2 +-
 .../python/example/admin-operations.md        |  2 +-
 .../docs/user-guide/python/example/index.md   |  2 +-
 .../user-guide/python/example/log-tables.md   |  2 +-
 .../docs/user-guide/rust/api-reference.md     |  2 +-
 .../docs/user-guide/rust/error-handling.md    |  4 +--
 .../rust/example/admin-operations.md          |  2 +-
 .../docs/user-guide/rust/example/index.md     |  2 +-
 .../user-guide/rust/example/log-tables.md     |  2 +-
 .../rust/example/partitioned-tables.md        |  2 +-
 33 files changed, 61 insertions(+), 82 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 82254ea95a..778fef30e2 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -712,7 +712,7 @@ unsafe fn delete_connection(conn: *mut Connection) {
 
 impl Connection {
     fn get_admin(&self) -> ffi::FfiPtrResult {
-        let admin_result = RUNTIME.block_on(async { self.inner.get_admin().await });
+        let admin_result = self.inner.get_admin();
 
         match admin_result {
             Ok(admin) => {
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index f8efe677f4..3c0c6f7685 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -336,7 +336,7 @@ pub fn resolve_row_types(
                     Some(fcore::metadata::DataType::Decimal(dt)) => {
                         let (precision, scale) = (dt.precision(), dt.scale());
                         let bd = bigdecimal::BigDecimal::from_str(cow.as_ref()).map_err(|e| {
-                            anyhow!("Column {idx}: invalid decimal string '{}': {e}", cow)
+                            anyhow!("Column {idx}: invalid decimal string '{cow}': {e}")
                         })?;
                         let decimal = fcore::row::Decimal::from_big_decimal(bd, precision, scale)
                             .map_err(|e| anyhow!("Column {idx}: {e}"))?;
diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 3564d91cc5..52cefe1e6b 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -65,7 +65,7 @@ async def main():
     table_descriptor = fluss.TableDescriptor(fluss_schema)
 
     # Get the admin for Fluss
-    admin = await conn.get_admin()
+    admin = conn.get_admin()
 
     # Create a Fluss table
     table_path = fluss.TablePath("fluss", "sample_table_types")
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 95f30801e9..977845718a 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -233,7 +233,7 @@ class Config:
 class FlussConnection:
     @staticmethod
     async def create(config: Config) -> FlussConnection: ...
-    async def get_admin(self) -> FlussAdmin: ...
+    def get_admin(self) -> FlussAdmin: ...
     async def get_table(self, table_path: TablePath) -> FlussTable: ...
     def close(self) -> None: ...
     def __enter__(self) -> FlussConnection: ...
diff --git a/fluss-rust/bindings/python/src/connection.rs b/fluss-rust/bindings/python/src/connection.rs
index 31a9505bba..a8d2d9e37d 100644
--- a/fluss-rust/bindings/python/src/connection.rs
+++ b/fluss-rust/bindings/python/src/connection.rs
@@ -46,19 +46,13 @@ impl FlussConnection {
     }
 
     /// Get admin interface
-    fn get_admin<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        let client = self.inner.clone();
+    fn get_admin(&self, py: Python<'_>) -> PyResult<Py<FlussAdmin>> {
+        let admin = self
+            .inner
+            .get_admin()
+            .map_err(|e| FlussError::from_core_error(&e))?;
 
-        future_into_py(py, async move {
-            let admin = client
-                .get_admin()
-                .await
-                .map_err(|e| FlussError::from_core_error(&e))?;
-
-            let py_admin = FlussAdmin::from_core(admin);
-
-            Python::attach(|py| Py::new(py, py_admin))
-        })
+        Py::new(py, FlussAdmin::from_core(admin))
     }
 
     /// Get a table
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 8c9ea0e46b..cda8d3b201 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -508,7 +508,6 @@ impl TableScan {
 
             let admin = conn
                 .get_admin()
-                .await
                 .map_err(|e| FlussError::from_core_error(&e))?;
 
             let (projected_schema, projected_row_type) =
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
index 0e4cfe41b7..420747e66a 100644
--- a/fluss-rust/bindings/python/test/conftest.py
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -208,7 +208,7 @@ async def _connect_with_retry(bootstrap_servers, timeout=60):
         conn = None
         try:
             conn = await fluss.FlussConnection.create(config)
-            admin = await conn.get_admin()
+            admin = conn.get_admin()
             nodes = await admin.get_server_nodes()
             if any(n.server_type == "TabletServer" for n in nodes):
                 return conn
@@ -281,4 +281,4 @@ def plaintext_bootstrap_servers(fluss_cluster):
 @pytest_asyncio.fixture(scope="session")
 async def admin(connection):
     """Session-scoped admin client."""
-    return await connection.get_admin()
+    return connection.get_admin()
diff --git a/fluss-rust/bindings/python/test/test_sasl_auth.py b/fluss-rust/bindings/python/test/test_sasl_auth.py
index 30fce4ce6d..9dd2ddda3f 100644
--- a/fluss-rust/bindings/python/test/test_sasl_auth.py
+++ b/fluss-rust/bindings/python/test/test_sasl_auth.py
@@ -35,7 +35,7 @@ async def test_sasl_connect_with_valid_credentials(sasl_bootstrap_servers):
         "security.sasl.password": "admin-secret",
     })
     conn = await fluss.FlussConnection.create(config)
-    admin = await conn.get_admin()
+    admin = conn.get_admin()
 
     db_name = "py_sasl_test_valid_db"
     db_descriptor = fluss.DatabaseDescriptor(comment="created via SASL auth")
@@ -58,7 +58,7 @@ async def test_sasl_connect_with_second_user(sasl_bootstrap_servers):
         "security.sasl.password": "alice-secret",
     })
     conn = await fluss.FlussConnection.create(config)
-    admin = await conn.get_admin()
+    admin = conn.get_admin()
 
     # Basic operation to confirm functional connection
     assert not await admin.database_exists("some_nonexistent_db_alice")
diff --git a/fluss-rust/crates/examples/src/example_kv_table.rs b/fluss-rust/crates/examples/src/example_kv_table.rs
index 8fb60baa24..ad12ed79cf 100644
--- a/fluss-rust/crates/examples/src/example_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_kv_table.rs
@@ -43,7 +43,7 @@ pub async fn main() -> Result<()> {
 
     let table_path = TablePath::new("fluss", "rust_upsert_lookup_example");
 
-    let admin = conn.get_admin().await?;
+    let admin = conn.get_admin()?;
     admin
         .create_table(&table_path, &table_descriptor, true)
         .await?;
diff --git a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
index ba49934ee9..944d8d4962 100644
--- a/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
+++ b/fluss-rust/crates/examples/src/example_partitioned_kv_table.rs
@@ -46,7 +46,7 @@ pub async fn main() -> Result<()> {
 
     let table_path = TablePath::new("fluss", "partitioned_kv_example");
 
-    let admin = conn.get_admin().await?;
+    let admin = conn.get_admin()?;
     admin
         .create_table(&table_path, &table_descriptor, true)
         .await?;
diff --git a/fluss-rust/crates/examples/src/example_table.rs b/fluss-rust/crates/examples/src/example_table.rs
index 49f0ab4c6f..1f751f3c98 100644
--- a/fluss-rust/crates/examples/src/example_table.rs
+++ b/fluss-rust/crates/examples/src/example_table.rs
@@ -49,7 +49,7 @@ pub async fn main() -> Result<()> {
 
     let table_path = TablePath::new("fluss", "rust_test_long");
 
-    let admin = conn.get_admin().await?;
+    let admin = conn.get_admin()?;
 
     admin
         .create_table(&table_path, &table_descriptor, true)
diff --git a/fluss-rust/crates/fluss/README.md b/fluss-rust/crates/fluss/README.md
index b37a75df79..76dc0ec293 100644
--- a/fluss-rust/crates/fluss/README.md
+++ b/fluss-rust/crates/fluss/README.md
@@ -23,7 +23,7 @@ async fn main() -> Result<()> {
     let mut config = Config::default();
     config.bootstrap_servers = "127.0.0.1:9123".to_string();
     let connection = FlussConnection::new(config).await?;
-    let admin = connection.get_admin().await?;
+    let admin = connection.get_admin()?;
 
     // ---- Primary key (KV) table: upsert and lookup ----
     let kv_path = TablePath::new("fluss", "users");
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 7dc1285f6f..88f87e4c43 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -82,7 +82,7 @@ impl FlussConnection {
         &self.args
     }
 
-    pub async fn get_admin(&self) -> Result<Arc<FlussAdmin>> {
+    pub fn get_admin(&self) -> Result<Arc<FlussAdmin>> {
         // 1. Fast path: return cached instance if already initialized.
         if let Some(admin) = self.admin_client.read().as_ref() {
             return Ok(admin.clone());
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 43025393e8..ab7d441c0e 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -94,7 +94,7 @@ impl<'a> TableScan<'a> {
     ///             .build()?,
     ///         ).build()?;
     ///     let table_path = TablePath::new("fluss".to_owned(), "rust_test_long".to_owned());
-    ///     let admin = conn.get_admin().await?;
+    ///     let admin = conn.get_admin()?;
     ///     admin.create_table(&table_path, &table_descriptor, true)
     ///         .await?;
     ///     let table_info = admin.get_table_info(&table_path).await?;
@@ -169,7 +169,7 @@ impl<'a> TableScan<'a> {
     ///             .build()?,
     ///         ).build()?;
     ///     let table_path = TablePath::new("fluss".to_owned(), "rust_test_long".to_owned());
-    ///     let admin = conn.get_admin().await?;
+    ///     let admin = conn.get_admin()?;
     ///     admin.create_table(&table_path, &table_descriptor, true)
     ///         .await?;
     ///     let table = conn.get_table(&table_path).await?;
diff --git a/fluss-rust/crates/fluss/src/client/write/sender.rs b/fluss-rust/crates/fluss/src/client/write/sender.rs
index dd5370d8ed..8e738d0dc5 100644
--- a/fluss-rust/crates/fluss/src/client/write/sender.rs
+++ b/fluss-rust/crates/fluss/src/client/write/sender.rs
@@ -268,10 +268,7 @@ impl Sender {
             }
         }
 
-        debug!(
-            "Updated metadata for unknown leader tables: {:?}",
-            unknown_leaders
-        );
+        debug!("Updated metadata for unknown leader tables: {unknown_leaders:?}");
         Ok(())
     }
 
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index 13e85981c0..6537189e61 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -40,7 +40,7 @@
 //!     let mut config = Config::default();
 //!     config.bootstrap_servers = "127.0.0.1:9123".to_string();
 //!     let connection = FlussConnection::new(config).await?;
-//!     let admin = connection.get_admin().await?;
+//!     let admin = connection.get_admin()?;
 //!
 //!     // ---- Primary key (KV) table: upsert and lookup ----
 //!     let kv_path = TablePath::new("fluss", "users");
diff --git a/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs b/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
index b0c3b0d7b3..77e5ad3c1c 100644
--- a/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
+++ b/fluss-rust/crates/fluss/src/metadata/data_lake_format.rs
@@ -54,7 +54,7 @@ mod tests {
 
         for (raw, expected) in cases {
             let parsed = raw.parse::<DataLakeFormat>().unwrap();
-            assert_eq!(parsed, expected, "failed to parse: {}", raw);
+            assert_eq!(parsed, expected, "failed to parse: {raw}");
         }
 
         // negative cases
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 6d888d9de1..d9eb56b503 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -954,7 +954,7 @@ impl RowType {
             .iter()
             .map(|name| {
                 self.get_field_index(name).ok_or_else(|| IllegalArgument {
-                    message: format!("Field '{}' does not exist in the row type", name),
+                    message: format!("Field '{name}' does not exist in the row type"),
                 })
             })
             .collect::<Result<Vec<_>>>()?;
@@ -1522,7 +1522,7 @@ fn test_time_valid_precision() {
     // Test all valid precision values 0 through 9
     for precision in 0..=9 {
         let result = TimeType::with_nullable(true, precision);
-        assert!(result.is_ok(), "precision {} should be valid", precision);
+        assert!(result.is_ok(), "precision {precision} should be valid");
         let time = result.unwrap();
         assert_eq!(time.precision(), precision);
     }
@@ -1550,7 +1550,7 @@ fn test_timestamp_valid_precision() {
     // Test all valid precision values 0 through 9
     for precision in 0..=9 {
         let result = TimestampType::with_nullable(true, precision);
-        assert!(result.is_ok(), "precision {} should be valid", precision);
+        assert!(result.is_ok(), "precision {precision} should be valid");
         let timestamp_type = result.unwrap();
         assert_eq!(timestamp_type.precision(), precision);
     }
diff --git a/fluss-rust/crates/fluss/tests/integration/admin.rs b/fluss-rust/crates/fluss/tests/integration/admin.rs
index c64770468b..0860cbef97 100644
--- a/fluss-rust/crates/fluss/tests/integration/admin.rs
+++ b/fluss-rust/crates/fluss/tests/integration/admin.rs
@@ -30,7 +30,7 @@ mod admin_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("should get admin");
+        let admin = connection.get_admin().expect("should get admin");
 
         let db_descriptor = DatabaseDescriptorBuilder::default()
             .comment("test_db")
@@ -73,10 +73,7 @@ mod admin_test {
     async fn test_create_table() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection
-            .get_admin()
-            .await
-            .expect("Failed to get admin client");
+        let admin = connection.get_admin().expect("Failed to get admin client");
 
         let test_db_name = "test_create_table_db";
         let db_descriptor = DatabaseDescriptorBuilder::default()
@@ -202,10 +199,7 @@ mod admin_test {
     async fn test_partition_apis() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection
-            .get_admin()
-            .await
-            .expect("Failed to get admin client");
+        let admin = connection.get_admin().expect("Failed to get admin client");
 
         let test_db_name = "test_partition_apis_db";
         let db_descriptor = DatabaseDescriptorBuilder::default()
@@ -341,10 +335,7 @@ mod admin_test {
     async fn test_fluss_error_response() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection
-            .get_admin()
-            .await
-            .expect("Failed to get admin client");
+        let admin = connection.get_admin().expect("Failed to get admin client");
 
         let table_path = TablePath::new("fluss", "not_exist");
 
@@ -375,7 +366,7 @@ mod admin_test {
     async fn test_error_database_not_exist() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().await.unwrap();
+        let admin = connection.get_admin().unwrap();
 
         // get_database_info for non-existent database
         let result = admin.get_database_info("no_such_db").await;
@@ -394,7 +385,7 @@ mod admin_test {
     async fn test_error_database_already_exist() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().await.unwrap();
+        let admin = connection.get_admin().unwrap();
 
         let db_name = "test_error_db_already_exist";
         let descriptor = DatabaseDescriptorBuilder::default().build();
@@ -424,7 +415,7 @@ mod admin_test {
     async fn test_error_table_already_exist() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().await.unwrap();
+        let admin = connection.get_admin().unwrap();
 
         let db_name = "test_error_tbl_already_exist_db";
         let descriptor = DatabaseDescriptorBuilder::default().build();
@@ -472,7 +463,7 @@ mod admin_test {
     async fn test_error_table_not_exist() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().await.unwrap();
+        let admin = connection.get_admin().unwrap();
 
         let table_path = TablePath::new("fluss", "no_such_table");
 
@@ -491,7 +482,7 @@ mod admin_test {
     async fn test_get_server_nodes() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().await.unwrap();
+        let admin = connection.get_admin().unwrap();
 
         let nodes = admin
             .get_server_nodes()
@@ -534,7 +525,7 @@ mod admin_test {
     async fn test_error_table_not_partitioned() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().await.unwrap();
+        let admin = connection.get_admin().unwrap();
 
         let db_name = "test_error_not_partitioned_db";
         let descriptor = DatabaseDescriptorBuilder::default().build();
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index f0e0c5793d..b942988512 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -33,7 +33,7 @@ mod kv_table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.unwrap();
+        let admin = connection.get_admin().unwrap();
 
         let table_path = TablePath::new("fluss", "test_upsert_and_lookup");
 
@@ -172,7 +172,7 @@ mod kv_table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.unwrap();
+        let admin = connection.get_admin().unwrap();
 
         let table_path = TablePath::new("fluss", "test_composite_pk");
 
@@ -282,7 +282,7 @@ mod kv_table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_partial_update");
 
@@ -403,7 +403,7 @@ mod kv_table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_partitioned_kv_table");
 
@@ -573,7 +573,7 @@ mod kv_table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_all_datatypes");
 
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 4aa88ac4e0..330e143674 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -33,7 +33,7 @@ mod table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_append_record_batch_and_scan");
 
@@ -143,7 +143,7 @@ mod table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_list_offsets");
 
@@ -296,7 +296,7 @@ mod table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_project");
 
@@ -451,7 +451,7 @@ mod table_test {
     async fn test_poll_batches() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_poll_batches");
         let schema = Schema::builder()
@@ -584,7 +584,7 @@ mod table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_log_all_datatypes");
 
@@ -1015,7 +1015,7 @@ mod table_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_partitioned_log_append");
 
@@ -1309,7 +1309,7 @@ mod table_test {
     async fn undersized_row_returns_error() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_log_undersized_row");
 
diff --git a/fluss-rust/crates/fluss/tests/integration/sasl_auth.rs b/fluss-rust/crates/fluss/tests/integration/sasl_auth.rs
index 878c9830ac..439d65fee7 100644
--- a/fluss-rust/crates/fluss/tests/integration/sasl_auth.rs
+++ b/fluss-rust/crates/fluss/tests/integration/sasl_auth.rs
@@ -36,7 +36,6 @@ mod sasl_auth_test {
 
         let admin = connection
             .get_admin()
-            .await
             .expect("Should get admin with valid SASL credentials");
 
         // Perform a basic operation to confirm the connection is fully functional
@@ -69,7 +68,6 @@ mod sasl_auth_test {
 
         let admin = connection
             .get_admin()
-            .await
             .expect("Should get admin with alice credentials");
 
         // Basic operation to confirm functional connection
diff --git a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
index 52b8974e95..293c1f78c9 100644
--- a/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
+++ b/fluss-rust/crates/fluss/tests/integration/table_remote_scan.rs
@@ -28,7 +28,7 @@ mod table_remote_scan_test {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
-        let admin = connection.get_admin().await.expect("Failed to get admin");
+        let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_scan_remote_log");
 
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index a4b594bce3..1268d37f9f 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -36,7 +36,7 @@ Complete API reference for the Fluss Python client.
 | Method                                                    |  Description                          |
 |-----------------------------------------------------------|---------------------------------------|
 | `await FlussConnection.create(config) -> FlussConnection` | Connect to a Fluss cluster            |
-| `await conn.get_admin() -> FlussAdmin`                    | Get admin interface                   |
+| `conn.get_admin() -> FlussAdmin`                        | Get admin interface                   |
 | `await conn.get_table(table_path) -> FlussTable`          | Get a table for read/write operations |
 | `conn.close()`                                            | Close the connection                  |
 
diff --git a/fluss-rust/website/docs/user-guide/python/example/admin-operations.md b/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
index ba3748a050..2cda6c4abf 100644
--- a/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
+++ b/fluss-rust/website/docs/user-guide/python/example/admin-operations.md
@@ -4,7 +4,7 @@ sidebar_position: 3
 # Admin Operations
 
 ```python
-admin = await conn.get_admin()
+admin = conn.get_admin()
 ```
 
 ## Databases
diff --git a/fluss-rust/website/docs/user-guide/python/example/index.md b/fluss-rust/website/docs/user-guide/python/example/index.md
index 389b648698..ec9fa78f45 100644
--- a/fluss-rust/website/docs/user-guide/python/example/index.md
+++ b/fluss-rust/website/docs/user-guide/python/example/index.md
@@ -14,7 +14,7 @@ async def main():
     # Connect
     config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
     conn = await fluss.FlussConnection.create(config)
-    admin = await conn.get_admin()
+    admin = conn.get_admin()
 
     # Create a log table
     schema = fluss.Schema(pa.schema([
diff --git a/fluss-rust/website/docs/user-guide/python/example/log-tables.md b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
index adaa162ada..c320bf4813 100644
--- a/fluss-rust/website/docs/user-guide/python/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
@@ -112,7 +112,7 @@ scanner.unsubscribe(bucket_id=0)
 To only consume new records (skip existing data), first resolve the current latest offset via `list_offsets`, then subscribe at that offset:
 
 ```python
-admin = await conn.get_admin()
+admin = conn.get_admin()
 offsets = await admin.list_offsets(table_path, [0], fluss.OffsetSpec.latest())
 latest = offsets[0]
 
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index fbe3428c14..a4befa5e3c 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -35,7 +35,7 @@ Complete API reference for the Fluss Rust client.
 | Method                                                                        | Description                                    |
 |-------------------------------------------------------------------------------|------------------------------------------------|
 | `async fn new(config: Config) -> Result<Self>`                                | Create a new connection to a Fluss cluster     |
-| `async fn get_admin(&self) -> Result<FlussAdmin>`                             | Get the admin interface for cluster management |
+| `fn get_admin(&self) -> Result<Arc<FlussAdmin>>`                              | Get the admin interface for cluster management |
 | `async fn get_table(&self, table_path: &TablePath) -> Result<FlussTable<'_>>` | Get a table for read/write operations          |
 | `fn config(&self) -> &Config`                                                 | Get a reference to the connection config       |
 
diff --git a/fluss-rust/website/docs/user-guide/rust/error-handling.md b/fluss-rust/website/docs/user-guide/rust/error-handling.md
index b7e4b45436..4966428997 100644
--- a/fluss-rust/website/docs/user-guide/rust/error-handling.md
+++ b/fluss-rust/website/docs/user-guide/rust/error-handling.md
@@ -12,7 +12,7 @@ use fluss::error::{Error, Result};
 
 // All operations return Result<T>
 let conn = FlussConnection::new(config).await?;
-let admin = conn.get_admin().await?;
+let admin = conn.get_admin()?;
 let table = conn.get_table(&table_path).await?;
 ```
 
@@ -217,7 +217,7 @@ use fluss::error::Result;
 
 async fn my_pipeline() -> Result<()> {
     let conn = FlussConnection::new(config).await?;
-    let admin = conn.get_admin().await?;
+    let admin = conn.get_admin()?;
     let table = conn.get_table(&table_path).await?;
     let writer = table.new_append()?.create_writer()?;
     writer.append(&row)?;
diff --git a/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md b/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md
index d18ad0eca5..39752754f1 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/admin-operations.md
@@ -6,7 +6,7 @@ sidebar_position: 3
 ## Get Admin Interface
 
 ```rust
-let admin = conn.get_admin().await?;
+let admin = conn.get_admin()?;
 ```
 
 ## Database Operations
diff --git a/fluss-rust/website/docs/user-guide/rust/example/index.md b/fluss-rust/website/docs/user-guide/rust/example/index.md
index e35c8dc3f3..f1d5a6882d 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/index.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/index.md
@@ -19,7 +19,7 @@ async fn main() -> Result<()> {
     let mut config = Config::default();
     config.bootstrap_servers = "127.0.0.1:9123".to_string();
     let conn = FlussConnection::new(config).await?;
-    let admin = conn.get_admin().await?;
+    let admin = conn.get_admin()?;
 
     // Create a log table
     let table_path = TablePath::new("fluss", "quickstart_rust");
diff --git a/fluss-rust/website/docs/user-guide/rust/example/log-tables.md b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
index 7c01cf1ccd..0485779699 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
@@ -106,7 +106,7 @@ To start reading only new records, first resolve the current latest offset via `
 ```rust
 use fluss::rpc::message::OffsetSpec;
 
-let admin = conn.get_admin().await?;
+let admin = conn.get_admin()?;
 let offsets = admin.list_offsets(&table_path, &[0], OffsetSpec::Latest).await?;
 let latest = offsets[&0];
 log_scanner.subscribe(0, latest).await?;
diff --git a/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md b/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
index 40bd4d60c2..38517e165d 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
@@ -65,7 +65,7 @@ For partitioned tables, use partition-aware subscribe methods.
 use std::time::Duration;
 
 let table = conn.get_table(&table_path).await?;
-let admin = conn.get_admin().await?;
+let admin = conn.get_admin()?;
 let partitions = admin.list_partition_infos(&table_path).await?;
 
 let log_scanner = table.new_scan().create_log_scanner()?;

From 5a230cb7c3b793ed76dad514c0acf4172e52bea4 Mon Sep 17 00:00:00 2001
From: "zhengyunhong.zyh" <zhengyunhong.zyh@alibaba-inc.com>
Date: Mon, 23 Mar 2026 20:21:09 +0800
Subject: [PATCH 211/287] chore: update dependency list for release 0.1.0

---
 fluss-rust/DEPENDENCIES.rust.tsv              | 335 +++++-----
 fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv | 326 +++++----
 .../bindings/python/DEPENDENCIES.rust.tsv     | 627 +++++++++---------
 .../crates/examples/DEPENDENCIES.rust.tsv     | 606 +++++++++--------
 fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv | 602 +++++++++--------
 5 files changed, 1231 insertions(+), 1265 deletions(-)

diff --git a/fluss-rust/DEPENDENCIES.rust.tsv b/fluss-rust/DEPENDENCIES.rust.tsv
index be7d2c8ee1..b46eeac210 100644
--- a/fluss-rust/DEPENDENCIES.rust.tsv
+++ b/fluss-rust/DEPENDENCIES.rust.tsv
@@ -1,29 +1,28 @@
 crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense	Zlib
 ahash@0.8.12	X									X			
-aho-corasick@1.1.3										X		X	
-android-tzdata@0.1.1	X									X			
+aho-corasick@1.1.4										X		X	
 android_system_properties@0.1.5	X									X			
-anstream@0.6.20	X									X			
-anstyle@1.0.11	X									X			
-anstyle-parse@0.2.7	X									X			
-anstyle-query@1.1.4	X									X			
-anstyle-wincon@3.0.10	X									X			
-anyhow@1.0.100	X									X			
-arrow@57.1.0	X												
-arrow-arith@57.1.0	X												
-arrow-array@57.1.0	X												
-arrow-buffer@57.1.0	X												
-arrow-cast@57.1.0	X												
-arrow-csv@57.1.0	X												
-arrow-data@57.1.0	X												
-arrow-ipc@57.1.0	X												
-arrow-json@57.1.0	X												
-arrow-ord@57.1.0	X												
-arrow-pyarrow@57.1.0	X												
-arrow-row@57.1.0	X												
-arrow-schema@57.1.0	X												
-arrow-select@57.1.0	X												
-arrow-string@57.1.0	X												
+anstream@1.0.0	X									X			
+anstyle@1.0.14	X									X			
+anstyle-parse@1.0.0	X									X			
+anstyle-query@1.1.5	X									X			
+anstyle-wincon@3.0.11	X									X			
+anyhow@1.0.102	X									X			
+arrow@57.3.0	X												
+arrow-arith@57.3.0	X												
+arrow-array@57.3.0	X												
+arrow-buffer@57.3.0	X												
+arrow-cast@57.3.0	X												
+arrow-csv@57.3.0	X												
+arrow-data@57.3.0	X												
+arrow-ipc@57.3.0	X												
+arrow-json@57.3.0	X												
+arrow-ord@57.3.0	X												
+arrow-pyarrow@57.3.0	X												
+arrow-row@57.3.0	X												
+arrow-schema@57.3.0	X												
+arrow-select@57.3.0	X												
+arrow-string@57.3.0	X												
 async-trait@0.1.89	X									X			
 atoi@2.0.0										X			
 atomic-waker@1.1.2	X									X			
@@ -31,21 +30,21 @@ autocfg@1.5.0	X									X
 backon@1.6.0	X												
 base64@0.22.1	X									X			
 bigdecimal@0.4.10	X									X			
-bitflags@2.9.3	X									X			
+bitflags@2.11.0	X									X			
 bitvec@1.0.1										X			
 block-buffer@0.10.4	X									X			
-bumpalo@3.19.0	X									X			
+bumpalo@3.20.2	X									X			
 byteorder@1.5.0										X		X	
 bytes@1.11.1										X			
-cc@1.2.34	X									X			
-cfg-if@1.0.3	X									X			
-chrono@0.4.41	X									X			
-clap@4.5.45	X									X			
-clap_builder@4.5.44	X									X			
-clap_derive@4.5.45	X									X			
-clap_lex@0.7.5	X									X			
+cc@1.2.57	X									X			
+cfg-if@1.0.4	X									X			
+chrono@0.4.44	X									X			
+clap@4.6.0	X									X			
+clap_builder@4.6.0	X									X			
+clap_derive@4.6.0	X									X			
+clap_lex@1.1.0	X									X			
 codespan-reporting@0.13.1	X												
-colorchoice@1.0.4	X									X			
+colorchoice@1.0.5	X									X			
 const-oid@0.9.6	X									X			
 const-random@0.1.18	X									X			
 const-random-macro@0.1.16	X									X			
@@ -55,276 +54,272 @@ crc32c@0.6.8	X									X
 crossbeam-utils@0.8.21	X									X			
 crunchy@0.2.4										X			
 crypto-common@0.1.7	X									X			
-csv@1.3.1										X		X	
-csv-core@0.1.12										X		X	
-cxx@1.0.190	X									X			
-cxx-build@1.0.190	X									X			
-cxxbridge-flags@1.0.190	X									X			
-cxxbridge-macro@1.0.190	X									X			
+csv@1.4.0										X		X	
+csv-core@0.1.13										X		X	
+cxx@1.0.194	X									X			
+cxx-build@1.0.194	X									X			
+cxxbridge-flags@1.0.194	X									X			
+cxxbridge-macro@1.0.194	X									X			
 dashmap@6.1.0										X			
 delegate@0.13.5	X									X			
 digest@0.10.7	X									X			
 displaydoc@0.2.5	X									X			
 either@1.15.0	X									X			
 equivalent@1.0.2	X									X			
-errno@0.3.13	X									X			
+errno@0.3.14	X									X			
 fastrand@2.3.0	X									X			
+find-msvc-tools@0.1.9	X									X			
 fixedbitset@0.5.7	X									X			
-flatbuffers@25.2.10	X												
+flatbuffers@25.12.19	X												
 fluss-cpp@0.1.0	X												
 fluss-examples@0.1.0	X												
 fluss-rs@0.1.0	X												
 fluss_python@0.1.0	X												
 fnv@1.0.7	X									X			
+foldhash@0.1.5													X
 foldhash@0.2.0													X
 form_urlencoded@1.2.2	X									X			
 funty@2.0.0										X			
-futures@0.3.31	X									X			
-futures-channel@0.3.31	X									X			
-futures-core@0.3.31	X									X			
-futures-executor@0.3.31	X									X			
-futures-io@0.3.31	X									X			
-futures-macro@0.3.31	X									X			
-futures-sink@0.3.31	X									X			
-futures-task@0.3.31	X									X			
-futures-util@0.3.31	X									X			
+futures@0.3.32	X									X			
+futures-channel@0.3.32	X									X			
+futures-core@0.3.32	X									X			
+futures-executor@0.3.32	X									X			
+futures-io@0.3.32	X									X			
+futures-macro@0.3.32	X									X			
+futures-sink@0.3.32	X									X			
+futures-task@0.3.32	X									X			
+futures-util@0.3.32	X									X			
 generic-array@0.14.7										X			
-getrandom@0.2.16	X									X			
-getrandom@0.3.3	X									X			
+getrandom@0.2.17	X									X			
+getrandom@0.3.4	X									X			
+getrandom@0.4.2	X									X			
 gloo-timers@0.3.0	X									X			
-h2@0.4.12										X			
-half@2.6.0	X									X			
+h2@0.4.13										X			
+half@2.7.1	X									X			
 hashbrown@0.14.5	X									X			
 hashbrown@0.15.5	X									X			
 hashbrown@0.16.1	X									X			
 heck@0.5.0	X									X			
 hex@0.4.3	X									X			
 hmac@0.12.1	X									X			
-home@0.5.11	X									X			
-http@1.3.1	X									X			
+home@0.5.12	X									X			
+http@1.4.0	X									X			
 http-body@1.0.1										X			
 http-body-util@0.1.3										X			
 httparse@1.10.1	X									X			
 httpdate@1.0.3	X									X			
-hyper@1.7.0										X			
+hyper@1.8.1										X			
 hyper-rustls@0.27.7	X							X		X			
-hyper-util@0.1.17										X			
-iana-time-zone@0.1.63	X									X			
+hyper-util@0.1.20										X			
+iana-time-zone@0.1.65	X									X			
 iana-time-zone-haiku@0.1.2	X									X			
-icu_collections@2.0.0											X		
-icu_locale_core@2.0.0											X		
-icu_normalizer@2.0.0											X		
-icu_normalizer_data@2.0.0											X		
-icu_properties@2.0.1											X		
-icu_properties_data@2.0.1											X		
-icu_provider@2.0.0											X		
+icu_collections@2.1.1											X		
+icu_locale_core@2.1.1											X		
+icu_normalizer@2.1.1											X		
+icu_normalizer_data@2.1.1											X		
+icu_properties@2.1.2											X		
+icu_properties_data@2.1.2											X		
+icu_provider@2.1.1											X		
 idna@1.1.0	X									X			
 idna_adapter@1.2.1	X									X			
-indexmap@2.11.0	X									X			
-indoc@2.0.6	X									X			
-ipnet@2.11.0	X									X			
-iri-string@0.7.9	X									X			
-is_terminal_polyfill@1.70.1	X									X			
+indexmap@2.13.0	X									X			
+indoc@2.0.7	X									X			
+ipnet@2.12.0	X									X			
+iri-string@0.7.11	X									X			
+is_terminal_polyfill@1.70.2	X									X			
 itertools@0.14.0	X									X			
-itoa@1.0.15	X									X			
-jiff@0.2.16										X		X	
-jiff-tzdb@0.1.5										X		X	
+itoa@1.0.18	X									X			
+jiff@0.2.23										X		X	
+jiff-tzdb@0.1.6										X		X	
 jiff-tzdb-platform@0.1.3										X		X	
 jobserver@0.1.34	X									X			
-js-sys@0.3.77	X									X			
-lexical-core@1.0.5	X									X			
-lexical-parse-float@1.0.5	X									X			
-lexical-parse-integer@1.0.5	X									X			
-lexical-util@1.0.6	X									X			
-lexical-write-float@1.0.5	X									X			
-lexical-write-integer@1.0.5	X									X			
-libc@0.2.175	X									X			
-libm@0.2.15										X			
+js-sys@0.3.91	X									X			
+lexical-core@1.0.6	X									X			
+lexical-parse-float@1.0.6	X									X			
+lexical-parse-integer@1.0.6	X									X			
+lexical-util@1.0.7	X									X			
+lexical-write-float@1.0.6	X									X			
+lexical-write-integer@1.0.6	X									X			
+libc@0.2.183	X									X			
+libm@0.2.16										X			
 link-cplusplus@1.0.12	X									X			
 linked-hash-map@0.5.6	X									X			
-linux-raw-sys@0.9.4	X	X								X			
-litemap@0.8.0											X		
-lock_api@0.4.13	X									X			
-log@0.4.27	X									X			
-lz4_flex@0.12.0										X			
+linux-raw-sys@0.12.1	X	X								X			
+litemap@0.8.1											X		
+lock_api@0.4.14	X									X			
+log@0.4.29	X									X			
+lz4_flex@0.12.1										X			
 md-5@0.10.6	X									X			
-memchr@2.7.5										X		X	
+memchr@2.8.0										X		X	
 memoffset@0.9.1										X			
-mio@1.0.4										X			
+mio@1.1.1										X			
 multimap@0.10.1	X									X			
 num-bigint@0.4.6	X									X			
 num-complex@0.4.6	X									X			
 num-integer@0.1.46	X									X			
 num-traits@0.2.19	X									X			
-once_cell@1.21.3	X									X			
-once_cell_polyfill@1.70.1	X									X			
+once_cell@1.21.4	X									X			
+once_cell_polyfill@1.70.2	X									X			
 opendal@0.55.0	X												
 ordered-float@5.1.0										X			
-parking_lot@0.12.4	X									X			
-parking_lot_core@0.9.11	X									X			
+parking_lot@0.12.5	X									X			
+parking_lot_core@0.9.12	X									X			
 parse-display@0.10.0	X									X			
 parse-display-derive@0.10.0	X									X			
 percent-encoding@2.3.2	X									X			
-petgraph@0.7.1	X									X			
-pin-project-lite@0.2.16	X									X			
+petgraph@0.8.3	X									X			
+pin-project-lite@0.2.17	X									X			
 pin-utils@0.1.0	X									X			
 pkg-config@0.3.32	X									X			
-portable-atomic@1.11.1	X									X			
-portable-atomic-util@0.2.4	X									X			
-potential_utf@0.1.3											X		
+portable-atomic@1.13.1	X									X			
+portable-atomic-util@0.2.6	X									X			
+potential_utf@0.1.4											X		
 ppv-lite86@0.2.21	X									X			
 prettyplease@0.2.37	X									X			
-proc-macro2@1.0.101	X									X			
-prost@0.14.1	X												
-prost-build@0.14.1	X												
-prost-derive@0.14.1	X												
-prost-types@0.14.1	X												
+proc-macro2@1.0.106	X									X			
+prost@0.14.3	X												
+prost-build@0.14.3	X												
+prost-derive@0.14.3	X												
+prost-types@0.14.3	X												
 pyo3@0.26.0	X									X			
 pyo3-async-runtimes@0.26.0	X												
 pyo3-build-config@0.26.0	X									X			
 pyo3-ffi@0.26.0	X									X			
 pyo3-macros@0.26.0	X									X			
 pyo3-macros-backend@0.26.0	X									X			
+python3-dll-a@0.2.14										X			
 quick-xml@0.37.5										X			
 quick-xml@0.38.4										X			
-quote@1.0.40	X									X			
+quote@1.0.45	X									X			
 r-efi@5.3.0	X								X	X			
+r-efi@6.0.0	X								X	X			
 radium@0.7.0										X			
 rand@0.8.5	X									X			
 rand@0.9.2	X									X			
 rand_chacha@0.3.1	X									X			
 rand_chacha@0.9.0	X									X			
 rand_core@0.6.4	X									X			
-rand_core@0.9.3	X									X			
-redox_syscall@0.5.17										X			
-regex@1.11.2	X									X			
-regex-automata@0.4.10	X									X			
-regex-syntax@0.8.6	X									X			
+rand_core@0.9.5	X									X			
+redox_syscall@0.5.18										X			
+regex@1.12.3	X									X			
+regex-automata@0.4.14	X									X			
+regex-syntax@0.8.10	X									X			
 reqsign@0.16.5	X												
-reqwest@0.12.25	X									X			
+reqwest@0.12.28	X									X			
 ring@0.17.14	X							X					
 rustc_version@0.4.1	X									X			
-rustix@1.0.8	X	X								X			
-rustls@0.23.32	X							X		X			
-rustls-pki-types@1.12.0	X									X			
-rustls-webpki@0.103.7								X					
+rustix@1.1.4	X	X								X			
+rustls@0.23.37	X							X		X			
+rustls-pki-types@1.14.0	X									X			
+rustls-webpki@0.103.10								X					
 rustversion@1.0.22	X									X			
-ryu@1.0.20	X				X								
+ryu@1.0.23	X				X								
 scopeguard@1.2.0	X									X			
 scratch@1.0.9	X									X			
-semver@1.0.26	X									X			
+semver@1.0.27	X									X			
 serde@1.0.228	X									X			
 serde_core@1.0.228	X									X			
 serde_derive@1.0.228	X									X			
-serde_json@1.0.143	X									X			
+serde_json@1.0.149	X									X			
 serde_urlencoded@0.7.1	X									X			
 sha1@0.10.6	X									X			
 sha2@0.10.9	X									X			
 shlex@1.3.0	X									X			
-signal-hook-registry@1.4.6	X									X			
+signal-hook-registry@1.4.8	X									X			
 simdutf8@0.1.5	X									X			
-slab@0.4.11										X			
+slab@0.4.12										X			
 smallvec@1.15.1	X									X			
 snafu@0.8.9	X									X			
 snafu-derive@0.8.9	X									X			
-socket2@0.6.0	X									X			
+socket2@0.6.3	X									X			
 stable_deref_trait@1.2.1	X									X			
-static_assertions@1.1.0	X									X			
 strsim@0.11.1										X			
 structmeta@0.3.0	X									X			
 structmeta-derive@0.3.0	X									X			
 strum@0.26.3										X			
 strum_macros@0.26.4										X			
 subtle@2.6.1				X									
-syn@2.0.106	X									X			
+syn@2.0.117	X									X			
 sync_wrapper@1.0.2	X												
 synstructure@0.13.2										X			
 tap@1.0.1										X			
-target-lexicon@0.13.3		X											
-tempfile@3.23.0	X									X			
+target-lexicon@0.13.5		X											
+tempfile@3.27.0	X									X			
 termcolor@1.4.1										X		X	
 thiserror@1.0.69	X									X			
 thiserror-impl@1.0.69	X									X			
+tikv-jemalloc-sys@0.6.1+5.3.0-1-ge13ca993e8ccb9ba9847cc330696e02839f328f7	X									X			
+tikv-jemallocator@0.6.1	X									X			
 tiny-keccak@2.0.2						X							
-tinystr@0.8.1											X		
-tokio@1.48.0										X			
-tokio-macros@2.6.0										X			
+tinystr@0.8.2											X		
+tokio@1.50.0										X			
+tokio-macros@2.6.1										X			
 tokio-rustls@0.26.4	X									X			
-tokio-util@0.7.16										X			
-tower@0.5.2										X			
+tokio-util@0.7.18										X			
+tower@0.5.3										X			
 tower-http@0.6.8										X			
 tower-layer@0.3.3										X			
 tower-service@0.3.3										X			
-tracing@0.1.41										X			
-tracing-attributes@0.1.30										X			
-tracing-core@0.1.34										X			
+tracing@0.1.44										X			
+tracing-attributes@0.1.31										X			
+tracing-core@0.1.36										X			
 try-lock@0.2.5										X			
 twox-hash@2.1.2										X			
 typenum@1.19.0	X									X			
-unicode-ident@1.0.18	X									X	X		
+unicode-ident@1.0.24	X									X	X		
 unicode-width@0.2.2	X									X			
 unindent@0.2.4	X									X			
 untrusted@0.9.0								X					
-url@2.5.7	X									X			
+url@2.5.8	X									X			
 utf8_iter@1.0.4	X									X			
 utf8parse@0.2.2	X									X			
-uuid@1.18.0	X									X			
+uuid@1.22.0	X									X			
 value-bag@1.12.0	X									X			
 version_check@0.9.5	X									X			
 want@0.3.1										X			
 wasi@0.11.1+wasi-snapshot-preview1	X	X								X			
-wasi@0.14.2+wasi-0.2.4	X	X								X			
-wasm-bindgen@0.2.100	X									X			
-wasm-bindgen-backend@0.2.100	X									X			
-wasm-bindgen-futures@0.4.50	X									X			
-wasm-bindgen-macro@0.2.100	X									X			
-wasm-bindgen-macro-support@0.2.100	X									X			
-wasm-bindgen-shared@0.2.100	X									X			
+wasip2@1.0.2+wasi-0.2.9	X	X								X			
+wasip3@0.4.0+wasi-0.3.0-rc-2026-01-06	X	X								X			
+wasm-bindgen@0.2.114	X									X			
+wasm-bindgen-futures@0.4.64	X									X			
+wasm-bindgen-macro@0.2.114	X									X			
+wasm-bindgen-macro-support@0.2.114	X									X			
+wasm-bindgen-shared@0.2.114	X									X			
 wasm-streams@0.4.2	X									X			
-web-sys@0.3.77	X									X			
-webpki-roots@1.0.3							X						
+web-sys@0.3.91	X									X			
+webpki-roots@1.0.6							X						
 winapi-util@0.1.11										X		X	
-windows-core@0.61.2	X									X			
-windows-implement@0.60.0	X									X			
-windows-interface@0.59.1	X									X			
-windows-link@0.1.3	X									X			
+windows-core@0.62.2	X									X			
+windows-implement@0.60.2	X									X			
+windows-interface@0.59.3	X									X			
 windows-link@0.2.1	X									X			
-windows-result@0.3.4	X									X			
-windows-strings@0.4.2	X									X			
+windows-result@0.4.1	X									X			
+windows-strings@0.5.1	X									X			
 windows-sys@0.52.0	X									X			
-windows-sys@0.59.0	X									X			
-windows-sys@0.60.2	X									X			
 windows-sys@0.61.2	X									X			
 windows-targets@0.52.6	X									X			
-windows-targets@0.53.3	X									X			
 windows_aarch64_gnullvm@0.52.6	X									X			
-windows_aarch64_gnullvm@0.53.0	X									X			
 windows_aarch64_msvc@0.52.6	X									X			
-windows_aarch64_msvc@0.53.0	X									X			
 windows_i686_gnu@0.52.6	X									X			
-windows_i686_gnu@0.53.0	X									X			
 windows_i686_gnullvm@0.52.6	X									X			
-windows_i686_gnullvm@0.53.0	X									X			
 windows_i686_msvc@0.52.6	X									X			
-windows_i686_msvc@0.53.0	X									X			
 windows_x86_64_gnu@0.52.6	X									X			
-windows_x86_64_gnu@0.53.0	X									X			
 windows_x86_64_gnullvm@0.52.6	X									X			
-windows_x86_64_gnullvm@0.53.0	X									X			
 windows_x86_64_msvc@0.52.6	X									X			
-windows_x86_64_msvc@0.53.0	X									X			
-wit-bindgen-rt@0.39.0	X	X								X			
-writeable@0.6.1											X		
+wit-bindgen@0.51.0	X	X								X			
+writeable@0.6.2											X		
 wyz@0.5.1										X			
-yoke@0.8.0											X		
-yoke-derive@0.8.0											X		
-zerocopy@0.8.26	X		X							X			
+yoke@0.8.1											X		
+yoke-derive@0.8.1											X		
+zerocopy@0.8.47	X		X							X			
+zerocopy-derive@0.8.47	X		X							X			
 zerofrom@0.1.6											X		
 zerofrom-derive@0.1.6											X		
 zeroize@1.8.2	X									X			
-zerotrie@0.2.2											X		
-zerovec@0.11.4											X		
-zerovec-derive@0.11.1											X		
+zerotrie@0.2.3											X		
+zerovec@0.11.5											X		
+zerovec-derive@0.11.2											X		
+zmij@1.0.21										X			
 zstd@0.13.3										X			
 zstd-safe@7.2.4	X									X			
 zstd-sys@2.0.16+zstd.1.5.7	X									X			
diff --git a/fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv b/fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv
index b2324052e7..89dbf76539 100644
--- a/fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv
+++ b/fluss-rust/bindings/cpp/DEPENDENCIES.rust.tsv
@@ -1,28 +1,27 @@
 crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense	Zlib
 ahash@0.8.12	X									X			
-aho-corasick@1.1.3										X		X	
-android-tzdata@0.1.1	X									X			
+aho-corasick@1.1.4										X		X	
 android_system_properties@0.1.5	X									X			
-anstream@0.6.20	X									X			
-anstyle@1.0.11	X									X			
-anstyle-parse@0.2.7	X									X			
-anstyle-query@1.1.4	X									X			
-anstyle-wincon@3.0.10	X									X			
-anyhow@1.0.100	X									X			
-arrow@57.1.0	X												
-arrow-arith@57.1.0	X												
-arrow-array@57.1.0	X												
-arrow-buffer@57.1.0	X												
-arrow-cast@57.1.0	X												
-arrow-csv@57.1.0	X												
-arrow-data@57.1.0	X												
-arrow-ipc@57.1.0	X												
-arrow-json@57.1.0	X												
-arrow-ord@57.1.0	X												
-arrow-row@57.1.0	X												
-arrow-schema@57.1.0	X												
-arrow-select@57.1.0	X												
-arrow-string@57.1.0	X												
+anstream@1.0.0	X									X			
+anstyle@1.0.14	X									X			
+anstyle-parse@1.0.0	X									X			
+anstyle-query@1.1.5	X									X			
+anstyle-wincon@3.0.11	X									X			
+anyhow@1.0.102	X									X			
+arrow@57.3.0	X												
+arrow-arith@57.3.0	X												
+arrow-array@57.3.0	X												
+arrow-buffer@57.3.0	X												
+arrow-cast@57.3.0	X												
+arrow-csv@57.3.0	X												
+arrow-data@57.3.0	X												
+arrow-ipc@57.3.0	X												
+arrow-json@57.3.0	X												
+arrow-ord@57.3.0	X												
+arrow-row@57.3.0	X												
+arrow-schema@57.3.0	X												
+arrow-select@57.3.0	X												
+arrow-string@57.3.0	X												
 async-trait@0.1.89	X									X			
 atoi@2.0.0										X			
 atomic-waker@1.1.2	X									X			
@@ -30,21 +29,21 @@ autocfg@1.5.0	X									X
 backon@1.6.0	X												
 base64@0.22.1	X									X			
 bigdecimal@0.4.10	X									X			
-bitflags@2.9.3	X									X			
+bitflags@2.11.0	X									X			
 bitvec@1.0.1										X			
 block-buffer@0.10.4	X									X			
-bumpalo@3.19.0	X									X			
+bumpalo@3.20.2	X									X			
 byteorder@1.5.0										X		X	
 bytes@1.11.1										X			
-cc@1.2.34	X									X			
-cfg-if@1.0.3	X									X			
-chrono@0.4.41	X									X			
-clap@4.5.45	X									X			
-clap_builder@4.5.44	X									X			
-clap_derive@4.5.45	X									X			
-clap_lex@0.7.5	X									X			
+cc@1.2.57	X									X			
+cfg-if@1.0.4	X									X			
+chrono@0.4.44	X									X			
+clap@4.6.0	X									X			
+clap_builder@4.6.0	X									X			
+clap_derive@4.6.0	X									X			
+clap_lex@1.1.0	X									X			
 codespan-reporting@0.13.1	X												
-colorchoice@1.0.4	X									X			
+colorchoice@1.0.5	X									X			
 const-oid@0.9.6	X									X			
 const-random@0.1.18	X									X			
 const-random-macro@0.1.16	X									X			
@@ -54,264 +53,257 @@ crc32c@0.6.8	X									X
 crossbeam-utils@0.8.21	X									X			
 crunchy@0.2.4										X			
 crypto-common@0.1.7	X									X			
-csv@1.3.1										X		X	
-csv-core@0.1.12										X		X	
-cxx@1.0.190	X									X			
-cxx-build@1.0.190	X									X			
-cxxbridge-flags@1.0.190	X									X			
-cxxbridge-macro@1.0.190	X									X			
+csv@1.4.0										X		X	
+csv-core@0.1.13										X		X	
+cxx@1.0.194	X									X			
+cxx-build@1.0.194	X									X			
+cxxbridge-flags@1.0.194	X									X			
+cxxbridge-macro@1.0.194	X									X			
 dashmap@6.1.0										X			
 delegate@0.13.5	X									X			
 digest@0.10.7	X									X			
 displaydoc@0.2.5	X									X			
 either@1.15.0	X									X			
 equivalent@1.0.2	X									X			
-errno@0.3.13	X									X			
+errno@0.3.14	X									X			
 fastrand@2.3.0	X									X			
+find-msvc-tools@0.1.9	X									X			
 fixedbitset@0.5.7	X									X			
-flatbuffers@25.2.10	X												
+flatbuffers@25.12.19	X												
 fluss-cpp@0.1.0	X												
 fluss-rs@0.1.0	X												
 fnv@1.0.7	X									X			
+foldhash@0.1.5													X
 foldhash@0.2.0													X
 form_urlencoded@1.2.2	X									X			
 funty@2.0.0										X			
-futures@0.3.31	X									X			
-futures-channel@0.3.31	X									X			
-futures-core@0.3.31	X									X			
-futures-executor@0.3.31	X									X			
-futures-io@0.3.31	X									X			
-futures-macro@0.3.31	X									X			
-futures-sink@0.3.31	X									X			
-futures-task@0.3.31	X									X			
-futures-util@0.3.31	X									X			
+futures@0.3.32	X									X			
+futures-channel@0.3.32	X									X			
+futures-core@0.3.32	X									X			
+futures-executor@0.3.32	X									X			
+futures-io@0.3.32	X									X			
+futures-macro@0.3.32	X									X			
+futures-sink@0.3.32	X									X			
+futures-task@0.3.32	X									X			
+futures-util@0.3.32	X									X			
 generic-array@0.14.7										X			
-getrandom@0.2.16	X									X			
-getrandom@0.3.3	X									X			
+getrandom@0.2.17	X									X			
+getrandom@0.3.4	X									X			
+getrandom@0.4.2	X									X			
 gloo-timers@0.3.0	X									X			
-h2@0.4.12										X			
-half@2.6.0	X									X			
+h2@0.4.13										X			
+half@2.7.1	X									X			
 hashbrown@0.14.5	X									X			
 hashbrown@0.15.5	X									X			
 hashbrown@0.16.1	X									X			
 heck@0.5.0	X									X			
 hex@0.4.3	X									X			
 hmac@0.12.1	X									X			
-home@0.5.11	X									X			
-http@1.3.1	X									X			
+home@0.5.12	X									X			
+http@1.4.0	X									X			
 http-body@1.0.1										X			
 http-body-util@0.1.3										X			
 httparse@1.10.1	X									X			
 httpdate@1.0.3	X									X			
-hyper@1.7.0										X			
+hyper@1.8.1										X			
 hyper-rustls@0.27.7	X							X		X			
-hyper-util@0.1.17										X			
-iana-time-zone@0.1.63	X									X			
+hyper-util@0.1.20										X			
+iana-time-zone@0.1.65	X									X			
 iana-time-zone-haiku@0.1.2	X									X			
-icu_collections@2.0.0											X		
-icu_locale_core@2.0.0											X		
-icu_normalizer@2.0.0											X		
-icu_normalizer_data@2.0.0											X		
-icu_properties@2.0.1											X		
-icu_properties_data@2.0.1											X		
-icu_provider@2.0.0											X		
+icu_collections@2.1.1											X		
+icu_locale_core@2.1.1											X		
+icu_normalizer@2.1.1											X		
+icu_normalizer_data@2.1.1											X		
+icu_properties@2.1.2											X		
+icu_properties_data@2.1.2											X		
+icu_provider@2.1.1											X		
 idna@1.1.0	X									X			
 idna_adapter@1.2.1	X									X			
-indexmap@2.11.0	X									X			
-ipnet@2.11.0	X									X			
-iri-string@0.7.9	X									X			
-is_terminal_polyfill@1.70.1	X									X			
+indexmap@2.13.0	X									X			
+ipnet@2.12.0	X									X			
+iri-string@0.7.11	X									X			
+is_terminal_polyfill@1.70.2	X									X			
 itertools@0.14.0	X									X			
-itoa@1.0.15	X									X			
-jiff@0.2.16										X		X	
-jiff-tzdb@0.1.5										X		X	
+itoa@1.0.18	X									X			
+jiff@0.2.23										X		X	
+jiff-tzdb@0.1.6										X		X	
 jiff-tzdb-platform@0.1.3										X		X	
 jobserver@0.1.34	X									X			
-js-sys@0.3.77	X									X			
-lexical-core@1.0.5	X									X			
-lexical-parse-float@1.0.5	X									X			
-lexical-parse-integer@1.0.5	X									X			
-lexical-util@1.0.6	X									X			
-lexical-write-float@1.0.5	X									X			
-lexical-write-integer@1.0.5	X									X			
-libc@0.2.175	X									X			
-libm@0.2.15										X			
+js-sys@0.3.91	X									X			
+lexical-core@1.0.6	X									X			
+lexical-parse-float@1.0.6	X									X			
+lexical-parse-integer@1.0.6	X									X			
+lexical-util@1.0.7	X									X			
+lexical-write-float@1.0.6	X									X			
+lexical-write-integer@1.0.6	X									X			
+libc@0.2.183	X									X			
+libm@0.2.16										X			
 link-cplusplus@1.0.12	X									X			
 linked-hash-map@0.5.6	X									X			
-linux-raw-sys@0.9.4	X	X								X			
-litemap@0.8.0											X		
-lock_api@0.4.13	X									X			
-log@0.4.27	X									X			
-lz4_flex@0.12.0										X			
+linux-raw-sys@0.12.1	X	X								X			
+litemap@0.8.1											X		
+lock_api@0.4.14	X									X			
+log@0.4.29	X									X			
+lz4_flex@0.12.1										X			
 md-5@0.10.6	X									X			
-memchr@2.7.5										X		X	
-mio@1.0.4										X			
+memchr@2.8.0										X		X	
+mio@1.1.1										X			
 multimap@0.10.1	X									X			
 num-bigint@0.4.6	X									X			
 num-complex@0.4.6	X									X			
 num-integer@0.1.46	X									X			
 num-traits@0.2.19	X									X			
-once_cell@1.21.3	X									X			
-once_cell_polyfill@1.70.1	X									X			
+once_cell@1.21.4	X									X			
+once_cell_polyfill@1.70.2	X									X			
 opendal@0.55.0	X												
 ordered-float@5.1.0										X			
-parking_lot@0.12.4	X									X			
-parking_lot_core@0.9.11	X									X			
+parking_lot@0.12.5	X									X			
+parking_lot_core@0.9.12	X									X			
 parse-display@0.10.0	X									X			
 parse-display-derive@0.10.0	X									X			
 percent-encoding@2.3.2	X									X			
-petgraph@0.7.1	X									X			
-pin-project-lite@0.2.16	X									X			
+petgraph@0.8.3	X									X			
+pin-project-lite@0.2.17	X									X			
 pin-utils@0.1.0	X									X			
 pkg-config@0.3.32	X									X			
-portable-atomic@1.11.1	X									X			
-portable-atomic-util@0.2.4	X									X			
-potential_utf@0.1.3											X		
+portable-atomic@1.13.1	X									X			
+portable-atomic-util@0.2.6	X									X			
+potential_utf@0.1.4											X		
 ppv-lite86@0.2.21	X									X			
 prettyplease@0.2.37	X									X			
-proc-macro2@1.0.101	X									X			
-prost@0.14.1	X												
-prost-build@0.14.1	X												
-prost-derive@0.14.1	X												
-prost-types@0.14.1	X												
+proc-macro2@1.0.106	X									X			
+prost@0.14.3	X												
+prost-build@0.14.3	X												
+prost-derive@0.14.3	X												
+prost-types@0.14.3	X												
 quick-xml@0.37.5										X			
 quick-xml@0.38.4										X			
-quote@1.0.40	X									X			
+quote@1.0.45	X									X			
 r-efi@5.3.0	X								X	X			
+r-efi@6.0.0	X								X	X			
 radium@0.7.0										X			
 rand@0.8.5	X									X			
 rand@0.9.2	X									X			
 rand_chacha@0.3.1	X									X			
 rand_chacha@0.9.0	X									X			
 rand_core@0.6.4	X									X			
-rand_core@0.9.3	X									X			
-redox_syscall@0.5.17										X			
-regex@1.11.2	X									X			
-regex-automata@0.4.10	X									X			
-regex-syntax@0.8.6	X									X			
+rand_core@0.9.5	X									X			
+redox_syscall@0.5.18										X			
+regex@1.12.3	X									X			
+regex-automata@0.4.14	X									X			
+regex-syntax@0.8.10	X									X			
 reqsign@0.16.5	X												
-reqwest@0.12.25	X									X			
+reqwest@0.12.28	X									X			
 ring@0.17.14	X							X					
 rustc_version@0.4.1	X									X			
-rustix@1.0.8	X	X								X			
-rustls@0.23.32	X							X		X			
-rustls-pki-types@1.12.0	X									X			
-rustls-webpki@0.103.7								X					
+rustix@1.1.4	X	X								X			
+rustls@0.23.37	X							X		X			
+rustls-pki-types@1.14.0	X									X			
+rustls-webpki@0.103.10								X					
 rustversion@1.0.22	X									X			
-ryu@1.0.20	X				X								
+ryu@1.0.23	X				X								
 scopeguard@1.2.0	X									X			
 scratch@1.0.9	X									X			
-semver@1.0.26	X									X			
+semver@1.0.27	X									X			
 serde@1.0.228	X									X			
 serde_core@1.0.228	X									X			
 serde_derive@1.0.228	X									X			
-serde_json@1.0.143	X									X			
+serde_json@1.0.149	X									X			
 serde_urlencoded@0.7.1	X									X			
 sha1@0.10.6	X									X			
 sha2@0.10.9	X									X			
 shlex@1.3.0	X									X			
-signal-hook-registry@1.4.6	X									X			
+signal-hook-registry@1.4.8	X									X			
 simdutf8@0.1.5	X									X			
-slab@0.4.11										X			
+slab@0.4.12										X			
 smallvec@1.15.1	X									X			
 snafu@0.8.9	X									X			
 snafu-derive@0.8.9	X									X			
-socket2@0.6.0	X									X			
+socket2@0.6.3	X									X			
 stable_deref_trait@1.2.1	X									X			
-static_assertions@1.1.0	X									X			
 strsim@0.11.1										X			
 structmeta@0.3.0	X									X			
 structmeta-derive@0.3.0	X									X			
 strum@0.26.3										X			
 strum_macros@0.26.4										X			
 subtle@2.6.1				X									
-syn@2.0.106	X									X			
+syn@2.0.117	X									X			
 sync_wrapper@1.0.2	X												
 synstructure@0.13.2										X			
 tap@1.0.1										X			
-tempfile@3.23.0	X									X			
+tempfile@3.27.0	X									X			
 termcolor@1.4.1										X		X	
 thiserror@1.0.69	X									X			
 thiserror-impl@1.0.69	X									X			
 tiny-keccak@2.0.2						X							
-tinystr@0.8.1											X		
-tokio@1.48.0										X			
-tokio-macros@2.6.0										X			
+tinystr@0.8.2											X		
+tokio@1.50.0										X			
+tokio-macros@2.6.1										X			
 tokio-rustls@0.26.4	X									X			
-tokio-util@0.7.16										X			
-tower@0.5.2										X			
+tokio-util@0.7.18										X			
+tower@0.5.3										X			
 tower-http@0.6.8										X			
 tower-layer@0.3.3										X			
 tower-service@0.3.3										X			
-tracing@0.1.41										X			
-tracing-attributes@0.1.30										X			
-tracing-core@0.1.34										X			
+tracing@0.1.44										X			
+tracing-attributes@0.1.31										X			
+tracing-core@0.1.36										X			
 try-lock@0.2.5										X			
 twox-hash@2.1.2										X			
 typenum@1.19.0	X									X			
-unicode-ident@1.0.18	X									X	X		
+unicode-ident@1.0.24	X									X	X		
 unicode-width@0.2.2	X									X			
 untrusted@0.9.0								X					
-url@2.5.7	X									X			
+url@2.5.8	X									X			
 utf8_iter@1.0.4	X									X			
 utf8parse@0.2.2	X									X			
-uuid@1.18.0	X									X			
+uuid@1.22.0	X									X			
 value-bag@1.12.0	X									X			
 version_check@0.9.5	X									X			
 want@0.3.1										X			
 wasi@0.11.1+wasi-snapshot-preview1	X	X								X			
-wasi@0.14.2+wasi-0.2.4	X	X								X			
-wasm-bindgen@0.2.100	X									X			
-wasm-bindgen-backend@0.2.100	X									X			
-wasm-bindgen-futures@0.4.50	X									X			
-wasm-bindgen-macro@0.2.100	X									X			
-wasm-bindgen-macro-support@0.2.100	X									X			
-wasm-bindgen-shared@0.2.100	X									X			
+wasip2@1.0.2+wasi-0.2.9	X	X								X			
+wasip3@0.4.0+wasi-0.3.0-rc-2026-01-06	X	X								X			
+wasm-bindgen@0.2.114	X									X			
+wasm-bindgen-futures@0.4.64	X									X			
+wasm-bindgen-macro@0.2.114	X									X			
+wasm-bindgen-macro-support@0.2.114	X									X			
+wasm-bindgen-shared@0.2.114	X									X			
 wasm-streams@0.4.2	X									X			
-web-sys@0.3.77	X									X			
-webpki-roots@1.0.3							X						
+web-sys@0.3.91	X									X			
+webpki-roots@1.0.6							X						
 winapi-util@0.1.11										X		X	
-windows-core@0.61.2	X									X			
-windows-implement@0.60.0	X									X			
-windows-interface@0.59.1	X									X			
-windows-link@0.1.3	X									X			
+windows-core@0.62.2	X									X			
+windows-implement@0.60.2	X									X			
+windows-interface@0.59.3	X									X			
 windows-link@0.2.1	X									X			
-windows-result@0.3.4	X									X			
-windows-strings@0.4.2	X									X			
+windows-result@0.4.1	X									X			
+windows-strings@0.5.1	X									X			
 windows-sys@0.52.0	X									X			
-windows-sys@0.59.0	X									X			
-windows-sys@0.60.2	X									X			
 windows-sys@0.61.2	X									X			
 windows-targets@0.52.6	X									X			
-windows-targets@0.53.3	X									X			
 windows_aarch64_gnullvm@0.52.6	X									X			
-windows_aarch64_gnullvm@0.53.0	X									X			
 windows_aarch64_msvc@0.52.6	X									X			
-windows_aarch64_msvc@0.53.0	X									X			
 windows_i686_gnu@0.52.6	X									X			
-windows_i686_gnu@0.53.0	X									X			
 windows_i686_gnullvm@0.52.6	X									X			
-windows_i686_gnullvm@0.53.0	X									X			
 windows_i686_msvc@0.52.6	X									X			
-windows_i686_msvc@0.53.0	X									X			
 windows_x86_64_gnu@0.52.6	X									X			
-windows_x86_64_gnu@0.53.0	X									X			
 windows_x86_64_gnullvm@0.52.6	X									X			
-windows_x86_64_gnullvm@0.53.0	X									X			
 windows_x86_64_msvc@0.52.6	X									X			
-windows_x86_64_msvc@0.53.0	X									X			
-wit-bindgen-rt@0.39.0	X	X								X			
-writeable@0.6.1											X		
+wit-bindgen@0.51.0	X	X								X			
+writeable@0.6.2											X		
 wyz@0.5.1										X			
-yoke@0.8.0											X		
-yoke-derive@0.8.0											X		
-zerocopy@0.8.26	X		X							X			
+yoke@0.8.1											X		
+yoke-derive@0.8.1											X		
+zerocopy@0.8.47	X		X							X			
+zerocopy-derive@0.8.47	X		X							X			
 zerofrom@0.1.6											X		
 zerofrom-derive@0.1.6											X		
 zeroize@1.8.2	X									X			
-zerotrie@0.2.2											X		
-zerovec@0.11.4											X		
-zerovec-derive@0.11.1											X		
+zerotrie@0.2.3											X		
+zerovec@0.11.5											X		
+zerovec-derive@0.11.2											X		
+zmij@1.0.21										X			
 zstd@0.13.3										X			
 zstd-safe@7.2.4	X									X			
 zstd-sys@2.0.16+zstd.1.5.7	X									X			
diff --git a/fluss-rust/bindings/python/DEPENDENCIES.rust.tsv b/fluss-rust/bindings/python/DEPENDENCIES.rust.tsv
index 8bd8368c12..bc7b9b78f2 100644
--- a/fluss-rust/bindings/python/DEPENDENCIES.rust.tsv
+++ b/fluss-rust/bindings/python/DEPENDENCIES.rust.tsv
@@ -1,317 +1,310 @@
-crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense
-ahash@0.8.12	X									X		
-aho-corasick@1.1.3										X		X
-android-tzdata@0.1.1	X									X		
-android_system_properties@0.1.5	X									X		
-anstream@0.6.20	X									X		
-anstyle@1.0.11	X									X		
-anstyle-parse@0.2.7	X									X		
-anstyle-query@1.1.4	X									X		
-anstyle-wincon@3.0.10	X									X		
-anyhow@1.0.100	X									X		
-arrow@57.1.0	X											
-arrow-arith@57.1.0	X											
-arrow-array@57.1.0	X											
-arrow-buffer@57.1.0	X											
-arrow-cast@57.1.0	X											
-arrow-csv@57.1.0	X											
-arrow-data@57.1.0	X											
-arrow-ipc@57.1.0	X											
-arrow-json@57.1.0	X											
-arrow-ord@57.1.0	X											
-arrow-pyarrow@57.1.0	X											
-arrow-row@57.1.0	X											
-arrow-schema@57.1.0	X											
-arrow-select@57.1.0	X											
-arrow-string@57.1.0	X											
-async-trait@0.1.89	X									X		
-atoi@2.0.0										X		
-atomic-waker@1.1.2	X									X		
-autocfg@1.5.0	X									X		
-backon@1.6.0	X											
-base64@0.22.1	X									X		
-bigdecimal@0.4.10	X									X		
-bitflags@2.9.3	X									X		
-bitvec@1.0.1										X		
-block-buffer@0.10.4	X									X		
-bumpalo@3.19.0	X									X		
-byteorder@1.5.0										X		X
-bytes@1.11.1										X		
-cc@1.2.34	X									X		
-cfg-if@1.0.3	X									X		
-chrono@0.4.41	X									X		
-clap@4.5.45	X									X		
-clap_builder@4.5.44	X									X		
-clap_derive@4.5.45	X									X		
-clap_lex@0.7.5	X									X		
-colorchoice@1.0.4	X									X		
-const-oid@0.9.6	X									X		
-const-random@0.1.18	X									X		
-const-random-macro@0.1.16	X									X		
-core-foundation-sys@0.8.7	X									X		
-cpufeatures@0.2.17	X									X		
-crc32c@0.6.8	X									X		
-crossbeam-utils@0.8.21	X									X		
-crunchy@0.2.4										X		
-crypto-common@0.1.7	X									X		
-csv@1.3.1										X		X
-csv-core@0.1.12										X		X
-dashmap@6.1.0										X		
-delegate@0.13.5	X									X		
-digest@0.10.7	X									X		
-displaydoc@0.2.5	X									X		
-either@1.15.0	X									X		
-equivalent@1.0.2	X									X		
-errno@0.3.13	X									X		
-fastrand@2.3.0	X									X		
-fixedbitset@0.5.7	X									X		
-flatbuffers@25.2.10	X											
-fluss-rs@0.1.0	X											
-fluss_python@0.1.0	X											
-fnv@1.0.7	X									X		
-form_urlencoded@1.2.2	X									X		
-funty@2.0.0										X		
-futures@0.3.31	X									X		
-futures-channel@0.3.31	X									X		
-futures-core@0.3.31	X									X		
-futures-executor@0.3.31	X									X		
-futures-io@0.3.31	X									X		
-futures-macro@0.3.31	X									X		
-futures-sink@0.3.31	X									X		
-futures-task@0.3.31	X									X		
-futures-util@0.3.31	X									X		
-generic-array@0.14.7										X		
-getrandom@0.2.16	X									X		
-getrandom@0.3.3	X									X		
-gloo-timers@0.3.0	X									X		
-h2@0.4.12										X		
-half@2.6.0	X									X		
-hashbrown@0.14.5	X									X		
-hashbrown@0.15.5	X									X		
-hashbrown@0.16.1	X									X		
-heck@0.5.0	X									X		
-hex@0.4.3	X									X		
-hmac@0.12.1	X									X		
-home@0.5.11	X									X		
-http@1.3.1	X									X		
-http-body@1.0.1										X		
-http-body-util@0.1.3										X		
-httparse@1.10.1	X									X		
-httpdate@1.0.3	X									X		
-hyper@1.7.0										X		
-hyper-rustls@0.27.7	X							X		X		
-hyper-util@0.1.17										X		
-iana-time-zone@0.1.63	X									X		
-iana-time-zone-haiku@0.1.2	X									X		
-icu_collections@2.0.0											X	
-icu_locale_core@2.0.0											X	
-icu_normalizer@2.0.0											X	
-icu_normalizer_data@2.0.0											X	
-icu_properties@2.0.1											X	
-icu_properties_data@2.0.1											X	
-icu_provider@2.0.0											X	
-idna@1.1.0	X									X		
-idna_adapter@1.2.1	X									X		
-indexmap@2.11.0	X									X		
-indoc@2.0.6	X									X		
-ipnet@2.11.0	X									X		
-iri-string@0.7.9	X									X		
-is_terminal_polyfill@1.70.1	X									X		
-itertools@0.14.0	X									X		
-itoa@1.0.15	X									X		
-jiff@0.2.16										X		X
-jiff-tzdb@0.1.5										X		X
-jiff-tzdb-platform@0.1.3										X		X
-jobserver@0.1.34	X									X		
-js-sys@0.3.77	X									X		
-lexical-core@1.0.5	X									X		
-lexical-parse-float@1.0.5	X									X		
-lexical-parse-integer@1.0.5	X									X		
-lexical-util@1.0.6	X									X		
-lexical-write-float@1.0.5	X									X		
-lexical-write-integer@1.0.5	X									X		
-libc@0.2.175	X									X		
-libm@0.2.15										X		
-linked-hash-map@0.5.6	X									X		
-linux-raw-sys@0.9.4	X	X								X		
-litemap@0.8.0											X	
-lock_api@0.4.13	X									X		
-log@0.4.27	X									X		
-lz4_flex@0.12.0										X		
-md-5@0.10.6	X									X		
-memchr@2.7.5										X		X
-memoffset@0.9.1										X		
-mio@1.0.4										X		
-multimap@0.10.1	X									X		
-num-bigint@0.4.6	X									X		
-num-complex@0.4.6	X									X		
-num-integer@0.1.46	X									X		
-num-traits@0.2.19	X									X		
-once_cell@1.21.3	X									X		
-once_cell_polyfill@1.70.1	X									X		
-opendal@0.55.0	X											
-ordered-float@5.1.0										X		
-parking_lot@0.12.4	X									X		
-parking_lot_core@0.9.11	X									X		
-parse-display@0.10.0	X									X		
-parse-display-derive@0.10.0	X									X		
-percent-encoding@2.3.2	X									X		
-petgraph@0.7.1	X									X		
-pin-project-lite@0.2.16	X									X		
-pin-utils@0.1.0	X									X		
-pkg-config@0.3.32	X									X		
-portable-atomic@1.11.1	X									X		
-portable-atomic-util@0.2.4	X									X		
-potential_utf@0.1.3											X	
-ppv-lite86@0.2.21	X									X		
-prettyplease@0.2.37	X									X		
-proc-macro2@1.0.101	X									X		
-prost@0.14.1	X											
-prost-build@0.14.1	X											
-prost-derive@0.14.1	X											
-prost-types@0.14.1	X											
-pyo3@0.26.0	X									X		
-pyo3-async-runtimes@0.26.0	X											
-pyo3-build-config@0.26.0	X									X		
-pyo3-ffi@0.26.0	X									X		
-pyo3-macros@0.26.0	X									X		
-pyo3-macros-backend@0.26.0	X									X		
-quick-xml@0.37.5										X		
-quick-xml@0.38.4										X		
-quote@1.0.40	X									X		
-r-efi@5.3.0	X								X	X		
-radium@0.7.0										X		
-rand@0.8.5	X									X		
-rand@0.9.2	X									X		
-rand_chacha@0.3.1	X									X		
-rand_chacha@0.9.0	X									X		
-rand_core@0.6.4	X									X		
-rand_core@0.9.3	X									X		
-redox_syscall@0.5.17										X		
-regex@1.11.2	X									X		
-regex-automata@0.4.10	X									X		
-regex-syntax@0.8.6	X									X		
-reqsign@0.16.5	X											
-reqwest@0.12.25	X									X		
-ring@0.17.14	X							X				
-rustc_version@0.4.1	X									X		
-rustix@1.0.8	X	X								X		
-rustls@0.23.32	X							X		X		
-rustls-pki-types@1.12.0	X									X		
-rustls-webpki@0.103.7								X				
-rustversion@1.0.22	X									X		
-ryu@1.0.20	X				X							
-scopeguard@1.2.0	X									X		
-semver@1.0.26	X									X		
-serde@1.0.228	X									X		
-serde_core@1.0.228	X									X		
-serde_derive@1.0.228	X									X		
-serde_json@1.0.143	X									X		
-serde_urlencoded@0.7.1	X									X		
-sha1@0.10.6	X									X		
-sha2@0.10.9	X									X		
-shlex@1.3.0	X									X		
-signal-hook-registry@1.4.6	X									X		
-simdutf8@0.1.5	X									X		
-slab@0.4.11										X		
-smallvec@1.15.1	X									X		
-snafu@0.8.9	X									X		
-snafu-derive@0.8.9	X									X		
-socket2@0.6.0	X									X		
-stable_deref_trait@1.2.1	X									X		
-static_assertions@1.1.0	X									X		
-strsim@0.11.1										X		
-structmeta@0.3.0	X									X		
-structmeta-derive@0.3.0	X									X		
-strum@0.26.3										X		
-strum_macros@0.26.4										X		
-subtle@2.6.1				X								
-syn@2.0.106	X									X		
-sync_wrapper@1.0.2	X											
-synstructure@0.13.2										X		
-tap@1.0.1										X		
-target-lexicon@0.13.3		X										
-tempfile@3.23.0	X									X		
-thiserror@1.0.69	X									X		
-thiserror-impl@1.0.69	X									X		
-tiny-keccak@2.0.2						X						
-tinystr@0.8.1											X	
-tokio@1.48.0										X		
-tokio-macros@2.6.0										X		
-tokio-rustls@0.26.4	X									X		
-tokio-util@0.7.16										X		
-tower@0.5.2										X		
-tower-http@0.6.8										X		
-tower-layer@0.3.3										X		
-tower-service@0.3.3										X		
-tracing@0.1.41										X		
-tracing-attributes@0.1.30										X		
-tracing-core@0.1.34										X		
-try-lock@0.2.5										X		
-twox-hash@2.1.2										X		
-typenum@1.19.0	X									X		
-unicode-ident@1.0.18	X									X	X	
-unindent@0.2.4	X									X		
-untrusted@0.9.0								X				
-url@2.5.7	X									X		
-utf8_iter@1.0.4	X									X		
-utf8parse@0.2.2	X									X		
-uuid@1.18.0	X									X		
-value-bag@1.12.0	X									X		
-version_check@0.9.5	X									X		
-want@0.3.1										X		
-wasi@0.11.1+wasi-snapshot-preview1	X	X								X		
-wasi@0.14.2+wasi-0.2.4	X	X								X		
-wasm-bindgen@0.2.100	X									X		
-wasm-bindgen-backend@0.2.100	X									X		
-wasm-bindgen-futures@0.4.50	X									X		
-wasm-bindgen-macro@0.2.100	X									X		
-wasm-bindgen-macro-support@0.2.100	X									X		
-wasm-bindgen-shared@0.2.100	X									X		
-wasm-streams@0.4.2	X									X		
-web-sys@0.3.77	X									X		
-webpki-roots@1.0.3							X					
-windows-core@0.61.2	X									X		
-windows-implement@0.60.0	X									X		
-windows-interface@0.59.1	X									X		
-windows-link@0.1.3	X									X		
-windows-link@0.2.1	X									X		
-windows-result@0.3.4	X									X		
-windows-strings@0.4.2	X									X		
-windows-sys@0.52.0	X									X		
-windows-sys@0.59.0	X									X		
-windows-sys@0.60.2	X									X		
-windows-sys@0.61.2	X									X		
-windows-targets@0.52.6	X									X		
-windows-targets@0.53.3	X									X		
-windows_aarch64_gnullvm@0.52.6	X									X		
-windows_aarch64_gnullvm@0.53.0	X									X		
-windows_aarch64_msvc@0.52.6	X									X		
-windows_aarch64_msvc@0.53.0	X									X		
-windows_i686_gnu@0.52.6	X									X		
-windows_i686_gnu@0.53.0	X									X		
-windows_i686_gnullvm@0.52.6	X									X		
-windows_i686_gnullvm@0.53.0	X									X		
-windows_i686_msvc@0.52.6	X									X		
-windows_i686_msvc@0.53.0	X									X		
-windows_x86_64_gnu@0.52.6	X									X		
-windows_x86_64_gnu@0.53.0	X									X		
-windows_x86_64_gnullvm@0.52.6	X									X		
-windows_x86_64_gnullvm@0.53.0	X									X		
-windows_x86_64_msvc@0.52.6	X									X		
-windows_x86_64_msvc@0.53.0	X									X		
-wit-bindgen-rt@0.39.0	X	X								X		
-writeable@0.6.1											X	
-wyz@0.5.1										X		
-yoke@0.8.0											X	
-yoke-derive@0.8.0											X	
-zerocopy@0.8.26	X		X							X		
-zerofrom@0.1.6											X	
-zerofrom-derive@0.1.6											X	
-zeroize@1.8.2	X									X		
-zerotrie@0.2.2											X	
-zerovec@0.11.4											X	
-zerovec-derive@0.11.1											X	
-zstd@0.13.3										X		
-zstd-safe@7.2.4	X									X		
-zstd-sys@2.0.16+zstd.1.5.7	X									X		
+crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense	Zlib
+ahash@0.8.12	X									X			
+aho-corasick@1.1.4										X		X	
+android_system_properties@0.1.5	X									X			
+anstream@1.0.0	X									X			
+anstyle@1.0.14	X									X			
+anstyle-parse@1.0.0	X									X			
+anstyle-query@1.1.5	X									X			
+anstyle-wincon@3.0.11	X									X			
+anyhow@1.0.102	X									X			
+arrow@57.3.0	X												
+arrow-arith@57.3.0	X												
+arrow-array@57.3.0	X												
+arrow-buffer@57.3.0	X												
+arrow-cast@57.3.0	X												
+arrow-csv@57.3.0	X												
+arrow-data@57.3.0	X												
+arrow-ipc@57.3.0	X												
+arrow-json@57.3.0	X												
+arrow-ord@57.3.0	X												
+arrow-pyarrow@57.3.0	X												
+arrow-row@57.3.0	X												
+arrow-schema@57.3.0	X												
+arrow-select@57.3.0	X												
+arrow-string@57.3.0	X												
+async-trait@0.1.89	X									X			
+atoi@2.0.0										X			
+atomic-waker@1.1.2	X									X			
+autocfg@1.5.0	X									X			
+backon@1.6.0	X												
+base64@0.22.1	X									X			
+bigdecimal@0.4.10	X									X			
+bitflags@2.11.0	X									X			
+bitvec@1.0.1										X			
+block-buffer@0.10.4	X									X			
+bumpalo@3.20.2	X									X			
+byteorder@1.5.0										X		X	
+bytes@1.11.1										X			
+cc@1.2.57	X									X			
+cfg-if@1.0.4	X									X			
+chrono@0.4.44	X									X			
+clap@4.6.0	X									X			
+clap_builder@4.6.0	X									X			
+clap_derive@4.6.0	X									X			
+clap_lex@1.1.0	X									X			
+colorchoice@1.0.5	X									X			
+const-oid@0.9.6	X									X			
+const-random@0.1.18	X									X			
+const-random-macro@0.1.16	X									X			
+core-foundation-sys@0.8.7	X									X			
+cpufeatures@0.2.17	X									X			
+crc32c@0.6.8	X									X			
+crossbeam-utils@0.8.21	X									X			
+crunchy@0.2.4										X			
+crypto-common@0.1.7	X									X			
+csv@1.4.0										X		X	
+csv-core@0.1.13										X		X	
+dashmap@6.1.0										X			
+delegate@0.13.5	X									X			
+digest@0.10.7	X									X			
+displaydoc@0.2.5	X									X			
+either@1.15.0	X									X			
+equivalent@1.0.2	X									X			
+errno@0.3.14	X									X			
+fastrand@2.3.0	X									X			
+find-msvc-tools@0.1.9	X									X			
+fixedbitset@0.5.7	X									X			
+flatbuffers@25.12.19	X												
+fluss-rs@0.1.0	X												
+fluss_python@0.1.0	X												
+fnv@1.0.7	X									X			
+foldhash@0.1.5													X
+form_urlencoded@1.2.2	X									X			
+funty@2.0.0										X			
+futures@0.3.32	X									X			
+futures-channel@0.3.32	X									X			
+futures-core@0.3.32	X									X			
+futures-executor@0.3.32	X									X			
+futures-io@0.3.32	X									X			
+futures-macro@0.3.32	X									X			
+futures-sink@0.3.32	X									X			
+futures-task@0.3.32	X									X			
+futures-util@0.3.32	X									X			
+generic-array@0.14.7										X			
+getrandom@0.2.17	X									X			
+getrandom@0.3.4	X									X			
+getrandom@0.4.2	X									X			
+gloo-timers@0.3.0	X									X			
+h2@0.4.13										X			
+half@2.7.1	X									X			
+hashbrown@0.14.5	X									X			
+hashbrown@0.15.5	X									X			
+hashbrown@0.16.1	X									X			
+heck@0.5.0	X									X			
+hex@0.4.3	X									X			
+hmac@0.12.1	X									X			
+home@0.5.12	X									X			
+http@1.4.0	X									X			
+http-body@1.0.1										X			
+http-body-util@0.1.3										X			
+httparse@1.10.1	X									X			
+httpdate@1.0.3	X									X			
+hyper@1.8.1										X			
+hyper-rustls@0.27.7	X							X		X			
+hyper-util@0.1.20										X			
+iana-time-zone@0.1.65	X									X			
+iana-time-zone-haiku@0.1.2	X									X			
+icu_collections@2.1.1											X		
+icu_locale_core@2.1.1											X		
+icu_normalizer@2.1.1											X		
+icu_normalizer_data@2.1.1											X		
+icu_properties@2.1.2											X		
+icu_properties_data@2.1.2											X		
+icu_provider@2.1.1											X		
+idna@1.1.0	X									X			
+idna_adapter@1.2.1	X									X			
+indexmap@2.13.0	X									X			
+indoc@2.0.7	X									X			
+ipnet@2.12.0	X									X			
+iri-string@0.7.11	X									X			
+is_terminal_polyfill@1.70.2	X									X			
+itertools@0.14.0	X									X			
+itoa@1.0.18	X									X			
+jiff@0.2.23										X		X	
+jiff-tzdb@0.1.6										X		X	
+jiff-tzdb-platform@0.1.3										X		X	
+jobserver@0.1.34	X									X			
+js-sys@0.3.91	X									X			
+lexical-core@1.0.6	X									X			
+lexical-parse-float@1.0.6	X									X			
+lexical-parse-integer@1.0.6	X									X			
+lexical-util@1.0.7	X									X			
+lexical-write-float@1.0.6	X									X			
+lexical-write-integer@1.0.6	X									X			
+libc@0.2.183	X									X			
+libm@0.2.16										X			
+linked-hash-map@0.5.6	X									X			
+linux-raw-sys@0.12.1	X	X								X			
+litemap@0.8.1											X		
+lock_api@0.4.14	X									X			
+log@0.4.29	X									X			
+lz4_flex@0.12.1										X			
+md-5@0.10.6	X									X			
+memchr@2.8.0										X		X	
+memoffset@0.9.1										X			
+mio@1.1.1										X			
+multimap@0.10.1	X									X			
+num-bigint@0.4.6	X									X			
+num-complex@0.4.6	X									X			
+num-integer@0.1.46	X									X			
+num-traits@0.2.19	X									X			
+once_cell@1.21.4	X									X			
+once_cell_polyfill@1.70.2	X									X			
+opendal@0.55.0	X												
+ordered-float@5.1.0										X			
+parking_lot@0.12.5	X									X			
+parking_lot_core@0.9.12	X									X			
+parse-display@0.10.0	X									X			
+parse-display-derive@0.10.0	X									X			
+percent-encoding@2.3.2	X									X			
+petgraph@0.8.3	X									X			
+pin-project-lite@0.2.17	X									X			
+pin-utils@0.1.0	X									X			
+pkg-config@0.3.32	X									X			
+portable-atomic@1.13.1	X									X			
+portable-atomic-util@0.2.6	X									X			
+potential_utf@0.1.4											X		
+ppv-lite86@0.2.21	X									X			
+prettyplease@0.2.37	X									X			
+proc-macro2@1.0.106	X									X			
+prost@0.14.3	X												
+prost-build@0.14.3	X												
+prost-derive@0.14.3	X												
+prost-types@0.14.3	X												
+pyo3@0.26.0	X									X			
+pyo3-async-runtimes@0.26.0	X												
+pyo3-build-config@0.26.0	X									X			
+pyo3-ffi@0.26.0	X									X			
+pyo3-macros@0.26.0	X									X			
+pyo3-macros-backend@0.26.0	X									X			
+python3-dll-a@0.2.14										X			
+quick-xml@0.37.5										X			
+quick-xml@0.38.4										X			
+quote@1.0.45	X									X			
+r-efi@5.3.0	X								X	X			
+r-efi@6.0.0	X								X	X			
+radium@0.7.0										X			
+rand@0.8.5	X									X			
+rand@0.9.2	X									X			
+rand_chacha@0.3.1	X									X			
+rand_chacha@0.9.0	X									X			
+rand_core@0.6.4	X									X			
+rand_core@0.9.5	X									X			
+redox_syscall@0.5.18										X			
+regex@1.12.3	X									X			
+regex-automata@0.4.14	X									X			
+regex-syntax@0.8.10	X									X			
+reqsign@0.16.5	X												
+reqwest@0.12.28	X									X			
+ring@0.17.14	X							X					
+rustc_version@0.4.1	X									X			
+rustix@1.1.4	X	X								X			
+rustls@0.23.37	X							X		X			
+rustls-pki-types@1.14.0	X									X			
+rustls-webpki@0.103.10								X					
+rustversion@1.0.22	X									X			
+ryu@1.0.23	X				X								
+scopeguard@1.2.0	X									X			
+semver@1.0.27	X									X			
+serde@1.0.228	X									X			
+serde_core@1.0.228	X									X			
+serde_derive@1.0.228	X									X			
+serde_json@1.0.149	X									X			
+serde_urlencoded@0.7.1	X									X			
+sha1@0.10.6	X									X			
+sha2@0.10.9	X									X			
+shlex@1.3.0	X									X			
+signal-hook-registry@1.4.8	X									X			
+simdutf8@0.1.5	X									X			
+slab@0.4.12										X			
+smallvec@1.15.1	X									X			
+snafu@0.8.9	X									X			
+snafu-derive@0.8.9	X									X			
+socket2@0.6.3	X									X			
+stable_deref_trait@1.2.1	X									X			
+strsim@0.11.1										X			
+structmeta@0.3.0	X									X			
+structmeta-derive@0.3.0	X									X			
+strum@0.26.3										X			
+strum_macros@0.26.4										X			
+subtle@2.6.1				X									
+syn@2.0.117	X									X			
+sync_wrapper@1.0.2	X												
+synstructure@0.13.2										X			
+tap@1.0.1										X			
+target-lexicon@0.13.5		X											
+tempfile@3.27.0	X									X			
+thiserror@1.0.69	X									X			
+thiserror-impl@1.0.69	X									X			
+tiny-keccak@2.0.2						X							
+tinystr@0.8.2											X		
+tokio@1.50.0										X			
+tokio-macros@2.6.1										X			
+tokio-rustls@0.26.4	X									X			
+tokio-util@0.7.18										X			
+tower@0.5.3										X			
+tower-http@0.6.8										X			
+tower-layer@0.3.3										X			
+tower-service@0.3.3										X			
+tracing@0.1.44										X			
+tracing-attributes@0.1.31										X			
+tracing-core@0.1.36										X			
+try-lock@0.2.5										X			
+twox-hash@2.1.2										X			
+typenum@1.19.0	X									X			
+unicode-ident@1.0.24	X									X	X		
+unindent@0.2.4	X									X			
+untrusted@0.9.0								X					
+url@2.5.8	X									X			
+utf8_iter@1.0.4	X									X			
+utf8parse@0.2.2	X									X			
+uuid@1.22.0	X									X			
+value-bag@1.12.0	X									X			
+version_check@0.9.5	X									X			
+want@0.3.1										X			
+wasi@0.11.1+wasi-snapshot-preview1	X	X								X			
+wasip2@1.0.2+wasi-0.2.9	X	X								X			
+wasip3@0.4.0+wasi-0.3.0-rc-2026-01-06	X	X								X			
+wasm-bindgen@0.2.114	X									X			
+wasm-bindgen-futures@0.4.64	X									X			
+wasm-bindgen-macro@0.2.114	X									X			
+wasm-bindgen-macro-support@0.2.114	X									X			
+wasm-bindgen-shared@0.2.114	X									X			
+wasm-streams@0.4.2	X									X			
+web-sys@0.3.91	X									X			
+webpki-roots@1.0.6							X						
+windows-core@0.62.2	X									X			
+windows-implement@0.60.2	X									X			
+windows-interface@0.59.3	X									X			
+windows-link@0.2.1	X									X			
+windows-result@0.4.1	X									X			
+windows-strings@0.5.1	X									X			
+windows-sys@0.52.0	X									X			
+windows-sys@0.61.2	X									X			
+windows-targets@0.52.6	X									X			
+windows_aarch64_gnullvm@0.52.6	X									X			
+windows_aarch64_msvc@0.52.6	X									X			
+windows_i686_gnu@0.52.6	X									X			
+windows_i686_gnullvm@0.52.6	X									X			
+windows_i686_msvc@0.52.6	X									X			
+windows_x86_64_gnu@0.52.6	X									X			
+windows_x86_64_gnullvm@0.52.6	X									X			
+windows_x86_64_msvc@0.52.6	X									X			
+wit-bindgen@0.51.0	X	X								X			
+writeable@0.6.2											X		
+wyz@0.5.1										X			
+yoke@0.8.1											X		
+yoke-derive@0.8.1											X		
+zerocopy@0.8.47	X		X							X			
+zerocopy-derive@0.8.47	X		X							X			
+zerofrom@0.1.6											X		
+zerofrom-derive@0.1.6											X		
+zeroize@1.8.2	X									X			
+zerotrie@0.2.3											X		
+zerovec@0.11.5											X		
+zerovec-derive@0.11.2											X		
+zmij@1.0.21										X			
+zstd@0.13.3										X			
+zstd-safe@7.2.4	X									X			
+zstd-sys@2.0.16+zstd.1.5.7	X									X			
diff --git a/fluss-rust/crates/examples/DEPENDENCIES.rust.tsv b/fluss-rust/crates/examples/DEPENDENCIES.rust.tsv
index 6b30630eff..5af4754d0c 100644
--- a/fluss-rust/crates/examples/DEPENDENCIES.rust.tsv
+++ b/fluss-rust/crates/examples/DEPENDENCIES.rust.tsv
@@ -1,306 +1,300 @@
-crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense
-ahash@0.8.12	X									X		
-aho-corasick@1.1.3										X		X
-android-tzdata@0.1.1	X									X		
-android_system_properties@0.1.5	X									X		
-anstream@0.6.20	X									X		
-anstyle@1.0.11	X									X		
-anstyle-parse@0.2.7	X									X		
-anstyle-query@1.1.4	X									X		
-anstyle-wincon@3.0.10	X									X		
-anyhow@1.0.100	X									X		
-arrow@57.1.0	X											
-arrow-arith@57.1.0	X											
-arrow-array@57.1.0	X											
-arrow-buffer@57.1.0	X											
-arrow-cast@57.1.0	X											
-arrow-csv@57.1.0	X											
-arrow-data@57.1.0	X											
-arrow-ipc@57.1.0	X											
-arrow-json@57.1.0	X											
-arrow-ord@57.1.0	X											
-arrow-row@57.1.0	X											
-arrow-schema@57.1.0	X											
-arrow-select@57.1.0	X											
-arrow-string@57.1.0	X											
-async-trait@0.1.89	X									X		
-atoi@2.0.0										X		
-atomic-waker@1.1.2	X									X		
-autocfg@1.5.0	X									X		
-backon@1.6.0	X											
-base64@0.22.1	X									X		
-bigdecimal@0.4.10	X									X		
-bitflags@2.9.3	X									X		
-bitvec@1.0.1										X		
-block-buffer@0.10.4	X									X		
-bumpalo@3.19.0	X									X		
-byteorder@1.5.0										X		X
-bytes@1.11.1										X		
-cc@1.2.34	X									X		
-cfg-if@1.0.3	X									X		
-chrono@0.4.41	X									X		
-clap@4.5.45	X									X		
-clap_builder@4.5.44	X									X		
-clap_derive@4.5.45	X									X		
-clap_lex@0.7.5	X									X		
-colorchoice@1.0.4	X									X		
-const-oid@0.9.6	X									X		
-const-random@0.1.18	X									X		
-const-random-macro@0.1.16	X									X		
-core-foundation-sys@0.8.7	X									X		
-cpufeatures@0.2.17	X									X		
-crc32c@0.6.8	X									X		
-crossbeam-utils@0.8.21	X									X		
-crunchy@0.2.4										X		
-crypto-common@0.1.7	X									X		
-csv@1.3.1										X		X
-csv-core@0.1.12										X		X
-dashmap@6.1.0										X		
-delegate@0.13.5	X									X		
-digest@0.10.7	X									X		
-displaydoc@0.2.5	X									X		
-either@1.15.0	X									X		
-equivalent@1.0.2	X									X		
-errno@0.3.13	X									X		
-fastrand@2.3.0	X									X		
-fixedbitset@0.5.7	X									X		
-flatbuffers@25.2.10	X											
-fluss-examples@0.1.0	X											
-fluss-rs@0.1.0	X											
-fnv@1.0.7	X									X		
-form_urlencoded@1.2.2	X									X		
-funty@2.0.0										X		
-futures@0.3.31	X									X		
-futures-channel@0.3.31	X									X		
-futures-core@0.3.31	X									X		
-futures-executor@0.3.31	X									X		
-futures-io@0.3.31	X									X		
-futures-macro@0.3.31	X									X		
-futures-sink@0.3.31	X									X		
-futures-task@0.3.31	X									X		
-futures-util@0.3.31	X									X		
-generic-array@0.14.7										X		
-getrandom@0.2.16	X									X		
-getrandom@0.3.3	X									X		
-gloo-timers@0.3.0	X									X		
-h2@0.4.12										X		
-half@2.6.0	X									X		
-hashbrown@0.14.5	X									X		
-hashbrown@0.15.5	X									X		
-hashbrown@0.16.1	X									X		
-heck@0.5.0	X									X		
-hex@0.4.3	X									X		
-hmac@0.12.1	X									X		
-home@0.5.11	X									X		
-http@1.3.1	X									X		
-http-body@1.0.1										X		
-http-body-util@0.1.3										X		
-httparse@1.10.1	X									X		
-httpdate@1.0.3	X									X		
-hyper@1.7.0										X		
-hyper-rustls@0.27.7	X							X		X		
-hyper-util@0.1.17										X		
-iana-time-zone@0.1.63	X									X		
-iana-time-zone-haiku@0.1.2	X									X		
-icu_collections@2.0.0											X	
-icu_locale_core@2.0.0											X	
-icu_normalizer@2.0.0											X	
-icu_normalizer_data@2.0.0											X	
-icu_properties@2.0.1											X	
-icu_properties_data@2.0.1											X	
-icu_provider@2.0.0											X	
-idna@1.1.0	X									X		
-idna_adapter@1.2.1	X									X		
-indexmap@2.11.0	X									X		
-ipnet@2.11.0	X									X		
-iri-string@0.7.9	X									X		
-is_terminal_polyfill@1.70.1	X									X		
-itertools@0.14.0	X									X		
-itoa@1.0.15	X									X		
-jiff@0.2.16										X		X
-jiff-tzdb@0.1.5										X		X
-jiff-tzdb-platform@0.1.3										X		X
-jobserver@0.1.34	X									X		
-js-sys@0.3.77	X									X		
-lexical-core@1.0.5	X									X		
-lexical-parse-float@1.0.5	X									X		
-lexical-parse-integer@1.0.5	X									X		
-lexical-util@1.0.6	X									X		
-lexical-write-float@1.0.5	X									X		
-lexical-write-integer@1.0.5	X									X		
-libc@0.2.175	X									X		
-libm@0.2.15										X		
-linked-hash-map@0.5.6	X									X		
-linux-raw-sys@0.9.4	X	X								X		
-litemap@0.8.0											X	
-lock_api@0.4.13	X									X		
-log@0.4.27	X									X		
-lz4_flex@0.12.0										X		
-md-5@0.10.6	X									X		
-memchr@2.7.5										X		X
-mio@1.0.4										X		
-multimap@0.10.1	X									X		
-num-bigint@0.4.6	X									X		
-num-complex@0.4.6	X									X		
-num-integer@0.1.46	X									X		
-num-traits@0.2.19	X									X		
-once_cell@1.21.3	X									X		
-once_cell_polyfill@1.70.1	X									X		
-opendal@0.55.0	X											
-ordered-float@5.1.0										X		
-parking_lot@0.12.4	X									X		
-parking_lot_core@0.9.11	X									X		
-parse-display@0.10.0	X									X		
-parse-display-derive@0.10.0	X									X		
-percent-encoding@2.3.2	X									X		
-petgraph@0.7.1	X									X		
-pin-project-lite@0.2.16	X									X		
-pin-utils@0.1.0	X									X		
-pkg-config@0.3.32	X									X		
-portable-atomic@1.11.1	X									X		
-portable-atomic-util@0.2.4	X									X		
-potential_utf@0.1.3											X	
-ppv-lite86@0.2.21	X									X		
-prettyplease@0.2.37	X									X		
-proc-macro2@1.0.101	X									X		
-prost@0.14.1	X											
-prost-build@0.14.1	X											
-prost-derive@0.14.1	X											
-prost-types@0.14.1	X											
-quick-xml@0.37.5										X		
-quick-xml@0.38.4										X		
-quote@1.0.40	X									X		
-r-efi@5.3.0	X								X	X		
-radium@0.7.0										X		
-rand@0.8.5	X									X		
-rand@0.9.2	X									X		
-rand_chacha@0.3.1	X									X		
-rand_chacha@0.9.0	X									X		
-rand_core@0.6.4	X									X		
-rand_core@0.9.3	X									X		
-redox_syscall@0.5.17										X		
-regex@1.11.2	X									X		
-regex-automata@0.4.10	X									X		
-regex-syntax@0.8.6	X									X		
-reqsign@0.16.5	X											
-reqwest@0.12.25	X									X		
-ring@0.17.14	X							X				
-rustc_version@0.4.1	X									X		
-rustix@1.0.8	X	X								X		
-rustls@0.23.32	X							X		X		
-rustls-pki-types@1.12.0	X									X		
-rustls-webpki@0.103.7								X				
-rustversion@1.0.22	X									X		
-ryu@1.0.20	X				X							
-scopeguard@1.2.0	X									X		
-semver@1.0.26	X									X		
-serde@1.0.228	X									X		
-serde_core@1.0.228	X									X		
-serde_derive@1.0.228	X									X		
-serde_json@1.0.143	X									X		
-serde_urlencoded@0.7.1	X									X		
-sha1@0.10.6	X									X		
-sha2@0.10.9	X									X		
-shlex@1.3.0	X									X		
-signal-hook-registry@1.4.6	X									X		
-simdutf8@0.1.5	X									X		
-slab@0.4.11										X		
-smallvec@1.15.1	X									X		
-snafu@0.8.9	X									X		
-snafu-derive@0.8.9	X									X		
-socket2@0.6.0	X									X		
-stable_deref_trait@1.2.1	X									X		
-static_assertions@1.1.0	X									X		
-strsim@0.11.1										X		
-structmeta@0.3.0	X									X		
-structmeta-derive@0.3.0	X									X		
-strum@0.26.3										X		
-strum_macros@0.26.4										X		
-subtle@2.6.1				X								
-syn@2.0.106	X									X		
-sync_wrapper@1.0.2	X											
-synstructure@0.13.2										X		
-tap@1.0.1										X		
-tempfile@3.23.0	X									X		
-thiserror@1.0.69	X									X		
-thiserror-impl@1.0.69	X									X		
-tiny-keccak@2.0.2						X						
-tinystr@0.8.1											X	
-tokio@1.48.0										X		
-tokio-macros@2.6.0										X		
-tokio-rustls@0.26.4	X									X		
-tokio-util@0.7.16										X		
-tower@0.5.2										X		
-tower-http@0.6.8										X		
-tower-layer@0.3.3										X		
-tower-service@0.3.3										X		
-tracing@0.1.41										X		
-tracing-attributes@0.1.30										X		
-tracing-core@0.1.34										X		
-try-lock@0.2.5										X		
-twox-hash@2.1.2										X		
-typenum@1.19.0	X									X		
-unicode-ident@1.0.18	X									X	X	
-untrusted@0.9.0								X				
-url@2.5.7	X									X		
-utf8_iter@1.0.4	X									X		
-utf8parse@0.2.2	X									X		
-uuid@1.18.0	X									X		
-value-bag@1.12.0	X									X		
-version_check@0.9.5	X									X		
-want@0.3.1										X		
-wasi@0.11.1+wasi-snapshot-preview1	X	X								X		
-wasi@0.14.2+wasi-0.2.4	X	X								X		
-wasm-bindgen@0.2.100	X									X		
-wasm-bindgen-backend@0.2.100	X									X		
-wasm-bindgen-futures@0.4.50	X									X		
-wasm-bindgen-macro@0.2.100	X									X		
-wasm-bindgen-macro-support@0.2.100	X									X		
-wasm-bindgen-shared@0.2.100	X									X		
-wasm-streams@0.4.2	X									X		
-web-sys@0.3.77	X									X		
-webpki-roots@1.0.3							X					
-windows-core@0.61.2	X									X		
-windows-implement@0.60.0	X									X		
-windows-interface@0.59.1	X									X		
-windows-link@0.1.3	X									X		
-windows-link@0.2.1	X									X		
-windows-result@0.3.4	X									X		
-windows-strings@0.4.2	X									X		
-windows-sys@0.52.0	X									X		
-windows-sys@0.59.0	X									X		
-windows-sys@0.60.2	X									X		
-windows-sys@0.61.2	X									X		
-windows-targets@0.52.6	X									X		
-windows-targets@0.53.3	X									X		
-windows_aarch64_gnullvm@0.52.6	X									X		
-windows_aarch64_gnullvm@0.53.0	X									X		
-windows_aarch64_msvc@0.52.6	X									X		
-windows_aarch64_msvc@0.53.0	X									X		
-windows_i686_gnu@0.52.6	X									X		
-windows_i686_gnu@0.53.0	X									X		
-windows_i686_gnullvm@0.52.6	X									X		
-windows_i686_gnullvm@0.53.0	X									X		
-windows_i686_msvc@0.52.6	X									X		
-windows_i686_msvc@0.53.0	X									X		
-windows_x86_64_gnu@0.52.6	X									X		
-windows_x86_64_gnu@0.53.0	X									X		
-windows_x86_64_gnullvm@0.52.6	X									X		
-windows_x86_64_gnullvm@0.53.0	X									X		
-windows_x86_64_msvc@0.52.6	X									X		
-windows_x86_64_msvc@0.53.0	X									X		
-wit-bindgen-rt@0.39.0	X	X								X		
-writeable@0.6.1											X	
-wyz@0.5.1										X		
-yoke@0.8.0											X	
-yoke-derive@0.8.0											X	
-zerocopy@0.8.26	X		X							X		
-zerofrom@0.1.6											X	
-zerofrom-derive@0.1.6											X	
-zeroize@1.8.2	X									X		
-zerotrie@0.2.2											X	
-zerovec@0.11.4											X	
-zerovec-derive@0.11.1											X	
-zstd@0.13.3										X		
-zstd-safe@7.2.4	X									X		
-zstd-sys@2.0.16+zstd.1.5.7	X									X		
+crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense	Zlib
+ahash@0.8.12	X									X			
+aho-corasick@1.1.4										X		X	
+android_system_properties@0.1.5	X									X			
+anstream@1.0.0	X									X			
+anstyle@1.0.14	X									X			
+anstyle-parse@1.0.0	X									X			
+anstyle-query@1.1.5	X									X			
+anstyle-wincon@3.0.11	X									X			
+anyhow@1.0.102	X									X			
+arrow@57.3.0	X												
+arrow-arith@57.3.0	X												
+arrow-array@57.3.0	X												
+arrow-buffer@57.3.0	X												
+arrow-cast@57.3.0	X												
+arrow-csv@57.3.0	X												
+arrow-data@57.3.0	X												
+arrow-ipc@57.3.0	X												
+arrow-json@57.3.0	X												
+arrow-ord@57.3.0	X												
+arrow-row@57.3.0	X												
+arrow-schema@57.3.0	X												
+arrow-select@57.3.0	X												
+arrow-string@57.3.0	X												
+async-trait@0.1.89	X									X			
+atoi@2.0.0										X			
+atomic-waker@1.1.2	X									X			
+autocfg@1.5.0	X									X			
+backon@1.6.0	X												
+base64@0.22.1	X									X			
+bigdecimal@0.4.10	X									X			
+bitflags@2.11.0	X									X			
+bitvec@1.0.1										X			
+block-buffer@0.10.4	X									X			
+bumpalo@3.20.2	X									X			
+byteorder@1.5.0										X		X	
+bytes@1.11.1										X			
+cc@1.2.57	X									X			
+cfg-if@1.0.4	X									X			
+chrono@0.4.44	X									X			
+clap@4.6.0	X									X			
+clap_builder@4.6.0	X									X			
+clap_derive@4.6.0	X									X			
+clap_lex@1.1.0	X									X			
+colorchoice@1.0.5	X									X			
+const-oid@0.9.6	X									X			
+const-random@0.1.18	X									X			
+const-random-macro@0.1.16	X									X			
+core-foundation-sys@0.8.7	X									X			
+cpufeatures@0.2.17	X									X			
+crc32c@0.6.8	X									X			
+crossbeam-utils@0.8.21	X									X			
+crunchy@0.2.4										X			
+crypto-common@0.1.7	X									X			
+csv@1.4.0										X		X	
+csv-core@0.1.13										X		X	
+dashmap@6.1.0										X			
+delegate@0.13.5	X									X			
+digest@0.10.7	X									X			
+displaydoc@0.2.5	X									X			
+either@1.15.0	X									X			
+equivalent@1.0.2	X									X			
+errno@0.3.14	X									X			
+fastrand@2.3.0	X									X			
+find-msvc-tools@0.1.9	X									X			
+fixedbitset@0.5.7	X									X			
+flatbuffers@25.12.19	X												
+fluss-examples@0.1.0	X												
+fluss-rs@0.1.0	X												
+fnv@1.0.7	X									X			
+foldhash@0.1.5													X
+form_urlencoded@1.2.2	X									X			
+funty@2.0.0										X			
+futures@0.3.32	X									X			
+futures-channel@0.3.32	X									X			
+futures-core@0.3.32	X									X			
+futures-executor@0.3.32	X									X			
+futures-io@0.3.32	X									X			
+futures-macro@0.3.32	X									X			
+futures-sink@0.3.32	X									X			
+futures-task@0.3.32	X									X			
+futures-util@0.3.32	X									X			
+generic-array@0.14.7										X			
+getrandom@0.2.17	X									X			
+getrandom@0.3.4	X									X			
+getrandom@0.4.2	X									X			
+gloo-timers@0.3.0	X									X			
+h2@0.4.13										X			
+half@2.7.1	X									X			
+hashbrown@0.14.5	X									X			
+hashbrown@0.15.5	X									X			
+hashbrown@0.16.1	X									X			
+heck@0.5.0	X									X			
+hex@0.4.3	X									X			
+hmac@0.12.1	X									X			
+home@0.5.12	X									X			
+http@1.4.0	X									X			
+http-body@1.0.1										X			
+http-body-util@0.1.3										X			
+httparse@1.10.1	X									X			
+httpdate@1.0.3	X									X			
+hyper@1.8.1										X			
+hyper-rustls@0.27.7	X							X		X			
+hyper-util@0.1.20										X			
+iana-time-zone@0.1.65	X									X			
+iana-time-zone-haiku@0.1.2	X									X			
+icu_collections@2.1.1											X		
+icu_locale_core@2.1.1											X		
+icu_normalizer@2.1.1											X		
+icu_normalizer_data@2.1.1											X		
+icu_properties@2.1.2											X		
+icu_properties_data@2.1.2											X		
+icu_provider@2.1.1											X		
+idna@1.1.0	X									X			
+idna_adapter@1.2.1	X									X			
+indexmap@2.13.0	X									X			
+ipnet@2.12.0	X									X			
+iri-string@0.7.11	X									X			
+is_terminal_polyfill@1.70.2	X									X			
+itertools@0.14.0	X									X			
+itoa@1.0.18	X									X			
+jiff@0.2.23										X		X	
+jiff-tzdb@0.1.6										X		X	
+jiff-tzdb-platform@0.1.3										X		X	
+jobserver@0.1.34	X									X			
+js-sys@0.3.91	X									X			
+lexical-core@1.0.6	X									X			
+lexical-parse-float@1.0.6	X									X			
+lexical-parse-integer@1.0.6	X									X			
+lexical-util@1.0.7	X									X			
+lexical-write-float@1.0.6	X									X			
+lexical-write-integer@1.0.6	X									X			
+libc@0.2.183	X									X			
+libm@0.2.16										X			
+linked-hash-map@0.5.6	X									X			
+linux-raw-sys@0.12.1	X	X								X			
+litemap@0.8.1											X		
+lock_api@0.4.14	X									X			
+log@0.4.29	X									X			
+lz4_flex@0.12.1										X			
+md-5@0.10.6	X									X			
+memchr@2.8.0										X		X	
+mio@1.1.1										X			
+multimap@0.10.1	X									X			
+num-bigint@0.4.6	X									X			
+num-complex@0.4.6	X									X			
+num-integer@0.1.46	X									X			
+num-traits@0.2.19	X									X			
+once_cell@1.21.4	X									X			
+once_cell_polyfill@1.70.2	X									X			
+opendal@0.55.0	X												
+ordered-float@5.1.0										X			
+parking_lot@0.12.5	X									X			
+parking_lot_core@0.9.12	X									X			
+parse-display@0.10.0	X									X			
+parse-display-derive@0.10.0	X									X			
+percent-encoding@2.3.2	X									X			
+petgraph@0.8.3	X									X			
+pin-project-lite@0.2.17	X									X			
+pin-utils@0.1.0	X									X			
+pkg-config@0.3.32	X									X			
+portable-atomic@1.13.1	X									X			
+portable-atomic-util@0.2.6	X									X			
+potential_utf@0.1.4											X		
+ppv-lite86@0.2.21	X									X			
+prettyplease@0.2.37	X									X			
+proc-macro2@1.0.106	X									X			
+prost@0.14.3	X												
+prost-build@0.14.3	X												
+prost-derive@0.14.3	X												
+prost-types@0.14.3	X												
+quick-xml@0.37.5										X			
+quick-xml@0.38.4										X			
+quote@1.0.45	X									X			
+r-efi@5.3.0	X								X	X			
+r-efi@6.0.0	X								X	X			
+radium@0.7.0										X			
+rand@0.8.5	X									X			
+rand@0.9.2	X									X			
+rand_chacha@0.3.1	X									X			
+rand_chacha@0.9.0	X									X			
+rand_core@0.6.4	X									X			
+rand_core@0.9.5	X									X			
+redox_syscall@0.5.18										X			
+regex@1.12.3	X									X			
+regex-automata@0.4.14	X									X			
+regex-syntax@0.8.10	X									X			
+reqsign@0.16.5	X												
+reqwest@0.12.28	X									X			
+ring@0.17.14	X							X					
+rustc_version@0.4.1	X									X			
+rustix@1.1.4	X	X								X			
+rustls@0.23.37	X							X		X			
+rustls-pki-types@1.14.0	X									X			
+rustls-webpki@0.103.10								X					
+rustversion@1.0.22	X									X			
+ryu@1.0.23	X				X								
+scopeguard@1.2.0	X									X			
+semver@1.0.27	X									X			
+serde@1.0.228	X									X			
+serde_core@1.0.228	X									X			
+serde_derive@1.0.228	X									X			
+serde_json@1.0.149	X									X			
+serde_urlencoded@0.7.1	X									X			
+sha1@0.10.6	X									X			
+sha2@0.10.9	X									X			
+shlex@1.3.0	X									X			
+signal-hook-registry@1.4.8	X									X			
+simdutf8@0.1.5	X									X			
+slab@0.4.12										X			
+smallvec@1.15.1	X									X			
+snafu@0.8.9	X									X			
+snafu-derive@0.8.9	X									X			
+socket2@0.6.3	X									X			
+stable_deref_trait@1.2.1	X									X			
+strsim@0.11.1										X			
+structmeta@0.3.0	X									X			
+structmeta-derive@0.3.0	X									X			
+strum@0.26.3										X			
+strum_macros@0.26.4										X			
+subtle@2.6.1				X									
+syn@2.0.117	X									X			
+sync_wrapper@1.0.2	X												
+synstructure@0.13.2										X			
+tap@1.0.1										X			
+tempfile@3.27.0	X									X			
+thiserror@1.0.69	X									X			
+thiserror-impl@1.0.69	X									X			
+tikv-jemalloc-sys@0.6.1+5.3.0-1-ge13ca993e8ccb9ba9847cc330696e02839f328f7	X									X			
+tikv-jemallocator@0.6.1	X									X			
+tiny-keccak@2.0.2						X							
+tinystr@0.8.2											X		
+tokio@1.50.0										X			
+tokio-macros@2.6.1										X			
+tokio-rustls@0.26.4	X									X			
+tokio-util@0.7.18										X			
+tower@0.5.3										X			
+tower-http@0.6.8										X			
+tower-layer@0.3.3										X			
+tower-service@0.3.3										X			
+tracing@0.1.44										X			
+tracing-attributes@0.1.31										X			
+tracing-core@0.1.36										X			
+try-lock@0.2.5										X			
+twox-hash@2.1.2										X			
+typenum@1.19.0	X									X			
+unicode-ident@1.0.24	X									X	X		
+untrusted@0.9.0								X					
+url@2.5.8	X									X			
+utf8_iter@1.0.4	X									X			
+utf8parse@0.2.2	X									X			
+uuid@1.22.0	X									X			
+value-bag@1.12.0	X									X			
+version_check@0.9.5	X									X			
+want@0.3.1										X			
+wasi@0.11.1+wasi-snapshot-preview1	X	X								X			
+wasip2@1.0.2+wasi-0.2.9	X	X								X			
+wasip3@0.4.0+wasi-0.3.0-rc-2026-01-06	X	X								X			
+wasm-bindgen@0.2.114	X									X			
+wasm-bindgen-futures@0.4.64	X									X			
+wasm-bindgen-macro@0.2.114	X									X			
+wasm-bindgen-macro-support@0.2.114	X									X			
+wasm-bindgen-shared@0.2.114	X									X			
+wasm-streams@0.4.2	X									X			
+web-sys@0.3.91	X									X			
+webpki-roots@1.0.6							X						
+windows-core@0.62.2	X									X			
+windows-implement@0.60.2	X									X			
+windows-interface@0.59.3	X									X			
+windows-link@0.2.1	X									X			
+windows-result@0.4.1	X									X			
+windows-strings@0.5.1	X									X			
+windows-sys@0.52.0	X									X			
+windows-sys@0.61.2	X									X			
+windows-targets@0.52.6	X									X			
+windows_aarch64_gnullvm@0.52.6	X									X			
+windows_aarch64_msvc@0.52.6	X									X			
+windows_i686_gnu@0.52.6	X									X			
+windows_i686_gnullvm@0.52.6	X									X			
+windows_i686_msvc@0.52.6	X									X			
+windows_x86_64_gnu@0.52.6	X									X			
+windows_x86_64_gnullvm@0.52.6	X									X			
+windows_x86_64_msvc@0.52.6	X									X			
+wit-bindgen@0.51.0	X	X								X			
+writeable@0.6.2											X		
+wyz@0.5.1										X			
+yoke@0.8.1											X		
+yoke-derive@0.8.1											X		
+zerocopy@0.8.47	X		X							X			
+zerocopy-derive@0.8.47	X		X							X			
+zerofrom@0.1.6											X		
+zerofrom-derive@0.1.6											X		
+zeroize@1.8.2	X									X			
+zerotrie@0.2.3											X		
+zerovec@0.11.5											X		
+zerovec-derive@0.11.2											X		
+zmij@1.0.21										X			
+zstd@0.13.3										X			
+zstd-safe@7.2.4	X									X			
+zstd-sys@2.0.16+zstd.1.5.7	X									X			
diff --git a/fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv b/fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv
index 29cbe1e8c2..85a865852a 100644
--- a/fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv
+++ b/fluss-rust/crates/fluss/DEPENDENCIES.rust.tsv
@@ -1,305 +1,297 @@
-crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense
-ahash@0.8.12	X									X		
-aho-corasick@1.1.3										X		X
-android-tzdata@0.1.1	X									X		
-android_system_properties@0.1.5	X									X		
-anstream@0.6.20	X									X		
-anstyle@1.0.11	X									X		
-anstyle-parse@0.2.7	X									X		
-anstyle-query@1.1.4	X									X		
-anstyle-wincon@3.0.10	X									X		
-anyhow@1.0.100	X									X		
-arrow@57.1.0	X											
-arrow-arith@57.1.0	X											
-arrow-array@57.1.0	X											
-arrow-buffer@57.1.0	X											
-arrow-cast@57.1.0	X											
-arrow-csv@57.1.0	X											
-arrow-data@57.1.0	X											
-arrow-ipc@57.1.0	X											
-arrow-json@57.1.0	X											
-arrow-ord@57.1.0	X											
-arrow-row@57.1.0	X											
-arrow-schema@57.1.0	X											
-arrow-select@57.1.0	X											
-arrow-string@57.1.0	X											
-async-trait@0.1.89	X									X		
-atoi@2.0.0										X		
-atomic-waker@1.1.2	X									X		
-autocfg@1.5.0	X									X		
-backon@1.6.0	X											
-base64@0.22.1	X									X		
-bigdecimal@0.4.10	X									X		
-bitflags@2.9.3	X									X		
-bitvec@1.0.1										X		
-block-buffer@0.10.4	X									X		
-bumpalo@3.19.0	X									X		
-byteorder@1.5.0										X		X
-bytes@1.11.1										X		
-cc@1.2.34	X									X		
-cfg-if@1.0.3	X									X		
-chrono@0.4.41	X									X		
-clap@4.5.45	X									X		
-clap_builder@4.5.44	X									X		
-clap_derive@4.5.45	X									X		
-clap_lex@0.7.5	X									X		
-colorchoice@1.0.4	X									X		
-const-oid@0.9.6	X									X		
-const-random@0.1.18	X									X		
-const-random-macro@0.1.16	X									X		
-core-foundation-sys@0.8.7	X									X		
-cpufeatures@0.2.17	X									X		
-crc32c@0.6.8	X									X		
-crossbeam-utils@0.8.21	X									X		
-crunchy@0.2.4										X		
-crypto-common@0.1.7	X									X		
-csv@1.3.1										X		X
-csv-core@0.1.12										X		X
-dashmap@6.1.0										X		
-delegate@0.13.5	X									X		
-digest@0.10.7	X									X		
-displaydoc@0.2.5	X									X		
-either@1.15.0	X									X		
-equivalent@1.0.2	X									X		
-errno@0.3.13	X									X		
-fastrand@2.3.0	X									X		
-fixedbitset@0.5.7	X									X		
-flatbuffers@25.2.10	X											
-fluss-rs@0.1.0	X											
-fnv@1.0.7	X									X		
-form_urlencoded@1.2.2	X									X		
-funty@2.0.0										X		
-futures@0.3.31	X									X		
-futures-channel@0.3.31	X									X		
-futures-core@0.3.31	X									X		
-futures-executor@0.3.31	X									X		
-futures-io@0.3.31	X									X		
-futures-macro@0.3.31	X									X		
-futures-sink@0.3.31	X									X		
-futures-task@0.3.31	X									X		
-futures-util@0.3.31	X									X		
-generic-array@0.14.7										X		
-getrandom@0.2.16	X									X		
-getrandom@0.3.3	X									X		
-gloo-timers@0.3.0	X									X		
-h2@0.4.12										X		
-half@2.6.0	X									X		
-hashbrown@0.14.5	X									X		
-hashbrown@0.15.5	X									X		
-hashbrown@0.16.1	X									X		
-heck@0.5.0	X									X		
-hex@0.4.3	X									X		
-hmac@0.12.1	X									X		
-home@0.5.11	X									X		
-http@1.3.1	X									X		
-http-body@1.0.1										X		
-http-body-util@0.1.3										X		
-httparse@1.10.1	X									X		
-httpdate@1.0.3	X									X		
-hyper@1.7.0										X		
-hyper-rustls@0.27.7	X							X		X		
-hyper-util@0.1.17										X		
-iana-time-zone@0.1.63	X									X		
-iana-time-zone-haiku@0.1.2	X									X		
-icu_collections@2.0.0											X	
-icu_locale_core@2.0.0											X	
-icu_normalizer@2.0.0											X	
-icu_normalizer_data@2.0.0											X	
-icu_properties@2.0.1											X	
-icu_properties_data@2.0.1											X	
-icu_provider@2.0.0											X	
-idna@1.1.0	X									X		
-idna_adapter@1.2.1	X									X		
-indexmap@2.11.0	X									X		
-ipnet@2.11.0	X									X		
-iri-string@0.7.9	X									X		
-is_terminal_polyfill@1.70.1	X									X		
-itertools@0.14.0	X									X		
-itoa@1.0.15	X									X		
-jiff@0.2.16										X		X
-jiff-tzdb@0.1.5										X		X
-jiff-tzdb-platform@0.1.3										X		X
-jobserver@0.1.34	X									X		
-js-sys@0.3.77	X									X		
-lexical-core@1.0.5	X									X		
-lexical-parse-float@1.0.5	X									X		
-lexical-parse-integer@1.0.5	X									X		
-lexical-util@1.0.6	X									X		
-lexical-write-float@1.0.5	X									X		
-lexical-write-integer@1.0.5	X									X		
-libc@0.2.175	X									X		
-libm@0.2.15										X		
-linked-hash-map@0.5.6	X									X		
-linux-raw-sys@0.9.4	X	X								X		
-litemap@0.8.0											X	
-lock_api@0.4.13	X									X		
-log@0.4.27	X									X		
-lz4_flex@0.12.0										X		
-md-5@0.10.6	X									X		
-memchr@2.7.5										X		X
-mio@1.0.4										X		
-multimap@0.10.1	X									X		
-num-bigint@0.4.6	X									X		
-num-complex@0.4.6	X									X		
-num-integer@0.1.46	X									X		
-num-traits@0.2.19	X									X		
-once_cell@1.21.3	X									X		
-once_cell_polyfill@1.70.1	X									X		
-opendal@0.55.0	X											
-ordered-float@5.1.0										X		
-parking_lot@0.12.4	X									X		
-parking_lot_core@0.9.11	X									X		
-parse-display@0.10.0	X									X		
-parse-display-derive@0.10.0	X									X		
-percent-encoding@2.3.2	X									X		
-petgraph@0.7.1	X									X		
-pin-project-lite@0.2.16	X									X		
-pin-utils@0.1.0	X									X		
-pkg-config@0.3.32	X									X		
-portable-atomic@1.11.1	X									X		
-portable-atomic-util@0.2.4	X									X		
-potential_utf@0.1.3											X	
-ppv-lite86@0.2.21	X									X		
-prettyplease@0.2.37	X									X		
-proc-macro2@1.0.101	X									X		
-prost@0.14.1	X											
-prost-build@0.14.1	X											
-prost-derive@0.14.1	X											
-prost-types@0.14.1	X											
-quick-xml@0.37.5										X		
-quick-xml@0.38.4										X		
-quote@1.0.40	X									X		
-r-efi@5.3.0	X								X	X		
-radium@0.7.0										X		
-rand@0.8.5	X									X		
-rand@0.9.2	X									X		
-rand_chacha@0.3.1	X									X		
-rand_chacha@0.9.0	X									X		
-rand_core@0.6.4	X									X		
-rand_core@0.9.3	X									X		
-redox_syscall@0.5.17										X		
-regex@1.11.2	X									X		
-regex-automata@0.4.10	X									X		
-regex-syntax@0.8.6	X									X		
-reqsign@0.16.5	X											
-reqwest@0.12.25	X									X		
-ring@0.17.14	X							X				
-rustc_version@0.4.1	X									X		
-rustix@1.0.8	X	X								X		
-rustls@0.23.32	X							X		X		
-rustls-pki-types@1.12.0	X									X		
-rustls-webpki@0.103.7								X				
-rustversion@1.0.22	X									X		
-ryu@1.0.20	X				X							
-scopeguard@1.2.0	X									X		
-semver@1.0.26	X									X		
-serde@1.0.228	X									X		
-serde_core@1.0.228	X									X		
-serde_derive@1.0.228	X									X		
-serde_json@1.0.143	X									X		
-serde_urlencoded@0.7.1	X									X		
-sha1@0.10.6	X									X		
-sha2@0.10.9	X									X		
-shlex@1.3.0	X									X		
-signal-hook-registry@1.4.6	X									X		
-simdutf8@0.1.5	X									X		
-slab@0.4.11										X		
-smallvec@1.15.1	X									X		
-snafu@0.8.9	X									X		
-snafu-derive@0.8.9	X									X		
-socket2@0.6.0	X									X		
-stable_deref_trait@1.2.1	X									X		
-static_assertions@1.1.0	X									X		
-strsim@0.11.1										X		
-structmeta@0.3.0	X									X		
-structmeta-derive@0.3.0	X									X		
-strum@0.26.3										X		
-strum_macros@0.26.4										X		
-subtle@2.6.1				X								
-syn@2.0.106	X									X		
-sync_wrapper@1.0.2	X											
-synstructure@0.13.2										X		
-tap@1.0.1										X		
-tempfile@3.23.0	X									X		
-thiserror@1.0.69	X									X		
-thiserror-impl@1.0.69	X									X		
-tiny-keccak@2.0.2						X						
-tinystr@0.8.1											X	
-tokio@1.48.0										X		
-tokio-macros@2.6.0										X		
-tokio-rustls@0.26.4	X									X		
-tokio-util@0.7.16										X		
-tower@0.5.2										X		
-tower-http@0.6.8										X		
-tower-layer@0.3.3										X		
-tower-service@0.3.3										X		
-tracing@0.1.41										X		
-tracing-attributes@0.1.30										X		
-tracing-core@0.1.34										X		
-try-lock@0.2.5										X		
-twox-hash@2.1.2										X		
-typenum@1.19.0	X									X		
-unicode-ident@1.0.18	X									X	X	
-untrusted@0.9.0								X				
-url@2.5.7	X									X		
-utf8_iter@1.0.4	X									X		
-utf8parse@0.2.2	X									X		
-uuid@1.18.0	X									X		
-value-bag@1.12.0	X									X		
-version_check@0.9.5	X									X		
-want@0.3.1										X		
-wasi@0.11.1+wasi-snapshot-preview1	X	X								X		
-wasi@0.14.2+wasi-0.2.4	X	X								X		
-wasm-bindgen@0.2.100	X									X		
-wasm-bindgen-backend@0.2.100	X									X		
-wasm-bindgen-futures@0.4.50	X									X		
-wasm-bindgen-macro@0.2.100	X									X		
-wasm-bindgen-macro-support@0.2.100	X									X		
-wasm-bindgen-shared@0.2.100	X									X		
-wasm-streams@0.4.2	X									X		
-web-sys@0.3.77	X									X		
-webpki-roots@1.0.3							X					
-windows-core@0.61.2	X									X		
-windows-implement@0.60.0	X									X		
-windows-interface@0.59.1	X									X		
-windows-link@0.1.3	X									X		
-windows-link@0.2.1	X									X		
-windows-result@0.3.4	X									X		
-windows-strings@0.4.2	X									X		
-windows-sys@0.52.0	X									X		
-windows-sys@0.59.0	X									X		
-windows-sys@0.60.2	X									X		
-windows-sys@0.61.2	X									X		
-windows-targets@0.52.6	X									X		
-windows-targets@0.53.3	X									X		
-windows_aarch64_gnullvm@0.52.6	X									X		
-windows_aarch64_gnullvm@0.53.0	X									X		
-windows_aarch64_msvc@0.52.6	X									X		
-windows_aarch64_msvc@0.53.0	X									X		
-windows_i686_gnu@0.52.6	X									X		
-windows_i686_gnu@0.53.0	X									X		
-windows_i686_gnullvm@0.52.6	X									X		
-windows_i686_gnullvm@0.53.0	X									X		
-windows_i686_msvc@0.52.6	X									X		
-windows_i686_msvc@0.53.0	X									X		
-windows_x86_64_gnu@0.52.6	X									X		
-windows_x86_64_gnu@0.53.0	X									X		
-windows_x86_64_gnullvm@0.52.6	X									X		
-windows_x86_64_gnullvm@0.53.0	X									X		
-windows_x86_64_msvc@0.52.6	X									X		
-windows_x86_64_msvc@0.53.0	X									X		
-wit-bindgen-rt@0.39.0	X	X								X		
-writeable@0.6.1											X	
-wyz@0.5.1										X		
-yoke@0.8.0											X	
-yoke-derive@0.8.0											X	
-zerocopy@0.8.26	X		X							X		
-zerofrom@0.1.6											X	
-zerofrom-derive@0.1.6											X	
-zeroize@1.8.2	X									X		
-zerotrie@0.2.2											X	
-zerovec@0.11.4											X	
-zerovec-derive@0.11.1											X	
-zstd@0.13.3										X		
-zstd-safe@7.2.4	X									X		
-zstd-sys@2.0.16+zstd.1.5.7	X									X		
+crate	Apache-2.0	Apache-2.0 WITH LLVM-exception	BSD-2-Clause	BSD-3-Clause	BSL-1.0	CC0-1.0	CDLA-Permissive-2.0	ISC	LGPL-2.1-or-later	MIT	Unicode-3.0	Unlicense	Zlib
+ahash@0.8.12	X									X			
+aho-corasick@1.1.4										X		X	
+android_system_properties@0.1.5	X									X			
+anstream@1.0.0	X									X			
+anstyle@1.0.14	X									X			
+anstyle-parse@1.0.0	X									X			
+anstyle-query@1.1.5	X									X			
+anstyle-wincon@3.0.11	X									X			
+anyhow@1.0.102	X									X			
+arrow@57.3.0	X												
+arrow-arith@57.3.0	X												
+arrow-array@57.3.0	X												
+arrow-buffer@57.3.0	X												
+arrow-cast@57.3.0	X												
+arrow-csv@57.3.0	X												
+arrow-data@57.3.0	X												
+arrow-ipc@57.3.0	X												
+arrow-json@57.3.0	X												
+arrow-ord@57.3.0	X												
+arrow-row@57.3.0	X												
+arrow-schema@57.3.0	X												
+arrow-select@57.3.0	X												
+arrow-string@57.3.0	X												
+async-trait@0.1.89	X									X			
+atoi@2.0.0										X			
+atomic-waker@1.1.2	X									X			
+autocfg@1.5.0	X									X			
+backon@1.6.0	X												
+base64@0.22.1	X									X			
+bigdecimal@0.4.10	X									X			
+bitflags@2.11.0	X									X			
+bitvec@1.0.1										X			
+block-buffer@0.10.4	X									X			
+bumpalo@3.20.2	X									X			
+byteorder@1.5.0										X		X	
+bytes@1.11.1										X			
+cc@1.2.57	X									X			
+cfg-if@1.0.4	X									X			
+chrono@0.4.44	X									X			
+clap@4.6.0	X									X			
+clap_builder@4.6.0	X									X			
+clap_derive@4.6.0	X									X			
+clap_lex@1.1.0	X									X			
+colorchoice@1.0.5	X									X			
+const-oid@0.9.6	X									X			
+const-random@0.1.18	X									X			
+const-random-macro@0.1.16	X									X			
+core-foundation-sys@0.8.7	X									X			
+cpufeatures@0.2.17	X									X			
+crc32c@0.6.8	X									X			
+crossbeam-utils@0.8.21	X									X			
+crunchy@0.2.4										X			
+crypto-common@0.1.7	X									X			
+csv@1.4.0										X		X	
+csv-core@0.1.13										X		X	
+dashmap@6.1.0										X			
+delegate@0.13.5	X									X			
+digest@0.10.7	X									X			
+displaydoc@0.2.5	X									X			
+either@1.15.0	X									X			
+equivalent@1.0.2	X									X			
+errno@0.3.14	X									X			
+fastrand@2.3.0	X									X			
+find-msvc-tools@0.1.9	X									X			
+fixedbitset@0.5.7	X									X			
+flatbuffers@25.12.19	X												
+fluss-rs@0.1.0	X												
+fnv@1.0.7	X									X			
+foldhash@0.1.5													X
+form_urlencoded@1.2.2	X									X			
+funty@2.0.0										X			
+futures@0.3.32	X									X			
+futures-channel@0.3.32	X									X			
+futures-core@0.3.32	X									X			
+futures-executor@0.3.32	X									X			
+futures-io@0.3.32	X									X			
+futures-macro@0.3.32	X									X			
+futures-sink@0.3.32	X									X			
+futures-task@0.3.32	X									X			
+futures-util@0.3.32	X									X			
+generic-array@0.14.7										X			
+getrandom@0.2.17	X									X			
+getrandom@0.3.4	X									X			
+getrandom@0.4.2	X									X			
+gloo-timers@0.3.0	X									X			
+h2@0.4.13										X			
+half@2.7.1	X									X			
+hashbrown@0.14.5	X									X			
+hashbrown@0.15.5	X									X			
+hashbrown@0.16.1	X									X			
+heck@0.5.0	X									X			
+hex@0.4.3	X									X			
+hmac@0.12.1	X									X			
+home@0.5.12	X									X			
+http@1.4.0	X									X			
+http-body@1.0.1										X			
+http-body-util@0.1.3										X			
+httparse@1.10.1	X									X			
+httpdate@1.0.3	X									X			
+hyper@1.8.1										X			
+hyper-rustls@0.27.7	X							X		X			
+hyper-util@0.1.20										X			
+iana-time-zone@0.1.65	X									X			
+iana-time-zone-haiku@0.1.2	X									X			
+icu_collections@2.1.1											X		
+icu_locale_core@2.1.1											X		
+icu_normalizer@2.1.1											X		
+icu_normalizer_data@2.1.1											X		
+icu_properties@2.1.2											X		
+icu_properties_data@2.1.2											X		
+icu_provider@2.1.1											X		
+idna@1.1.0	X									X			
+idna_adapter@1.2.1	X									X			
+indexmap@2.13.0	X									X			
+ipnet@2.12.0	X									X			
+iri-string@0.7.11	X									X			
+is_terminal_polyfill@1.70.2	X									X			
+itertools@0.14.0	X									X			
+itoa@1.0.18	X									X			
+jiff@0.2.23										X		X	
+jiff-tzdb@0.1.6										X		X	
+jiff-tzdb-platform@0.1.3										X		X	
+jobserver@0.1.34	X									X			
+js-sys@0.3.91	X									X			
+lexical-core@1.0.6	X									X			
+lexical-parse-float@1.0.6	X									X			
+lexical-parse-integer@1.0.6	X									X			
+lexical-util@1.0.7	X									X			
+lexical-write-float@1.0.6	X									X			
+lexical-write-integer@1.0.6	X									X			
+libc@0.2.183	X									X			
+libm@0.2.16										X			
+linked-hash-map@0.5.6	X									X			
+linux-raw-sys@0.12.1	X	X								X			
+litemap@0.8.1											X		
+lock_api@0.4.14	X									X			
+log@0.4.29	X									X			
+lz4_flex@0.12.1										X			
+md-5@0.10.6	X									X			
+memchr@2.8.0										X		X	
+mio@1.1.1										X			
+multimap@0.10.1	X									X			
+num-bigint@0.4.6	X									X			
+num-complex@0.4.6	X									X			
+num-integer@0.1.46	X									X			
+num-traits@0.2.19	X									X			
+once_cell@1.21.4	X									X			
+once_cell_polyfill@1.70.2	X									X			
+opendal@0.55.0	X												
+ordered-float@5.1.0										X			
+parking_lot@0.12.5	X									X			
+parking_lot_core@0.9.12	X									X			
+parse-display@0.10.0	X									X			
+parse-display-derive@0.10.0	X									X			
+percent-encoding@2.3.2	X									X			
+petgraph@0.8.3	X									X			
+pin-project-lite@0.2.17	X									X			
+pin-utils@0.1.0	X									X			
+pkg-config@0.3.32	X									X			
+portable-atomic@1.13.1	X									X			
+portable-atomic-util@0.2.6	X									X			
+potential_utf@0.1.4											X		
+ppv-lite86@0.2.21	X									X			
+prettyplease@0.2.37	X									X			
+proc-macro2@1.0.106	X									X			
+prost@0.14.3	X												
+prost-build@0.14.3	X												
+prost-derive@0.14.3	X												
+prost-types@0.14.3	X												
+quick-xml@0.37.5										X			
+quick-xml@0.38.4										X			
+quote@1.0.45	X									X			
+r-efi@5.3.0	X								X	X			
+r-efi@6.0.0	X								X	X			
+radium@0.7.0										X			
+rand@0.8.5	X									X			
+rand@0.9.2	X									X			
+rand_chacha@0.3.1	X									X			
+rand_chacha@0.9.0	X									X			
+rand_core@0.6.4	X									X			
+rand_core@0.9.5	X									X			
+redox_syscall@0.5.18										X			
+regex@1.12.3	X									X			
+regex-automata@0.4.14	X									X			
+regex-syntax@0.8.10	X									X			
+reqsign@0.16.5	X												
+reqwest@0.12.28	X									X			
+ring@0.17.14	X							X					
+rustc_version@0.4.1	X									X			
+rustix@1.1.4	X	X								X			
+rustls@0.23.37	X							X		X			
+rustls-pki-types@1.14.0	X									X			
+rustls-webpki@0.103.10								X					
+rustversion@1.0.22	X									X			
+ryu@1.0.23	X				X								
+scopeguard@1.2.0	X									X			
+semver@1.0.27	X									X			
+serde@1.0.228	X									X			
+serde_core@1.0.228	X									X			
+serde_derive@1.0.228	X									X			
+serde_json@1.0.149	X									X			
+serde_urlencoded@0.7.1	X									X			
+sha1@0.10.6	X									X			
+sha2@0.10.9	X									X			
+shlex@1.3.0	X									X			
+signal-hook-registry@1.4.8	X									X			
+simdutf8@0.1.5	X									X			
+slab@0.4.12										X			
+smallvec@1.15.1	X									X			
+snafu@0.8.9	X									X			
+snafu-derive@0.8.9	X									X			
+socket2@0.6.3	X									X			
+stable_deref_trait@1.2.1	X									X			
+strsim@0.11.1										X			
+structmeta@0.3.0	X									X			
+structmeta-derive@0.3.0	X									X			
+strum@0.26.3										X			
+strum_macros@0.26.4										X			
+subtle@2.6.1				X									
+syn@2.0.117	X									X			
+sync_wrapper@1.0.2	X												
+synstructure@0.13.2										X			
+tap@1.0.1										X			
+tempfile@3.27.0	X									X			
+thiserror@1.0.69	X									X			
+thiserror-impl@1.0.69	X									X			
+tiny-keccak@2.0.2						X							
+tinystr@0.8.2											X		
+tokio@1.50.0										X			
+tokio-macros@2.6.1										X			
+tokio-rustls@0.26.4	X									X			
+tokio-util@0.7.18										X			
+tower@0.5.3										X			
+tower-http@0.6.8										X			
+tower-layer@0.3.3										X			
+tower-service@0.3.3										X			
+tracing@0.1.44										X			
+tracing-attributes@0.1.31										X			
+tracing-core@0.1.36										X			
+try-lock@0.2.5										X			
+twox-hash@2.1.2										X			
+typenum@1.19.0	X									X			
+unicode-ident@1.0.24	X									X	X		
+untrusted@0.9.0								X					
+url@2.5.8	X									X			
+utf8_iter@1.0.4	X									X			
+utf8parse@0.2.2	X									X			
+uuid@1.22.0	X									X			
+value-bag@1.12.0	X									X			
+version_check@0.9.5	X									X			
+want@0.3.1										X			
+wasi@0.11.1+wasi-snapshot-preview1	X	X								X			
+wasip2@1.0.2+wasi-0.2.9	X	X								X			
+wasip3@0.4.0+wasi-0.3.0-rc-2026-01-06	X	X								X			
+wasm-bindgen@0.2.114	X									X			
+wasm-bindgen-futures@0.4.64	X									X			
+wasm-bindgen-macro@0.2.114	X									X			
+wasm-bindgen-macro-support@0.2.114	X									X			
+wasm-bindgen-shared@0.2.114	X									X			
+wasm-streams@0.4.2	X									X			
+web-sys@0.3.91	X									X			
+webpki-roots@1.0.6							X						
+windows-core@0.62.2	X									X			
+windows-implement@0.60.2	X									X			
+windows-interface@0.59.3	X									X			
+windows-link@0.2.1	X									X			
+windows-result@0.4.1	X									X			
+windows-strings@0.5.1	X									X			
+windows-sys@0.52.0	X									X			
+windows-sys@0.61.2	X									X			
+windows-targets@0.52.6	X									X			
+windows_aarch64_gnullvm@0.52.6	X									X			
+windows_aarch64_msvc@0.52.6	X									X			
+windows_i686_gnu@0.52.6	X									X			
+windows_i686_gnullvm@0.52.6	X									X			
+windows_i686_msvc@0.52.6	X									X			
+windows_x86_64_gnu@0.52.6	X									X			
+windows_x86_64_gnullvm@0.52.6	X									X			
+windows_x86_64_msvc@0.52.6	X									X			
+wit-bindgen@0.51.0	X	X								X			
+writeable@0.6.2											X		
+wyz@0.5.1										X			
+yoke@0.8.1											X		
+yoke-derive@0.8.1											X		
+zerocopy@0.8.47	X		X							X			
+zerocopy-derive@0.8.47	X		X							X			
+zerofrom@0.1.6											X		
+zerofrom-derive@0.1.6											X		
+zeroize@1.8.2	X									X			
+zerotrie@0.2.3											X		
+zerovec@0.11.5											X		
+zerovec-derive@0.11.2											X		
+zmij@1.0.21										X			
+zstd@0.13.3										X			
+zstd-safe@7.2.4	X									X			
+zstd-sys@2.0.16+zstd.1.5.7	X									X			

From bcea56689595925fc50120d8be54886bc185691a Mon Sep 17 00:00:00 2001
From: "zhengyunhong.zyh" <zhengyunhong.zyh@alibaba-inc.com>
Date: Mon, 23 Mar 2026 20:24:19 +0800
Subject: [PATCH 212/287] Bump version to 0.2.0

---
 fluss-rust/Cargo.toml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index cd473e74d9..d4d262adaf 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -23,7 +23,7 @@ homepage = "https://clients.fluss.apache.org/"
 license = "Apache-2.0"
 repository = "https://github.com/apache/fluss-rust"
 rust-version = "1.85"
-version = "0.1.0"
+version = "0.2.0"
 keywords = ["fluss", "streaming-storage", "datalake"]
 
 [workspace]
@@ -31,7 +31,7 @@ resolver = "2"
 members = ["crates/fluss", "crates/examples", "bindings/python", "bindings/cpp"]
 
 [workspace.dependencies]
-fluss = { package = "fluss-rs", version = "0.1.0", path = "crates/fluss", features = ["storage-all"] }
+fluss = { package = "fluss-rs", version = "0.2.0", path = "crates/fluss", features = ["storage-all"] }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
 arrow = { version = "57.0.0", features = ["ipc_compression"] }

From aed85b755daa8e4660c60b929a6b0392f3df952e Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sat, 28 Mar 2026 21:20:24 +0100
Subject: [PATCH 213/287] feat: Add array data type support (#433)

* add array data type support

* add docs

* address comments

* avoid intermediate record batch in get-array

* Address comments

* address review comments

* address comments and improve doc

* address comments

* add todo

* remove todo from reference.md to code
---
 fluss-rust/bindings/cpp/src/types.rs          |   6 +
 fluss-rust/crates/fluss/src/record/arrow.rs   |  65 ++
 .../fluss/src/row/binary/binary_writer.rs     |  10 +-
 .../crates/fluss/src/row/binary_array.rs      | 848 ++++++++++++++++++
 fluss-rust/crates/fluss/src/row/column.rs     | 463 +++++++++-
 .../src/row/compacted/compacted_key_writer.rs |  11 +
 .../fluss/src/row/compacted/compacted_row.rs  | 202 ++++-
 .../src/row/compacted/compacted_row_reader.rs | 204 +++--
 .../src/row/compacted/compacted_row_writer.rs |   4 +
 fluss-rust/crates/fluss/src/row/datum.rs      | 122 ++-
 .../src/row/encode/compacted_key_encoder.rs   | 160 +++-
 .../crates/fluss/src/row/field_getter.rs      |  55 +-
 fluss-rust/crates/fluss/src/row/mod.rs        |  14 +
 .../docs/user-guide/rust/api-reference.md     |  13 +
 .../docs/user-guide/rust/data-types.md        |  24 +
 15 files changed, 2078 insertions(+), 123 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/row/binary_array.rs

diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 3c0c6f7685..f7aabe9424 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -351,6 +351,9 @@ pub fn resolve_row_types(
             Datum::Time(t) => Datum::Time(*t),
             Datum::TimestampNtz(ts) => Datum::TimestampNtz(*ts),
             Datum::TimestampLtz(ts) => Datum::TimestampLtz(*ts),
+            // TODO: C++ bindings need proper CXX wrapper types for FlussArray
+            // before C++ users can construct or inspect array values through FFI.
+            Datum::Array(a) => Datum::Array(a.clone()),
         };
         out.set_field(idx, resolved);
     }
@@ -408,6 +411,9 @@ pub fn compacted_row_to_owned(
             fcore::metadata::DataType::Binary(dt) => {
                 Datum::Blob(Cow::Owned(row.get_binary(i, dt.length())?.to_vec()))
             }
+            // TODO: C++ bindings need proper CXX wrapper types for FlussArray
+            // before C++ users can construct or inspect array values through FFI.
+            fcore::metadata::DataType::Array(_) => Datum::Array(row.get_array(i)?),
             other => return Err(anyhow!("Unsupported data type for column {i}: {other:?}")),
         };
 
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index d8ba6d95c9..7dd745baa9 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -1091,6 +1091,71 @@ pub fn to_arrow_type(fluss_type: &DataType) -> Result<ArrowDataType> {
     })
 }
 
+/// Converts an Arrow data type back to a Fluss `DataType`.
+/// Used for reading array elements from Arrow ListArray back into Fluss types.
+pub(crate) fn from_arrow_type(arrow_type: &ArrowDataType) -> Result<DataType> {
+    use crate::metadata::DataTypes;
+
+    Ok(match arrow_type {
+        ArrowDataType::Boolean => DataTypes::boolean(),
+        ArrowDataType::Int8 => DataTypes::tinyint(),
+        ArrowDataType::Int16 => DataTypes::smallint(),
+        ArrowDataType::Int32 => DataTypes::int(),
+        ArrowDataType::Int64 => DataTypes::bigint(),
+        ArrowDataType::Float32 => DataTypes::float(),
+        ArrowDataType::Float64 => DataTypes::double(),
+        ArrowDataType::Utf8 => DataTypes::string(),
+        ArrowDataType::Binary => DataTypes::bytes(),
+        ArrowDataType::Date32 => DataTypes::date(),
+        ArrowDataType::FixedSizeBinary(len) => {
+            if *len < 0 {
+                return Err(Error::IllegalArgument {
+                    message: format!("FixedSizeBinary length must be >= 0, got {len}"),
+                });
+            }
+            DataTypes::binary(*len as usize)
+        }
+        ArrowDataType::Decimal128(p, s) => {
+            if *s < 0 {
+                return Err(Error::IllegalArgument {
+                    message: format!("Decimal scale must be >= 0, got {s}"),
+                });
+            }
+            DataTypes::decimal(*p as u32, *s as u32)
+        }
+        ArrowDataType::Time32(arrow_schema::TimeUnit::Second) => DataTypes::time_with_precision(0),
+        ArrowDataType::Time32(arrow_schema::TimeUnit::Millisecond) => {
+            DataTypes::time_with_precision(3)
+        }
+        ArrowDataType::Time64(arrow_schema::TimeUnit::Microsecond) => {
+            DataTypes::time_with_precision(6)
+        }
+        ArrowDataType::Time64(arrow_schema::TimeUnit::Nanosecond) => {
+            DataTypes::time_with_precision(9)
+        }
+        ArrowDataType::Timestamp(unit, tz) => {
+            let precision = match unit {
+                arrow_schema::TimeUnit::Second => 0,
+                arrow_schema::TimeUnit::Millisecond => 3,
+                arrow_schema::TimeUnit::Microsecond => 6,
+                arrow_schema::TimeUnit::Nanosecond => 9,
+            };
+
+            if tz.is_some() {
+                DataTypes::timestamp_ltz_with_precision(precision)
+            } else {
+                DataTypes::timestamp_with_precision(precision)
+            }
+        }
+        ArrowDataType::List(field) => DataTypes::array(from_arrow_type(field.data_type())?),
+        other => {
+            return Err(Error::IllegalArgument {
+                message: format!("Cannot convert Arrow type to Fluss type: {other:?}"),
+            });
+        }
+    })
+}
+
 #[derive(Clone)]
 pub struct ReadContext {
     target_schema: SchemaRef,
diff --git a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
index af2765c445..f51a6e80f1 100644
--- a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
@@ -67,8 +67,7 @@ pub trait BinaryWriter {
 
     fn write_timestamp_ltz(&mut self, value: &crate::row::datum::TimestampLtz, precision: u32);
 
-    // TODO InternalArray, ArraySerializer
-    // fn write_array(&mut self, pos: i32, value: i64);
+    fn write_array(&mut self, value: &[u8]);
 
     // TODO Row serializer
     // fn write_row(&mut self, pos: i32, value: &InternalRow);
@@ -136,7 +135,8 @@ pub enum InnerValueWriter {
     Time(u32),         // precision (not used in wire format, but kept for consistency)
     TimestampNtz(u32), // precision
     TimestampLtz(u32), // precision
-                       // TODO Array, Row
+    Array,
+    // TODO Row
 }
 
 /// Accessor for writing the fields/elements of a binary writer during runtime, the
@@ -175,6 +175,7 @@ impl InnerValueWriter {
                 // Validation is done at TimestampLTzType construction time
                 Ok(InnerValueWriter::TimestampLtz(t.precision()))
             }
+            DataType::Array(_) => Ok(InnerValueWriter::Array),
             _ => unimplemented!(
                 "ValueWriter for DataType {:?} is currently not implemented",
                 data_type
@@ -237,6 +238,9 @@ impl InnerValueWriter {
             (InnerValueWriter::TimestampLtz(p), Datum::TimestampLtz(ts)) => {
                 writer.write_timestamp_ltz(ts, *p);
             }
+            (InnerValueWriter::Array, Datum::Array(arr)) => {
+                writer.write_array(arr.as_bytes());
+            }
             _ => {
                 return Err(IllegalArgument {
                     message: format!("{self:?} used to write value {value:?}"),
diff --git a/fluss-rust/crates/fluss/src/row/binary_array.rs b/fluss-rust/crates/fluss/src/row/binary_array.rs
new file mode 100644
index 0000000000..9008bc5467
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/binary_array.rs
@@ -0,0 +1,848 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Binary array format matching Java's `BinaryArray.java` layout.
+//!
+//! Binary layout:
+//! ```text
+//! [size(4B)] + [null bits (4-byte word aligned)] + [fixed-length part] + [variable-length part]
+//! ```
+//!
+//! Java reference: `BinaryArray.java`, `BinaryArrayWriter.java`
+
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::DataType;
+use crate::row::Decimal;
+use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
+use bytes::Bytes;
+use serde::Serialize;
+use std::fmt;
+use std::hash::{Hash, Hasher};
+
+const MAX_FIX_PART_DATA_SIZE: usize = 7;
+const HIGHEST_FIRST_BIT: u64 = 0x80_u64 << 56;
+const HIGHEST_SECOND_TO_EIGHTH_BIT: u64 = 0x7F_u64 << 56;
+
+/// Size of the array header in bytes: a 4-byte element count followed by the null bitmap,
+/// padded to whole 4-byte words. Mirrors Java's `BinaryArray.calculateHeaderInBytes`.
+pub fn calculate_header_in_bytes(num_elements: usize) -> usize {
+    std::mem::size_of::<i32>() + num_elements.div_ceil(32) * std::mem::size_of::<u32>()
+}
+
+/// Calculates the fixed-length part size per element for a given data type.
+/// Matches Java's `BinaryArray.calculateFixLengthPartSize(DataType)`.
+pub fn calculate_fix_length_part_size(element_type: &DataType) -> usize {
+    match element_type {
+        DataType::Boolean(_) | DataType::TinyInt(_) => 1,
+        DataType::SmallInt(_) => 2,
+        DataType::Int(_) | DataType::Float(_) | DataType::Date(_) | DataType::Time(_) => 4,
+        DataType::BigInt(_)
+        | DataType::Double(_)
+        | DataType::Char(_)
+        | DataType::String(_)
+        | DataType::Binary(_)
+        | DataType::Bytes(_)
+        | DataType::Decimal(_)
+        | DataType::Timestamp(_)
+        | DataType::TimestampLTz(_)
+        | DataType::Array(_)
+        | DataType::Map(_)
+        | DataType::Row(_) => 8,
+    }
+}
+
+/// Pads `num_bytes` up to the next multiple of 8; already-aligned values are unchanged.
+/// Mirrors Java's `roundNumberOfBytesToNearestWord`.
+fn round_to_nearest_word(num_bytes: usize) -> usize {
+    num_bytes.div_ceil(8) * 8
+}
+
+/// A Fluss binary array, wire-compatible with Java's `BinaryArray`.
+///
+/// Stores elements in a flat byte buffer with a header (element count + null bitmap)
+/// followed by fixed-length slots and an optional variable-length section.
+///
+/// Uses `Bytes` internally so cloning is O(1) reference-counted.
+// TODO: FlussArray currently exposes only fallible getters. Infallible
+// fast-path variants may be added later as non-breaking extensions.
+#[derive(Clone)]
+pub struct FlussArray {
+    data: Bytes,
+    size: usize,
+    element_offset: usize,
+}
+
+impl fmt::Debug for FlussArray {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        f.debug_struct("FlussArray")
+            .field("size", &self.size)
+            .field("data_len", &self.data.len())
+            .finish()
+    }
+}
+
+impl fmt::Display for FlussArray {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        write!(f, "FlussArray[size={}]", self.size)
+    }
+}
+
+impl PartialEq for FlussArray {
+    fn eq(&self, other: &Self) -> bool {
+        self.data == other.data
+    }
+}
+
+impl Eq for FlussArray {}
+
+impl PartialOrd for FlussArray {
+    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
+        Some(self.cmp(other))
+    }
+}
+
+impl Ord for FlussArray {
+    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
+        self.data.cmp(&other.data)
+    }
+}
+
+impl Hash for FlussArray {
+    fn hash<H: Hasher>(&self, state: &mut H) {
+        self.data.hash(state);
+    }
+}
+
+impl Serialize for FlussArray {
+    fn serialize<S>(&self, serializer: S) -> std::result::Result<S::Ok, S::Error>
+    where
+        S: serde::Serializer,
+    {
+        serializer.serialize_bytes(&self.data)
+    }
+}
+
+impl FlussArray {
+    /// Validates the raw bytes and computes derived fields (size, element_offset).
+    fn validate(data: &[u8]) -> Result<(usize, usize)> {
+        if data.len() < 4 {
+            return Err(IllegalArgument {
+                message: format!(
+                    "FlussArray data too short: need at least 4 bytes, got {}",
+                    data.len()
+                ),
+            });
+        }
+        let raw_size = i32::from_le_bytes(data[0..4].try_into().unwrap());
+        if raw_size < 0 {
+            return Err(IllegalArgument {
+                message: format!("FlussArray size must be non-negative, got {raw_size}"),
+            });
+        }
+        let size = raw_size as usize;
+        let element_offset = calculate_header_in_bytes(size);
+        if element_offset > data.len() {
+            return Err(IllegalArgument {
+                message: format!(
+                    "FlussArray header exceeds payload: header={}, payload={}",
+                    element_offset,
+                    data.len()
+                ),
+            });
+        }
+        Ok((size, element_offset))
+    }
+
+    /// Creates a FlussArray from a byte slice (copies data).
+    pub fn from_bytes(data: &[u8]) -> Result<Self> {
+        let (size, element_offset) = Self::validate(data)?;
+        Ok(FlussArray {
+            data: Bytes::copy_from_slice(data),
+            size,
+            element_offset,
+        })
+    }
+
+    /// Creates a FlussArray from an owned `Vec<u8>` without copying.
+    pub fn from_vec(data: Vec<u8>) -> Result<Self> {
+        let (size, element_offset) = Self::validate(&data)?;
+        Ok(FlussArray {
+            data: Bytes::from(data),
+            size,
+            element_offset,
+        })
+    }
+
+    /// Creates a FlussArray from owned bytes without copying.
+    fn from_owned_bytes(data: Bytes) -> Result<Self> {
+        let (size, element_offset) = Self::validate(&data)?;
+        Ok(FlussArray {
+            data,
+            size,
+            element_offset,
+        })
+    }
+
+    /// Returns the number of elements.
+    pub fn size(&self) -> usize {
+        self.size
+    }
+
+    /// Returns the raw bytes of this array (the complete binary representation).
+    pub fn as_bytes(&self) -> &[u8] {
+        &self.data
+    }
+
+    /// Reports whether the null bit for element `pos` is set in the header bitmap.
+    /// Panics if the bitmap byte for `pos` lies beyond the end of the buffer.
+    pub fn is_null_at(&self, pos: usize) -> bool {
+        let mask = 1u8 << (pos % 8);
+        (self.data[4 + pos / 8] & mask) != 0
+    }
+
+    fn checked_slice(&self, start: usize, len: usize, context: &str) -> Result<&[u8]> {
+        let end = start.checked_add(len).ok_or_else(|| IllegalArgument {
+            message: format!("Overflow while reading {context}: start={start}, len={len}"),
+        })?;
+        if end > self.data.len() {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Out-of-bounds while reading {context}: start={start}, len={len}, payload={}",
+                    self.data.len()
+                ),
+            });
+        }
+        Ok(&self.data[start..end])
+    }
+
+    fn checked_element_offset(
+        &self,
+        pos: usize,
+        element_size: usize,
+        context: &str,
+    ) -> Result<usize> {
+        if pos >= self.size {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Array element index out of bounds while reading {context}: pos={pos}, size={}",
+                    self.size
+                ),
+            });
+        }
+        let rel = pos.checked_mul(element_size).ok_or_else(|| IllegalArgument {
+            message: format!(
+                "Overflow while calculating array element offset for {context}: pos={pos}, element_size={element_size}"
+            ),
+        })?;
+        self.element_offset
+            .checked_add(rel)
+            .ok_or_else(|| IllegalArgument {
+                message: format!(
+                    "Overflow while adding base offset for {context}: base={}, rel={rel}",
+                    self.element_offset
+                ),
+            })
+    }
+
+    fn read_fixed_bytes(&self, pos: usize, len: usize, context: &str) -> Result<&[u8]> {
+        let offset = self.checked_element_offset(pos, len, context)?;
+        self.checked_slice(offset, len, context)
+    }
+
+    fn read_i16(&self, pos: usize, context: &str) -> Result<i16> {
+        let bytes = self.read_fixed_bytes(pos, 2, context)?;
+        Ok(i16::from_le_bytes([bytes[0], bytes[1]]))
+    }
+
+    fn read_i32(&self, pos: usize, context: &str) -> Result<i32> {
+        let bytes = self.read_fixed_bytes(pos, 4, context)?;
+        Ok(i32::from_le_bytes([bytes[0], bytes[1], bytes[2], bytes[3]]))
+    }
+
+    /// Reads the little-endian `i64` held in the 8-byte slot of element `pos`.
+    fn read_i64(&self, pos: usize, context: &str) -> Result<i64> {
+        let offset = self.checked_element_offset(pos, 8, context)?;
+        let raw: [u8; 8] = self.checked_slice(offset, 8, context)?.try_into().unwrap();
+        Ok(i64::from_le_bytes(raw))
+    }
+
+    fn read_i64_at_offset(&self, offset: usize, context: &str) -> Result<i64> {
+        let bytes = self.checked_slice(offset, 8, context)?;
+        let mut buf = [0_u8; 8];
+        buf.copy_from_slice(bytes);
+        Ok(i64::from_le_bytes(buf))
+    }
+
+    /// Resolves the variable-length element at `pos` to a `(start, len)` span in `self.data`.
+    ///
+    /// The 8-byte slot is decoded as a little-endian `u64`. Top bit clear: upper 32 bits are
+    /// the payload offset, lower 32 bits its length. Top bit set: bits 56..=62 are the length
+    /// (at most `MAX_FIX_PART_DATA_SIZE`) and the payload is stored inline in the slot.
+    fn read_var_len_span(&self, pos: usize) -> Result<(usize, usize)> {
+        const CONTEXT: &str = "variable-length array element";
+        let field_offset = self.checked_element_offset(pos, 8, CONTEXT)?;
+        let packed = self.read_i64_at_offset(field_offset, CONTEXT)? as u64;
+
+        if (packed & HIGHEST_FIRST_BIT) == 0 {
+            let offset = (packed >> 32) as usize;
+            let len = (packed & 0xFFFF_FFFF) as usize;
+            self.checked_slice(offset, len, CONTEXT)?;
+            return Ok((offset, len));
+        }
+        let len = ((packed & HIGHEST_SECOND_TO_EIGHTH_BIT) >> 56) as usize;
+        if len > MAX_FIX_PART_DATA_SIZE {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Inline array element length must be <= {MAX_FIX_PART_DATA_SIZE}, got {len}"
+                ),
+            });
+        }
+        // The slot was decoded with `from_le_bytes`, so the marker is always the slot's last
+        // byte and the inline payload always begins at the slot's first byte, whatever the
+        // host byte order. Adding 1 on big-endian hosts would skip payload byte 0.
+        self.checked_slice(field_offset, len, "inline array element")?;
+        Ok((field_offset, len))
+    }
+
+    fn read_var_len_bytes(&self, pos: usize) -> Result<&[u8]> {
+        let (start, len) = self.read_var_len_span(pos)?;
+        Ok(&self.data[start..start + len])
+    }
+
+    pub fn get_boolean(&self, pos: usize) -> Result<bool> {
+        let bytes = self.read_fixed_bytes(pos, 1, "boolean array element")?;
+        Ok(bytes[0] != 0)
+    }
+
+    pub fn get_byte(&self, pos: usize) -> Result<i8> {
+        let bytes = self.read_fixed_bytes(pos, 1, "byte array element")?;
+        Ok(bytes[0] as i8)
+    }
+
+    pub fn get_short(&self, pos: usize) -> Result<i16> {
+        self.read_i16(pos, "short array element")
+    }
+
+    pub fn get_int(&self, pos: usize) -> Result<i32> {
+        self.read_i32(pos, "int array element")
+    }
+
+    pub fn get_long(&self, pos: usize) -> Result<i64> {
+        self.read_i64(pos, "long array element")
+    }
+
+    pub fn get_float(&self, pos: usize) -> Result<f32> {
+        let bits = self.read_i32(pos, "float array element")? as u32;
+        Ok(f32::from_bits(bits))
+    }
+
+    pub fn get_double(&self, pos: usize) -> Result<f64> {
+        let bits = self.read_i64(pos, "double array element")? as u64;
+        Ok(f64::from_bits(bits))
+    }
+
+    /// Reads the offset_and_size packed long for variable-length elements.
+    fn get_offset_and_size(&self, pos: usize) -> Result<(usize, usize)> {
+        let packed = self.get_long(pos)? as u64;
+        let offset = (packed >> 32) as usize;
+        let size = (packed & 0xFFFF_FFFF) as usize;
+        Ok((offset, size))
+    }
+
+    pub fn get_string(&self, pos: usize) -> Result<&str> {
+        let bytes = self.read_var_len_bytes(pos)?;
+        std::str::from_utf8(bytes).map_err(|e| IllegalArgument {
+            message: format!("Invalid UTF-8 in array element at position {pos}: {e}"),
+        })
+    }
+
+    pub fn get_binary(&self, pos: usize) -> Result<&[u8]> {
+        self.read_var_len_bytes(pos)
+    }
+
+    pub fn get_decimal(&self, pos: usize, precision: u32, scale: u32) -> Result<Decimal> {
+        if Decimal::is_compact_precision(precision) {
+            let unscaled = self.get_long(pos)?;
+            Decimal::from_unscaled_long(unscaled, precision, scale)
+        } else {
+            let (offset, size) = self.get_offset_and_size(pos)?;
+            let bytes = self.checked_slice(offset, size, "decimal bytes")?;
+            Decimal::from_unscaled_bytes(bytes, precision, scale)
+        }
+    }
+
+    pub fn get_date(&self, pos: usize) -> Result<Date> {
+        Ok(Date::new(self.get_int(pos)?))
+    }
+
+    pub fn get_time(&self, pos: usize) -> Result<Time> {
+        Ok(Time::new(self.get_int(pos)?))
+    }
+
+    pub fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> Result<TimestampNtz> {
+        if TimestampNtz::is_compact(precision) {
+            Ok(TimestampNtz::new(self.get_long(pos)?))
+        } else {
+            let (offset, nanos_of_millis) = self.get_offset_and_size(pos)?;
+            let millis = self.read_i64_at_offset(offset, "timestamp ntz millis")?;
+            TimestampNtz::from_millis_nanos(millis, nanos_of_millis as i32)
+        }
+    }
+
+    pub fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> Result<TimestampLtz> {
+        if TimestampLtz::is_compact(precision) {
+            Ok(TimestampLtz::new(self.get_long(pos)?))
+        } else {
+            let (offset, nanos_of_millis) = self.get_offset_and_size(pos)?;
+            let millis = self.read_i64_at_offset(offset, "timestamp ltz millis")?;
+            TimestampLtz::from_millis_nanos(millis, nanos_of_millis as i32)
+        }
+    }
+
+    pub fn get_array(&self, pos: usize) -> Result<FlussArray> {
+        let (start, len) = self.read_var_len_span(pos)?;
+        FlussArray::from_owned_bytes(self.data.slice(start..start + len))
+    }
+}
+
+/// Writer for building a `FlussArray` element by element.
+/// Matches Java's `BinaryArrayWriter`.
+pub struct FlussArrayWriter {
+    data: Vec<u8>,
+    null_bits_offset: usize,
+    element_offset: usize,
+    element_size: usize,
+    cursor: usize,
+    num_elements: usize,
+}
+
+impl FlussArrayWriter {
+    /// Creates a new writer for an array with `num_elements` elements of the given element type.
+    pub fn new(num_elements: usize, element_type: &DataType) -> Self {
+        let element_size = calculate_fix_length_part_size(element_type);
+        Self::with_element_size(num_elements, element_size)
+    }
+
+    /// Creates a new writer with an explicit element size (in bytes).
+    pub fn with_element_size(num_elements: usize, element_size: usize) -> Self {
+        let header_in_bytes = calculate_header_in_bytes(num_elements);
+        let fixed_size = round_to_nearest_word(header_in_bytes + element_size * num_elements);
+        let mut data = vec![0u8; fixed_size];
+
+        // Java's MemorySegment.putInt() stores little-endian.
+        data[0..4].copy_from_slice(&(num_elements as i32).to_le_bytes());
+
+        FlussArrayWriter {
+            data,
+            null_bits_offset: 4,
+            element_offset: header_in_bytes,
+            element_size,
+            cursor: fixed_size,
+            num_elements,
+        }
+    }
+
+    fn get_element_offset(&self, pos: usize) -> usize {
+        self.element_offset + self.element_size * pos
+    }
+
+    /// Sets the null bit for the element at position `pos`.
+    pub fn set_null_at(&mut self, pos: usize) {
+        let byte_index = pos >> 3;
+        let bit = pos & 7;
+        self.data[self.null_bits_offset + byte_index] |= 1u8 << bit;
+    }
+
+    pub fn write_boolean(&mut self, pos: usize, value: bool) {
+        let offset = self.get_element_offset(pos);
+        self.data[offset] = if value { 1 } else { 0 };
+    }
+
+    pub fn write_byte(&mut self, pos: usize, value: i8) {
+        let offset = self.get_element_offset(pos);
+        self.data[offset] = value as u8;
+    }
+
+    pub fn write_short(&mut self, pos: usize, value: i16) {
+        let offset = self.get_element_offset(pos);
+        self.data[offset..offset + 2].copy_from_slice(&value.to_le_bytes());
+    }
+
+    pub fn write_int(&mut self, pos: usize, value: i32) {
+        let offset = self.get_element_offset(pos);
+        self.data[offset..offset + 4].copy_from_slice(&value.to_le_bytes());
+    }
+
+    pub fn write_long(&mut self, pos: usize, value: i64) {
+        let offset = self.get_element_offset(pos);
+        self.data[offset..offset + 8].copy_from_slice(&value.to_le_bytes());
+    }
+
+    pub fn write_float(&mut self, pos: usize, value: f32) {
+        let offset = self.get_element_offset(pos);
+        self.data[offset..offset + 4].copy_from_slice(&value.to_le_bytes());
+    }
+
+    pub fn write_double(&mut self, pos: usize, value: f64) {
+        let offset = self.get_element_offset(pos);
+        self.data[offset..offset + 8].copy_from_slice(&value.to_le_bytes());
+    }
+
+    /// Appends `bytes`, zero-padded to 8 bytes, to the variable part; stores offset+length in slot `pos`.
+    fn write_bytes_to_var_len_part(&mut self, pos: usize, bytes: &[u8]) {
+        let start = self.cursor;
+        let padded_len = round_to_nearest_word(bytes.len());
+        self.data.resize(self.data.len() + padded_len, 0);
+        self.data[start..start + bytes.len()].copy_from_slice(bytes);
+        self.cursor = start + padded_len;
+        self.set_offset_and_size(pos, start, bytes.len());
+    }
+
+    fn set_offset_and_size(&mut self, pos: usize, offset: usize, size: usize) {
+        let packed = ((offset as i64) << 32) | (size as i64);
+        self.write_long(pos, packed);
+    }
+
+    /// Stores up to `MAX_FIX_PART_DATA_SIZE` bytes inline in the element's 8-byte slot.
+    ///
+    /// The packed long carries `0x80 | len` in its top byte and payload byte `i` in bits
+    /// `8*i..8*i+8`. `write_long` serializes it with `to_le_bytes`, so payload byte `i` lands
+    /// at slot byte `i` on every host; a separate big-endian packing would reverse the payload.
+    fn write_bytes_to_fix_len_part(&mut self, pos: usize, bytes: &[u8]) {
+        let len = bytes.len();
+        debug_assert!(len <= MAX_FIX_PART_DATA_SIZE);
+        // Marker byte: high bit flags "inline", low 7 bits hold the length.
+        let marker = ((len as u64) | 0x80) << 56;
+        // Little-endian packing: first payload byte in the least significant byte.
+        let payload = bytes
+            .iter()
+            .enumerate()
+            .fold(0_u64, |acc, (i, b)| acc | (u64::from(*b) << (i * 8)));
+        self.write_long(pos, (marker | payload) as i64);
+    }
+
+    pub fn write_string(&mut self, pos: usize, value: &str) {
+        let bytes = value.as_bytes();
+        if bytes.len() <= MAX_FIX_PART_DATA_SIZE {
+            self.write_bytes_to_fix_len_part(pos, bytes);
+        } else {
+            self.write_bytes_to_var_len_part(pos, bytes);
+        }
+    }
+
+    pub fn write_binary_bytes(&mut self, pos: usize, value: &[u8]) {
+        if value.len() <= MAX_FIX_PART_DATA_SIZE {
+            self.write_bytes_to_fix_len_part(pos, value);
+        } else {
+            self.write_bytes_to_var_len_part(pos, value);
+        }
+    }
+
+    pub fn write_decimal(&mut self, pos: usize, value: &Decimal, precision: u32) {
+        if Decimal::is_compact_precision(precision) {
+            self.write_long(
+                pos,
+                value
+                    .to_unscaled_long()
+                    .expect("Decimal should fit in i64 for compact precision"),
+            );
+        } else {
+            let bytes = value.to_unscaled_bytes();
+            self.write_bytes_to_var_len_part(pos, &bytes);
+        }
+    }
+
+    pub fn write_date(&mut self, pos: usize, value: Date) {
+        self.write_int(pos, value.get_inner());
+    }
+
+    pub fn write_time(&mut self, pos: usize, value: Time) {
+        self.write_int(pos, value.get_inner());
+    }
+
+    pub fn write_timestamp_ntz(&mut self, pos: usize, value: &TimestampNtz, precision: u32) {
+        if TimestampNtz::is_compact(precision) {
+            self.write_long(pos, value.get_millisecond());
+        } else {
+            let millis_bytes = value.get_millisecond().to_le_bytes();
+            let var_offset = self.cursor;
+            let rounded = round_to_nearest_word(8);
+            self.data.resize(self.data.len() + rounded, 0);
+            self.data[var_offset..var_offset + 8].copy_from_slice(&millis_bytes);
+            self.set_offset_and_size(pos, var_offset, value.get_nano_of_millisecond() as usize);
+            self.cursor += rounded;
+        }
+    }
+
+    pub fn write_timestamp_ltz(&mut self, pos: usize, value: &TimestampLtz, precision: u32) {
+        if TimestampLtz::is_compact(precision) {
+            self.write_long(pos, value.get_epoch_millisecond());
+        } else {
+            let millis_bytes = value.get_epoch_millisecond().to_le_bytes();
+            let var_offset = self.cursor;
+            let rounded = round_to_nearest_word(8);
+            self.data.resize(self.data.len() + rounded, 0);
+            self.data[var_offset..var_offset + 8].copy_from_slice(&millis_bytes);
+            self.set_offset_and_size(pos, var_offset, value.get_nano_of_millisecond() as usize);
+            self.cursor += rounded;
+        }
+    }
+
+    /// Writes a nested FlussArray into this array at position `pos`.
+    pub fn write_array(&mut self, pos: usize, value: &FlussArray) {
+        self.write_bytes_to_var_len_part(pos, value.as_bytes());
+    }
+
+    /// Finalizes the writer and returns the completed FlussArray.
+    pub fn complete(self) -> Result<FlussArray> {
+        let mut data = self.data;
+        data.truncate(self.cursor);
+        FlussArray::from_vec(data)
+    }
+
+    /// Returns the number of elements this writer was initialized with.
+    pub fn num_elements(&self) -> usize {
+        self.num_elements
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::DataTypes;
+
+    #[test]
+    fn test_header_calculation() {
+        assert_eq!(calculate_header_in_bytes(0), 4);
+        assert_eq!(calculate_header_in_bytes(1), 8);
+        assert_eq!(calculate_header_in_bytes(31), 8);
+        assert_eq!(calculate_header_in_bytes(32), 8);
+        assert_eq!(calculate_header_in_bytes(33), 12);
+        assert_eq!(calculate_header_in_bytes(64), 12);
+        assert_eq!(calculate_header_in_bytes(65), 16);
+    }
+
+    #[test]
+    fn test_fix_length_part_size() {
+        assert_eq!(calculate_fix_length_part_size(&DataTypes::boolean()), 1);
+        assert_eq!(calculate_fix_length_part_size(&DataTypes::tinyint()), 1);
+        assert_eq!(calculate_fix_length_part_size(&DataTypes::smallint()), 2);
+        assert_eq!(calculate_fix_length_part_size(&DataTypes::int()), 4);
+        assert_eq!(calculate_fix_length_part_size(&DataTypes::bigint()), 8);
+        assert_eq!(calculate_fix_length_part_size(&DataTypes::float()), 4);
+        assert_eq!(calculate_fix_length_part_size(&DataTypes::double()), 8);
+        assert_eq!(calculate_fix_length_part_size(&DataTypes::string()), 8);
+        assert_eq!(
+            calculate_fix_length_part_size(&DataTypes::array(DataTypes::int())),
+            8
+        );
+    }
+
+    #[test]
+    fn test_round_trip_int_array() {
+        let elem_type = DataTypes::int();
+        let mut writer = FlussArrayWriter::new(3, &elem_type);
+        writer.write_int(0, 10);
+        writer.write_int(1, 20);
+        writer.write_int(2, 30);
+        let array = writer.complete().unwrap();
+
+        assert_eq!(array.size(), 3);
+        assert!(!array.is_null_at(0));
+        assert_eq!(array.get_int(0).unwrap(), 10);
+        assert_eq!(array.get_int(1).unwrap(), 20);
+        assert_eq!(array.get_int(2).unwrap(), 30);
+    }
+
+    #[test]
+    fn test_round_trip_with_nulls() {
+        let elem_type = DataTypes::int();
+        let mut writer = FlussArrayWriter::new(3, &elem_type);
+        writer.write_int(0, 1);
+        writer.set_null_at(1);
+        writer.write_int(2, 3);
+        let array = writer.complete().unwrap();
+
+        assert_eq!(array.size(), 3);
+        assert!(!array.is_null_at(0));
+        assert!(array.is_null_at(1));
+        assert!(!array.is_null_at(2));
+        assert_eq!(array.get_int(0).unwrap(), 1);
+        assert_eq!(array.get_int(2).unwrap(), 3);
+    }
+
+    #[test]
+    fn test_round_trip_string_array() {
+        let elem_type = DataTypes::string();
+        let mut writer = FlussArrayWriter::new(3, &elem_type);
+        writer.write_string(0, "hello");
+        writer.write_string(1, "world");
+        writer.write_string(2, "!");
+        let array = writer.complete().unwrap();
+
+        assert_eq!(array.size(), 3);
+        assert_eq!(array.get_string(0).unwrap(), "hello");
+        assert_eq!(array.get_string(1).unwrap(), "world");
+        assert_eq!(array.get_string(2).unwrap(), "!");
+    }
+
+    #[test]
+    fn test_java_inline_short_string_decoding() {
+        // Manually construct Java-style inline encoded short string ("abc")
+        // slot payload: [len|0x80 in top byte] + [bytes in low 7 bytes on little-endian]
+        let mut data = vec![0_u8; 16];
+        data[0..4].copy_from_slice(&(1_i32).to_le_bytes());
+        // null bits remain 0
+        let first_byte = (3_u64 | 0x80) << 56;
+        let seven_bytes = (b'a' as u64) | ((b'b' as u64) << 8) | ((b'c' as u64) << 16);
+        let packed = first_byte | seven_bytes;
+        data[8..16].copy_from_slice(&packed.to_le_bytes());
+
+        let arr = FlussArray::from_bytes(&data).unwrap();
+        assert_eq!(arr.size(), 1);
+        assert_eq!(arr.get_string(0).unwrap(), "abc");
+    }
+
+    #[test]
+    fn test_java_inline_short_binary_decoding() {
+        let elem_type = DataTypes::bytes();
+        let mut writer = FlussArrayWriter::new(1, &elem_type);
+        writer.write_binary_bytes(0, b"abc");
+        let arr = writer.complete().unwrap();
+        assert_eq!(arr.get_binary(0).unwrap(), b"abc");
+    }
+
+    #[test]
+    fn test_round_trip_empty_array() {
+        let elem_type = DataTypes::int();
+        let writer = FlussArrayWriter::new(0, &elem_type);
+        let array = writer.complete().unwrap();
+        assert_eq!(array.size(), 0);
+    }
+
+    #[test]
+    fn test_round_trip_boolean_array() {
+        let elem_type = DataTypes::boolean();
+        let mut writer = FlussArrayWriter::new(3, &elem_type);
+        writer.write_boolean(0, true);
+        writer.write_boolean(1, false);
+        writer.write_boolean(2, true);
+        let array = writer.complete().unwrap();
+
+        assert_eq!(array.size(), 3);
+        assert!(array.get_boolean(0).unwrap());
+        assert!(!array.get_boolean(1).unwrap());
+        assert!(array.get_boolean(2).unwrap());
+    }
+
+    #[test]
+    fn test_round_trip_long_array() {
+        let elem_type = DataTypes::bigint();
+        let mut writer = FlussArrayWriter::new(2, &elem_type);
+        writer.write_long(0, i64::MAX);
+        writer.write_long(1, i64::MIN);
+        let array = writer.complete().unwrap();
+
+        assert_eq!(array.get_long(0).unwrap(), i64::MAX);
+        assert_eq!(array.get_long(1).unwrap(), i64::MIN);
+    }
+
+    #[test]
+    fn test_round_trip_double_array() {
+        let elem_type = DataTypes::double();
+        let mut writer = FlussArrayWriter::new(2, &elem_type);
+        writer.write_double(0, 1.23);
+        writer.write_double(1, -4.56);
+        let array = writer.complete().unwrap();
+
+        assert_eq!(array.get_double(0).unwrap(), 1.23);
+        assert_eq!(array.get_double(1).unwrap(), -4.56);
+    }
+
+    #[test]
+    fn test_round_trip_nested_array() {
+        let inner_type = DataTypes::int();
+        let outer_type = DataTypes::array(DataTypes::int());
+
+        // Build inner array [1, 2]
+        let mut inner_writer = FlussArrayWriter::new(2, &inner_type);
+        inner_writer.write_int(0, 1);
+        inner_writer.write_int(1, 2);
+        let inner_array = inner_writer.complete().unwrap();
+
+        // Build outer array containing the inner array
+        let mut outer_writer = FlussArrayWriter::new(1, &outer_type);
+        outer_writer.write_array(0, &inner_array);
+        let outer_array = outer_writer.complete().unwrap();
+
+        assert_eq!(outer_array.size(), 1);
+        let nested = outer_array.get_array(0).unwrap();
+        assert_eq!(nested.size(), 2);
+        assert_eq!(nested.get_int(0).unwrap(), 1);
+        assert_eq!(nested.get_int(1).unwrap(), 2);
+    }
+
+    #[test]
+    fn test_primitive_getter_out_of_bounds_returns_error() {
+        let elem_type = DataTypes::int();
+        let mut writer = FlussArrayWriter::new(1, &elem_type);
+        writer.write_int(0, 10);
+        let array = writer.complete().unwrap();
+
+        let err = array.get_int(1).unwrap_err();
+        assert!(
+            err.to_string().contains("out of bounds"),
+            "unexpected error: {err}"
+        );
+    }
+
+    #[test]
+    fn test_primitive_getter_on_malformed_payload_returns_error() {
+        // Size says 1, but payload only contains header (no element bytes).
+        let mut data = vec![0_u8; 8];
+        data[0..4].copy_from_slice(&(1_i32).to_le_bytes());
+        let arr = FlussArray::from_bytes(&data).unwrap();
+
+        let err = arr.get_int(0).unwrap_err();
+        assert!(
+            err.to_string().contains("Out-of-bounds"),
+            "unexpected error: {err}"
+        );
+    }
+
+    #[test]
+    fn test_binary_layout_matches_java() {
+        // Verify exact byte layout for a simple [1, 2, 3] int array
+        let elem_type = DataTypes::int();
+        let mut writer = FlussArrayWriter::new(3, &elem_type);
+        writer.write_int(0, 1);
+        writer.write_int(1, 2);
+        writer.write_int(2, 3);
+        let array = writer.complete().unwrap();
+        let bytes = array.as_bytes();
+
+        // size = 3 at offset 0 (4 bytes, little-endian per Java MemorySegment.putInt)
+        assert_eq!(i32::from_le_bytes(bytes[0..4].try_into().unwrap()), 3);
+        // null bits: 4 bytes starting at offset 4, should be all zeros
+        assert_eq!(&bytes[4..8], &[0, 0, 0, 0]);
+        // elements start at offset 8 (header = 4 + 4), each 4 bytes (little-endian)
+        assert_eq!(i32::from_le_bytes(bytes[8..12].try_into().unwrap()), 1);
+        assert_eq!(i32::from_le_bytes(bytes[12..16].try_into().unwrap()), 2);
+        assert_eq!(i32::from_le_bytes(bytes[16..20].try_into().unwrap()), 3);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index c07fe97c5c..4a3e708bb6 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -19,7 +19,10 @@ use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::row::InternalRow;
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
-use arrow::array::{Array, AsArray, BinaryArray, RecordBatch, StringArray};
+use arrow::array::{
+    Array, AsArray, BinaryArray, BooleanArray, FixedSizeBinaryArray, ListArray, RecordBatch,
+    StringArray,
+};
 use arrow::datatypes::{
     DataType as ArrowDataType, Date32Type, Decimal128Type, Float32Type, Float64Type, Int8Type,
     Int16Type, Int32Type, Int64Type, Time32MillisecondType, Time32SecondType,
@@ -407,17 +410,379 @@ impl InternalRow for ColumnarRow {
             })?
             .value(self.row_id))
     }
+
+    /// Materializes the Arrow list at column `pos` of the current row as a `FlussArray`.
+    /// Returns `IllegalArgument` if the column is not a `ListArray`; type-mapping and
+    /// element-conversion errors are propagated unchanged.
+    fn get_array(&self, pos: usize) -> Result<crate::row::FlussArray> {
+        use crate::record::from_arrow_type;
+        use crate::row::binary_array::FlussArrayWriter;
+
+        let column = self.column(pos)?;
+        let not_a_list = || IllegalArgument {
+            message: format!("expected List array at position {pos}"),
+        };
+        let lists = column.as_any().downcast_ref::<ListArray>();
+        // Child values that belong to this row only.
+        let elements = lists.ok_or_else(not_a_list)?.value(self.row_id);
+        let elem_type = from_arrow_type(elements.data_type())?;
+
+        let mut out = FlussArrayWriter::new(elements.len(), &elem_type);
+        write_arrow_values_to_fluss_array(&*elements, &elem_type, &mut out)?;
+        out.complete()
+    }
+}
+
+/// Copies a primitive Arrow array into the writer slot by slot, preserving nulls.
+macro_rules! write_primitive_elements {
+    ($values:expr, $arrow_type:ty, $element_type:expr, $writer:expr, $write_method:ident) => {{
+        let typed = $values
+            .as_primitive_opt::<$arrow_type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!(
+                    "Expected {} for {:?} element",
+                    stringify!($arrow_type),
+                    $element_type
+                ),
+            })?;
+        for idx in 0..typed.len() {
+            if typed.is_null(idx) {
+                $writer.set_null_at(idx);
+                continue;
+            }
+            $writer.$write_method(idx, typed.value(idx));
+        }
+    }};
+}
+
+/// Copies an Arrow array reached through `downcast_ref` into the writer, preserving nulls.
+macro_rules! write_downcast_elements {
+    ($values:expr, $array_type:ty, $element_type:expr, $writer:expr, $write_method:ident) => {{
+        let typed = $values
+            .as_any()
+            .downcast_ref::<$array_type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!(
+                    "Expected {} for {:?} element",
+                    stringify!($array_type),
+                    $element_type
+                ),
+            })?;
+        for idx in 0..typed.len() {
+            if typed.is_null(idx) {
+                $writer.set_null_at(idx);
+                continue;
+            }
+            $writer.$write_method(idx, typed.value(idx));
+        }
+    }};
+}
+
+/// Writes each element of `values` into `writer` at its own index (nulls via `set_null_at`),
+/// downcasting once per call; downcast failures and unsupported types return `IllegalArgument`.
+fn write_arrow_values_to_fluss_array(
+    values: &dyn Array,
+    element_type: &crate::metadata::DataType,
+    writer: &mut crate::row::binary_array::FlussArrayWriter,
+) -> Result<()> {
+    use crate::metadata::DataType;
+    use crate::record::from_arrow_type;
+    use crate::row::binary_array::FlussArrayWriter;
+    // Shared by the hand-written arms below; the macro arms loop over `arr.len()` instead.
+    let len = values.len();
+
+    match element_type {
+        DataType::Boolean(_) => {
+            write_downcast_elements!(values, BooleanArray, element_type, writer, write_boolean)
+        }
+        DataType::TinyInt(_) => {
+            write_primitive_elements!(values, Int8Type, element_type, writer, write_byte)
+        }
+        DataType::SmallInt(_) => {
+            write_primitive_elements!(values, Int16Type, element_type, writer, write_short)
+        }
+        DataType::Int(_) => {
+            write_primitive_elements!(values, Int32Type, element_type, writer, write_int)
+        }
+        DataType::BigInt(_) => {
+            write_primitive_elements!(values, Int64Type, element_type, writer, write_long)
+        }
+        DataType::Float(_) => {
+            write_primitive_elements!(values, Float32Type, element_type, writer, write_float)
+        }
+        DataType::Double(_) => {
+            write_primitive_elements!(values, Float64Type, element_type, writer, write_double)
+        }
+        DataType::Char(_) | DataType::String(_) => {
+            write_downcast_elements!(values, StringArray, element_type, writer, write_string)
+        }
+        DataType::Binary(_) => {
+            write_downcast_elements!(
+                values,
+                FixedSizeBinaryArray,
+                element_type,
+                writer,
+                write_binary_bytes
+            )
+        }
+        DataType::Bytes(_) => {
+            write_downcast_elements!(
+                values,
+                BinaryArray,
+                element_type,
+                writer,
+                write_binary_bytes
+            )
+        }
+        DataType::Decimal(dt) => {
+            let arr =
+                values
+                    .as_primitive_opt::<Decimal128Type>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!("Expected Decimal128Array for {element_type:?} element"),
+                    })?;
+            let arrow_scale = match values.data_type() {
+                ArrowDataType::Decimal128(_p, s) => *s as i64,
+                other => {
+                    return Err(IllegalArgument {
+                        message: format!(
+                            "Expected Decimal128 data type for {element_type:?} element, got {other:?}"
+                        ),
+                    });
+                }
+            };
+            let precision = dt.precision();
+            let scale = dt.scale();
+            for i in 0..len {
+                if arr.is_null(i) {
+                    writer.set_null_at(i);
+                } else {
+                    let d = crate::row::Decimal::from_arrow_decimal128(
+                        arr.value(i),
+                        arrow_scale,
+                        precision,
+                        scale,
+                    )?;
+                    writer.write_decimal(i, &d, precision);
+                }
+            }
+        }
+        DataType::Date(_) => {
+            let arr = values
+                .as_primitive_opt::<Date32Type>()
+                .ok_or_else(|| IllegalArgument {
+                    message: format!("Expected Date32Array for {element_type:?} element"),
+                })?;
+            for i in 0..len {
+                if arr.is_null(i) {
+                    writer.set_null_at(i);
+                } else {
+                    writer.write_date(i, Date::new(arr.value(i)));
+                }
+            }
+        }
+        DataType::Time(_) => {
+            write_time_elements(values, element_type, writer)?;
+        }
+        DataType::Timestamp(ts_type) => {
+            write_timestamp_elements(
+                values,
+                element_type,
+                writer,
+                ts_type.precision(),
+                TimestampNtz::new,
+                TimestampNtz::from_millis_nanos,
+                |w, i, ts, p| w.write_timestamp_ntz(i, &ts, p),
+            )?;
+        }
+        DataType::TimestampLTz(ts_type) => {
+            write_timestamp_elements(
+                values,
+                element_type,
+                writer,
+                ts_type.precision(),
+                TimestampLtz::new,
+                TimestampLtz::from_millis_nanos,
+                |w, i, ts, p| w.write_timestamp_ltz(i, &ts, p),
+            )?;
+        }
+        DataType::Array(_) => {
+            let list_arr =
+                values
+                    .as_any()
+                    .downcast_ref::<ListArray>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!("Expected ListArray for {element_type:?} element"),
+                    })?;
+            let nested_element_type = from_arrow_type(&list_arr.value_type())?;
+            for i in 0..len {
+                if list_arr.is_null(i) {
+                    writer.set_null_at(i);
+                } else {
+                    let nested_values = list_arr.value(i);
+                    let mut nested_writer =
+                        FlussArrayWriter::new(nested_values.len(), &nested_element_type);
+                    write_arrow_values_to_fluss_array(
+                        &*nested_values,
+                        &nested_element_type,
+                        &mut nested_writer,
+                    )?;
+                    let nested_array = nested_writer.complete()?;
+                    writer.write_array(i, &nested_array);
+                }
+            }
+        }
+        _ => {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Unsupported element type for Arrow → FlussArray conversion: {element_type:?}"
+                ),
+            });
+        }
+    }
+    Ok(())
+}
+
+/// Writes an Arrow time array into `writer` as millisecond-based `Time` values, keeping nulls.
+fn write_time_elements(
+    values: &dyn Array,
+    element_type: &crate::metadata::DataType,
+    writer: &mut crate::row::binary_array::FlussArrayWriter,
+) -> Result<()> {
+    macro_rules! process_time {
+        ($arrow_type:ty, $to_millis:expr) => {{
+            let typed = values
+                .as_primitive_opt::<$arrow_type>()
+                .ok_or_else(|| IllegalArgument {
+                    message: format!(
+                        "Expected {} for {:?} element",
+                        stringify!($arrow_type),
+                        element_type
+                    ),
+                })?;
+            let as_millis = $to_millis;
+            for idx in 0..typed.len() {
+                if typed.is_null(idx) {
+                    writer.set_null_at(idx);
+                    continue;
+                }
+                writer.write_time(idx, Time::new(as_millis(typed.value(idx))));
+            }
+        }};
+    }
+    match values.data_type() {
+        ArrowDataType::Time32(TimeUnit::Second) => {
+            process_time!(Time32SecondType, |v: i32| v * 1000);
+        }
+        ArrowDataType::Time32(TimeUnit::Millisecond) => {
+            process_time!(Time32MillisecondType, |v: i32| v);
+        }
+        ArrowDataType::Time64(TimeUnit::Microsecond) => {
+            process_time!(Time64MicrosecondType, |v: i64| (v / 1000) as i32);
+        }
+        ArrowDataType::Time64(TimeUnit::Nanosecond) => {
+            process_time!(Time64NanosecondType, |v: i64| (v / 1_000_000) as i32);
+        }
+        other => {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Expected Time column for {element_type:?} element, got {other:?}"
+                ),
+            });
+        }
+    }
+    Ok(())
+}
+
+/// Splits a raw Arrow timestamp expressed in `unit` into `(epoch_millis, nanos_of_milli)`.
+///
+/// Euclidean division keeps the nanosecond part non-negative for negative (pre-epoch) inputs.
+fn convert_timestamp_raw(raw: i64, unit: &TimeUnit) -> (i64, i32) {
+    match unit {
+        // Saturate instead of overflowing (debug panic / release wrap-around) on extreme values.
+        TimeUnit::Second => (raw.saturating_mul(1000), 0),
+        TimeUnit::Millisecond => (raw, 0),
+        TimeUnit::Microsecond => {
+            // The sub-millisecond remainder is in microseconds; scale it to nanoseconds.
+            (raw.div_euclid(1000), (raw.rem_euclid(1000) * 1000) as i32)
+        }
+        // The remainder is below 1_000_000, so the narrowing cast cannot truncate.
+        TimeUnit::Nanosecond => (raw.div_euclid(1_000_000), raw.rem_euclid(1_000_000) as i32),
+    }
+}
+
+/// Writes an Arrow timestamp array into `writer`, converting each value to (millis, nanos).
+fn write_timestamp_elements<T>(
+    values: &dyn Array,
+    element_type: &crate::metadata::DataType,
+    writer: &mut crate::row::binary_array::FlussArrayWriter,
+    precision: u32,
+    construct_compact: impl Fn(i64) -> T,
+    construct_with_nanos: impl Fn(i64, i32) -> Result<T>,
+    write_fn: impl Fn(&mut crate::row::binary_array::FlussArrayWriter, usize, T, u32),
+) -> Result<()> {
+    let unit = match values.data_type() {
+        ArrowDataType::Timestamp(unit, _) => unit,
+        other => {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Expected Timestamp column for {element_type:?} element, got {other:?}"
+                ),
+            });
+        }
+    };
+    macro_rules! process_ts {
+        ($arrow_type:ty) => {{
+            let arr = values
+                .as_primitive_opt::<$arrow_type>()
+                .ok_or_else(|| IllegalArgument {
+                    message: format!(
+                        "Expected {} for {:?} element",
+                        stringify!($arrow_type),
+                        element_type
+                    ),
+                })?;
+            for i in 0..arr.len() {
+                if arr.is_null(i) {
+                    writer.set_null_at(i);
+                    continue;
+                }
+                let (millis, nanos) = convert_timestamp_raw(arr.value(i), unit);
+                let ts = if nanos == 0 {
+                    construct_compact(millis)
+                } else {
+                    construct_with_nanos(millis, nanos)?
+                };
+                write_fn(writer, i, ts, precision);
+            }
+        }};
+    }
+    // Pick the Arrow primitive type matching `unit`; the per-element logic is shared.
+    match unit {
+        TimeUnit::Second => process_ts!(TimestampSecondType),
+        TimeUnit::Millisecond => process_ts!(TimestampMillisecondType),
+        TimeUnit::Microsecond => process_ts!(TimestampMicrosecondType),
+        TimeUnit::Nanosecond => process_ts!(TimestampNanosecondType),
+    }
+    Ok(())
 }
 
 #[cfg(test)]
 mod tests {
     use super::*;
     use arrow::array::{
-        BinaryArray, BooleanArray, Decimal128Array, Float32Array, Float64Array, Int8Array,
-        Int16Array, Int32Array, Int64Array, StringArray,
+        ArrayRef, BinaryArray, BooleanArray, Decimal128Array, Float32Array, Float64Array,
+        Int8Array, Int16Array, Int32Array, Int32Builder, Int64Array, ListBuilder, StringArray,
+        UInt32Builder,
     };
     use arrow::datatypes::{DataType, Field, Schema};
 
+    fn single_column_row(array: ArrayRef) -> ColumnarRow {
+        let batch =
+            RecordBatch::try_from_iter(vec![("arr", array)]).expect("record batch with one column");
+        ColumnarRow::new(Arc::new(batch))
+    }
+
     #[test]
     fn columnar_row_reads_values() {
         let schema = Arc::new(Schema::new(vec![
@@ -533,4 +898,96 @@ mod tests {
             .unwrap()
         );
     }
+
+    #[test]
+    fn columnar_row_get_array_int_roundtrip() {
+        let mut builder = ListBuilder::new(Int32Builder::new());
+        builder.values().append_value(1);
+        builder.values().append_value(2);
+        builder.values().append_value(3);
+        builder.append(true);
+        let array = Arc::new(builder.finish()) as ArrayRef;
+
+        let row = single_column_row(array);
+        let arr = row.get_array(0).unwrap();
+        assert_eq!(arr.size(), 3);
+        assert_eq!(arr.get_int(0).unwrap(), 1);
+        assert_eq!(arr.get_int(1).unwrap(), 2);
+        assert_eq!(arr.get_int(2).unwrap(), 3);
+    }
+
+    #[test]
+    fn columnar_row_get_array_with_nulls() {
+        let mut builder = ListBuilder::new(Int32Builder::new());
+        builder.values().append_value(1);
+        builder.values().append_null();
+        builder.values().append_value(3);
+        builder.append(true);
+        let array = Arc::new(builder.finish()) as ArrayRef;
+
+        let row = single_column_row(array);
+        let arr = row.get_array(0).unwrap();
+        assert_eq!(arr.size(), 3);
+        assert_eq!(arr.get_int(0).unwrap(), 1);
+        assert!(arr.is_null_at(1));
+        assert_eq!(arr.get_int(2).unwrap(), 3);
+    }
+
+    #[test]
+    fn columnar_row_get_array_nested_array() {
+        let mut outer = ListBuilder::new(ListBuilder::new(Int32Builder::new()));
+
+        // first nested array: [1, 2]
+        outer.values().values().append_value(1);
+        outer.values().values().append_value(2);
+        outer.values().append(true);
+
+        // second nested array: [99]
+        outer.values().values().append_value(99);
+        outer.values().append(true);
+
+        // one row containing two nested arrays
+        outer.append(true);
+        let array = Arc::new(outer.finish()) as ArrayRef;
+
+        let row = single_column_row(array);
+        let arr = row.get_array(0).unwrap();
+        assert_eq!(arr.size(), 2);
+
+        let nested0 = arr.get_array(0).unwrap();
+        assert_eq!(nested0.size(), 2);
+        assert_eq!(nested0.get_int(0).unwrap(), 1);
+        assert_eq!(nested0.get_int(1).unwrap(), 2);
+
+        let nested1 = arr.get_array(1).unwrap();
+        assert_eq!(nested1.size(), 1);
+        assert_eq!(nested1.get_int(0).unwrap(), 99);
+    }
+
+    #[test]
+    fn columnar_row_get_array_non_list_column_returns_error() {
+        let array = Arc::new(Int32Array::from(vec![1, 2, 3])) as ArrayRef;
+        let row = single_column_row(array);
+        let err = row.get_array(0).unwrap_err();
+        assert!(
+            err.to_string().contains("expected List array"),
+            "unexpected error: {err}"
+        );
+    }
+
+    #[test]
+    fn columnar_row_get_array_unsupported_element_type_returns_error() {
+        let mut builder = ListBuilder::new(UInt32Builder::new());
+        builder.values().append_value(7);
+        builder.append(true);
+        let array = Arc::new(builder.finish()) as ArrayRef;
+
+        let row = single_column_row(array);
+        let err = row.get_array(0).unwrap_err();
+        assert!(
+            err.to_string()
+                .contains("Cannot convert Arrow type to Fluss type"),
+            "unexpected error: {err}"
+        );
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
index 339e366155..c6940652f5 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
@@ -47,6 +47,15 @@ impl CompactedKeyWriter {
     }
 
     pub fn create_value_writer(field_type: &DataType) -> Result<ValueWriter> {
+        // Array key columns are encodable here, matching Java's CompactedKeyEncoder;
+        // the server rejects unsupported key types at table-creation time anyway.
+        // Map and Row are refused up front because ValueWriter does not support
+        // them yet.
+        if matches!(field_type, DataType::Map(_) | DataType::Row(_)) {
+            return Err(crate::error::Error::IllegalArgument {
+                message: format!("Cannot use {field_type:?} as a key column type"),
+            });
+        }
         ValueWriter::create_value_writer(field_type, Some(&BinaryRowFormat::Compacted))
     }
 
@@ -101,6 +110,8 @@ impl BinaryWriter for CompactedKeyWriter {
             fn write_timestamp_ntz(&mut self, value: &crate::row::datum::TimestampNtz, precision: u32);
 
             fn write_timestamp_ltz(&mut self, value: &crate::row::datum::TimestampLtz, precision: u32);
+
+            fn write_array(&mut self, value: &[u8]);
         }
     }
 
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index 918ebdfd5f..267ae13cd1 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -68,9 +68,16 @@ impl<'a> CompactedRow<'a> {
         self.size_in_bytes
     }
 
-    fn decoded_row(&self) -> &GenericRow<'_> {
-        self.decoded_row
-            .get_or_init(|| self.deserializer.deserialize(&self.reader))
+    fn decoded_row(&self) -> Result<&GenericRow<'_>> {
+        if let Some(row) = self.decoded_row.get() {
+            return Ok(row);
+        }
+
+        // `OnceLock::get_or_try_init` is still unstable on our toolchain.
+        // Keep the same semantics by performing the fallible decode first,
+        // then atomically installing it via `get_or_init`.
+        let decoded = self.deserializer.deserialize(&self.reader)?;
+        Ok(self.decoded_row.get_or_init(|| decoded))
     }
 
     pub fn as_bytes(&self) -> &[u8] {
@@ -97,67 +104,71 @@ impl<'a> InternalRow for CompactedRow<'a> {
     }
 
     fn get_boolean(&self, pos: usize) -> Result<bool> {
-        self.decoded_row().get_boolean(pos)
+        self.decoded_row()?.get_boolean(pos)
     }
 
     fn get_byte(&self, pos: usize) -> Result<i8> {
-        self.decoded_row().get_byte(pos)
+        self.decoded_row()?.get_byte(pos)
     }
 
     fn get_short(&self, pos: usize) -> Result<i16> {
-        self.decoded_row().get_short(pos)
+        self.decoded_row()?.get_short(pos)
     }
 
     fn get_int(&self, pos: usize) -> Result<i32> {
-        self.decoded_row().get_int(pos)
+        self.decoded_row()?.get_int(pos)
     }
 
     fn get_long(&self, pos: usize) -> Result<i64> {
-        self.decoded_row().get_long(pos)
+        self.decoded_row()?.get_long(pos)
     }
 
     fn get_float(&self, pos: usize) -> Result<f32> {
-        self.decoded_row().get_float(pos)
+        self.decoded_row()?.get_float(pos)
     }
 
     fn get_double(&self, pos: usize) -> Result<f64> {
-        self.decoded_row().get_double(pos)
+        self.decoded_row()?.get_double(pos)
     }
 
     fn get_char(&self, pos: usize, length: usize) -> Result<&str> {
-        self.decoded_row().get_char(pos, length)
+        self.decoded_row()?.get_char(pos, length)
     }
 
     fn get_string(&self, pos: usize) -> Result<&str> {
-        self.decoded_row().get_string(pos)
+        self.decoded_row()?.get_string(pos)
     }
 
     fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Result<Decimal> {
-        self.decoded_row().get_decimal(pos, precision, scale)
+        self.decoded_row()?.get_decimal(pos, precision, scale)
     }
 
     fn get_date(&self, pos: usize) -> Result<Date> {
-        self.decoded_row().get_date(pos)
+        self.decoded_row()?.get_date(pos)
     }
 
     fn get_time(&self, pos: usize) -> Result<Time> {
-        self.decoded_row().get_time(pos)
+        self.decoded_row()?.get_time(pos)
     }
 
     fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> Result<TimestampNtz> {
-        self.decoded_row().get_timestamp_ntz(pos, precision)
+        self.decoded_row()?.get_timestamp_ntz(pos, precision)
     }
 
     fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> Result<TimestampLtz> {
-        self.decoded_row().get_timestamp_ltz(pos, precision)
+        self.decoded_row()?.get_timestamp_ltz(pos, precision)
     }
 
     fn get_binary(&self, pos: usize, length: usize) -> Result<&[u8]> {
-        self.decoded_row().get_binary(pos, length)
+        self.decoded_row()?.get_binary(pos, length)
     }
 
     fn get_bytes(&self, pos: usize) -> Result<&[u8]> {
-        self.decoded_row().get_bytes(pos)
+        self.decoded_row()?.get_bytes(pos)
+    }
+
+    fn get_array(&self, pos: usize) -> Result<crate::row::FlussArray> {
+        self.decoded_row()?.get_array(pos)
     }
 
     fn as_encoded_bytes(&self, write_format: WriteFormat) -> Option<&[u8]> {
@@ -327,4 +338,157 @@ mod tests {
             999999999999999999i64
         );
     }
+
+    #[test]
+    fn test_compacted_row_int_array() {
+        use crate::metadata::DataTypes;
+        use crate::row::binary_array::FlussArrayWriter;
+
+        // Schema: (INT, ARRAY<INT>); the array column carries [1, 2, 3].
+        let schema =
+            RowType::with_data_types(vec![DataTypes::int(), DataTypes::array(DataTypes::int())]);
+
+        let int_type = DataTypes::int();
+        let mut array_writer = FlussArrayWriter::new(3, &int_type);
+        for (idx, value) in [1, 2, 3].iter().copied().enumerate() {
+            array_writer.write_int(idx, value);
+        }
+        let array = array_writer.complete().unwrap();
+
+        let mut row_writer = CompactedRowWriter::new(schema.fields().len());
+        row_writer.write_int(42);
+        row_writer.write_array(array.as_bytes());
+        let encoded = row_writer.to_bytes();
+        let row = CompactedRow::from_bytes(&schema, encoded.as_ref());
+
+        assert_eq!(row.get_int(0).unwrap(), 42);
+        let decoded = row.get_array(1).unwrap();
+        assert_eq!(decoded.size(), 3);
+        for (idx, expected) in [1, 2, 3].iter().copied().enumerate() {
+            assert_eq!(decoded.get_int(idx).unwrap(), expected);
+        }
+    }
+
+    #[test]
+    fn test_compacted_row_string_array() {
+        use crate::metadata::DataTypes;
+        use crate::row::binary_array::FlussArrayWriter;
+
+        // Single-column schema: ARRAY<STRING>.
+        let schema = RowType::with_data_types(vec![DataTypes::array(DataTypes::string())]);
+        let words = ["hello", "fluss", "rust"];
+        let string_type = DataTypes::string();
+        let mut array_writer = FlussArrayWriter::new(words.len(), &string_type);
+        for (idx, word) in words.iter().copied().enumerate() {
+            array_writer.write_string(idx, word);
+        }
+        let array = array_writer.complete().unwrap();
+
+        let mut row_writer = CompactedRowWriter::new(schema.fields().len());
+        row_writer.write_array(array.as_bytes());
+        let encoded = row_writer.to_bytes();
+        let row = CompactedRow::from_bytes(&schema, encoded.as_ref());
+
+        let decoded = row.get_array(0).unwrap();
+        assert_eq!(decoded.size(), 3);
+        for (idx, word) in words.iter().copied().enumerate() {
+            assert_eq!(decoded.get_string(idx).unwrap(), word);
+        }
+    }
+
+    #[test]
+    fn test_compacted_row_array_with_nulls() {
+        use crate::metadata::DataTypes;
+        use crate::row::binary_array::FlussArrayWriter;
+
+        // Single-column schema: ARRAY<INT>; the payload is [10, null, 30].
+        let schema = RowType::with_data_types(vec![DataTypes::array(DataTypes::int())]);
+
+        let int_type = DataTypes::int();
+        let mut array_writer = FlussArrayWriter::new(3, &int_type);
+        array_writer.write_int(0, 10);
+        array_writer.set_null_at(1);
+        array_writer.write_int(2, 30);
+        let array = array_writer.complete().unwrap();
+
+        let mut row_writer = CompactedRowWriter::new(schema.fields().len());
+        row_writer.write_array(array.as_bytes());
+        let encoded = row_writer.to_bytes();
+        let row = CompactedRow::from_bytes(&schema, encoded.as_ref());
+
+        let decoded = row.get_array(0).unwrap();
+        assert_eq!(decoded.size(), 3);
+        assert!(!decoded.is_null_at(0));
+        assert_eq!(decoded.get_int(0).unwrap(), 10);
+        assert!(decoded.is_null_at(1));
+        assert!(!decoded.is_null_at(2));
+        assert_eq!(decoded.get_int(2).unwrap(), 30);
+    }
+
+    #[test]
+    fn test_compacted_row_empty_array() {
+        use crate::metadata::DataTypes;
+        use crate::row::binary_array::FlussArrayWriter;
+
+        // Single-column schema: ARRAY<INT>; the payload has zero elements.
+        let schema = RowType::with_data_types(vec![DataTypes::array(DataTypes::int())]);
+
+        let int_type = DataTypes::int();
+        let empty = FlussArrayWriter::new(0, &int_type).complete().unwrap();
+
+        let mut row_writer = CompactedRowWriter::new(schema.fields().len());
+        row_writer.write_array(empty.as_bytes());
+        let encoded = row_writer.to_bytes();
+        let row = CompactedRow::from_bytes(&schema, encoded.as_ref());
+
+        // Reading the column back must yield an array of size zero.
+        let decoded = row.get_array(0).unwrap();
+        assert_eq!(decoded.size(), 0);
+    }
+
+    #[test]
+    fn test_compacted_row_nested_array() {
+        use crate::metadata::DataTypes;
+        use crate::row::binary_array::FlussArrayWriter;
+
+        // Single-column schema: ARRAY<ARRAY<INT>>; the payload is [[1, 2], [99]].
+        let schema =
+            RowType::with_data_types(vec![DataTypes::array(DataTypes::array(DataTypes::int()))]);
+
+        // Inner arrays: [1, 2] and [99].
+        let int_type = DataTypes::int();
+        let mut first_writer = FlussArrayWriter::new(2, &int_type);
+        first_writer.write_int(0, 1);
+        first_writer.write_int(1, 2);
+        let first = first_writer.complete().unwrap();
+
+        let mut second_writer = FlussArrayWriter::new(1, &int_type);
+        second_writer.write_int(0, 99);
+        let second = second_writer.complete().unwrap();
+
+        // Outer array: the writer receives the type of its elements, ARRAY<INT>.
+        let outer_elem_type = DataTypes::array(DataTypes::int());
+        let mut nested_writer = FlussArrayWriter::new(2, &outer_elem_type);
+        nested_writer.write_array(0, &first);
+        nested_writer.write_array(1, &second);
+        let nested = nested_writer.complete().unwrap();
+
+        let mut row_writer = CompactedRowWriter::new(schema.fields().len());
+        row_writer.write_array(nested.as_bytes());
+        let encoded = row_writer.to_bytes();
+        let row = CompactedRow::from_bytes(&schema, encoded.as_ref());
+
+        // Read back and check both nesting levels.
+        let outer = row.get_array(0).unwrap();
+        assert_eq!(outer.size(), 2);
+
+        let inner_a = outer.get_array(0).unwrap();
+        assert_eq!(inner_a.size(), 2);
+        assert_eq!(inner_a.get_int(0).unwrap(), 1);
+        assert_eq!(inner_a.get_int(1).unwrap(), 2);
+
+        let inner_b = outer.get_array(1).unwrap();
+        assert_eq!(inner_b.size(), 1);
+        assert_eq!(inner_b.get_int(0).unwrap(), 99);
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index 00e53aa142..4ae442fc0e 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -18,6 +18,7 @@
 use crate::metadata::RowType;
 use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
 use crate::{
+    error::{Error::IllegalArgument, Result},
     metadata::DataType,
     row::{Datum, Decimal, GenericRow, compacted::compacted_row_writer::CompactedRowWriter},
     util::varint::{read_unsigned_varint_at, read_unsigned_varint_u64_at},
@@ -49,7 +50,7 @@ impl<'a> CompactedRowDeserializer<'a> {
         self.row_type.as_ref()
     }
 
-    pub fn deserialize(&self, reader: &CompactedRowReader<'a>) -> GenericRow<'a> {
+    pub fn deserialize(&self, reader: &CompactedRowReader<'a>) -> Result<GenericRow<'a>> {
         let mut row = GenericRow::new(self.row_type.fields().len());
         let mut cursor = reader.initial_position();
         for (col_pos, data_field) in self.row_type.fields().iter().enumerate() {
@@ -60,41 +61,41 @@ impl<'a> CompactedRowDeserializer<'a> {
             }
             let (datum, next_cursor) = match dtype {
                 DataType::Boolean(_) => {
-                    let (val, next) = reader.read_boolean(cursor);
+                    let (val, next) = reader.read_boolean(cursor)?;
                     (Datum::Bool(val), next)
                 }
                 DataType::TinyInt(_) => {
-                    let (val, next) = reader.read_byte(cursor);
+                    let (val, next) = reader.read_byte(cursor)?;
                     (Datum::Int8(val as i8), next)
                 }
                 DataType::SmallInt(_) => {
-                    let (val, next) = reader.read_short(cursor);
+                    let (val, next) = reader.read_short(cursor)?;
                     (Datum::Int16(val), next)
                 }
                 DataType::Int(_) => {
-                    let (val, next) = reader.read_int(cursor);
+                    let (val, next) = reader.read_int(cursor)?;
                     (Datum::Int32(val), next)
                 }
                 DataType::BigInt(_) => {
-                    let (val, next) = reader.read_long(cursor);
+                    let (val, next) = reader.read_long(cursor)?;
                     (Datum::Int64(val), next)
                 }
                 DataType::Float(_) => {
-                    let (val, next) = reader.read_float(cursor);
+                    let (val, next) = reader.read_float(cursor)?;
                     (Datum::Float32(val.into()), next)
                 }
                 DataType::Double(_) => {
-                    let (val, next) = reader.read_double(cursor);
+                    let (val, next) = reader.read_double(cursor)?;
                     (Datum::Float64(val.into()), next)
                 }
                 // TODO: use read_char(length) in the future, but need to keep compatibility
                 DataType::Char(_) | DataType::String(_) => {
-                    let (val, next) = reader.read_string(cursor);
+                    let (val, next) = reader.read_string(cursor)?;
                     (Datum::String(val.into()), next)
                 }
                 // TODO: use read_binary(length) in the future, but need to keep compatibility
                 DataType::Bytes(_) | DataType::Binary(_) => {
-                    let (val, next) = reader.read_bytes(cursor);
+                    let (val, next) = reader.read_bytes(cursor)?;
                     (Datum::Blob(val.into()), next)
                 }
                 DataType::Decimal(decimal_type) => {
@@ -102,42 +103,57 @@ impl<'a> CompactedRowDeserializer<'a> {
                     let scale = decimal_type.scale();
                     if Decimal::is_compact_precision(precision) {
                         // Compact: stored as i64
-                        let (val, next) = reader.read_long(cursor);
-                        let decimal = Decimal::from_unscaled_long(val, precision, scale)
-                            .expect("Failed to create decimal from unscaled long");
+                        let (val, next) = reader.read_long(cursor)?;
+                        let decimal =
+                            Decimal::from_unscaled_long(val, precision, scale).map_err(|e| {
+                                IllegalArgument {
+                                    message: format!(
+                                        "Failed to create decimal from unscaled long: {e}"
+                                    ),
+                                }
+                            })?;
                         (Datum::Decimal(decimal), next)
                     } else {
                         // Non-compact: stored as minimal big-endian bytes
-                        let (bytes, next) = reader.read_bytes(cursor);
+                        let (bytes, next) = reader.read_bytes(cursor)?;
                         let decimal = Decimal::from_unscaled_bytes(bytes, precision, scale)
-                            .expect("Failed to create decimal from unscaled bytes");
+                            .map_err(|e| IllegalArgument {
+                                message: format!(
+                                    "Failed to create decimal from unscaled bytes: {e}"
+                                ),
+                            })?;
                         (Datum::Decimal(decimal), next)
                     }
                 }
                 DataType::Date(_) => {
-                    let (val, next) = reader.read_int(cursor);
+                    let (val, next) = reader.read_int(cursor)?;
                     (Datum::Date(crate::row::datum::Date::new(val)), next)
                 }
                 DataType::Time(_) => {
-                    let (val, next) = reader.read_int(cursor);
+                    let (val, next) = reader.read_int(cursor)?;
                     (Datum::Time(crate::row::datum::Time::new(val)), next)
                 }
                 DataType::Timestamp(timestamp_type) => {
                     let precision = timestamp_type.precision();
                     if crate::row::datum::TimestampNtz::is_compact(precision) {
                         // Compact: only milliseconds
-                        let (millis, next) = reader.read_long(cursor);
+                        let (millis, next) = reader.read_long(cursor)?;
                         (
                             Datum::TimestampNtz(crate::row::datum::TimestampNtz::new(millis)),
                             next,
                         )
                     } else {
                         // Non-compact: milliseconds + nanos
-                        let (millis, mid) = reader.read_long(cursor);
-                        let (nanos, next) = reader.read_int(mid);
-                        let timestamp =
-                            crate::row::datum::TimestampNtz::from_millis_nanos(millis, nanos)
-                                .expect("Invalid nano_of_millisecond value in compacted row");
+                        let (millis, mid) = reader.read_long(cursor)?;
+                        let (nanos, next) = reader.read_int(mid)?;
+                        let timestamp = crate::row::datum::TimestampNtz::from_millis_nanos(
+                            millis, nanos,
+                        )
+                        .map_err(|e| IllegalArgument {
+                            message: format!(
+                                "Invalid nano_of_millisecond value in compacted row timestamp: {e}"
+                            ),
+                        })?;
                         (Datum::TimestampNtz(timestamp), next)
                     }
                 }
@@ -145,29 +161,44 @@ impl<'a> CompactedRowDeserializer<'a> {
                     let precision = timestamp_ltz_type.precision();
                     if crate::row::datum::TimestampLtz::is_compact(precision) {
                         // Compact: only epoch milliseconds
-                        let (epoch_millis, next) = reader.read_long(cursor);
+                        let (epoch_millis, next) = reader.read_long(cursor)?;
                         (
                             Datum::TimestampLtz(crate::row::datum::TimestampLtz::new(epoch_millis)),
                             next,
                         )
                     } else {
                         // Non-compact: epoch milliseconds + nanos
-                        let (epoch_millis, mid) = reader.read_long(cursor);
-                        let (nanos, next) = reader.read_int(mid);
-                        let timestamp_ltz =
-                            crate::row::datum::TimestampLtz::from_millis_nanos(epoch_millis, nanos)
-                                .expect("Invalid nano_of_millisecond value in compacted row");
+                        let (epoch_millis, mid) = reader.read_long(cursor)?;
+                        let (nanos, next) = reader.read_int(mid)?;
+                        let timestamp_ltz = crate::row::datum::TimestampLtz::from_millis_nanos(
+                            epoch_millis,
+                            nanos,
+                        )
+                        .map_err(|e| IllegalArgument {
+                            message: format!(
+                                "Invalid nano_of_millisecond value in compacted row timestamp_ltz: {e}"
+                            ),
+                        })?;
                         (Datum::TimestampLtz(timestamp_ltz), next)
                     }
                 }
+                DataType::Array(_) => {
+                    let (bytes, next) = reader.read_bytes(cursor)?;
+                    let array = crate::row::binary_array::FlussArray::from_bytes(bytes)?;
+                    (Datum::Array(array), next)
+                }
                 _ => {
-                    panic!("Unsupported DataType in CompactedRowDeserializer: {dtype:?}");
+                    return Err(IllegalArgument {
+                        message: format!(
+                            "Unsupported DataType in CompactedRowDeserializer: {dtype:?}"
+                        ),
+                    });
                 }
             };
             cursor = next_cursor;
             row.set_field(col_pos, datum);
         }
-        row
+        Ok(row)
     }
 }
 
@@ -202,6 +233,21 @@ impl<'a> CompactedRowReader<'a> {
         self.offset + self.header_size_in_bytes
     }
 
+    fn checked_pos(&self, pos: usize, width: usize, context: &str) -> Result<usize> {
+        match pos.checked_add(width) {
+            Some(end) if end <= self.limit => Ok(end), // exclusive end, within limit
+            Some(_) => Err(IllegalArgument {
+                message: format!(
+                    "Out-of-bounds while reading {context}: pos={pos}, width={width}, limit={}",
+                    self.limit
+                ),
+            }),
+            None => Err(IllegalArgument {
+                message: format!("Overflow while reading {context}: pos={pos}, width={width}"),
+            }),
+        }
+    }
+
     pub fn is_null_at(&self, col_pos: usize) -> bool {
         let byte_index = col_pos >> 3;
         let bit = col_pos & 7;
@@ -210,79 +256,73 @@ impl<'a> CompactedRowReader<'a> {
         (self.segment[idx] & (1u8 << bit)) != 0
     }
 
-    pub fn read_boolean(&self, pos: usize) -> (bool, usize) {
-        let (val, next) = self.read_byte(pos);
-        (val != 0, next)
+    pub fn read_boolean(&self, pos: usize) -> Result<(bool, usize)> {
+        let (val, next) = self.read_byte(pos)?;
+        Ok((val != 0, next))
     }
 
-    pub fn read_byte(&self, pos: usize) -> (u8, usize) {
-        debug_assert!(pos < self.limit);
-        (self.segment[pos], pos + 1)
+    pub fn read_byte(&self, pos: usize) -> Result<(u8, usize)> {
+        let next = self.checked_pos(pos, 1, "byte")?;
+        Ok((self.segment[pos], next))
     }
 
-    pub fn read_short(&self, pos: usize) -> (i16, usize) {
-        let next_pos = pos + 2;
-        debug_assert!(next_pos <= self.limit);
-        let bytes_slice = &self.segment[pos..pos + 2];
-        let val = i16::from_ne_bytes(
-            bytes_slice
-                .try_into()
-                .expect("Slice must be exactly 2 bytes long"),
-        );
-        (val, next_pos)
+    pub fn read_short(&self, pos: usize) -> Result<(i16, usize)> {
+        let next_pos = self.checked_pos(pos, 2, "short")?;
+        let mut arr = [0u8; 2];
+        arr.copy_from_slice(&self.segment[pos..next_pos]);
+        Ok((i16::from_ne_bytes(arr), next_pos))
     }
 
-    pub fn read_int(&self, pos: usize) -> (i32, usize) {
+    pub fn read_int(&self, pos: usize) -> Result<(i32, usize)> {
         match read_unsigned_varint_at(self.segment, pos, CompactedRowWriter::MAX_INT_SIZE) {
-            Ok((value, next_pos)) => (value as i32, next_pos),
-            Err(_) => panic!("Invalid VarInt32 input stream."),
+            Ok((value, next_pos)) => Ok((value as i32, next_pos)),
+            Err(e) => Err(IllegalArgument {
+                message: format!("Invalid VarInt32 input stream at pos {pos}: {e}"),
+            }),
         }
     }
 
-    pub fn read_long(&self, pos: usize) -> (i64, usize) {
+    pub fn read_long(&self, pos: usize) -> Result<(i64, usize)> {
         match read_unsigned_varint_u64_at(self.segment, pos, CompactedRowWriter::MAX_LONG_SIZE) {
-            Ok((value, next_pos)) => (value as i64, next_pos),
-            Err(_) => panic!("Invalid VarInt64 input stream."),
+            Ok((value, next_pos)) => Ok((value as i64, next_pos)),
+            Err(e) => Err(IllegalArgument {
+                message: format!("Invalid VarInt64 input stream at pos {pos}: {e}"),
+            }),
         }
     }
 
-    pub fn read_float(&self, pos: usize) -> (f32, usize) {
-        let next_pos = pos + 4;
-        debug_assert!(next_pos <= self.limit);
-        let val = f32::from_ne_bytes(
-            self.segment[pos..pos + 4]
-                .try_into()
-                .expect("Slice must be exactly 4 bytes long"),
-        );
-        (val, next_pos)
+    pub fn read_float(&self, pos: usize) -> Result<(f32, usize)> {
+        let next_pos = self.checked_pos(pos, 4, "float")?;
+        let mut arr = [0u8; 4];
+        arr.copy_from_slice(&self.segment[pos..next_pos]);
+        Ok((f32::from_ne_bytes(arr), next_pos))
     }
 
-    pub fn read_double(&self, pos: usize) -> (f64, usize) {
-        let next_pos = pos + 8;
-        debug_assert!(next_pos <= self.limit);
-        let val = f64::from_ne_bytes(
-            self.segment[pos..pos + 8]
-                .try_into()
-                .expect("Slice must be exactly 8 bytes long"),
-        );
-        (val, next_pos)
+    pub fn read_double(&self, pos: usize) -> Result<(f64, usize)> {
+        let next_pos = self.checked_pos(pos, 8, "double")?;
+        let mut arr = [0u8; 8];
+        arr.copy_from_slice(&self.segment[pos..next_pos]);
+        Ok((f64::from_ne_bytes(arr), next_pos))
     }
 
-    pub fn read_binary(&self, pos: usize) -> (&'a [u8], usize) {
+    pub fn read_binary(&self, pos: usize) -> Result<(&'a [u8], usize)> {
         self.read_bytes(pos)
     }
 
-    pub fn read_bytes(&self, pos: usize) -> (&'a [u8], usize) {
-        let (len, data_pos) = self.read_int(pos);
-        let len = len as usize;
-        let next_pos = data_pos + len;
-        debug_assert!(next_pos <= self.limit);
-        (&self.segment[data_pos..next_pos], next_pos)
+    pub fn read_bytes(&self, pos: usize) -> Result<(&'a [u8], usize)> {
+        let (len, data_pos) = self.read_int(pos)?;
+        let len = usize::try_from(len).map_err(|_| IllegalArgument {
+            message: format!("Negative length while reading bytes at pos {pos}: {len}"),
+        })?;
+        let next_pos = self.checked_pos(data_pos, len, "bytes payload")?;
+        Ok((&self.segment[data_pos..next_pos], next_pos))
     }
 
-    pub fn read_string(&self, pos: usize) -> (&'a str, usize) {
-        let (bytes, next_pos) = self.read_bytes(pos);
-        let s = from_utf8(bytes).expect("Invalid UTF-8 when reading string");
-        (s, next_pos)
+    pub fn read_string(&self, pos: usize) -> Result<(&'a str, usize)> {
+        let (bytes, next_pos) = self.read_bytes(pos)?;
+        let s = from_utf8(bytes).map_err(|e| IllegalArgument {
+            message: format!("Invalid UTF-8 when reading string at pos {pos}: {e}"),
+        })?;
+        Ok((s, next_pos))
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
index ac0100eefb..3627174315 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -165,6 +165,10 @@ impl BinaryWriter for CompactedRowWriter {
         self.write_bytes(&bytes[..length.min(bytes.len())])
     }
 
+    fn write_array(&mut self, value: &[u8]) {
+        self.write_bytes(value) // arrays reuse the `write_bytes` encoding unchanged
+    }
+
     fn complete(&mut self) {
         // do nothing
     }
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 9b2e80a641..2f1d1839fc 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -18,12 +18,14 @@
 use crate::error::Error::RowConvertError;
 use crate::error::Result;
 use crate::row::Decimal;
+use crate::row::binary_array::FlussArray;
 use arrow::array::{
     ArrayBuilder, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
     FixedSizeBinaryBuilder, Float32Builder, Float64Builder, Int8Builder, Int16Builder,
-    Int32Builder, Int64Builder, StringBuilder, Time32MillisecondBuilder, Time32SecondBuilder,
-    Time64MicrosecondBuilder, Time64NanosecondBuilder, TimestampMicrosecondBuilder,
-    TimestampMillisecondBuilder, TimestampNanosecondBuilder, TimestampSecondBuilder,
+    Int32Builder, Int64Builder, ListBuilder, StringBuilder, Time32MillisecondBuilder,
+    Time32SecondBuilder, Time64MicrosecondBuilder, Time64NanosecondBuilder,
+    TimestampMicrosecondBuilder, TimestampMillisecondBuilder, TimestampNanosecondBuilder,
+    TimestampSecondBuilder,
 };
 use arrow::datatypes as arrow_schema;
 use arrow::error::ArrowError;
@@ -68,6 +70,8 @@ pub enum Datum<'a> {
     TimestampNtz(TimestampNtz),
     #[display("{0}")]
     TimestampLtz(TimestampLtz),
+    #[display("{0}")]
+    Array(FlussArray),
 }
 
 impl Datum<'_> {
@@ -123,6 +127,13 @@ impl Datum<'_> {
             _ => panic!("not a timestamp ltz: {self:?}"),
         }
     }
+
+    pub fn as_array(&self) -> &FlussArray {
+        if let Self::Array(array) = self {
+            return array;
+        }
+        panic!("not an array: {self:?}") // every other variant is rejected
+    }
 }
 
 // ----------- implement from
@@ -388,6 +399,13 @@ impl<'a> From<TimestampLtz> for Datum<'a> {
     }
 }
 
+impl<'a> From<FlussArray> for Datum<'a> {
+    #[inline]
+    fn from(array: FlussArray) -> Self {
+        Self::Array(array) // moves the array into the `Array` variant
+    }
+}
+
 pub trait ToArrow {
     fn append_to(
         &self,
@@ -494,6 +512,89 @@ impl AppendResult for std::result::Result<(), ArrowError> {
     }
 }
 
+/// Appends `arr` to `builder` as one non-null list entry, element by element.
+/// Errors if `builder` is not a `ListBuilder` or `data_type` is not a `List`.
+fn append_fluss_array_to_list_builder(
+    arr: &FlussArray,
+    builder: &mut dyn ArrayBuilder,
+    data_type: &arrow_schema::DataType,
+) -> Result<()> {
+    use crate::record::from_arrow_type;
+
+    let list_builder = builder
+        .as_any_mut()
+        .downcast_mut::<ListBuilder<Box<dyn ArrayBuilder>>>()
+        .ok_or_else(|| RowConvertError {
+            message: "Builder type mismatch for Array: expected ListBuilder".to_string(),
+        })?;
+
+    let arrow_schema::DataType::List(element_field) = data_type else {
+        return Err(RowConvertError {
+            message: format!("Expected List Arrow type for Array datum, got: {data_type:?}"),
+        });
+    };
+    let element_arrow_type = element_field.data_type().clone();
+
+    let element_fluss_type = from_arrow_type(&element_arrow_type)?;
+    let values_builder = list_builder.values();
+
+    for idx in 0..arr.size() {
+        // TODO: Datum::Null triggers a chain of downcast attempts in append_to.
+        // For sparse arrays with many nulls, call append_null directly on the
+        // typed inner builder to avoid the overhead.
+        let element = if arr.is_null_at(idx) {
+            Datum::Null
+        } else {
+            read_datum_from_fluss_array(arr, idx, &element_fluss_type)?
+        };
+        element.append_to(values_builder, &element_arrow_type)?;
+    }
+    // Close the entry: the elements appended above form one valid list slot.
+    list_builder.append(true);
+    Ok(())
+}
+
+fn read_datum_from_fluss_array<'a>(
+    arr: &FlussArray,
+    pos: usize,
+    element_type: &crate::metadata::DataType,
+) -> Result<Datum<'a>> {
+    use crate::metadata::DataType;
+    // Reads element `pos` via the getter matching `element_type` and wraps it in a `Datum`.
+    Ok(match element_type {
+        DataType::Boolean(_) => Datum::Bool(arr.get_boolean(pos)?),
+        DataType::TinyInt(_) => Datum::Int8(arr.get_byte(pos)?),
+        DataType::SmallInt(_) => Datum::Int16(arr.get_short(pos)?),
+        DataType::Int(_) => Datum::Int32(arr.get_int(pos)?),
+        DataType::BigInt(_) => Datum::Int64(arr.get_long(pos)?),
+        DataType::Float(_) => Datum::Float32(arr.get_float(pos)?.into()),
+        DataType::Double(_) => Datum::Float64(arr.get_double(pos)?.into()),
+        DataType::Char(_) | DataType::String(_) => {
+            Datum::String(Cow::Owned(arr.get_string(pos)?.to_string())) // owned copy
+        }
+        DataType::Binary(_) | DataType::Bytes(_) => {
+            Datum::Blob(Cow::Owned(arr.get_binary(pos)?.to_vec())) // owned copy
+        }
+        DataType::Decimal(dt) => {
+            Datum::Decimal(arr.get_decimal(pos, dt.precision(), dt.scale())?)
+        }
+        DataType::Date(_) => Datum::Date(arr.get_date(pos)?),
+        DataType::Time(_) => Datum::Time(arr.get_time(pos)?),
+        DataType::Timestamp(t) => Datum::TimestampNtz(arr.get_timestamp_ntz(pos, t.precision())?),
+        DataType::TimestampLTz(t) => {
+            Datum::TimestampLtz(arr.get_timestamp_ltz(pos, t.precision())?)
+        }
+        DataType::Array(_) => Datum::Array(arr.get_array(pos)?),
+        _ => {
+            return Err(RowConvertError {
+                message: format!(
+                    "Unsupported element type for FlussArray → Arrow conversion: {element_type:?}"
+                ),
+            });
+        }
+    })
+}
+
 impl Datum<'_> {
     pub fn append_to(
         &self,
@@ -540,6 +641,18 @@ impl Datum<'_> {
                 append_null_to_arrow!(TimestampMillisecondBuilder);
                 append_null_to_arrow!(TimestampMicrosecondBuilder);
                 append_null_to_arrow!(TimestampNanosecondBuilder);
+                if let arrow_schema::DataType::List(_) = data_type {
+                    let b = builder
+                        .as_any_mut()
+                        .downcast_mut::<ListBuilder<Box<dyn ArrayBuilder>>>()
+                        .ok_or_else(|| RowConvertError {
+                            message:
+                                "Expected ListBuilder<Box<dyn ArrayBuilder>> for List Arrow type"
+                                    .to_string(),
+                        })?;
+                    b.append_null();
+                    return Ok(());
+                }
             }
             Datum::Bool(v) => append_value_to_arrow!(BooleanBuilder, *v),
             Datum::Int8(v) => append_value_to_arrow!(Int8Builder, *v),
@@ -742,6 +855,9 @@ impl Datum<'_> {
                     message: "Builder type mismatch for TimestampLtz".to_string(),
                 });
             }
+            Datum::Array(arr) => {
+                return append_fluss_array_to_list_builder(arr, builder, data_type);
+            }
         }
 
         Err(RowConvertError {
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
index d201450be4..877b3ecdb1 100644
--- a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
@@ -64,8 +64,12 @@ impl CompactedKeyEncoder {
 
         for pos in &encode_field_pos {
             let data_type = row_type.fields().get(*pos).unwrap().data_type();
-            field_getters.push(FieldGetter::create(data_type, *pos));
-            field_encoders.push(CompactedKeyWriter::create_value_writer(data_type)?);
+            // Validate key type support first, so unsupported types return a
+            // typed error instead of panicking in FieldGetter::create.
+            let field_encoder = CompactedKeyWriter::create_value_writer(data_type)?;
+            let field_getter = FieldGetter::create(data_type, *pos);
+            field_getters.push(field_getter);
+            field_encoders.push(field_encoder);
         }
 
         Ok(CompactedKeyEncoder {
@@ -82,18 +86,19 @@ impl KeyEncoder for CompactedKeyEncoder {
         self.compacted_encoder.reset();
 
         // iterate all the fields of the row, and encode each field
-        for (pos, field_getter) in self.field_getters.iter().enumerate() {
+        for (pos, (field_getter, field_encoder)) in self
+            .field_getters
+            .iter()
+            .zip(self.field_encoders.iter())
+            .enumerate()
+        {
             match &field_getter.get_field(row)? {
                 Datum::Null => {
                     return Err(IllegalArgument {
                         message: format!("Cannot encode key with null value at position: {pos:?}"),
                     });
                 }
-                value => self.field_encoders.get(pos).unwrap().write_value(
-                    &mut self.compacted_encoder,
-                    pos,
-                    value,
-                )?,
+                value => field_encoder.write_value(&mut self.compacted_encoder, pos, value)?,
             }
         }
 
@@ -105,8 +110,55 @@ impl KeyEncoder for CompactedKeyEncoder {
 mod tests {
     use super::*;
     use crate::metadata::DataTypes;
+    use crate::row::binary_array::FlussArrayWriter;
     use crate::row::{Datum, GenericRow};
 
+    fn build_int_array(values: &[i32]) -> crate::row::FlussArray {
+        let mut w = FlussArrayWriter::new(values.len(), &DataTypes::int());
+        for (i, v) in values.iter().enumerate() {
+            w.write_int(i, *v);
+        }
+        w.complete().unwrap()
+    }
+
+    fn build_nullable_int_array(values: &[Option<i32>]) -> crate::row::FlussArray {
+        let mut w = FlussArrayWriter::new(values.len(), &DataTypes::int());
+        for (i, v) in values.iter().enumerate() {
+            match v {
+                Some(value) => w.write_int(i, *value),
+                None => w.set_null_at(i),
+            }
+        }
+        w.complete().unwrap()
+    }
+
+    fn build_float_array(values: &[f32]) -> crate::row::FlussArray {
+        let mut w = FlussArrayWriter::new(values.len(), &DataTypes::float().as_non_nullable());
+        for (i, v) in values.iter().enumerate() {
+            w.write_float(i, *v);
+        }
+        w.complete().unwrap()
+    }
+
+    fn build_nested_string_array() -> crate::row::FlussArray {
+        let mut inner_1 = FlussArrayWriter::new(3, &DataTypes::string());
+        inner_1.write_string(0, "a");
+        inner_1.set_null_at(1);
+        inner_1.write_string(2, "c");
+        let inner_1 = inner_1.complete().unwrap();
+
+        let mut inner_2 = FlussArrayWriter::new(2, &DataTypes::string());
+        inner_2.write_string(0, "hello");
+        inner_2.write_string(1, "world");
+        let inner_2 = inner_2.complete().unwrap();
+
+        let mut outer = FlussArrayWriter::new(3, &DataTypes::array(DataTypes::string()));
+        outer.write_array(0, &inner_1);
+        outer.set_null_at(1);
+        outer.write_array(2, &inner_2);
+        outer.complete().unwrap()
+    }
+
     pub fn for_test_row_type(row_type: &RowType) -> CompactedKeyEncoder {
         CompactedKeyEncoder::new(row_type, (0..row_type.fields().len()).collect())
             .expect("CompactedKeyEncoder initialization failed")
@@ -237,6 +289,51 @@ mod tests {
         );
     }
 
+    #[test]
+    fn test_array_type_allowed_as_key() {
+        // Java's CompactedKeyEncoder allows Array as a key column type
+        // (the server rejects unsupported key types at table-creation time).
+        let row_type =
+            RowType::with_data_types(vec![DataTypes::int(), DataTypes::array(DataTypes::int())]);
+        let mut encoder = CompactedKeyEncoder::new(&row_type, vec![0, 1]).unwrap();
+
+        let row_a = GenericRow::from_data(vec![
+            Datum::Int32(42),
+            Datum::Array(build_int_array(&[10, 20])),
+        ]);
+        let row_b = GenericRow::from_data(vec![
+            Datum::Int32(42),
+            Datum::Array(build_int_array(&[10, 30])),
+        ]);
+
+        let encoded_a = encoder.encode_key(&row_a).unwrap();
+        let encoded_b = encoder.encode_key(&row_b).unwrap();
+
+        assert!(!encoded_a.is_empty());
+        assert_ne!(
+            encoded_a.iter().as_slice(),
+            encoded_b.iter().as_slice(),
+            "Array key payload should affect compacted key encoding"
+        );
+    }
+
+    #[test]
+    fn test_map_type_rejected_as_key() {
+        let row_type = RowType::with_data_types(vec![
+            DataTypes::int(),
+            DataTypes::map(DataTypes::int(), DataTypes::string()),
+        ]);
+        match CompactedKeyEncoder::new(&row_type, vec![0, 1]) {
+            Ok(_) => panic!("Expected error when using Map as key type"),
+            Err(err) => {
+                assert!(
+                    err.to_string().contains("Cannot use"),
+                    "Expected 'Cannot use' error, got: {err}"
+                );
+            }
+        }
+    }
+
     #[test]
     fn test_all_data_types_java_compatible() {
         // Test encoding compatibility with Java using reference from:
@@ -263,9 +360,11 @@ mod tests {
             DataType::Timestamp(TimestampType::with_nullable(false, 5).unwrap()), // TIMESTAMP(5)
             DataType::TimestampLTz(TimestampLTzType::with_nullable(false, 1).unwrap()), // TIMESTAMP_LTZ(1)
             DataType::TimestampLTz(TimestampLTzType::with_nullable(false, 5).unwrap()), // TIMESTAMP_LTZ(5)
-                                                                                        // TODO: Add support for ARRAY type
-                                                                                        // TODO: Add support for MAP type
-                                                                                        // TODO: Add support for ROW type
+            DataTypes::array(DataTypes::int()), // ARRAY<INT>
+            DataTypes::array(DataTypes::float().as_non_nullable()), // ARRAY<FLOAT NOT NULL>
+            DataTypes::array(DataTypes::array(DataTypes::string())), // ARRAY<ARRAY<STRING>>
+                                                // TODO: Add support for MAP type
+                                                // TODO: Add support for ROW type
         ]);
 
         // Exact values from Java's IndexedRowTest.genRecordForAllTypes()
@@ -296,6 +395,26 @@ mod tests {
             Datum::TimestampNtz(crate::row::datum::TimestampNtz::new(1698235273182)), // TIMESTAMP(5)
             Datum::TimestampLtz(crate::row::datum::TimestampLtz::new(1698235273182)), // TIMESTAMP_LTZ(1)
             Datum::TimestampLtz(crate::row::datum::TimestampLtz::new(1698235273182)), // TIMESTAMP_LTZ(5)
+            Datum::Array(build_nullable_int_array(&[
+                Some(1),
+                Some(2),
+                Some(3),
+                Some(4),
+                Some(5),
+                Some(-11),
+                None,
+                Some(444),
+                Some(102234),
+            ])), // ARRAY<INT>: GenericArray.of(1, 2, 3, 4, 5, -11, null, 444, 102234)
+            Datum::Array(build_float_array(&[
+                0.1_f32,
+                1.1_f32,
+                -0.5_f32,
+                6.6_f32,
+                f32::MAX,
+                f32::from_bits(1),
+            ])), // ARRAY<FLOAT NOT NULL>: GenericArray.of(0.1f, 1.1f, -0.5f, 6.6f, MAX, MIN)
+            Datum::Array(build_nested_string_array()), // ARRAY<ARRAY<STRING>>
         ]);
 
         // Expected bytes from Java's encoded_key.hex reference file
@@ -339,6 +458,25 @@ mod tests {
             0xDE, 0x9F, 0xD7, 0xB5, 0xB6, 0x31,
             // TIMESTAMP_LTZ(5): 1698235273182
             0xDE, 0x9F, 0xD7, 0xB5, 0xB6, 0x31, 0x00,
+            // ARRAY<INT>: GenericArray.of(1, 2, 3, 4, 5, -11, null, 444, 102234)
+            0x30, 0x09, 0x00, 0x00, 0x00, 0x40, 0x00, 0x00, 0x00, 0x01, 0x00, 0x00,
+            0x00, 0x02, 0x00, 0x00, 0x00, 0x03, 0x00, 0x00, 0x00, 0x04, 0x00, 0x00,
+            0x00, 0x05, 0x00, 0x00, 0x00, 0xF5, 0xFF, 0xFF, 0xFF, 0x00, 0x00, 0x00,
+            0x00, 0xBC, 0x01, 0x00, 0x00, 0x5A, 0x8F, 0x01, 0x00, 0x00, 0x00, 0x00,
+            0x00,
+            // ARRAY<FLOAT NOT NULL>: GenericArray.of(0.1f, 1.1f, -0.5f, 6.6f, Float.MAX_VALUE, Float.MIN_VALUE)
+            0x20, 0x06, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xCD, 0xCC, 0xCC,
+            0x3D, 0xCD, 0xCC, 0x8C, 0x3F, 0x00, 0x00, 0x00, 0xBF, 0x33, 0x33, 0xD3,
+            0x40, 0xFF, 0xFF, 0x7F, 0x7F, 0x01, 0x00, 0x00, 0x00,
+            // ARRAY<ARRAY<STRING>>
+            0x58, 0x03, 0x00, 0x00, 0x00, 0x02, 0x00, 0x00, 0x00, 0x20, 0x00, 0x00,
+            0x00, 0x20, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
+            0x00, 0x18, 0x00, 0x00, 0x00, 0x40, 0x00, 0x00, 0x00, 0x03, 0x00, 0x00,
+            0x00, 0x02, 0x00, 0x00, 0x00, 0x61, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
+            0x81, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x63, 0x00, 0x00,
+            0x00, 0x00, 0x00, 0x00, 0x81, 0x02, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
+            0x00, 0x68, 0x65, 0x6C, 0x6C, 0x6F, 0x00, 0x00, 0x85, 0x77, 0x6F, 0x72,
+            0x6C, 0x64, 0x00, 0x00, 0x85,
         ];
 
         let mut encoder = for_test_row_type(&row_type);
diff --git a/fluss-rust/crates/fluss/src/row/field_getter.rs b/fluss-rust/crates/fluss/src/row/field_getter.rs
index d6b9fc94d7..69e08602c3 100644
--- a/fluss-rust/crates/fluss/src/row/field_getter.rs
+++ b/fluss-rust/crates/fluss/src/row/field_getter.rs
@@ -82,6 +82,8 @@ impl FieldGetter {
                 pos,
                 precision: t.precision(),
             },
+            // TODO: add Map and Row variants when get_map/get_row are available in InternalRow.
+            DataType::Array(_) => InnerFieldGetter::Array { pos },
             _ => unimplemented!("DataType {:?} is currently unimplemented", data_type),
         };
 
@@ -149,6 +151,9 @@ pub enum InnerFieldGetter {
         pos: usize,
         precision: u32,
     },
+    Array {
+        pos: usize,
+    },
 }
 
 impl InnerFieldGetter {
@@ -177,7 +182,9 @@ impl InnerFieldGetter {
             }
             InnerFieldGetter::TimestampLtz { pos, precision } => {
                 Datum::TimestampLtz(row.get_timestamp_ltz(*pos, *precision)?)
-            } //TODO Array, Map, Row
+            }
+            // TODO: add Map and Row field getter support once their binary forms are implemented.
+            InnerFieldGetter::Array { pos } => Datum::Array(row.get_array(*pos)?),
         })
     }
 
@@ -198,7 +205,51 @@ impl InnerFieldGetter {
             | Self::Date { pos }
             | Self::Time { pos }
             | Self::Timestamp { pos, .. }
-            | Self::TimestampLtz { pos, .. } => *pos,
+            | Self::TimestampLtz { pos, .. }
+            | Self::Array { pos } => *pos,
         }
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::DataTypes;
+    use crate::row::GenericRow;
+    use crate::row::binary_array::FlussArrayWriter;
+
+    #[test]
+    fn test_field_getter_array() {
+        let elem_type = DataTypes::int();
+        let mut arr_writer = FlussArrayWriter::new(2, &elem_type);
+        arr_writer.write_int(0, 10);
+        arr_writer.write_int(1, 20);
+        let arr = arr_writer.complete().unwrap();
+
+        let mut row = GenericRow::new(2);
+        row.set_field(0, Datum::Int32(42));
+        row.set_field(1, Datum::Array(arr.clone()));
+
+        let getter = FieldGetter::create(&DataTypes::array(DataTypes::int()), 1);
+        let datum = getter.get_field(&row).unwrap();
+
+        match datum {
+            Datum::Array(a) => {
+                assert_eq!(a.size(), 2);
+                assert_eq!(a.get_int(0).unwrap(), 10);
+                assert_eq!(a.get_int(1).unwrap(), 20);
+            }
+            _ => panic!("Expected Array datum"),
+        }
+    }
+
+    #[test]
+    fn test_field_getter_nullable_array() {
+        let row = GenericRow::from_data(vec![Datum::Null]);
+
+        let data_type = DataTypes::array(DataTypes::int());
+        let getter = FieldGetter::create(&data_type, 0);
+        let datum = getter.get_field(&row).unwrap();
+        assert!(datum.is_null());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index ef99ba297a..359a9a5885 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -15,6 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
+pub mod binary_array;
 mod column;
 
 pub(crate) mod datum;
@@ -28,6 +29,7 @@ pub mod field_getter;
 mod row_decoder;
 
 use crate::client::WriteFormat;
+pub use binary_array::FlussArray;
 use bytes::Bytes;
 pub use column::*;
 pub use compacted::CompactedRow;
@@ -119,6 +121,9 @@ pub trait InternalRow: Send + Sync {
     /// Returns the binary value at the given position
     fn get_bytes(&self, pos: usize) -> Result<&[u8]>;
 
+    /// Returns the array value at the given position
+    fn get_array(&self, pos: usize) -> Result<FlussArray>;
+
     /// Returns encoded bytes if already encoded
     fn as_encoded_bytes(&self, _write_format: WriteFormat) -> Option<&[u8]> {
         None
@@ -274,6 +279,15 @@ impl<'a> InternalRow for GenericRow<'a> {
             }),
         }
     }
+
+    fn get_array(&self, pos: usize) -> Result<FlussArray> {
+        match self.get_value(pos)? {
+            Datum::Array(a) => Ok(a.clone()),
+            other => Err(IllegalArgument {
+                message: format!("type mismatch at position {pos}: expected Array, got {other:?}"),
+            }),
+        }
+    }
 }
 
 impl<'a> GenericRow<'a> {
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index a4befa5e3c..15a62c1ce1 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -407,6 +407,19 @@ Implements the `InternalRow` trait (see below).
 | `fn get_bytes(&self, idx: usize) -> Result<&[u8]>`                                     | Get bytes value                         |
 | `fn get_binary(&self, idx: usize, length: usize) -> Result<&[u8]>`                     | Get fixed-length binary value           |
 | `fn get_char(&self, idx: usize, length: usize) -> Result<&str>`                        | Get fixed-length char value             |
+| `fn get_array(&self, idx: usize) -> Result<FlussArray>`                                | Get array value                         |
+
+## `FlussArray`
+
+`FlussArray` is the Rust row representation for `ARRAY` values. You usually obtain it from `InternalRow::get_array()`.
+
+| Method | Description |
+|--------|-------------|
+| `fn size(&self) -> usize` | Number of elements in the array |
+| `fn is_null_at(&self, pos: usize) -> bool` | Check whether an element is null |
+| `fn as_bytes(&self) -> &[u8]` | Get encoded bytes of the array |
+
+Element getters mirror `InternalRow` typed getters and return `Result<T>`. For example, use `get_int()`, `get_long()`, and `get_double()` for primitive elements, and `get_string()`, `get_binary()`, `get_decimal()`, `get_timestamp_ntz()`, `get_timestamp_ltz()`, and `get_array()` for variable-length or nested elements.
 
 ## `ChangeType`
 
diff --git a/fluss-rust/website/docs/user-guide/rust/data-types.md b/fluss-rust/website/docs/user-guide/rust/data-types.md
index 143fe3457e..63b7fa6239 100644
--- a/fluss-rust/website/docs/user-guide/rust/data-types.md
+++ b/fluss-rust/website/docs/user-guide/rust/data-types.md
@@ -21,6 +21,7 @@ sidebar_position: 3
 | `TIMESTAMP_LTZ` | `TimestampLtz` | `get_timestamp_ltz(idx, precision)`  | `set_field(idx, TimestampLtz)` |
 | `BYTES`         | `&[u8]`        | `get_bytes()`                        | `set_field(idx, &[u8])`        |
 | `BINARY(n)`     | `&[u8]`        | `get_binary(idx, length)`            | `set_field(idx, &[u8])`        |
+| `ARRAY<T>`      | `FlussArray`   | `get_array()`                        | `set_field(idx, FlussArray)`   |
 
 ## Constructing Special Types
 
@@ -59,6 +60,29 @@ let data: Vec<Datum> = vec![1i32.into(), "hello".into(), Datum::Null];
 let row = GenericRow::from_data(data);
 ```
 
+## Arrays
+
+Use `DataTypes::array(element_type)` in schema definitions. At runtime, read arrays with `row.get_array(idx)?`.
+
+To construct array values for writes, build a `FlussArray` and wrap it with `Datum::Array`:
+
+```rust
+use fluss::metadata::DataTypes;
+use fluss::row::binary_array::FlussArrayWriter;
+use fluss::row::{Datum, GenericRow};
+
+let mut writer = FlussArrayWriter::new(3, &DataTypes::int());
+writer.write_int(0, 10);
+writer.write_int(1, 20);
+writer.set_null_at(2);
+let arr = writer.complete()?;
+
+let mut row = GenericRow::new(1);
+row.set_field(0, Datum::Array(arr));
+```
+
+`ARRAY` is supported for row values and nested row fields. For key encoding, the Rust client matches the Java client: the compacted key encoder can encode `ARRAY` columns, while table-level key constraints are validated by the server (which may reject unsupported key types).
+
 ## Reading Row Data
 
 ```rust

From f297f2c7e1c3c69ff53f24fb7a49c5c296c0e50b Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 28 Mar 2026 20:42:02 +0000
Subject: [PATCH 214/287] [BUG] Fix possible TOCTOU race between leader
 discovery and server lookup in Lookuper (#451)

---
 fluss-rust/crates/fluss/src/client/table/lookup.rs | 11 +----------
 1 file changed, 1 insertion(+), 10 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index 3d643ed332..aa29ea693e 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -292,7 +292,6 @@ impl Lookuper {
         let table_bucket = TableBucket::new_with_partition(table_id, partition_id, bucket_id);
 
         // Find the leader for this bucket
-        let cluster = self.metadata.get_cluster();
         let leader = self
             .metadata
             .leader_for(self.table_path.as_ref(), &table_bucket)
@@ -303,15 +302,7 @@ impl Lookuper {
                 ))
             })?;
 
-        // Get connection to the tablet server
-        let tablet_server = cluster.get_tablet_server(leader.id()).ok_or_else(|| {
-            Error::leader_not_available(format!(
-                "Tablet server {} is not found in metadata cache",
-                leader.id()
-            ))
-        })?;
-
-        let connection = self.rpc_client.get_connection(tablet_server).await?;
+        let connection = self.rpc_client.get_connection(&leader).await?;
 
         // Send lookup request
         let request = LookupRequest::new(table_id, partition_id, bucket_id, vec![pk_bytes_vec]);

From da7b026d680bc0bcb2cce3a4cb01d3b30f9b7eb2 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 30 Mar 2026 22:49:58 +0100
Subject: [PATCH 215/287] [TASK-470] Optimize null append in Arrow builder
 (#471)

---
 fluss-rust/crates/fluss/src/row/datum.rs | 116 +++++++++++++----------
 1 file changed, 68 insertions(+), 48 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 2f1d1839fc..78dc54982c 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -540,11 +540,7 @@ fn append_fluss_array_to_list_builder(
 
     for i in 0..arr.size() {
         if arr.is_null_at(i) {
-            // TODO: Datum::Null triggers a chain of downcast attempts in append_to.
-            // For sparse arrays with many nulls, call append_null directly on the
-            // typed inner builder to avoid the overhead.
-            let null_datum = Datum::Null;
-            null_datum.append_to(values_builder, &element_arrow_type)?;
+            append_null_for_type(values_builder, &element_arrow_type)?;
         } else {
             let datum = read_datum_from_fluss_array(arr, i, &element_fluss_type)?;
             datum.append_to(values_builder, &element_arrow_type)?;
@@ -595,21 +591,78 @@ fn read_datum_from_fluss_array<'a>(
     })
 }
 
+fn append_null_for_type(
+    builder: &mut dyn ArrayBuilder,
+    data_type: &arrow_schema::DataType,
+) -> Result<()> {
+    macro_rules! downcast_null {
+        ($builder_type:ty) => {{
+            let b = builder
+                .as_any_mut()
+                .downcast_mut::<$builder_type>()
+                .ok_or_else(|| RowConvertError {
+                    message: format!(
+                        "Builder type mismatch: expected {} for {data_type:?}",
+                        stringify!($builder_type),
+                    ),
+                })?;
+            b.append_null();
+            Ok(())
+        }};
+    }
+
+    match data_type {
+        arrow_schema::DataType::Boolean => downcast_null!(BooleanBuilder),
+        arrow_schema::DataType::Int8 => downcast_null!(Int8Builder),
+        arrow_schema::DataType::Int16 => downcast_null!(Int16Builder),
+        arrow_schema::DataType::Int32 => downcast_null!(Int32Builder),
+        arrow_schema::DataType::Int64 => downcast_null!(Int64Builder),
+        arrow_schema::DataType::Float32 => downcast_null!(Float32Builder),
+        arrow_schema::DataType::Float64 => downcast_null!(Float64Builder),
+        arrow_schema::DataType::Utf8 => downcast_null!(StringBuilder),
+        arrow_schema::DataType::Binary => downcast_null!(BinaryBuilder),
+        arrow_schema::DataType::FixedSizeBinary(_) => downcast_null!(FixedSizeBinaryBuilder),
+        arrow_schema::DataType::Decimal128(_, _) => downcast_null!(Decimal128Builder),
+        arrow_schema::DataType::Date32 => downcast_null!(Date32Builder),
+        arrow_schema::DataType::Time32(arrow_schema::TimeUnit::Second) => {
+            downcast_null!(Time32SecondBuilder)
+        }
+        arrow_schema::DataType::Time32(arrow_schema::TimeUnit::Millisecond) => {
+            downcast_null!(Time32MillisecondBuilder)
+        }
+        arrow_schema::DataType::Time64(arrow_schema::TimeUnit::Microsecond) => {
+            downcast_null!(Time64MicrosecondBuilder)
+        }
+        arrow_schema::DataType::Time64(arrow_schema::TimeUnit::Nanosecond) => {
+            downcast_null!(Time64NanosecondBuilder)
+        }
+        arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Second, _) => {
+            downcast_null!(TimestampSecondBuilder)
+        }
+        arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Millisecond, _) => {
+            downcast_null!(TimestampMillisecondBuilder)
+        }
+        arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Microsecond, _) => {
+            downcast_null!(TimestampMicrosecondBuilder)
+        }
+        arrow_schema::DataType::Timestamp(arrow_schema::TimeUnit::Nanosecond, _) => {
+            downcast_null!(TimestampNanosecondBuilder)
+        }
+        arrow_schema::DataType::List(_) => {
+            downcast_null!(ListBuilder<Box<dyn ArrayBuilder>>)
+        }
+        _ => Err(RowConvertError {
+            message: format!("Unsupported Arrow data type for null append: {data_type:?}"),
+        }),
+    }
+}
+
 impl Datum<'_> {
     pub fn append_to(
         &self,
         builder: &mut dyn ArrayBuilder,
         data_type: &arrow_schema::DataType,
     ) -> Result<()> {
-        macro_rules! append_null_to_arrow {
-            ($builder_type:ty) => {
-                if let Some(b) = builder.as_any_mut().downcast_mut::<$builder_type>() {
-                    b.append_null();
-                    return Ok(());
-                }
-            };
-        }
-
         macro_rules! append_value_to_arrow {
             ($builder_type:ty, $value:expr) => {
                 if let Some(b) = builder.as_any_mut().downcast_mut::<$builder_type>() {
@@ -620,40 +673,7 @@ impl Datum<'_> {
         }
 
         match self {
-            Datum::Null => {
-                append_null_to_arrow!(Int8Builder);
-                append_null_to_arrow!(BooleanBuilder);
-                append_null_to_arrow!(Int16Builder);
-                append_null_to_arrow!(Int32Builder);
-                append_null_to_arrow!(Int64Builder);
-                append_null_to_arrow!(Float32Builder);
-                append_null_to_arrow!(Float64Builder);
-                append_null_to_arrow!(StringBuilder);
-                append_null_to_arrow!(BinaryBuilder);
-                append_null_to_arrow!(FixedSizeBinaryBuilder);
-                append_null_to_arrow!(Decimal128Builder);
-                append_null_to_arrow!(Date32Builder);
-                append_null_to_arrow!(Time32SecondBuilder);
-                append_null_to_arrow!(Time32MillisecondBuilder);
-                append_null_to_arrow!(Time64MicrosecondBuilder);
-                append_null_to_arrow!(Time64NanosecondBuilder);
-                append_null_to_arrow!(TimestampSecondBuilder);
-                append_null_to_arrow!(TimestampMillisecondBuilder);
-                append_null_to_arrow!(TimestampMicrosecondBuilder);
-                append_null_to_arrow!(TimestampNanosecondBuilder);
-                if let arrow_schema::DataType::List(_) = data_type {
-                    let b = builder
-                        .as_any_mut()
-                        .downcast_mut::<ListBuilder<Box<dyn ArrayBuilder>>>()
-                        .ok_or_else(|| RowConvertError {
-                            message:
-                                "Expected ListBuilder<Box<dyn ArrayBuilder>> for List Arrow type"
-                                    .to_string(),
-                        })?;
-                    b.append_null();
-                    return Ok(());
-                }
-            }
+            Datum::Null => return append_null_for_type(builder, data_type),
             Datum::Bool(v) => append_value_to_arrow!(BooleanBuilder, *v),
             Datum::Int8(v) => append_value_to_arrow!(Int8Builder, *v),
             Datum::Int16(v) => append_value_to_arrow!(Int16Builder, *v),

From b2f7326191a389d9fabaf500a201f61c60f7c206 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Wed, 1 Apr 2026 22:17:21 +0100
Subject: [PATCH 216/287] chore: fix annoying python CI/CD errors due to
 unsupported action (#473)

* chore: fix annoying python CI/CD errors due to unsupported action

* cache uv deps

* cache pyproject.toml

* Use setup-uv action pinned to commit SHA instead of pip install

Replace `pip install uv` with `astral-sh/setup-uv` pinned to commit
SHA for supply chain security. Remove redundant manual uv cache step
as setup-uv handles caching natively.

---------

Co-authored-by: Keith Lee <leekei@apache.org>
---
 fluss-rust/.github/workflows/build_and_test_python.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index 39dfa98047..87787c7374 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -53,7 +53,7 @@ jobs:
           python-version: ${{ matrix.python }}
 
       - name: Install uv
-        uses: astral-sh/setup-uv@v4
+        uses: astral-sh/setup-uv@37802adc94f370d6bfd71619e3f0bf239e1f3b78
 
       - name: Install protoc
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler

From 8957671c11b96464d9ed8fba4f307a7ac8cbbecf Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Wed, 1 Apr 2026 23:21:06 +0100
Subject: [PATCH 217/287] feat: [TASK-315] Proto + RPC for LimitScan (#472)

---
 .../crates/fluss/src/proto/fluss_api.proto    | 17 ++++++
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |  4 ++
 .../fluss/src/rpc/message/limit_scan.rs       | 58 +++++++++++++++++++
 .../crates/fluss/src/rpc/message/mod.rs       |  2 +
 4 files changed, 81 insertions(+)
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/limit_scan.rs

diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index a733dd7016..8f081c2d3b 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -419,6 +419,23 @@ message AuthenticateResponse {
   optional bytes challenge = 1;
 }
 
+// limit scan request and response
+message LimitScanRequest {
+  required int64 table_id = 2;
+  optional int64 partition_id = 3;
+  required int32 bucket_id = 4;
+  required int32 limit = 5;
+}
+
+message LimitScanResponse{
+  optional int32 error_code = 1;
+  optional string error_message = 2;
+  // flag to indicate the table type
+  optional bool is_log_table = 3;
+  // LogRecordBatch if is_log_table is true, otherwise KvRecordBatch
+  optional bytes records = 4;
+}
+
 // init writer request and response
 message InitWriterRequest {
   repeated PbTablePath table_path = 1;
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index d1b3ea68aa..5e4fddfe52 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -38,6 +38,7 @@ pub enum ApiKey {
     GetFileSystemSecurityToken, // 1025
     InitWriter,                 // 1026
     GetLatestLakeSnapshot,      // 1032
+    LimitScan,                  // 1033
     GetDatabaseInfo,            // 1035
     CreatePartition,            // 1036
     DropPartition,              // 1037
@@ -67,6 +68,7 @@ impl From<i16> for ApiKey {
             1025 => ApiKey::GetFileSystemSecurityToken,
             1026 => ApiKey::InitWriter,
             1032 => ApiKey::GetLatestLakeSnapshot,
+            1033 => ApiKey::LimitScan,
             1035 => ApiKey::GetDatabaseInfo,
             1036 => ApiKey::CreatePartition,
             1037 => ApiKey::DropPartition,
@@ -99,6 +101,7 @@ impl From<ApiKey> for i16 {
             ApiKey::GetFileSystemSecurityToken => 1025,
             ApiKey::InitWriter => 1026,
             ApiKey::GetLatestLakeSnapshot => 1032,
+            ApiKey::LimitScan => 1033,
             ApiKey::GetDatabaseInfo => 1035,
             ApiKey::CreatePartition => 1036,
             ApiKey::DropPartition => 1037,
@@ -134,6 +137,7 @@ mod tests {
             (1025, ApiKey::GetFileSystemSecurityToken),
             (1026, ApiKey::InitWriter),
             (1032, ApiKey::GetLatestLakeSnapshot),
+            (1033, ApiKey::LimitScan),
             (1035, ApiKey::GetDatabaseInfo),
             (1036, ApiKey::CreatePartition),
             (1037, ApiKey::DropPartition),
diff --git a/fluss-rust/crates/fluss/src/rpc/message/limit_scan.rs b/fluss-rust/crates/fluss/src/rpc/message/limit_scan.rs
new file mode 100644
index 0000000000..d83a2e8bf4
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/limit_scan.rs
@@ -0,0 +1,58 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::LimitScanResponse;
+use crate::rpc::frame::ReadError;
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::WriteError;
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{impl_read_version_type, impl_write_version_type, proto};
+use prost::Message;
+
+use bytes::{Buf, BufMut};
+
+pub struct LimitScanRequest {
+    pub inner_request: proto::LimitScanRequest,
+}
+
+impl LimitScanRequest {
+    pub fn new(table_id: i64, partition_id: Option<i64>, bucket_id: i32, limit: i32) -> Self {
+        let request = proto::LimitScanRequest {
+            table_id,
+            partition_id,
+            bucket_id,
+            limit,
+        };
+
+        Self {
+            inner_request: request,
+        }
+    }
+}
+
+impl RequestBody for LimitScanRequest {
+    type ResponseBody = LimitScanResponse;
+
+    const API_KEY: ApiKey = ApiKey::LimitScan;
+
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(LimitScanRequest);
+impl_read_version_type!(LimitScanResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 89a8ba14f4..10808021d4 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -35,6 +35,7 @@ mod get_security_token;
 mod get_table;
 mod header;
 mod init_writer;
+mod limit_scan;
 mod list_databases;
 mod list_offsets;
 mod list_partition_infos;
@@ -61,6 +62,7 @@ pub use get_security_token::*;
 pub use get_table::*;
 pub use header::*;
 pub use init_writer::*;
+pub use limit_scan::*;
 pub use list_databases::*;
 pub use list_offsets::*;
 pub use list_partition_infos::*;

From 0010433ee8a973b353747b59f1e10c6c7c2fd399 Mon Sep 17 00:00:00 2001
From: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 3 Apr 2026 10:17:17 +0800
Subject: [PATCH 218/287] ci: fix release rust issue

---
 fluss-rust/.github/workflows/release_rust.yml     | 13 ++-----------
 fluss-rust/website/docs/release/create-release.md |  3 +++
 2 files changed, 5 insertions(+), 11 deletions(-)

diff --git a/fluss-rust/.github/workflows/release_rust.yml b/fluss-rust/.github/workflows/release_rust.yml
index 0a567a6a22..7ff7c0b72d 100644
--- a/fluss-rust/.github/workflows/release_rust.yml
+++ b/fluss-rust/.github/workflows/release_rust.yml
@@ -19,8 +19,7 @@
 # Trigger: push tag only (e.g. v0.1.0).
 # Pre-release tags (containing '-') do not publish; release tags publish to crates.io.
 #
-# Token auth: set repo variable CARGO_USE_TOKEN_AUTH = 'true' and add secret CARGO_REGISTRY_TOKEN.
-# Trusted Publishing (OIDC): leave CARGO_USE_TOKEN_AUTH unset; token is obtained via OIDC (no secret).
+# Token auth: add secret CARGO_REGISTRY_TOKEN for crates.io publishing.
 
 name: Release Rust
 
@@ -34,7 +33,6 @@ jobs:
     runs-on: ubuntu-latest
     permissions:
       contents: read
-      id-token: write
     steps:
       - uses: actions/checkout@v4
 
@@ -46,15 +44,8 @@ jobs:
       - name: Dry run (crates/fluss)
         run: cargo publish -p fluss-rs --dry-run
 
-      - name: Get crates.io token (OIDC)
-        if: startsWith(github.ref, 'refs/tags/') && !contains(github.ref, '-') && vars.CARGO_USE_TOKEN_AUTH != 'true'
-        uses: rust-lang/crates-io-auth-action@v1
-        id: auth
-        with:
-          token-type: publish
-
       - name: Publish fluss-rs to crates.io
         if: startsWith(github.ref, 'refs/tags/') && !contains(github.ref, '-')
         run: cargo publish -p fluss-rs
         env:
-          CARGO_REGISTRY_TOKEN: "${{ vars.CARGO_USE_TOKEN_AUTH == 'true' && secrets.CARGO_REGISTRY_TOKEN || steps.auth.outputs.token }}"
+          CARGO_REGISTRY_TOKEN: ${{ secrets.CARGO_REGISTRY_TOKEN }}
diff --git a/fluss-rust/website/docs/release/create-release.md b/fluss-rust/website/docs/release/create-release.md
index ba9c8752a1..5df844325a 100644
--- a/fluss-rust/website/docs/release/create-release.md
+++ b/fluss-rust/website/docs/release/create-release.md
@@ -39,10 +39,13 @@ Anybody can propose a release (e.g. on the dev [mailing list](https://fluss.apac
 
 Before your first release, perform one-time configuration. See **[Release Manager Preparation](https://fluss.apache.org/community/how-to-release/release-manager-preparation/)** (GPG key, etc.). For fluss-rust you do **not** need Nexus/Maven; you only need GPG for signing the source archive and (optionally) git signing.
 
+For GitHub Actions publishing, configure the repository secret `CARGO_REGISTRY_TOKEN` with a crates.io API token from an account allowed to publish `fluss-rs`. The `Release Rust` workflow uses this secret directly when a release tag is pushed.
+
 **Checklist (one-time)**
 
 - [ ] GPG key set up and published to [KEYS](https://downloads.apache.org/incubator/fluss/KEYS) or Apache account
 - [ ] Git configured to use your GPG key for signing tags
+- [ ] GitHub Actions secret `CARGO_REGISTRY_TOKEN` configured for crates.io publishing
 
 ### 1. Install Rust (and optional: just)
 

From 037d0a91e046640268af71e7ff80ed0de9230d09 Mon Sep 17 00:00:00 2001
From: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 3 Apr 2026 11:02:42 +0800
Subject: [PATCH 219/287] ci: pin pypi publish action to ASF-approved SHA

---
 .../.github/workflows/release_python.yml      | 31 +++++--------------
 1 file changed, 7 insertions(+), 24 deletions(-)

diff --git a/fluss-rust/.github/workflows/release_python.yml b/fluss-rust/.github/workflows/release_python.yml
index 7e5794693f..d61213e506 100644
--- a/fluss-rust/.github/workflows/release_python.yml
+++ b/fluss-rust/.github/workflows/release_python.yml
@@ -19,8 +19,7 @@
 # Trigger: push tag only (e.g. v0.1.0).
 # Pre-release tags (containing '-') publish to TestPyPI; release tags publish to PyPI.
 #
-# Token auth: set repo variable PYPI_USE_TOKEN_AUTH = 'true' and add secrets PYPI_API_TOKEN / TEST_PYPI_API_TOKEN.
-# Trusted Publishing (OIDC): leave PYPI_USE_TOKEN_AUTH unset; do not pass password so the action uses OIDC.
+# Token auth: add secrets PYPI_API_TOKEN / TEST_PYPI_API_TOKEN for publishing.
 
 name: Release Python
 
@@ -149,7 +148,6 @@ jobs:
     runs-on: ubuntu-latest
     permissions:
       contents: read
-      id-token: write
     needs: [version-check, sdist, wheels]
     if: startsWith(github.ref, 'refs/tags/')
     steps:
@@ -159,34 +157,19 @@ jobs:
           merge-multiple: true
           path: bindings/python/dist
 
-      - name: Publish to TestPyPI (token)
-        if: contains(github.ref, '-') && vars.PYPI_USE_TOKEN_AUTH == 'true'
-        uses: pypa/gh-action-pypi-publish@release/v1
+      - name: Publish to TestPyPI
+        if: contains(github.ref, '-')
+        uses: pypa/gh-action-pypi-publish@ed0c53931b1dc9bd32cbe73a98c7f6766f8a527e
         with:
           repository-url: https://test.pypi.org/legacy/
           skip-existing: true
           packages-dir: bindings/python/dist
           password: ${{ secrets.TEST_PYPI_API_TOKEN }}
 
-      - name: Publish to TestPyPI (Trusted Publishing)
-        if: contains(github.ref, '-') && vars.PYPI_USE_TOKEN_AUTH != 'true'
-        uses: pypa/gh-action-pypi-publish@release/v1
-        with:
-          repository-url: https://test.pypi.org/legacy/
-          skip-existing: true
-          packages-dir: bindings/python/dist
-
-      - name: Publish to PyPI (token)
-        if: ${{ !contains(github.ref, '-') && vars.PYPI_USE_TOKEN_AUTH == 'true' }}
-        uses: pypa/gh-action-pypi-publish@release/v1
+      - name: Publish to PyPI
+        if: ${{ !contains(github.ref, '-') }}
+        uses: pypa/gh-action-pypi-publish@ed0c53931b1dc9bd32cbe73a98c7f6766f8a527e
         with:
           skip-existing: true
           packages-dir: bindings/python/dist
           password: ${{ secrets.PYPI_API_TOKEN }}
-
-      - name: Publish to PyPI (Trusted Publishing)
-        if: ${{ !contains(github.ref, '-') && vars.PYPI_USE_TOKEN_AUTH != 'true' }}
-        uses: pypa/gh-action-pypi-publish@release/v1
-        with:
-          skip-existing: true
-          packages-dir: bindings/python/dist

From 4de077845d8fba2b207ad4533a79c48f8d23e9b4 Mon Sep 17 00:00:00 2001
From: luoyuxia <luoyuxia@alumni.sjtu.edu.cn>
Date: Fri, 3 Apr 2026 12:10:13 +0800
Subject: [PATCH 220/287] ci: improve read me for python

---
 fluss-rust/bindings/python/PYPI_README.md | 2 +-
 fluss-rust/bindings/python/pyproject.toml | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/bindings/python/PYPI_README.md b/fluss-rust/bindings/python/PYPI_README.md
index ee9796a46c..2e538f5ca7 100644
--- a/fluss-rust/bindings/python/PYPI_README.md
+++ b/fluss-rust/bindings/python/PYPI_README.md
@@ -21,7 +21,7 @@
 PyFluss is a Python library for programmatic access to Apache Fluss (Incubating).
 It provides Python APIs to work with Fluss table metadata and read or write table data.
 
-The documentation is available at <https://clients.fluss.apache.org/>.
+The documentation is available at <https://clients.fluss.apache.org/user-guide/python/installation/>.
 
 ## Get in Touch
 
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index ce4c436381..b81aad0751 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -42,7 +42,7 @@ dependencies = [
 ]
 
 [project.urls]
-Homepage = "https://clients.fluss.apache.org/user-guide/rust/installation/"
+Homepage = "https://clients.fluss.apache.org/user-guide/python/installation/"
 Repository = "https://github.com/apache/fluss-rust"
 
 [project.optional-dependencies]

From 7e122e49c12ef04cabf726dd25f9c7124136718c Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sun, 5 Apr 2026 21:13:44 +0200
Subject: [PATCH 221/287] feat(iceberg): add IcebergBinaryRowWriter (#366)

* feat(iceberg): add IcebergBinaryRowWriter

* feat(iceberg): add IcebergBinaryRowWriter

* explicit panicking and align with Java for micros conversions

* address the reviews

* rebase and align with the current Java-side behaviour

* address comments
---
 .../row/binary/iceberg_binary_row_writer.rs   | 555 ++++++++++++++++++
 fluss-rust/crates/fluss/src/row/binary/mod.rs |   2 +
 2 files changed, 557 insertions(+)
 create mode 100644 fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs

diff --git a/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs b/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
new file mode 100644
index 0000000000..c87ae10fec
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
@@ -0,0 +1,555 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use bytes::{Bytes, BytesMut};
+
+use crate::error::{Error, Result};
+use crate::metadata::DataType;
+use crate::row::Decimal;
+use crate::row::binary::{BinaryWriter, ValueWriter};
+
+const MICROS_PER_MILLI: i64 = 1_000;
+
+/// Iceberg-specific binary writer for encoding key columns.
+///
+/// Unlike [`CompactedRowWriter`] which uses varint encoding and length-prefixed
+/// variable-length fields, this writer follows Iceberg's encoding conventions:
+/// - Integers (int, date) are written as i64 (8 bytes, little-endian)
+/// - Time values are converted from milliseconds to microseconds
+/// - Timestamps are converted to microseconds
+/// - Floats/doubles use fixed-width little-endian encoding
+/// - Variable-length types (string, binary) are written without length prefixes
+/// - Decimals are written as unscaled big-endian bytes without length prefixes
+///
+/// The encoded bytes feed directly into [`IcebergBucketingFunction`]'s MurmurHash
+/// for bucket assignment and must match the Java Fluss server's encoding exactly.
+///
+/// [`CompactedRowWriter`]: crate::row::compacted::CompactedRowWriter
+/// [`IcebergBucketingFunction`]: crate::bucketing::IcebergBucketingFunction
+pub struct IcebergBinaryRowWriter {
+    position: usize,
+    buffer: BytesMut,
+}
+
+impl Default for IcebergBinaryRowWriter {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+impl IcebergBinaryRowWriter {
+    pub fn new() -> Self {
+        let buffer = BytesMut::zeroed(64);
+        Self {
+            position: 0,
+            buffer,
+        }
+    }
+
+    // Dependency order note:
+    // 1) Keep this PR scoped to writer-level Java parity.
+    // 2) Wire the writer through IcebergKeyEncoder in follow-up #308.
+    // TODO(#308): add end-to-end key-encoding tests via IcebergKeyEncoder
+    // (similar to CompactedKeyEncoder tests for CompactedKeyWriter).
+    pub fn create_value_writer(field_type: &DataType) -> Result<ValueWriter> {
+        match field_type {
+            // Match Java IcebergBinaryRowWriter.createFieldWriter() supported types exactly.
+            DataType::Int(_)
+            | DataType::Date(_)
+            | DataType::Time(_)
+            | DataType::BigInt(_)
+            | DataType::Float(_)
+            | DataType::Double(_)
+            | DataType::Timestamp(_)
+            | DataType::Decimal(_)
+            | DataType::String(_)
+            | DataType::Char(_)
+            | DataType::Binary(_)
+            | DataType::Bytes(_) => ValueWriter::create_value_writer(field_type, None),
+
+            // Keep Java's explicit scalar-only rejection messaging for ARRAY/MAP.
+            DataType::Array(_) => Err(Error::UnsupportedOperation {
+                message:
+                    "Array types cannot be used as bucket keys. Bucket keys must be scalar types."
+                        .to_string(),
+            }),
+            DataType::Map(_) => Err(Error::UnsupportedOperation {
+                message:
+                    "Map types cannot be used as bucket keys. Bucket keys must be scalar types."
+                        .to_string(),
+            }),
+
+            // BOOLEAN, TINYINT, SMALLINT, TIMESTAMP_LTZ, ROW and any future types.
+            _ => Err(Error::UnsupportedOperation {
+                message: format!(
+                    "Unsupported type for Iceberg binary row writer: {:?}",
+                    field_type
+                ),
+            }),
+        }
+    }
+
+    #[allow(dead_code)]
+    pub fn position(&self) -> usize {
+        self.position
+    }
+
+    #[allow(dead_code)]
+    pub fn buffer(&self) -> &[u8] {
+        &self.buffer[..self.position]
+    }
+
+    pub fn to_bytes(&self) -> Bytes {
+        Bytes::copy_from_slice(&self.buffer[..self.position])
+    }
+
+    fn ensure_capacity(&mut self, need_len: usize) {
+        if (self.buffer.len() - self.position) < need_len {
+            let new_len = std::cmp::max(self.buffer.len() * 2, self.buffer.len() + need_len);
+            self.buffer.resize(new_len, 0);
+        }
+    }
+
+    fn write_raw(&mut self, src: &[u8]) {
+        let end = self.position + src.len();
+        self.ensure_capacity(src.len());
+        self.buffer[self.position..end].copy_from_slice(src);
+        self.position = end;
+    }
+}
+
+impl BinaryWriter for IcebergBinaryRowWriter {
+    fn reset(&mut self) {
+        if self.position > 0 {
+            self.buffer[..self.position].fill(0);
+        }
+        self.position = 0;
+    }
+
+    fn set_null_at(&mut self, _pos: usize) {
+        panic!("Iceberg key columns do not support null values");
+    }
+
+    fn write_boolean(&mut self, value: bool) {
+        self.write_raw(&[if value { 1u8 } else { 0u8 }]);
+    }
+
+    fn write_byte(&mut self, value: u8) {
+        self.write_raw(&[value]);
+    }
+
+    fn write_bytes(&mut self, value: &[u8]) {
+        // Iceberg: raw bytes, no length prefix
+        self.write_raw(value);
+    }
+
+    fn write_char(&mut self, value: &str, _length: usize) {
+        // Iceberg: same as string — raw UTF-8, no length prefix
+        self.write_string(value);
+    }
+
+    fn write_string(&mut self, value: &str) {
+        // Iceberg: raw UTF-8 bytes, no length prefix
+        self.write_raw(value.as_bytes());
+    }
+
+    fn write_short(&mut self, value: i16) {
+        self.write_raw(&value.to_le_bytes());
+    }
+
+    fn write_int(&mut self, value: i32) {
+        // Iceberg: promote i32 to i64, write as 8 bytes little-endian
+        self.write_raw(&(value as i64).to_le_bytes());
+    }
+
+    fn write_long(&mut self, value: i64) {
+        self.write_raw(&value.to_le_bytes());
+    }
+
+    fn write_float(&mut self, value: f32) {
+        self.write_raw(&value.to_le_bytes());
+    }
+
+    fn write_double(&mut self, value: f64) {
+        self.write_raw(&value.to_le_bytes());
+    }
+
+    fn write_binary(&mut self, bytes: &[u8], length: usize) {
+        // Iceberg: raw bytes, no length prefix
+        self.write_raw(&bytes[..length.min(bytes.len())]);
+    }
+
+    fn write_decimal(&mut self, value: &Decimal, _precision: u32) {
+        // Iceberg: unscaled big-endian bytes, no length prefix
+        let unscaled_bytes = value.to_unscaled_bytes();
+        self.write_raw(&unscaled_bytes);
+    }
+
+    fn write_time(&mut self, value: i32, _precision: u32) {
+        // NOTE: wrapping arithmetic matches Java, where long arithmetic wraps on overflow.
+        let micros = (value as i64).wrapping_mul(MICROS_PER_MILLI);
+        self.write_raw(&micros.to_le_bytes());
+    }
+
+    fn write_timestamp_ntz(&mut self, value: &crate::row::datum::TimestampNtz, _precision: u32) {
+        // NOTE: wrapping arithmetic matches Java, where long arithmetic wraps on overflow.
+        let millis = value.get_millisecond();
+        let nanos = value.get_nano_of_millisecond();
+        let micros = millis
+            .wrapping_mul(MICROS_PER_MILLI)
+            .wrapping_add((nanos as i64) / MICROS_PER_MILLI);
+        self.write_raw(&micros.to_le_bytes());
+    }
+
+    fn write_timestamp_ltz(&mut self, value: &crate::row::datum::TimestampLtz, _precision: u32) {
+        // NOTE: wrapping arithmetic matches Java, where long arithmetic wraps on overflow.
+        let millis = value.get_epoch_millisecond();
+        let nanos = value.get_nano_of_millisecond();
+        let micros = millis
+            .wrapping_mul(MICROS_PER_MILLI)
+            .wrapping_add((nanos as i64) / MICROS_PER_MILLI);
+        self.write_raw(&micros.to_le_bytes());
+    }
+
+    fn complete(&mut self) {
+        // No finalization needed for Iceberg key encoding
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{DataTypes, SmallIntType, TinyIntType};
+    use crate::row::datum::{TimestampLtz, TimestampNtz};
+    use bigdecimal::{BigDecimal, num_bigint::BigInt};
+
+    fn assert_unsupported_type(dt: DataType, expected_fragment: &str) {
+        match IcebergBinaryRowWriter::create_value_writer(&dt) {
+            Err(e) => assert!(
+                e.to_string().contains(expected_fragment),
+                "unexpected error for {dt:?}: {e}"
+            ),
+            Ok(_) => panic!("expected error for unsupported type {dt:?}, got Ok"),
+        }
+    }
+
+    #[test]
+    fn test_write_int_as_i64_le() {
+        let mut w = IcebergBinaryRowWriter::new();
+        w.write_int(42);
+        assert_eq!(w.buffer(), &42i64.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_int_negative() {
+        let mut w = IcebergBinaryRowWriter::new();
+        w.write_int(-1);
+        assert_eq!(w.buffer(), &(-1i64).to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_long() {
+        let mut w = IcebergBinaryRowWriter::new();
+        w.write_long(123456789012345i64);
+        assert_eq!(w.buffer(), &123456789012345i64.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_float() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let val = 1.23f32;
+        w.write_float(val);
+        assert_eq!(w.buffer(), &val.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_double() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let val = 9.876543210f64;
+        w.write_double(val);
+        assert_eq!(w.buffer(), &val.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_string_no_length_prefix() {
+        let mut w = IcebergBinaryRowWriter::new();
+        w.write_string("hello");
+        assert_eq!(w.buffer(), b"hello");
+    }
+
+    #[test]
+    fn test_write_bytes_no_length_prefix() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let data = &[0xDE, 0xAD, 0xBE, 0xEF];
+        w.write_bytes(data);
+        assert_eq!(w.buffer(), data);
+    }
+
+    #[test]
+    fn test_write_binary_no_length_prefix() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let data = &[1, 2, 3, 4, 5];
+        w.write_binary(data, 3);
+        assert_eq!(w.buffer(), &[1, 2, 3]);
+    }
+
+    #[test]
+    fn test_write_time_millis_to_micros() {
+        let mut w = IcebergBinaryRowWriter::new();
+        // 1000 ms = 1_000_000 µs
+        w.write_time(1000, 0);
+        assert_eq!(w.buffer(), &1_000_000i64.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_timestamp_ntz_compact() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let ts = TimestampNtz::new(1672531200000); // 2023-01-01 00:00:00 UTC
+        w.write_timestamp_ntz(&ts, 3);
+        let expected_micros = 1672531200000i64 * 1000;
+        assert_eq!(w.buffer(), &expected_micros.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_timestamp_ntz_with_nanos() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let ts = TimestampNtz::from_millis_nanos(1000, 500_000).unwrap();
+        w.write_timestamp_ntz(&ts, 6);
+        // 1000ms * 1000 + 500_000ns / 1000 = 1_000_000 + 500 = 1_000_500 µs
+        assert_eq!(w.buffer(), &1_000_500i64.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_timestamp_ltz() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let ts = TimestampLtz::from_millis_nanos(2000, 300_000).unwrap();
+        w.write_timestamp_ltz(&ts, 6);
+        // 2000ms * 1000 + 300_000ns / 1000 = 2_000_000 + 300 = 2_000_300 µs
+        assert_eq!(w.buffer(), &2_000_300i64.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_timestamp_ntz_overflow_wraps_like_java() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let ts = TimestampNtz::from_millis_nanos(i64::MAX, 999_999).unwrap();
+        w.write_timestamp_ntz(&ts, 9);
+
+        let expected = i64::MAX.wrapping_mul(MICROS_PER_MILLI).wrapping_add(999);
+        assert_eq!(w.buffer(), &expected.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_timestamp_ltz_overflow_wraps_like_java() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let ts = TimestampLtz::from_millis_nanos(i64::MIN, 999_999).unwrap();
+        w.write_timestamp_ltz(&ts, 9);
+
+        let expected = i64::MIN.wrapping_mul(MICROS_PER_MILLI).wrapping_add(999);
+        assert_eq!(w.buffer(), &expected.to_le_bytes());
+    }
+
+    #[test]
+    fn test_write_decimal_compact() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let bd = BigDecimal::new(BigInt::from(12345), 2); // 123.45
+        let decimal = Decimal::from_big_decimal(bd, 10, 2).unwrap();
+        w.write_decimal(&decimal, 10);
+
+        let expected = BigInt::from(12345).to_signed_bytes_be();
+        assert_eq!(w.buffer(), expected.as_slice());
+    }
+
+    #[test]
+    fn test_write_decimal_non_compact() {
+        let mut w = IcebergBinaryRowWriter::new();
+        let bd = BigDecimal::new(BigInt::from(12345), 0);
+        let decimal = Decimal::from_big_decimal(bd, 28, 0).unwrap();
+        w.write_decimal(&decimal, 28);
+
+        let expected = BigInt::from(12345).to_signed_bytes_be();
+        assert_eq!(w.buffer(), expected.as_slice());
+    }
+
+    #[test]
+    fn test_write_boolean() {
+        let mut w = IcebergBinaryRowWriter::new();
+        w.write_boolean(true);
+        assert_eq!(w.buffer(), &[1u8]);
+
+        w.reset();
+        w.write_boolean(false);
+        assert_eq!(w.buffer(), &[0u8]);
+    }
+
+    #[test]
+    #[should_panic(expected = "Iceberg key columns do not support null values")]
+    fn test_set_null_panics() {
+        let mut w = IcebergBinaryRowWriter::new();
+        w.set_null_at(0);
+    }
+
+    #[test]
+    fn test_reset_clears_position() {
+        let mut w = IcebergBinaryRowWriter::new();
+        w.write_int(42);
+        assert_eq!(w.position(), 8);
+        w.reset();
+        assert_eq!(w.position(), 0);
+        assert_eq!(w.buffer().len(), 0);
+    }
+
+    #[test]
+    fn test_to_bytes() {
+        let mut w = IcebergBinaryRowWriter::new();
+        w.write_string("test");
+        let bytes = w.to_bytes();
+        assert_eq!(bytes.as_ref(), b"test");
+    }
+
+    #[test]
+    fn test_multiple_writes() {
+        let mut w = IcebergBinaryRowWriter::new();
+        w.write_int(1);
+        w.write_string("ab");
+        let buf = w.buffer().to_vec();
+        // 8 bytes for int-as-i64 + 2 bytes for "ab"
+        assert_eq!(buf.len(), 10);
+        assert_eq!(&buf[..8], &1i64.to_le_bytes());
+        assert_eq!(&buf[8..], b"ab");
+    }
+
+    #[test]
+    fn test_buffer_growth() {
+        let mut w = IcebergBinaryRowWriter::new();
+        // Write more than 64 bytes to trigger buffer growth
+        let large = vec![0xAAu8; 128];
+        w.write_bytes(&large);
+        assert_eq!(w.buffer(), large.as_slice());
+    }
+
+    #[test]
+    fn test_create_value_writer_rejects_tinyint() {
+        let dt = DataType::TinyInt(TinyIntType::new());
+        match IcebergBinaryRowWriter::create_value_writer(&dt) {
+            Err(e) => assert!(
+                e.to_string()
+                    .contains("Unsupported type for Iceberg binary row writer"),
+                "unexpected error: {e}",
+            ),
+            Ok(_) => panic!("expected error for TinyInt, got Ok"),
+        }
+    }
+
+    #[test]
+    fn test_create_value_writer_rejects_smallint() {
+        let dt = DataType::SmallInt(SmallIntType::new());
+        match IcebergBinaryRowWriter::create_value_writer(&dt) {
+            Err(e) => assert!(
+                e.to_string()
+                    .contains("Unsupported type for Iceberg binary row writer"),
+                "unexpected error: {e}",
+            ),
+            Ok(_) => panic!("expected error for SmallInt, got Ok"),
+        }
+    }
+
+    #[test]
+    fn test_create_value_writer_rejects_boolean() {
+        assert_unsupported_type(
+            DataTypes::boolean(),
+            "Unsupported type for Iceberg binary row writer",
+        );
+    }
+
+    #[test]
+    fn test_create_value_writer_rejects_timestamp_ltz() {
+        assert_unsupported_type(
+            DataTypes::timestamp_ltz(),
+            "Unsupported type for Iceberg binary row writer",
+        );
+    }
+
+    #[test]
+    fn test_create_value_writer_rejects_array() {
+        assert_unsupported_type(
+            DataTypes::array(DataTypes::int()),
+            "Array types cannot be used as bucket keys",
+        );
+    }
+
+    #[test]
+    fn test_create_value_writer_rejects_map() {
+        assert_unsupported_type(
+            DataTypes::map(DataTypes::string(), DataTypes::int()),
+            "Map types cannot be used as bucket keys",
+        );
+    }
+
+    #[test]
+    fn test_create_value_writer_rejects_row() {
+        assert_unsupported_type(
+            DataTypes::row(vec![DataTypes::field("f0", DataTypes::int())]),
+            "Unsupported type for Iceberg binary row writer",
+        );
+    }
+
+    #[test]
+    fn test_create_value_writer_accepts_java_supported_scalar_types() {
+        let supported_types = vec![
+            ("int", DataTypes::int()),
+            ("date", DataTypes::date()),
+            ("time", DataTypes::time()),
+            ("bigint", DataTypes::bigint()),
+            ("float", DataTypes::float()),
+            ("double", DataTypes::double()),
+            ("timestamp_ntz", DataTypes::timestamp()),
+            ("decimal", DataTypes::decimal(10, 2)),
+            ("string", DataTypes::string()),
+            ("char", DataTypes::char(16)),
+            ("binary", DataTypes::binary(8)),
+            ("bytes", DataTypes::bytes()),
+        ];
+
+        for (name, data_type) in supported_types {
+            let res = IcebergBinaryRowWriter::create_value_writer(&data_type);
+            if let Err(e) = res {
+                panic!("expected {name} to be supported, got error: {e}");
+            }
+        }
+    }
+
+    #[test]
+    fn test_write_char_same_as_string() {
+        let mut w1 = IcebergBinaryRowWriter::new();
+        w1.write_char("hello", 10);
+
+        let mut w2 = IcebergBinaryRowWriter::new();
+        w2.write_string("hello");
+
+        assert_eq!(w1.buffer(), w2.buffer());
+    }
+
+    #[test]
+    fn test_write_date_as_int() {
+        // Date encoding goes through write_int (via InnerValueWriter::Date)
+        // which writes as i64 LE in Iceberg encoding
+        let mut w = IcebergBinaryRowWriter::new();
+        let days_since_epoch = 19000i32; // ~2022-01-06
+        w.write_int(days_since_epoch);
+        assert_eq!(w.buffer(), &(days_since_epoch as i64).to_le_bytes());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/binary/mod.rs b/fluss-rust/crates/fluss/src/row/binary/mod.rs
index 2a88ee1753..d6248dc515 100644
--- a/fluss-rust/crates/fluss/src/row/binary/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/mod.rs
@@ -16,8 +16,10 @@
 // under the License.
 
 mod binary_writer;
+mod iceberg_binary_row_writer;
 
 pub use binary_writer::*;
+pub use iceberg_binary_row_writer::IcebergBinaryRowWriter;
 
 /// The binary row format types, it indicates the generated row type by the [`BinaryWriter`]
 #[allow(dead_code)]

From 0f7cfc1364d325a4b4b42c112cdb8702e9efd287 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekeiabstraction@gmail.com>
Date: Sun, 5 Apr 2026 20:42:55 +0100
Subject: [PATCH 222/287] fix: add missing write_array impl to
 IcebergBinaryRowWriter (#477)

---
 .../crates/fluss/src/row/binary/iceberg_binary_row_writer.rs  | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs b/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
index c87ae10fec..b0e8434d1d 100644
--- a/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
@@ -225,6 +225,10 @@ impl BinaryWriter for IcebergBinaryRowWriter {
         self.write_raw(&micros.to_le_bytes());
     }
 
+    fn write_array(&mut self, _value: &[u8]) {
+        panic!("Iceberg key columns do not support array values");
+    }
+
     fn complete(&mut self) {
         // No finalization needed for Iceberg key encoding
     }

From 6c3c4b53968385d07b43fe3fa66f24003306a3e3 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 5 Apr 2026 22:02:14 +0100
Subject: [PATCH 223/287] chore: improve cargo cache (#478)

* chore: improve cargo cache

* use Cargo.lock

* Cargo.lock to paths-ignore licenserc.yaml
---
 .../.github/workflows/build_and_test_cpp.yml  |    2 +
 .../workflows/build_and_test_python.yml       |    2 +
 .../.github/workflows/build_and_test_rust.yml |    2 +
 fluss-rust/.gitignore                         |    1 -
 fluss-rust/.licenserc.yaml                    |    1 +
 fluss-rust/Cargo.lock                         | 4594 +++++++++++++++++
 6 files changed, 4601 insertions(+), 1 deletion(-)
 create mode 100644 fluss-rust/Cargo.lock

diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
index 1931983d4e..88a896bce3 100644
--- a/fluss-rust/.github/workflows/build_and_test_cpp.yml
+++ b/fluss-rust/.github/workflows/build_and_test_cpp.yml
@@ -63,6 +63,8 @@ jobs:
             ~/.cargo/git
             target
           key: cpp-test-${{ runner.os }}-${{ hashFiles('**/Cargo.lock') }}
+          restore-keys: |
+            cpp-test-${{ runner.os }}-
 
       - name: Build C++ bindings and tests
         working-directory: bindings/cpp
diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index 87787c7374..42b6ffad12 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -66,6 +66,8 @@ jobs:
             ~/.cargo/git
             target
           key: python-test-${{ runner.os }}-${{ matrix.python }}-${{ hashFiles('**/Cargo.lock') }}
+          restore-keys: |
+            python-test-${{ runner.os }}-${{ matrix.python }}-
 
       - name: Build Python bindings
         working-directory: bindings/python
diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
index 1bf7bc58fc..c904e300d0 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -66,6 +66,8 @@ jobs:
             ~/.cargo/git
             target
           key: rust-${{ runner.os }}-${{ hashFiles('**/Cargo.lock') }}
+          restore-keys: |
+            rust-${{ runner.os }}-
 
       - name: Build
         run: cargo build --workspace --all-targets --exclude fluss_python --exclude fluss-cpp
diff --git a/fluss-rust/.gitignore b/fluss-rust/.gitignore
index c821382293..eb3a06e6b1 100644
--- a/fluss-rust/.gitignore
+++ b/fluss-rust/.gitignore
@@ -3,7 +3,6 @@
 # will have compiled files and executables
 debug/
 target/
-Cargo.lock
 
 # These are backup files generated by rustfmt
 **/*.rs.bk
diff --git a/fluss-rust/.licenserc.yaml b/fluss-rust/.licenserc.yaml
index a5b1f76ca8..4afd5a9d20 100644
--- a/fluss-rust/.licenserc.yaml
+++ b/fluss-rust/.licenserc.yaml
@@ -22,6 +22,7 @@ header:
 
   paths-ignore:
     - '.gitignore'
+    - 'Cargo.lock'
     - 'LICENSE'
     - 'NOTICE'
     - 'DISCLAIMER'
diff --git a/fluss-rust/Cargo.lock b/fluss-rust/Cargo.lock
new file mode 100644
index 0000000000..a3b533d9cb
--- /dev/null
+++ b/fluss-rust/Cargo.lock
@@ -0,0 +1,4594 @@
+# This file is automatically @generated by Cargo.
+# It is not intended for manual editing.
+version = 4
+
+[[package]]
+name = "ahash"
+version = "0.8.12"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5a15f179cd60c4584b8a8c596927aadc462e27f2ca70c04e0071964a73ba7a75"
+dependencies = [
+ "cfg-if",
+ "const-random",
+ "getrandom 0.3.4",
+ "once_cell",
+ "version_check",
+ "zerocopy",
+]
+
+[[package]]
+name = "aho-corasick"
+version = "1.1.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ddd31a130427c27518df266943a5308ed92d4b226cc639f5a8f1002816174301"
+dependencies = [
+ "memchr",
+]
+
+[[package]]
+name = "android_system_properties"
+version = "0.1.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "819e7219dbd41043ac279b19830f2efc897156490d7fd6ea916720117ee66311"
+dependencies = [
+ "libc",
+]
+
+[[package]]
+name = "anstream"
+version = "1.0.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "824a212faf96e9acacdbd09febd34438f8f711fb84e09a8916013cd7815ca28d"
+dependencies = [
+ "anstyle",
+ "anstyle-parse",
+ "anstyle-query",
+ "anstyle-wincon",
+ "colorchoice",
+ "is_terminal_polyfill",
+ "utf8parse",
+]
+
+[[package]]
+name = "anstyle"
+version = "1.0.14"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "940b3a0ca603d1eade50a4846a2afffd5ef57a9feac2c0e2ec2e14f9ead76000"
+
+[[package]]
+name = "anstyle-parse"
+version = "1.0.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "52ce7f38b242319f7cabaa6813055467063ecdc9d355bbb4ce0c68908cd8130e"
+dependencies = [
+ "utf8parse",
+]
+
+[[package]]
+name = "anstyle-query"
+version = "1.1.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "40c48f72fd53cd289104fc64099abca73db4166ad86ea0b4341abe65af83dadc"
+dependencies = [
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "anstyle-wincon"
+version = "3.0.11"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "291e6a250ff86cd4a820112fb8898808a366d8f9f58ce16d1f538353ad55747d"
+dependencies = [
+ "anstyle",
+ "once_cell_polyfill",
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "anyhow"
+version = "1.0.102"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7f202df86484c868dbad7eaa557ef785d5c66295e41b460ef922eca0723b842c"
+
+[[package]]
+name = "arrow"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e4754a624e5ae42081f464514be454b39711daae0458906dacde5f4c632f33a8"
+dependencies = [
+ "arrow-arith",
+ "arrow-array",
+ "arrow-buffer",
+ "arrow-cast",
+ "arrow-csv",
+ "arrow-data",
+ "arrow-ipc",
+ "arrow-json",
+ "arrow-ord",
+ "arrow-row",
+ "arrow-schema",
+ "arrow-select",
+ "arrow-string",
+]
+
+[[package]]
+name = "arrow-arith"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f7b3141e0ec5145a22d8694ea8b6d6f69305971c4fa1c1a13ef0195aef2d678b"
+dependencies = [
+ "arrow-array",
+ "arrow-buffer",
+ "arrow-data",
+ "arrow-schema",
+ "chrono",
+ "num-traits",
+]
+
+[[package]]
+name = "arrow-array"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4c8955af33b25f3b175ee10af580577280b4bd01f7e823d94c7cdef7cf8c9aef"
+dependencies = [
+ "ahash",
+ "arrow-buffer",
+ "arrow-data",
+ "arrow-schema",
+ "chrono",
+ "half",
+ "hashbrown 0.16.1",
+ "num-complex",
+ "num-integer",
+ "num-traits",
+]
+
+[[package]]
+name = "arrow-buffer"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c697ddca96183182f35b3a18e50b9110b11e916d7b7799cbfd4d34662f2c56c2"
+dependencies = [
+ "bytes",
+ "half",
+ "num-bigint",
+ "num-traits",
+]
+
+[[package]]
+name = "arrow-cast"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "646bbb821e86fd57189c10b4fcdaa941deaf4181924917b0daa92735baa6ada5"
+dependencies = [
+ "arrow-array",
+ "arrow-buffer",
+ "arrow-data",
+ "arrow-ord",
+ "arrow-schema",
+ "arrow-select",
+ "atoi",
+ "base64 0.22.1",
+ "chrono",
+ "half",
+ "lexical-core",
+ "num-traits",
+ "ryu",
+]
+
+[[package]]
+name = "arrow-csv"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8da746f4180004e3ce7b83c977daf6394d768332349d3d913998b10a120b790a"
+dependencies = [
+ "arrow-array",
+ "arrow-cast",
+ "arrow-schema",
+ "chrono",
+ "csv",
+ "csv-core",
+ "regex",
+]
+
+[[package]]
+name = "arrow-data"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1fdd994a9d28e6365aa78e15da3f3950c0fdcea6b963a12fa1c391afb637b304"
+dependencies = [
+ "arrow-buffer",
+ "arrow-schema",
+ "half",
+ "num-integer",
+ "num-traits",
+]
+
+[[package]]
+name = "arrow-ipc"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "abf7df950701ab528bf7c0cf7eeadc0445d03ef5d6ffc151eaae6b38a58feff1"
+dependencies = [
+ "arrow-array",
+ "arrow-buffer",
+ "arrow-data",
+ "arrow-schema",
+ "arrow-select",
+ "flatbuffers",
+ "lz4_flex",
+ "zstd",
+]
+
+[[package]]
+name = "arrow-json"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0ff8357658bedc49792b13e2e862b80df908171275f8e6e075c460da5ee4bf86"
+dependencies = [
+ "arrow-array",
+ "arrow-buffer",
+ "arrow-cast",
+ "arrow-data",
+ "arrow-schema",
+ "chrono",
+ "half",
+ "indexmap 2.13.1",
+ "itoa",
+ "lexical-core",
+ "memchr",
+ "num-traits",
+ "ryu",
+ "serde_core",
+ "serde_json",
+ "simdutf8",
+]
+
+[[package]]
+name = "arrow-ord"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f7d8f1870e03d4cbed632959498bcc84083b5a24bded52905ae1695bd29da45b"
+dependencies = [
+ "arrow-array",
+ "arrow-buffer",
+ "arrow-data",
+ "arrow-schema",
+ "arrow-select",
+]
+
+[[package]]
+name = "arrow-pyarrow"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d18c442b4c266aaf3d7f7dd40fd7ae058cef7f113b00ff0cd8256e1e218ec544"
+dependencies = [
+ "arrow-array",
+ "arrow-data",
+ "arrow-schema",
+ "pyo3",
+]
+
+[[package]]
+name = "arrow-row"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "18228633bad92bff92a95746bbeb16e5fc318e8382b75619dec26db79e4de4c0"
+dependencies = [
+ "arrow-array",
+ "arrow-buffer",
+ "arrow-data",
+ "arrow-schema",
+ "half",
+]
+
+[[package]]
+name = "arrow-schema"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8c872d36b7bf2a6a6a2b40de9156265f0242910791db366a2c17476ba8330d68"
+dependencies = [
+ "bitflags",
+]
+
+[[package]]
+name = "arrow-select"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "68bf3e3efbd1278f770d67e5dc410257300b161b93baedb3aae836144edcaf4b"
+dependencies = [
+ "ahash",
+ "arrow-array",
+ "arrow-buffer",
+ "arrow-data",
+ "arrow-schema",
+ "num-traits",
+]
+
+[[package]]
+name = "arrow-string"
+version = "57.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "85e968097061b3c0e9fe3079cf2e703e487890700546b5b0647f60fca1b5a8d8"
+dependencies = [
+ "arrow-array",
+ "arrow-buffer",
+ "arrow-data",
+ "arrow-schema",
+ "arrow-select",
+ "memchr",
+ "num-traits",
+ "regex",
+ "regex-syntax",
+]
+
+[[package]]
+name = "astral-tokio-tar"
+version = "0.5.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ec179a06c1769b1e42e1e2cbe74c7dcdb3d6383c838454d063eaac5bbb7ebbe5"
+dependencies = [
+ "filetime",
+ "futures-core",
+ "libc",
+ "portable-atomic",
+ "rustc-hash",
+ "tokio",
+ "tokio-stream",
+ "xattr",
+]
+
+[[package]]
+name = "async-stream"
+version = "0.3.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0b5a71a6f37880a80d1d7f19efd781e4b5de42c88f0722cc13bcb6cc2cfe8476"
+dependencies = [
+ "async-stream-impl",
+ "futures-core",
+ "pin-project-lite",
+]
+
+[[package]]
+name = "async-stream-impl"
+version = "0.3.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c7c24de15d275a1ecfd47a380fb4d5ec9bfe0933f309ed5e705b775596a3574d"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "async-trait"
+version = "0.1.89"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9035ad2d096bed7955a320ee7e2230574d28fd3c3a0f186cbea1ff3c7eed5dbb"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "atoi"
+version = "2.0.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f28d99ec8bfea296261ca1af174f24225171fea9664ba9003cbebee704810528"
+dependencies = [
+ "num-traits",
+]
+
+[[package]]
+name = "atomic-waker"
+version = "1.1.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1505bd5d3d116872e7271a6d4e16d81d0c8570876c8de68093a09ac269d8aac0"
+
+[[package]]
+name = "autocfg"
+version = "1.5.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c08606f8c3cbf4ce6ec8e28fb0014a2c086708fe954eaa885384a6165172e7e8"
+
+[[package]]
+name = "axum"
+version = "0.8.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8b52af3cb4058c895d37317bb27508dccc8e5f2d39454016b297bf4a400597b8"
+dependencies = [
+ "axum-core",
+ "bytes",
+ "futures-util",
+ "http",
+ "http-body",
+ "http-body-util",
+ "itoa",
+ "matchit",
+ "memchr",
+ "mime",
+ "percent-encoding",
+ "pin-project-lite",
+ "serde_core",
+ "sync_wrapper",
+ "tower",
+ "tower-layer",
+ "tower-service",
+]
+
+[[package]]
+name = "axum-core"
+version = "0.5.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "08c78f31d7b1291f7ee735c1c6780ccde7785daae9a9206026862dab7d8792d1"
+dependencies = [
+ "bytes",
+ "futures-core",
+ "http",
+ "http-body",
+ "http-body-util",
+ "mime",
+ "pin-project-lite",
+ "sync_wrapper",
+ "tower-layer",
+ "tower-service",
+]
+
+[[package]]
+name = "backon"
+version = "1.6.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cffb0e931875b666fc4fcb20fee52e9bbd1ef836fd9e9e04ec21555f9f85f7ef"
+dependencies = [
+ "fastrand",
+ "gloo-timers",
+ "tokio",
+]
+
+[[package]]
+name = "base64"
+version = "0.21.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9d297deb1925b89f2ccc13d7635fa0714f12c87adce1c75356b39ca9b7178567"
+
+[[package]]
+name = "base64"
+version = "0.22.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "72b3254f16251a8381aa12e40e3c4d2f0199f8c6508fbecb9d91f575e0fbb8c6"
+
+[[package]]
+name = "bigdecimal"
+version = "0.4.10"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4d6867f1565b3aad85681f1015055b087fcfd840d6aeee6eee7f2da317603695"
+dependencies = [
+ "autocfg",
+ "libm",
+ "num-bigint",
+ "num-integer",
+ "num-traits",
+ "serde",
+]
+
+[[package]]
+name = "bitflags"
+version = "2.11.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "843867be96c8daad0d758b57df9392b6d8d271134fce549de6ce169ff98a92af"
+
+[[package]]
+name = "bitvec"
+version = "1.0.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1bc2832c24239b0141d5674bb9174f9d68a8b5b3f2753311927c172ca46f7e9c"
+dependencies = [
+ "funty",
+ "radium",
+ "tap",
+ "wyz",
+]
+
+[[package]]
+name = "block-buffer"
+version = "0.10.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3078c7629b62d3f0439517fa394996acacc5cbc91c5a20d8c658e77abd503a71"
+dependencies = [
+ "generic-array",
+]
+
+[[package]]
+name = "bollard"
+version = "0.19.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "87a52479c9237eb04047ddb94788c41ca0d26eaff8b697ecfbb4c32f7fdc3b1b"
+dependencies = [
+ "async-stream",
+ "base64 0.22.1",
+ "bitflags",
+ "bollard-buildkit-proto",
+ "bollard-stubs",
+ "bytes",
+ "chrono",
+ "futures-core",
+ "futures-util",
+ "hex",
+ "home",
+ "http",
+ "http-body-util",
+ "hyper",
+ "hyper-named-pipe",
+ "hyper-rustls",
+ "hyper-util",
+ "hyperlocal",
+ "log",
+ "num",
+ "pin-project-lite",
+ "rand 0.9.2",
+ "rustls",
+ "rustls-native-certs",
+ "rustls-pemfile",
+ "rustls-pki-types",
+ "serde",
+ "serde_derive",
+ "serde_json",
+ "serde_repr",
+ "serde_urlencoded",
+ "thiserror 2.0.18",
+ "tokio",
+ "tokio-stream",
+ "tokio-util",
+ "tonic",
+ "tower-service",
+ "url",
+ "winapi",
+]
+
+[[package]]
+name = "bollard-buildkit-proto"
+version = "0.7.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "85a885520bf6249ab931a764ffdb87b0ceef48e6e7d807cfdb21b751e086e1ad"
+dependencies = [
+ "prost",
+ "prost-types",
+ "tonic",
+ "tonic-prost",
+ "ureq",
+]
+
+[[package]]
+name = "bollard-stubs"
+version = "1.49.1-rc.28.4.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5731fe885755e92beff1950774068e0cae67ea6ec7587381536fca84f1779623"
+dependencies = [
+ "base64 0.22.1",
+ "bollard-buildkit-proto",
+ "bytes",
+ "chrono",
+ "prost",
+ "serde",
+ "serde_json",
+ "serde_repr",
+ "serde_with",
+]
+
+[[package]]
+name = "bumpalo"
+version = "3.20.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5d20789868f4b01b2f2caec9f5c4e0213b41e3e5702a50157d699ae31ced2fcb"
+
+[[package]]
+name = "byteorder"
+version = "1.5.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1fd0f2584146f6f2ef48085050886acf353beff7305ebd1ae69500e27c67f64b"
+
+[[package]]
+name = "bytes"
+version = "1.11.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1e748733b7cbc798e1434b6ac524f0c1ff2ab456fe201501e6497c8417a4fc33"
+
+[[package]]
+name = "cc"
+version = "1.2.59"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b7a4d3ec6524d28a329fc53654bbadc9bdd7b0431f5d65f1a56ffb28a1ee5283"
+dependencies = [
+ "find-msvc-tools",
+ "jobserver",
+ "libc",
+ "shlex",
+]
+
+[[package]]
+name = "cfg-if"
+version = "1.0.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9330f8b2ff13f34540b44e946ef35111825727b38d33286ef986142615121801"
+
+[[package]]
+name = "cfg_aliases"
+version = "0.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "613afe47fcd5fac7ccf1db93babcb082c5994d996f20b8b159f2ad1658eb5724"
+
+[[package]]
+name = "chrono"
+version = "0.4.44"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c673075a2e0e5f4a1dde27ce9dee1ea4558c7ffe648f576438a20ca1d2acc4b0"
+dependencies = [
+ "iana-time-zone",
+ "js-sys",
+ "num-traits",
+ "serde",
+ "wasm-bindgen",
+ "windows-link",
+]
+
+[[package]]
+name = "clap"
+version = "4.6.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b193af5b67834b676abd72466a96c1024e6a6ad978a1f484bd90b85c94041351"
+dependencies = [
+ "clap_builder",
+ "clap_derive",
+]
+
+[[package]]
+name = "clap_builder"
+version = "4.6.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "714a53001bf66416adb0e2ef5ac857140e7dc3a0c48fb28b2f10762fc4b5069f"
+dependencies = [
+ "anstream",
+ "anstyle",
+ "clap_lex",
+ "strsim",
+]
+
+[[package]]
+name = "clap_derive"
+version = "4.6.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1110bd8a634a1ab8cb04345d8d878267d57c3cf1b38d91b71af6686408bbca6a"
+dependencies = [
+ "heck",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "clap_lex"
+version = "1.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c8d4a3bb8b1e0c1050499d1815f5ab16d04f0959b233085fb31653fbfc9d98f9"
+
+[[package]]
+name = "codespan-reporting"
+version = "0.13.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "af491d569909a7e4dee0ad7db7f5341fef5c614d5b8ec8cf765732aba3cff681"
+dependencies = [
+ "serde",
+ "termcolor",
+ "unicode-width",
+]
+
+[[package]]
+name = "colorchoice"
+version = "1.0.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1d07550c9036bf2ae0c684c4297d503f838287c83c53686d05370d0e139ae570"
+
+[[package]]
+name = "const-oid"
+version = "0.9.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c2459377285ad874054d797f3ccebf984978aa39129f6eafde5cdc8315b612f8"
+
+[[package]]
+name = "const-random"
+version = "0.1.18"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "87e00182fe74b066627d63b85fd550ac2998d4b0bd86bfed477a0ae4c7c71359"
+dependencies = [
+ "const-random-macro",
+]
+
+[[package]]
+name = "const-random-macro"
+version = "0.1.16"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f9d839f2a20b0aee515dc581a6172f2321f96cab76c1a38a4c584a194955390e"
+dependencies = [
+ "getrandom 0.2.17",
+ "once_cell",
+ "tiny-keccak",
+]
+
+[[package]]
+name = "core-foundation"
+version = "0.10.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b2a6cd9ae233e7f62ba4e9353e81a88df7fc8a5987b8d445b4d90c879bd156f6"
+dependencies = [
+ "core-foundation-sys",
+ "libc",
+]
+
+[[package]]
+name = "core-foundation-sys"
+version = "0.8.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "773648b94d0e5d620f64f280777445740e61fe701025087ec8b57f45c791888b"
+
+[[package]]
+name = "cpufeatures"
+version = "0.2.17"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "59ed5838eebb26a2bb2e58f6d5b5316989ae9d08bab10e0e6d103e656d1b0280"
+dependencies = [
+ "libc",
+]
+
+[[package]]
+name = "crc32c"
+version = "0.6.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3a47af21622d091a8f0fb295b88bc886ac74efcc613efc19f5d0b21de5c89e47"
+dependencies = [
+ "rustc_version",
+]
+
+[[package]]
+name = "crossbeam-utils"
+version = "0.8.21"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d0a5c400df2834b80a4c3327b3aad3a4c4cd4de0629063962b03235697506a28"
+
+[[package]]
+name = "crunchy"
+version = "0.2.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "460fbee9c2c2f33933d720630a6a0bac33ba7053db5344fac858d4b8952d77d5"
+
+[[package]]
+name = "crypto-common"
+version = "0.1.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "78c8292055d1c1df0cce5d180393dc8cce0abec0a7102adb6c7b1eef6016d60a"
+dependencies = [
+ "generic-array",
+ "typenum",
+]
+
+[[package]]
+name = "csv"
+version = "1.4.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "52cd9d68cf7efc6ddfaaee42e7288d3a99d613d4b50f76ce9827ae0c6e14f938"
+dependencies = [
+ "csv-core",
+ "itoa",
+ "ryu",
+ "serde_core",
+]
+
+[[package]]
+name = "csv-core"
+version = "0.1.13"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "704a3c26996a80471189265814dbc2c257598b96b8a7feae2d31ace646bb9782"
+dependencies = [
+ "memchr",
+]
+
+[[package]]
+name = "cxx"
+version = "1.0.194"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "747d8437319e3a2f43d93b341c137927ca70c0f5dabeea7a005a73665e247c7e"
+dependencies = [
+ "cc",
+ "cxx-build",
+ "cxxbridge-cmd",
+ "cxxbridge-flags",
+ "cxxbridge-macro",
+ "foldhash 0.2.0",
+ "link-cplusplus",
+]
+
+[[package]]
+name = "cxx-build"
+version = "1.0.194"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b0f4697d190a142477b16aef7da8a99bfdc41e7e8b1687583c0d23a79c7afc1e"
+dependencies = [
+ "cc",
+ "codespan-reporting",
+ "indexmap 2.13.1",
+ "proc-macro2",
+ "quote",
+ "scratch",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "cxxbridge-cmd"
+version = "1.0.194"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d0956799fa8678d4c50eed028f2de1c0552ae183c76e976cf7ca8c4e36a7c328"
+dependencies = [
+ "clap",
+ "codespan-reporting",
+ "indexmap 2.13.1",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "cxxbridge-flags"
+version = "1.0.194"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "23384a836ab4f0ad98ace7e3955ad2de39de42378ab487dc28d3990392cb283a"
+
+[[package]]
+name = "cxxbridge-macro"
+version = "1.0.194"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e6acc6b5822b9526adfb4fc377b67128fdd60aac757cc4a741a6278603f763cf"
+dependencies = [
+ "indexmap 2.13.1",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "darling"
+version = "0.23.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "25ae13da2f202d56bd7f91c25fba009e7717a1e4a1cc98a76d844b65ae912e9d"
+dependencies = [
+ "darling_core",
+ "darling_macro",
+]
+
+[[package]]
+name = "darling_core"
+version = "0.23.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9865a50f7c335f53564bb694ef660825eb8610e0a53d3e11bf1b0d3df31e03b0"
+dependencies = [
+ "ident_case",
+ "proc-macro2",
+ "quote",
+ "strsim",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "darling_macro"
+version = "0.23.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ac3984ec7bd6cfa798e62b4a642426a5be0e68f9401cfc2a01e3fa9ea2fcdb8d"
+dependencies = [
+ "darling_core",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "dashmap"
+version = "6.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5041cc499144891f3790297212f32a74fb938e5136a14943f338ef9e0ae276cf"
+dependencies = [
+ "cfg-if",
+ "crossbeam-utils",
+ "hashbrown 0.14.5",
+ "lock_api",
+ "once_cell",
+ "parking_lot_core",
+]
+
+[[package]]
+name = "delegate"
+version = "0.13.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "780eb241654bf097afb00fc5f054a09b687dad862e485fdcf8399bb056565370"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "deranged"
+version = "0.5.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7cd812cc2bc1d69d4764bd80df88b4317eaef9e773c75226407d9bc0876b211c"
+dependencies = [
+ "powerfmt",
+ "serde_core",
+]
+
+[[package]]
+name = "digest"
+version = "0.10.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9ed9a281f7bc9b7576e61468ba615a66a5c8cfdff42420a70aa82701a3b1e292"
+dependencies = [
+ "block-buffer",
+ "const-oid",
+ "crypto-common",
+ "subtle",
+]
+
+[[package]]
+name = "displaydoc"
+version = "0.2.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "97369cbbc041bc366949bc74d34658d6cda5621039731c6310521892a3a20ae0"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "dlv-list"
+version = "0.5.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "442039f5147480ba31067cb00ada1adae6892028e40e45fc5de7b7df6dcc1b5f"
+dependencies = [
+ "const-random",
+]
+
+[[package]]
+name = "docker_credential"
+version = "1.3.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1d89dfcba45b4afad7450a99b39e751590463e45c04728cf555d36bb66940de8"
+dependencies = [
+ "base64 0.21.7",
+ "serde",
+ "serde_json",
+]
+
+[[package]]
+name = "dyn-clone"
+version = "1.0.20"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d0881ea181b1df73ff77ffaaf9c7544ecc11e82fba9b5f27b262a3c73a332555"
+
+[[package]]
+name = "either"
+version = "1.15.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "48c757948c5ede0e46177b7add2e67155f70e33c07fea8284df6576da70b3719"
+
+[[package]]
+name = "equivalent"
+version = "1.0.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "877a4ace8713b0bcf2a4e7eec82529c029f1d0619886d18145fea96c3ffe5c0f"
+
+[[package]]
+name = "erased-serde"
+version = "0.4.10"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d2add8a07dd6a8d93ff627029c51de145e12686fbc36ecb298ac22e74cf02dec"
+dependencies = [
+ "serde",
+ "serde_core",
+ "typeid",
+]
+
+[[package]]
+name = "errno"
+version = "0.3.14"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "39cab71617ae0d63f51a36d69f866391735b51691dbda63cf6f96d042b63efeb"
+dependencies = [
+ "libc",
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "etcetera"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "26c7b13d0780cb82722fd59f6f57f925e143427e4a75313a6c77243bf5326ae6"
+dependencies = [
+ "cfg-if",
+ "home",
+ "windows-sys 0.59.0",
+]
+
+[[package]]
+name = "fastrand"
+version = "2.4.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a043dc74da1e37d6afe657061213aa6f425f855399a11d3463c6ecccc4dfda1f"
+
+[[package]]
+name = "filetime"
+version = "0.2.27"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f98844151eee8917efc50bd9e8318cb963ae8b297431495d3f758616ea5c57db"
+dependencies = [
+ "cfg-if",
+ "libc",
+ "libredox",
+]
+
+[[package]]
+name = "find-msvc-tools"
+version = "0.1.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5baebc0774151f905a1a2cc41989300b1e6fbb29aff0ceffa1064fdd3088d582"
+
+[[package]]
+name = "fixedbitset"
+version = "0.5.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1d674e81391d1e1ab681a28d99df07927c6d4aa5b027d7da16ba32d1d21ecd99"
+
+[[package]]
+name = "flatbuffers"
+version = "25.12.19"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "35f6839d7b3b98adde531effaf34f0c2badc6f4735d26fe74709d8e513a96ef3"
+dependencies = [
+ "bitflags",
+ "rustc_version",
+]
+
+[[package]]
+name = "fluss-cpp"
+version = "0.2.0"
+dependencies = [
+ "anyhow",
+ "arrow",
+ "bigdecimal",
+ "cxx",
+ "cxx-build",
+ "fluss-rs",
+ "tokio",
+]
+
+[[package]]
+name = "fluss-examples"
+version = "0.2.0"
+dependencies = [
+ "clap",
+ "fluss-rs",
+ "tikv-jemallocator",
+ "tokio",
+]
+
+[[package]]
+name = "fluss-rs"
+version = "0.2.0"
+dependencies = [
+ "arrow",
+ "arrow-schema",
+ "bigdecimal",
+ "bitvec",
+ "byteorder",
+ "bytes",
+ "clap",
+ "crc32c",
+ "dashmap",
+ "delegate",
+ "futures",
+ "jiff",
+ "linked-hash-map",
+ "log",
+ "opendal",
+ "ordered-float",
+ "parking_lot",
+ "parse-display 0.10.0",
+ "prost",
+ "prost-build",
+ "rand 0.9.2",
+ "scopeguard",
+ "serde",
+ "serde_json",
+ "snafu",
+ "strum",
+ "strum_macros",
+ "tempfile",
+ "test-env-helpers",
+ "testcontainers",
+ "thiserror 1.0.69",
+ "tokio",
+ "url",
+ "uuid",
+]
+
+[[package]]
+name = "fluss_python"
+version = "0.2.0"
+dependencies = [
+ "arrow",
+ "arrow-array",
+ "arrow-pyarrow",
+ "arrow-schema",
+ "bigdecimal",
+ "fluss-rs",
+ "indexmap 2.13.1",
+ "jiff",
+ "pyo3",
+ "pyo3-async-runtimes",
+ "tokio",
+]
+
+[[package]]
+name = "fnv"
+version = "1.0.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3f9eec918d3f24069decb9af1554cad7c880e2da24a9afd88aca000531ab82c1"
+
+[[package]]
+name = "foldhash"
+version = "0.1.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d9c4f5dac5e15c24eb999c26181a6ca40b39fe946cbe4c263c7209467bc83af2"
+
+[[package]]
+name = "foldhash"
+version = "0.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "77ce24cb58228fbb8aa041425bb1050850ac19177686ea6e0f41a70416f56fdb"
+
+[[package]]
+name = "form_urlencoded"
+version = "1.2.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cb4cb245038516f5f85277875cdaa4f7d2c9a0fa0468de06ed190163b1581fcf"
+dependencies = [
+ "percent-encoding",
+]
+
+[[package]]
+name = "funty"
+version = "2.0.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e6d5a32815ae3f33302d95fdcb2ce17862f8c65363dcfd29360480ba1001fc9c"
+
+[[package]]
+name = "futures"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8b147ee9d1f6d097cef9ce628cd2ee62288d963e16fb287bd9286455b241382d"
+dependencies = [
+ "futures-channel",
+ "futures-core",
+ "futures-executor",
+ "futures-io",
+ "futures-sink",
+ "futures-task",
+ "futures-util",
+]
+
+[[package]]
+name = "futures-channel"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "07bbe89c50d7a535e539b8c17bc0b49bdb77747034daa8087407d655f3f7cc1d"
+dependencies = [
+ "futures-core",
+ "futures-sink",
+]
+
+[[package]]
+name = "futures-core"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7e3450815272ef58cec6d564423f6e755e25379b217b0bc688e295ba24df6b1d"
+
+[[package]]
+name = "futures-executor"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "baf29c38818342a3b26b5b923639e7b1f4a61fc5e76102d4b1981c6dc7a7579d"
+dependencies = [
+ "futures-core",
+ "futures-task",
+ "futures-util",
+]
+
+[[package]]
+name = "futures-io"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cecba35d7ad927e23624b22ad55235f2239cfa44fd10428eecbeba6d6a717718"
+
+[[package]]
+name = "futures-macro"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e835b70203e41293343137df5c0664546da5745f82ec9b84d40be8336958447b"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "futures-sink"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c39754e157331b013978ec91992bde1ac089843443c49cbc7f46150b0fad0893"
+
+[[package]]
+name = "futures-task"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "037711b3d59c33004d3856fbdc83b99d4ff37a24768fa1be9ce3538a1cde4393"
+
+[[package]]
+name = "futures-util"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "389ca41296e6190b48053de0321d02a77f32f8a5d2461dd38762c0593805c6d6"
+dependencies = [
+ "futures-channel",
+ "futures-core",
+ "futures-io",
+ "futures-macro",
+ "futures-sink",
+ "futures-task",
+ "memchr",
+ "pin-project-lite",
+ "slab",
+]
+
+[[package]]
+name = "generic-array"
+version = "0.14.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "85649ca51fd72272d7821adaf274ad91c288277713d9c18820d8499a7ff69e9a"
+dependencies = [
+ "typenum",
+ "version_check",
+]
+
+[[package]]
+name = "getrandom"
+version = "0.2.17"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ff2abc00be7fca6ebc474524697ae276ad847ad0a6b3faa4bcb027e9a4614ad0"
+dependencies = [
+ "cfg-if",
+ "js-sys",
+ "libc",
+ "wasi",
+ "wasm-bindgen",
+]
+
+[[package]]
+name = "getrandom"
+version = "0.3.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "899def5c37c4fd7b2664648c28120ecec138e4d395b459e5ca34f9cce2dd77fd"
+dependencies = [
+ "cfg-if",
+ "js-sys",
+ "libc",
+ "r-efi 5.3.0",
+ "wasip2",
+ "wasm-bindgen",
+]
+
+[[package]]
+name = "getrandom"
+version = "0.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0de51e6874e94e7bf76d726fc5d13ba782deca734ff60d5bb2fb2607c7406555"
+dependencies = [
+ "cfg-if",
+ "libc",
+ "r-efi 6.0.0",
+ "wasip2",
+ "wasip3",
+]
+
+[[package]]
+name = "gloo-timers"
+version = "0.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bbb143cf96099802033e0d4f4963b19fd2e0b728bcf076cd9cf7f6634f092994"
+dependencies = [
+ "futures-channel",
+ "futures-core",
+ "js-sys",
+ "wasm-bindgen",
+]
+
+[[package]]
+name = "h2"
+version = "0.4.13"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2f44da3a8150a6703ed5d34e164b875fd14c2cdab9af1252a9a1020bde2bdc54"
+dependencies = [
+ "atomic-waker",
+ "bytes",
+ "fnv",
+ "futures-core",
+ "futures-sink",
+ "http",
+ "indexmap 2.13.1",
+ "slab",
+ "tokio",
+ "tokio-util",
+ "tracing",
+]
+
+[[package]]
+name = "half"
+version = "2.7.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6ea2d84b969582b4b1864a92dc5d27cd2b77b622a8d79306834f1be5ba20d84b"
+dependencies = [
+ "cfg-if",
+ "crunchy",
+ "num-traits",
+ "zerocopy",
+]
+
+[[package]]
+name = "hashbrown"
+version = "0.12.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8a9ee70c43aaf417c914396645a0fa852624801b24ebb7ae78fe8272889ac888"
+
+[[package]]
+name = "hashbrown"
+version = "0.14.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e5274423e17b7c9fc20b6e7e208532f9b19825d82dfd615708b70edd83df41f1"
+
+[[package]]
+name = "hashbrown"
+version = "0.15.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9229cfe53dfd69f0609a49f65461bd93001ea1ef889cd5529dd176593f5338a1"
+dependencies = [
+ "foldhash 0.1.5",
+]
+
+[[package]]
+name = "hashbrown"
+version = "0.16.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "841d1cc9bed7f9236f321df977030373f4a4163ae1a7dbfe1a51a2c1a51d9100"
+
+[[package]]
+name = "heck"
+version = "0.5.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2304e00983f87ffb38b55b444b5e3b60a884b5d30c0fca7d82fe33449bbe55ea"
+
+[[package]]
+name = "hex"
+version = "0.4.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7f24254aa9a54b5c858eaee2f5bccdb46aaf0e486a595ed5fd8f86ba55232a70"
+
+[[package]]
+name = "hmac"
+version = "0.12.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6c49c37c09c17a53d937dfbb742eb3a961d65a994e6bcdcf37e7399d0cc8ab5e"
+dependencies = [
+ "digest",
+]
+
+[[package]]
+name = "home"
+version = "0.5.12"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cc627f471c528ff0c4a49e1d5e60450c8f6461dd6d10ba9dcd3a61d3dff7728d"
+dependencies = [
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "http"
+version = "1.4.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e3ba2a386d7f85a81f119ad7498ebe444d2e22c2af0b86b069416ace48b3311a"
+dependencies = [
+ "bytes",
+ "itoa",
+]
+
+[[package]]
+name = "http-body"
+version = "1.0.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1efedce1fb8e6913f23e0c92de8e62cd5b772a67e7b3946df930a62566c93184"
+dependencies = [
+ "bytes",
+ "http",
+]
+
+[[package]]
+name = "http-body-util"
+version = "0.1.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b021d93e26becf5dc7e1b75b1bed1fd93124b374ceb73f43d4d4eafec896a64a"
+dependencies = [
+ "bytes",
+ "futures-core",
+ "http",
+ "http-body",
+ "pin-project-lite",
+]
+
+[[package]]
+name = "httparse"
+version = "1.10.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6dbf3de79e51f3d586ab4cb9d5c3e2c14aa28ed23d180cf89b4df0454a69cc87"
+
+[[package]]
+name = "httpdate"
+version = "1.0.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "df3b46402a9d5adb4c86a0cf463f42e19994e3ee891101b1841f30a545cb49a9"
+
+[[package]]
+name = "hyper"
+version = "1.9.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6299f016b246a94207e63da54dbe807655bf9e00044f73ded42c3ac5305fbcca"
+dependencies = [
+ "atomic-waker",
+ "bytes",
+ "futures-channel",
+ "futures-core",
+ "h2",
+ "http",
+ "http-body",
+ "httparse",
+ "httpdate",
+ "itoa",
+ "pin-project-lite",
+ "smallvec",
+ "tokio",
+ "want",
+]
+
+[[package]]
+name = "hyper-named-pipe"
+version = "0.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "73b7d8abf35697b81a825e386fc151e0d503e8cb5fcb93cc8669c376dfd6f278"
+dependencies = [
+ "hex",
+ "hyper",
+ "hyper-util",
+ "pin-project-lite",
+ "tokio",
+ "tower-service",
+ "winapi",
+]
+
+[[package]]
+name = "hyper-rustls"
+version = "0.27.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e3c93eb611681b207e1fe55d5a71ecf91572ec8a6705cdb6857f7d8d5242cf58"
+dependencies = [
+ "http",
+ "hyper",
+ "hyper-util",
+ "rustls",
+ "rustls-pki-types",
+ "tokio",
+ "tokio-rustls",
+ "tower-service",
+ "webpki-roots",
+]
+
+[[package]]
+name = "hyper-timeout"
+version = "0.5.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2b90d566bffbce6a75bd8b09a05aa8c2cb1fabb6cb348f8840c9e4c90a0d83b0"
+dependencies = [
+ "hyper",
+ "hyper-util",
+ "pin-project-lite",
+ "tokio",
+ "tower-service",
+]
+
+[[package]]
+name = "hyper-util"
+version = "0.1.20"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "96547c2556ec9d12fb1578c4eaf448b04993e7fb79cbaad930a656880a6bdfa0"
+dependencies = [
+ "base64 0.22.1",
+ "bytes",
+ "futures-channel",
+ "futures-util",
+ "http",
+ "http-body",
+ "hyper",
+ "ipnet",
+ "libc",
+ "percent-encoding",
+ "pin-project-lite",
+ "socket2",
+ "tokio",
+ "tower-service",
+ "tracing",
+]
+
+[[package]]
+name = "hyperlocal"
+version = "0.9.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "986c5ce3b994526b3cd75578e62554abd09f0899d6206de48b3e96ab34ccc8c7"
+dependencies = [
+ "hex",
+ "http-body-util",
+ "hyper",
+ "hyper-util",
+ "pin-project-lite",
+ "tokio",
+ "tower-service",
+]
+
+[[package]]
+name = "iana-time-zone"
+version = "0.1.65"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e31bc9ad994ba00e440a8aa5c9ef0ec67d5cb5e5cb0cc7f8b744a35b389cc470"
+dependencies = [
+ "android_system_properties",
+ "core-foundation-sys",
+ "iana-time-zone-haiku",
+ "js-sys",
+ "log",
+ "wasm-bindgen",
+ "windows-core",
+]
+
+[[package]]
+name = "iana-time-zone-haiku"
+version = "0.1.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f31827a206f56af32e590ba56d5d2d085f558508192593743f16b2306495269f"
+dependencies = [
+ "cc",
+]
+
+[[package]]
+name = "icu_collections"
+version = "2.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2984d1cd16c883d7935b9e07e44071dca8d917fd52ecc02c04d5fa0b5a3f191c"
+dependencies = [
+ "displaydoc",
+ "potential_utf",
+ "utf8_iter",
+ "yoke",
+ "zerofrom",
+ "zerovec",
+]
+
+[[package]]
+name = "icu_locale_core"
+version = "2.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "92219b62b3e2b4d88ac5119f8904c10f8f61bf7e95b640d25ba3075e6cac2c29"
+dependencies = [
+ "displaydoc",
+ "litemap",
+ "tinystr",
+ "writeable",
+ "zerovec",
+]
+
+[[package]]
+name = "icu_normalizer"
+version = "2.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c56e5ee99d6e3d33bd91c5d85458b6005a22140021cc324cea84dd0e72cff3b4"
+dependencies = [
+ "icu_collections",
+ "icu_normalizer_data",
+ "icu_properties",
+ "icu_provider",
+ "smallvec",
+ "zerovec",
+]
+
+[[package]]
+name = "icu_normalizer_data"
+version = "2.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "da3be0ae77ea334f4da67c12f149704f19f81d1adf7c51cf482943e84a2bad38"
+
+[[package]]
+name = "icu_properties"
+version = "2.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bee3b67d0ea5c2cca5003417989af8996f8604e34fb9ddf96208a033901e70de"
+dependencies = [
+ "icu_collections",
+ "icu_locale_core",
+ "icu_properties_data",
+ "icu_provider",
+ "zerotrie",
+ "zerovec",
+]
+
+[[package]]
+name = "icu_properties_data"
+version = "2.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8e2bbb201e0c04f7b4b3e14382af113e17ba4f63e2c9d2ee626b720cbce54a14"
+
+[[package]]
+name = "icu_provider"
+version = "2.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "139c4cf31c8b5f33d7e199446eff9c1e02decfc2f0eec2c8d71f65befa45b421"
+dependencies = [
+ "displaydoc",
+ "icu_locale_core",
+ "writeable",
+ "yoke",
+ "zerofrom",
+ "zerotrie",
+ "zerovec",
+]
+
+[[package]]
+name = "id-arena"
+version = "2.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3d3067d79b975e8844ca9eb072e16b31c3c1c36928edf9c6789548c524d0d954"
+
+[[package]]
+name = "ident_case"
+version = "1.0.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b9e0384b61958566e926dc50660321d12159025e767c18e043daf26b70104c39"
+
+[[package]]
+name = "idna"
+version = "1.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3b0875f23caa03898994f6ddc501886a45c7d3d62d04d2d90788d47be1b1e4de"
+dependencies = [
+ "idna_adapter",
+ "smallvec",
+ "utf8_iter",
+]
+
+[[package]]
+name = "idna_adapter"
+version = "1.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3acae9609540aa318d1bc588455225fb2085b9ed0c4f6bd0d9d5bcd86f1a0344"
+dependencies = [
+ "icu_normalizer",
+ "icu_properties",
+]
+
+[[package]]
+name = "indexmap"
+version = "1.9.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bd070e393353796e801d209ad339e89596eb4c8d430d18ede6a1cced8fafbd99"
+dependencies = [
+ "autocfg",
+ "hashbrown 0.12.3",
+ "serde",
+]
+
+[[package]]
+name = "indexmap"
+version = "2.13.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "45a8a2b9cb3e0b0c1803dbb0758ffac5de2f425b23c28f518faabd9d805342ff"
+dependencies = [
+ "equivalent",
+ "hashbrown 0.16.1",
+ "serde",
+ "serde_core",
+]
+
+[[package]]
+name = "indoc"
+version = "2.0.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "79cf5c93f93228cf8efb3ba362535fb11199ac548a09ce117c9b1adc3030d706"
+dependencies = [
+ "rustversion",
+]
+
+[[package]]
+name = "ipnet"
+version = "2.12.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d98f6fed1fde3f8c21bc40a1abb88dd75e67924f9cffc3ef95607bad8017f8e2"
+
+[[package]]
+name = "iri-string"
+version = "0.7.12"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "25e659a4bb38e810ebc252e53b5814ff908a8c58c2a9ce2fae1bbec24cbf4e20"
+dependencies = [
+ "memchr",
+ "serde",
+]
+
+[[package]]
+name = "is_terminal_polyfill"
+version = "1.70.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a6cb138bb79a146c1bd460005623e142ef0181e3d0219cb493e02f7d08a35695"
+
+[[package]]
+name = "itertools"
+version = "0.14.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2b192c782037fadd9cfa75548310488aabdbf3d2da73885b31bd0abd03351285"
+dependencies = [
+ "either",
+]
+
+[[package]]
+name = "itoa"
+version = "1.0.18"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8f42a60cbdf9a97f5d2305f08a87dc4e09308d1276d28c869c684d7777685682"
+
+[[package]]
+name = "jiff"
+version = "0.2.23"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1a3546dc96b6d42c5f24902af9e2538e82e39ad350b0c766eb3fbf2d8f3d8359"
+dependencies = [
+ "jiff-static",
+ "jiff-tzdb-platform",
+ "js-sys",
+ "log",
+ "portable-atomic",
+ "portable-atomic-util",
+ "serde_core",
+ "wasm-bindgen",
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "jiff-static"
+version = "0.2.23"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2a8c8b344124222efd714b73bb41f8b5120b27a7cc1c75593a6ff768d9d05aa4"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "jiff-tzdb"
+version = "0.1.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c900ef84826f1338a557697dc8fc601df9ca9af4ac137c7fb61d4c6f2dfd3076"
+
+[[package]]
+name = "jiff-tzdb-platform"
+version = "0.1.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "875a5a69ac2bab1a891711cf5eccbec1ce0341ea805560dcd90b7a2e925132e8"
+dependencies = [
+ "jiff-tzdb",
+]
+
+[[package]]
+name = "jobserver"
+version = "0.1.34"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9afb3de4395d6b3e67a780b6de64b51c978ecf11cb9a462c66be7d4ca9039d33"
+dependencies = [
+ "getrandom 0.3.4",
+ "libc",
+]
+
+[[package]]
+name = "js-sys"
+version = "0.3.94"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2e04e2ef80ce82e13552136fabeef8a5ed1f985a96805761cbb9a2c34e7664d9"
+dependencies = [
+ "cfg-if",
+ "futures-util",
+ "once_cell",
+ "wasm-bindgen",
+]
+
+[[package]]
+name = "leb128fmt"
+version = "0.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "09edd9e8b54e49e587e4f6295a7d29c3ea94d469cb40ab8ca70b288248a81db2"
+
+[[package]]
+name = "lexical-core"
+version = "1.0.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7d8d125a277f807e55a77304455eb7b1cb52f2b18c143b60e766c120bd64a594"
+dependencies = [
+ "lexical-parse-float",
+ "lexical-parse-integer",
+ "lexical-util",
+ "lexical-write-float",
+ "lexical-write-integer",
+]
+
+[[package]]
+name = "lexical-parse-float"
+version = "1.0.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "52a9f232fbd6f550bc0137dcb5f99ab674071ac2d690ac69704593cb4abbea56"
+dependencies = [
+ "lexical-parse-integer",
+ "lexical-util",
+]
+
+[[package]]
+name = "lexical-parse-integer"
+version = "1.0.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9a7a039f8fb9c19c996cd7b2fcce303c1b2874fe1aca544edc85c4a5f8489b34"
+dependencies = [
+ "lexical-util",
+]
+
+[[package]]
+name = "lexical-util"
+version = "1.0.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2604dd126bb14f13fb5d1bd6a66155079cb9fa655b37f875b3a742c705dbed17"
+
+[[package]]
+name = "lexical-write-float"
+version = "1.0.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "50c438c87c013188d415fbabbb1dceb44249ab81664efbd31b14ae55dabb6361"
+dependencies = [
+ "lexical-util",
+ "lexical-write-integer",
+]
+
+[[package]]
+name = "lexical-write-integer"
+version = "1.0.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "409851a618475d2d5796377cad353802345cba92c867d9fbcde9cf4eac4e14df"
+dependencies = [
+ "lexical-util",
+]
+
+[[package]]
+name = "libc"
+version = "0.2.184"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "48f5d2a454e16a5ea0f4ced81bd44e4cfc7bd3a507b61887c99fd3538b28e4af"
+
+[[package]]
+name = "libm"
+version = "0.2.16"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b6d2cec3eae94f9f509c767b45932f1ada8350c4bdb85af2fcab4a3c14807981"
+
+[[package]]
+name = "libredox"
+version = "0.1.15"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7ddbf48fd451246b1f8c2610bd3b4ac0cc6e149d89832867093ab69a17194f08"
+dependencies = [
+ "bitflags",
+ "libc",
+ "plain",
+ "redox_syscall 0.7.3",
+]
+
+[[package]]
+name = "link-cplusplus"
+version = "1.0.12"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7f78c730aaa7d0b9336a299029ea49f9ee53b0ed06e9202e8cb7db9bae7b8c82"
+dependencies = [
+ "cc",
+]
+
+[[package]]
+name = "linked-hash-map"
+version = "0.5.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0717cef1bc8b636c6e1c1bbdefc09e6322da8a9321966e8928ef80d20f7f770f"
+
+[[package]]
+name = "linux-raw-sys"
+version = "0.12.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "32a66949e030da00e8c7d4434b251670a91556f4144941d37452769c25d58a53"
+
+[[package]]
+name = "litemap"
+version = "0.8.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "92daf443525c4cce67b150400bc2316076100ce0b3686209eb8cf3c31612e6f0"
+
+[[package]]
+name = "lock_api"
+version = "0.4.14"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "224399e74b87b5f3557511d98dff8b14089b3dadafcab6bb93eab67d3aace965"
+dependencies = [
+ "scopeguard",
+]
+
+[[package]]
+name = "log"
+version = "0.4.29"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5e5032e24019045c762d3c0f28f5b6b8bbf38563a65908389bf7978758920897"
+dependencies = [
+ "value-bag",
+]
+
+[[package]]
+name = "lru-slab"
+version = "0.1.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "112b39cec0b298b6c1999fee3e31427f74f676e4cb9879ed1a121b43661a4154"
+
+[[package]]
+name = "lz4_flex"
+version = "0.12.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "98c23545df7ecf1b16c303910a69b079e8e251d60f7dd2cc9b4177f2afaf1746"
+dependencies = [
+ "twox-hash",
+]
+
+[[package]]
+name = "matchit"
+version = "0.8.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "47e1ffaa40ddd1f3ed91f717a33c8c0ee23fff369e3aa8772b9605cc1d22f4c3"
+
+[[package]]
+name = "md-5"
+version = "0.10.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d89e7ee0cfbedfc4da3340218492196241d89eefb6dab27de5df917a6d2e78cf"
+dependencies = [
+ "cfg-if",
+ "digest",
+]
+
+[[package]]
+name = "memchr"
+version = "2.8.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f8ca58f447f06ed17d5fc4043ce1b10dd205e060fb3ce5b979b8ed8e59ff3f79"
+
+[[package]]
+name = "memoffset"
+version = "0.9.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "488016bfae457b036d996092f6cb448677611ce4449e970ceaf42695203f218a"
+dependencies = [
+ "autocfg",
+]
+
+[[package]]
+name = "mime"
+version = "0.3.17"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6877bb514081ee2a7ff5ef9de3281f14a4dd4bceac4c09388074a6b5df8a139a"
+
+[[package]]
+name = "mio"
+version = "1.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "50b7e5b27aa02a74bac8c3f23f448f8d87ff11f92d3aac1a6ed369ee08cc56c1"
+dependencies = [
+ "libc",
+ "wasi",
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "multimap"
+version = "0.10.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1d87ecb2933e8aeadb3e3a02b828fed80a7528047e68b4f424523a0981a3a084"
+
+[[package]]
+name = "num"
+version = "0.4.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "35bd024e8b2ff75562e5f34e7f4905839deb4b22955ef5e73d2fea1b9813cb23"
+dependencies = [
+ "num-bigint",
+ "num-complex",
+ "num-integer",
+ "num-iter",
+ "num-rational",
+ "num-traits",
+]
+
+[[package]]
+name = "num-bigint"
+version = "0.4.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a5e44f723f1133c9deac646763579fdb3ac745e418f2a7af9cd0c431da1f20b9"
+dependencies = [
+ "num-integer",
+ "num-traits",
+]
+
+[[package]]
+name = "num-complex"
+version = "0.4.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "73f88a1307638156682bada9d7604135552957b7818057dcef22705b4d509495"
+dependencies = [
+ "num-traits",
+]
+
+[[package]]
+name = "num-conv"
+version = "0.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c6673768db2d862beb9b39a78fdcb1a69439615d5794a1be50caa9bc92c81967"
+
+[[package]]
+name = "num-integer"
+version = "0.1.46"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7969661fd2958a5cb096e56c8e1ad0444ac2bbcd0061bd28660485a44879858f"
+dependencies = [
+ "num-traits",
+]
+
+[[package]]
+name = "num-iter"
+version = "0.1.45"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1429034a0490724d0075ebb2bc9e875d6503c3cf69e235a8941aa757d83ef5bf"
+dependencies = [
+ "autocfg",
+ "num-integer",
+ "num-traits",
+]
+
+[[package]]
+name = "num-rational"
+version = "0.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f83d14da390562dca69fc84082e73e548e1ad308d24accdedd2720017cb37824"
+dependencies = [
+ "num-bigint",
+ "num-integer",
+ "num-traits",
+]
+
+[[package]]
+name = "num-traits"
+version = "0.2.19"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "071dfc062690e90b734c0b2273ce72ad0ffa95f0c74596bc250dcfd960262841"
+dependencies = [
+ "autocfg",
+ "libm",
+]
+
+[[package]]
+name = "once_cell"
+version = "1.21.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9f7c3e4beb33f85d45ae3e3a1792185706c8e16d043238c593331cc7cd313b50"
+
+[[package]]
+name = "once_cell_polyfill"
+version = "1.70.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "384b8ab6d37215f3c5301a95a4accb5d64aa607f1fcb26a11b5303878451b4fe"
+
+[[package]]
+name = "opendal"
+version = "0.55.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d075ab8a203a6ab4bc1bce0a4b9fe486a72bf8b939037f4b78d95386384bc80a"
+dependencies = [
+ "anyhow",
+ "backon",
+ "base64 0.22.1",
+ "bytes",
+ "crc32c",
+ "futures",
+ "getrandom 0.2.17",
+ "http",
+ "http-body",
+ "jiff",
+ "log",
+ "md-5",
+ "percent-encoding",
+ "quick-xml 0.38.4",
+ "reqsign",
+ "reqwest",
+ "serde",
+ "serde_json",
+ "tokio",
+ "url",
+ "uuid",
+]
+
+[[package]]
+name = "openssl-probe"
+version = "0.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7c87def4c32ab89d880effc9e097653c8da5d6ef28e6b539d313baaacfbafcbe"
+
+[[package]]
+name = "ordered-float"
+version = "5.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b7d950ca161dc355eaf28f82b11345ed76c6e1f6eb1f4f4479e0323b9e2fbd0e"
+dependencies = [
+ "num-traits",
+ "rand 0.8.5",
+ "serde",
+]
+
+[[package]]
+name = "ordered-multimap"
+version = "0.7.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "49203cdcae0030493bad186b28da2fa25645fa276a51b6fec8010d281e02ef79"
+dependencies = [
+ "dlv-list",
+ "hashbrown 0.14.5",
+]
+
+[[package]]
+name = "parking_lot"
+version = "0.12.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "93857453250e3077bd71ff98b6a65ea6621a19bb0f559a85248955ac12c45a1a"
+dependencies = [
+ "lock_api",
+ "parking_lot_core",
+]
+
+[[package]]
+name = "parking_lot_core"
+version = "0.9.12"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2621685985a2ebf1c516881c026032ac7deafcda1a2c9b7850dc81e3dfcb64c1"
+dependencies = [
+ "cfg-if",
+ "libc",
+ "redox_syscall 0.5.18",
+ "smallvec",
+ "windows-link",
+]
+
+[[package]]
+name = "parse-display"
+version = "0.9.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "914a1c2265c98e2446911282c6ac86d8524f495792c38c5bd884f80499c7538a"
+dependencies = [
+ "parse-display-derive 0.9.1",
+ "regex",
+ "regex-syntax",
+]
+
+[[package]]
+name = "parse-display"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "287d8d3ebdce117b8539f59411e4ed9ec226e0a4153c7f55495c6070d68e6f72"
+dependencies = [
+ "parse-display-derive 0.10.0",
+ "regex",
+ "regex-syntax",
+]
+
+[[package]]
+name = "parse-display-derive"
+version = "0.9.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2ae7800a4c974efd12df917266338e79a7a74415173caf7e70aa0a0707345281"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "regex",
+ "regex-syntax",
+ "structmeta",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "parse-display-derive"
+version = "0.10.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7fc048687be30d79502dea2f623d052f3a074012c6eac41726b7ab17213616b1"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "regex",
+ "regex-syntax",
+ "structmeta",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "percent-encoding"
+version = "2.3.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9b4f627cb1b25917193a259e49bdad08f671f8d9708acfd5fe0a8c1455d87220"
+
+[[package]]
+name = "petgraph"
+version = "0.8.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8701b58ea97060d5e5b155d383a69952a60943f0e6dfe30b04c287beb0b27455"
+dependencies = [
+ "fixedbitset",
+ "hashbrown 0.15.5",
+ "indexmap 2.13.1",
+]
+
+[[package]]
+name = "pin-project"
+version = "1.1.11"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f1749c7ed4bcaf4c3d0a3efc28538844fb29bcdd7d2b67b2be7e20ba861ff517"
+dependencies = [
+ "pin-project-internal",
+]
+
+[[package]]
+name = "pin-project-internal"
+version = "1.1.11"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d9b20ed30f105399776b9c883e68e536ef602a16ae6f596d2c473591d6ad64c6"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "pin-project-lite"
+version = "0.2.17"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a89322df9ebe1c1578d689c92318e070967d1042b512afbe49518723f4e6d5cd"
+
+[[package]]
+name = "pkg-config"
+version = "0.3.32"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7edddbd0b52d732b21ad9a5fab5c704c14cd949e5e9a1ec5929a24fded1b904c"
+
+[[package]]
+name = "plain"
+version = "0.2.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b4596b6d070b27117e987119b4dac604f3c58cfb0b191112e24771b2faeac1a6"
+
+[[package]]
+name = "portable-atomic"
+version = "1.13.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c33a9471896f1c69cecef8d20cbe2f7accd12527ce60845ff44c153bb2a21b49"
+
+[[package]]
+name = "portable-atomic-util"
+version = "0.2.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "091397be61a01d4be58e7841595bd4bfedb15f1cd54977d79b8271e94ed799a3"
+dependencies = [
+ "portable-atomic",
+]
+
+[[package]]
+name = "potential_utf"
+version = "0.1.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0103b1cef7ec0cf76490e969665504990193874ea05c85ff9bab8b911d0a0564"
+dependencies = [
+ "zerovec",
+]
+
+[[package]]
+name = "powerfmt"
+version = "0.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "439ee305def115ba05938db6eb1644ff94165c5ab5e9420d1c1bcedbba909391"
+
+[[package]]
+name = "ppv-lite86"
+version = "0.2.21"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "85eae3c4ed2f50dcfe72643da4befc30deadb458a9b590d720cde2f2b1e97da9"
+dependencies = [
+ "zerocopy",
+]
+
+[[package]]
+name = "prettyplease"
+version = "0.2.37"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "479ca8adacdd7ce8f1fb39ce9ecccbfe93a3f1344b3d0d97f20bc0196208f62b"
+dependencies = [
+ "proc-macro2",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "proc-macro2"
+version = "1.0.106"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8fd00f0bb2e90d81d1044c2b32617f68fcb9fa3bb7640c23e9c748e53fb30934"
+dependencies = [
+ "unicode-ident",
+]
+
+[[package]]
+name = "prost"
+version = "0.14.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d2ea70524a2f82d518bce41317d0fae74151505651af45faf1ffbd6fd33f0568"
+dependencies = [
+ "bytes",
+ "prost-derive",
+]
+
+[[package]]
+name = "prost-build"
+version = "0.14.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "343d3bd7056eda839b03204e68deff7d1b13aba7af2b2fd16890697274262ee7"
+dependencies = [
+ "heck",
+ "itertools",
+ "log",
+ "multimap",
+ "petgraph",
+ "prettyplease",
+ "prost",
+ "prost-types",
+ "regex",
+ "syn 2.0.117",
+ "tempfile",
+]
+
+[[package]]
+name = "prost-derive"
+version = "0.14.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "27c6023962132f4b30eb4c172c91ce92d933da334c59c23cddee82358ddafb0b"
+dependencies = [
+ "anyhow",
+ "itertools",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "prost-types"
+version = "0.14.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8991c4cbdb8bc5b11f0b074ffe286c30e523de90fee5ba8132f1399f23cb3dd7"
+dependencies = [
+ "prost",
+]
+
+[[package]]
+name = "pyo3"
+version = "0.26.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7ba0117f4212101ee6544044dae45abe1083d30ce7b29c4b5cbdfa2354e07383"
+dependencies = [
+ "indoc",
+ "libc",
+ "memoffset",
+ "once_cell",
+ "portable-atomic",
+ "pyo3-build-config",
+ "pyo3-ffi",
+ "pyo3-macros",
+ "unindent",
+]
+
+[[package]]
+name = "pyo3-async-runtimes"
+version = "0.26.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e6ee6d4cb3e8d5b925f5cdb38da183e0ff18122eb2048d4041c9e7034d026e23"
+dependencies = [
+ "futures",
+ "once_cell",
+ "pin-project-lite",
+ "pyo3",
+ "tokio",
+]
+
+[[package]]
+name = "pyo3-build-config"
+version = "0.26.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4fc6ddaf24947d12a9aa31ac65431fb1b851b8f4365426e182901eabfb87df5f"
+dependencies = [
+ "python3-dll-a",
+ "target-lexicon",
+]
+
+[[package]]
+name = "pyo3-ffi"
+version = "0.26.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "025474d3928738efb38ac36d4744a74a400c901c7596199e20e45d98eb194105"
+dependencies = [
+ "libc",
+ "pyo3-build-config",
+]
+
+[[package]]
+name = "pyo3-macros"
+version = "0.26.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2e64eb489f22fe1c95911b77c44cc41e7c19f3082fc81cce90f657cdc42ffded"
+dependencies = [
+ "proc-macro2",
+ "pyo3-macros-backend",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "pyo3-macros-backend"
+version = "0.26.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "100246c0ecf400b475341b8455a9213344569af29a3c841d29270e53102e0fcf"
+dependencies = [
+ "heck",
+ "proc-macro2",
+ "pyo3-build-config",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "python3-dll-a"
+version = "0.2.14"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d381ef313ae70b4da5f95f8a4de773c6aa5cd28f73adec4b4a31df70b66780d8"
+dependencies = [
+ "cc",
+]
+
+[[package]]
+name = "quick-xml"
+version = "0.37.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "331e97a1af0bf59823e6eadffe373d7b27f485be8748f71471c662c1f269b7fb"
+dependencies = [
+ "memchr",
+ "serde",
+]
+
+[[package]]
+name = "quick-xml"
+version = "0.38.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b66c2058c55a409d601666cffe35f04333cf1013010882cec174a7467cd4e21c"
+dependencies = [
+ "memchr",
+ "serde",
+]
+
+[[package]]
+name = "quinn"
+version = "0.11.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b9e20a958963c291dc322d98411f541009df2ced7b5a4f2bd52337638cfccf20"
+dependencies = [
+ "bytes",
+ "cfg_aliases",
+ "pin-project-lite",
+ "quinn-proto",
+ "quinn-udp",
+ "rustc-hash",
+ "rustls",
+ "socket2",
+ "thiserror 2.0.18",
+ "tokio",
+ "tracing",
+ "web-time",
+]
+
+[[package]]
+name = "quinn-proto"
+version = "0.11.14"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "434b42fec591c96ef50e21e886936e66d3cc3f737104fdb9b737c40ffb94c098"
+dependencies = [
+ "bytes",
+ "getrandom 0.3.4",
+ "lru-slab",
+ "rand 0.9.2",
+ "ring",
+ "rustc-hash",
+ "rustls",
+ "rustls-pki-types",
+ "slab",
+ "thiserror 2.0.18",
+ "tinyvec",
+ "tracing",
+ "web-time",
+]
+
+[[package]]
+name = "quinn-udp"
+version = "0.5.14"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "addec6a0dcad8a8d96a771f815f0eaf55f9d1805756410b39f5fa81332574cbd"
+dependencies = [
+ "cfg_aliases",
+ "libc",
+ "once_cell",
+ "socket2",
+ "tracing",
+ "windows-sys 0.60.2",
+]
+
+[[package]]
+name = "quote"
+version = "1.0.45"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "41f2619966050689382d2b44f664f4bc593e129785a36d6ee376ddf37259b924"
+dependencies = [
+ "proc-macro2",
+]
+
+[[package]]
+name = "r-efi"
+version = "5.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "69cdb34c158ceb288df11e18b4bd39de994f6657d83847bdffdbd7f346754b0f"
+
+[[package]]
+name = "r-efi"
+version = "6.0.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f8dcc9c7d52a811697d2151c701e0d08956f92b0e24136cf4cf27b57a6a0d9bf"
+
+[[package]]
+name = "radium"
+version = "0.7.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dc33ff2d4973d518d823d61aa239014831e521c75da58e3df4840d3f47749d09"
+
+[[package]]
+name = "rand"
+version = "0.8.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "34af8d1a0e25924bc5b7c43c079c942339d8f0a8b57c39049bef581b46327404"
+dependencies = [
+ "libc",
+ "rand_chacha 0.3.1",
+ "rand_core 0.6.4",
+ "serde",
+]
+
+[[package]]
+name = "rand"
+version = "0.9.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6db2770f06117d490610c7488547d543617b21bfa07796d7a12f6f1bd53850d1"
+dependencies = [
+ "rand_chacha 0.9.0",
+ "rand_core 0.9.5",
+]
+
+[[package]]
+name = "rand_chacha"
+version = "0.3.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e6c10a63a0fa32252be49d21e7709d4d4baf8d231c2dbce1eaa8141b9b127d88"
+dependencies = [
+ "ppv-lite86",
+ "rand_core 0.6.4",
+]
+
+[[package]]
+name = "rand_chacha"
+version = "0.9.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d3022b5f1df60f26e1ffddd6c66e8aa15de382ae63b3a0c1bfc0e4d3e3f325cb"
+dependencies = [
+ "ppv-lite86",
+ "rand_core 0.9.5",
+]
+
+[[package]]
+name = "rand_core"
+version = "0.6.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ec0be4795e2f6a28069bec0b5ff3e2ac9bafc99e6a9a7dc3547996c5c816922c"
+dependencies = [
+ "getrandom 0.2.17",
+ "serde",
+]
+
+[[package]]
+name = "rand_core"
+version = "0.9.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "76afc826de14238e6e8c374ddcc1fa19e374fd8dd986b0d2af0d02377261d83c"
+dependencies = [
+ "getrandom 0.3.4",
+]
+
+[[package]]
+name = "redox_syscall"
+version = "0.5.18"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ed2bf2547551a7053d6fdfafda3f938979645c44812fbfcda098faae3f1a362d"
+dependencies = [
+ "bitflags",
+]
+
+[[package]]
+name = "redox_syscall"
+version = "0.7.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6ce70a74e890531977d37e532c34d45e9055d2409ed08ddba14529471ed0be16"
+dependencies = [
+ "bitflags",
+]
+
+[[package]]
+name = "ref-cast"
+version = "1.0.25"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f354300ae66f76f1c85c5f84693f0ce81d747e2c3f21a45fef496d89c960bf7d"
+dependencies = [
+ "ref-cast-impl",
+]
+
+[[package]]
+name = "ref-cast-impl"
+version = "1.0.25"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b7186006dcb21920990093f30e3dea63b7d6e977bf1256be20c3563a5db070da"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "regex"
+version = "1.12.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e10754a14b9137dd7b1e3e5b0493cc9171fdd105e0ab477f51b72e7f3ac0e276"
+dependencies = [
+ "aho-corasick",
+ "memchr",
+ "regex-automata",
+ "regex-syntax",
+]
+
+[[package]]
+name = "regex-automata"
+version = "0.4.14"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6e1dd4122fc1595e8162618945476892eefca7b88c52820e74af6262213cae8f"
+dependencies = [
+ "aho-corasick",
+ "memchr",
+ "regex-syntax",
+]
+
+[[package]]
+name = "regex-syntax"
+version = "0.8.10"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dc897dd8d9e8bd1ed8cdad82b5966c3e0ecae09fb1907d58efaa013543185d0a"
+
+[[package]]
+name = "reqsign"
+version = "0.16.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "43451dbf3590a7590684c25fb8d12ecdcc90ed3ac123433e500447c7d77ed701"
+dependencies = [
+ "anyhow",
+ "async-trait",
+ "base64 0.22.1",
+ "chrono",
+ "form_urlencoded",
+ "getrandom 0.2.17",
+ "hex",
+ "hmac",
+ "home",
+ "http",
+ "log",
+ "once_cell",
+ "percent-encoding",
+ "quick-xml 0.37.5",
+ "rand 0.8.5",
+ "reqwest",
+ "rust-ini",
+ "serde",
+ "serde_json",
+ "sha1",
+ "sha2",
+ "tokio",
+]
+
+[[package]]
+name = "reqwest"
+version = "0.12.28"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "eddd3ca559203180a307f12d114c268abf583f59b03cb906fd0b3ff8646c1147"
+dependencies = [
+ "base64 0.22.1",
+ "bytes",
+ "futures-core",
+ "futures-util",
+ "http",
+ "http-body",
+ "http-body-util",
+ "hyper",
+ "hyper-rustls",
+ "hyper-util",
+ "js-sys",
+ "log",
+ "percent-encoding",
+ "pin-project-lite",
+ "quinn",
+ "rustls",
+ "rustls-pki-types",
+ "serde",
+ "serde_json",
+ "serde_urlencoded",
+ "sync_wrapper",
+ "tokio",
+ "tokio-rustls",
+ "tokio-util",
+ "tower",
+ "tower-http",
+ "tower-service",
+ "url",
+ "wasm-bindgen",
+ "wasm-bindgen-futures",
+ "wasm-streams",
+ "web-sys",
+ "webpki-roots",
+]
+
+[[package]]
+name = "ring"
+version = "0.17.14"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a4689e6c2294d81e88dc6261c768b63bc4fcdb852be6d1352498b114f61383b7"
+dependencies = [
+ "cc",
+ "cfg-if",
+ "getrandom 0.2.17",
+ "libc",
+ "untrusted",
+ "windows-sys 0.52.0",
+]
+
+[[package]]
+name = "rust-ini"
+version = "0.21.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "796e8d2b6696392a43bea58116b667fb4c29727dc5abd27d6acf338bb4f688c7"
+dependencies = [
+ "cfg-if",
+ "ordered-multimap",
+]
+
+[[package]]
+name = "rustc-hash"
+version = "2.1.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "94300abf3f1ae2e2b8ffb7b58043de3d399c73fa6f4b73826402a5c457614dbe"
+
+[[package]]
+name = "rustc_version"
+version = "0.4.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cfcb3a22ef46e85b45de6ee7e79d063319ebb6594faafcf1c225ea92ab6e9b92"
+dependencies = [
+ "semver",
+]
+
+[[package]]
+name = "rustix"
+version = "1.1.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b6fe4565b9518b83ef4f91bb47ce29620ca828bd32cb7e408f0062e9930ba190"
+dependencies = [
+ "bitflags",
+ "errno",
+ "libc",
+ "linux-raw-sys",
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "rustls"
+version = "0.23.37"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "758025cb5fccfd3bc2fd74708fd4682be41d99e5dff73c377c0646c6012c73a4"
+dependencies = [
+ "log",
+ "once_cell",
+ "ring",
+ "rustls-pki-types",
+ "rustls-webpki",
+ "subtle",
+ "zeroize",
+]
+
+[[package]]
+name = "rustls-native-certs"
+version = "0.8.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "612460d5f7bea540c490b2b6395d8e34a953e52b491accd6c86c8164c5932a63"
+dependencies = [
+ "openssl-probe",
+ "rustls-pki-types",
+ "schannel",
+ "security-framework",
+]
+
+[[package]]
+name = "rustls-pemfile"
+version = "2.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dce314e5fee3f39953d46bb63bb8a46d40c2f8fb7cc5a3b6cab2bde9721d6e50"
+dependencies = [
+ "rustls-pki-types",
+]
+
+[[package]]
+name = "rustls-pki-types"
+version = "1.14.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "be040f8b0a225e40375822a563fa9524378b9d63112f53e19ffff34df5d33fdd"
+dependencies = [
+ "web-time",
+ "zeroize",
+]
+
+[[package]]
+name = "rustls-webpki"
+version = "0.103.10"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "df33b2b81ac578cabaf06b89b0631153a3f416b0a886e8a7a1707fb51abbd1ef"
+dependencies = [
+ "ring",
+ "rustls-pki-types",
+ "untrusted",
+]
+
+[[package]]
+name = "rustversion"
+version = "1.0.22"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b39cdef0fa800fc44525c84ccb54a029961a8215f9619753635a9c0d2538d46d"
+
+[[package]]
+name = "ryu"
+version = "1.0.23"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9774ba4a74de5f7b1c1451ed6cd5285a32eddb5cccb8cc655a4e50009e06477f"
+
+[[package]]
+name = "schannel"
+version = "0.1.29"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "91c1b7e4904c873ef0710c1f407dde2e6287de2bebc1bbbf7d430bb7cbffd939"
+dependencies = [
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "schemars"
+version = "0.9.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4cd191f9397d57d581cddd31014772520aa448f65ef991055d7f61582c65165f"
+dependencies = [
+ "dyn-clone",
+ "ref-cast",
+ "serde",
+ "serde_json",
+]
+
+[[package]]
+name = "schemars"
+version = "1.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a2b42f36aa1cd011945615b92222f6bf73c599a102a300334cd7f8dbeec726cc"
+dependencies = [
+ "dyn-clone",
+ "ref-cast",
+ "serde",
+ "serde_json",
+]
+
+[[package]]
+name = "scopeguard"
+version = "1.2.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "94143f37725109f92c262ed2cf5e59bce7498c01bcc1502d7b9afe439a4e9f49"
+
+[[package]]
+name = "scratch"
+version = "1.0.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d68f2ec51b097e4c1a75b681a8bec621909b5e91f15bb7b840c4f2f7b01148b2"
+
+[[package]]
+name = "security-framework"
+version = "3.7.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b7f4bc775c73d9a02cde8bf7b2ec4c9d12743edf609006c7facc23998404cd1d"
+dependencies = [
+ "bitflags",
+ "core-foundation",
+ "core-foundation-sys",
+ "libc",
+ "security-framework-sys",
+]
+
+[[package]]
+name = "security-framework-sys"
+version = "2.17.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6ce2691df843ecc5d231c0b14ece2acc3efb62c0a398c7e1d875f3983ce020e3"
+dependencies = [
+ "core-foundation-sys",
+ "libc",
+]
+
+[[package]]
+name = "semver"
+version = "1.0.28"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8a7852d02fc848982e0c167ef163aaff9cd91dc640ba85e263cb1ce46fae51cd"
+
+[[package]]
+name = "serde"
+version = "1.0.228"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9a8e94ea7f378bd32cbbd37198a4a91436180c5bb472411e48b5ec2e2124ae9e"
+dependencies = [
+ "serde_core",
+ "serde_derive",
+]
+
+[[package]]
+name = "serde_core"
+version = "1.0.228"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "41d385c7d4ca58e59fc732af25c3983b67ac852c1a25000afe1175de458b67ad"
+dependencies = [
+ "serde_derive",
+]
+
+[[package]]
+name = "serde_derive"
+version = "1.0.228"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d540f220d3187173da220f885ab66608367b6574e925011a9353e4badda91d79"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "serde_fmt"
+version = "1.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6e497af288b3b95d067a23a4f749f2861121ffcb2f6d8379310dcda040c345ed"
+dependencies = [
+ "serde_core",
+]
+
+[[package]]
+name = "serde_json"
+version = "1.0.149"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "83fc039473c5595ace860d8c4fafa220ff474b3fc6bfdb4293327f1a37e94d86"
+dependencies = [
+ "itoa",
+ "memchr",
+ "serde",
+ "serde_core",
+ "zmij",
+]
+
+[[package]]
+name = "serde_repr"
+version = "0.1.20"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "175ee3e80ae9982737ca543e96133087cbd9a485eecc3bc4de9c1a37b47ea59c"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "serde_urlencoded"
+version = "0.7.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d3491c14715ca2294c4d6a88f15e84739788c1d030eed8c110436aafdaa2f3fd"
+dependencies = [
+ "form_urlencoded",
+ "itoa",
+ "ryu",
+ "serde",
+]
+
+[[package]]
+name = "serde_with"
+version = "3.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dd5414fad8e6907dbdd5bc441a50ae8d6e26151a03b1de04d89a5576de61d01f"
+dependencies = [
+ "base64 0.22.1",
+ "chrono",
+ "hex",
+ "indexmap 1.9.3",
+ "indexmap 2.13.1",
+ "schemars 0.9.0",
+ "schemars 1.2.1",
+ "serde_core",
+ "serde_json",
+ "serde_with_macros",
+ "time",
+]
+
+[[package]]
+name = "serde_with_macros"
+version = "3.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d3db8978e608f1fe7357e211969fd9abdcae80bac1ba7a3369bb7eb6b404eb65"
+dependencies = [
+ "darling",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "sha1"
+version = "0.10.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e3bf829a2d51ab4a5ddf1352d8470c140cadc8301b2ae1789db023f01cedd6ba"
+dependencies = [
+ "cfg-if",
+ "cpufeatures",
+ "digest",
+]
+
+[[package]]
+name = "sha2"
+version = "0.10.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a7507d819769d01a365ab707794a4084392c824f54a7a6a7862f8c3d0892b283"
+dependencies = [
+ "cfg-if",
+ "cpufeatures",
+ "digest",
+]
+
+[[package]]
+name = "shlex"
+version = "1.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0fda2ff0d084019ba4d7c6f371c95d8fd75ce3524c3cb8fb653a3023f6323e64"
+
+[[package]]
+name = "signal-hook-registry"
+version = "1.4.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c4db69cba1110affc0e9f7bcd48bbf87b3f4fc7c61fc9155afd4c469eb3d6c1b"
+dependencies = [
+ "errno",
+ "libc",
+]
+
+[[package]]
+name = "simdutf8"
+version = "0.1.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e3a9fe34e3e7a50316060351f37187a3f546bce95496156754b601a5fa71b76e"
+
+[[package]]
+name = "slab"
+version = "0.4.12"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0c790de23124f9ab44544d7ac05d60440adc586479ce501c1d6d7da3cd8c9cf5"
+
+[[package]]
+name = "smallvec"
+version = "1.15.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "67b1b7a3b5fe4f1376887184045fcf45c69e92af734b7aaddc05fb777b6fbd03"
+
+[[package]]
+name = "snafu"
+version = "0.8.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6e84b3f4eacbf3a1ce05eac6763b4d629d60cbc94d632e4092c54ade71f1e1a2"
+dependencies = [
+ "snafu-derive",
+]
+
+[[package]]
+name = "snafu-derive"
+version = "0.8.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c1c97747dbf44bb1ca44a561ece23508e99cb592e862f22222dcf42f51d1e451"
+dependencies = [
+ "heck",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "socket2"
+version = "0.6.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3a766e1110788c36f4fa1c2b71b387a7815aa65f88ce0229841826633d93723e"
+dependencies = [
+ "libc",
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "stable_deref_trait"
+version = "1.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "6ce2be8dc25455e1f91df71bfa12ad37d7af1092ae736f3a6cd0e37bc7810596"
+
+[[package]]
+name = "strsim"
+version = "0.11.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7da8b5736845d9f2fcb837ea5d9e2628564b3b043a70948a3f0b778838c5fb4f"
+
+[[package]]
+name = "structmeta"
+version = "0.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2e1575d8d40908d70f6fd05537266b90ae71b15dbbe7a8b7dffa2b759306d329"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "structmeta-derive",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "structmeta-derive"
+version = "0.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "152a0b65a590ff6c3da95cabe2353ee04e6167c896b28e3b14478c2636c922fc"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "strum"
+version = "0.26.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8fec0f0aef304996cf250b31b5a10dee7980c85da9d759361292b8bca5a18f06"
+
+[[package]]
+name = "strum_macros"
+version = "0.26.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4c6bee85a5a24955dc440386795aa378cd9cf82acd5f764469152d2270e581be"
+dependencies = [
+ "heck",
+ "proc-macro2",
+ "quote",
+ "rustversion",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "subtle"
+version = "2.6.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "13c2bddecc57b384dee18652358fb23172facb8a2c51ccc10d74c157bdea3292"
+
+[[package]]
+name = "sval"
+version = "2.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2eb9318255ebd817902d7e279d8f8e39b35b1b9954decd5eb9ea0e30e5fd2b6a"
+
+[[package]]
+name = "sval_buffer"
+version = "2.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "12571299185e653fdb0fbfe36cd7f6529d39d4e747a60b15a3f34574b7b97c61"
+dependencies = [
+ "sval",
+ "sval_ref",
+]
+
+[[package]]
+name = "sval_dynamic"
+version = "2.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "39526f24e997706c0de7f03fb7371f7f5638b66a504ded508e20ad173d0a3677"
+dependencies = [
+ "sval",
+]
+
+[[package]]
+name = "sval_fmt"
+version = "2.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "933dd3bb26965d682280fcc49400ac2a05036f4ee1e6dbd61bf8402d5a5c3a54"
+dependencies = [
+ "itoa",
+ "ryu",
+ "sval",
+]
+
+[[package]]
+name = "sval_json"
+version = "2.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a0cda08f6d5c9948024a6551077557b1fdcc3880ff2f20ae839667d2ec2d87ed"
+dependencies = [
+ "itoa",
+ "ryu",
+ "sval",
+]
+
+[[package]]
+name = "sval_nested"
+version = "2.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "88d49d5e6c1f9fd0e53515819b03a97ca4eb1bff5c8ee097c43391c09ecfb19f"
+dependencies = [
+ "sval",
+ "sval_buffer",
+ "sval_ref",
+]
+
+[[package]]
+name = "sval_ref"
+version = "2.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "14f876c5a78405375b4e19cbb9554407513b59c93dea12dc6a4af4e1d30899ca"
+dependencies = [
+ "sval",
+]
+
+[[package]]
+name = "sval_serde"
+version = "2.18.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5f9ccd3b7f7200239a655e517dd3fd48d960b9111ad24bd6a5e055bef17607c7"
+dependencies = [
+ "serde_core",
+ "sval",
+ "sval_nested",
+]
+
+[[package]]
+name = "syn"
+version = "1.0.109"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "72b64191b275b66ffe2469e8af2c1cfe3bafa67b529ead792a6d0160888b4237"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "unicode-ident",
+]
+
+[[package]]
+name = "syn"
+version = "2.0.117"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e665b8803e7b1d2a727f4023456bbbbe74da67099c585258af0ad9c5013b9b99"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "unicode-ident",
+]
+
+[[package]]
+name = "sync_wrapper"
+version = "1.0.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0bf256ce5efdfa370213c1dabab5935a12e49f2c58d15e9eac2870d3b4f27263"
+dependencies = [
+ "futures-core",
+]
+
+[[package]]
+name = "synstructure"
+version = "0.13.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "728a70f3dbaf5bab7f0c4b1ac8d7ae5ea60a4b5549c8a5914361c99147a709d2"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "tap"
+version = "1.0.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "55937e1799185b12863d447f42597ed69d9928686b8d88a1df17376a097d8369"
+
+[[package]]
+name = "target-lexicon"
+version = "0.13.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "adb6935a6f5c20170eeceb1a3835a49e12e19d792f6dd344ccc76a985ca5a6ca"
+
+[[package]]
+name = "tempfile"
+version = "3.27.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "32497e9a4c7b38532efcdebeef879707aa9f794296a4f0244f6f69e9bc8574bd"
+dependencies = [
+ "fastrand",
+ "getrandom 0.4.2",
+ "once_cell",
+ "rustix",
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "termcolor"
+version = "1.4.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "06794f8f6c5c898b3275aebefa6b8a1cb24cd2c6c79397ab15774837a0bc5755"
+dependencies = [
+ "winapi-util",
+]
+
+[[package]]
+name = "test-env-helpers"
+version = "0.2.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c6ab8f4822c904dadef9dd99f228f58a10d1b2c6ece06b108257e72fea72b1c6"
+dependencies = [
+ "quote",
+ "syn 1.0.109",
+]
+
+[[package]]
+name = "testcontainers"
+version = "0.25.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3f3ac71069f20ecfa60c396316c283fbf35e6833a53dff551a31b5458da05edc"
+dependencies = [
+ "astral-tokio-tar",
+ "async-trait",
+ "bollard",
+ "bytes",
+ "docker_credential",
+ "either",
+ "etcetera",
+ "futures",
+ "log",
+ "memchr",
+ "parse-display 0.9.1",
+ "pin-project-lite",
+ "serde",
+ "serde_json",
+ "serde_with",
+ "thiserror 2.0.18",
+ "tokio",
+ "tokio-stream",
+ "tokio-util",
+ "ulid",
+ "url",
+]
+
+[[package]]
+name = "thiserror"
+version = "1.0.69"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b6aaf5339b578ea85b50e080feb250a3e8ae8cfcdff9a461c9ec2904bc923f52"
+dependencies = [
+ "thiserror-impl 1.0.69",
+]
+
+[[package]]
+name = "thiserror"
+version = "2.0.18"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4288b5bcbc7920c07a1149a35cf9590a2aa808e0bc1eafaade0b80947865fbc4"
+dependencies = [
+ "thiserror-impl 2.0.18",
+]
+
+[[package]]
+name = "thiserror-impl"
+version = "1.0.69"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4fee6c4efc90059e10f81e6d42c60a18f76588c3d74cb83a0b242a2b6c7504c1"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "thiserror-impl"
+version = "2.0.18"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ebc4ee7f67670e9b64d05fa4253e753e016c6c95ff35b89b7941d6b856dec1d5"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "tikv-jemalloc-sys"
+version = "0.6.1+5.3.0-1-ge13ca993e8ccb9ba9847cc330696e02839f328f7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cd8aa5b2ab86a2cefa406d889139c162cbb230092f7d1d7cbc1716405d852a3b"
+dependencies = [
+ "cc",
+ "libc",
+]
+
+[[package]]
+name = "tikv-jemallocator"
+version = "0.6.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0359b4327f954e0567e69fb191cf1436617748813819c94b8cd4a431422d053a"
+dependencies = [
+ "libc",
+ "tikv-jemalloc-sys",
+]
+
+[[package]]
+name = "time"
+version = "0.3.47"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "743bd48c283afc0388f9b8827b976905fb217ad9e647fae3a379a9283c4def2c"
+dependencies = [
+ "deranged",
+ "itoa",
+ "num-conv",
+ "powerfmt",
+ "serde_core",
+ "time-core",
+ "time-macros",
+]
+
+[[package]]
+name = "time-core"
+version = "0.1.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7694e1cfe791f8d31026952abf09c69ca6f6fa4e1a1229e18988f06a04a12dca"
+
+[[package]]
+name = "time-macros"
+version = "0.2.27"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2e70e4c5a0e0a8a4823ad65dfe1a6930e4f4d756dcd9dd7939022b5e8c501215"
+dependencies = [
+ "num-conv",
+ "time-core",
+]
+
+[[package]]
+name = "tiny-keccak"
+version = "2.0.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2c9d3793400a45f954c52e73d068316d76b6f4e36977e3fcebb13a2721e80237"
+dependencies = [
+ "crunchy",
+]
+
+[[package]]
+name = "tinystr"
+version = "0.8.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c8323304221c2a851516f22236c5722a72eaa19749016521d6dff0824447d96d"
+dependencies = [
+ "displaydoc",
+ "zerovec",
+]
+
+[[package]]
+name = "tinyvec"
+version = "1.11.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3e61e67053d25a4e82c844e8424039d9745781b3fc4f32b8d55ed50f5f667ef3"
+dependencies = [
+ "tinyvec_macros",
+]
+
+[[package]]
+name = "tinyvec_macros"
+version = "0.1.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1f3ccbac311fea05f86f61904b462b55fb3df8837a366dfc601a0161d0532f20"
+
+[[package]]
+name = "tokio"
+version = "1.51.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "2bd1c4c0fc4a7ab90fc15ef6daaa3ec3b893f004f915f2392557ed23237820cd"
+dependencies = [
+ "bytes",
+ "libc",
+ "mio",
+ "parking_lot",
+ "pin-project-lite",
+ "signal-hook-registry",
+ "socket2",
+ "tokio-macros",
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "tokio-macros"
+version = "2.7.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "385a6cb71ab9ab790c5fe8d67f1645e6c450a7ce006a33de03daa956cf70a496"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "tokio-rustls"
+version = "0.26.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1729aa945f29d91ba541258c8df89027d5792d85a8841fb65e8bf0f4ede4ef61"
+dependencies = [
+ "rustls",
+ "tokio",
+]
+
+[[package]]
+name = "tokio-stream"
+version = "0.1.18"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "32da49809aab5c3bc678af03902d4ccddea2a87d028d86392a4b1560c6906c70"
+dependencies = [
+ "futures-core",
+ "pin-project-lite",
+ "tokio",
+]
+
+[[package]]
+name = "tokio-util"
+version = "0.7.18"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9ae9cec805b01e8fc3fd2fe289f89149a9b66dd16786abd8b19cfa7b48cb0098"
+dependencies = [
+ "bytes",
+ "futures-core",
+ "futures-sink",
+ "pin-project-lite",
+ "tokio",
+]
+
+[[package]]
+name = "tonic"
+version = "0.14.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "fec7c61a0695dc1887c1b53952990f3ad2e3a31453e1f49f10e75424943a93ec"
+dependencies = [
+ "async-trait",
+ "axum",
+ "base64 0.22.1",
+ "bytes",
+ "h2",
+ "http",
+ "http-body",
+ "http-body-util",
+ "hyper",
+ "hyper-timeout",
+ "hyper-util",
+ "percent-encoding",
+ "pin-project",
+ "socket2",
+ "sync_wrapper",
+ "tokio",
+ "tokio-stream",
+ "tower",
+ "tower-layer",
+ "tower-service",
+ "tracing",
+]
+
+[[package]]
+name = "tonic-prost"
+version = "0.14.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a55376a0bbaa4975a3f10d009ad763d8f4108f067c7c2e74f3001fb49778d309"
+dependencies = [
+ "bytes",
+ "prost",
+ "tonic",
+]
+
+[[package]]
+name = "tower"
+version = "0.5.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ebe5ef63511595f1344e2d5cfa636d973292adc0eec1f0ad45fae9f0851ab1d4"
+dependencies = [
+ "futures-core",
+ "futures-util",
+ "indexmap 2.13.1",
+ "pin-project-lite",
+ "slab",
+ "sync_wrapper",
+ "tokio",
+ "tokio-util",
+ "tower-layer",
+ "tower-service",
+ "tracing",
+]
+
+[[package]]
+name = "tower-http"
+version = "0.6.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d4e6559d53cc268e5031cd8429d05415bc4cb4aefc4aa5d6cc35fbf5b924a1f8"
+dependencies = [
+ "bitflags",
+ "bytes",
+ "futures-util",
+ "http",
+ "http-body",
+ "iri-string",
+ "pin-project-lite",
+ "tower",
+ "tower-layer",
+ "tower-service",
+]
+
+[[package]]
+name = "tower-layer"
+version = "0.3.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "121c2a6cda46980bb0fcd1647ffaf6cd3fc79a013de288782836f6df9c48780e"
+
+[[package]]
+name = "tower-service"
+version = "0.3.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8df9b6e13f2d32c91b9bd719c00d1958837bc7dec474d94952798cc8e69eeec3"
+
+[[package]]
+name = "tracing"
+version = "0.1.44"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "63e71662fa4b2a2c3a26f570f037eb95bb1f85397f3cd8076caed2f026a6d100"
+dependencies = [
+ "pin-project-lite",
+ "tracing-attributes",
+ "tracing-core",
+]
+
+[[package]]
+name = "tracing-attributes"
+version = "0.1.31"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7490cfa5ec963746568740651ac6781f701c9c5ea257c58e057f3ba8cf69e8da"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "tracing-core"
+version = "0.1.36"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "db97caf9d906fbde555dd62fa95ddba9eecfd14cb388e4f491a66d74cd5fb79a"
+dependencies = [
+ "once_cell",
+]
+
+[[package]]
+name = "try-lock"
+version = "0.2.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e421abadd41a4225275504ea4d6566923418b7f05506fbc9c0fe86ba7396114b"
+
+[[package]]
+name = "twox-hash"
+version = "2.1.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9ea3136b675547379c4bd395ca6b938e5ad3c3d20fad76e7fe85f9e0d011419c"
+
+[[package]]
+name = "typeid"
+version = "1.0.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bc7d623258602320d5c55d1bc22793b57daff0ec7efc270ea7d55ce1d5f5471c"
+
+[[package]]
+name = "typenum"
+version = "1.19.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "562d481066bde0658276a35467c4af00bdc6ee726305698a55b86e61d7ad82bb"
+
+[[package]]
+name = "ulid"
+version = "1.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "470dbf6591da1b39d43c14523b2b469c86879a53e8b758c8e090a470fe7b1fbe"
+dependencies = [
+ "rand 0.9.2",
+ "web-time",
+]
+
+[[package]]
+name = "unicode-ident"
+version = "1.0.24"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e6e4313cd5fcd3dad5cafa179702e2b244f760991f45397d14d4ebf38247da75"
+
+[[package]]
+name = "unicode-width"
+version = "0.2.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b4ac048d71ede7ee76d585517add45da530660ef4390e49b098733c6e897f254"
+
+[[package]]
+name = "unicode-xid"
+version = "0.2.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ebc1c04c71510c7f702b52b7c350734c9ff1295c464a03335b00bb84fc54f853"
+
+[[package]]
+name = "unindent"
+version = "0.2.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7264e107f553ccae879d21fbea1d6724ac785e8c3bfc762137959b5802826ef3"
+
+[[package]]
+name = "untrusted"
+version = "0.9.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8ecb6da28b8a351d773b68d5825ac39017e680750f980f3a1a85cd8dd28a47c1"
+
+[[package]]
+name = "ureq"
+version = "3.3.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dea7109cdcd5864d4eeb1b58a1648dc9bf520360d7af16ec26d0a9354bafcfc0"
+dependencies = [
+ "base64 0.22.1",
+ "log",
+ "percent-encoding",
+ "rustls",
+ "rustls-pki-types",
+ "ureq-proto",
+ "utf8-zero",
+]
+
+[[package]]
+name = "ureq-proto"
+version = "0.6.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e994ba84b0bd1b1b0cf92878b7ef898a5c1760108fe7b6010327e274917a808c"
+dependencies = [
+ "base64 0.22.1",
+ "http",
+ "httparse",
+ "log",
+]
+
+[[package]]
+name = "url"
+version = "2.5.8"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ff67a8a4397373c3ef660812acab3268222035010ab8680ec4215f38ba3d0eed"
+dependencies = [
+ "form_urlencoded",
+ "idna",
+ "percent-encoding",
+ "serde",
+ "serde_derive",
+]
+
+[[package]]
+name = "utf8-zero"
+version = "0.8.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b8c0a043c9540bae7c578c88f91dda8bd82e59ae27c21baca69c8b191aaf5a6e"
+
+[[package]]
+name = "utf8_iter"
+version = "1.0.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b6c140620e7ffbb22c2dee59cafe6084a59b5ffc27a8859a5f0d494b5d52b6be"
+
+[[package]]
+name = "utf8parse"
+version = "0.2.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "06abde3611657adf66d383f00b093d7faecc7fa57071cce2578660c9f1010821"
+
+[[package]]
+name = "uuid"
+version = "1.23.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5ac8b6f42ead25368cf5b098aeb3dc8a1a2c05a3eee8a9a1a68c640edbfc79d9"
+dependencies = [
+ "getrandom 0.4.2",
+ "js-sys",
+ "serde_core",
+ "wasm-bindgen",
+]
+
+[[package]]
+name = "value-bag"
+version = "1.12.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7ba6f5989077681266825251a52748b8c1d8a4ad098cc37e440103d0ea717fc0"
+dependencies = [
+ "value-bag-serde1",
+ "value-bag-sval2",
+]
+
+[[package]]
+name = "value-bag-serde1"
+version = "1.12.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "16530907bfe2999a1773ca5900a65101e092c70f642f25cc23ca0c43573262c5"
+dependencies = [
+ "erased-serde",
+ "serde_core",
+ "serde_fmt",
+]
+
+[[package]]
+name = "value-bag-sval2"
+version = "1.12.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d00ae130edd690eaa877e4f40605d534790d1cf1d651e7685bd6a144521b251f"
+dependencies = [
+ "sval",
+ "sval_buffer",
+ "sval_dynamic",
+ "sval_fmt",
+ "sval_json",
+ "sval_ref",
+ "sval_serde",
+]
+
+[[package]]
+name = "version_check"
+version = "0.9.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0b928f33d975fc6ad9f86c8f283853ad26bdd5b10b7f1542aa2fa15e2289105a"
+
+[[package]]
+name = "want"
+version = "0.3.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bfa7760aed19e106de2c7c0b581b509f2f25d3dacaf737cb82ac61bc6d760b0e"
+dependencies = [
+ "try-lock",
+]
+
+[[package]]
+name = "wasi"
+version = "0.11.1+wasi-snapshot-preview1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ccf3ec651a847eb01de73ccad15eb7d99f80485de043efb2f370cd654f4ea44b"
+
+[[package]]
+name = "wasip2"
+version = "1.0.2+wasi-0.2.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9517f9239f02c069db75e65f174b3da828fe5f5b945c4dd26bd25d89c03ebcf5"
+dependencies = [
+ "wit-bindgen",
+]
+
+[[package]]
+name = "wasip3"
+version = "0.4.0+wasi-0.3.0-rc-2026-01-06"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5428f8bf88ea5ddc08faddef2ac4a67e390b88186c703ce6dbd955e1c145aca5"
+dependencies = [
+ "wit-bindgen",
+]
+
+[[package]]
+name = "wasm-bindgen"
+version = "0.2.117"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0551fc1bb415591e3372d0bc4780db7e587d84e2a7e79da121051c5c4b89d0b0"
+dependencies = [
+ "cfg-if",
+ "once_cell",
+ "rustversion",
+ "wasm-bindgen-macro",
+ "wasm-bindgen-shared",
+]
+
+[[package]]
+name = "wasm-bindgen-futures"
+version = "0.4.67"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "03623de6905b7206edd0a75f69f747f134b7f0a2323392d664448bf2d3c5d87e"
+dependencies = [
+ "js-sys",
+ "wasm-bindgen",
+]
+
+[[package]]
+name = "wasm-bindgen-macro"
+version = "0.2.117"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7fbdf9a35adf44786aecd5ff89b4563a90325f9da0923236f6104e603c7e86be"
+dependencies = [
+ "quote",
+ "wasm-bindgen-macro-support",
+]
+
+[[package]]
+name = "wasm-bindgen-macro-support"
+version = "0.2.117"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "dca9693ef2bab6d4e6707234500350d8dad079eb508dca05530c85dc3a529ff2"
+dependencies = [
+ "bumpalo",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+ "wasm-bindgen-shared",
+]
+
+[[package]]
+name = "wasm-bindgen-shared"
+version = "0.2.117"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "39129a682a6d2d841b6c429d0c51e5cb0ed1a03829d8b3d1e69a011e62cb3d3b"
+dependencies = [
+ "unicode-ident",
+]
+
+[[package]]
+name = "wasm-encoder"
+version = "0.244.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "990065f2fe63003fe337b932cfb5e3b80e0b4d0f5ff650e6985b1048f62c8319"
+dependencies = [
+ "leb128fmt",
+ "wasmparser",
+]
+
+[[package]]
+name = "wasm-metadata"
+version = "0.244.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bb0e353e6a2fbdc176932bbaab493762eb1255a7900fe0fea1a2f96c296cc909"
+dependencies = [
+ "anyhow",
+ "indexmap 2.13.1",
+ "wasm-encoder",
+ "wasmparser",
+]
+
+[[package]]
+name = "wasm-streams"
+version = "0.4.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "15053d8d85c7eccdbefef60f06769760a563c7f0a9d6902a13d35c7800b0ad65"
+dependencies = [
+ "futures-util",
+ "js-sys",
+ "wasm-bindgen",
+ "wasm-bindgen-futures",
+ "web-sys",
+]
+
+[[package]]
+name = "wasmparser"
+version = "0.244.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "47b807c72e1bac69382b3a6fb3dbe8ea4c0ed87ff5629b8685ae6b9a611028fe"
+dependencies = [
+ "bitflags",
+ "hashbrown 0.15.5",
+ "indexmap 2.13.1",
+ "semver",
+]
+
+[[package]]
+name = "web-sys"
+version = "0.3.94"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cd70027e39b12f0849461e08ffc50b9cd7688d942c1c8e3c7b22273236b4dd0a"
+dependencies = [
+ "js-sys",
+ "wasm-bindgen",
+]
+
+[[package]]
+name = "web-time"
+version = "1.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5a6580f308b1fad9207618087a65c04e7a10bc77e02c8e84e9b00dd4b12fa0bb"
+dependencies = [
+ "js-sys",
+ "wasm-bindgen",
+]
+
+[[package]]
+name = "webpki-roots"
+version = "1.0.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "22cfaf3c063993ff62e73cb4311efde4db1efb31ab78a3e5c457939ad5cc0bed"
+dependencies = [
+ "rustls-pki-types",
+]
+
+[[package]]
+name = "winapi"
+version = "0.3.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5c839a674fcd7a98952e593242ea400abe93992746761e38641405d28b00f419"
+dependencies = [
+ "winapi-i686-pc-windows-gnu",
+ "winapi-x86_64-pc-windows-gnu",
+]
+
+[[package]]
+name = "winapi-i686-pc-windows-gnu"
+version = "0.4.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ac3b87c63620426dd9b991e5ce0329eff545bccbbb34f3be09ff6fb6ab51b7b6"
+
+[[package]]
+name = "winapi-util"
+version = "0.1.11"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c2a7b1c03c876122aa43f3020e6c3c3ee5c05081c9a00739faf7503aeba10d22"
+dependencies = [
+ "windows-sys 0.61.2",
+]
+
+[[package]]
+name = "winapi-x86_64-pc-windows-gnu"
+version = "0.4.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "712e227841d057c1ee1cd2fb22fa7e5a5461ae8e48fa2ca79ec42cfc1931183f"
+
+[[package]]
+name = "windows-core"
+version = "0.62.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b8e83a14d34d0623b51dce9581199302a221863196a1dde71a7663a4c2be9deb"
+dependencies = [
+ "windows-implement",
+ "windows-interface",
+ "windows-link",
+ "windows-result",
+ "windows-strings",
+]
+
+[[package]]
+name = "windows-implement"
+version = "0.60.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "053e2e040ab57b9dc951b72c264860db7eb3b0200ba345b4e4c3b14f67855ddf"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "windows-interface"
+version = "0.59.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "3f316c4a2570ba26bbec722032c4099d8c8bc095efccdc15688708623367e358"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "windows-link"
+version = "0.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f0805222e57f7521d6a62e36fa9163bc891acd422f971defe97d64e70d0a4fe5"
+
+[[package]]
+name = "windows-result"
+version = "0.4.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7781fa89eaf60850ac3d2da7af8e5242a5ea78d1a11c49bf2910bb5a73853eb5"
+dependencies = [
+ "windows-link",
+]
+
+[[package]]
+name = "windows-strings"
+version = "0.5.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "7837d08f69c77cf6b07689544538e017c1bfcf57e34b4c0ff58e6c2cd3b37091"
+dependencies = [
+ "windows-link",
+]
+
+[[package]]
+name = "windows-sys"
+version = "0.52.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "282be5f36a8ce781fad8c8ae18fa3f9beff57ec1b52cb3de0789201425d9a33d"
+dependencies = [
+ "windows-targets 0.52.6",
+]
+
+[[package]]
+name = "windows-sys"
+version = "0.59.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1e38bc4d79ed67fd075bcc251a1c39b32a1776bbe92e5bef1f0bf1f8c531853b"
+dependencies = [
+ "windows-targets 0.52.6",
+]
+
+[[package]]
+name = "windows-sys"
+version = "0.60.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f2f500e4d28234f72040990ec9d39e3a6b950f9f22d3dba18416c35882612bcb"
+dependencies = [
+ "windows-targets 0.53.5",
+]
+
+[[package]]
+name = "windows-sys"
+version = "0.61.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ae137229bcbd6cdf0f7b80a31df61766145077ddf49416a728b02cb3921ff3fc"
+dependencies = [
+ "windows-link",
+]
+
+[[package]]
+name = "windows-targets"
+version = "0.52.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9b724f72796e036ab90c1021d4780d4d3d648aca59e491e6b98e725b84e99973"
+dependencies = [
+ "windows_aarch64_gnullvm 0.52.6",
+ "windows_aarch64_msvc 0.52.6",
+ "windows_i686_gnu 0.52.6",
+ "windows_i686_gnullvm 0.52.6",
+ "windows_i686_msvc 0.52.6",
+ "windows_x86_64_gnu 0.52.6",
+ "windows_x86_64_gnullvm 0.52.6",
+ "windows_x86_64_msvc 0.52.6",
+]
+
+[[package]]
+name = "windows-targets"
+version = "0.53.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "4945f9f551b88e0d65f3db0bc25c33b8acea4d9e41163edf90dcd0b19f9069f3"
+dependencies = [
+ "windows-link",
+ "windows_aarch64_gnullvm 0.53.1",
+ "windows_aarch64_msvc 0.53.1",
+ "windows_i686_gnu 0.53.1",
+ "windows_i686_gnullvm 0.53.1",
+ "windows_i686_msvc 0.53.1",
+ "windows_x86_64_gnu 0.53.1",
+ "windows_x86_64_gnullvm 0.53.1",
+ "windows_x86_64_msvc 0.53.1",
+]
+
+[[package]]
+name = "windows_aarch64_gnullvm"
+version = "0.52.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "32a4622180e7a0ec044bb555404c800bc9fd9ec262ec147edd5989ccd0c02cd3"
+
+[[package]]
+name = "windows_aarch64_gnullvm"
+version = "0.53.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a9d8416fa8b42f5c947f8482c43e7d89e73a173cead56d044f6a56104a6d1b53"
+
+[[package]]
+name = "windows_aarch64_msvc"
+version = "0.52.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "09ec2a7bb152e2252b53fa7803150007879548bc709c039df7627cabbd05d469"
+
+[[package]]
+name = "windows_aarch64_msvc"
+version = "0.53.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b9d782e804c2f632e395708e99a94275910eb9100b2114651e04744e9b125006"
+
+[[package]]
+name = "windows_i686_gnu"
+version = "0.52.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8e9b5ad5ab802e97eb8e295ac6720e509ee4c243f69d781394014ebfe8bbfa0b"
+
+[[package]]
+name = "windows_i686_gnu"
+version = "0.53.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "960e6da069d81e09becb0ca57a65220ddff016ff2d6af6a223cf372a506593a3"
+
+[[package]]
+name = "windows_i686_gnullvm"
+version = "0.52.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0eee52d38c090b3caa76c563b86c3a4bd71ef1a819287c19d586d7334ae8ed66"
+
+[[package]]
+name = "windows_i686_gnullvm"
+version = "0.53.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "fa7359d10048f68ab8b09fa71c3daccfb0e9b559aed648a8f95469c27057180c"
+
+[[package]]
+name = "windows_i686_msvc"
+version = "0.52.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "240948bc05c5e7c6dabba28bf89d89ffce3e303022809e73deaefe4f6ec56c66"
+
+[[package]]
+name = "windows_i686_msvc"
+version = "0.53.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1e7ac75179f18232fe9c285163565a57ef8d3c89254a30685b57d83a38d326c2"
+
+[[package]]
+name = "windows_x86_64_gnu"
+version = "0.52.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "147a5c80aabfbf0c7d901cb5895d1de30ef2907eb21fbbab29ca94c5b08b1a78"
+
+[[package]]
+name = "windows_x86_64_gnu"
+version = "0.53.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9c3842cdd74a865a8066ab39c8a7a473c0778a3f29370b5fd6b4b9aa7df4a499"
+
+[[package]]
+name = "windows_x86_64_gnullvm"
+version = "0.52.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "24d5b23dc417412679681396f2b49f3de8c1473deb516bd34410872eff51ed0d"
+
+[[package]]
+name = "windows_x86_64_gnullvm"
+version = "0.53.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0ffa179e2d07eee8ad8f57493436566c7cc30ac536a3379fdf008f47f6bb7ae1"
+
+[[package]]
+name = "windows_x86_64_msvc"
+version = "0.52.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "589f6da84c646204747d1270a2a5661ea66ed1cced2631d546fdfb155959f9ec"
+
+[[package]]
+name = "windows_x86_64_msvc"
+version = "0.53.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d6bbff5f0aada427a1e5a6da5f1f98158182f26556f345ac9e04d36d0ebed650"
+
+[[package]]
+name = "wit-bindgen"
+version = "0.51.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "d7249219f66ced02969388cf2bb044a09756a083d0fab1e566056b04d9fbcaa5"
+dependencies = [
+ "wit-bindgen-rust-macro",
+]
+
+[[package]]
+name = "wit-bindgen-core"
+version = "0.51.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ea61de684c3ea68cb082b7a88508a8b27fcc8b797d738bfc99a82facf1d752dc"
+dependencies = [
+ "anyhow",
+ "heck",
+ "wit-parser",
+]
+
+[[package]]
+name = "wit-bindgen-rust"
+version = "0.51.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b7c566e0f4b284dd6561c786d9cb0142da491f46a9fbed79ea69cdad5db17f21"
+dependencies = [
+ "anyhow",
+ "heck",
+ "indexmap 2.13.1",
+ "prettyplease",
+ "syn 2.0.117",
+ "wasm-metadata",
+ "wit-bindgen-core",
+ "wit-component",
+]
+
+[[package]]
+name = "wit-bindgen-rust-macro"
+version = "0.51.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0c0f9bfd77e6a48eccf51359e3ae77140a7f50b1e2ebfe62422d8afdaffab17a"
+dependencies = [
+ "anyhow",
+ "prettyplease",
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+ "wit-bindgen-core",
+ "wit-bindgen-rust",
+]
+
+[[package]]
+name = "wit-component"
+version = "0.244.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9d66ea20e9553b30172b5e831994e35fbde2d165325bec84fc43dbf6f4eb9cb2"
+dependencies = [
+ "anyhow",
+ "bitflags",
+ "indexmap 2.13.1",
+ "log",
+ "serde",
+ "serde_derive",
+ "serde_json",
+ "wasm-encoder",
+ "wasm-metadata",
+ "wasmparser",
+ "wit-parser",
+]
+
+[[package]]
+name = "wit-parser"
+version = "0.244.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ecc8ac4bc1dc3381b7f59c34f00b67e18f910c2c0f50015669dde7def656a736"
+dependencies = [
+ "anyhow",
+ "id-arena",
+ "indexmap 2.13.1",
+ "log",
+ "semver",
+ "serde",
+ "serde_derive",
+ "serde_json",
+ "unicode-xid",
+ "wasmparser",
+]
+
+[[package]]
+name = "writeable"
+version = "0.6.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "1ffae5123b2d3fc086436f8834ae3ab053a283cfac8fe0a0b8eaae044768a4c4"
+
+[[package]]
+name = "wyz"
+version = "0.5.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "05f360fc0b24296329c78fda852a1e9ae82de9cf7b27dae4b7f62f118f77b9ed"
+dependencies = [
+ "tap",
+]
+
+[[package]]
+name = "xattr"
+version = "1.6.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "32e45ad4206f6d2479085147f02bc2ef834ac85886624a23575ae137c8aa8156"
+dependencies = [
+ "libc",
+ "rustix",
+]
+
+[[package]]
+name = "yoke"
+version = "0.8.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "abe8c5fda708d9ca3df187cae8bfb9ceda00dd96231bed36e445a1a48e66f9ca"
+dependencies = [
+ "stable_deref_trait",
+ "yoke-derive",
+ "zerofrom",
+]
+
+[[package]]
+name = "yoke-derive"
+version = "0.8.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "de844c262c8848816172cef550288e7dc6c7b7814b4ee56b3e1553f275f1858e"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+ "synstructure",
+]
+
+[[package]]
+name = "zerocopy"
+version = "0.8.48"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "eed437bf9d6692032087e337407a86f04cd8d6a16a37199ed57949d415bd68e9"
+dependencies = [
+ "zerocopy-derive",
+]
+
+[[package]]
+name = "zerocopy-derive"
+version = "0.8.48"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "70e3cd084b1788766f53af483dd21f93881ff30d7320490ec3ef7526d203bad4"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "zerofrom"
+version = "0.1.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "69faa1f2a1ea75661980b013019ed6687ed0e83d069bc1114e2cc74c6c04c4df"
+dependencies = [
+ "zerofrom-derive",
+]
+
+[[package]]
+name = "zerofrom-derive"
+version = "0.1.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "11532158c46691caf0f2593ea8358fed6bbf68a0315e80aae9bd41fbade684a1"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+ "synstructure",
+]
+
+[[package]]
+name = "zeroize"
+version = "1.8.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b97154e67e32c85465826e8bcc1c59429aaaf107c1e4a9e53c8d8ccd5eff88d0"
+
+[[package]]
+name = "zerotrie"
+version = "0.2.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0f9152d31db0792fa83f70fb2f83148effb5c1f5b8c7686c3459e361d9bc20bf"
+dependencies = [
+ "displaydoc",
+ "yoke",
+ "zerofrom",
+]
+
+[[package]]
+name = "zerovec"
+version = "0.11.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "90f911cbc359ab6af17377d242225f4d75119aec87ea711a880987b18cd7b239"
+dependencies = [
+ "yoke",
+ "zerofrom",
+ "zerovec-derive",
+]
+
+[[package]]
+name = "zerovec-derive"
+version = "0.11.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "625dc425cab0dca6dc3c3319506e6593dcb08a9f387ea3b284dbd52a92c40555"
+dependencies = [
+ "proc-macro2",
+ "quote",
+ "syn 2.0.117",
+]
+
+[[package]]
+name = "zmij"
+version = "1.0.21"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b8848ee67ecc8aedbaf3e4122217aff892639231befc6a1b58d29fff4c2cabaa"
+
+[[package]]
+name = "zstd"
+version = "0.13.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e91ee311a569c327171651566e07972200e76fcfe2242a4fa446149a3881c08a"
+dependencies = [
+ "zstd-safe",
+]
+
+[[package]]
+name = "zstd-safe"
+version = "7.2.4"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "8f49c4d5f0abb602a93fb8736af2a4f4dd9512e36f7f570d66e65ff867ed3b9d"
+dependencies = [
+ "zstd-sys",
+]
+
+[[package]]
+name = "zstd-sys"
+version = "2.0.16+zstd.1.5.7"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "91e19ebc2adc8f83e43039e79776e3fda8ca919132d68a1fed6a5faca2683748"
+dependencies = [
+ "cc",
+ "pkg-config",
+]

From 8fa67f6cd2bfe6833d20d927fd3fc2b2c9321ef2 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekei@apache.org>
Date: Sun, 5 Apr 2026 22:13:52 +0100
Subject: [PATCH 224/287] fix: upgrade testcontainers to 0.27.2 to resolve CVEs
 (#482)

* fix: upgrade testcontainers to 0.27.2 to resolve CVEs

Fixes RUSTSEC-2026-0066 (astral-tokio-tar) and
RUSTSEC-2025-0134 (rustls-pemfile unmaintained).

* chore: remove unused test-env-helpers dev-dependency
---
 fluss-rust/Cargo.lock              | 179 +++++++++++------------------
 fluss-rust/crates/fluss/Cargo.toml |   3 +-
 2 files changed, 70 insertions(+), 112 deletions(-)

diff --git a/fluss-rust/Cargo.lock b/fluss-rust/Cargo.lock
index a3b533d9cb..5af3f8758e 100644
--- a/fluss-rust/Cargo.lock
+++ b/fluss-rust/Cargo.lock
@@ -324,9 +324,9 @@ dependencies = [
 
 [[package]]
 name = "astral-tokio-tar"
-version = "0.5.6"
+version = "0.6.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "ec179a06c1769b1e42e1e2cbe74c7dcdb3d6383c838454d063eaac5bbb7ebbe5"
+checksum = "3c23f3af104b40a3430ccb90ed5f7bd877a8dc5c26fc92fde51a22b40890dcf9"
 dependencies = [
  "filetime",
  "futures-core",
@@ -357,7 +357,7 @@ checksum = "c7c24de15d275a1ecfd47a380fb4d5ec9bfe0933f309ed5e705b775596a3574d"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -368,7 +368,7 @@ checksum = "9035ad2d096bed7955a320ee7e2230574d28fd3c3a0f186cbea1ff3c7eed5dbb"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -501,9 +501,9 @@ dependencies = [
 
 [[package]]
 name = "bollard"
-version = "0.19.4"
+version = "0.20.2"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "87a52479c9237eb04047ddb94788c41ca0d26eaff8b697ecfbb4c32f7fdc3b1b"
+checksum = "ee04c4c84f1f811b017f2fbb7dd8815c976e7ca98593de9c1e2afad0f636bff4"
 dependencies = [
  "async-stream",
  "base64 0.22.1",
@@ -511,7 +511,6 @@ dependencies = [
  "bollard-buildkit-proto",
  "bollard-stubs",
  "bytes",
- "chrono",
  "futures-core",
  "futures-util",
  "hex",
@@ -529,14 +528,13 @@ dependencies = [
  "rand 0.9.2",
  "rustls",
  "rustls-native-certs",
- "rustls-pemfile",
  "rustls-pki-types",
  "serde",
  "serde_derive",
  "serde_json",
- "serde_repr",
  "serde_urlencoded",
  "thiserror 2.0.18",
+ "time",
  "tokio",
  "tokio-stream",
  "tokio-util",
@@ -561,19 +559,18 @@ dependencies = [
 
 [[package]]
 name = "bollard-stubs"
-version = "1.49.1-rc.28.4.0"
+version = "1.52.1-rc.29.1.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "5731fe885755e92beff1950774068e0cae67ea6ec7587381536fca84f1779623"
+checksum = "0f0a8ca8799131c1837d1282c3f81f31e76ceb0ce426e04a7fe1ccee3287c066"
 dependencies = [
  "base64 0.22.1",
  "bollard-buildkit-proto",
  "bytes",
- "chrono",
  "prost",
  "serde",
  "serde_json",
  "serde_repr",
- "serde_with",
+ "time",
 ]
 
 [[package]]
@@ -663,7 +660,7 @@ dependencies = [
  "heck",
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -819,7 +816,7 @@ dependencies = [
  "proc-macro2",
  "quote",
  "scratch",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -833,7 +830,7 @@ dependencies = [
  "indexmap 2.13.1",
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -851,7 +848,7 @@ dependencies = [
  "indexmap 2.13.1",
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -874,7 +871,7 @@ dependencies = [
  "proc-macro2",
  "quote",
  "strsim",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -885,7 +882,7 @@ checksum = "ac3984ec7bd6cfa798e62b4a642426a5be0e68f9401cfc2a01e3fa9ea2fcdb8d"
 dependencies = [
  "darling_core",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -910,7 +907,7 @@ checksum = "780eb241654bf097afb00fc5f054a09b687dad862e485fdcf8399bb056565370"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -943,7 +940,7 @@ checksum = "97369cbbc041bc366949bc74d34658d6cda5621039731c6310521892a3a20ae0"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -1007,13 +1004,12 @@ dependencies = [
 
 [[package]]
 name = "etcetera"
-version = "0.10.0"
+version = "0.11.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "26c7b13d0780cb82722fd59f6f57f925e143427e4a75313a6c77243bf5326ae6"
+checksum = "de48cc4d1c1d97a20fd819def54b890cadde72ed3ad0c614822a0a433361be96"
 dependencies = [
  "cfg-if",
- "home",
- "windows-sys 0.59.0",
+ "windows-sys 0.61.2",
 ]
 
 [[package]]
@@ -1022,6 +1018,17 @@ version = "2.4.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "a043dc74da1e37d6afe657061213aa6f425f855399a11d3463c6ecccc4dfda1f"
 
+[[package]]
+name = "ferroid"
+version = "0.8.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "bb330bbd4cb7a5b9f559427f06f98a4f853a137c8298f3bd3f8ca57663e21986"
+dependencies = [
+ "portable-atomic",
+ "rand 0.9.2",
+ "web-time",
+]
+
 [[package]]
 name = "filetime"
 version = "0.2.27"
@@ -1110,7 +1117,6 @@ dependencies = [
  "strum",
  "strum_macros",
  "tempfile",
- "test-env-helpers",
  "testcontainers",
  "thiserror 1.0.69",
  "tokio",
@@ -1224,7 +1230,7 @@ checksum = "e835b70203e41293343137df5c0664546da5745f82ec9b84d40be8336958447b"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -1789,7 +1795,7 @@ checksum = "2a8c8b344124222efd714b73bb41f8b5120b27a7cc1c75593a6ff768d9d05aa4"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -2234,7 +2240,7 @@ dependencies = [
  "regex",
  "regex-syntax",
  "structmeta",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -2248,7 +2254,7 @@ dependencies = [
  "regex",
  "regex-syntax",
  "structmeta",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -2285,7 +2291,7 @@ checksum = "d9b20ed30f105399776b9c883e68e536ef602a16ae6f596d2c473591d6ad64c6"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -2352,7 +2358,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "479ca8adacdd7ce8f1fb39ce9ecccbfe93a3f1344b3d0d97f20bc0196208f62b"
 dependencies = [
  "proc-macro2",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -2389,7 +2395,7 @@ dependencies = [
  "prost",
  "prost-types",
  "regex",
- "syn 2.0.117",
+ "syn",
  "tempfile",
 ]
 
@@ -2403,7 +2409,7 @@ dependencies = [
  "itertools",
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -2474,7 +2480,7 @@ dependencies = [
  "proc-macro2",
  "pyo3-macros-backend",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -2487,7 +2493,7 @@ dependencies = [
  "proc-macro2",
  "pyo3-build-config",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -2697,7 +2703,7 @@ checksum = "b7186006dcb21920990093f30e3dea63b7d6e977bf1256be20c3563a5db070da"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -2879,15 +2885,6 @@ dependencies = [
  "security-framework",
 ]
 
-[[package]]
-name = "rustls-pemfile"
-version = "2.2.0"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "dce314e5fee3f39953d46bb63bb8a46d40c2f8fb7cc5a3b6cab2bde9721d6e50"
-dependencies = [
- "rustls-pki-types",
-]
-
 [[package]]
 name = "rustls-pki-types"
 version = "1.14.0"
@@ -3022,7 +3019,7 @@ checksum = "d540f220d3187173da220f885ab66608367b6574e925011a9353e4badda91d79"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3055,7 +3052,7 @@ checksum = "175ee3e80ae9982737ca543e96133087cbd9a485eecc3bc4de9c1a37b47ea59c"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3098,7 +3095,7 @@ dependencies = [
  "darling",
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3175,7 +3172,7 @@ dependencies = [
  "heck",
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3209,7 +3206,7 @@ dependencies = [
  "proc-macro2",
  "quote",
  "structmeta-derive",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3220,7 +3217,7 @@ checksum = "152a0b65a590ff6c3da95cabe2353ee04e6167c896b28e3b14478c2636c922fc"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3239,7 +3236,7 @@ dependencies = [
  "proc-macro2",
  "quote",
  "rustversion",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3326,17 +3323,6 @@ dependencies = [
  "sval_nested",
 ]
 
-[[package]]
-name = "syn"
-version = "1.0.109"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "72b64191b275b66ffe2469e8af2c1cfe3bafa67b529ead792a6d0160888b4237"
-dependencies = [
- "proc-macro2",
- "quote",
- "unicode-ident",
-]
-
 [[package]]
 name = "syn"
 version = "2.0.117"
@@ -3365,7 +3351,7 @@ checksum = "728a70f3dbaf5bab7f0c4b1ac8d7ae5ea60a4b5549c8a5914361c99147a709d2"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3402,21 +3388,11 @@ dependencies = [
  "winapi-util",
 ]
 
-[[package]]
-name = "test-env-helpers"
-version = "0.2.2"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "c6ab8f4822c904dadef9dd99f228f58a10d1b2c6ece06b108257e72fea72b1c6"
-dependencies = [
- "quote",
- "syn 1.0.109",
-]
-
 [[package]]
 name = "testcontainers"
-version = "0.25.2"
+version = "0.27.2"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "3f3ac71069f20ecfa60c396316c283fbf35e6833a53dff551a31b5458da05edc"
+checksum = "0bd36b06a2a6c0c3c81a83be1ab05fe86460d054d4d51bf513bc56b3e15bdc22"
 dependencies = [
  "astral-tokio-tar",
  "async-trait",
@@ -3425,7 +3401,10 @@ dependencies = [
  "docker_credential",
  "either",
  "etcetera",
+ "ferroid",
  "futures",
+ "http",
+ "itertools",
  "log",
  "memchr",
  "parse-display 0.9.1",
@@ -3437,7 +3416,6 @@ dependencies = [
  "tokio",
  "tokio-stream",
  "tokio-util",
- "ulid",
  "url",
 ]
 
@@ -3467,7 +3445,7 @@ checksum = "4fee6c4efc90059e10f81e6d42c60a18f76588c3d74cb83a0b242a2b6c7504c1"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3478,7 +3456,7 @@ checksum = "ebc4ee7f67670e9b64d05fa4253e753e016c6c95ff35b89b7941d6b856dec1d5"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3591,7 +3569,7 @@ checksum = "385a6cb71ab9ab790c5fe8d67f1645e6c450a7ce006a33de03daa956cf70a496"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3736,7 +3714,7 @@ checksum = "7490cfa5ec963746568740651ac6781f701c9c5ea257c58e057f3ba8cf69e8da"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -3772,16 +3750,6 @@ version = "1.19.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "562d481066bde0658276a35467c4af00bdc6ee726305698a55b86e61d7ad82bb"
 
-[[package]]
-name = "ulid"
-version = "1.2.1"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "470dbf6591da1b39d43c14523b2b469c86879a53e8b758c8e090a470fe7b1fbe"
-dependencies = [
- "rand 0.9.2",
- "web-time",
-]
-
 [[package]]
 name = "unicode-ident"
 version = "1.0.24"
@@ -3999,7 +3967,7 @@ dependencies = [
  "bumpalo",
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
  "wasm-bindgen-shared",
 ]
 
@@ -4140,7 +4108,7 @@ checksum = "053e2e040ab57b9dc951b72c264860db7eb3b0200ba345b4e4c3b14f67855ddf"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -4151,7 +4119,7 @@ checksum = "3f316c4a2570ba26bbec722032c4099d8c8bc095efccdc15688708623367e358"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -4187,15 +4155,6 @@ dependencies = [
  "windows-targets 0.52.6",
 ]
 
-[[package]]
-name = "windows-sys"
-version = "0.59.0"
-source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "1e38bc4d79ed67fd075bcc251a1c39b32a1776bbe92e5bef1f0bf1f8c531853b"
-dependencies = [
- "windows-targets 0.52.6",
-]
-
 [[package]]
 name = "windows-sys"
 version = "0.60.2"
@@ -4373,7 +4332,7 @@ dependencies = [
  "heck",
  "indexmap 2.13.1",
  "prettyplease",
- "syn 2.0.117",
+ "syn",
  "wasm-metadata",
  "wit-bindgen-core",
  "wit-component",
@@ -4389,7 +4348,7 @@ dependencies = [
  "prettyplease",
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
  "wit-bindgen-core",
  "wit-bindgen-rust",
 ]
@@ -4475,7 +4434,7 @@ checksum = "de844c262c8848816172cef550288e7dc6c7b7814b4ee56b3e1553f275f1858e"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
  "synstructure",
 ]
 
@@ -4496,7 +4455,7 @@ checksum = "70e3cd084b1788766f53af483dd21f93881ff30d7320490ec3ef7526d203bad4"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
@@ -4516,7 +4475,7 @@ checksum = "11532158c46691caf0f2593ea8358fed6bbf68a0315e80aae9bd41fbade684a1"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
  "synstructure",
 ]
 
@@ -4556,7 +4515,7 @@ checksum = "625dc425cab0dca6dc3c3319506e6593dcb08a9f387ea3b284dbd52a92c40555"
 dependencies = [
  "proc-macro2",
  "quote",
- "syn 2.0.117",
+ "syn",
 ]
 
 [[package]]
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 7b68e51f4e..ef6a62d3a7 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -79,8 +79,7 @@ strum_macros = "0.26"
 jiff = { workspace = true, features = ["js"] }
 
 [dev-dependencies]
-testcontainers = "0.25.0"
-test-env-helpers = "0.2.2"
+testcontainers = "0.27.2"
 
 [build-dependencies]
 prost-build = "0.14"

From 1d97a10100e0194e0774b9dc87ce3ba329e03438 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 5 Apr 2026 22:19:56 +0100
Subject: [PATCH 225/287] chore: skip duplicate pyfluss build in Python CI
 (#483)

---
 fluss-rust/.github/workflows/build_and_test_python.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index 42b6ffad12..3f67157f6c 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -72,7 +72,7 @@ jobs:
       - name: Build Python bindings
         working-directory: bindings/python
         run: |
-          uv sync --extra dev
+          uv sync --extra dev --no-install-project
           uv run maturin develop
 
       - name: Run Python integration tests (parallel)

From cbe878f17a1e865b380913e3d4307bae76a3c240 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jared=20Yu=20=28=E4=BD=99=E5=90=AF=E6=AD=A3=29?=
 <qzyu999@gmail.com>
Date: Thu, 9 Apr 2026 14:35:02 -0700
Subject: [PATCH 226/287] feat: add async 'for' loop support to LogScanner
 (#424) (#438)

---
 fluss-rust/bindings/python/fluss/__init__.pyi |  14 +-
 fluss-rust/bindings/python/src/table.rs       | 168 +++++++-
 .../bindings/python/test/test_log_table.py    | 377 ++++++++++++++++++
 3 files changed, 538 insertions(+), 21 deletions(-)

diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 977845718a..02edcdb367 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -19,7 +19,17 @@
 
 from enum import IntEnum
 from types import TracebackType
-from typing import Dict, Iterator, List, Optional, Tuple, Union, overload
+from typing import (
+    Any,
+    AsyncIterator,
+    Dict,
+    Iterator,
+    List,
+    Optional,
+    Tuple,
+    Union,
+    overload,
+)
 
 import pandas as pd
 import pyarrow as pa
@@ -797,8 +807,8 @@ class LogScanner:
 
         You must call subscribe(), subscribe_buckets(), or subscribe_partition() first.
         """
-        ...
     def __repr__(self) -> str: ...
+    def __aiter__(self) -> AsyncIterator[Union[ScanRecord, RecordBatch]]: ...
 
 class Schema:
     def __init__(
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index cda8d3b201..8d92aba167 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -23,6 +23,7 @@ use arrow_schema::SchemaRef;
 use fluss::record::to_arrow_schema;
 use fluss::rpc::message::OffsetSpec;
 use indexmap::IndexMap;
+use pyo3::IntoPyObjectExt;
 use pyo3::exceptions::{PyIndexError, PyRuntimeError, PyTypeError};
 use pyo3::sync::PyOnceLock;
 use pyo3::types::{
@@ -44,6 +45,7 @@ const MICROS_PER_SECOND: i64 = 1_000_000;
 const MICROS_PER_DAY: i64 = 86_400_000_000;
 const NANOS_PER_MILLI: i64 = 1_000_000;
 const NANOS_PER_MICRO: i64 = 1_000;
+const DEFAULT_POLL_INTERVAL_MS: i64 = 1000;
 
 /// Represents a single scan record with metadata.
 ///
@@ -1886,7 +1888,7 @@ impl ScannerKind {
 /// Both `LogScanner` and `RecordBatchLogScanner` share the same subscribe interface.
 macro_rules! with_scanner {
     ($scanner:expr, $method:ident($($arg:expr),*)) => {
-        match $scanner {
+        match $scanner.as_ref() {
             ScannerKind::Record(s) => s.$method($($arg),*).await,
             ScannerKind::Batch(s) => s.$method($($arg),*).await,
         }
@@ -1900,7 +1902,7 @@ macro_rules! with_scanner {
 /// - Batch-based scanning via `poll_arrow()` / `poll_record_batch()` - returns Arrow batches
 #[pyclass]
 pub struct LogScanner {
-    scanner: ScannerKind,
+    kind: Arc<ScannerKind>,
     admin: Arc<fcore::client::FlussAdmin>,
     table_info: fcore::metadata::TableInfo,
     /// The projected Arrow schema to use for empty table creation
@@ -1921,7 +1923,7 @@ impl LogScanner {
     fn subscribe(&self, py: Python, bucket_id: i32, start_offset: i64) -> PyResult<()> {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
-                with_scanner!(&self.scanner, subscribe(bucket_id, start_offset))
+                with_scanner!(&self.kind, subscribe(bucket_id, start_offset))
                     .map_err(|e| FlussError::from_core_error(&e))
             })
         })
@@ -1934,7 +1936,7 @@ impl LogScanner {
     fn subscribe_buckets(&self, py: Python, bucket_offsets: HashMap<i32, i64>) -> PyResult<()> {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
-                with_scanner!(&self.scanner, subscribe_buckets(&bucket_offsets))
+                with_scanner!(&self.kind, subscribe_buckets(&bucket_offsets))
                     .map_err(|e| FlussError::from_core_error(&e))
             })
         })
@@ -1956,7 +1958,7 @@ impl LogScanner {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
                 with_scanner!(
-                    &self.scanner,
+                    &self.kind,
                     subscribe_partition(partition_id, bucket_id, start_offset)
                 )
                 .map_err(|e| FlussError::from_core_error(&e))
@@ -1976,7 +1978,7 @@ impl LogScanner {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
                 with_scanner!(
-                    &self.scanner,
+                    &self.kind,
                     subscribe_partition_buckets(&partition_bucket_offsets)
                 )
                 .map_err(|e| FlussError::from_core_error(&e))
@@ -1991,7 +1993,7 @@ impl LogScanner {
     fn unsubscribe(&self, py: Python, bucket_id: i32) -> PyResult<()> {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
-                with_scanner!(&self.scanner, unsubscribe(bucket_id))
+                with_scanner!(&self.kind, unsubscribe(bucket_id))
                     .map_err(|e| FlussError::from_core_error(&e))
             })
         })
@@ -2005,11 +2007,8 @@ impl LogScanner {
     fn unsubscribe_partition(&self, py: Python, partition_id: i64, bucket_id: i32) -> PyResult<()> {
         py.detach(|| {
             TOKIO_RUNTIME.block_on(async {
-                with_scanner!(
-                    &self.scanner,
-                    unsubscribe_partition(partition_id, bucket_id)
-                )
-                .map_err(|e| FlussError::from_core_error(&e))
+                with_scanner!(&self.kind, unsubscribe_partition(partition_id, bucket_id))
+                    .map_err(|e| FlussError::from_core_error(&e))
             })
         })
     }
@@ -2029,7 +2028,7 @@ impl LogScanner {
     ///     - Returns an empty ScanRecords if no records are available
     ///     - When timeout expires, returns an empty ScanRecords (NOT an error)
     fn poll(&self, py: Python, timeout_ms: i64) -> PyResult<ScanRecords> {
-        let scanner = self.scanner.as_record()?;
+        let scanner = self.kind.as_record()?;
 
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
@@ -2078,7 +2077,7 @@ impl LogScanner {
     ///     - Returns an empty list if no batches are available
     ///     - When timeout expires, returns an empty list (NOT an error)
     fn poll_record_batch(&self, py: Python, timeout_ms: i64) -> PyResult<Vec<RecordBatch>> {
-        let scanner = self.scanner.as_batch()?;
+        let scanner = self.kind.as_batch()?;
 
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
@@ -2113,7 +2112,7 @@ impl LogScanner {
     ///     - Returns an empty table (with correct schema) if no records are available
     ///     - When timeout expires, returns an empty table (NOT an error)
     fn poll_arrow(&self, py: Python, timeout_ms: i64) -> PyResult<Py<PyAny>> {
-        let scanner = self.scanner.as_batch()?;
+        let scanner = self.kind.as_batch()?;
 
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
@@ -2166,8 +2165,9 @@ impl LogScanner {
     /// Returns:
     ///     PyArrow Table containing all data from subscribed buckets
     fn to_arrow(&self, py: Python) -> PyResult<Py<PyAny>> {
-        let scanner = self.scanner.as_batch()?;
+        let scanner = self.kind.as_batch()?;
         let subscribed = scanner.get_subscribed_buckets();
+
         if subscribed.is_empty() {
             return Err(FlussError::new_err(
                 "No buckets subscribed. Call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.",
@@ -2198,6 +2198,136 @@ impl LogScanner {
         Ok(df)
     }
 
+    fn __aiter__<'py>(slf: PyRef<'py, Self>) -> PyResult<Bound<'py, PyAny>> {
+        let py = slf.py();
+
+        // Compiled once and cached in a static PyOnceLock; the same Python async generator serves both scanner kinds
+        static ASYNC_GEN_FN: PyOnceLock<Py<PyAny>> = PyOnceLock::new();
+
+        let gen_fn = ASYNC_GEN_FN.get_or_init(py, || {
+            let code = pyo3::ffi::c_str!(
+                r#"
+async def _async_scan_generic(scanner, method_name):
+    # Dynamically resolve the polling method (e.g., _async_poll or _async_poll_batches)
+    poll_method = getattr(scanner, method_name)
+    while True:
+        items = await poll_method()
+        if items:
+            for item in items:
+                yield item
+"#
+            );
+            let globals = pyo3::types::PyDict::new(py);
+            py.run(code, Some(&globals), None).unwrap();
+            globals
+                .get_item("_async_scan_generic")
+                .unwrap()
+                .unwrap()
+                .unbind()
+        });
+
+        // Determine which internal method to call based on the scanner kind
+        let method_name = match slf.kind.as_ref() {
+            ScannerKind::Record(_) => "_async_poll",
+            ScannerKind::Batch(_) => "_async_poll_batches",
+        };
+
+        // Instantiate the generator with the scanner instance and the target method name
+        gen_fn
+            .bind(py)
+            .call1((slf.into_bound_py_any(py)?, method_name))
+    }
+
+    /// Perform a single bounded poll and return a list of ScanRecord objects.
+    ///
+    /// This is the async building block used by `__aiter__` (record mode) to
+    /// implement `async for`. Each call does exactly one network poll (bounded
+    /// by `DEFAULT_POLL_INTERVAL_MS`), converts any results to Python ScanRecord objects,
+    /// and returns them as a list. An empty list signals a timeout (no data yet), not
+    /// end-of-stream.
+    ///
+    /// Returns:
+    ///     Awaitable that resolves to a list of ScanRecord objects
+    fn _async_poll<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let timeout = Duration::from_millis(DEFAULT_POLL_INTERVAL_MS as u64);
+
+        let scanner = Arc::clone(&self.kind);
+        let projected_row_type = self.projected_row_type.clone();
+
+        future_into_py(py, async move {
+            let core_scanner = match scanner.as_ref() {
+                ScannerKind::Record(s) => s,
+                ScannerKind::Batch(_) => {
+                    return Err(PyTypeError::new_err(
+                        "This internal method only supports record-based scanners. \
+                         For batch-based scanners, use 'async for' or 'poll_record_batch' instead.",
+                    ));
+                }
+            };
+
+            let scan_records = core_scanner
+                .poll(timeout)
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))?;
+
+            // Convert to Python list
+            Python::attach(|py| {
+                let mut result: Vec<Py<ScanRecord>> = Vec::new();
+                for (_, records) in scan_records.into_records_by_buckets() {
+                    for core_record in records {
+                        let scan_record =
+                            ScanRecord::from_core(py, &core_record, &projected_row_type)?;
+                        result.push(Py::new(py, scan_record)?);
+                    }
+                }
+                Ok(result)
+            })
+        })
+    }
+
+    /// Perform a single bounded poll and return a list of RecordBatch objects.
+    ///
+    /// This is the async building block used by `__aiter__` (batch mode) to
+    /// implement `async for`. Each call does exactly one network poll (bounded
+    /// by `DEFAULT_POLL_INTERVAL_MS`), converts any results to Python RecordBatch objects,
+    /// and returns them as a list. An empty list signals a timeout (no data
+    /// yet), not end-of-stream.
+    ///
+    /// Returns:
+    ///     Awaitable that resolves to a list of RecordBatch objects
+    fn _async_poll_batches<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let timeout = Duration::from_millis(DEFAULT_POLL_INTERVAL_MS as u64);
+
+        let scanner = Arc::clone(&self.kind);
+
+        future_into_py(py, async move {
+            let core_scanner = match scanner.as_ref() {
+                ScannerKind::Batch(s) => s,
+                ScannerKind::Record(_) => {
+                    return Err(PyTypeError::new_err(
+                        "This internal method only supports batch-based scanners. \
+                         For record-based scanners, use 'async for' or 'poll' instead.",
+                    ));
+                }
+            };
+
+            let scan_batches = core_scanner
+                .poll(timeout)
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))?;
+
+            // Convert to Python list of RecordBatch objects
+            Python::attach(|py| {
+                let mut result: Vec<Py<RecordBatch>> = Vec::new();
+                for scan_batch in scan_batches {
+                    let rb = RecordBatch::from_scan_batch(scan_batch);
+                    result.push(Py::new(py, rb)?);
+                }
+                Ok(result)
+            })
+        })
+    }
+
     fn __repr__(&self) -> String {
         format!("LogScanner(table={})", self.table_info.table_path)
     }
@@ -2212,7 +2342,7 @@ impl LogScanner {
         projected_row_type: fcore::metadata::RowType,
     ) -> Self {
         Self {
-            scanner,
+            kind: Arc::new(scanner),
             admin,
             table_info,
             projected_schema,
@@ -2263,7 +2393,7 @@ impl LogScanner {
         py: Python,
         subscribed: &[(fcore::metadata::TableBucket, i64)],
     ) -> PyResult<HashMap<fcore::metadata::TableBucket, i64>> {
-        let scanner = self.scanner.as_batch()?;
+        let scanner = self.kind.as_batch()?;
         let is_partitioned = scanner.is_partitioned();
         let table_path = &self.table_info.table_path;
 
@@ -2366,7 +2496,7 @@ impl LogScanner {
         py: Python,
         mut stopping_offsets: HashMap<fcore::metadata::TableBucket, i64>,
     ) -> PyResult<Py<PyAny>> {
-        let scanner = self.scanner.as_batch()?;
+        let scanner = self.kind.as_batch()?;
         let mut all_batches = Vec::new();
 
         while !stopping_offsets.is_empty() {
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
index dd1a4d4f3e..eb11874864 100644
--- a/fluss-rust/bindings/python/test/test_log_table.py
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -729,6 +729,382 @@ async def test_scan_records_indexing_and_slicing(connection, admin):
     await admin.drop_table(table_path, ignore_if_not_exists=False)
 
 
+async def test_async_iterator(connection, admin):
+    """Test the Python asynchronous iterator loop (`async for`) on LogScanner."""
+    table_path = fluss.TablePath("fluss", "py_test_async_iterator")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("val", pa.string())])
+    )
+    await admin.create_table(table_path, fluss.TableDescriptor(schema))
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+    
+    # Write 5 records
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [pa.array(list(range(1, 6)), type=pa.int32()),
+             pa.array([f"async{i}" for i in range(1, 6)])],
+            schema=pa.schema([pa.field("id", pa.int32()), pa.field("val", pa.string())]),
+        )
+    )
+    await writer.flush()
+
+    scanner = await table.new_scan().create_log_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+    collected = []
+    
+    # Exercise the `async for` protocol added to LogScanner for issue #424:
+    async def consume_scanner():
+        async for record in scanner:
+            collected.append(record)
+            if len(collected) == 5:
+                break
+                
+    # We must race the consumption against a timeout so the test doesn't hang if the iterator is broken
+    await asyncio.wait_for(consume_scanner(), timeout=10.0)
+    
+    assert len(collected) == 5, f"Expected 5 records, got {len(collected)}"
+    
+    collected.sort(key=lambda r: r.row["id"])
+    for i, record in enumerate(collected):
+        assert record.row["id"] == i + 1
+        assert record.row["val"] == f"async{i + 1}"
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_async_iterator_break_no_leak(connection, admin):
+    """Verify that breaking out of `async for` does not leak resources.
+
+    After breaking, the scanner must still be usable for synchronous
+    `poll()` calls.  If abandoning the generator left a background task
+    or an in-flight poll holding the scanner, the `poll()` below would
+    deadlock or error.
+    """
+    table_path = fluss.TablePath("fluss", "py_test_async_break_leak")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("val", pa.string())])
+    )
+    await admin.create_table(table_path, fluss.TableDescriptor(schema))
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [
+                pa.array(list(range(1, 11)), type=pa.int32()),
+                pa.array([f"v{i}" for i in range(1, 11)]),
+            ],
+            schema=pa.schema(
+                [pa.field("id", pa.int32()), pa.field("val", pa.string())]
+            ),
+        )
+    )
+    await writer.flush()
+
+    scanner = await table.new_scan().create_log_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner.subscribe_buckets(
+        {i: fluss.EARLIEST_OFFSET for i in range(num_buckets)}
+    )
+
+    # Phase 1: async for with early break (collect only 3 of 10)
+    collected_async = []
+
+    async def consume_and_break():
+        async for record in scanner:
+            collected_async.append(record)
+            if len(collected_async) >= 3:
+                break
+
+    await asyncio.wait_for(consume_and_break(), timeout=10.0)
+    assert len(collected_async) == 3, (
+        f"Expected 3 records from async for, got {len(collected_async)}"
+    )
+
+    # Phase 2: sync poll() must still work — proves no leaked task / lock.
+    # With small data and few buckets, _async_poll may have fetched all
+    # records in one batch. After break, the un-yielded records from that
+    # batch are lost. So sync poll may return 0 records — the key assertion
+    # is that poll() completes without deadlock (returns within timeout).
+    remaining = scanner.poll(2000)
+    assert remaining is not None, "poll() should return (not deadlock)"
+
+    # If we got records, verify no duplicates
+    async_ids = {r.row["id"] for r in collected_async}
+    sync_ids = {r.row["id"] for r in remaining}
+    assert async_ids.isdisjoint(sync_ids), (
+        f"Duplicate IDs between async and sync: {async_ids & sync_ids}"
+    )
+
+    # All IDs must be from the original 1-10 range
+    all_ids = async_ids | sync_ids
+    assert all_ids.issubset(set(range(1, 11))), (
+        f"Unexpected IDs: {all_ids - set(range(1, 11))}"
+    )
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_async_iterator_multiple_batches(connection, admin):
+    """Verify async iteration works across multiple network poll cycles.
+
+    _async_poll does a single bounded poll per call.  Writing 20 records
+    to multiple buckets makes it likely (though not guaranteed) that the
+    Python generator loops through several _async_poll calls to collect them.
+    """
+    table_path = fluss.TablePath("fluss", "py_test_async_multi_batch")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("val", pa.string())])
+    )
+    table_descriptor = fluss.TableDescriptor(
+        schema, bucket_count=3, bucket_keys=["id"]
+    )
+    await admin.create_table(
+        table_path, table_descriptor, ignore_if_exists=False
+    )
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+
+    num_records = 20
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [
+                pa.array(list(range(1, num_records + 1)), type=pa.int32()),
+                pa.array([f"multi{i}" for i in range(1, num_records + 1)]),
+            ],
+            schema=pa.schema(
+                [pa.field("id", pa.int32()), pa.field("val", pa.string())]
+            ),
+        )
+    )
+    await writer.flush()
+
+    scanner = await table.new_scan().create_log_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner.subscribe_buckets(
+        {i: fluss.EARLIEST_OFFSET for i in range(num_buckets)}
+    )
+
+    collected = []
+
+    async def consume_all():
+        async for record in scanner:
+            collected.append(record)
+            if len(collected) >= num_records:
+                break
+
+    await asyncio.wait_for(consume_all(), timeout=15.0)
+    assert len(collected) == num_records, (
+        f"Expected {num_records} records, got {len(collected)}"
+    )
+
+    # Verify all IDs are present (order may vary due to bucketing)
+    ids = sorted(r.row["id"] for r in collected)
+    assert ids == list(range(1, num_records + 1))
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_batch_async_iterator(connection, admin):
+    """Test the Python asynchronous iterator loop (`async for`) on a batch LogScanner.
+
+    With our __aiter__ dispatch, a batch-based scanner should yield RecordBatch
+    objects (not ScanRecord). Each yielded item has .batch (PyArrow RecordBatch),
+    .bucket, .base_offset, .last_offset.
+    """
+    table_path = fluss.TablePath("fluss", "py_test_batch_async_iter")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("val", pa.string())])
+    )
+    await admin.create_table(table_path, fluss.TableDescriptor(schema))
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [
+                pa.array(list(range(1, 7)), type=pa.int32()),
+                pa.array([f"bv{i}" for i in range(1, 7)]),
+            ],
+            schema=pa.schema(
+                [pa.field("id", pa.int32()), pa.field("val", pa.string())]
+            ),
+        )
+    )
+    await writer.flush()
+
+    batch_scanner = await table.new_scan().create_record_batch_log_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    batch_scanner.subscribe_buckets(
+        {i: fluss.EARLIEST_OFFSET for i in range(num_buckets)}
+    )
+
+    collected_batches = []
+    total_rows = 0
+
+    async def consume_batches():
+        nonlocal total_rows
+        async for rb in batch_scanner:
+            collected_batches.append(rb)
+            total_rows += rb.batch.num_rows
+            if total_rows >= 6:
+                break
+
+    await asyncio.wait_for(consume_batches(), timeout=15.0)
+
+    assert total_rows >= 6, f"Expected >=6 total rows, got {total_rows}"
+    assert len(collected_batches) > 0
+
+    # Verify each yielded item is a RecordBatch with expected attributes
+    for rb in collected_batches:
+        assert hasattr(rb, "batch"), "RecordBatch should have .batch"
+        assert hasattr(rb, "bucket"), "RecordBatch should have .bucket"
+        assert hasattr(rb, "base_offset"), "RecordBatch should have .base_offset"
+        assert hasattr(rb, "last_offset"), "RecordBatch should have .last_offset"
+        # .batch should be a PyArrow RecordBatch
+        arrow_batch = rb.batch
+        assert isinstance(arrow_batch, pa.RecordBatch), (
+            f"Expected PyArrow RecordBatch, got {type(arrow_batch).__name__}"
+        )
+        assert arrow_batch.num_columns == 2
+        assert set(arrow_batch.schema.names) == {"id", "val"}
+
+    # Verify all 6 IDs are present
+    all_ids = []
+    for rb in collected_batches:
+        all_ids.extend(rb.batch.column("id").to_pylist())
+    assert sorted(all_ids[:6]) == [1, 2, 3, 4, 5, 6]
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_batch_async_iterator_break_no_leak(connection, admin):
+    """Verify that breaking out of batch `async for` does not leak resources.
+
+    After breaking, the scanner must still be usable for synchronous
+    poll_record_batch() calls, proving no leaked task or lock.
+    """
+    table_path = fluss.TablePath("fluss", "py_test_batch_async_break")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("val", pa.string())])
+    )
+    await admin.create_table(table_path, fluss.TableDescriptor(schema))
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [
+                pa.array(list(range(1, 11)), type=pa.int32()),
+                pa.array([f"bl{i}" for i in range(1, 11)]),
+            ],
+            schema=pa.schema(
+                [pa.field("id", pa.int32()), pa.field("val", pa.string())]
+            ),
+        )
+    )
+    await writer.flush()
+
+    batch_scanner = await table.new_scan().create_record_batch_log_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    batch_scanner.subscribe_buckets(
+        {i: fluss.EARLIEST_OFFSET for i in range(num_buckets)}
+    )
+
+    # Phase 1: async for with early break (collect just 1 batch)
+    first_batch = None
+
+    async def consume_and_break():
+        nonlocal first_batch
+        async for rb in batch_scanner:
+            first_batch = rb
+            break
+
+    await asyncio.wait_for(consume_and_break(), timeout=10.0)
+    assert first_batch is not None, "Should have received at least 1 batch"
+    assert first_batch.batch.num_rows > 0
+
+    # Phase 2: sync poll_record_batch() must still work — proves no leak
+    remaining = batch_scanner.poll_record_batch(2000)
+    assert remaining is not None, "poll_record_batch() should return (not deadlock)"
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_batch_async_iterator_multiple_batches(connection, admin):
+    """Verify batch async iteration works across multiple network poll cycles.
+
+    Writing 20 records to 3 buckets makes it likely (not guaranteed) that the
+    generator loops through several _async_poll_batches calls to collect them.
+    """
+    table_path = fluss.TablePath("fluss", "py_test_batch_async_multi")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("val", pa.string())])
+    )
+    table_descriptor = fluss.TableDescriptor(
+        schema, bucket_count=3, bucket_keys=["id"]
+    )
+    await admin.create_table(
+        table_path, table_descriptor, ignore_if_exists=False
+    )
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+
+    num_records = 20
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [
+                pa.array(list(range(1, num_records + 1)), type=pa.int32()),
+                pa.array([f"bm{i}" for i in range(1, num_records + 1)]),
+            ],
+            schema=pa.schema(
+                [pa.field("id", pa.int32()), pa.field("val", pa.string())]
+            ),
+        )
+    )
+    await writer.flush()
+
+    batch_scanner = await table.new_scan().create_record_batch_log_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    batch_scanner.subscribe_buckets(
+        {i: fluss.EARLIEST_OFFSET for i in range(num_buckets)}
+    )
+
+    all_ids = []
+
+    async def consume_all():
+        async for rb in batch_scanner:
+            all_ids.extend(rb.batch.column("id").to_pylist())
+            if len(all_ids) >= num_records:
+                break
+
+    await asyncio.wait_for(consume_all(), timeout=15.0)
+    assert len(all_ids) >= num_records, (
+        f"Expected >={num_records} IDs, got {len(all_ids)}"
+    )
+    assert sorted(all_ids[:num_records]) == list(range(1, num_records + 1))
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
 # ---------------------------------------------------------------------------
 # Helpers
 # ---------------------------------------------------------------------------
@@ -755,3 +1131,4 @@ def _poll_arrow_ids(scanner, expected_count, timeout_s=10):
         if arrow_table.num_rows > 0:
             all_ids.extend(arrow_table.column("id").to_pylist())
     return all_ids
+

From a36bf1be3e85f1658a7b83a93ebf2c0ac29f091b Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Fri, 10 Apr 2026 00:16:30 +0100
Subject: [PATCH 227/287] [test][infra] Unify IT infrastructure for all clients
 (#476)

---
 .../.github/workflows/build_and_test_cpp.yml  |   7 +-
 .../workflows/build_and_test_python.yml       |   9 +-
 .../.github/workflows/build_and_test_rust.yml |  29 +-
 fluss-rust/.licenserc.yaml                    |   1 +
 fluss-rust/Cargo.lock                         |  14 +-
 fluss-rust/Cargo.toml                         |   2 +-
 fluss-rust/bindings/cpp/CMakeLists.txt        |  17 +-
 fluss-rust/bindings/cpp/test/test_main.cpp    |   6 -
 fluss-rust/bindings/cpp/test/test_utils.h     | 319 +++--------
 fluss-rust/bindings/python/pyproject.toml     |   2 +-
 fluss-rust/bindings/python/test/conftest.py   | 259 +++------
 .../crates/fluss-test-cluster/Cargo.toml      |  36 ++
 fluss-rust/crates/fluss-test-cluster/build.rs |  32 ++
 .../crates/fluss-test-cluster/src/lib.rs      | 514 ++++++++++++++++++
 .../crates/fluss-test-cluster/src/main.rs     | 103 ++++
 .../crates/fluss-test-cluster/test-images.env |   4 +
 fluss-rust/crates/fluss/Cargo.toml            |   2 +-
 .../fluss/tests/integration/fluss_cluster.rs  | 451 +--------------
 .../crates/fluss/tests/integration/utils.rs   |   2 +-
 19 files changed, 903 insertions(+), 906 deletions(-)
 create mode 100644 fluss-rust/crates/fluss-test-cluster/Cargo.toml
 create mode 100644 fluss-rust/crates/fluss-test-cluster/build.rs
 create mode 100644 fluss-rust/crates/fluss-test-cluster/src/lib.rs
 create mode 100644 fluss-rust/crates/fluss-test-cluster/src/main.rs
 create mode 100644 fluss-rust/crates/fluss-test-cluster/test-images.env

diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
index 88a896bce3..7b6383afcb 100644
--- a/fluss-rust/.github/workflows/build_and_test_cpp.yml
+++ b/fluss-rust/.github/workflows/build_and_test_cpp.yml
@@ -38,9 +38,11 @@ concurrency:
   cancel-in-progress: true
 
 jobs:
-  build-and-test-cpp:
+  build-and-test:
     timeout-minutes: 60
     runs-on: ubuntu-latest
+    env:
+      FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/target/debug/fluss-test-cluster
     steps:
       - uses: actions/checkout@v4
 
@@ -66,6 +68,9 @@ jobs:
           restore-keys: |
             cpp-test-${{ runner.os }}-
 
+      - name: Build fluss-test-cluster binary
+        run: cargo build -p fluss-test-cluster
+
       - name: Build C++ bindings and tests
         working-directory: bindings/cpp
         run: |
diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index 3f67157f6c..5eec8c39ce 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -38,12 +38,14 @@ concurrency:
   cancel-in-progress: true
 
 jobs:
-  build-and-test-python:
+  build-and-test:
     timeout-minutes: 60
     runs-on: ubuntu-latest
     strategy:
       matrix:
         python: ["3.9", "3.10", "3.11", "3.12"]
+    env:
+      FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/target/debug/fluss-test-cluster
     steps:
       - uses: actions/checkout@v4
 
@@ -69,13 +71,16 @@ jobs:
           restore-keys: |
             python-test-${{ runner.os }}-${{ matrix.python }}-
 
+      - name: Build fluss-test-cluster binary
+        run: cargo build -p fluss-test-cluster
+
       - name: Build Python bindings
         working-directory: bindings/python
         run: |
           uv sync --extra dev --no-install-project
           uv run maturin develop
 
-      - name: Run Python integration tests (parallel)
+      - name: Run tests (parallel)
         working-directory: bindings/python
         run: uv run pytest test/ -v -n auto
         env:
diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
index c904e300d0..1c5a99ab3f 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -39,7 +39,7 @@ concurrency:
   cancel-in-progress: true
 
 jobs:
-  build-and-test-rust:
+  build-and-unit-test:
     timeout-minutes: 60
     runs-on: ${{ matrix.os }}
     strategy:
@@ -78,10 +78,29 @@ jobs:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
 
-      - name: Integration Test (Linux only)
-        if: runner.os == 'Linux'
-        run: |
-          cargo test --features integration_tests --all-targets --workspace --exclude fluss_python --exclude fluss-cpp
+  integration-test:
+    needs: build-and-unit-test
+    timeout-minutes: 60
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install protoc
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - name: Rust Cache
+        uses: actions/cache@v4
+        with:
+          path: |
+            ~/.cargo/registry
+            ~/.cargo/git
+            target
+          key: rust-${{ runner.os }}-${{ hashFiles('**/Cargo.lock') }}
+          restore-keys: |
+            rust-${{ runner.os }}-
+
+      - name: Integration Test
+        run: cargo test --features integration_tests --all-targets --workspace --exclude fluss_python --exclude fluss-cpp
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
diff --git a/fluss-rust/.licenserc.yaml b/fluss-rust/.licenserc.yaml
index 4afd5a9d20..275585377f 100644
--- a/fluss-rust/.licenserc.yaml
+++ b/fluss-rust/.licenserc.yaml
@@ -30,4 +30,5 @@ header:
     - 'website/**'
     - '**/*.md'
     - '**/DEPENDENCIES.*.tsv'
+    - '**/*.env'
   comment: on-failure
diff --git a/fluss-rust/Cargo.lock b/fluss-rust/Cargo.lock
index 5af3f8758e..388d1a259e 100644
--- a/fluss-rust/Cargo.lock
+++ b/fluss-rust/Cargo.lock
@@ -1099,6 +1099,7 @@ dependencies = [
  "crc32c",
  "dashmap",
  "delegate",
+ "fluss-test-cluster",
  "futures",
  "jiff",
  "linked-hash-map",
@@ -1117,13 +1118,24 @@ dependencies = [
  "strum",
  "strum_macros",
  "tempfile",
- "testcontainers",
  "thiserror 1.0.69",
  "tokio",
  "url",
  "uuid",
 ]
 
+[[package]]
+name = "fluss-test-cluster"
+version = "0.2.0"
+dependencies = [
+ "clap",
+ "fluss-rs",
+ "serde",
+ "serde_json",
+ "testcontainers",
+ "tokio",
+]
+
 [[package]]
 name = "fluss_python"
 version = "0.2.0"
diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index d4d262adaf..2abdbf0626 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -28,7 +28,7 @@ keywords = ["fluss", "streaming-storage", "datalake"]
 
 [workspace]
 resolver = "2"
-members = ["crates/fluss", "crates/examples", "bindings/python", "bindings/cpp"]
+members = ["crates/fluss", "crates/fluss-test-cluster", "crates/examples", "bindings/python", "bindings/cpp"]
 
 [workspace.dependencies]
 fluss = { package = "fluss-rs", version = "0.2.0", path = "crates/fluss", features = ["storage-all"] }
diff --git a/fluss-rust/bindings/cpp/CMakeLists.txt b/fluss-rust/bindings/cpp/CMakeLists.txt
index ac93611685..44407ac860 100644
--- a/fluss-rust/bindings/cpp/CMakeLists.txt
+++ b/fluss-rust/bindings/cpp/CMakeLists.txt
@@ -25,6 +25,7 @@ project(fluss-cpp LANGUAGES CXX)
 
 include(FetchContent)
 set(FLUSS_GOOGLETEST_VERSION 1.15.2 CACHE STRING "version of GoogleTest")
+set(FLUSS_NLOHMANN_JSON_VERSION 3.12.0 CACHE STRING "version of nlohmann/json")
 set(CMAKE_EXPORT_COMPILE_COMMANDS ON)
 
 set(FLUSS_CPP_DEP_MODE "system" CACHE STRING "Dependency provisioning mode for fluss-cpp (system|build)")
@@ -253,14 +254,25 @@ if (FLUSS_ENABLE_TESTING)
         URL https://github.com/google/googletest/archive/refs/tags/v${FLUSS_GOOGLETEST_VERSION}.tar.gz
     )
     set(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
+
     FetchContent_MakeAvailable(googletest)
 
+    if (NOT TARGET nlohmann_json::nlohmann_json)
+        set(JSON_BuildTests OFF CACHE INTERNAL "")
+        FetchContent_Declare(
+            nlohmann_json
+            URL https://github.com/nlohmann/json/archive/refs/tags/v${FLUSS_NLOHMANN_JSON_VERSION}.tar.gz
+            URL_HASH SHA256=4b92eb0c06d10683f7447ce9406cb97cd4b453be18d7279320f7b2f025c10187
+        )
+        FetchContent_MakeAvailable(nlohmann_json)
+    endif()
+
     enable_testing()
     include(GoogleTest)
 
     file(GLOB TEST_SOURCE_FILES "test/*.cpp")
     add_executable(fluss_cpp_test ${TEST_SOURCE_FILES})
-    target_link_libraries(fluss_cpp_test PRIVATE fluss_cpp GTest::gtest)
+    target_link_libraries(fluss_cpp_test PRIVATE fluss_cpp GTest::gtest nlohmann_json::nlohmann_json)
     target_link_libraries(fluss_cpp_test PRIVATE Arrow::arrow_shared)
     target_compile_definitions(fluss_cpp_test PRIVATE ARROW_FOUND)
     target_include_directories(fluss_cpp_test PRIVATE
@@ -268,15 +280,12 @@ if (FLUSS_ENABLE_TESTING)
         ${PROJECT_SOURCE_DIR}/test
     )
 
-    # Individual tests for parallel execution via ctest -j.
     gtest_discover_tests(fluss_cpp_test
         PROPERTIES
             TIMEOUT 120
             FIXTURES_REQUIRED fluss_cluster
     )
 
-    # Cleanup: stop Docker containers after all tests finish.
-    # Mirrors Python's pytest_unconfigure and Rust's atexit cleanup.
     add_test(NAME fluss_cluster_cleanup COMMAND fluss_cpp_test --cleanup)
     set_tests_properties(fluss_cluster_cleanup PROPERTIES
         FIXTURES_CLEANUP fluss_cluster
diff --git a/fluss-rust/bindings/cpp/test/test_main.cpp b/fluss-rust/bindings/cpp/test/test_main.cpp
index 7b132d2c37..48d1050b8d 100644
--- a/fluss-rust/bindings/cpp/test/test_main.cpp
+++ b/fluss-rust/bindings/cpp/test/test_main.cpp
@@ -22,20 +22,14 @@
 #include "test_utils.h"
 
 int main(int argc, char** argv) {
-    // --cleanup: stop Docker containers and exit (used by ctest FIXTURES_CLEANUP).
     for (int i = 1; i < argc; ++i) {
         if (std::string(argv[i]) == "--cleanup") {
-            const char* env = std::getenv("FLUSS_BOOTSTRAP_SERVERS");
-            if (env && std::strlen(env) > 0) return 0;
             fluss_test::FlussTestCluster::StopAll();
             return 0;
         }
     }
 
     ::testing::InitGoogleTest(&argc, argv);
-
-    // Register the global test environment (manages the Fluss cluster lifecycle).
     ::testing::AddGlobalTestEnvironment(fluss_test::FlussTestEnvironment::Instance());
-
     return RUN_ALL_TESTS();
 }
diff --git a/fluss-rust/bindings/cpp/test/test_utils.h b/fluss-rust/bindings/cpp/test/test_utils.h
index 1ff7e2810b..5d40afbaf3 100644
--- a/fluss-rust/bindings/cpp/test/test_utils.h
+++ b/fluss-rust/bindings/cpp/test/test_utils.h
@@ -21,266 +21,136 @@
 
 #include <gtest/gtest.h>
 
-#include <algorithm>
 #include <chrono>
 #include <cstdio>
 #include <cstdlib>
 #include <cstring>
+#include <fstream>
+#include <sstream>
+#include <nlohmann/json.hpp>
 #include <string>
-#include <thread>
 #include <vector>
 
-#ifdef _WIN32
-#include <winsock2.h>
-#include <ws2tcpip.h>
-#pragma comment(lib, "ws2_32.lib")
-#else
-#include <arpa/inet.h>
-#include <netinet/in.h>
-#include <sys/socket.h>
-#include <unistd.h>
-#endif
-
 #include "fluss.hpp"
 
-// Macro to assert Result is OK and print error message on failure
 #define ASSERT_OK(result) ASSERT_TRUE((result).Ok()) << (result).error_message
 #define EXPECT_OK(result) EXPECT_TRUE((result).Ok()) << (result).error_message
 
 namespace fluss_test {
 
-static constexpr const char* kFlussImage = "apache/fluss";
-static constexpr const char* kFlussVersion = "0.9.0-incubating";
-static constexpr const char* kNetworkName = "fluss-cpp-test-network";
-static constexpr const char* kZookeeperName = "zookeeper-cpp-test";
-static constexpr const char* kCoordinatorName = "coordinator-server-cpp-test";
-static constexpr const char* kTabletServerName = "tablet-server-cpp-test";
-static constexpr int kCoordinatorPort = 9123;
-static constexpr int kTabletServerPort = 9124;
-static constexpr int kPlainClientPort = 9223;
-static constexpr int kPlainClientTabletPort = 9224;
-
-/// Execute a shell command and return its exit code.
-inline int RunCommand(const std::string& cmd) { return system(cmd.c_str()); }
-
-/// Join property lines with the escaped newline separator used by `printf` in docker commands.
-inline std::string JoinProps(const std::vector<std::string>& lines) {
-    std::string result;
-    for (size_t i = 0; i < lines.size(); ++i) {
-        if (i > 0) result += "\\n";
-        result += lines[i];
+inline std::string FindCliBinary() {
+    const char* env_bin = std::getenv("FLUSS_TEST_CLUSTER_BIN");
+    if (env_bin && std::strlen(env_bin) > 0) {
+        if (std::ifstream(env_bin).good()) {
+            return env_bin;
+        }
+        std::cerr << "FLUSS_TEST_CLUSTER_BIN is set to '" << env_bin
+                  << "' but that file does not exist." << std::endl;
+        std::abort();
     }
-    return result;
-}
-
-/// Build a `docker run` command with FLUSS_PROPERTIES.
-inline std::string DockerRunCmd(const std::string& name, const std::string& props,
-                                const std::vector<std::string>& port_mappings,
-                                const std::string& server_type) {
-    std::string cmd = "docker run -d --rm --name " + name + " --network " + kNetworkName;
-    for (const auto& pm : port_mappings) {
-        cmd += " -p " + pm;
+    FILE* pipe = popen("cargo locate-project --workspace --message-format plain", "r");
+    if (pipe) {
+        char buf[512];
+        std::string root;
+        while (fgets(buf, sizeof(buf), pipe)) root += buf;
+        if (pclose(pipe) == 0) {
+            // cargo returns path to Cargo.toml; strip filename + trailing whitespace.
+            while (!root.empty() && (root.back() == '\n' || root.back() == '\r')) root.pop_back();
+            auto slash = root.rfind('/');
+            if (slash != std::string::npos) {
+                std::string dir = root.substr(0, slash);
+                for (const char* profile : {"debug", "release"}) {
+                    std::string path = dir + "/target/" + profile + "/fluss-test-cluster";
+                    if (std::ifstream(path).good()) return path;
+                }
+            }
+        }
     }
-    cmd += " -e FLUSS_PROPERTIES=\"$(printf '" + props + "')\"";
-    cmd += " " + std::string(kFlussImage) + ":" + kFlussVersion + " " + server_type;
-    return cmd;
+    return "fluss-test-cluster";
 }
 
-/// Wait until a TCP port is accepting connections, or timeout.
-inline bool WaitForPort(const std::string& host, int port, int timeout_seconds = 60) {
-    auto deadline = std::chrono::steady_clock::now() + std::chrono::seconds(timeout_seconds);
-
-    while (std::chrono::steady_clock::now() < deadline) {
-        int sock = socket(AF_INET, SOCK_STREAM, 0);
-        if (sock < 0) {
-            std::this_thread::sleep_for(std::chrono::milliseconds(500));
-            continue;
-        }
+constexpr const char* kClusterName = "shared-test";
 
-        struct sockaddr_in addr {};
-        addr.sin_family = AF_INET;
-        addr.sin_port = htons(static_cast<uint16_t>(port));
-        inet_pton(AF_INET, host.c_str(), &addr.sin_addr);
+inline std::string CliStartCmd() {
+    return FindCliBinary() + " start --sasl --name " + kClusterName;
+}
 
-        int result = connect(sock, reinterpret_cast<struct sockaddr*>(&addr), sizeof(addr));
-#ifdef _WIN32
-        closesocket(sock);
-#else
-        close(sock);
-#endif
-        if (result == 0) {
+constexpr const char* kClusterJsonPrefix = "CLUSTER_JSON: ";
+
+inline bool ParseClusterJson(const std::string& output, std::string& bootstrap,
+                             std::string& sasl_bootstrap) {
+    // Look for the CLUSTER_JSON: token in output lines.
+    std::istringstream stream(output);
+    std::string line;
+    while (std::getline(stream, line)) {
+        if (line.rfind(kClusterJsonPrefix, 0) != 0) continue;
+        std::string json_str = line.substr(std::strlen(kClusterJsonPrefix));
+        try {
+            auto info = nlohmann::json::parse(json_str);
+            bootstrap = info.at("bootstrap_servers").get<std::string>();
+            if (info.contains("sasl_bootstrap_servers") &&
+                !info["sasl_bootstrap_servers"].is_null()) {
+                sasl_bootstrap = info["sasl_bootstrap_servers"].get<std::string>();
+            }
             return true;
+        } catch (const nlohmann::json::exception& e) {
+            std::cerr << "Failed to parse cluster JSON: " << e.what() << "\n"
+                      << "Line: " << line << std::endl;
+            return false;
         }
-
-        std::this_thread::sleep_for(std::chrono::milliseconds(500));
     }
+    std::cerr << "No CLUSTER_JSON token found in output:\n" << output << std::endl;
     return false;
 }
 
-/// Manages a Docker-based Fluss cluster for integration testing.
 class FlussTestCluster {
    public:
     FlussTestCluster() = default;
 
     bool Start() {
-        const char* env_servers = std::getenv("FLUSS_BOOTSTRAP_SERVERS");
-        if (env_servers && std::strlen(env_servers) > 0) {
-            bootstrap_servers_ = env_servers;
+        const char* env = std::getenv("FLUSS_BOOTSTRAP_SERVERS");
+        if (env && std::strlen(env) > 0) {
+            bootstrap_servers_ = env;
             const char* env_sasl = std::getenv("FLUSS_SASL_BOOTSTRAP_SERVERS");
-            if (env_sasl && std::strlen(env_sasl) > 0) {
-                sasl_bootstrap_servers_ = env_sasl;
-            }
-            external_cluster_ = true;
-            std::cout << "Using external cluster: " << bootstrap_servers_ << std::endl;
-            return true;
-        }
-
-        // Reuse cluster started by another parallel test process or previous run.
-        if (WaitForPort("127.0.0.1", kPlainClientPort, /*timeout_seconds=*/1)) {
-            SetBootstrapServers();
-            external_cluster_ = true;
+            sasl_bootstrap_servers_ = (env_sasl && std::strlen(env_sasl) > 0) ? env_sasl : env;
             return true;
         }
 
-        std::cout << "Starting Fluss cluster via Docker..." << std::endl;
-
-        // Remove stopped (not running) containers from previous runs.
-        RunCommand(std::string("docker rm ") + kTabletServerName + " 2>/dev/null || true");
-        RunCommand(std::string("docker rm ") + kCoordinatorName + " 2>/dev/null || true");
-        RunCommand(std::string("docker rm ") + kZookeeperName + " 2>/dev/null || true");
-        RunCommand(std::string("docker network rm ") + kNetworkName + " 2>/dev/null || true");
-
-        RunCommand(std::string("docker network create ") + kNetworkName + " 2>/dev/null || true");
-
-        std::string zk_cmd = std::string("docker run -d --rm") + " --name " + kZookeeperName +
-                             " --network " + kNetworkName + " zookeeper:3.9.2";
-        if (RunCommand(zk_cmd) != 0) {
-            return WaitForCluster();
-        }
-
-        // Wait for ZooKeeper to be ready
-        std::this_thread::sleep_for(std::chrono::seconds(5));
-
-        // Coordinator Server (dual listeners: SASL on 9123, plaintext on 9223)
-        std::string sasl_jaas =
-            "org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required"
-            " user_admin=\"admin-secret\" user_alice=\"alice-secret\";";
-
-        std::string coord = std::string(kCoordinatorName);
-        std::string zk = std::string(kZookeeperName);
-        std::string coord_props = JoinProps({
-            "zookeeper.address: " + zk + ":2181",
-            "bind.listeners: INTERNAL://" + coord + ":0, CLIENT://" + coord +
-                ":9123, PLAIN_CLIENT://" + coord + ":9223",
-            "advertised.listeners: CLIENT://localhost:9123, PLAIN_CLIENT://localhost:9223",
-            "internal.listener.name: INTERNAL",
-            "security.protocol.map: CLIENT:sasl",
-            "security.sasl.enabled.mechanisms: plain",
-            "security.sasl.plain.jaas.config: " + sasl_jaas,
-            "netty.server.num-network-threads: 1",
-            "netty.server.num-worker-threads: 3",
-        });
-
-        std::string coord_cmd = DockerRunCmd(kCoordinatorName, coord_props,
-                                             {"9123:9123", "9223:9223"}, "coordinatorServer");
-        if (RunCommand(coord_cmd) != 0) {
-            return WaitForCluster();
-        }
-
-        if (!WaitForPort("127.0.0.1", kCoordinatorPort)) {
-            std::cerr << "Coordinator Server did not become ready" << std::endl;
+        std::string cli_cmd = CliStartCmd();
+        FILE* pipe = popen(cli_cmd.c_str(), "r");
+        if (!pipe) {
+            std::cerr << "Failed to launch fluss-test-cluster binary" << std::endl;
             return false;
         }
-
-        // Tablet Server (dual listeners: SASL on 9124, plaintext on 9224)
-        std::string ts = std::string(kTabletServerName);
-        std::string ts_props = JoinProps({
-            "zookeeper.address: " + zk + ":2181",
-            "bind.listeners: INTERNAL://" + ts + ":0, CLIENT://" + ts + ":9123, PLAIN_CLIENT://" +
-                ts + ":9223",
-            "advertised.listeners: CLIENT://localhost:" + std::to_string(kTabletServerPort) +
-                ", PLAIN_CLIENT://localhost:" + std::to_string(kPlainClientTabletPort),
-            "internal.listener.name: INTERNAL",
-            "security.protocol.map: CLIENT:sasl",
-            "security.sasl.enabled.mechanisms: plain",
-            "security.sasl.plain.jaas.config: " + sasl_jaas,
-            "tablet-server.id: 0",
-            "netty.server.num-network-threads: 1",
-            "netty.server.num-worker-threads: 3",
-        });
-
-        std::string ts_cmd = DockerRunCmd(kTabletServerName, ts_props,
-                                          {std::to_string(kTabletServerPort) + ":9123",
-                                           std::to_string(kPlainClientTabletPort) + ":9223"},
-                                          "tabletServer");
-        if (RunCommand(ts_cmd) != 0) {
-            return WaitForCluster();
+        std::string output;
+        char buf[512];
+        while (fgets(buf, sizeof(buf), pipe)) output += buf;
+        int rc = pclose(pipe);
+        if (rc != 0) {
+            std::cerr << "fluss-test-cluster start failed (exit " << rc << "):\n"
+                      << output << std::endl;
+            return false;
         }
-
-        if (!WaitForPort("127.0.0.1", kTabletServerPort) ||
-            !WaitForPort("127.0.0.1", kPlainClientPort) ||
-            !WaitForPort("127.0.0.1", kPlainClientTabletPort)) {
-            std::cerr << "Cluster listeners did not become ready" << std::endl;
+        if (!ParseClusterJson(output, bootstrap_servers_, sasl_bootstrap_servers_)) {
+            std::cerr << "Failed to parse cluster JSON from:\n" << output << std::endl;
             return false;
         }
-
-        SetBootstrapServers();
-        std::cout << "Fluss cluster started successfully." << std::endl;
         return true;
     }
 
-    void Stop() {
-        if (external_cluster_) return;
-        StopAll();
-    }
-
-    /// Unconditionally stop and remove all cluster containers and the network.
-    /// Used by the --cleanup flag from ctest FIXTURES_CLEANUP.
     static void StopAll() {
-        std::cout << "Stopping Fluss cluster..." << std::endl;
-        RunCommand(std::string("docker rm -f ") + kTabletServerName + " 2>/dev/null || true");
-        RunCommand(std::string("docker rm -f ") + kCoordinatorName + " 2>/dev/null || true");
-        RunCommand(std::string("docker rm -f ") + kZookeeperName + " 2>/dev/null || true");
-        RunCommand(std::string("docker network rm ") + kNetworkName + " 2>/dev/null || true");
-        std::cout << "Fluss cluster stopped." << std::endl;
+        std::string cmd = FindCliBinary() + " stop --name " + kClusterName;
+        system(cmd.c_str());
     }
 
     const std::string& GetBootstrapServers() const { return bootstrap_servers_; }
     const std::string& GetSaslBootstrapServers() const { return sasl_bootstrap_servers_; }
 
    private:
-    void SetBootstrapServers() {
-        bootstrap_servers_ = "127.0.0.1:" + std::to_string(kPlainClientPort);
-        sasl_bootstrap_servers_ = "127.0.0.1:" + std::to_string(kCoordinatorPort);
-    }
-
-    /// Wait for a cluster being started by another process.
-    /// Fails fast if no containers exist (real Docker failure vs race).
-    bool WaitForCluster() {
-        if (RunCommand(std::string("docker inspect ") + kZookeeperName + " >/dev/null 2>&1") != 0) {
-            std::cerr << "Failed to start cluster (docker error)" << std::endl;
-            return false;
-        }
-        std::cout << "Waiting for cluster started by another process..." << std::endl;
-        if (!WaitForPort("127.0.0.1", kPlainClientPort) ||
-            !WaitForPort("127.0.0.1", kPlainClientTabletPort) ||
-            !WaitForPort("127.0.0.1", kCoordinatorPort) ||
-            !WaitForPort("127.0.0.1", kTabletServerPort)) {
-            std::cerr << "Cluster did not become ready" << std::endl;
-            return false;
-        }
-        SetBootstrapServers();
-        external_cluster_ = true;
-        std::cout << "Cluster ready." << std::endl;
-        return true;
-    }
-
     std::string bootstrap_servers_;
     std::string sasl_bootstrap_servers_;
-    bool external_cluster_{false};
 };
 
-/// GoogleTest Environment that manages the Fluss cluster lifecycle.
 class FlussTestEnvironment : public ::testing::Environment {
    public:
     static FlussTestEnvironment* Instance() {
@@ -296,35 +166,18 @@ class FlussTestEnvironment : public ::testing::Environment {
             GTEST_SKIP() << "Failed to start Fluss cluster. Skipping integration tests.";
         }
 
-        // Retry connection creation until the coordinator is fully initialized.
         fluss::Configuration config;
         config.bootstrap_servers = cluster_.GetBootstrapServers();
-
-        auto deadline = std::chrono::steady_clock::now() + std::chrono::seconds(60);
-        while (std::chrono::steady_clock::now() < deadline) {
-            auto result = fluss::Connection::Create(config, connection_);
-            if (result.Ok()) {
-                auto admin_result = connection_.GetAdmin(admin_);
-                if (admin_result.Ok()) {
-                    std::vector<fluss::ServerNode> nodes;
-                    auto nodes_result = admin_.GetServerNodes(nodes);
-                    if (nodes_result.Ok() &&
-                        std::any_of(nodes.begin(), nodes.end(),
-                                    [](const fluss::ServerNode& n) {
-                                        return n.server_type == "TabletServer";
-                                    })) {
-                        std::cout << "Connected to Fluss cluster." << std::endl;
-                        return;
-                    }
-                }
-            }
-            std::cout << "Waiting for Fluss cluster to be ready..." << std::endl;
-            std::this_thread::sleep_for(std::chrono::seconds(2));
+        auto result = fluss::Connection::Create(config, connection_);
+        if (!result.Ok()) {
+            GTEST_SKIP() << "Failed to connect: " << result.error_message;
+        }
+        auto admin_result = connection_.GetAdmin(admin_);
+        if (!admin_result.Ok()) {
+            GTEST_SKIP() << "Failed to get admin: " << admin_result.error_message;
         }
-        GTEST_SKIP() << "Fluss cluster did not become ready within timeout.";
     }
 
-    // Cluster stays alive for parallel processes and subsequent runs.
     void TearDown() override {}
 
     fluss::Connection& GetConnection() { return connection_; }
@@ -340,7 +193,6 @@ class FlussTestEnvironment : public ::testing::Environment {
     fluss::Admin admin_;
 };
 
-/// Helper: create a table (assert success). Drops existing table first if it exists.
 inline void CreateTable(fluss::Admin& admin, const fluss::TablePath& path,
                         const fluss::TableDescriptor& descriptor) {
     admin.DropTable(path, true);  // ignore if not exists
@@ -348,7 +200,6 @@ inline void CreateTable(fluss::Admin& admin, const fluss::TablePath& path,
     ASSERT_OK(result);
 }
 
-/// Helper: create partitions for a partitioned table.
 inline void CreatePartitions(fluss::Admin& admin, const fluss::TablePath& path,
                              const std::string& partition_column,
                              const std::vector<std::string>& values) {
@@ -360,8 +211,6 @@ inline void CreatePartitions(fluss::Admin& admin, const fluss::TablePath& path,
     }
 }
 
-/// Poll a LogScanner for ScanRecords until `expected_count` items are collected or timeout.
-/// `extract_fn` is called for each ScanRecord and should return a value of type T.
 template <typename T, typename ExtractFn>
 void PollRecords(fluss::LogScanner& scanner, size_t expected_count, ExtractFn extract_fn,
                  std::vector<T>& out) {
@@ -375,8 +224,6 @@ void PollRecords(fluss::LogScanner& scanner, size_t expected_count, ExtractFn ex
     }
 }
 
-/// Poll a LogScanner for ArrowRecordBatches until `expected_count` items are collected or timeout.
-/// `extract_fn` is called with the full ArrowRecordBatches and should return a std::vector<T>.
 template <typename T, typename ExtractFn>
 void PollRecordBatches(fluss::LogScanner& scanner, size_t expected_count, ExtractFn extract_fn,
                        std::vector<T>& out) {
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index b81aad0751..41463027bc 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -51,9 +51,9 @@ dev = [
     "pytest>=8.3.5",
     "pytest-asyncio>=0.25.3",
     "pytest-xdist>=3.5.0",
+    "filelock>=3.0",
     "ruff>=0.9.10",
     "maturin>=1.8.2",
-    "testcontainers>=4.0.0",
 ]
 docs = [
     "pdoc>=15.0.4",
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
index 420747e66a..7da0f3d978 100644
--- a/fluss-rust/bindings/python/test/conftest.py
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -15,270 +15,135 @@
 # specific language governing permissions and limitations
 # under the License.
 
-"""Shared fixtures for Fluss Python integration tests.
-
-If FLUSS_BOOTSTRAP_SERVERS is set, tests connect to an existing cluster.
-Otherwise, a Fluss cluster is started automatically via testcontainers.
-
-The first pytest-xdist worker to run starts the cluster; other workers
-detect it via port check and reuse it (matching the C++ test pattern).
-Containers are cleaned up after all workers finish via pytest_unconfigure.
-
-Run with:
-    uv run maturin develop && uv run pytest test/ -v -n auto
-"""
-
 import asyncio
+import json
 import os
-import socket
 import subprocess
+import tempfile
 import time
-
-# Disable testcontainers Ryuk reaper for xdist runs — it would kill
-# containers when the first worker exits, while others are still running.
-# We handle cleanup ourselves in pytest_unconfigure.
-# In single-process mode, keep Ryuk as a safety net for hard crashes.
-if "PYTEST_XDIST_WORKER" in os.environ:
-    os.environ.setdefault("TESTCONTAINERS_RYUK_DISABLED", "true")
+from pathlib import Path
 
 import pytest
 import pytest_asyncio
+from filelock import FileLock
 
 import fluss
 
-FLUSS_IMAGE = "apache/fluss"
-FLUSS_VERSION = "0.9.0-incubating"
-BOOTSTRAP_SERVERS_ENV = os.environ.get("FLUSS_BOOTSTRAP_SERVERS")
-
-# Container / network names
-NETWORK_NAME = "fluss-python-test-network"
-ZOOKEEPER_NAME = "zookeeper-python-test"
-COORDINATOR_NAME = "coordinator-server-python-test"
-TABLET_SERVER_NAME = "tablet-server-python-test"
-
-# Fixed host ports (must match across workers)
-COORDINATOR_PORT = 9123
-TABLET_SERVER_PORT = 9124
-PLAIN_CLIENT_PORT = 9223
-PLAIN_CLIENT_TABLET_PORT = 9224
-
-ALL_PORTS = [COORDINATOR_PORT, TABLET_SERVER_PORT, PLAIN_CLIENT_PORT, PLAIN_CLIENT_TABLET_PORT]
-
-
-def _wait_for_port(host, port, timeout=60):
-    """Wait for a TCP port to become available."""
-    start = time.time()
-    while time.time() - start < timeout:
-        try:
-            with socket.create_connection((host, port), timeout=1):
-                return True
-        except (ConnectionRefusedError, TimeoutError, OSError):
-            time.sleep(1)
-    return False
-
-
-def _all_ports_ready(timeout=60):
-    """Wait for all cluster ports to become available."""
-    deadline = time.time() + timeout
-    for port in ALL_PORTS:
-        remaining = deadline - time.time()
-        if remaining <= 0 or not _wait_for_port("localhost", port, timeout=remaining):
-            return False
-    return True
-
-
-def _run_cmd(cmd):
-    """Run a command (list form), return exit code."""
-    return subprocess.run(cmd, capture_output=True).returncode
-
-
-def _start_cluster():
-    """Start the Fluss Docker cluster via testcontainers.
-
-    If another worker already started the cluster (detected via port check),
-    reuse it. If container creation fails (name conflict from a racing worker),
-    wait for the other worker's cluster to become ready.
-    """
-    # Reuse cluster started by another parallel worker or previous run.
-    if _wait_for_port("localhost", PLAIN_CLIENT_PORT, timeout=1):
-        print("Reusing existing cluster via port check.")
-        return
-
-    from testcontainers.core.container import DockerContainer
-
-    print("Starting Fluss cluster via testcontainers...")
-
-    # Create a named network via Docker CLI (idempotent, avoids orphaned
-    # random-named networks when multiple xdist workers race).
-    _run_cmd(["docker", "network", "create", NETWORK_NAME])
+CLUSTER_NAME = "shared-test"
 
-    sasl_jaas = (
-        "org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required"
-        ' user_admin="admin-secret" user_alice="alice-secret";'
-    )
-    coordinator_props = "\n".join([
-        f"zookeeper.address: {ZOOKEEPER_NAME}:2181",
-        f"bind.listeners: INTERNAL://{COORDINATOR_NAME}:0,"
-        f" CLIENT://{COORDINATOR_NAME}:9123,"
-        f" PLAIN_CLIENT://{COORDINATOR_NAME}:9223",
-        "advertised.listeners: CLIENT://localhost:9123,"
-        " PLAIN_CLIENT://localhost:9223",
-        "internal.listener.name: INTERNAL",
-        "security.protocol.map: CLIENT:sasl",
-        "security.sasl.enabled.mechanisms: plain",
-        f"security.sasl.plain.jaas.config: {sasl_jaas}",
-        "netty.server.num-network-threads: 1",
-        "netty.server.num-worker-threads: 3",
-    ])
-    tablet_props = "\n".join([
-        f"zookeeper.address: {ZOOKEEPER_NAME}:2181",
-        f"bind.listeners: INTERNAL://{TABLET_SERVER_NAME}:0,"
-        f" CLIENT://{TABLET_SERVER_NAME}:9123,"
-        f" PLAIN_CLIENT://{TABLET_SERVER_NAME}:9223",
-        "advertised.listeners: CLIENT://localhost:9124,"
-        " PLAIN_CLIENT://localhost:9224",
-        "internal.listener.name: INTERNAL",
-        "security.protocol.map: CLIENT:sasl",
-        "security.sasl.enabled.mechanisms: plain",
-        f"security.sasl.plain.jaas.config: {sasl_jaas}",
-        "tablet-server.id: 0",
-        "netty.server.num-network-threads: 1",
-        "netty.server.num-worker-threads: 3",
-    ])
 
-    zookeeper = (
-        DockerContainer("zookeeper:3.9.2")
-        .with_kwargs(network=NETWORK_NAME)
-        .with_name(ZOOKEEPER_NAME)
-    )
-    coordinator = (
-        DockerContainer(f"{FLUSS_IMAGE}:{FLUSS_VERSION}")
-        .with_kwargs(network=NETWORK_NAME)
-        .with_name(COORDINATOR_NAME)
-        .with_bind_ports(9123, 9123)
-        .with_bind_ports(9223, 9223)
-        .with_command("coordinatorServer")
-        .with_env("FLUSS_PROPERTIES", coordinator_props)
+def _find_cli_binary():
+    env_bin = os.environ.get("FLUSS_TEST_CLUSTER_BIN")
+    if env_bin:
+        if os.path.isfile(env_bin):
+            return env_bin
+        raise FileNotFoundError(f"FLUSS_TEST_CLUSTER_BIN={env_bin!r} does not exist")
+    result = subprocess.run(
+        ["cargo", "locate-project", "--workspace", "--message-format", "plain"],
+        capture_output=True,
+        text=True,
     )
-    tablet_server = (
-        DockerContainer(f"{FLUSS_IMAGE}:{FLUSS_VERSION}")
-        .with_kwargs(network=NETWORK_NAME)
-        .with_name(TABLET_SERVER_NAME)
-        .with_bind_ports(9123, 9124)
-        .with_bind_ports(9223, 9224)
-        .with_command("tabletServer")
-        .with_env("FLUSS_PROPERTIES", tablet_props)
+    if result.returncode == 0:
+        root = Path(result.stdout.strip()).parent
+        for profile in ("debug", "release"):
+            bin_path = root / "target" / profile / "fluss-test-cluster"
+            if bin_path.is_file():
+                return str(bin_path)
+    raise FileNotFoundError(
+        "fluss-test-cluster not found. Run: cargo build -p fluss-test-cluster"
     )
 
-    try:
-        zookeeper.start()
-        coordinator.start()
-        tablet_server.start()
-    except Exception as e:
-        # Another worker may have started containers with the same names.
-        # Wait for the cluster to become ready instead of failing.
-        print(f"Container start failed ({e}), waiting for cluster from another worker...")
-        if _all_ports_ready():
-            return
-        raise
 
-    if not _all_ports_ready():
-        raise RuntimeError("Cluster listeners did not become ready")
-
-    print("Fluss cluster started successfully.")
+def _start_cluster():
+    lock = Path(tempfile.gettempdir()) / f"fluss-{CLUSTER_NAME}.lock"
+    with FileLock(lock):
+        cli = _find_cli_binary()
+        result = subprocess.run(
+            [cli, "start", "--sasl", "--name", CLUSTER_NAME],
+            capture_output=True,
+            text=True,
+        )
+        if result.returncode != 0:
+            raise RuntimeError(
+                f"fluss-test-cluster start failed:\n{result.stderr}\n{result.stdout}"
+            )
+        prefix = "CLUSTER_JSON: "
+        for line in result.stdout.strip().split("\n"):
+            if line.startswith(prefix):
+                info = json.loads(line[len(prefix) :])
+                return info["bootstrap_servers"], info.get("sasl_bootstrap_servers")
+        raise RuntimeError(
+            f"No CLUSTER_JSON token in output:\n{result.stdout}\n{result.stderr}"
+        )
 
 
 def _stop_cluster():
-    """Stop and remove the Fluss Docker cluster containers."""
-    for name in [TABLET_SERVER_NAME, COORDINATOR_NAME, ZOOKEEPER_NAME]:
-        subprocess.run(["docker", "rm", "-f", name], capture_output=True)
-    subprocess.run(["docker", "network", "rm", NETWORK_NAME], capture_output=True)
-
+    try:
+        cli = _find_cli_binary()
+    except FileNotFoundError:
+        return
+    subprocess.run([cli, "stop", "--name", CLUSTER_NAME], capture_output=True)
 
-async def _connect_with_retry(bootstrap_servers, timeout=60):
-    """Connect to the Fluss cluster with retries until it's fully ready.
 
-    Waits until both the coordinator and at least one tablet server are
-    available, matching the Rust wait_for_cluster_ready pattern.
-    """
+async def _connect(bootstrap_servers):
     config = fluss.Config({"bootstrap.servers": bootstrap_servers})
     start = time.time()
     last_err = None
-    while time.time() - start < timeout:
-        conn = None
+    while time.time() - start < 60:
         try:
             conn = await fluss.FlussConnection.create(config)
             admin = conn.get_admin()
             nodes = await admin.get_server_nodes()
             if any(n.server_type == "TabletServer" for n in nodes):
                 return conn
+            conn.close()
             last_err = RuntimeError("No TabletServer available yet")
         except Exception as e:
             last_err = e
-        if conn is not None:
-            conn.close()
         await asyncio.sleep(1)
-    raise RuntimeError(
-        f"Could not connect to cluster after {timeout}s: {last_err}"
-    )
+    raise RuntimeError(f"Could not connect after 60s: {last_err}")
 
 
 def pytest_unconfigure(config):
-    """Clean up Docker containers after all xdist workers finish.
-
-    Runs once on the controller process (or the single process when
-    not using xdist). Workers are identified by the 'workerinput' attr.
-    """
-    if BOOTSTRAP_SERVERS_ENV:
+    if os.environ.get("FLUSS_BOOTSTRAP_SERVERS"):
         return
     if hasattr(config, "workerinput"):
-        return  # This is a worker, skip
+        return
     _stop_cluster()
 
 
 @pytest.fixture(scope="session")
 def fluss_cluster():
-    """Start a Fluss cluster using testcontainers, or use an existing one."""
-    if BOOTSTRAP_SERVERS_ENV:
-        sasl_env = os.environ.get(
-            "FLUSS_SASL_BOOTSTRAP_SERVERS", BOOTSTRAP_SERVERS_ENV
-        )
-        yield (BOOTSTRAP_SERVERS_ENV, sasl_env)
+    env = os.environ.get("FLUSS_BOOTSTRAP_SERVERS")
+    if env:
+        sasl_env = os.environ.get("FLUSS_SASL_BOOTSTRAP_SERVERS", env)
+        yield (env, sasl_env)
         return
 
-    _start_cluster()
-
-    # (plaintext_bootstrap, sasl_bootstrap)
-    yield (
-        f"127.0.0.1:{PLAIN_CLIENT_PORT}",
-        f"127.0.0.1:{COORDINATOR_PORT}",
-    )
+    plaintext_addr, sasl_addr = _start_cluster()
+    yield (plaintext_addr, sasl_addr or plaintext_addr)
 
 
 @pytest_asyncio.fixture(scope="session")
 async def connection(fluss_cluster):
-    """Session-scoped connection to the Fluss cluster (plaintext)."""
     plaintext_addr, _sasl_addr = fluss_cluster
-    conn = await _connect_with_retry(plaintext_addr)
+    conn = await _connect(plaintext_addr)
     yield conn
     conn.close()
 
 
 @pytest.fixture(scope="session")
 def sasl_bootstrap_servers(fluss_cluster):
-    """Bootstrap servers for the SASL listener."""
     _plaintext_addr, sasl_addr = fluss_cluster
     return sasl_addr
 
 
 @pytest.fixture(scope="session")
 def plaintext_bootstrap_servers(fluss_cluster):
-    """Bootstrap servers for the plaintext (non-SASL) listener."""
     plaintext_addr, _sasl_addr = fluss_cluster
     return plaintext_addr
 
 
 @pytest_asyncio.fixture(scope="session")
 async def admin(connection):
-    """Session-scoped admin client."""
     return connection.get_admin()
diff --git a/fluss-rust/crates/fluss-test-cluster/Cargo.toml b/fluss-rust/crates/fluss-test-cluster/Cargo.toml
new file mode 100644
index 0000000000..977df307b8
--- /dev/null
+++ b/fluss-rust/crates/fluss-test-cluster/Cargo.toml
@@ -0,0 +1,36 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[package]
+name = "fluss-test-cluster"
+edition.workspace = true
+version.workspace = true
+license.workspace = true
+rust-version.workspace = true
+publish = false
+
+[[bin]]
+name = "fluss-test-cluster"
+path = "src/main.rs"
+
+[dependencies]
+fluss = { workspace = true }
+testcontainers = "0.27.2"
+tokio = { workspace = true }
+clap = { workspace = true }
+serde = { workspace = true }
+serde_json = { workspace = true }
diff --git a/fluss-rust/crates/fluss-test-cluster/build.rs b/fluss-rust/crates/fluss-test-cluster/build.rs
new file mode 100644
index 0000000000..0145196bc3
--- /dev/null
+++ b/fluss-rust/crates/fluss-test-cluster/build.rs
@@ -0,0 +1,32 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+fn main() {
+    // Rebuild whenever the pinned image list changes.
+    println!("cargo:rerun-if-changed=test-images.env");
+    let pinned = std::fs::read_to_string("test-images.env").expect("test-images.env not found");
+    let entries = pinned
+        .lines()
+        .map(str::trim)
+        .filter(|entry| !entry.is_empty() && !entry.starts_with('#'));
+    for entry in entries {
+        // Export each KEY=VALUE pair to rustc; lines without '=' are ignored.
+        if let Some((var, setting)) = entry.split_once('=') {
+            println!("cargo:rustc-env={}={}", var.trim(), setting.trim());
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss-test-cluster/src/lib.rs b/fluss-rust/crates/fluss-test-cluster/src/lib.rs
new file mode 100644
index 0000000000..041c21b06c
--- /dev/null
+++ b/fluss-rust/crates/fluss-test-cluster/src/lib.rs
@@ -0,0 +1,514 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+use std::collections::HashMap;
+use std::mem::ManuallyDrop;
+use std::sync::Arc;
+use std::time::Duration;
+use testcontainers::core::ContainerPort;
+use testcontainers::runners::AsyncRunner;
+use testcontainers::{ContainerAsync, GenericImage, ImageExt};
+
+pub const FLUSS_IMAGE: &str = env!("FLUSS_IMAGE");
+pub const FLUSS_VERSION: &str = env!("FLUSS_VERSION");
+pub const ZOOKEEPER_IMAGE: &str = env!("ZOOKEEPER_IMAGE");
+pub const ZOOKEEPER_VERSION: &str = env!("ZOOKEEPER_VERSION");
+
+#[derive(serde::Serialize, serde::Deserialize, Debug)]
+pub struct ClusterInfo {
+    pub bootstrap_servers: String,
+    pub sasl_bootstrap_servers: Option<String>,
+}
+
+pub struct FlussTestingClusterBuilder {
+    number_of_tablet_servers: u16,
+    network: &'static str,
+    cluster_conf: HashMap<String, String>,
+    testing_name: String,
+    remote_data_dir: Option<std::path::PathBuf>,
+    sasl_enabled: bool,
+    sasl_users: Vec<(String, String)>,
+    coordinator_host_port: u16,
+    plain_client_port: Option<u16>,
+    image: String,
+    image_tag: String,
+}
+
+impl FlussTestingClusterBuilder {
+    pub fn new(testing_name: impl Into<String>) -> Self {
+        Self::new_with_cluster_conf(testing_name.into(), &HashMap::default())
+    }
+
+    pub fn with_remote_data_dir(mut self, dir: std::path::PathBuf) -> Self {
+        std::fs::create_dir_all(&dir).expect("Failed to create remote data directory");
+        self.remote_data_dir = Some(dir);
+        self
+    }
+
+    pub fn with_sasl(mut self, users: Vec<(String, String)>) -> Self {
+        self.sasl_enabled = true;
+        self.sasl_users = users;
+        self.plain_client_port = Some(self.coordinator_host_port + 100);
+        self
+    }
+
+    pub fn with_port(mut self, port: u16) -> Self {
+        self.coordinator_host_port = port;
+        // Re-derive SASL port if SASL was already enabled.
+        if self.sasl_enabled {
+            self.plain_client_port = Some(port + 100);
+        }
+        self
+    }
+
+    pub fn new_with_cluster_conf(
+        testing_name: impl Into<String>,
+        conf: &HashMap<String, String>,
+    ) -> Self {
+        let mut cluster_conf = conf.clone();
+        cluster_conf.insert(
+            "netty.server.num-network-threads".to_string(),
+            "1".to_string(),
+        );
+        cluster_conf.insert(
+            "netty.server.num-worker-threads".to_string(),
+            "3".to_string(),
+        );
+
+        FlussTestingClusterBuilder {
+            number_of_tablet_servers: 1,
+            cluster_conf,
+            network: "fluss-cluster-network",
+            testing_name: testing_name.into(),
+            remote_data_dir: None,
+            sasl_enabled: false,
+            sasl_users: Vec::new(),
+            coordinator_host_port: 9123,
+            plain_client_port: None,
+            image: FLUSS_IMAGE.to_string(),
+            image_tag: FLUSS_VERSION.to_string(),
+        }
+    }
+
+    fn tablet_server_container_name(&self, server_id: u16) -> String {
+        format!("tablet-server-{}-{}", self.testing_name, server_id)
+    }
+
+    fn coordinator_server_container_name(&self) -> String {
+        format!("coordinator-server-{}", self.testing_name)
+    }
+
+    fn zookeeper_container_name(&self) -> String {
+        format!("zookeeper-{}", self.testing_name)
+    }
+
+    /// Lists the ZooKeeper, coordinator and tablet-server container names, in that order.
+    fn container_names(&self) -> Vec<String> {
+        let tablet_server_ids = 0..self.number_of_tablet_servers;
+        let mut names = vec![self.zookeeper_container_name()];
+        names.push(self.coordinator_server_container_name());
+        names.extend(tablet_server_ids.map(|id| self.tablet_server_container_name(id)));
+        names
+    }
+
+    fn inject_sasl_conf(&mut self) {
+        if self.sasl_enabled
+            && !self.sasl_users.is_empty()
+            && !self.cluster_conf.contains_key("security.protocol.map")
+        {
+            self.cluster_conf.insert(
+                "security.protocol.map".to_string(),
+                "CLIENT:sasl".to_string(),
+            );
+            self.cluster_conf.insert(
+                "security.sasl.enabled.mechanisms".to_string(),
+                "plain".to_string(),
+            );
+            let user_entries: Vec<String> = self
+                .sasl_users
+                .iter()
+                .map(|(u, p)| format!("user_{}=\"{}\"", u, p))
+                .collect();
+            let jaas_config = format!(
+                "org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required {};",
+                user_entries.join(" ")
+            );
+            self.cluster_conf
+                .insert("security.sasl.plain.jaas.config".to_string(), jaas_config);
+        }
+    }
+
+    fn bootstrap_addresses(&self) -> (String, Option<String>) {
+        if let Some(plain_port) = self.plain_client_port {
+            (
+                format!("127.0.0.1:{}", plain_port),
+                Some(format!("127.0.0.1:{}", self.coordinator_host_port)),
+            )
+        } else {
+            (format!("127.0.0.1:{}", self.coordinator_host_port), None)
+        }
+    }
+
+    fn all_containers_exist(&self) -> bool {
+        self.container_names().iter().all(|name| {
+            std::process::Command::new("docker")
+                .args(["ps", "-q", "--filter", &format!("name=^{}$", name)])
+                .output()
+                .map(|o| !String::from_utf8_lossy(&o.stdout).trim().is_empty())
+                .unwrap_or(false)
+        })
+    }
+
+    async fn start_all_containers(&mut self) -> Vec<ContainerAsync<GenericImage>> {
+        for name in &self.container_names() {
+            let _ = std::process::Command::new("docker")
+                .args(["rm", "-f", name])
+                .output();
+        }
+        self.inject_sasl_conf();
+
+        let mut containers = Vec::new();
+        containers.push(self.start_zookeeper().await);
+        containers.push(self.start_coordinator_server().await);
+        for server_id in 0..self.number_of_tablet_servers {
+            containers.push(self.start_tablet_server(server_id).await);
+        }
+        containers
+    }
+
+    /// Containers stop when the returned struct is dropped.
+    pub async fn build(&mut self) -> FlussTestingCluster {
+        let container_names = self.container_names();
+        let containers = self.start_all_containers().await;
+
+        let mut iter = containers.into_iter();
+        let zookeeper = Arc::new(iter.next().unwrap());
+        let coordinator_server = Arc::new(iter.next().unwrap());
+        let mut tablet_servers = HashMap::new();
+        for server_id in 0..self.number_of_tablet_servers {
+            tablet_servers.insert(server_id, Arc::new(iter.next().unwrap()));
+        }
+
+        let (bootstrap_servers, sasl_bootstrap_servers) = self.bootstrap_addresses();
+
+        FlussTestingCluster {
+            zookeeper,
+            coordinator_server,
+            tablet_servers,
+            bootstrap_servers,
+            sasl_bootstrap_servers,
+            remote_data_dir: self.remote_data_dir.clone(),
+            sasl_users: self.sasl_users.clone(),
+            container_names,
+        }
+    }
+
+    /// Containers outlive the process. Clean up via `stop_cluster()`.
+    /// Idempotent: if the cluster is already running, returns its info.
+    pub async fn build_detached(&mut self) -> ClusterInfo {
+        if !self.all_containers_exist() {
+            let containers = self.start_all_containers().await;
+            let _ = ManuallyDrop::new(containers);
+        }
+
+        let (bootstrap_servers, sasl_bootstrap_servers) = self.bootstrap_addresses();
+        ClusterInfo {
+            bootstrap_servers,
+            sasl_bootstrap_servers,
+        }
+    }
+
+    async fn start_zookeeper(&self) -> ContainerAsync<GenericImage> {
+        GenericImage::new(ZOOKEEPER_IMAGE, ZOOKEEPER_VERSION)
+            .with_network(self.network)
+            .with_container_name(self.zookeeper_container_name())
+            .start()
+            .await
+            .unwrap()
+    }
+
+    async fn start_coordinator_server(&mut self) -> ContainerAsync<GenericImage> {
+        let port = self.coordinator_host_port;
+        let container_name = self.coordinator_server_container_name();
+        let mut coordinator_confs = HashMap::new();
+        coordinator_confs.insert(
+            "zookeeper.address",
+            format!("{}:2181", self.zookeeper_container_name()),
+        );
+
+        if let Some(plain_port) = self.plain_client_port {
+            coordinator_confs.insert(
+                "bind.listeners",
+                format!(
+                    "INTERNAL://{}:0, CLIENT://{}:{}, PLAIN_CLIENT://{}:{}",
+                    container_name, container_name, port, container_name, plain_port
+                ),
+            );
+            coordinator_confs.insert(
+                "advertised.listeners",
+                format!(
+                    "CLIENT://localhost:{}, PLAIN_CLIENT://localhost:{}",
+                    port, plain_port
+                ),
+            );
+        } else {
+            coordinator_confs.insert(
+                "bind.listeners",
+                format!(
+                    "INTERNAL://{}:0, CLIENT://{}:{}",
+                    container_name, container_name, port
+                ),
+            );
+            coordinator_confs.insert(
+                "advertised.listeners",
+                format!("CLIENT://localhost:{}", port),
+            );
+        }
+
+        coordinator_confs.insert("internal.listener.name", "INTERNAL".to_string());
+
+        let mut image = GenericImage::new(&self.image, &self.image_tag)
+            .with_container_name(self.coordinator_server_container_name())
+            .with_mapped_port(port, ContainerPort::Tcp(port))
+            .with_network(self.network)
+            .with_cmd(vec!["coordinatorServer"])
+            .with_env_var(
+                "FLUSS_PROPERTIES",
+                self.to_fluss_properties_with(coordinator_confs),
+            );
+
+        if let Some(plain_port) = self.plain_client_port {
+            image = image.with_mapped_port(plain_port, ContainerPort::Tcp(plain_port));
+        }
+
+        image.start().await.unwrap()
+    }
+
+    async fn start_tablet_server(&self, server_id: u16) -> ContainerAsync<GenericImage> {
+        let port = self.coordinator_host_port;
+        let container_name = self.tablet_server_container_name(server_id);
+        let mut tablet_server_confs = HashMap::new();
+        let expose_host_port = port + 1 + server_id;
+        let tablet_server_id = format!("{}", server_id);
+
+        if let Some(plain_port) = self.plain_client_port {
+            let bind_listeners = format!(
+                "INTERNAL://{}:0, CLIENT://{}:{}, PLAIN_CLIENT://{}:{}",
+                container_name, container_name, port, container_name, plain_port,
+            );
+            let plain_expose_host_port = plain_port + 1 + server_id;
+            let advertised_listeners = format!(
+                "CLIENT://localhost:{}, PLAIN_CLIENT://localhost:{}",
+                expose_host_port, plain_expose_host_port
+            );
+            tablet_server_confs.insert("bind.listeners", bind_listeners);
+            tablet_server_confs.insert("advertised.listeners", advertised_listeners);
+        } else {
+            let bind_listeners = format!(
+                "INTERNAL://{}:0, CLIENT://{}:{}",
+                container_name, container_name, port,
+            );
+            let advertised_listeners = format!("CLIENT://localhost:{}", expose_host_port);
+            tablet_server_confs.insert("bind.listeners", bind_listeners);
+            tablet_server_confs.insert("advertised.listeners", advertised_listeners);
+        }
+
+        tablet_server_confs.insert(
+            "zookeeper.address",
+            format!("{}:2181", self.zookeeper_container_name()),
+        );
+        tablet_server_confs.insert("internal.listener.name", "INTERNAL".to_string());
+        tablet_server_confs.insert("tablet-server.id", tablet_server_id);
+
+        if let Some(remote_data_dir) = &self.remote_data_dir {
+            tablet_server_confs.insert(
+                "remote.data.dir",
+                remote_data_dir.to_string_lossy().to_string(),
+            );
+        }
+        let mut image = GenericImage::new(&self.image, &self.image_tag)
+            .with_cmd(vec!["tabletServer"])
+            .with_mapped_port(expose_host_port, ContainerPort::Tcp(port))
+            .with_network(self.network)
+            .with_container_name(self.tablet_server_container_name(server_id))
+            .with_env_var(
+                "FLUSS_PROPERTIES",
+                self.to_fluss_properties_with(tablet_server_confs),
+            );
+
+        if let Some(plain_port) = self.plain_client_port {
+            let plain_expose_host_port = plain_port + 1 + server_id;
+            image = image.with_mapped_port(plain_expose_host_port, ContainerPort::Tcp(plain_port));
+        }
+
+        if let Some(ref remote_data_dir) = self.remote_data_dir {
+            use testcontainers::core::Mount;
+            std::fs::create_dir_all(remote_data_dir)
+                .expect("Failed to create remote data directory for mount");
+            let host_path = remote_data_dir.to_string_lossy().to_string();
+            let container_path = remote_data_dir.to_string_lossy().to_string();
+            image = image.with_mount(Mount::bind_mount(host_path, container_path));
+        }
+
+        image.start().await.unwrap()
+    }
+
+    /// Builds the `FLUSS_PROPERTIES` payload: one `key: value` line per entry,
+    /// cluster-wide settings first, then `extra_properties`, joined by newlines.
+    fn to_fluss_properties_with(&self, extra_properties: HashMap<&str, String>) -> String {
+        let cluster_wide = self
+            .cluster_conf
+            .iter()
+            .map(|(key, value)| format!("{}: {}", key, value));
+        let extra = extra_properties.iter().map(|(key, value)| format!("{}: {}", key, value));
+        cluster_wide.chain(extra).collect::<Vec<_>>().join("\n")
+    }
+}
+
+#[derive(Clone)]
+#[allow(dead_code)] // Fields held for RAII.
+pub struct FlussTestingCluster {
+    zookeeper: Arc<ContainerAsync<GenericImage>>,
+    coordinator_server: Arc<ContainerAsync<GenericImage>>,
+    tablet_servers: HashMap<u16, Arc<ContainerAsync<GenericImage>>>,
+    bootstrap_servers: String,
+    sasl_bootstrap_servers: Option<String>,
+    remote_data_dir: Option<std::path::PathBuf>,
+    sasl_users: Vec<(String, String)>,
+    container_names: Vec<String>,
+}
+
+impl FlussTestingCluster {
+    pub fn stop(&self) {
+        for name in &self.container_names {
+            let _ = std::process::Command::new("docker")
+                .args(["rm", "-f", name])
+                .output();
+        }
+        if let Some(ref dir) = self.remote_data_dir {
+            let _ = std::fs::remove_dir_all(dir);
+        }
+    }
+
+    pub fn sasl_users(&self) -> &[(String, String)] {
+        &self.sasl_users
+    }
+
+    pub fn plaintext_bootstrap_servers(&self) -> &str {
+        &self.bootstrap_servers
+    }
+
+    pub async fn get_fluss_connection(&self) -> FlussConnection {
+        let config = Config {
+            writer_acks: "all".to_string(),
+            bootstrap_servers: self.bootstrap_servers.clone(),
+            ..Default::default()
+        };
+
+        self.connect_with_retry(config).await
+    }
+
+    pub async fn get_fluss_connection_with_sasl(
+        &self,
+        username: &str,
+        password: &str,
+    ) -> FlussConnection {
+        let bootstrap = self
+            .sasl_bootstrap_servers
+            .clone()
+            .unwrap_or_else(|| self.bootstrap_servers.clone());
+        let config = Config {
+            writer_acks: "all".to_string(),
+            bootstrap_servers: bootstrap,
+            security_protocol: "sasl".to_string(),
+            security_sasl_mechanism: "PLAIN".to_string(),
+            security_sasl_username: username.to_string(),
+            security_sasl_password: password.to_string(),
+            ..Default::default()
+        };
+
+        self.connect_with_retry(config).await
+    }
+
+    pub async fn try_fluss_connection_with_sasl(
+        &self,
+        username: &str,
+        password: &str,
+    ) -> fluss::error::Result<FlussConnection> {
+        let bootstrap = self
+            .sasl_bootstrap_servers
+            .clone()
+            .unwrap_or_else(|| self.bootstrap_servers.clone());
+        let config = Config {
+            writer_acks: "all".to_string(),
+            bootstrap_servers: bootstrap,
+            security_protocol: "sasl".to_string(),
+            security_sasl_mechanism: "PLAIN".to_string(),
+            security_sasl_username: username.to_string(),
+            security_sasl_password: password.to_string(),
+            ..Default::default()
+        };
+
+        FlussConnection::new(config).await
+    }
+
+    /// Tries to open a connection up to 60 times, one second apart; panics with
+    /// the last error if every attempt fails.
+    async fn connect_with_retry(&self, config: Config) -> FlussConnection {
+        const MAX_RETRIES: u32 = 60;
+        const RETRY_INTERVAL: Duration = Duration::from_secs(1);
+
+        let mut attempt = 1;
+        loop {
+            let error = match FlussConnection::new(config.clone()).await {
+                Ok(connection) => return connection,
+                Err(error) => error,
+            };
+            if attempt == MAX_RETRIES {
+                panic!(
+                    "Failed to connect to Fluss cluster after {} attempts: {}",
+                    MAX_RETRIES, error
+                );
+            }
+            attempt += 1;
+            tokio::time::sleep(RETRY_INTERVAL).await;
+        }
+    }
+}
+
+/// Removes cluster `name`'s containers; anchored since docker's `name=` filter matches substrings.
+pub fn stop_cluster(name: &str) {
+    let patterns = [
+        format!("^zookeeper-{}$", name),
+        format!("^coordinator-server-{}$", name),
+        format!("^tablet-server-{}-[0-9]+$", name),
+    ];
+    for pattern in &patterns {
+        if let Ok(output) = std::process::Command::new("docker")
+            .args(["ps", "-aq", "--filter", &format!("name={}", pattern)])
+            .output()
+        {
+            for id in String::from_utf8_lossy(&output.stdout).split_whitespace() {
+                let _ = std::process::Command::new("docker")
+                    .args(["rm", "-f", id])
+                    .output();
+            }
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss-test-cluster/src/main.rs b/fluss-rust/crates/fluss-test-cluster/src/main.rs
new file mode 100644
index 0000000000..fc3a19f60e
--- /dev/null
+++ b/fluss-rust/crates/fluss-test-cluster/src/main.rs
@@ -0,0 +1,103 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use clap::{Parser, Subcommand};
+use fluss::ServerType;
+use fluss::config::Config;
+use fluss_test_cluster::FlussTestingClusterBuilder;
+use std::time::Duration;
+
+#[derive(Parser)]
+#[command(about = "Manage a Fluss test cluster via testcontainers")]
+struct Cli {
+    #[command(subcommand)]
+    command: Command,
+}
+
+#[derive(Subcommand)]
+enum Command {
+    /// Start a Fluss test cluster (idempotent). Prints cluster info as JSON to stdout.
+    Start {
+        #[arg(long, default_value = "shared-test")]
+        name: String,
+        #[arg(long)]
+        sasl: bool,
+        #[arg(long, default_value_t = 9123)]
+        port: u16,
+    },
+    /// Stop and remove all containers for a cluster.
+    Stop {
+        #[arg(long, default_value = "shared-test")]
+        name: String,
+    },
+}
+
+#[tokio::main]
+async fn main() {
+    let cli = Cli::parse();
+
+    match cli.command {
+        Command::Start { name, sasl, port } => {
+            eprintln!("Starting Fluss test cluster '{}'...", name);
+
+            let mut builder = FlussTestingClusterBuilder::new(&name).with_port(port);
+
+            if sasl {
+                builder = builder.with_sasl(vec![
+                    ("admin".to_string(), "admin-secret".to_string()),
+                    ("alice".to_string(), "alice-secret".to_string()),
+                ]);
+            }
+
+            let info = builder.build_detached().await;
+            let start = std::time::Instant::now();
+
+            // Check plaintext endpoint only — can't verify SASL without credentials.
+            eprintln!("Waiting for cluster to be ready...");
+            loop {
+                let config = Config {
+                    bootstrap_servers: info.bootstrap_servers.clone(),
+                    ..Default::default()
+                };
+                if let Ok(conn) = fluss::client::FlussConnection::new(config).await {
+                    if let Ok(admin) = conn.get_admin() {
+                        if let Ok(nodes) = admin.get_server_nodes().await {
+                            if nodes
+                                .iter()
+                                .any(|n| *n.server_type() == ServerType::TabletServer)
+                            {
+                                break;
+                            }
+                        }
+                    }
+                }
+                if start.elapsed() >= Duration::from_secs(60) {
+                    eprintln!("TIMEOUT: cluster did not become ready within 60s");
+                    std::process::exit(1);
+                }
+                tokio::time::sleep(Duration::from_secs(1)).await;
+            }
+            eprintln!("Cluster ready.");
+            println!("CLUSTER_JSON: {}", serde_json::to_string(&info).unwrap());
+        }
+        Command::Stop { name } => {
+            eprintln!("Stopping Fluss test cluster '{}'...", name);
+            fluss_test_cluster::stop_cluster(&name);
+            eprintln!("Cluster stopped.");
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss-test-cluster/test-images.env b/fluss-rust/crates/fluss-test-cluster/test-images.env
new file mode 100644
index 0000000000..3aa8e735cf
--- /dev/null
+++ b/fluss-rust/crates/fluss-test-cluster/test-images.env
@@ -0,0 +1,4 @@
+FLUSS_IMAGE=apache/fluss
+FLUSS_VERSION=0.9.0-incubating
+ZOOKEEPER_IMAGE=zookeeper
+ZOOKEEPER_VERSION=3.9.2
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index ef6a62d3a7..040599ed06 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -79,7 +79,7 @@ strum_macros = "0.26"
 jiff = { workspace = true, features = ["js"] }
 
 [dev-dependencies]
-testcontainers = "0.27.2"
+fluss-test-cluster = { path = "../fluss-test-cluster" }
 
 [build-dependencies]
 prost-build = "0.14"
diff --git a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
index 5dc3e33e22..0860be5d74 100644
--- a/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
+++ b/fluss-rust/crates/fluss/tests/integration/fluss_cluster.rs
@@ -15,453 +15,4 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use fluss::client::FlussConnection;
-use fluss::config::Config;
-use std::collections::HashMap;
-use std::string::ToString;
-use std::sync::Arc;
-use std::time::Duration;
-use testcontainers::core::ContainerPort;
-use testcontainers::runners::AsyncRunner;
-use testcontainers::{ContainerAsync, GenericImage, ImageExt};
-
-const FLUSS_VERSION: &str = "0.9.0-incubating";
-const FLUSS_IMAGE: &str = "apache/fluss";
-
-pub struct FlussTestingClusterBuilder {
-    number_of_tablet_servers: i32,
-    network: &'static str,
-    cluster_conf: HashMap<String, String>,
-    testing_name: String,
-    remote_data_dir: Option<std::path::PathBuf>,
-    sasl_enabled: bool,
-    sasl_users: Vec<(String, String)>,
-    /// Host port for the coordinator server (default 9123).
-    coordinator_host_port: u16,
-    /// Host port for the plaintext (PLAIN_CLIENT) listener.
-    /// When set together with `sasl_enabled`, the cluster exposes two listeners:
-    /// CLIENT (SASL) on `coordinator_host_port` and PLAIN_CLIENT on this port.
-    plain_client_port: Option<u16>,
-    image: String,
-    image_tag: String,
-}
-
-impl FlussTestingClusterBuilder {
-    #[allow(dead_code)]
-    pub fn new(testing_name: impl Into<String>) -> Self {
-        Self::new_with_cluster_conf(testing_name.into(), &HashMap::default())
-    }
-
-    pub fn with_remote_data_dir(mut self, dir: std::path::PathBuf) -> Self {
-        // Ensure the directory exists before mounting
-        std::fs::create_dir_all(&dir).expect("Failed to create remote data directory");
-        self.remote_data_dir = Some(dir);
-        self
-    }
-
-    /// Enable SASL/PLAIN authentication on the cluster with dual listeners.
-    /// Users are specified as `(username, password)` pairs.
-    /// This automatically configures a PLAIN_CLIENT (plaintext) listener in addition
-    /// to the CLIENT (SASL) listener, allowing both authenticated and unauthenticated
-    /// connections on the same cluster.
-    pub fn with_sasl(mut self, users: Vec<(String, String)>) -> Self {
-        self.sasl_enabled = true;
-        self.sasl_users = users;
-        self.plain_client_port = Some(self.coordinator_host_port + 100);
-        self
-    }
-
-    pub fn new_with_cluster_conf(
-        testing_name: impl Into<String>,
-        conf: &HashMap<String, String>,
-    ) -> Self {
-        // reduce testing resources
-        let mut cluster_conf = conf.clone();
-        cluster_conf.insert(
-            "netty.server.num-network-threads".to_string(),
-            "1".to_string(),
-        );
-        cluster_conf.insert(
-            "netty.server.num-worker-threads".to_string(),
-            "3".to_string(),
-        );
-
-        FlussTestingClusterBuilder {
-            number_of_tablet_servers: 1,
-            cluster_conf,
-            network: "fluss-cluster-network",
-            testing_name: testing_name.into(),
-            remote_data_dir: None,
-            sasl_enabled: false,
-            sasl_users: Vec::new(),
-            coordinator_host_port: 9123,
-            plain_client_port: None,
-            image: FLUSS_IMAGE.to_string(),
-            image_tag: FLUSS_VERSION.to_string(),
-        }
-    }
-
-    fn tablet_server_container_name(&self, server_id: i32) -> String {
-        format!("tablet-server-{}-{}", self.testing_name, server_id)
-    }
-
-    fn coordinator_server_container_name(&self) -> String {
-        format!("coordinator-server-{}", self.testing_name)
-    }
-
-    fn zookeeper_container_name(&self) -> String {
-        format!("zookeeper-{}", self.testing_name)
-    }
-
-    pub async fn build(&mut self) -> FlussTestingCluster {
-        // Remove stale containers from previous runs (if any) so we can reuse names.
-        let stale_containers: Vec<String> = std::iter::once(self.zookeeper_container_name())
-            .chain(std::iter::once(self.coordinator_server_container_name()))
-            .chain(
-                (0..self.number_of_tablet_servers).map(|id| self.tablet_server_container_name(id)),
-            )
-            .collect();
-        for name in &stale_containers {
-            let _ = std::process::Command::new("docker")
-                .args(["rm", "-f", name])
-                .output();
-        }
-
-        // Inject SASL server-side configuration into cluster_conf
-        if self.sasl_enabled && !self.sasl_users.is_empty() {
-            self.cluster_conf.insert(
-                "security.protocol.map".to_string(),
-                "CLIENT:sasl".to_string(),
-            );
-            self.cluster_conf.insert(
-                "security.sasl.enabled.mechanisms".to_string(),
-                "plain".to_string(),
-            );
-            // Build JAAS config: user_<name>="<password>" for each user
-            let user_entries: Vec<String> = self
-                .sasl_users
-                .iter()
-                .map(|(u, p)| format!("user_{}=\"{}\"", u, p))
-                .collect();
-            let jaas_config = format!(
-                "org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required {};",
-                user_entries.join(" ")
-            );
-            self.cluster_conf
-                .insert("security.sasl.plain.jaas.config".to_string(), jaas_config);
-        }
-
-        let zookeeper = Arc::new(
-            GenericImage::new("zookeeper", "3.9.2")
-                .with_network(self.network)
-                .with_container_name(self.zookeeper_container_name())
-                .start()
-                .await
-                .unwrap(),
-        );
-
-        let coordinator_server = Arc::new(self.start_coordinator_server().await);
-
-        let mut tablet_servers = HashMap::new();
-        for server_id in 0..self.number_of_tablet_servers {
-            tablet_servers.insert(
-                server_id,
-                Arc::new(self.start_tablet_server(server_id).await),
-            );
-        }
-
-        // When dual listeners are configured, bootstrap_servers points to the plaintext
-        // listener and sasl_bootstrap_servers points to the SASL listener.
-        let (bootstrap_servers, sasl_bootstrap_servers) =
-            if let Some(plain_port) = self.plain_client_port {
-                (
-                    format!("127.0.0.1:{}", plain_port),
-                    Some(format!("127.0.0.1:{}", self.coordinator_host_port)),
-                )
-            } else {
-                (format!("127.0.0.1:{}", self.coordinator_host_port), None)
-            };
-
-        FlussTestingCluster {
-            zookeeper,
-            coordinator_server,
-            tablet_servers,
-            bootstrap_servers,
-            sasl_bootstrap_servers,
-            remote_data_dir: self.remote_data_dir.clone(),
-            sasl_users: self.sasl_users.clone(),
-            container_names: stale_containers,
-        }
-    }
-
-    async fn start_coordinator_server(&mut self) -> ContainerAsync<GenericImage> {
-        let port = self.coordinator_host_port;
-        let container_name = self.coordinator_server_container_name();
-        let mut coordinator_confs = HashMap::new();
-        coordinator_confs.insert(
-            "zookeeper.address",
-            format!("{}:2181", self.zookeeper_container_name()),
-        );
-
-        if let Some(plain_port) = self.plain_client_port {
-            // Dual listeners: CLIENT (SASL) + PLAIN_CLIENT (plaintext)
-            coordinator_confs.insert(
-                "bind.listeners",
-                format!(
-                    "INTERNAL://{}:0, CLIENT://{}:{}, PLAIN_CLIENT://{}:{}",
-                    container_name, container_name, port, container_name, plain_port
-                ),
-            );
-            coordinator_confs.insert(
-                "advertised.listeners",
-                format!(
-                    "CLIENT://localhost:{}, PLAIN_CLIENT://localhost:{}",
-                    port, plain_port
-                ),
-            );
-        } else {
-            coordinator_confs.insert(
-                "bind.listeners",
-                format!(
-                    "INTERNAL://{}:0, CLIENT://{}:{}",
-                    container_name, container_name, port
-                ),
-            );
-            coordinator_confs.insert(
-                "advertised.listeners",
-                format!("CLIENT://localhost:{}", port),
-            );
-        }
-
-        coordinator_confs.insert("internal.listener.name", "INTERNAL".to_string());
-
-        let mut image = GenericImage::new(&self.image, &self.image_tag)
-            .with_container_name(self.coordinator_server_container_name())
-            .with_mapped_port(port, ContainerPort::Tcp(port))
-            .with_network(self.network)
-            .with_cmd(vec!["coordinatorServer"])
-            .with_env_var(
-                "FLUSS_PROPERTIES",
-                self.to_fluss_properties_with(coordinator_confs),
-            );
-
-        if let Some(plain_port) = self.plain_client_port {
-            image = image.with_mapped_port(plain_port, ContainerPort::Tcp(plain_port));
-        }
-
-        image.start().await.unwrap()
-    }
-
-    async fn start_tablet_server(&self, server_id: i32) -> ContainerAsync<GenericImage> {
-        let port = self.coordinator_host_port;
-        let container_name = self.tablet_server_container_name(server_id);
-        let mut tablet_server_confs = HashMap::new();
-        let expose_host_port = (port as i32) + 1 + server_id;
-        let tablet_server_id = format!("{}", server_id);
-
-        if let Some(plain_port) = self.plain_client_port {
-            // Dual listeners: CLIENT (SASL) + PLAIN_CLIENT (plaintext)
-            let bind_listeners = format!(
-                "INTERNAL://{}:0, CLIENT://{}:{}, PLAIN_CLIENT://{}:{}",
-                container_name, container_name, port, container_name, plain_port,
-            );
-            let plain_expose_host_port = (plain_port as i32) + 1 + server_id;
-            let advertised_listeners = format!(
-                "CLIENT://localhost:{}, PLAIN_CLIENT://localhost:{}",
-                expose_host_port, plain_expose_host_port
-            );
-            tablet_server_confs.insert("bind.listeners", bind_listeners);
-            tablet_server_confs.insert("advertised.listeners", advertised_listeners);
-        } else {
-            let bind_listeners = format!(
-                "INTERNAL://{}:0, CLIENT://{}:{}",
-                container_name, container_name, port,
-            );
-            let advertised_listeners = format!("CLIENT://localhost:{}", expose_host_port);
-            tablet_server_confs.insert("bind.listeners", bind_listeners);
-            tablet_server_confs.insert("advertised.listeners", advertised_listeners);
-        }
-
-        tablet_server_confs.insert(
-            "zookeeper.address",
-            format!("{}:2181", self.zookeeper_container_name()),
-        );
-        tablet_server_confs.insert("internal.listener.name", "INTERNAL".to_string());
-        tablet_server_confs.insert("tablet-server.id", tablet_server_id);
-
-        // Set remote.data.dir to use the same path as host when volume mount is provided
-        // This ensures the path is consistent between host and container
-        if let Some(remote_data_dir) = &self.remote_data_dir {
-            tablet_server_confs.insert(
-                "remote.data.dir",
-                remote_data_dir.to_string_lossy().to_string(),
-            );
-        }
-        let mut image = GenericImage::new(&self.image, &self.image_tag)
-            .with_cmd(vec!["tabletServer"])
-            .with_mapped_port(expose_host_port as u16, ContainerPort::Tcp(port))
-            .with_network(self.network)
-            .with_container_name(self.tablet_server_container_name(server_id))
-            .with_env_var(
-                "FLUSS_PROPERTIES",
-                self.to_fluss_properties_with(tablet_server_confs),
-            );
-
-        // Add port mapping for plaintext listener
-        if let Some(plain_port) = self.plain_client_port {
-            let plain_expose_host_port = (plain_port as i32) + 1 + server_id;
-            image = image.with_mapped_port(
-                plain_expose_host_port as u16,
-                ContainerPort::Tcp(plain_port),
-            );
-        }
-
-        // Add volume mount if remote_data_dir is provided
-        if let Some(ref remote_data_dir) = self.remote_data_dir {
-            use testcontainers::core::Mount;
-            // Ensure directory exists before mounting (double check)
-            std::fs::create_dir_all(remote_data_dir)
-                .expect("Failed to create remote data directory for mount");
-            let host_path = remote_data_dir.to_string_lossy().to_string();
-            let container_path = remote_data_dir.to_string_lossy().to_string();
-            image = image.with_mount(Mount::bind_mount(host_path, container_path));
-        }
-
-        image.start().await.unwrap()
-    }
-
-    fn to_fluss_properties_with(&self, extra_properties: HashMap<&str, String>) -> String {
-        let mut fluss_properties = Vec::new();
-        for (k, v) in self.cluster_conf.iter() {
-            fluss_properties.push(format!("{}: {}", k, v));
-        }
-        for (k, v) in extra_properties.iter() {
-            fluss_properties.push(format!("{}: {}", k, v));
-        }
-        fluss_properties.join("\n")
-    }
-}
-
-/// Provides an easy way to launch a Fluss cluster with coordinator and tablet servers.
-#[derive(Clone)]
-#[allow(dead_code)] // Fields held for RAII (keeping Docker containers alive).
-pub struct FlussTestingCluster {
-    zookeeper: Arc<ContainerAsync<GenericImage>>,
-    coordinator_server: Arc<ContainerAsync<GenericImage>>,
-    tablet_servers: HashMap<i32, Arc<ContainerAsync<GenericImage>>>,
-    /// Bootstrap servers for plaintext connections.
-    /// When dual listeners are configured, this points to the PLAIN_CLIENT listener.
-    bootstrap_servers: String,
-    /// Bootstrap servers for SASL connections (only set when dual listeners are configured).
-    sasl_bootstrap_servers: Option<String>,
-    remote_data_dir: Option<std::path::PathBuf>,
-    sasl_users: Vec<(String, String)>,
-    container_names: Vec<String>,
-}
-
-impl FlussTestingCluster {
-    /// Synchronously stops and removes all Docker containers and cleans up the
-    /// remote data directory. Safe to call from non-async contexts (e.g. atexit).
-    #[allow(dead_code)]
-    pub fn stop(&self) {
-        for name in &self.container_names {
-            let _ = std::process::Command::new("docker")
-                .args(["rm", "-f", name])
-                .output();
-        }
-        if let Some(ref dir) = self.remote_data_dir {
-            let _ = std::fs::remove_dir_all(dir);
-        }
-    }
-
-    pub fn sasl_users(&self) -> &[(String, String)] {
-        &self.sasl_users
-    }
-
-    /// Returns the plaintext (non-SASL) bootstrap servers address.
-    pub fn plaintext_bootstrap_servers(&self) -> &str {
-        &self.bootstrap_servers
-    }
-
-    pub async fn get_fluss_connection(&self) -> FlussConnection {
-        let config = Config {
-            writer_acks: "all".to_string(),
-            bootstrap_servers: self.bootstrap_servers.clone(),
-            ..Default::default()
-        };
-
-        self.connect_with_retry(config).await
-    }
-
-    /// Connect with SASL/PLAIN credentials.
-    /// Uses `sasl_bootstrap_servers` when dual listeners are configured.
-    pub async fn get_fluss_connection_with_sasl(
-        &self,
-        username: &str,
-        password: &str,
-    ) -> FlussConnection {
-        let bootstrap = self
-            .sasl_bootstrap_servers
-            .clone()
-            .unwrap_or_else(|| self.bootstrap_servers.clone());
-        let config = Config {
-            writer_acks: "all".to_string(),
-            bootstrap_servers: bootstrap,
-            security_protocol: "sasl".to_string(),
-            security_sasl_mechanism: "PLAIN".to_string(),
-            security_sasl_username: username.to_string(),
-            security_sasl_password: password.to_string(),
-            ..Default::default()
-        };
-
-        self.connect_with_retry(config).await
-    }
-
-    /// Try to connect with SASL/PLAIN credentials, returning the error on failure.
-    /// Uses `sasl_bootstrap_servers` when dual listeners are configured.
-    pub async fn try_fluss_connection_with_sasl(
-        &self,
-        username: &str,
-        password: &str,
-    ) -> fluss::error::Result<FlussConnection> {
-        let bootstrap = self
-            .sasl_bootstrap_servers
-            .clone()
-            .unwrap_or_else(|| self.bootstrap_servers.clone());
-        let config = Config {
-            writer_acks: "all".to_string(),
-            bootstrap_servers: bootstrap,
-            security_protocol: "sasl".to_string(),
-            security_sasl_mechanism: "PLAIN".to_string(),
-            security_sasl_username: username.to_string(),
-            security_sasl_password: password.to_string(),
-            ..Default::default()
-        };
-
-        FlussConnection::new(config).await
-    }
-
-    async fn connect_with_retry(&self, config: Config) -> FlussConnection {
-        // Retry mechanism: retry for up to 1 minute
-        let max_retries = 60; // 60 retry attempts
-        let retry_interval = Duration::from_secs(1); // 1 second interval between retries
-
-        for attempt in 1..=max_retries {
-            match FlussConnection::new(config.clone()).await {
-                Ok(connection) => {
-                    return connection;
-                }
-                Err(e) => {
-                    if attempt == max_retries {
-                        panic!(
-                            "Failed to connect to Fluss cluster after {} attempts: {}",
-                            max_retries, e
-                        );
-                    }
-                    tokio::time::sleep(retry_interval).await;
-                }
-            }
-        }
-        unreachable!()
-    }
-}
+pub use fluss_test_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index 970b84ae8e..dc2876f899 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -53,7 +53,7 @@ static SHARED_CLUSTER: LazyLock<FlussTestingCluster> = LazyLock::new(|| {
             );
 
             let cluster =
-                FlussTestingClusterBuilder::new_with_cluster_conf("shared-test", &cluster_conf)
+                FlussTestingClusterBuilder::new_with_cluster_conf("rust-test", &cluster_conf)
                     .with_sasl(vec![
                         ("admin".to_string(), "admin-secret".to_string()),
                         ("alice".to_string(), "alice-secret".to_string()),

From 411b1dc798f14a0c5d870483152b4095310f0025 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Fri, 10 Apr 2026 23:14:35 +0100
Subject: [PATCH 228/287] fix python 3.11 bug in tests with async wait_for
 (#488)

---
 fluss-rust/bindings/python/pyproject.toml         |  2 ++
 fluss-rust/bindings/python/test/test_log_table.py | 13 ++++++-------
 2 files changed, 8 insertions(+), 7 deletions(-)

diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index 41463027bc..9163835fe3 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -51,6 +51,7 @@ dev = [
     "pytest>=8.3.5",
     "pytest-asyncio>=0.25.3",
     "pytest-xdist>=3.5.0",
+    "pytest-timeout>=2.3.1",
     "filelock>=3.0",
     "ruff>=0.9.10",
     "maturin>=1.8.2",
@@ -95,6 +96,7 @@ known-first-party = ["fluss"]
 [tool.pytest.ini_options]
 asyncio_mode = "auto"
 asyncio_default_fixture_loop_scope = "session"
+timeout = 30
 
 [tool.mypy]
 python_version = "3.9"
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
index eb11874864..d5397b7d6b 100644
--- a/fluss-rust/bindings/python/test/test_log_table.py
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -765,8 +765,7 @@ async def consume_scanner():
             if len(collected) == 5:
                 break
                 
-    # We must race the consumption against a timeout so the test doesn't hang if the iterator is broken
-    await asyncio.wait_for(consume_scanner(), timeout=10.0)
+    await consume_scanner()
     
     assert len(collected) == 5, f"Expected 5 records, got {len(collected)}"
     
@@ -824,7 +823,7 @@ async def consume_and_break():
             if len(collected_async) >= 3:
                 break
 
-    await asyncio.wait_for(consume_and_break(), timeout=10.0)
+    await consume_and_break()
     assert len(collected_async) == 3, (
         f"Expected 3 records from async for, got {len(collected_async)}"
     )
@@ -904,7 +903,7 @@ async def consume_all():
             if len(collected) >= num_records:
                 break
 
-    await asyncio.wait_for(consume_all(), timeout=15.0)
+    await consume_all()
     assert len(collected) == num_records, (
         f"Expected {num_records} records, got {len(collected)}"
     )
@@ -963,7 +962,7 @@ async def consume_batches():
             if total_rows >= 6:
                 break
 
-    await asyncio.wait_for(consume_batches(), timeout=15.0)
+    await consume_batches()
 
     assert total_rows >= 6, f"Expected >=6 total rows, got {total_rows}"
     assert len(collected_batches) > 0
@@ -1035,7 +1034,7 @@ async def consume_and_break():
             first_batch = rb
             break
 
-    await asyncio.wait_for(consume_and_break(), timeout=10.0)
+    await consume_and_break()
     assert first_batch is not None, "Should have received at least 1 batch"
     assert first_batch.batch.num_rows > 0
 
@@ -1096,7 +1095,7 @@ async def consume_all():
             if len(all_ids) >= num_records:
                 break
 
-    await asyncio.wait_for(consume_all(), timeout=15.0)
+    await consume_all()
     assert len(all_ids) >= num_records, (
         f"Expected >={num_records} IDs, got {len(all_ids)}"
     )

From d9b5358dd89ee4e6a871f3687d5ac4f8f8e77ff1 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 11 Apr 2026 02:46:56 +0100
Subject: [PATCH 229/287] chore: fix docusaurus (#486)

---
 fluss-rust/website/package.json | 6 +++++-
 1 file changed, 5 insertions(+), 1 deletion(-)

diff --git a/fluss-rust/website/package.json b/fluss-rust/website/package.json
index 75f1499fb4..e725e9e47c 100644
--- a/fluss-rust/website/package.json
+++ b/fluss-rust/website/package.json
@@ -40,5 +40,9 @@
   },
   "engines": {
     "node": ">=20.0"
-  }
+  },
+  "overrides": {
+    "webpackbar": "^7.0.0"
+  },
+  "comment:overrides": "webpackbar 6.x passes its own options (name, color) as this.options, which webpack 5.106.0+ rejects via strict ProgressPlugin schema validation. webpackbar 7.0.0 fixes this. Remove this override once Docusaurus bumps its webpackbar dependency to ^7.0.0."
 }

From 1da2c108dcca1e12d37f6d4285be0e5467c30588 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 11 Apr 2026 02:55:35 +0100
Subject: [PATCH 230/287] [ci] use swatinem/rust-cache (#485)

---
 .../.github/workflows/build_and_test_cpp.yml       | 10 +---------
 .../.github/workflows/build_and_test_python.yml    | 14 +++-----------
 .../.github/workflows/build_and_test_rust.yml      | 10 +---------
 3 files changed, 5 insertions(+), 29 deletions(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
index 7b6383afcb..a091d08d43 100644
--- a/fluss-rust/.github/workflows/build_and_test_cpp.yml
+++ b/fluss-rust/.github/workflows/build_and_test_cpp.yml
@@ -58,15 +58,7 @@ jobs:
           sudo apt-get install -y -V libarrow-dev
 
       - name: Rust Cache
-        uses: actions/cache@v4
-        with:
-          path: |
-            ~/.cargo/registry
-            ~/.cargo/git
-            target
-          key: cpp-test-${{ runner.os }}-${{ hashFiles('**/Cargo.lock') }}
-          restore-keys: |
-            cpp-test-${{ runner.os }}-
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
 
       - name: Build fluss-test-cluster binary
         run: cargo build -p fluss-test-cluster
diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index 5eec8c39ce..c843fec674 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -61,15 +61,7 @@ jobs:
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
 
       - name: Rust Cache
-        uses: actions/cache@v4
-        with:
-          path: |
-            ~/.cargo/registry
-            ~/.cargo/git
-            target
-          key: python-test-${{ runner.os }}-${{ matrix.python }}-${{ hashFiles('**/Cargo.lock') }}
-          restore-keys: |
-            python-test-${{ runner.os }}-${{ matrix.python }}-
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
 
       - name: Build fluss-test-cluster binary
         run: cargo build -p fluss-test-cluster
@@ -78,11 +70,11 @@ jobs:
         working-directory: bindings/python
         run: |
           uv sync --extra dev --no-install-project
-          uv run maturin develop
+          uv run --no-sync maturin develop --uv
 
       - name: Run tests (parallel)
         working-directory: bindings/python
-        run: uv run pytest test/ -v -n auto
+        run: uv run --no-sync pytest test/ -v -n auto
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
index 1c5a99ab3f..a4fe12b6c2 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -59,15 +59,7 @@ jobs:
           fi
 
       - name: Rust Cache
-        uses: actions/cache@v4
-        with:
-          path: |
-            ~/.cargo/registry
-            ~/.cargo/git
-            target
-          key: rust-${{ runner.os }}-${{ hashFiles('**/Cargo.lock') }}
-          restore-keys: |
-            rust-${{ runner.os }}-
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
 
       - name: Build
         run: cargo build --workspace --all-targets --exclude fluss_python --exclude fluss-cpp

From e43d35a09c7608936fe8156c4a96484a6bedcfdc Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jared=20Yu=20=28=E4=BD=99=E5=90=AF=E6=AD=A3=29?=
 <qzyu999@gmail.com>
Date: Sun, 12 Apr 2026 23:11:09 -0700
Subject: [PATCH 231/287] feat: Add array data type support for Python (#474)

* feat: add support for Arrow List and LargeList types with Python bindings and tests

* feat: add support for Arrow FixedSizeList arrays

* fix: Fix the error message in columnar_row_get_array_non_list_column_returns_error to match the new error message from get_array()

* chore: Fix the line length error after running cargo fmt

* fix: Remove the as_encoded_bytes to allow it to revert to the default return of None

* fix: Remove the pytest skip for test_append_and_scan_with_fixed_size_array

* feat: Add python_value_to_datum

* feat: Add more null tests

* feat: Add .pyi stubs for DataType, DataTypes

* fix: Remove DataType, DataTypes as they are dead code only used within tests

* perf: Hoist array downcast and type resolution out of loop

* fix: Remove the pytest skip in test_log_table for fixed_size_array

* fix: Add back the pytest.mark.skip and provide a valid reason

* feat: Add FixedSizeList to handle all Arrow list variants defensively

* feat: Add test_append_and_scan_with_large_list_array for LargeList

* docs: Update documentation to indicate Array data type support

* refactor: Drop FixedSizeList/LargeList and use nested ColumnWriter instead of ListBuilder<Box>

* chore: Run formatting

* fix: Remove references to FixedSizeList and LargeList

* refactor: pass nullability to finish_list_array and add test for non-nullable array types

* chore: Formatting

* feat: add as_nullable, not_null, and nullable methods to DataType and primitive type structs

* test: update non-nullable array type test to verify Arrow schema field nullability

* Revert "feat: add as_nullable, not_null, and nullable methods to DataType and primitive type structs"

This reverts commit 60a14d1f33a78adf75a763d39348482e1b7493d5.
---
 fluss-rust/bindings/python/src/table.rs       |  80 ++++++-
 fluss-rust/bindings/python/src/utils.rs       |   4 +
 .../bindings/python/test/test_log_table.py    | 202 ++++++++++++++++-
 .../bindings/python/test/test_schema.py       |  13 ++
 .../crates/fluss/src/row/binary_array.rs      |  69 ++++++
 fluss-rust/crates/fluss/src/row/column.rs     |  83 ++++---
 .../crates/fluss/src/row/column_writer.rs     | 203 ++++++++++++++++--
 .../fluss/tests/integration/kv_table.rs       |   4 +-
 .../fluss/tests/integration/log_table.rs      |  20 +-
 .../docs/user-guide/python/data-types.md      |   3 +
 10 files changed, 612 insertions(+), 69 deletions(-)

diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 8d92aba167..c1b467343e 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -28,8 +28,8 @@ use pyo3::exceptions::{PyIndexError, PyRuntimeError, PyTypeError};
 use pyo3::sync::PyOnceLock;
 use pyo3::types::{
     IntoPyDict, PyBool, PyByteArray, PyBytes, PyDate, PyDateAccess, PyDateTime, PyDelta,
-    PyDeltaAccess, PyDict, PyList, PySequence, PySlice, PyTime, PyTimeAccess, PyTuple, PyType,
-    PyTzInfo,
+    PyDeltaAccess, PyDict, PyList, PySequence, PySlice, PyString, PyTime, PyTimeAccess, PyTuple,
+    PyType, PyTzInfo,
 };
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::collections::HashMap;
@@ -1240,6 +1240,68 @@ fn python_value_to_datum(
         fcore::metadata::DataType::Time(_) => python_time_to_datum(value),
         fcore::metadata::DataType::Timestamp(_) => python_datetime_to_timestamp_ntz(value),
         fcore::metadata::DataType::TimestampLTz(_) => python_datetime_to_timestamp_ltz(value),
+        fcore::metadata::DataType::Array(array_type) => {
+            let element_type = array_type.get_element_type();
+            if value.is_instance_of::<PyString>() {
+                return Err(FlussError::new_err(format!(
+                    "Expected sequence for Array column, got {}",
+                    get_type_name(value)
+                )));
+            }
+            let seq = value.downcast::<PySequence>().map_err(|_| {
+                FlussError::new_err(format!(
+                    "Expected sequence for Array column, got {}",
+                    get_type_name(value)
+                ))
+            })?;
+
+            let len = seq.len()?;
+            let mut writer = fcore::row::binary_array::FlussArrayWriter::new(len, element_type);
+
+            for i in 0..len {
+                let item = seq.get_item(i)?;
+                if item.is_none() {
+                    writer.set_null_at(i);
+                } else {
+                    let val_datum = python_value_to_datum(&item, element_type)?;
+                    match val_datum {
+                        Datum::Null => writer.set_null_at(i),
+                        Datum::Bool(v) => writer.write_boolean(i, v),
+                        Datum::Int8(v) => writer.write_byte(i, v),
+                        Datum::Int16(v) => writer.write_short(i, v),
+                        Datum::Int32(v) => writer.write_int(i, v),
+                        Datum::Int64(v) => writer.write_long(i, v),
+                        Datum::Float32(v) => writer.write_float(i, v.into_inner()),
+                        Datum::Float64(v) => writer.write_double(i, v.into_inner()),
+                        Datum::String(v) => writer.write_string(i, &v),
+                        Datum::Blob(v) => writer.write_binary_bytes(i, v.as_ref()),
+                        Datum::Decimal(v) => {
+                            if let fcore::metadata::DataType::Decimal(dt) = element_type {
+                                writer.write_decimal(i, &v, dt.precision());
+                            }
+                        }
+                        Datum::Date(v) => writer.write_date(i, v),
+                        Datum::Time(v) => writer.write_time(i, v),
+                        Datum::TimestampNtz(v) => {
+                            if let fcore::metadata::DataType::Timestamp(dt) = element_type {
+                                writer.write_timestamp_ntz(i, &v, dt.precision());
+                            }
+                        }
+                        Datum::TimestampLtz(v) => {
+                            if let fcore::metadata::DataType::TimestampLTz(dt) = element_type {
+                                writer.write_timestamp_ltz(i, &v, dt.precision());
+                            }
+                        }
+                        Datum::Array(v) => writer.write_array(i, &v),
+                    }
+                }
+            }
+
+            let array = writer
+                .complete()
+                .map_err(|e| FlussError::from_core_error(&e))?;
+            Ok(Datum::Array(array))
+        }
         _ => Err(FlussError::new_err(format!(
             "Unsupported data type for row-level operations: {data_type}"
         ))),
@@ -1372,6 +1434,20 @@ pub fn datum_to_python_value(
                 .map_err(|e| FlussError::from_core_error(&e))?;
             rust_timestamp_ltz_to_python(py, ts)
         }
+        DataType::Array(array_type) => {
+            let array_data = row
+                .get_array(pos)
+                .map_err(|e| FlussError::from_core_error(&e))?;
+
+            let element_type = array_type.get_element_type();
+            let py_list = pyo3::types::PyList::empty(py);
+
+            for i in 0..array_data.size() {
+                let py_val = datum_to_python_value(py, &array_data, i, element_type)?;
+                py_list.append(py_val)?;
+            }
+            Ok(py_list.into_any().unbind())
+        }
         _ => Err(FlussError::new_err(format!(
             "Unsupported data type for conversion to Python: {data_type}"
         ))),
diff --git a/fluss-rust/bindings/python/src/utils.rs b/fluss-rust/bindings/python/src/utils.rs
index c92f1b9fd9..76b95f7a9f 100644
--- a/fluss-rust/bindings/python/src/utils.rs
+++ b/fluss-rust/bindings/python/src/utils.rs
@@ -95,6 +95,10 @@ impl Utils {
             ArrowDataType::Decimal128(precision, scale) => {
                 DataTypes::decimal(*precision as u32, *scale as u32)
             }
+            ArrowDataType::List(field) => {
+                let element_type = Utils::arrow_type_to_fluss_type(field.data_type())?;
+                DataTypes::array(element_type)
+            }
             _ => {
                 return Err(FlussError::new_err(format!(
                     "Unsupported Arrow data type: {arrow_type:?}"
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
index d5397b7d6b..5708a93cdd 100644
--- a/fluss-rust/bindings/python/test/test_log_table.py
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -24,6 +24,7 @@
 import time
 
 import pyarrow as pa
+import pytest
 
 import fluss
 
@@ -1119,8 +1120,6 @@ def _poll_records(scanner, expected_count, timeout_s=10):
     return collected
 
 
-
-
 def _poll_arrow_ids(scanner, expected_count, timeout_s=10):
     """Poll a batch scanner and extract 'id' column values."""
     all_ids = []
@@ -1131,3 +1130,202 @@ def _poll_arrow_ids(scanner, expected_count, timeout_s=10):
             all_ids.extend(arrow_table.column("id").to_pylist())
     return all_ids
 
+
+async def test_append_and_scan_with_array(connection, admin):
+    """Test appending and scanning with array columns."""
+    table_path = fluss.TablePath("fluss", "py_test_append_and_scan_with_array")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    pa_schema = pa.schema(
+        [
+            pa.field("id", pa.int32()),
+            pa.field("tags", pa.list_(pa.string())),
+            pa.field("scores", pa.list_(pa.int32())),
+        ]
+    )
+    schema = fluss.Schema(pa_schema)
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    append_writer = table.new_append().create_writer()
+
+    # Batch 1: Testing standard lists
+    batch1 = pa.RecordBatch.from_arrays(
+        [
+            pa.array([1, 2], type=pa.int32()),
+            pa.array([["a", "b"], ["c"]], type=pa.list_(pa.string())),
+            pa.array([[10, 20], [30]], type=pa.list_(pa.int32())),
+        ],
+        schema=pa_schema,
+    )
+    append_writer.write_arrow_batch(batch1)
+
+    # Batch 2: null elements inside arrays, null arrays, and empty arrays
+    batch2 = pa.RecordBatch.from_arrays(
+        [
+            pa.array([3, 4, 5, 6], type=pa.int32()),
+            pa.array([["d", None], None, [], [None]], type=pa.list_(pa.string())),
+            pa.array([[40, 50], [60], None, []], type=pa.list_(pa.int32())),
+        ],
+        schema=pa_schema,
+    )
+    append_writer.write_arrow_batch(batch2)
+    await append_writer.flush()
+
+    # Verify via LogScanner (record-by-record)
+    scanner = await table.new_scan().create_log_scanner()
+    scanner.subscribe_buckets({0: fluss.EARLIEST_OFFSET})
+    records = _poll_records(scanner, expected_count=6)
+
+    assert len(records) == 6
+    records.sort(key=lambda r: r.row["id"])
+
+    # Verify Batch 1
+    assert records[0].row["tags"] == ["a", "b"]
+    assert records[0].row["scores"] == [10, 20]
+    assert records[1].row["tags"] == ["c"]
+    assert records[1].row["scores"] == [30]
+
+    # Verify Batch 2
+    assert records[2].row["tags"] == ["d", None]
+    assert records[2].row["scores"] == [40, 50]
+    assert records[3].row["tags"] is None
+    assert records[3].row["scores"] == [60]
+    assert records[4].row["tags"] == []
+    assert records[4].row["scores"] is None
+    assert records[5].row["tags"] == [None]
+    assert records[5].row["scores"] == []
+
+    # Verify via to_arrow (batch-based)
+    scanner2 = await table.new_scan().create_record_batch_log_scanner()
+    scanner2.subscribe_buckets({0: fluss.EARLIEST_OFFSET})
+    result_table = scanner2.to_arrow()
+
+    assert result_table.num_rows == 6
+    assert result_table.column("tags").to_pylist() == [
+        ["a", "b"],
+        ["c"],
+        ["d", None],
+        None,
+        [],
+        [None],
+    ]
+    assert result_table.column("scores").to_pylist() == [
+        [10, 20],
+        [30],
+        [40, 50],
+        [60],
+        None,
+        [],
+    ]
+
+
+
+
+async def test_append_rows_with_array(connection, admin):
+    """Test appending rows with array data as Python lists and scanning."""
+    table_path = fluss.TablePath("fluss", "py_test_append_rows_with_array")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    pa_schema = pa.schema(
+        [
+            pa.field("id", pa.int32()),
+            pa.field("tags", pa.list_(pa.string())),
+            pa.field("scores", pa.list_(pa.int32())),
+        ]
+    )
+    schema = fluss.Schema(pa_schema)
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    append_writer = table.new_append().create_writer()
+
+    # Append rows using dicts with lists
+    append_writer.append({"id": 1, "tags": ["a", "b"], "scores": [10, 20]})
+    append_writer.append({"id": 2, "tags": ["c"], "scores": [30]})
+    # Append a positional (list-form) row: null "tags" array, null element in "scores"
+    append_writer.append([3, None, [40, None, 60]])
+    
+    await append_writer.flush()
+
+    scanner = await table.new_scan().create_log_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+    records = _poll_records(scanner, expected_count=3)
+    assert len(records) == 3
+
+    rows = sorted([r.row for r in records], key=lambda r: r["id"])
+    assert rows[0] == {"id": 1, "tags": ["a", "b"], "scores": [10, 20]}
+    assert rows[1] == {"id": 2, "tags": ["c"], "scores": [30]}
+    # Note: rows[2]["tags"] is None (null array); rows[2]["scores"] is [40, None, 60]
+    assert rows[2]["id"] == 3
+    assert rows[2]["tags"] is None
+    assert rows[2]["scores"] == [40, None, 60]
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_append_rows_with_nested_array(connection, admin):
+    """Test appending rows with nested array data (ARRAY<ARRAY<INT>>) and scanning."""
+    table_path = fluss.TablePath("fluss", "py_test_append_rows_with_nested_array")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    pa_schema = pa.schema([
+        pa.field("id", pa.int32()),
+        pa.field("matrix", pa.list_(pa.list_(pa.int32()))),
+    ])
+    schema = fluss.Schema(pa_schema)
+    await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    append_writer = table.new_append().create_writer()
+
+    # Append nested lists
+    append_writer.append({"id": 1, "matrix": [[1, 2], [3, 4]]})
+    append_writer.append({"id": 2, "matrix": [[], [5], [6, 7, 8]]})
+    append_writer.append({"id": 3, "matrix": None})
+    append_writer.append({"id": 4, "matrix": [[1, None], None, []]})
+    append_writer.append({"id": 5, "matrix": [[None, None]]})
+    
+    await append_writer.flush()
+
+    scanner = await table.new_scan().create_log_scanner()
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+    records = _poll_records(scanner, expected_count=5)
+    assert len(records) == 5
+
+    rows = sorted([r.row for r in records], key=lambda r: r["id"])
+    assert rows[0] == {"id": 1, "matrix": [[1, 2], [3, 4]]}
+    assert rows[1] == {"id": 2, "matrix": [[], [5], [6, 7, 8]]}
+    assert rows[2] == {"id": 3, "matrix": None}
+    assert rows[3] == {"id": 4, "matrix": [[1, None], None, []]}
+    assert rows[4] == {"id": 5, "matrix": [[None, None]]}
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_append_rows_with_invalid_array(connection, admin):
+    """Test that appending invalid data to an array column raises an error."""
+    table_path = fluss.TablePath("fluss", "py_test_append_rows_with_invalid_array")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    pa_schema = pa.schema([
+        pa.field("id", pa.int32()),
+        pa.field("tags", pa.list_(pa.string())),
+    ])
+    schema = fluss.Schema(pa_schema)
+    await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    append_writer = table.new_append().create_writer()
+
+    # Appending a string instead of a list should raise an error
+    with pytest.raises(Exception, match="Expected sequence for Array column"):
+        append_writer.append({"id": 4, "tags": "not_a_list"})
+    
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
diff --git a/fluss-rust/bindings/python/test/test_schema.py b/fluss-rust/bindings/python/test/test_schema.py
index a72d933453..ab2d1ab447 100644
--- a/fluss-rust/bindings/python/test/test_schema.py
+++ b/fluss-rust/bindings/python/test/test_schema.py
@@ -35,3 +35,16 @@ def test_get_primary_keys():
     assert schema_without_pk.get_primary_keys() == []
 
 
+def test_schema_with_array():
+    # Test that a schema can be constructed from a pyarrow schema containing a list
+    fields = pa.schema(
+        [
+            pa.field("id", pa.int32()),
+            pa.field("tags", pa.list_(pa.string())),
+        ]
+    )
+    schema = fluss.Schema(fields)
+    assert schema.get_column_names() == ["id", "tags"]
+    assert schema.get_column_types() == ["int", "array<string>"]
+
+
diff --git a/fluss-rust/crates/fluss/src/row/binary_array.rs b/fluss-rust/crates/fluss/src/row/binary_array.rs
index 9008bc5467..3383a366df 100644
--- a/fluss-rust/crates/fluss/src/row/binary_array.rs
+++ b/fluss-rust/crates/fluss/src/row/binary_array.rs
@@ -621,6 +621,75 @@ impl FlussArrayWriter {
     }
 }
 
+impl crate::row::InternalRow for FlussArray {
+    fn get_field_count(&self) -> usize {
+        self.size()
+    }
+
+    fn is_null_at(&self, pos: usize) -> Result<bool> {
+        Ok(self.is_null_at(pos))
+    }
+
+    fn get_boolean(&self, pos: usize) -> Result<bool> {
+        self.get_boolean(pos)
+    }
+    fn get_byte(&self, pos: usize) -> Result<i8> {
+        self.get_byte(pos)
+    }
+    fn get_short(&self, pos: usize) -> Result<i16> {
+        self.get_short(pos)
+    }
+    fn get_int(&self, pos: usize) -> Result<i32> {
+        self.get_int(pos)
+    }
+    fn get_long(&self, pos: usize) -> Result<i64> {
+        self.get_long(pos)
+    }
+    fn get_float(&self, pos: usize) -> Result<f32> {
+        self.get_float(pos)
+    }
+    fn get_double(&self, pos: usize) -> Result<f64> {
+        self.get_double(pos)
+    }
+
+    fn get_char(&self, pos: usize, _length: usize) -> Result<&str> {
+        self.get_string(pos)
+    }
+
+    fn get_string(&self, pos: usize) -> Result<&str> {
+        self.get_string(pos)
+    }
+
+    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Result<Decimal> {
+        self.get_decimal(pos, precision as u32, scale as u32)
+    }
+
+    fn get_date(&self, pos: usize) -> Result<Date> {
+        self.get_date(pos)
+    }
+    fn get_time(&self, pos: usize) -> Result<Time> {
+        self.get_time(pos)
+    }
+    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> Result<TimestampNtz> {
+        self.get_timestamp_ntz(pos, precision)
+    }
+    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> Result<TimestampLtz> {
+        self.get_timestamp_ltz(pos, precision)
+    }
+
+    fn get_binary(&self, pos: usize, _length: usize) -> Result<&[u8]> {
+        self.get_binary(pos)
+    }
+
+    fn get_bytes(&self, pos: usize) -> Result<&[u8]> {
+        self.get_binary(pos)
+    }
+
+    fn get_array(&self, pos: usize) -> Result<FlussArray> {
+        self.get_array(pos)
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 4a3e708bb6..be5b850d80 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -416,15 +416,17 @@ impl InternalRow for ColumnarRow {
         use crate::row::binary_array::FlussArrayWriter;
 
         let column = self.column(pos)?;
-        let list_array =
-            column
-                .as_any()
-                .downcast_ref::<ListArray>()
-                .ok_or_else(|| IllegalArgument {
-                    message: format!("expected List array at position {pos}"),
-                })?;
+        let values = if let Some(list_arr) = column.as_any().downcast_ref::<ListArray>() {
+            list_arr.value(self.row_id)
+        } else {
+            return Err(IllegalArgument {
+                message: format!(
+                    "expected List array at position {pos}, got {:?}",
+                    column.data_type()
+                ),
+            });
+        };
 
-        let values = list_array.value(self.row_id);
         let element_fluss_type = from_arrow_type(values.data_type())?;
         let mut writer = FlussArrayWriter::new(values.len(), &element_fluss_type);
 
@@ -478,6 +480,39 @@ macro_rules! write_downcast_elements {
     }};
 }
 
+/// Downcast via `downcast_ref` to a List array type, then loop with null checks.
+macro_rules! write_list_elements {
+    ($values:expr, $list_array_type:ty, $len:expr, $element_type:expr, $writer:expr) => {{
+        let arr = $values
+            .as_any()
+            .downcast_ref::<$list_array_type>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!(
+                    "Expected {} for {:?} element",
+                    stringify!($list_array_type),
+                    $element_type
+                ),
+            })?;
+        let nested_element_type = from_arrow_type(&arr.value_type())?;
+        for i in 0..$len {
+            if arr.is_null(i) {
+                $writer.set_null_at(i);
+            } else {
+                let nested_values = arr.value(i);
+                let mut nested_writer =
+                    FlussArrayWriter::new(nested_values.len(), &nested_element_type);
+                write_arrow_values_to_fluss_array(
+                    &*nested_values,
+                    &nested_element_type,
+                    &mut nested_writer,
+                )?;
+                let nested_array = nested_writer.complete()?;
+                $writer.write_array(i, &nested_array);
+            }
+        }
+    }};
+}
+
 /// Converts all elements of an Arrow array into a `FlussArrayWriter`, downcasting
 /// the Arrow array once per call rather than per element.
 fn write_arrow_values_to_fluss_array(
@@ -607,29 +642,15 @@ fn write_arrow_values_to_fluss_array(
             )?;
         }
         DataType::Array(_) => {
-            let list_arr =
-                values
-                    .as_any()
-                    .downcast_ref::<ListArray>()
-                    .ok_or_else(|| IllegalArgument {
-                        message: format!("Expected ListArray for {element_type:?} element"),
-                    })?;
-            let nested_element_type = from_arrow_type(&list_arr.value_type())?;
-            for i in 0..len {
-                if list_arr.is_null(i) {
-                    writer.set_null_at(i);
-                } else {
-                    let nested_values = list_arr.value(i);
-                    let mut nested_writer =
-                        FlussArrayWriter::new(nested_values.len(), &nested_element_type);
-                    write_arrow_values_to_fluss_array(
-                        &*nested_values,
-                        &nested_element_type,
-                        &mut nested_writer,
-                    )?;
-                    let nested_array = nested_writer.complete()?;
-                    writer.write_array(i, &nested_array);
-                }
+            if values.as_any().is::<ListArray>() {
+                write_list_elements!(values, ListArray, len, element_type, writer);
+            } else {
+                return Err(IllegalArgument {
+                    message: format!(
+                        "Expected ListArray for {element_type:?} element, got {:?}",
+                        values.data_type()
+                    ),
+                });
             }
         }
         _ => {
diff --git a/fluss-rust/crates/fluss/src/row/column_writer.rs b/fluss-rust/crates/fluss/src/row/column_writer.rs
index 34dd0f5cc3..fbaa000dbe 100644
--- a/fluss-rust/crates/fluss/src/row/column_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/column_writer.rs
@@ -111,6 +111,11 @@ enum TypedWriter {
         precision: u32,
         builder: TimestampNanosecondBuilder,
     },
+    List {
+        element_writer: Box<ColumnWriter>,
+        offsets: Vec<i32>,
+        validity: Vec<bool>,
+    },
 }
 
 /// Dispatch to the inner builder across all `TypedWriter` variants.
@@ -143,6 +148,7 @@ macro_rules! with_builder {
             TypedWriter::TimestampLtzMillisecond { builder: $b, .. } => $body,
             TypedWriter::TimestampLtzMicrosecond { builder: $b, .. } => $body,
             TypedWriter::TimestampLtzNanosecond { builder: $b, .. } => $body,
+            TypedWriter::List { .. } => panic!("List variant not supported in with_builder!"),
         }
     };
 }
@@ -321,6 +327,26 @@ impl ColumnWriter {
                     }
                 }
             }
+            DataType::Array(array_type) => {
+                let element_type = array_type.get_element_type();
+                let arrow_element_type = match arrow_type {
+                    ArrowDataType::List(field) => field.data_type(),
+                    _ => {
+                        return Err(Error::IllegalArgument {
+                            message: format!(
+                                "Expected List Arrow type for Array, got: {arrow_type:?}"
+                            ),
+                        });
+                    }
+                };
+                let element_writer =
+                    ColumnWriter::create(element_type, arrow_element_type, 0, capacity)?;
+                TypedWriter::List {
+                    element_writer: Box::new(element_writer),
+                    offsets: vec![0],
+                    validity: Vec::with_capacity(capacity),
+                }
+            }
             _ => {
                 return Err(Error::IllegalArgument {
                     message: format!("Unsupported Fluss DataType: {fluss_type:?}"),
@@ -339,41 +365,69 @@ impl ColumnWriter {
     /// directly to the concrete Arrow builder.
     #[inline]
     pub fn write_field(&mut self, row: &dyn InternalRow) -> Result<()> {
-        if self.nullable && row.is_null_at(self.pos)? {
+        self.write_field_at(row, self.pos)
+    }
+
+    /// Read one value from `row` at position `pos` and append it
+    /// directly to the concrete Arrow builder.
+    #[inline]
+    pub fn write_field_at(&mut self, row: &dyn InternalRow, pos: usize) -> Result<()> {
+        if self.nullable && row.is_null_at(pos)? {
             self.append_null();
             return Ok(());
         }
-        self.write_non_null(row)
+        self.write_non_null_at(row, pos)
     }
 
     /// Finish the builder, producing the final Arrow array.
     pub fn finish(&mut self) -> ArrayRef {
-        self.as_builder_mut().finish()
+        match &mut self.inner {
+            TypedWriter::List {
+                element_writer,
+                offsets,
+                validity,
+            } => {
+                let item_nullable = element_writer.nullable;
+                let values = element_writer.finish();
+                let taken_offsets = std::mem::replace(offsets, vec![0]);
+                let taken_validity = std::mem::take(validity);
+                finish_list_array(values, item_nullable, &taken_offsets, &taken_validity)
+            }
+            _ => with_builder!(&mut self.inner, b => (b as &mut dyn ArrayBuilder).finish()),
+        }
     }
 
     /// Clone-finish the builder for size estimation (does not reset the builder).
     pub fn finish_cloned(&self) -> ArrayRef {
-        self.as_builder_ref().finish_cloned()
+        match &self.inner {
+            TypedWriter::List {
+                element_writer,
+                offsets,
+                validity,
+            } => {
+                let item_nullable = element_writer.nullable;
+                let values = element_writer.finish_cloned();
+                finish_list_array(values, item_nullable, offsets, validity)
+            }
+            _ => with_builder!(&self.inner, b => (b as &dyn ArrayBuilder).finish_cloned()),
+        }
     }
 
     fn append_null(&mut self) {
-        with_builder!(&mut self.inner, b => b.append_null());
-    }
-
-    /// Returns a trait-object reference to the inner builder.
-    /// Used for type-agnostic operations (`finish`, `finish_cloned`).
-    fn as_builder_mut(&mut self) -> &mut dyn ArrayBuilder {
-        with_builder!(&mut self.inner, b => b)
-    }
-
-    fn as_builder_ref(&self) -> &dyn ArrayBuilder {
-        with_builder!(&self.inner, b => b)
+        match &mut self.inner {
+            TypedWriter::List {
+                offsets, validity, ..
+            } => {
+                let last = *offsets.last().unwrap_or(&0);
+                offsets.push(last);
+                validity.push(false);
+            }
+            _ => with_builder!(&mut self.inner, b => b.append_null()),
+        }
     }
 
     #[inline]
-    fn write_non_null(&mut self, row: &dyn InternalRow) -> Result<()> {
-        let pos = self.pos;
-
+    fn write_non_null_at(&mut self, row: &dyn InternalRow, pos: usize) -> Result<()> {
         match &mut self.inner {
             TypedWriter::Bool(b) => {
                 b.append_value(row.get_boolean(pos)?);
@@ -550,15 +604,62 @@ impl ColumnWriter {
                 )?);
                 Ok(())
             }
+            TypedWriter::List {
+                element_writer,
+                offsets,
+                validity,
+            } => {
+                let array = row.get_array(pos)?;
+                for i in 0..array.size() {
+                    element_writer.write_field_at(&array, i)?;
+                }
+                let last = *offsets.last().unwrap();
+                offsets.push(
+                    last + i32::try_from(array.size()).map_err(|_| RowConvertError {
+                        message: format!("Array size {} exceeds i32 range", array.size()),
+                    })?,
+                );
+                validity.push(true);
+                Ok(())
+            }
         }
     }
 }
 
+fn finish_list_array(
+    values: ArrayRef,
+    item_nullable: bool,
+    offsets: &[i32],
+    validity: &[bool],
+) -> ArrayRef {
+    use arrow::array::ListArray;
+    use arrow::buffer::{NullBuffer, OffsetBuffer, ScalarBuffer};
+    use arrow::datatypes::{Field, FieldRef};
+    use std::sync::Arc;
+
+    let offsets_buffer = OffsetBuffer::new(ScalarBuffer::from(offsets.to_vec()));
+    let null_buffer = NullBuffer::from(validity.to_vec());
+    let field = Arc::new(Field::new(
+        "item",
+        values.data_type().clone(),
+        item_nullable,
+    ));
+    let field_ref: FieldRef = field;
+
+    Arc::new(ListArray::new(
+        field_ref,
+        offsets_buffer,
+        values,
+        Some(null_buffer),
+    ))
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
     use crate::metadata::DataTypes;
     use crate::record::to_arrow_type;
+    use crate::row::binary_array::FlussArrayWriter;
     use crate::row::{Date, Datum, GenericRow, Time, TimestampLtz, TimestampNtz};
     use arrow::array::*;
     use bigdecimal::BigDecimal;
@@ -760,12 +861,70 @@ mod tests {
         assert_eq!((int_arr.value(0), int_arr.value(1)), (42, 99));
     }
 
+    #[test]
+    fn write_array_type() {
+        let element_type = DataTypes::int();
+        let mut array_writer = FlussArrayWriter::new(3, &element_type);
+        array_writer.write_int(0, 10);
+        array_writer.set_null_at(1);
+        array_writer.write_int(2, 30);
+        let fluss_array = array_writer.complete().unwrap();
+
+        let fluss_type = DataTypes::array(element_type);
+
+        let arr = write_one(&fluss_type, Datum::Array(fluss_array));
+        let list_arr = arr.as_any().downcast_ref::<ListArray>().unwrap();
+        assert_eq!(list_arr.len(), 1);
+        let values = list_arr.value(0);
+        let int_values = values.as_any().downcast_ref::<Int32Array>().unwrap();
+        assert_eq!(int_values.len(), 3);
+        assert_eq!(int_values.value(0), 10);
+        assert!(int_values.is_null(1));
+        assert_eq!(int_values.value(2), 30);
+    }
+
     #[test]
     fn unsupported_type_returns_error() {
-        let fluss_type = DataTypes::array(DataTypes::int());
-        let arrow_type = ArrowDataType::List(arrow_schema::FieldRef::new(
-            arrow_schema::Field::new("item", ArrowDataType::Int32, true),
-        ));
+        // Map is currently unsupported in ColumnWriter
+        let fluss_type = DataTypes::map(DataTypes::int(), DataTypes::string());
+        let arrow_type = ArrowDataType::Boolean; // Any arrow type
         assert!(ColumnWriter::create(&fluss_type, &arrow_type, 0, 4).is_err());
     }
+
+    #[test]
+    fn write_non_nullable_array_type() {
+        // 1. Define an array of non-nullable integers
+        let element_type = DataTypes::int().as_non_nullable();
+        let array_type = DataTypes::array(element_type);
+
+        // 2. Create the writer
+        let mut writer = writer_for(&array_type, 4);
+
+        // (Optional but good practice) Write a dummy row containing an empty array
+        // to ensure the builder processes it without panicking.
+        let array_writer = FlussArrayWriter::new(0, &DataTypes::int().as_non_nullable());
+        let fluss_array = array_writer.complete().unwrap();
+        writer
+            .write_field(&GenericRow::from_data(vec![Datum::Array(fluss_array)]))
+            .unwrap();
+
+        // 3. FINISH the array to get the actual Arrow output
+        let arrow_array = writer.finish();
+
+        // 4. Assert against the actual Arrow schema!
+        let list_array = arrow_array
+            .as_any()
+            .downcast_ref::<ListArray>()
+            .expect("Expected ListArray");
+        let list_field = match list_array.data_type() {
+            ArrowDataType::List(field) => field,
+            _ => panic!("Expected List type"),
+        };
+
+        // This is the true test: Did the Arrow field get marked as NOT NULL?
+        assert!(
+            !list_field.is_nullable(),
+            "Arrow field inside the list should be non-nullable"
+        );
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index b942988512..f35e507bd6 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -632,8 +632,8 @@ mod kv_table_test {
         let col_smallint = 32767i16;
         let col_int = 2147483647i32;
         let col_bigint = 9223372036854775807i64;
-        let col_float = 3.14f32;
-        let col_double = 2.718281828459045f64;
+        let col_float = std::f32::consts::PI;
+        let col_double = std::f64::consts::E;
         let col_char = "hello";
         let col_string = "world of fluss rust client";
         let col_decimal = Decimal::from_unscaled_long(12345, 10, 2).unwrap(); // 123.45
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 330e143674..d10834e87e 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -684,8 +684,8 @@ mod table_test {
         let col_smallint = 32767i16;
         let col_int = 2147483647i32;
         let col_bigint = 9223372036854775807i64;
-        let col_float = 3.14f32;
-        let col_double = 2.718281828459045f64;
+        let col_float = std::f32::consts::PI;
+        let col_double = std::f64::consts::E;
         let col_boolean = true;
         let col_char = "hello";
         let col_string = "world of fluss rust client";
@@ -738,18 +738,18 @@ mod table_test {
         row.set_field(14, col_time_ns);
         row.set_field(15, col_timestamp_s);
         row.set_field(16, col_timestamp_ms);
-        row.set_field(17, col_timestamp_us.clone());
-        row.set_field(18, col_timestamp_ns.clone());
+        row.set_field(17, col_timestamp_us);
+        row.set_field(18, col_timestamp_ns);
         row.set_field(19, col_timestamp_ltz_s);
         row.set_field(20, col_timestamp_ltz_ms);
-        row.set_field(21, col_timestamp_ltz_us.clone());
-        row.set_field(22, col_timestamp_ltz_ns.clone());
+        row.set_field(21, col_timestamp_ltz_us);
+        row.set_field(22, col_timestamp_ltz_ns);
         row.set_field(23, col_bytes.as_slice());
         row.set_field(24, col_binary.as_slice());
-        row.set_field(25, col_timestamp_us_neg.clone());
-        row.set_field(26, col_timestamp_ns_neg.clone());
-        row.set_field(27, col_timestamp_ltz_us_neg.clone());
-        row.set_field(28, col_timestamp_ltz_ns_neg.clone());
+        row.set_field(25, col_timestamp_us_neg);
+        row.set_field(26, col_timestamp_ns_neg);
+        row.set_field(27, col_timestamp_ltz_us_neg);
+        row.set_field(28, col_timestamp_ltz_ns_neg);
 
         append_writer
             .append(&row)
diff --git a/fluss-rust/website/docs/user-guide/python/data-types.md b/fluss-rust/website/docs/user-guide/python/data-types.md
index 6d7e78d16f..c0acb4c7ea 100644
--- a/fluss-rust/website/docs/user-guide/python/data-types.md
+++ b/fluss-rust/website/docs/user-guide/python/data-types.md
@@ -17,6 +17,7 @@ The Python client uses PyArrow types for schema definitions:
 | `pa.timestamp("us")`                            | Timestamp (NTZ)                   | `datetime.datetime` |
 | `pa.timestamp("us", tz="UTC")`                  | TimestampLTZ                      | `datetime.datetime` |
 | `pa.decimal128(precision, scale)`               | Decimal                           | `decimal.Decimal`   |
+| `pa.list_(type)`                                  | Array                             | `list`              |
 
 All Python native types (`date`, `time`, `datetime`, `Decimal`) work when appending rows via dicts.
 
@@ -38,6 +39,8 @@ row = {
     "login_time": time(9, 30, 0),
     "created_at": datetime(2024, 1, 1, 0, 0, 0),
     "nickname": None,  # null value
+    "tags": ["active", "premium"],  # Array of strings
+    "scores": [10, None, 30],       # Array with null values
 }
 handle = writer.append(row)
 ```

From 82d08bc0d0a1f5b9742bb6d99bc6fac8b2764fe3 Mon Sep 17 00:00:00 2001
From: Keith Lee <leekei@apache.org>
Date: Mon, 13 Apr 2026 08:27:09 +0100
Subject: [PATCH 232/287] [ci] Upgrade checkout@v4 to v6 and setup-python@v5 to
 v6 (#491)

* [ci] upgrade checkout@v4 to v6 and setup-python@v5 to v6

Migrate away from deprecated Node.js 20 GitHub Actions before the
June 2026 forced migration deadline.

Closes #490

* [ci] remove unrelated audit.yml from this PR
---
 fluss-rust/.github/workflows/build_and_test_cpp.yml         | 2 +-
 fluss-rust/.github/workflows/build_and_test_python.yml      | 4 ++--
 fluss-rust/.github/workflows/build_and_test_rust.yml        | 4 ++--
 .../.github/workflows/check_license_and_formatting.yml      | 2 +-
 fluss-rust/.github/workflows/release_python.yml             | 6 +++---
 fluss-rust/.github/workflows/release_rust.yml               | 2 +-
 6 files changed, 10 insertions(+), 10 deletions(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
index a091d08d43..7d30b8f7c5 100644
--- a/fluss-rust/.github/workflows/build_and_test_cpp.yml
+++ b/fluss-rust/.github/workflows/build_and_test_cpp.yml
@@ -44,7 +44,7 @@ jobs:
     env:
       FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/target/debug/fluss-test-cluster
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v6
 
       - name: Install protoc
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index c843fec674..69202c03e6 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -47,10 +47,10 @@ jobs:
     env:
       FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/target/debug/fluss-test-cluster
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v6
 
       - name: Set up Python
-        uses: actions/setup-python@v5
+        uses: actions/setup-python@v6
         with:
           python-version: ${{ matrix.python }}
 
diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
index a4fe12b6c2..9b763b3eb5 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -48,7 +48,7 @@ jobs:
           - ubuntu-latest
           - macos-latest
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v6
 
       - name: Install protoc
         run: |
@@ -75,7 +75,7 @@ jobs:
     timeout-minutes: 60
     runs-on: ubuntu-latest
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v6
 
       - name: Install protoc
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
diff --git a/fluss-rust/.github/workflows/check_license_and_formatting.yml b/fluss-rust/.github/workflows/check_license_and_formatting.yml
index 1b83b749e8..1108c20ad5 100644
--- a/fluss-rust/.github/workflows/check_license_and_formatting.yml
+++ b/fluss-rust/.github/workflows/check_license_and_formatting.yml
@@ -37,7 +37,7 @@ jobs:
   check-license-and-formatting:
     runs-on: ubuntu-latest
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v6
 
       - name: Check License Header
         uses: apache/skywalking-eyes/header@v0.6.0
diff --git a/fluss-rust/.github/workflows/release_python.yml b/fluss-rust/.github/workflows/release_python.yml
index d61213e506..9aaaf6f348 100644
--- a/fluss-rust/.github/workflows/release_python.yml
+++ b/fluss-rust/.github/workflows/release_python.yml
@@ -39,14 +39,14 @@ jobs:
   version-check:
     runs-on: ubuntu-latest
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v6
       - uses: ./.github/actions/verify-tag-version
 
   sdist:
     runs-on: ubuntu-latest
     needs: [version-check]
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v6
 
       - name: Install protoc
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
@@ -75,7 +75,7 @@ jobs:
           - { os: ubuntu-latest, target: "x86_64" }
           - { os: ubuntu-latest, target: "aarch64", manylinux: "manylinux_2_28" }
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v6
 
       - name: Install protoc (Linux)
         if: runner.os == 'Linux'
diff --git a/fluss-rust/.github/workflows/release_rust.yml b/fluss-rust/.github/workflows/release_rust.yml
index 7ff7c0b72d..946b2b26a8 100644
--- a/fluss-rust/.github/workflows/release_rust.yml
+++ b/fluss-rust/.github/workflows/release_rust.yml
@@ -34,7 +34,7 @@ jobs:
     permissions:
       contents: read
     steps:
-      - uses: actions/checkout@v4
+      - uses: actions/checkout@v6
 
       - uses: ./.github/actions/verify-tag-version
 

From b01930f0ca8fa5d1fb73dc98da1acb313b0fac1f Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 13 Apr 2026 20:04:38 +0100
Subject: [PATCH 233/287] feat: Byte-sized cap instead of hard one for
 ArrowWriter (#443)

* [TASK-431] Byte-sized cap instead of hard one for ArrowWriter

* Address feedback

* rebase fix

* Remove unused as_builder_mut

* Remove unused finish_cloned

---------

Co-authored-by: Keith Lee <leekei@apache.org>
---
 .../src/client/table/log_fetch_buffer.rs      |   5 +-
 .../crates/fluss/src/client/table/scanner.rs  |   5 +-
 .../fluss/src/client/write/accumulator.rs     |  52 +++--
 .../crates/fluss/src/client/write/batch.rs    | 206 +++++++++++++++++-
 .../arrow_compression_ratio_estimator.rs      | 105 +++++++++
 .../crates/fluss/src/compression/mod.rs       |   2 +
 fluss-rust/crates/fluss/src/record/arrow.rs   | 200 +++++++++++++++--
 .../crates/fluss/src/row/column_writer.rs     |  84 ++++++-
 8 files changed, 614 insertions(+), 45 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/compression/arrow_compression_ratio_estimator.rs

diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index edab91d5cf..0dff4e8749 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -831,7 +831,8 @@ mod tests {
     use super::*;
     use crate::client::WriteRecord;
     use crate::compression::{
-        ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+        ArrowCompressionInfo, ArrowCompressionRatioEstimator, ArrowCompressionType,
+        DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
     };
     use crate::metadata::{DataField, DataTypes, PhysicalTablePath, RowType, TablePath};
     use crate::record::{MemoryLogRecordsArrowBuilder, ReadContext, to_arrow_schema};
@@ -908,6 +909,8 @@ mod tests {
                 compression_type: ArrowCompressionType::None,
                 compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
             },
+            usize::MAX,
+            Arc::new(ArrowCompressionRatioEstimator::default()),
         )?;
 
         let mut row = GenericRow::new(2);
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index ab7d441c0e..00c5b23859 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -1700,7 +1700,8 @@ mod tests {
     use crate::client::WriteRecord;
     use crate::client::metadata::Metadata;
     use crate::compression::{
-        ArrowCompressionInfo, ArrowCompressionType, DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+        ArrowCompressionInfo, ArrowCompressionRatioEstimator, ArrowCompressionType,
+        DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
     };
     use crate::metadata::{DataTypes, PhysicalTablePath, Schema, TableInfo, TablePath};
     use crate::record::MemoryLogRecordsArrowBuilder;
@@ -1717,6 +1718,8 @@ mod tests {
                 compression_type: ArrowCompressionType::None,
                 compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
             },
+            usize::MAX,
+            Arc::new(ArrowCompressionRatioEstimator::default()),
         )?;
         let physical_table_path = Arc::new(PhysicalTablePath::of(table_path));
         let row = GenericRow {
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 53d004012a..019d3b05d4 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -21,6 +21,7 @@ use crate::client::write::batch::WriteBatch::{ArrowLog, Kv};
 use crate::client::write::batch::{ArrowLogWriteBatch, KvWriteBatch, WriteBatch};
 use crate::client::{LogWriteRecord, Record, ResultHandle, WriteRecord};
 use crate::cluster::{BucketLocation, Cluster, ServerNode};
+use crate::compression::ArrowCompressionRatioEstimator;
 use crate::config::Config;
 use crate::error::{Error, Result};
 use crate::metadata::{PhysicalTablePath, TableBucket};
@@ -235,6 +236,7 @@ impl RecordAccumulator {
         dq: &mut VecDeque<WriteBatch>,
         permit: MemoryPermit,
         alloc_size: usize,
+        compression_ratio_estimator: Arc<ArrowCompressionRatioEstimator>,
     ) -> Result<RecordAppendResult> {
         let physical_table_path = &record.physical_table_path;
         let table_path = physical_table_path.get_table_path();
@@ -253,6 +255,8 @@ impl RecordAccumulator {
                 row_type,
                 current_time_ms(),
                 matches!(&record.record, Record::Log(LogWriteRecord::RecordBatch(_))),
+                alloc_size,
+                compression_ratio_estimator,
             )?),
             Record::Kv(kv_record) => Kv(KvWriteBatch::new(
                 self.batch_id.fetch_add(1, Ordering::Relaxed),
@@ -303,22 +307,29 @@ impl RecordAccumulator {
             None
         };
 
-        let dq = {
-            let mut binding = self
-                .write_batches
-                .entry(Arc::clone(physical_table_path))
-                .or_insert_with(|| BucketAndWriteBatches {
-                    table_id: table_info.table_id,
-                    is_partitioned_table,
-                    partition_id,
-                    batches: Default::default(),
-                });
+        let (dq, compression_ratio_estimator) = {
+            let mut binding =
+                self.write_batches
+                    .entry(Arc::clone(physical_table_path))
+                    .or_insert_with(|| BucketAndWriteBatches {
+                        table_id: table_info.table_id,
+                        is_partitioned_table,
+                        partition_id,
+                        batches: Default::default(),
+                        compression_ratio_estimator: Arc::new(
+                            ArrowCompressionRatioEstimator::default(),
+                        ),
+                    });
             let bucket_and_batches = binding.value_mut();
-            bucket_and_batches
+            let dq = bucket_and_batches
                 .batches
                 .entry(bucket_id)
                 .or_insert_with(|| Arc::new(Mutex::new(VecDeque::new())))
-                .clone()
+                .clone();
+            (
+                dq,
+                Arc::clone(&bucket_and_batches.compression_ratio_estimator),
+            )
         };
 
         let mut dq_guard = dq.lock();
@@ -336,6 +347,11 @@ impl RecordAccumulator {
         // producer holds dq + blocks on memory, while sender needs dq to drain.
         drop(dq_guard);
 
+        // TODO: Implement DynamicWriteBatchSizeEstimator matching Java's
+        // client.writer.dynamic-batch-size-enabled. Adjusts the batch size target
+        // per table based on observed actual batch sizes (grow 10% when >80% full,
+        // shrink 5% when <50% full, clamped to [2*pageSize, maxBatchSize]).
+        // This would improve memory limiter utilization for tables with small rows.
         let batch_size = self.config.writer_batch_size as usize;
         let record_size = record.estimated_record_size();
         let alloc_size = batch_size.max(record_size);
@@ -348,7 +364,14 @@ impl RecordAccumulator {
             return Ok(append_result); // permit drops here, memory released
         }
 
-        self.append_new_batch(cluster, record, &mut dq_guard, permit, alloc_size)
+        self.append_new_batch(
+            cluster,
+            record,
+            &mut dq_guard,
+            permit,
+            alloc_size,
+            compression_ratio_estimator,
+        )
     }
 
     pub fn ready(&self, cluster: &Arc<Cluster>) -> Result<ReadyCheckResult> {
@@ -767,6 +790,7 @@ impl RecordAccumulator {
                 is_partitioned_table,
                 partition_id,
                 batches: Default::default(),
+                compression_ratio_estimator: Arc::new(ArrowCompressionRatioEstimator::default()),
             });
         let bucket_and_batches = binding.value_mut();
         bucket_and_batches
@@ -912,6 +936,8 @@ struct BucketAndWriteBatches {
     is_partitioned_table: bool,
     partition_id: Option<PartitionId>,
     batches: HashMap<BucketId, Arc<Mutex<VecDeque<WriteBatch>>>>,
+    /// Compression ratio estimator shared across Arrow log batches for this table.
+    compression_ratio_estimator: Arc<ArrowCompressionRatioEstimator>,
 }
 
 pub struct RecordAppendResult {
diff --git a/fluss-rust/crates/fluss/src/client/write/batch.rs b/fluss-rust/crates/fluss/src/client/write/batch.rs
index e3cd2ca46d..fd70cb9715 100644
--- a/fluss-rust/crates/fluss/src/client/write/batch.rs
+++ b/fluss-rust/crates/fluss/src/client/write/batch.rs
@@ -17,7 +17,7 @@
 
 use crate::client::broadcast::{BatchWriteResult, BroadcastOnce};
 use crate::client::{Record, ResultHandle, WriteRecord};
-use crate::compression::ArrowCompressionInfo;
+use crate::compression::{ArrowCompressionInfo, ArrowCompressionRatioEstimator};
 use crate::error::{Error, Result};
 use crate::metadata::{KvFormat, PhysicalTablePath, RowType};
 use crate::record::MemoryLogRecordsArrowBuilder;
@@ -230,6 +230,8 @@ impl ArrowLogWriteBatch {
         row_type: &RowType,
         create_ms: i64,
         to_append_record_batch: bool,
+        write_limit: usize,
+        compression_ratio_estimator: Arc<ArrowCompressionRatioEstimator>,
     ) -> Result<Self> {
         let base = InnerWriteBatch::new(batch_id, physical_table_path, create_ms);
         Ok(Self {
@@ -239,6 +241,8 @@ impl ArrowLogWriteBatch {
                 row_type,
                 to_append_record_batch,
                 arrow_compression_info,
+                write_limit,
+                compression_ratio_estimator,
             )?,
             built_records: None,
         })
@@ -464,6 +468,8 @@ mod tests {
                 &row_type,
                 0,
                 false,
+                2 * 1024 * 1024,
+                Arc::new(ArrowCompressionRatioEstimator::default()),
             )
             .unwrap();
 
@@ -487,7 +493,7 @@ mod tests {
             let built_data = batch.build().unwrap();
             let actual_size = built_data.len();
 
-            let diff = actual_size - estimated_size;
+            let diff = actual_size.abs_diff(estimated_size);
             let threshold = actual_size / 10; // 10% tolerance
             assert!(
                 diff <= threshold,
@@ -508,6 +514,8 @@ mod tests {
                 &row_type,
                 0,
                 true,
+                2 * 1024 * 1024,
+                Arc::new(ArrowCompressionRatioEstimator::default()),
             )
             .unwrap();
 
@@ -538,7 +546,7 @@ mod tests {
             let built_data = batch.build().unwrap();
             let actual_size = built_data.len();
 
-            let diff = actual_size - estimated_size;
+            let diff = actual_size.abs_diff(estimated_size);
             let threshold = actual_size / 10; // 10% tolerance
             assert!(
                 diff <= threshold,
@@ -587,4 +595,196 @@ mod tests {
             "estimated size {estimated_size} is not equal to actual size"
         );
     }
+
+    /// Verifies byte-size-based fullness:
+    /// 1. Actual built size stays within the configured limit (no compression).
+    /// 2. Old 256-record cap is gone — large batches accept >256 small rows.
+    /// 3. Compression feedback loop: shared estimator updates after build(),
+    ///    second batch with same estimator accepts more records.
+    #[test]
+    fn test_arrow_batch_byte_size_fullness() {
+        use crate::client::WriteRecord;
+        use crate::compression::{
+            ArrowCompressionInfo, ArrowCompressionRatioEstimator, ArrowCompressionType,
+            DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+        };
+        use crate::metadata::{DataField, DataTypes, RowType};
+        use crate::row::GenericRow;
+        use std::sync::Arc;
+
+        let row_type = RowType::new(vec![
+            DataField::new("id".to_string(), DataTypes::int(), None),
+            DataField::new("name".to_string(), DataTypes::string(), None),
+        ]);
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path)));
+
+        // --- Part 1: actual built size stays within limit (uncompressed) ---
+        let write_limit: usize = 16 * 1024;
+        let mut batch = ArrowLogWriteBatch::new(
+            1,
+            Arc::clone(&physical_table_path),
+            1,
+            ArrowCompressionInfo {
+                compression_type: ArrowCompressionType::None,
+                compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+            },
+            &row_type,
+            0,
+            false,
+            write_limit,
+            Arc::new(ArrowCompressionRatioEstimator::default()),
+        )
+        .unwrap();
+
+        let mut appended = 0;
+        for i in 0..100_000 {
+            let mut row = GenericRow::new(2);
+            row.set_field(0, i);
+            row.set_field(1, "hello_world");
+            let record = WriteRecord::for_append(
+                Arc::clone(&table_info),
+                Arc::clone(&physical_table_path),
+                1,
+                &row,
+            );
+            match batch.try_append(&record).unwrap() {
+                Some(_) => appended += 1,
+                None => break,
+            }
+        }
+
+        assert!(
+            appended > 0 && appended < 100_000,
+            "batch should have filled, appended: {appended}"
+        );
+        let built = batch.build().unwrap();
+        assert!(
+            built.len() <= write_limit * 120 / 100,
+            "actual size {} exceeds write_limit {write_limit} by more than 20%",
+            built.len()
+        );
+
+        // --- Part 2: old 256-record cap is gone ---
+        let row_type_small = RowType::new(vec![DataField::new(
+            "id".to_string(),
+            DataTypes::int(),
+            None,
+        )]);
+        let mut batch = ArrowLogWriteBatch::new(
+            2,
+            Arc::clone(&physical_table_path),
+            1,
+            ArrowCompressionInfo {
+                compression_type: ArrowCompressionType::None,
+                compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+            },
+            &row_type_small,
+            0,
+            false,
+            2 * 1024 * 1024,
+            Arc::new(ArrowCompressionRatioEstimator::default()),
+        )
+        .unwrap();
+
+        let mut appended = 0;
+        for i in 0..1000 {
+            let mut row = GenericRow::new(1);
+            row.set_field(0, i);
+            let record = WriteRecord::for_append(
+                Arc::clone(&table_info),
+                Arc::clone(&physical_table_path),
+                1,
+                &row,
+            );
+            match batch.try_append(&record).unwrap() {
+                Some(_) => appended += 1,
+                None => break,
+            }
+        }
+        assert_eq!(appended, 1000, "2MB batch should fit 1000 tiny rows");
+
+        // --- Part 3: compression feedback loop ---
+        let estimator = Arc::new(ArrowCompressionRatioEstimator::default());
+        assert_eq!(estimator.estimation(), 1.0);
+
+        let write_limit = 64 * 1024;
+        let compression = ArrowCompressionInfo {
+            compression_type: ArrowCompressionType::Zstd,
+            compression_level: 3,
+        };
+
+        // First batch: fill and build with ZSTD.
+        let mut batch1 = ArrowLogWriteBatch::new(
+            3,
+            Arc::clone(&physical_table_path),
+            1,
+            compression.clone(),
+            &row_type,
+            0,
+            false,
+            write_limit,
+            Arc::clone(&estimator),
+        )
+        .unwrap();
+
+        for i in 0..500 {
+            let mut row = GenericRow::new(2);
+            row.set_field(0, i);
+            row.set_field(1, "aaaaaaaaaaaaaaaa");
+            let record = WriteRecord::for_append(
+                Arc::clone(&table_info),
+                Arc::clone(&physical_table_path),
+                1,
+                &row,
+            );
+            if batch1.try_append(&record).unwrap().is_none() {
+                break;
+            }
+        }
+        batch1.build().unwrap();
+
+        // Estimator should have decreased (ZSTD compresses repeated data well).
+        assert!(
+            estimator.estimation() < 1.0,
+            "ratio should decrease after compressed build, got: {}",
+            estimator.estimation()
+        );
+
+        // Second batch: same estimator → knows data compresses well → accepts more rows.
+        let mut batch2 = ArrowLogWriteBatch::new(
+            4,
+            Arc::clone(&physical_table_path),
+            1,
+            compression,
+            &row_type,
+            0,
+            false,
+            write_limit,
+            Arc::clone(&estimator),
+        )
+        .unwrap();
+
+        let mut appended2 = 0;
+        for i in 0..10_000 {
+            let mut row = GenericRow::new(2);
+            row.set_field(0, i);
+            row.set_field(1, "aaaaaaaaaaaaaaaa");
+            let record = WriteRecord::for_append(
+                Arc::clone(&table_info),
+                Arc::clone(&physical_table_path),
+                1,
+                &row,
+            );
+            match batch2.try_append(&record).unwrap() {
+                Some(_) => appended2 += 1,
+                None => break,
+            }
+        }
+        assert!(
+            appended2 > 500,
+            "second batch should accept more records with updated ratio, got: {appended2}"
+        );
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/compression/arrow_compression_ratio_estimator.rs b/fluss-rust/crates/fluss/src/compression/arrow_compression_ratio_estimator.rs
new file mode 100644
index 0000000000..08b8048aa4
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/compression/arrow_compression_ratio_estimator.rs
@@ -0,0 +1,105 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use std::sync::atomic::{AtomicU32, Ordering};
+
+/// Adaptive estimator for Arrow compression ratios.
+///
+/// Tracks the ratio between compressed and uncompressed Arrow body sizes.
+/// The estimate adjusts asymmetrically: it increases quickly when compression
+/// worsens (to avoid underestimating batch sizes) and decreases slowly when
+/// compression improves (conservative).
+///
+/// Thread-safe: the ratio is an f32 stored as u32 bits in an atomic. An update is a
+/// plain load followed by a store, so racing updates are last-writer-wins, the same
+/// as the `volatile float` in Java's `ArrowCompressionRatioEstimator`.
+pub struct ArrowCompressionRatioEstimator {
+    /// Stored as `f32::to_bits()` for atomic access.
+    ratio_bits: AtomicU32,
+}
+
+const COMPRESSION_RATIO_IMPROVING_STEP: f32 = 0.005;
+const COMPRESSION_RATIO_DETERIORATE_STEP: f32 = 0.05;
+const DEFAULT_COMPRESSION_RATIO: f32 = 1.0;
+
+impl ArrowCompressionRatioEstimator {
+    pub fn new() -> Self {
+        Self {
+            ratio_bits: AtomicU32::new(DEFAULT_COMPRESSION_RATIO.to_bits()),
+        }
+    }
+
+    pub fn estimation(&self) -> f32 {
+        f32::from_bits(self.ratio_bits.load(Ordering::Relaxed))
+    }
+
+    pub fn update_estimation(&self, observed_ratio: f32) {
+        let current = self.estimation();
+        let new_ratio = if observed_ratio > current {
+            (current + COMPRESSION_RATIO_DETERIORATE_STEP).max(observed_ratio)
+        } else if observed_ratio < current {
+            (current - COMPRESSION_RATIO_IMPROVING_STEP).max(observed_ratio)
+        } else {
+            return;
+        };
+        self.ratio_bits
+            .store(new_ratio.to_bits(), Ordering::Relaxed);
+    }
+}
+
+impl Default for ArrowCompressionRatioEstimator {
+    fn default() -> Self {
+        Self::new()
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    #[test]
+    fn test_default_ratio_is_one() {
+        let e = ArrowCompressionRatioEstimator::new();
+        assert_eq!(e.estimation(), 1.0);
+    }
+
+    #[test]
+    fn test_deterioration_jumps_quickly() {
+        let e = ArrowCompressionRatioEstimator::new();
+        // Observed ratio worse than estimate: jump by at least DETERIORATE_STEP
+        e.update_estimation(1.1);
+        assert!(e.estimation() >= 1.05);
+    }
+
+    #[test]
+    fn test_improvement_moves_slowly() {
+        let e = ArrowCompressionRatioEstimator::new();
+        // Observed ratio better than estimate: move down by at most IMPROVING_STEP
+        e.update_estimation(0.5);
+        assert!((e.estimation() - 0.995).abs() < 0.001);
+    }
+
+    #[test]
+    fn test_converges_to_observed() {
+        let e = ArrowCompressionRatioEstimator::new();
+        // After many updates with same ratio, should converge
+        for _ in 0..1000 {
+            e.update_estimation(0.7);
+        }
+        assert!((e.estimation() - 0.7).abs() < 0.01);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/compression/mod.rs b/fluss-rust/crates/fluss/src/compression/mod.rs
index 2b86dba77d..29923c0a84 100644
--- a/fluss-rust/crates/fluss/src/compression/mod.rs
+++ b/fluss-rust/crates/fluss/src/compression/mod.rs
@@ -16,5 +16,7 @@
 // under the License.
 
 mod arrow_compression;
+mod arrow_compression_ratio_estimator;
 
 pub use arrow_compression::*;
+pub use arrow_compression_ratio_estimator::*;
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 7dd745baa9..d03f1454d2 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -16,17 +16,20 @@
 // under the License.
 
 use crate::client::{LogWriteRecord, Record, WriteRecord};
-use crate::compression::ArrowCompressionInfo;
+use crate::compression::{
+    ArrowCompressionInfo, ArrowCompressionRatioEstimator, ArrowCompressionType,
+};
 use crate::error::{Error, Result};
 use crate::metadata::{DataType, RowType};
 use crate::record::{ChangeType, ScanRecord};
-use crate::row::column_writer::ColumnWriter;
+use crate::row::column_writer::{ColumnWriter, round_up_to_8};
 use crate::row::{ColumnarRow, InternalRow};
 use arrow::array::{ArrayBuilder, ArrayRef};
 use arrow::{
     array::RecordBatch,
     buffer::Buffer,
     ipc::{
+        CompressionType,
         reader::{StreamReader, read_record_batch},
         root_as_message,
         writer::StreamWriter,
@@ -40,6 +43,7 @@ use byteorder::{ByteOrder, LittleEndian};
 use bytes::Bytes;
 use crc32c::crc32c;
 use std::{
+    cell::Cell,
     collections::HashMap,
     fs::File,
     io::{Cursor, Read, Seek, SeekFrom, Write},
@@ -144,8 +148,13 @@ pub const NO_BATCH_SEQUENCE: i32 = -1;
 
 pub const BUILDER_DEFAULT_OFFSET: i64 = 0;
 
-// TODO: Switch to byte-size-based is_full() like Java's ArrowWriter instead of a hard record cap.
-pub const DEFAULT_MAX_RECORD: i32 = 256;
+/// Initial capacity for Arrow column vectors (pre-allocation hint, not a record cap).
+/// Matching Java's `ArrowWriter.INITIAL_CAPACITY`.
+const INITIAL_ROW_CAPACITY: usize = 1024;
+
+/// Fraction of the allocated buffer used as the effective write limit.
+/// Matching Java's `ArrowWriter.BUFFER_USAGE_RATIO`.
+const BUFFER_USAGE_RATIO: f32 = 0.95;
 
 pub struct MemoryLogRecordsArrowBuilder {
     base_log_offset: i64,
@@ -156,9 +165,25 @@ pub struct MemoryLogRecordsArrowBuilder {
     arrow_record_batch_builder: Box<dyn ArrowRecordBatchInnerBuilder>,
     is_closed: bool,
     arrow_compression_info: ArrowCompressionInfo,
+    /// Effective write limit in bytes (after applying BUFFER_USAGE_RATIO).
+    write_limit: usize,
+    /// Pre-computed Arrow IPC overhead (metadata + body framing) for this schema.
+    /// Constant per schema+compression combination.
+    ipc_overhead: usize,
+    /// Estimated record count at which the next byte-size check should occur.
+    /// -1 means "unknown — check on the next append". Updated dynamically to
+    /// skip expensive `estimated_size_in_bytes()` calls on every append.
+    /// Matching Java's `ArrowWriter.estimatedMaxRecordsCount`.
+    estimated_max_records_count: Cell<i32>,
+    /// Compression ratio estimator shared across batches for the same table.
+    compression_ratio_estimator: Arc<ArrowCompressionRatioEstimator>,
+    /// Snapshot of the compression ratio at batch creation time.
+    /// Matching Java's `ArrowWriter.estimatedCompressionRatio` which is
+    /// cached per batch and only refreshed on `reset()`.
+    estimated_compression_ratio: f32,
 }
 
-pub trait ArrowRecordBatchInnerBuilder: Send + Sync {
+pub trait ArrowRecordBatchInnerBuilder: Send {
     fn build_arrow_record_batch(&mut self) -> Result<Arc<RecordBatch>>;
 
     fn append(&mut self, row: &dyn InternalRow) -> Result<bool>;
@@ -229,7 +254,7 @@ pub struct RowAppendRecordBatchBuilder {
 
 impl RowAppendRecordBatchBuilder {
     pub fn new(row_type: &RowType) -> Result<Self> {
-        let capacity = DEFAULT_MAX_RECORD as usize;
+        let capacity = INITIAL_ROW_CAPACITY;
         let schema_ref = to_arrow_schema(row_type)?;
         let writers: Result<Vec<_>> = row_type
             .fields()
@@ -310,26 +335,34 @@ impl ArrowRecordBatchInnerBuilder for RowAppendRecordBatchBuilder {
     }
 
     fn is_full(&self) -> bool {
-        self.records_count() >= DEFAULT_MAX_RECORD
+        // Size-based fullness is handled by MemoryLogRecordsArrowBuilder,
+        // which accounts for metadata length and compression ratio.
+        false
     }
 
     fn estimated_size_in_bytes(&self) -> usize {
-        // Returns the uncompressed Arrow array memory size (same as Java's arrowWriter.estimatedSizeInBytes()).
-        // Note: This is the size before compression. After build(), the actual size may be smaller
-        // if compression is enabled.
-        self.column_writers
-            .iter()
-            .map(|writer| writer.finish_cloned().get_array_memory_size())
-            .sum()
+        // Returns the uncompressed Arrow IPC body size by reading buffer lengths
+        // directly from the builders — O(num_columns), zero allocation.
+        // Analogous to Java's `ArrowUtils.estimateArrowBodyLength()`.
+        // Java reads exact IPC buffer sizes from vectors; we read builder
+        // buffer lengths. The IPC framing overhead is accounted for
+        // separately by `ipc_overhead`.
+        self.column_writers.iter().map(|w| w.buffer_size()).sum()
     }
 }
 
+// TODO: Pool and reuse MemoryLogRecordsArrowBuilder instances per table/schema like
+// Java's ArrowWriterPool. Reused writers can seed `estimated_max_records_count` from
+// the previous batch (recordsCount / 2) for a warm start, avoiding the first-record
+// size check on every new batch.
 impl MemoryLogRecordsArrowBuilder {
     pub fn new(
         schema_id: i32,
         row_type: &RowType,
         to_append_record_batch: bool,
         arrow_compression_info: ArrowCompressionInfo,
+        write_limit: usize,
+        compression_ratio_estimator: Arc<ArrowCompressionRatioEstimator>,
     ) -> Result<Self> {
         let arrow_batch_builder: Box<dyn ArrowRecordBatchInnerBuilder> = {
             if to_append_record_batch {
@@ -338,6 +371,11 @@ impl MemoryLogRecordsArrowBuilder {
                 Box::new(RowAppendRecordBatchBuilder::new(row_type)?)
             }
         };
+        let schema = to_arrow_schema(row_type)?;
+        let ipc_overhead =
+            estimate_arrow_ipc_overhead(&schema, arrow_compression_info.get_compression_type())?;
+        let effective_limit = (write_limit as f32 * BUFFER_USAGE_RATIO) as usize;
+        let estimated_compression_ratio = compression_ratio_estimator.estimation();
         Ok(MemoryLogRecordsArrowBuilder {
             base_log_offset: BUILDER_DEFAULT_OFFSET,
             schema_id,
@@ -347,6 +385,11 @@ impl MemoryLogRecordsArrowBuilder {
             is_closed: false,
             arrow_record_batch_builder: arrow_batch_builder,
             arrow_compression_info,
+            write_limit: effective_limit,
+            ipc_overhead,
+            estimated_max_records_count: Cell::new(-1),
+            compression_ratio_estimator,
+            estimated_compression_ratio,
         })
     }
 
@@ -367,8 +410,50 @@ impl MemoryLogRecordsArrowBuilder {
         // todo: consider write other change type
     }
 
+    /// Check if the builder is full based on estimated serialized size.
+    ///
+    /// Uses a threshold-based optimization to skip expensive size checks:
+    /// only computes the actual estimated size when the record count reaches
+    /// the predicted threshold. Matching Java's `ArrowWriter.isFull()`.
     pub fn is_full(&self) -> bool {
-        self.arrow_record_batch_builder.records_count() >= DEFAULT_MAX_RECORD
+        // Delegate to inner builder first (e.g. PrebuiltRecordBatchBuilder
+        // is always full after one batch, regardless of size).
+        if self.arrow_record_batch_builder.is_full() {
+            return true;
+        }
+        let records_count = self.arrow_record_batch_builder.records_count();
+        let threshold = self.estimated_max_records_count.get();
+        if records_count > 0 && records_count >= threshold {
+            let body_size = self.arrow_record_batch_builder.estimated_size_in_bytes();
+            let estimated_body = self.estimated_compressed_size(body_size);
+            let current_size = self.ipc_overhead + estimated_body;
+            if current_size >= self.write_limit {
+                return true;
+            }
+            if estimated_body == 0 {
+                self.estimated_max_records_count.set(records_count + 1);
+                return false;
+            }
+            // Matching Java: subtract fixed metadata overhead from the limit,
+            // divide remaining body budget by per-record body cost.
+            let body_per_record = estimated_body as f64 / records_count as f64;
+            let next = ((self.write_limit.saturating_sub(self.ipc_overhead) as f64
+                / body_per_record)
+                .ceil() as i32)
+                .max(records_count + 1);
+            self.estimated_max_records_count.set(next);
+        }
+        false
+    }
+
+    /// Estimate the compressed body size using the ratio snapshot taken at batch creation.
+    /// Matching Java's `ArrowWriter.estimatedBytesWritten()`.
+    fn estimated_compressed_size(&self, uncompressed_body: usize) -> usize {
+        if self.arrow_compression_info.compression_type == ArrowCompressionType::None {
+            uncompressed_body
+        } else {
+            (uncompressed_body as f64 * self.estimated_compression_ratio as f64) as usize
+        }
     }
 
     pub fn is_closed(&self) -> bool {
@@ -380,6 +465,9 @@ impl MemoryLogRecordsArrowBuilder {
     }
 
     pub fn build(&mut self) -> Result<Vec<u8>> {
+        // Capture uncompressed body size before serialization for compression ratio update.
+        let uncompressed_body_size = self.arrow_record_batch_builder.estimated_size_in_bytes();
+
         // serialize arrow batch
         let mut arrow_batch_bytes = vec![];
         let table_schema = self.arrow_record_batch_builder.schema();
@@ -396,9 +484,23 @@ impl MemoryLogRecordsArrowBuilder {
         let header = writer.get_ref().len();
         let record_batch = self.arrow_record_batch_builder.build_arrow_record_batch()?;
         writer.write(record_batch.as_ref())?;
-        // get real arrow batch bytes
+        // get real arrow batch bytes (metadata + body, potentially compressed)
         let real_arrow_batch_bytes = &arrow_batch_bytes[header..];
 
+        // Update compression ratio estimator with actual ratio.
+        // The serialized bytes include metadata + compressed body. Subtract
+        // metadata to isolate the compressed body for an accurate ratio.
+        if uncompressed_body_size > 0
+            && self.arrow_compression_info.compression_type != ArrowCompressionType::None
+        {
+            let compressed_body_size = real_arrow_batch_bytes
+                .len()
+                .saturating_sub(self.ipc_overhead);
+            let actual_ratio = compressed_body_size as f32 / uncompressed_body_size as f32;
+            self.compression_ratio_estimator
+                .update_estimation(actual_ratio);
+        }
+
         // now, write batch header and arrow batch
         let mut batch_bytes = vec![0u8; RECORD_BATCH_HEADER_SIZE + real_arrow_batch_bytes.len()];
         // write batch header
@@ -451,12 +553,72 @@ impl MemoryLogRecordsArrowBuilder {
     }
 
     /// Get an estimate of the number of bytes written to the underlying buffer.
-    /// This includes the batch header size plus the estimated arrow data size.
+    /// Includes Fluss record batch header + Arrow IPC metadata + estimated
+    /// compressed body size.
     pub fn estimated_size_in_bytes(&self) -> usize {
-        RECORD_BATCH_HEADER_SIZE + self.arrow_record_batch_builder.estimated_size_in_bytes()
+        let body = self.arrow_record_batch_builder.estimated_size_in_bytes();
+        let estimated_body = self.estimated_compressed_size(body);
+        RECORD_BATCH_HEADER_SIZE + self.ipc_overhead + estimated_body
     }
 }
 
+/// Estimate the Arrow IPC overhead (metadata + body framing) for a given schema.
+///
+/// Serializes a 1-row RecordBatch with known data sizes, then subtracts the
+/// raw data contribution to isolate the fixed overhead: IPC message header,
+/// RecordBatch flatbuffer, and per-buffer alignment padding within the body.
+/// This overhead is constant for a given schema+compression combination.
+///
+/// Note: called once per batch creation. With writer pooling (see TODO above),
+/// this would be computed once per pooled writer and reused across batches.
+/// Analogous to Java's `ArrowUtils.estimateArrowMetadataLength()`.
+fn estimate_arrow_ipc_overhead(
+    schema: &SchemaRef,
+    compression: Option<CompressionType>,
+) -> Result<usize> {
+    use arrow::array::new_null_array;
+
+    // Create a 1-row batch of nulls. Null arrays have minimal, predictable
+    // data: a validity bitmap (where present) plus zero-filled fixed-width
+    // buffers, with no variable-length payload, so raw size is exact.
+    let null_arrays: Vec<ArrayRef> = schema
+        .fields()
+        .iter()
+        .map(|field| new_null_array(field.data_type(), 1))
+        .collect();
+    let batch = RecordBatch::try_new(schema.clone(), null_arrays)?;
+
+    // Sum the raw buffer sizes — this is what buffer_size() would report.
+    let raw_data: usize = batch
+        .columns()
+        .iter()
+        .map(|col| {
+            col.to_data()
+                .buffers()
+                .iter()
+                .map(|buf| round_up_to_8(buf.len()))
+                .sum::<usize>()
+                // Validity buffer (null bitmap)
+                + col
+                    .nulls()
+                    .map_or(0, |n| round_up_to_8(n.buffer().len()))
+        })
+        .sum();
+
+    // Serialize the batch via IPC and measure total output.
+    let mut buf = vec![];
+    let write_option =
+        IpcWriteOptions::try_with_compression(IpcWriteOptions::default(), compression);
+    let mut writer = StreamWriter::try_new_with_options(&mut buf, schema, write_option?)?;
+    let header_len = writer.get_ref().len();
+    writer.write(&batch)?;
+    let total_len = writer.get_ref().len();
+
+    // IPC overhead = total message size - raw data we put in.
+    let ipc_message_len = total_len - header_len;
+    Ok(ipc_message_len.saturating_sub(raw_data))
+}
+
 pub trait ToArrow {
     fn append_to(&self, builder: &mut dyn ArrayBuilder) -> Result<()>;
 }
@@ -1975,6 +2137,8 @@ mod tests {
                 compression_type: ArrowCompressionType::None,
                 compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
             },
+            usize::MAX,
+            Arc::new(ArrowCompressionRatioEstimator::default()),
         )?;
 
         let mut row = GenericRow::new(2);
diff --git a/fluss-rust/crates/fluss/src/row/column_writer.rs b/fluss-rust/crates/fluss/src/row/column_writer.rs
index fbaa000dbe..be94cf062b 100644
--- a/fluss-rust/crates/fluss/src/row/column_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/column_writer.rs
@@ -36,9 +36,16 @@ use arrow::array::{
 };
 use arrow_schema::DataType as ArrowDataType;
 
+/// Round up to the next multiple of 8 (Arrow IPC buffer alignment).
+#[inline]
+pub(crate) fn round_up_to_8(n: usize) -> usize {
+    (n + 7) & !7
+}
+
 /// Estimated average byte size for variable-width columns (Utf8, Binary).
 /// Used to pre-allocate data buffers and avoid reallocations during batch building.
-const VARIABLE_WIDTH_AVG_BYTES: usize = 64;
+/// Matches Java Arrow's `BaseVariableWidthVector.DEFAULT_RECORD_BYTE_COUNT`.
+const VARIABLE_WIDTH_AVG_BYTES: usize = 8;
 
 /// A typed column writer that reads one column from an [`InternalRow`] and
 /// appends directly to a concrete Arrow builder — no intermediate [`Datum`],
@@ -397,19 +404,78 @@ impl ColumnWriter {
         }
     }
 
-    /// Clone-finish the builder for size estimation (does not reset the builder).
-    pub fn finish_cloned(&self) -> ArrayRef {
+    /// Returns the total buffer size in bytes, rounded up to 8-byte alignment
+    /// per buffer. Reads buffer lengths directly from the builders — O(1), no
+    /// allocation. Analogous to Java's `ArrowUtils.estimateArrowBodyLength()`
+    /// which sums `buf.readableBytes()` with 8-byte rounding per buffer.
+    /// The IPC framing overhead not captured here is accounted for separately
+    /// by `estimate_arrow_ipc_overhead()`.
+    pub fn buffer_size(&self) -> usize {
+        /// Validity bitmap size, rounded to 8-byte alignment.
+        /// When no nulls have been appended, the builder does not materialize
+        /// the bitmap and the IPC body contributes 0 bytes for this buffer.
+        #[inline]
+        fn validity_size(slice: Option<&[u8]>) -> usize {
+            round_up_to_8(slice.map_or(0, |s| s.len()))
+        }
+
+        /// Primitive builder: validity + values (values_slice returns &[T::Native]).
+        macro_rules! primitive_size {
+            ($b:expr) => {
+                validity_size($b.validity_slice())
+                    + round_up_to_8(std::mem::size_of_val($b.values_slice()))
+            };
+        }
+
+        /// Variable-width builder: validity + offsets + values.
+        macro_rules! var_width_size {
+            ($b:expr) => {
+                validity_size($b.validity_slice())
+                    + round_up_to_8(std::mem::size_of_val($b.offsets_slice()))
+                    + round_up_to_8($b.values_slice().len())
+            };
+        }
+
         match &self.inner {
+            TypedWriter::Bool(b) => {
+                validity_size(b.validity_slice()) + round_up_to_8(b.values_slice().len())
+            }
+            TypedWriter::Int8(b) => primitive_size!(b),
+            TypedWriter::Int16(b) => primitive_size!(b),
+            TypedWriter::Int32(b) => primitive_size!(b),
+            TypedWriter::Int64(b) => primitive_size!(b),
+            TypedWriter::Float32(b) => primitive_size!(b),
+            TypedWriter::Float64(b) => primitive_size!(b),
+            TypedWriter::Decimal128 { builder: b, .. } => primitive_size!(b),
+            TypedWriter::Date32(b) => primitive_size!(b),
+            TypedWriter::Time32Second(b) => primitive_size!(b),
+            TypedWriter::Time32Millisecond(b) => primitive_size!(b),
+            TypedWriter::Time64Microsecond(b) => primitive_size!(b),
+            TypedWriter::Time64Nanosecond(b) => primitive_size!(b),
+            TypedWriter::TimestampNtzSecond { builder: b, .. } => primitive_size!(b),
+            TypedWriter::TimestampNtzMillisecond { builder: b, .. } => primitive_size!(b),
+            TypedWriter::TimestampNtzMicrosecond { builder: b, .. } => primitive_size!(b),
+            TypedWriter::TimestampNtzNanosecond { builder: b, .. } => primitive_size!(b),
+            TypedWriter::TimestampLtzSecond { builder: b, .. } => primitive_size!(b),
+            TypedWriter::TimestampLtzMillisecond { builder: b, .. } => primitive_size!(b),
+            TypedWriter::TimestampLtzMicrosecond { builder: b, .. } => primitive_size!(b),
+            TypedWriter::TimestampLtzNanosecond { builder: b, .. } => primitive_size!(b),
+            // Variable-width types: validity + offsets + values
+            TypedWriter::Char { builder: b, .. } => var_width_size!(b),
+            TypedWriter::String(b) => var_width_size!(b),
+            TypedWriter::Bytes(b) => var_width_size!(b),
+            TypedWriter::Binary { builder: b, .. } => {
+                validity_size(b.validity_slice()) + round_up_to_8(b.values_slice().len())
+            }
             TypedWriter::List {
                 element_writer,
                 offsets,
                 validity,
             } => {
-                let item_nullable = element_writer.nullable;
-                let values = element_writer.finish_cloned();
-                finish_list_array(values, item_nullable, offsets, validity)
+                let validity_bytes = round_up_to_8(validity.len().div_ceil(8));
+                let offsets_bytes = round_up_to_8(offsets.len() * std::mem::size_of::<i32>());
+                validity_bytes + offsets_bytes + element_writer.buffer_size()
             }
-            _ => with_builder!(&self.inner, b => (b as &dyn ArrayBuilder).finish_cloned()),
         }
     }
 
@@ -847,10 +913,10 @@ mod tests {
         assert_eq!(int_arr.value(1), 20);
         assert_eq!(int_arr.value(2), 30);
 
-        // finish_cloned does not reset
+        // buffer_size grows with appended data and does not reset the builder
         let mut w = writer_for(&DataTypes::int(), 4);
         w.write_field(&GenericRow::from_data(vec![42_i32])).unwrap();
-        assert_eq!(w.finish_cloned().len(), 1);
+        assert!(w.buffer_size() > 0);
         w.write_field(&GenericRow::from_data(vec![99_i32])).unwrap();
         let int_arr = w
             .finish()

From d1e60150968ffdb408b1e183bd5f2885eea5c1fc Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Thu, 16 Apr 2026 10:48:47 +0100
Subject: [PATCH 234/287] feat: Elixir bindings initial PR (#452)

---
 fluss-rust/.licenserc.yaml                    |   1 +
 fluss-rust/Cargo.lock                         |  60 +++
 fluss-rust/Cargo.toml                         |   2 +-
 fluss-rust/bindings/elixir/.formatter.exs     |  20 +
 fluss-rust/bindings/elixir/.gitignore         |   9 +
 fluss-rust/bindings/elixir/README.md          |  60 +++
 fluss-rust/bindings/elixir/lib/fluss.ex       |  52 +++
 fluss-rust/bindings/elixir/lib/fluss/admin.ex | 111 +++++
 .../elixir/lib/fluss/append_writer.ex         |  75 ++++
 .../bindings/elixir/lib/fluss/config.ex       |  67 +++
 .../bindings/elixir/lib/fluss/connection.ex   |  51 +++
 .../bindings/elixir/lib/fluss/log_scanner.ex  |  96 ++++
 .../bindings/elixir/lib/fluss/native.ex       |  80 ++++
 .../bindings/elixir/lib/fluss/schema.ex       |  74 ++++
 fluss-rust/bindings/elixir/lib/fluss/table.ex |  47 ++
 .../elixir/lib/fluss/table_descriptor.ex      |  45 ++
 .../bindings/elixir/lib/fluss/write_handle.ex |  44 ++
 fluss-rust/bindings/elixir/mix.exs            |  61 +++
 fluss-rust/bindings/elixir/mix.lock           |  13 +
 .../elixir/native/fluss_nif/Cargo.toml        |  34 ++
 .../elixir/native/fluss_nif/src/admin.rs      | 121 +++++
 .../native/fluss_nif/src/append_writer.rs     |  69 +++
 .../elixir/native/fluss_nif/src/async_nif.rs  |  92 ++++
 .../elixir/native/fluss_nif/src/atoms.rs      |  45 ++
 .../elixir/native/fluss_nif/src/config.rs     |  44 ++
 .../elixir/native/fluss_nif/src/connection.rs |  43 ++
 .../elixir/native/fluss_nif/src/lib.rs        |  47 ++
 .../native/fluss_nif/src/log_scanner.rs       | 164 +++++++
 .../native/fluss_nif/src/row_convert.rs       | 267 +++++++++++
 .../elixir/native/fluss_nif/src/schema.rs     | 110 +++++
 .../elixir/native/fluss_nif/src/table.rs      |  89 ++++
 .../native/fluss_nif/src/write_handle.rs      |  47 ++
 .../bindings/elixir/test/fluss_test.exs       |  66 +++
 .../test/integration/log_table_test.exs       | 413 ++++++++++++++++++
 .../bindings/elixir/test/support/cluster.ex   | 211 +++++++++
 .../bindings/elixir/test/test_helper.exs      |  27 ++
 36 files changed, 2856 insertions(+), 1 deletion(-)
 create mode 100644 fluss-rust/bindings/elixir/.formatter.exs
 create mode 100644 fluss-rust/bindings/elixir/.gitignore
 create mode 100644 fluss-rust/bindings/elixir/README.md
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/admin.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/append_writer.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/config.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/connection.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/log_scanner.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/native.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/schema.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/table.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/table_descriptor.ex
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/write_handle.ex
 create mode 100644 fluss-rust/bindings/elixir/mix.exs
 create mode 100644 fluss-rust/bindings/elixir/mix.lock
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/Cargo.toml
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/admin.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/append_writer.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/async_nif.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/connection.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/lib.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/log_scanner.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/row_convert.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/schema.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/table.rs
 create mode 100644 fluss-rust/bindings/elixir/native/fluss_nif/src/write_handle.rs
 create mode 100644 fluss-rust/bindings/elixir/test/fluss_test.exs
 create mode 100644 fluss-rust/bindings/elixir/test/integration/log_table_test.exs
 create mode 100644 fluss-rust/bindings/elixir/test/support/cluster.ex
 create mode 100644 fluss-rust/bindings/elixir/test/test_helper.exs

diff --git a/fluss-rust/.licenserc.yaml b/fluss-rust/.licenserc.yaml
index 275585377f..5fcd99829a 100644
--- a/fluss-rust/.licenserc.yaml
+++ b/fluss-rust/.licenserc.yaml
@@ -27,6 +27,7 @@ header:
     - 'NOTICE'
     - 'DISCLAIMER'
     - 'bindings/python/fluss/py.typed'
+    - '**/mix.lock'
     - 'website/**'
     - '**/*.md'
     - '**/DEPENDENCIES.*.tsv'
diff --git a/fluss-rust/Cargo.lock b/fluss-rust/Cargo.lock
index 388d1a259e..ac5b27f883 100644
--- a/fluss-rust/Cargo.lock
+++ b/fluss-rust/Cargo.lock
@@ -1136,6 +1136,16 @@ dependencies = [
  "tokio",
 ]
 
+[[package]]
+name = "fluss_nif"
+version = "0.2.0"
+dependencies = [
+ "bigdecimal",
+ "fluss-rs",
+ "rustler",
+ "tokio",
+]
+
 [[package]]
 name = "fluss_python"
 version = "0.2.0"
@@ -1745,6 +1755,15 @@ dependencies = [
  "rustversion",
 ]
 
+[[package]]
+name = "inventory"
+version = "0.3.24"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "a4f0c30c76f2f4ccee3fe55a2435f691ca00c0e4bd87abe4f4a851b1d4dac39b"
+dependencies = [
+ "rustversion",
+]
+
 [[package]]
 name = "ipnet"
 version = "2.12.0"
@@ -1916,6 +1935,16 @@ version = "0.2.184"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "48f5d2a454e16a5ea0f4ced81bd44e4cfc7bd3a507b61887c99fd3538b28e4af"
 
+[[package]]
+name = "libloading"
+version = "0.9.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "754ca22de805bb5744484a5b151a9e1a8e837d5dc232c2d7d8c2e3492edc8b60"
+dependencies = [
+ "cfg-if",
+ "windows-link",
+]
+
 [[package]]
 name = "libm"
 version = "0.2.16"
@@ -2741,6 +2770,12 @@ dependencies = [
  "regex-syntax",
 ]
 
+[[package]]
+name = "regex-lite"
+version = "0.1.9"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "cab834c73d247e67f4fae452806d17d3c7501756d98c8808d7c9c7aa7d18f973"
+
 [[package]]
 name = "regex-syntax"
 version = "0.8.10"
@@ -2870,6 +2905,31 @@ dependencies = [
  "windows-sys 0.61.2",
 ]
 
+[[package]]
+name = "rustler"
+version = "0.37.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c779e2cbfa2987990205d0d8fc142163739e45a4c6592dc637896c77fec01280"
+dependencies = [
+ "inventory",
+ "libloading",
+ "regex-lite",
+ "rustler_codegen",
+]
+
+[[package]]
+name = "rustler_codegen"
+version = "0.37.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "e6e120f8936c779b6c2e09992a2dfa9a4e8bcd0794c02bb654fde03e03ce8c31"
+dependencies = [
+ "heck",
+ "inventory",
+ "proc-macro2",
+ "quote",
+ "syn",
+]
+
 [[package]]
 name = "rustls"
 version = "0.23.37"
diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 2abdbf0626..b625ab3485 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -28,7 +28,7 @@ keywords = ["fluss", "streaming-storage", "datalake"]
 
 [workspace]
 resolver = "2"
-members = ["crates/fluss", "crates/fluss-test-cluster", "crates/examples", "bindings/python", "bindings/cpp"]
+members = ["crates/fluss", "crates/fluss-test-cluster", "crates/examples", "bindings/python", "bindings/cpp", "bindings/elixir/native/fluss_nif"]
 
 [workspace.dependencies]
 fluss = { package = "fluss-rs", version = "0.2.0", path = "crates/fluss", features = ["storage-all"] }
diff --git a/fluss-rust/bindings/elixir/.formatter.exs b/fluss-rust/bindings/elixir/.formatter.exs
new file mode 100644
index 0000000000..dd63ff521c
--- /dev/null
+++ b/fluss-rust/bindings/elixir/.formatter.exs
@@ -0,0 +1,20 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[
+  inputs: ["{mix,.formatter}.exs", "{config,lib,test}/**/*.{ex,exs}"]
+]
diff --git a/fluss-rust/bindings/elixir/.gitignore b/fluss-rust/bindings/elixir/.gitignore
new file mode 100644
index 0000000000..90277ffb16
--- /dev/null
+++ b/fluss-rust/bindings/elixir/.gitignore
@@ -0,0 +1,9 @@
+# Elixir build artifacts
+_build/
+deps/
+
+# Generated NIF shared library
+priv/native/
+
+# Crash dumps
+erl_crash.dump
diff --git a/fluss-rust/bindings/elixir/README.md b/fluss-rust/bindings/elixir/README.md
new file mode 100644
index 0000000000..656b03c51d
--- /dev/null
+++ b/fluss-rust/bindings/elixir/README.md
@@ -0,0 +1,60 @@
+# Fluss Elixir Client
+
+Elixir client for [Apache Fluss (Incubating)](https://fluss.apache.org/), built on the official Rust client via [Rustler](https://github.com/rusterlium/rustler) NIFs.
+
+Currently supports **log tables** (append + scan). Primary key (KV) table support is planned.
+
+## Requirements
+
+- Elixir >= 1.15
+- Rust stable toolchain (for compiling the NIF)
+
+## Quick Start
+
+```elixir
+config = Fluss.Config.new("localhost:9123")
+conn = Fluss.Connection.new!(config)
+admin = Fluss.Admin.new!(conn)
+
+# Start from an empty schema and pipe in the columns; there is no separate build step.
+schema =
+  Fluss.Schema.new()
+  |> Fluss.Schema.column("ts", :bigint)
+  |> Fluss.Schema.column("message", :string)
+
+:ok = Fluss.Admin.create_table(admin, "my_db", "events", Fluss.TableDescriptor.new!(schema))
+
+table = Fluss.Table.get!(conn, "my_db", "events")
+writer = Fluss.AppendWriter.new!(table)
+Fluss.AppendWriter.append(writer, [1_700_000_000, "hello"])
+:ok = Fluss.AppendWriter.flush(writer)
+
+scanner = Fluss.LogScanner.new!(table)
+:ok = Fluss.LogScanner.subscribe(scanner, 0, Fluss.earliest_offset())
+:ok = Fluss.LogScanner.poll(scanner, 5_000)
+
+receive do
+  {:fluss_records, records} -> Enum.each(records, &IO.inspect(&1[:row]))
+  {:fluss_poll_error, reason} -> IO.puts("poll error: #{reason}")
+end
+```
+
+## Data Types
+
+Simple: `:boolean`, `:tinyint`, `:smallint`, `:int`, `:bigint`, `:float`, `:double`, `:string`, `:bytes`, `:date`, `:time`, `:timestamp`, `:timestamp_ltz`
+
+Parameterized: `{:decimal, precision, scale}`, `{:char, length}`, `{:binary, length}`
+
+## Development
+
+```bash
+cd bindings/elixir
+mix test                        # unit tests
+mix test --include integration  # starts Docker cluster
+```
+
+Set `FLUSS_BOOTSTRAP_SERVERS` to use an existing cluster.
+
+## License
+
+Apache License 2.0
diff --git a/fluss-rust/bindings/elixir/lib/fluss.ex b/fluss-rust/bindings/elixir/lib/fluss.ex
new file mode 100644
index 0000000000..25aa649160
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss.ex
@@ -0,0 +1,52 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss do
+  @moduledoc """
+  Elixir client for Apache Fluss (Incubating).
+
+  ## Examples
+
+      config = Fluss.Config.new("localhost:9123")
+      conn = Fluss.Connection.new!(config)
+      admin = Fluss.Admin.new!(conn)
+
+      schema =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("ts", :bigint)
+        |> Fluss.Schema.column("message", :string)
+
+      :ok = Fluss.Admin.create_table(admin, "my_db", "events", Fluss.TableDescriptor.new!(schema))
+
+      table = Fluss.Table.get!(conn, "my_db", "events")
+      writer = Fluss.AppendWriter.new!(table)
+      Fluss.AppendWriter.append(writer, [1_700_000_000, "hello"])
+      :ok = Fluss.AppendWriter.flush(writer)
+
+      scanner = Fluss.LogScanner.new!(table)
+      :ok = Fluss.LogScanner.subscribe(scanner, 0, Fluss.earliest_offset())
+      :ok = Fluss.LogScanner.poll(scanner, 5_000)
+      receive do
+        {:fluss_records, records} -> records
+      end
+
+  """
+
+  alias Fluss.Native
+
+  def earliest_offset, do: Native.earliest_offset()
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/admin.ex b/fluss-rust/bindings/elixir/lib/fluss/admin.ex
new file mode 100644
index 0000000000..a40f2d65f3
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/admin.ex
@@ -0,0 +1,111 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.Admin do
+  @moduledoc """
+  Admin client for DDL and metadata operations (create, drop, and list databases and tables).
+
+  ## Examples
+
+      admin = Fluss.Admin.new!(conn)
+      :ok = Fluss.Admin.create_database(admin, "my_db")
+
+      schema = Fluss.Schema.new() |> Fluss.Schema.column("ts", :bigint)
+      descriptor = Fluss.TableDescriptor.new!(schema)
+      :ok = Fluss.Admin.create_table(admin, "my_db", "events", descriptor)
+
+  """
+
+  alias Fluss.Native
+
+  @type t :: reference()
+
+  @spec new(Fluss.Connection.t()) :: {:ok, t()} | {:error, String.t()}
+  def new(conn) do
+    case Native.admin_new(conn) do
+      {:error, _} = err -> err
+      admin -> {:ok, admin}
+    end
+  end
+
+  @spec new!(Fluss.Connection.t()) :: t()
+  def new!(conn) do
+    case new(conn) do
+      {:ok, admin} -> admin
+      {:error, reason} -> raise "failed to create admin: #{reason}"
+    end
+  end
+
+  @spec create_database(t(), String.t(), boolean()) :: :ok | {:error, String.t()}
+  def create_database(admin, name, ignore_if_exists \\ true) do
+    admin
+    |> Native.admin_create_database(name, ignore_if_exists)
+    |> Native.await_nif()
+  end
+
+  @spec drop_database(t(), String.t(), boolean()) :: :ok | {:error, String.t()}
+  def drop_database(admin, name, ignore_if_not_exists \\ true) do
+    admin
+    |> Native.admin_drop_database(name, ignore_if_not_exists)
+    |> Native.await_nif()
+  end
+
+  @spec list_databases(t()) :: {:ok, [String.t()]} | {:error, String.t()}
+  def list_databases(admin) do
+    admin
+    |> Native.admin_list_databases()
+    |> Native.await_nif()
+  end
+
+  @spec list_databases!(t()) :: [String.t()]
+  def list_databases!(admin) do
+    case list_databases(admin) do
+      {:ok, dbs} -> dbs
+      {:error, reason} -> raise "failed to list databases: #{reason}"
+    end
+  end
+
+  @spec create_table(t(), String.t(), String.t(), Fluss.TableDescriptor.t(), boolean()) ::
+          :ok | {:error, String.t()}
+  def create_table(admin, database, table, descriptor, ignore_if_exists \\ true) do
+    admin
+    |> Native.admin_create_table(database, table, descriptor, ignore_if_exists)
+    |> Native.await_nif()
+  end
+
+  @spec drop_table(t(), String.t(), String.t(), boolean()) :: :ok | {:error, String.t()}
+  def drop_table(admin, database, table, ignore_if_not_exists \\ true) do
+    admin
+    |> Native.admin_drop_table(database, table, ignore_if_not_exists)
+    |> Native.await_nif()
+  end
+
+  @spec list_tables(t(), String.t()) :: {:ok, [String.t()]} | {:error, String.t()}
+  def list_tables(admin, database) do
+    admin
+    |> Native.admin_list_tables(database)
+    |> Native.await_nif()
+  end
+
+  @spec list_tables!(t(), String.t()) :: [String.t()]
+  def list_tables!(admin, database) do
+    case list_tables(admin, database) do
+      {:ok, tables} -> tables
+      {:error, reason} -> raise "failed to list tables: #{reason}"
+    end
+  end
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/append_writer.ex b/fluss-rust/bindings/elixir/lib/fluss/append_writer.ex
new file mode 100644
index 0000000000..767802ac02
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/append_writer.ex
@@ -0,0 +1,75 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.AppendWriter do
+  @moduledoc """
+  Writer for appending records to a log table.
+
+  Values are passed as a list in column order. Use `nil` for null values.
+  `append/2` returns `{:ok, handle}`, where `handle` is a `Fluss.WriteHandle` — drop it for
+  fire-and-forget, or call `Fluss.WriteHandle.wait/1` for per-record acknowledgment.
+
+  ## Examples
+
+      writer = Fluss.AppendWriter.new!(table)
+
+      # Fire-and-forget
+      Fluss.AppendWriter.append(writer, [1_700_000_000, "hello"])
+      Fluss.AppendWriter.append(writer, [1_700_000_001, "world"])
+      :ok = Fluss.AppendWriter.flush(writer)
+
+      # Per-record ack
+      {:ok, handle} = Fluss.AppendWriter.append(writer, [1_700_000_002, "critical"])
+      :ok = Fluss.WriteHandle.wait(handle)
+
+  """
+
+  alias Fluss.Native
+
+  @type t :: reference()
+
+  @spec new(Fluss.Table.t()) :: {:ok, t()} | {:error, String.t()}
+  def new(table) do
+    case Native.append_writer_new(table) do
+      {:error, _} = err -> err
+      w -> {:ok, w}
+    end
+  end
+
+  @spec new!(Fluss.Table.t()) :: t()
+  def new!(table) do
+    case new(table) do
+      {:ok, w} -> w
+      {:error, reason} -> raise "failed to create append writer: #{reason}"
+    end
+  end
+
+  @spec append(t(), list()) :: {:ok, Fluss.WriteHandle.t()} | {:error, String.t()}
+  def append(writer, values) when is_list(values) do
+    case Native.append_writer_append(writer, values) do
+      {:error, _} = err -> err
+      handle -> {:ok, handle}
+    end
+  end
+
+  @spec flush(t()) :: :ok | {:error, String.t()}
+  def flush(writer) do
+    writer
+    |> Native.append_writer_flush()
+    |> Native.await_nif()
+  end
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/config.ex b/fluss-rust/bindings/elixir/lib/fluss/config.ex
new file mode 100644
index 0000000000..1120a5f450
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/config.ex
@@ -0,0 +1,67 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.Config do
+  @moduledoc """
+  Client configuration for connecting to a Fluss cluster.
+
+  Fields left as `nil` use the client's defaults.
+
+  ## Examples
+
+      config = Fluss.Config.new("localhost:9123")
+
+      config =
+        Fluss.Config.new("host1:9123,host2:9123")
+        |> Fluss.Config.set_writer_batch_size(1_048_576)
+
+  """
+
+  @enforce_keys [:bootstrap_servers]
+  defstruct bootstrap_servers: nil,
+            writer_batch_size: nil,
+            writer_batch_timeout_ms: nil
+
+  @type t :: %__MODULE__{
+          bootstrap_servers: String.t(),
+          writer_batch_size: non_neg_integer() | nil,
+          writer_batch_timeout_ms: non_neg_integer() | nil
+        }
+
+  @spec new(String.t()) :: t()
+  def new(bootstrap_servers) when is_binary(bootstrap_servers) do
+    %__MODULE__{bootstrap_servers: bootstrap_servers}
+  end
+
+  @spec default() :: t()
+  def default, do: %__MODULE__{bootstrap_servers: ""}
+
+  @spec set_bootstrap_servers(t(), String.t()) :: t()
+  def set_bootstrap_servers(%__MODULE__{} = config, servers) when is_binary(servers),
+    do: %{config | bootstrap_servers: servers}
+
+  @spec set_writer_batch_size(t(), non_neg_integer()) :: t()
+  def set_writer_batch_size(%__MODULE__{} = config, size) when is_integer(size),
+    do: %{config | writer_batch_size: size}
+
+  @spec set_writer_batch_timeout_ms(t(), non_neg_integer()) :: t()
+  def set_writer_batch_timeout_ms(%__MODULE__{} = config, ms) when is_integer(ms),
+    do: %{config | writer_batch_timeout_ms: ms}
+
+  @spec get_bootstrap_servers(t()) :: String.t()
+  def get_bootstrap_servers(%__MODULE__{bootstrap_servers: servers}), do: servers
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/connection.ex b/fluss-rust/bindings/elixir/lib/fluss/connection.ex
new file mode 100644
index 0000000000..0fd664682e
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/connection.ex
@@ -0,0 +1,51 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.Connection do
+  @moduledoc """
+  A connection to a Fluss cluster.
+
+  Errors are per-operation, not per-connection. If the server becomes
+  unreachable, individual calls fail but the connection recovers
+  transparently — there is no need to recreate it.
+
+  ## Examples
+
+      config = Fluss.Config.new("localhost:9123")
+      {:ok, conn} = Fluss.Connection.new(config)
+
+  """
+
+  alias Fluss.Native
+
+  @type t :: reference()
+
+  @spec new(Fluss.Config.t()) :: {:ok, t()} | {:error, String.t()}
+  def new(%Fluss.Config{} = config) do
+    config
+    |> Native.connection_new()
+    |> Native.await_nif()
+  end
+
+  @spec new!(Fluss.Config.t()) :: t()
+  def new!(%Fluss.Config{} = config) do
+    case new(config) do
+      {:ok, conn} -> conn
+      {:error, reason} -> raise "failed to connect to Fluss: #{reason}"
+    end
+  end
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/log_scanner.ex b/fluss-rust/bindings/elixir/lib/fluss/log_scanner.ex
new file mode 100644
index 0000000000..a47ea92e6e
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/log_scanner.ex
@@ -0,0 +1,96 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.LogScanner do
+  @moduledoc """
+  Scanner for reading records from a log table.
+
+  `poll/2` is non-blocking — it returns `:ok` immediately and sends results
+  as `{:fluss_records, records}` or `{:fluss_poll_error, reason}` to the
+  calling process. No dirty scheduler threads are held during the wait.
+
+  Each record is an atom-keyed map: `:offset`, `:timestamp`, `:change_type`, `:row`.
+  Row values are also atom-keyed (column names interned as atoms).
+
+  ## Examples
+
+      scanner = Fluss.LogScanner.new!(table)
+      :ok = Fluss.LogScanner.subscribe(scanner, 0, Fluss.earliest_offset())
+      :ok = Fluss.LogScanner.poll(scanner, 5_000)
+
+      receive do
+        {:fluss_records, records} ->
+          for record <- records, do: IO.inspect(record[:row])
+        {:fluss_poll_error, reason} ->
+          IO.puts("poll error: \#{reason}")
+      end
+
+  """
+
+  alias Fluss.Native
+
+  @type t :: reference()
+  @type record :: %{atom() => term()}
+
+  @spec new(Fluss.Table.t()) :: {:ok, t()} | {:error, String.t()}
+  def new(table) do
+    case Native.log_scanner_new(table) do
+      {:error, _} = err -> err
+      s -> {:ok, s}
+    end
+  end
+
+  @spec new!(Fluss.Table.t()) :: t()
+  def new!(table) do
+    case new(table) do
+      {:ok, s} -> s
+      {:error, reason} -> raise "failed to create log scanner: #{reason}"
+    end
+  end
+
+  @spec subscribe(t(), integer(), integer()) :: :ok | {:error, String.t()}
+  def subscribe(scanner, bucket, offset) do
+    scanner
+    |> Native.log_scanner_subscribe(bucket, offset)
+    |> Native.await_nif()
+  end
+
+  @doc """
+  Subscribes to multiple buckets. Takes a list of `{bucket_id, offset}` tuples.
+  """
+  @spec subscribe_buckets(t(), [{integer(), integer()}]) :: :ok | {:error, String.t()}
+  def subscribe_buckets(scanner, bucket_offsets) when is_list(bucket_offsets) do
+    scanner
+    |> Native.log_scanner_subscribe_buckets(bucket_offsets)
+    |> Native.await_nif()
+  end
+
+  @spec unsubscribe(t(), integer()) :: :ok | {:error, String.t()}
+  def unsubscribe(scanner, bucket) do
+    scanner
+    |> Native.log_scanner_unsubscribe(bucket)
+    |> Native.await_nif()
+  end
+
+  @doc """
+  Starts a non-blocking poll. Returns `:ok` immediately.
+  Results arrive as `{:fluss_records, [record]}` or `{:fluss_poll_error, reason}`.
+  """
+  @spec poll(t(), non_neg_integer()) :: :ok
+  def poll(scanner, timeout_ms),
+    do: Native.log_scanner_poll(scanner, timeout_ms)
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/native.ex b/fluss-rust/bindings/elixir/lib/fluss/native.ex
new file mode 100644
index 0000000000..865dda142d
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/native.ex
@@ -0,0 +1,80 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.Native do
+  @moduledoc false
+  use Rustler, otp_app: :fluss, crate: "fluss_nif"
+
+  # Connection
+  def connection_new(_config), do: :erlang.nif_error(:nif_not_loaded)
+
+  # Admin
+  def admin_new(_conn), do: :erlang.nif_error(:nif_not_loaded)
+
+  def admin_create_database(_admin, _name, _ignore_if_exists),
+    do: :erlang.nif_error(:nif_not_loaded)
+
+  def admin_drop_database(_admin, _name, _ignore_if_not_exists),
+    do: :erlang.nif_error(:nif_not_loaded)
+
+  def admin_list_databases(_admin), do: :erlang.nif_error(:nif_not_loaded)
+
+  def admin_create_table(_admin, _db, _table, _descriptor, _ignore_if_exists),
+    do: :erlang.nif_error(:nif_not_loaded)
+
+  def admin_drop_table(_admin, _db, _table, _ignore_if_not_exists),
+    do: :erlang.nif_error(:nif_not_loaded)
+
+  def admin_list_tables(_admin, _database), do: :erlang.nif_error(:nif_not_loaded)
+
+  # Schema / TableDescriptor
+  def table_descriptor_new(_schema, _bucket_count, _properties),
+    do: :erlang.nif_error(:nif_not_loaded)
+
+  # Table
+  def table_get(_conn, _database, _table), do: :erlang.nif_error(:nif_not_loaded)
+  def table_has_primary_key(_table), do: :erlang.nif_error(:nif_not_loaded)
+  def table_column_names(_table), do: :erlang.nif_error(:nif_not_loaded)
+
+  # AppendWriter
+  def append_writer_new(_table), do: :erlang.nif_error(:nif_not_loaded)
+  def append_writer_append(_writer, _values), do: :erlang.nif_error(:nif_not_loaded)
+  def append_writer_flush(_writer), do: :erlang.nif_error(:nif_not_loaded)
+
+  # LogScanner
+  def log_scanner_new(_table), do: :erlang.nif_error(:nif_not_loaded)
+  def log_scanner_subscribe(_scanner, _bucket, _offset), do: :erlang.nif_error(:nif_not_loaded)
+
+  def log_scanner_subscribe_buckets(_scanner, _bucket_offsets),
+    do: :erlang.nif_error(:nif_not_loaded)
+
+  def log_scanner_unsubscribe(_scanner, _bucket), do: :erlang.nif_error(:nif_not_loaded)
+  def log_scanner_poll(_scanner, _timeout_ms), do: :erlang.nif_error(:nif_not_loaded)
+
+  # WriteHandle
+  def write_handle_wait(_handle), do: :erlang.nif_error(:nif_not_loaded)
+
+  # Constants
+  def earliest_offset, do: :erlang.nif_error(:nif_not_loaded)
+
+  @doc false
+  def await_nif(ref) do
+    receive do
+      {^ref, result} -> result
+    end
+  end
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/schema.ex b/fluss-rust/bindings/elixir/lib/fluss/schema.ex
new file mode 100644
index 0000000000..e11911eee7
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/schema.ex
@@ -0,0 +1,74 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.Schema do
+  @moduledoc """
+  Schema definition for a Fluss table.
+
+  Simple types: `:boolean`, `:tinyint`, `:smallint`, `:int`, `:bigint`,
+  `:float`, `:double`, `:string`, `:bytes`, `:date`, `:time`, `:timestamp`, `:timestamp_ltz`
+
+  Parameterized types: `{:decimal, precision, scale}`, `{:char, length}`, `{:binary, length}`
+
+  ## Examples
+
+      schema =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("id", :int)
+        |> Fluss.Schema.column("name", :string)
+        |> Fluss.Schema.column("amount", {:decimal, 10, 2})
+
+  """
+
+  defstruct columns: [], primary_key: []
+
+  @type data_type ::
+          :boolean
+          | :tinyint
+          | :smallint
+          | :int
+          | :bigint
+          | :float
+          | :double
+          | :string
+          | :bytes
+          | :date
+          | :time
+          | :timestamp
+          | :timestamp_ltz
+          | {:decimal, non_neg_integer(), non_neg_integer()}
+          | {:char, non_neg_integer()}
+          | {:binary, non_neg_integer()}
+
+  @type t :: %__MODULE__{
+          columns: [{String.t(), data_type()}],
+          primary_key: [String.t()]
+        }
+
+  @spec new() :: t()
+  def new, do: %__MODULE__{}
+
+  @spec column(t(), String.t(), data_type()) :: t()
+  def column(%__MODULE__{} = schema, name, data_type) when is_binary(name) do
+    %{schema | columns: schema.columns ++ [{name, data_type}]}
+  end
+
+  @spec primary_key(t(), [String.t()]) :: t()
+  def primary_key(%__MODULE__{} = schema, keys) when is_list(keys) do
+    %{schema | primary_key: keys}
+  end
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/table.ex b/fluss-rust/bindings/elixir/lib/fluss/table.ex
new file mode 100644
index 0000000000..59f864af94
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/table.ex
@@ -0,0 +1,47 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.Table do
+  @moduledoc """
+  A handle to a Fluss table, used to create writers and scanners.
+  """
+
+  alias Fluss.Native
+
+  @type t :: reference()
+
+  @spec get(Fluss.Connection.t(), String.t(), String.t()) :: {:ok, t()} | {:error, String.t()}
+  def get(conn, database, table) do
+    conn
+    |> Native.table_get(database, table)
+    |> Native.await_nif()
+  end
+
+  @spec get!(Fluss.Connection.t(), String.t(), String.t()) :: t()
+  def get!(conn, database, table) do
+    case get(conn, database, table) do
+      {:ok, t} -> t
+      {:error, reason} -> raise "failed to get table: #{reason}"
+    end
+  end
+
+  @spec has_primary_key?(t()) :: boolean()
+  def has_primary_key?(table), do: Native.table_has_primary_key(table)
+
+  @spec column_names(t()) :: [String.t()]
+  def column_names(table), do: Native.table_column_names(table)
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/table_descriptor.ex b/fluss-rust/bindings/elixir/lib/fluss/table_descriptor.ex
new file mode 100644
index 0000000000..96c3e1dfb3
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/table_descriptor.ex
@@ -0,0 +1,45 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.TableDescriptor do
+  @moduledoc """
+  Descriptor for creating a Fluss table.
+
+  Options: `:bucket_count`, `:properties` (list of `{key, value}` string tuples).
+
+  ## Examples
+
+      Fluss.TableDescriptor.new!(schema)
+      Fluss.TableDescriptor.new!(schema, bucket_count: 3)
+
+  """
+
+  alias Fluss.Native
+
+  @type t :: reference()
+
+  @spec new!(Fluss.Schema.t(), keyword()) :: t()
+  def new!(%Fluss.Schema{} = schema, opts \\ []) do
+    bucket_count = Keyword.get(opts, :bucket_count)
+    properties = Keyword.get(opts, :properties, [])
+
+    case Native.table_descriptor_new(schema, bucket_count, properties) do
+      {:error, reason} -> raise "failed to create table descriptor: #{reason}"
+      ref -> ref
+    end
+  end
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/write_handle.ex b/fluss-rust/bindings/elixir/lib/fluss/write_handle.ex
new file mode 100644
index 0000000000..f0ec295be0
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/write_handle.ex
@@ -0,0 +1,44 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.WriteHandle do
+  @moduledoc """
+  Handle for a pending write operation.
+
+  Returned as `{:ok, handle}` by `Fluss.AppendWriter.append/2`. Drop it for fire-and-forget,
+  or call `wait/1` to block the caller until the per-record server acknowledgment arrives.
+  """
+
+  alias Fluss.Native
+
+  @type t :: reference()
+
+  @spec wait(t()) :: :ok | {:error, String.t()}
+  def wait(handle) do
+    handle
+    |> Native.write_handle_wait()
+    |> Native.await_nif()
+  end
+
+  @spec wait!(t()) :: :ok
+  def wait!(handle) do
+    case wait(handle) do
+      :ok -> :ok
+      {:error, reason} -> raise "write failed: #{reason}"
+    end
+  end
+end
diff --git a/fluss-rust/bindings/elixir/mix.exs b/fluss-rust/bindings/elixir/mix.exs
new file mode 100644
index 0000000000..f5d416d807
--- /dev/null
+++ b/fluss-rust/bindings/elixir/mix.exs
@@ -0,0 +1,61 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.MixProject do
+  use Mix.Project
+
+  # Package version, referenced from project/0.
+  @version "0.1.0"
+
+  # Mix project definition: app identity, compiler paths, deps and Hex metadata.
+  def project do
+    [
+      app: :fluss,
+      version: @version,
+      elixir: "~> 1.15",
+      start_permanent: Mix.env() == :prod,
+      elixirc_paths: elixirc_paths(Mix.env()),
+      deps: deps(),
+      description: "Elixir client for Apache Fluss",
+      package: package()
+    ]
+  end
+
+  # OTP application settings; only :logger is requested as an extra application.
+  def application do
+    [extra_applications: [:logger]]
+  end
+
+  # The :test environment additionally compiles the helpers in test/support.
+  defp elixirc_paths(env) do
+    if env == :test, do: ["lib", "test/support"], else: ["lib"]
+  end
+
+  # Rustler is the only dependency without `runtime: false`; ex_doc and credo
+  # are restricted to the :dev / :test environments.
+  defp deps do
+    [
+      {:rustler, "~> 0.37"},
+      {:ex_doc, "~> 0.31", only: :dev, runtime: false},
+      {:credo, "~> 1.7", only: [:dev, :test], runtime: false}
+    ]
+  end
+
+  # Hex package metadata.
+  defp package do
+    [
+      licenses: ["Apache-2.0"],
+      links: %{"GitHub" => "https://github.com/apache/fluss-rust"}
+    ]
+  end
+end
diff --git a/fluss-rust/bindings/elixir/mix.lock b/fluss-rust/bindings/elixir/mix.lock
new file mode 100644
index 0000000000..b1170d3f5b
--- /dev/null
+++ b/fluss-rust/bindings/elixir/mix.lock
@@ -0,0 +1,13 @@
+%{
+  "bunt": {:hex, :bunt, "1.0.0", "081c2c665f086849e6d57900292b3a161727ab40431219529f13c4ddcf3e7a44", [:mix], [], "hexpm", "dc5f86aa08a5f6fa6b8096f0735c4e76d54ae5c9fa2c143e5a1fc7c1cd9bb6b5"},
+  "credo": {:hex, :credo, "1.7.17", "f92b6aa5b26301eaa5a35e4d48ebf5aa1e7094ac00ae38f87086c562caf8a22f", [:mix], [{:bunt, "~> 0.2.1 or ~> 1.0", [hex: :bunt, repo: "hexpm", optional: false]}, {:file_system, "~> 0.2 or ~> 1.0", [hex: :file_system, repo: "hexpm", optional: false]}, {:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: false]}], "hexpm", "1eb5645c835f0b6c9b5410f94b5a185057bcf6d62a9c2b476da971cde8749645"},
+  "earmark_parser": {:hex, :earmark_parser, "1.4.44", "f20830dd6b5c77afe2b063777ddbbff09f9759396500cdbe7523efd58d7a339c", [:mix], [], "hexpm", "4778ac752b4701a5599215f7030989c989ffdc4f6df457c5f36938cc2d2a2750"},
+  "ex_doc": {:hex, :ex_doc, "0.40.1", "67542e4b6dde74811cfd580e2c0149b78010fd13001fda7cfeb2b2c2ffb1344d", [:mix], [{:earmark_parser, "~> 1.4.44", [hex: :earmark_parser, repo: "hexpm", optional: false]}, {:makeup_c, ">= 0.1.0", [hex: :makeup_c, repo: "hexpm", optional: true]}, {:makeup_elixir, "~> 0.14 or ~> 1.0", [hex: :makeup_elixir, repo: "hexpm", optional: false]}, {:makeup_erlang, "~> 0.1 or ~> 1.0", [hex: :makeup_erlang, repo: "hexpm", optional: false]}, {:makeup_html, ">= 0.1.0", [hex: :makeup_html, repo: "hexpm", optional: true]}], "hexpm", "bcef0e2d360d93ac19f01a85d58f91752d930c0a30e2681145feea6bd3516e00"},
+  "file_system": {:hex, :file_system, "1.1.1", "31864f4685b0148f25bd3fbef2b1228457c0c89024ad67f7a81a3ffbc0bbad3a", [:mix], [], "hexpm", "7a15ff97dfe526aeefb090a7a9d3d03aa907e100e262a0f8f7746b78f8f87a5d"},
+  "jason": {:hex, :jason, "1.4.4", "b9226785a9aa77b6857ca22832cffa5d5011a667207eb2a0ad56adb5db443b8a", [:mix], [{:decimal, "~> 1.0 or ~> 2.0", [hex: :decimal, repo: "hexpm", optional: true]}], "hexpm", "c5eb0cab91f094599f94d55bc63409236a8ec69a21a67814529e8d5f6cc90b3b"},
+  "makeup": {:hex, :makeup, "1.2.1", "e90ac1c65589ef354378def3ba19d401e739ee7ee06fb47f94c687016e3713d1", [:mix], [{:nimble_parsec, "~> 1.4", [hex: :nimble_parsec, repo: "hexpm", optional: false]}], "hexpm", "d36484867b0bae0fea568d10131197a4c2e47056a6fbe84922bf6ba71c8d17ce"},
+  "makeup_elixir": {:hex, :makeup_elixir, "1.0.1", "e928a4f984e795e41e3abd27bfc09f51db16ab8ba1aebdba2b3a575437efafc2", [:mix], [{:makeup, "~> 1.0", [hex: :makeup, repo: "hexpm", optional: false]}, {:nimble_parsec, "~> 1.2.3 or ~> 1.3", [hex: :nimble_parsec, repo: "hexpm", optional: false]}], "hexpm", "7284900d412a3e5cfd97fdaed4f5ed389b8f2b4cb49efc0eb3bd10e2febf9507"},
+  "makeup_erlang": {:hex, :makeup_erlang, "1.0.3", "4252d5d4098da7415c390e847c814bad3764c94a814a0b4245176215615e1035", [:mix], [{:makeup, "~> 1.0", [hex: :makeup, repo: "hexpm", optional: false]}], "hexpm", "953297c02582a33411ac6208f2c6e55f0e870df7f80da724ed613f10e6706afd"},
+  "nimble_parsec": {:hex, :nimble_parsec, "1.4.2", "8efba0122db06df95bfaa78f791344a89352ba04baedd3849593bfce4d0dc1c6", [:mix], [], "hexpm", "4b21398942dda052b403bbe1da991ccd03a053668d147d53fb8c4e0efe09c973"},
+  "rustler": {:hex, :rustler, "0.37.3", "5f4e6634d43b26f0a69834dd1d3ed4e1710b022a053bf4a670220c9540c92602", [:mix], [{:jason, "~> 1.0", [hex: :jason, repo: "hexpm", optional: false]}], "hexpm", "a6872c6f53dcf00486d1e7f9e046e20e01bf1654bdacc4193016c2e8002b32a2"},
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/Cargo.toml b/fluss-rust/bindings/elixir/native/fluss_nif/Cargo.toml
new file mode 100644
index 0000000000..dd4d453506
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/Cargo.toml
@@ -0,0 +1,34 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+[package]
+name = "fluss_nif"
+version.workspace = true
+edition.workspace = true
+license.workspace = true
+rust-version.workspace = true
+
+[lib]
+name = "fluss_nif"
+path = "src/lib.rs"
+crate-type = ["cdylib"]
+
+[dependencies]
+bigdecimal = { workspace = true }
+fluss = { workspace = true }
+rustler = "0.37"
+tokio = { workspace = true }
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/admin.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/admin.rs
new file mode 100644
index 0000000000..e3f29aebcd
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/admin.rs
@@ -0,0 +1,121 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::async_nif;
+use crate::atoms::to_nif_err;
+use crate::connection::ConnectionResource;
+use crate::schema::TableDescriptorResource;
+use fluss::client::FlussAdmin;
+use fluss::metadata::TablePath;
+use rustler::{Env, ResourceArc, Term};
+use std::sync::Arc;
+
+/// Rustler resource wrapping a [`FlussAdmin`] client.
+///
+/// Created by `admin_new` and passed back into every `admin_*` NIF as a
+/// `ResourceArc<AdminResource>`.
+pub struct AdminResource {
+    /// Admin client as returned by `FlussConnection::get_admin`.
+    pub inner: Arc<FlussAdmin>,
+}
+
+// Manual opt-in needed because Rustler wraps NIF bodies in `catch_unwind`;
+// see the explanatory note at the top of `lib.rs`.
+impl std::panic::RefUnwindSafe for AdminResource {}
+
+// Makes `AdminResource` usable inside a `ResourceArc`.
+#[rustler::resource_impl]
+impl rustler::Resource for AdminResource {}
+
+/// Obtains an admin client from `conn` and wraps it in an [`AdminResource`].
+///
+/// Runs synchronously. A failure from `get_admin` is converted with
+/// `to_nif_err`.
+#[rustler::nif]
+fn admin_new(
+    conn: ResourceArc<ConnectionResource>,
+) -> Result<ResourceArc<AdminResource>, rustler::Error> {
+    conn.inner
+        .get_admin()
+        .map(|inner| ResourceArc::new(AdminResource { inner }))
+        .map_err(to_nif_err)
+}
+
+/// Asynchronously creates the database `database_name`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, :ok}` or `{ref, {:error, reason}}`. The second argument of
+/// `create_database` is always `None` here (presumably an optional database
+/// descriptor — confirm against `FlussAdmin::create_database`).
+#[rustler::nif]
+fn admin_create_database<'a>(
+    env: Env<'a>,
+    admin: ResourceArc<AdminResource>,
+    database_name: String,
+    ignore_if_exists: bool,
+) -> Term<'a> {
+    let task = async move {
+        admin
+            .inner
+            .create_database(&database_name, None, ignore_if_exists)
+            .await
+    };
+    async_nif::spawn_task(env, task)
+}
+
+/// Asynchronously drops the database `database_name`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, :ok}` or `{ref, {:error, reason}}`. The last argument of
+/// `drop_database` is hard-coded to `false` (presumably a cascade flag —
+/// confirm against `FlussAdmin::drop_database`).
+#[rustler::nif]
+fn admin_drop_database<'a>(
+    env: Env<'a>,
+    admin: ResourceArc<AdminResource>,
+    database_name: String,
+    ignore_if_not_exists: bool,
+) -> Term<'a> {
+    let task = async move {
+        admin
+            .inner
+            .drop_database(&database_name, ignore_if_not_exists, false)
+            .await
+    };
+    async_nif::spawn_task(env, task)
+}
+
+/// Asynchronously lists the databases visible to `admin`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, {:ok, databases}}` or `{ref, {:error, reason}}`.
+#[rustler::nif]
+fn admin_list_databases<'a>(env: Env<'a>, admin: ResourceArc<AdminResource>) -> Term<'a> {
+    let task = async move { admin.inner.list_databases().await };
+    async_nif::spawn_task_with_result(env, task)
+}
+
+/// Asynchronously creates the table `database_name.table_name` from
+/// `descriptor`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, :ok}` or `{ref, {:error, reason}}`.
+#[rustler::nif]
+fn admin_create_table<'a>(
+    env: Env<'a>,
+    admin: ResourceArc<AdminResource>,
+    database_name: String,
+    table_name: String,
+    descriptor: ResourceArc<TableDescriptorResource>,
+    ignore_if_exists: bool,
+) -> Term<'a> {
+    let task = async move {
+        // The path is built inside the task so it lives as long as the call.
+        let table_path = TablePath::new(&database_name, &table_name);
+        admin
+            .inner
+            .create_table(&table_path, &descriptor.inner, ignore_if_exists)
+            .await
+    };
+    async_nif::spawn_task(env, task)
+}
+
+/// Asynchronously drops the table `database_name.table_name`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, :ok}` or `{ref, {:error, reason}}`.
+#[rustler::nif]
+fn admin_drop_table<'a>(
+    env: Env<'a>,
+    admin: ResourceArc<AdminResource>,
+    database_name: String,
+    table_name: String,
+    ignore_if_not_exists: bool,
+) -> Term<'a> {
+    let task = async move {
+        let table_path = TablePath::new(&database_name, &table_name);
+        admin
+            .inner
+            .drop_table(&table_path, ignore_if_not_exists)
+            .await
+    };
+    async_nif::spawn_task(env, task)
+}
+
+/// Asynchronously lists the tables of `database_name`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, {:ok, tables}}` or `{ref, {:error, reason}}`.
+#[rustler::nif]
+fn admin_list_tables<'a>(
+    env: Env<'a>,
+    admin: ResourceArc<AdminResource>,
+    database_name: String,
+) -> Term<'a> {
+    let task = async move { admin.inner.list_tables(&database_name).await };
+    async_nif::spawn_task_with_result(env, task)
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/append_writer.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/append_writer.rs
new file mode 100644
index 0000000000..d78f564e0c
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/append_writer.rs
@@ -0,0 +1,69 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::RUNTIME;
+use crate::async_nif;
+use crate::atoms::to_nif_err;
+use crate::row_convert;
+use crate::table::TableResource;
+use crate::write_handle::WriteHandleResource;
+use fluss::client::AppendWriter;
+use fluss::metadata::Column;
+use rustler::{Env, ResourceArc, Term};
+
+/// Rustler resource holding an [`AppendWriter`] together with the column
+/// list needed to convert Elixir values into rows.
+pub struct AppendWriterResource {
+    /// The core append writer.
+    pub inner: AppendWriter,
+    /// Schema columns of the table, captured when the writer was created and
+    /// passed to `row_convert::term_to_row` on every append.
+    pub columns: Vec<Column>,
+}
+
+// Manual opt-in needed because Rustler wraps NIF bodies in `catch_unwind`;
+// see the explanatory note at the top of `lib.rs`.
+impl std::panic::RefUnwindSafe for AppendWriterResource {}
+
+// Makes `AppendWriterResource` usable inside a `ResourceArc`.
+#[rustler::resource_impl]
+impl rustler::Resource for AppendWriterResource {}
+
+/// Creates an append writer for `table` and captures the table's columns.
+///
+/// Runs synchronously. Errors from `new_append` / `create_writer` are
+/// converted with `to_nif_err`.
+#[rustler::nif]
+fn append_writer_new(
+    table: ResourceArc<TableResource>,
+) -> Result<ResourceArc<AppendWriterResource>, rustler::Error> {
+    // WriterClient::new() calls tokio::spawn internally, so a runtime context
+    // must be entered for the duration of this call.
+    let _runtime_guard = RUNTIME.enter();
+
+    let (inner, columns) = table.with_table(|t| {
+        let writer = t
+            .new_append()
+            .map_err(to_nif_err)?
+            .create_writer()
+            .map_err(to_nif_err)?;
+        let schema_columns = t.get_table_info().schema.columns().to_vec();
+        Ok((writer, schema_columns))
+    })?;
+
+    let resource = AppendWriterResource { inner, columns };
+    Ok(ResourceArc::new(resource))
+}
+
+/// Converts `values` into a row using the writer's columns, hands it to the
+/// writer and returns a write handle for the pending result.
+///
+/// Conversion and append errors are converted with `to_nif_err`.
+#[rustler::nif]
+fn append_writer_append<'a>(
+    env: Env<'a>,
+    writer: ResourceArc<AppendWriterResource>,
+    values: Term<'a>,
+) -> Result<ResourceArc<WriteHandleResource>, rustler::Error> {
+    let row = row_convert::term_to_row(env, values, &writer.columns).map_err(to_nif_err)?;
+    let pending = writer.inner.append(&row).map_err(to_nif_err)?;
+    let handle = WriteHandleResource::new(pending);
+    Ok(ResourceArc::new(handle))
+}
+
+/// Asynchronously flushes `writer`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, :ok}` or `{ref, {:error, reason}}`.
+#[rustler::nif]
+fn append_writer_flush<'a>(env: Env<'a>, writer: ResourceArc<AppendWriterResource>) -> Term<'a> {
+    let task = async move { writer.inner.flush().await };
+    async_nif::spawn_task(env, task)
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/async_nif.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/async_nif.rs
new file mode 100644
index 0000000000..fd6e495be3
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/async_nif.rs
@@ -0,0 +1,92 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Async NIF helpers — spawn on tokio, send `{ref, result}` back
+//! as a BEAM message instead of blocking dirty schedulers.
+
+use crate::RUNTIME;
+use crate::atoms;
+use rustler::env::OwnedEnv;
+use rustler::{Encoder, Env, Term};
+use std::future::Future;
+
+/// Sends `{ref, :ok}` or `{ref, {:error, reason}}` on completion.
+///
+/// Spawns `future` on the shared runtime and returns `ref` right away. The
+/// reply goes to the process that invoked the NIF; `reason` is the error's
+/// `Display` text. A failed send is ignored.
+pub fn spawn_task<'a, F, E>(env: Env<'a>, future: F) -> Term<'a>
+where
+    F: Future<Output = Result<(), E>> + Send + 'static,
+    E: std::fmt::Display + Send + 'static,
+{
+    let caller = env.pid();
+    let reply_ref: Term<'a> = *env.make_ref();
+
+    // The reference has to outlive this NIF call, so it is saved into an
+    // environment owned by the task.
+    let mut reply_env = OwnedEnv::new();
+    let saved = reply_env.save(reply_ref);
+
+    RUNTIME.spawn(async move {
+        let outcome = future.await;
+        let _ = reply_env.send_and_clear(&caller, |msg_env| {
+            let tag = saved.load(msg_env);
+            let payload = match outcome {
+                Ok(()) => atoms::ok().encode(msg_env),
+                Err(err) => (atoms::error(), err.to_string()).encode(msg_env),
+            };
+            (tag, payload).encode(msg_env)
+        });
+    });
+
+    reply_ref
+}
+
+/// Sends `{ref, {:ok, value}}` or `{ref, {:error, reason}}` on completion.
+///
+/// Spawns `future` on the shared runtime and returns `ref` right away. The
+/// reply goes to the process that invoked the NIF; `value` is encoded through
+/// its `Encoder` impl and `reason` is the error's `Display` text. A failed
+/// send is ignored.
+pub fn spawn_task_with_result<'a, F, T, E>(env: Env<'a>, future: F) -> Term<'a>
+where
+    F: Future<Output = Result<T, E>> + Send + 'static,
+    T: Encoder + Send + 'static,
+    E: std::fmt::Display + Send + 'static,
+{
+    let caller = env.pid();
+    let reply_ref: Term<'a> = *env.make_ref();
+
+    // The reference has to outlive this NIF call, so it is saved into an
+    // environment owned by the task.
+    let mut reply_env = OwnedEnv::new();
+    let saved = reply_env.save(reply_ref);
+
+    RUNTIME.spawn(async move {
+        let outcome = future.await;
+        let _ = reply_env.send_and_clear(&caller, |msg_env| {
+            let tag = saved.load(msg_env);
+            let payload = match outcome {
+                Ok(value) => (atoms::ok(), value).encode(msg_env),
+                Err(err) => (atoms::error(), err.to_string()).encode(msg_env),
+            };
+            (tag, payload).encode(msg_env)
+        });
+    });
+
+    reply_ref
+}
+
+/// Sends `{ref, {:error, reason}}` immediately (no async work).
+pub fn send_error<'a>(env: Env<'a>, msg: &str) -> Term<'a> {
+    let pid = env.pid();
+    let ref_term: Term<'a> = *env.make_ref();
+    let mut task_env = OwnedEnv::new();
+    let saved_ref = task_env.save(ref_term);
+    let msg = msg.to_string();
+
+    let _ = task_env.send_and_clear(&pid, |env| {
+        let r = saved_ref.load(env);
+        (r, (atoms::error(), msg)).encode(env)
+    });
+
+    ref_term
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs
new file mode 100644
index 0000000000..20beec7184
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs
@@ -0,0 +1,45 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+// Atoms used by this crate when building terms for the BEAM. Each entry is
+// available as a function of the same name, e.g. `atoms::ok()`.
+rustler::atoms! {
+    // Generic result tags
+    ok,
+    error,
+    nil,
+
+    // Change types
+    append_only,
+    insert,
+    update_before,
+    update_after,
+    delete,
+
+    // Poll result message tags
+    fluss_records,
+    fluss_poll_error,
+
+    // Record map keys
+    offset,
+    timestamp,
+    change_type,
+    row,
+}
+
+/// Convert any `Display` error into `rustler::Error::Term`, which the NIF
+/// framework encodes as `{:error, reason_string}`.
+pub fn to_nif_err(e: impl std::fmt::Display) -> rustler::Error {
+    rustler::Error::Term(Box::new(e.to_string()))
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
new file mode 100644
index 0000000000..536ed68f3a
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
@@ -0,0 +1,44 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use fluss::config::Config;
+use rustler::NifStruct;
+
+/// Decoded from `%Fluss.Config{}` Elixir struct.
+///
+/// Optional fields that are `None` leave the corresponding core default
+/// untouched when converted with `into_core`.
+#[derive(NifStruct)]
+#[module = "Fluss.Config"]
+pub struct NifConfig {
+    /// Copied verbatim into `Config::bootstrap_servers`.
+    pub bootstrap_servers: String,
+    /// Overrides `Config::writer_batch_size` when set.
+    pub writer_batch_size: Option<i32>,
+    /// Overrides `Config::writer_batch_timeout_ms` when set.
+    pub writer_batch_timeout_ms: Option<i64>,
+}
+
+impl NifConfig {
+    /// Builds the core client `Config`.
+    ///
+    /// Starts from `Config::default()`, always replaces `bootstrap_servers`,
+    /// and replaces the writer batch settings only when they were provided.
+    pub fn into_core(self) -> Config {
+        let defaults = Config::default();
+        Config {
+            bootstrap_servers: self.bootstrap_servers,
+            writer_batch_size: self
+                .writer_batch_size
+                .unwrap_or(defaults.writer_batch_size),
+            writer_batch_timeout_ms: self
+                .writer_batch_timeout_ms
+                .unwrap_or(defaults.writer_batch_timeout_ms),
+            ..defaults
+        }
+    }
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/connection.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/connection.rs
new file mode 100644
index 0000000000..4c788eeec7
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/connection.rs
@@ -0,0 +1,43 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::async_nif;
+use crate::config::NifConfig;
+use fluss::client::FlussConnection;
+use rustler::{Env, ResourceArc, Term};
+use std::sync::Arc;
+
+/// Rustler resource wrapping a shared [`FlussConnection`].
+///
+/// Produced by `connection_new` and handed to NIFs that need the connection.
+pub struct ConnectionResource {
+    /// The established connection.
+    pub inner: Arc<FlussConnection>,
+}
+
+// Manual opt-in needed because Rustler wraps NIF bodies in `catch_unwind`;
+// see the explanatory note at the top of `lib.rs`.
+impl std::panic::RefUnwindSafe for ConnectionResource {}
+
+// Makes `ConnectionResource` usable inside a `ResourceArc`.
+#[rustler::resource_impl]
+impl rustler::Resource for ConnectionResource {}
+
+/// Asynchronously opens a connection described by `config`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, {:ok, connection}}` or `{ref, {:error, reason}}`.
+#[rustler::nif]
+fn connection_new<'a>(env: Env<'a>, config: NifConfig) -> Term<'a> {
+    let core_config = config.into_core();
+    let connect = async move {
+        match FlussConnection::new(core_config).await {
+            Ok(conn) => Ok(ResourceArc::new(ConnectionResource {
+                inner: Arc::new(conn),
+            })),
+            Err(e) => Err(e),
+        }
+    };
+    async_nif::spawn_task_with_result(env, connect)
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/lib.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/lib.rs
new file mode 100644
index 0000000000..a843d65f21
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/lib.rs
@@ -0,0 +1,47 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+// Rustler 0.37 wraps every NIF body in `std::panic::catch_unwind`, which requires
+// all captured values (including `ResourceArc<T>`) to be `RefUnwindSafe`.
+// `ResourceArc` contains `*mut T`, so it is only `RefUnwindSafe` when `T` is.
+// Our resource types contain `parking_lot` locks (`UnsafeCell`) which opt out of
+// the auto-trait. We manually impl `RefUnwindSafe` on each resource type because
+// panic safety is already guaranteed by the NIF boundary — a panic is caught and
+// converted to an Erlang exception, never observed by Rust code.
+
+mod admin;
+mod append_writer;
+mod async_nif;
+mod atoms;
+mod config;
+mod connection;
+mod log_scanner;
+mod row_convert;
+mod schema;
+mod table;
+mod write_handle;
+
+use std::sync::LazyLock;
+
+/// Crate-wide multi-threaded Tokio runtime, built lazily on first use with
+/// all drivers enabled (`enable_all`).
+///
+/// NIFs spawn their async work onto it (`RUNTIME.spawn`) or enter it
+/// (`RUNTIME.enter`) before calling code that needs a runtime context.
+/// Initialization panics if the runtime cannot be created.
+static RUNTIME: LazyLock<tokio::runtime::Runtime> = LazyLock::new(|| {
+    tokio::runtime::Builder::new_multi_thread()
+        .enable_all()
+        .build()
+        .expect("failed to create tokio runtime")
+});
+
+rustler::init!("Elixir.Fluss.Native");
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/log_scanner.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/log_scanner.rs
new file mode 100644
index 0000000000..93f1d04ed5
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/log_scanner.rs
@@ -0,0 +1,164 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::RUNTIME;
+use crate::async_nif;
+use crate::atoms::{self, to_nif_err};
+use crate::row_convert;
+use crate::table::TableResource;
+use fluss::client::{EARLIEST_OFFSET, LogScanner};
+use fluss::error::Error;
+use fluss::metadata::Column;
+use fluss::record::{ChangeType, ScanRecords};
+use rustler::env::OwnedEnv;
+use rustler::types::LocalPid;
+use rustler::{Atom, Encoder, Env, ResourceArc, Term};
+use std::collections::HashMap;
+use std::time::Duration;
+
+/// Rustler resource holding a [`LogScanner`] together with the column list
+/// needed to turn scanned rows into Elixir terms.
+pub struct LogScannerResource {
+    /// The core log scanner.
+    pub inner: LogScanner,
+    /// Schema columns of the table, captured when the scanner was created and
+    /// used when encoding poll results.
+    pub columns: Vec<Column>,
+}
+
+// Manual opt-in needed because Rustler wraps NIF bodies in `catch_unwind`;
+// see the explanatory note at the top of `lib.rs`.
+impl std::panic::RefUnwindSafe for LogScannerResource {}
+
+// Makes `LogScannerResource` usable inside a `ResourceArc`.
+#[rustler::resource_impl]
+impl rustler::Resource for LogScannerResource {}
+
+/// Creates a log scanner for `table` and captures the table's columns.
+///
+/// Runs synchronously inside a runtime context (`RUNTIME.enter()`). An error
+/// from `create_log_scanner` is converted with `to_nif_err`.
+#[rustler::nif]
+fn log_scanner_new(
+    table: ResourceArc<TableResource>,
+) -> Result<ResourceArc<LogScannerResource>, rustler::Error> {
+    let _runtime_guard = RUNTIME.enter();
+
+    let (inner, columns) = table.with_table(|t| {
+        let scanner = t.new_scan().create_log_scanner().map_err(to_nif_err)?;
+        let schema_columns = t.get_table_info().schema.columns().to_vec();
+        Ok((scanner, schema_columns))
+    })?;
+
+    let resource = LogScannerResource { inner, columns };
+    Ok(ResourceArc::new(resource))
+}
+
+/// Asynchronously subscribes `scanner` to `bucket` with the given `offset`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, :ok}` or `{ref, {:error, reason}}`.
+#[rustler::nif]
+fn log_scanner_subscribe<'a>(
+    env: Env<'a>,
+    scanner: ResourceArc<LogScannerResource>,
+    bucket: i32,
+    offset: i64,
+) -> Term<'a> {
+    let task = async move { scanner.inner.subscribe(bucket, offset).await };
+    async_nif::spawn_task(env, task)
+}
+
+/// Asynchronously subscribes `scanner` to several buckets at once.
+///
+/// `bucket_offsets` is a list of `{bucket, offset}` pairs; it is collected
+/// into a map, so a later pair for the same bucket replaces an earlier one.
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, :ok}` or `{ref, {:error, reason}}`.
+#[rustler::nif]
+fn log_scanner_subscribe_buckets<'a>(
+    env: Env<'a>,
+    scanner: ResourceArc<LogScannerResource>,
+    bucket_offsets: Vec<(i32, i64)>,
+) -> Term<'a> {
+    let offsets_by_bucket = bucket_offsets.into_iter().collect::<HashMap<i32, i64>>();
+    let task = async move { scanner.inner.subscribe_buckets(&offsets_by_bucket).await };
+    async_nif::spawn_task(env, task)
+}
+
+/// Asynchronously unsubscribes `scanner` from `bucket`.
+///
+/// Returns a reference immediately; the calling process later receives
+/// `{ref, :ok}` or `{ref, {:error, reason}}`.
+#[rustler::nif]
+fn log_scanner_unsubscribe<'a>(
+    env: Env<'a>,
+    scanner: ResourceArc<LogScannerResource>,
+    bucket: i32,
+) -> Term<'a> {
+    let task = async move { scanner.inner.unsubscribe(bucket).await };
+    async_nif::spawn_task(env, task)
+}
+
+/// Starts one asynchronous poll on `scanner`, passing `timeout_ms` (as a
+/// `Duration`) to `LogScanner::poll`.
+///
+/// Returns `:ok` immediately. The outcome is delivered later to the calling
+/// process as `{:fluss_records, records}` or `{:fluss_poll_error, reason}`.
+/// Unlike the `async_nif` helpers, the message carries no reference, so
+/// replies from overlapping polls cannot be told apart by the receiver.
+#[rustler::nif]
+fn log_scanner_poll(env: Env, scanner: ResourceArc<LogScannerResource>, timeout_ms: u64) -> Atom {
+    let pid = env.pid();
+    let timeout = Duration::from_millis(timeout_ms);
+
+    // `scanner` is already owned by this call, so it is moved into the task
+    // directly; no additional `ResourceArc` clone is needed.
+    RUNTIME.spawn(async move {
+        let result = scanner.inner.poll(timeout).await;
+        send_poll_result(&pid, result, &scanner.columns);
+    });
+
+    atoms::ok()
+}
+
+/// Delivers the outcome of a poll to `pid`.
+///
+/// Sends `{:fluss_records, records}` when the poll succeeded and the records
+/// could be encoded, otherwise `{:fluss_poll_error, reason}` with either the
+/// encoding failure or the poll error's text. A failed send is ignored.
+fn send_poll_result(pid: &LocalPid, result: Result<ScanRecords, Error>, columns: &[Column]) {
+    let mut msg_env = OwnedEnv::new();
+
+    let _ = msg_env.send_and_clear(pid, |env| match result {
+        Ok(scan_records) => match encode_scan_records(env, scan_records, columns) {
+            Ok(records) => (atoms::fluss_records(), records).encode(env),
+            Err(e) => (atoms::fluss_poll_error(), e).encode(env),
+        },
+        Err(e) => (atoms::fluss_poll_error(), e.to_string()).encode(env),
+    });
+}
+
+/// Encodes every record of `scan_records` as a map and returns them as a
+/// list term.
+///
+/// Each map has the keys `:offset`, `:timestamp`, `:change_type` (one of
+/// `:append_only`, `:insert`, `:update_before`, `:update_after`, `:delete`)
+/// and `:row` (the row converted by `row_convert::row_to_term`).
+/// Encoding stops at the first record that fails and returns a description
+/// of the failure.
+fn encode_scan_records<'a>(
+    env: Env<'a>,
+    scan_records: ScanRecords,
+    columns: &[Column],
+) -> Result<rustler::Term<'a>, String> {
+    // Column-name atoms are created once and reused for every row.
+    let column_atoms = row_convert::intern_column_atoms(env, columns);
+    let mut encoded = Vec::new();
+
+    for record in scan_records {
+        let row_term = match row_convert::row_to_term(env, record.row(), columns, &column_atoms) {
+            Ok(term) => term,
+            Err(e) => {
+                return Err(format!(
+                    "failed to convert row at offset {}: {e}",
+                    record.offset()
+                ));
+            }
+        };
+
+        let change_type = match record.change_type() {
+            ChangeType::AppendOnly => atoms::append_only(),
+            ChangeType::Insert => atoms::insert(),
+            ChangeType::UpdateBefore => atoms::update_before(),
+            ChangeType::UpdateAfter => atoms::update_after(),
+            ChangeType::Delete => atoms::delete(),
+        };
+
+        let entries = [
+            (atoms::offset().encode(env), record.offset().encode(env)),
+            (
+                atoms::timestamp().encode(env),
+                record.timestamp().encode(env),
+            ),
+            (atoms::change_type().encode(env), change_type.encode(env)),
+            (atoms::row().encode(env), row_term),
+        ];
+        let record_map = rustler::Term::map_from_pairs(env, &entries)
+            .map_err(|_| "failed to create record map".to_string())?;
+        encoded.push(record_map);
+    }
+
+    Ok(encoded.encode(env))
+}
+
+/// Exposes the core client's `EARLIEST_OFFSET` constant to Elixir.
+#[rustler::nif]
+fn earliest_offset() -> i64 {
+    EARLIEST_OFFSET
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/row_convert.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/row_convert.rs
new file mode 100644
index 0000000000..c72395e900
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/row_convert.rs
@@ -0,0 +1,267 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use std::str::FromStr;
+
+use fluss::metadata::{Column, DataType};
+use fluss::row::{Date, Decimal, GenericRow, InternalRow, Time, TimestampLtz, TimestampNtz};
+use rustler::types::binary::NewBinary;
+use rustler::{Encoder, Env, Term};
+
+use crate::atoms;
+
+/// Convert column names to BEAM atoms for use as map keys, in column order.
+///
+/// BEAM atoms are never garbage-collected; this is acceptable because column
+/// names come from server-defined table schemas (a bounded set), and repeated
+/// calls with the same names reuse the existing atoms.
+/// Panics (via `expect`) if `Atom::from_str` rejects a column name.
+pub fn intern_column_atoms<'a>(env: Env<'a>, columns: &[Column]) -> Vec<rustler::Atom> {
+    columns
+        .iter()
+        .map(|col| rustler::Atom::from_str(env, col.name()).expect("valid atom"))
+        .collect()
+}
+
+/// Encode `row` as a map of `column atom => value`; a missing atom yields `Err`, not a panic.
+pub fn row_to_term<'a>(
+    env: Env<'a>,
+    row: &dyn InternalRow,
+    columns: &[Column],
+    column_atoms: &[rustler::Atom],
+) -> Result<Term<'a>, String> {
+    let pairs: Vec<(Term<'a>, Term<'a>)> = columns
+        .iter()
+        .enumerate()
+        .map(|(i, col)| {
+            let key = column_atoms.get(i).ok_or("no atom for column")?.encode(env);
+            Ok((key, field_to_term(env, row, i, col.data_type())?))
+        })
+        .collect::<Result<_, String>>()?;
+    Term::map_from_pairs(env, &pairs).map_err(|_| "failed to create map".to_string())
+}
+
+fn field_to_term<'a>(
+    env: Env<'a>,
+    row: &dyn InternalRow,
+    pos: usize,
+    data_type: &DataType,
+) -> Result<Term<'a>, String> { // encodes the field at `pos` as dictated by `data_type`
+    if row.is_null_at(pos).map_err(|e| e.to_string())? {
+        return Ok(atoms::nil().encode(env)); // null fields become the `nil` atom
+    }
+
+    match data_type {
+        DataType::Boolean(_) => {
+            let v = row.get_boolean(pos).map_err(|e| e.to_string())?;
+            Ok(v.encode(env))
+        }
+        DataType::TinyInt(_) => {
+            let v = row.get_byte(pos).map_err(|e| e.to_string())?;
+            Ok(v.encode(env))
+        }
+        DataType::SmallInt(_) => {
+            let v = row.get_short(pos).map_err(|e| e.to_string())?;
+            Ok(v.encode(env))
+        }
+        DataType::Int(_) => {
+            let v = row.get_int(pos).map_err(|e| e.to_string())?;
+            Ok(v.encode(env))
+        }
+        DataType::BigInt(_) => {
+            let v = row.get_long(pos).map_err(|e| e.to_string())?;
+            Ok(v.encode(env))
+        }
+        DataType::Float(_) => {
+            let v = row.get_float(pos).map_err(|e| e.to_string())?;
+            Ok(v.encode(env))
+        }
+        DataType::Double(_) => {
+            let v = row.get_double(pos).map_err(|e| e.to_string())?;
+            Ok(v.encode(env))
+        }
+        DataType::String(_) => {
+            let v = row.get_string(pos).map_err(|e| e.to_string())?;
+            Ok(v.encode(env))
+        }
+        DataType::Char(ct) => {
+            let v = row
+                .get_char(pos, ct.length() as usize)
+                .map_err(|e| e.to_string())?;
+            Ok(v.encode(env))
+        }
+        DataType::Bytes(_) => {
+            let v = row.get_bytes(pos).map_err(|e| e.to_string())?;
+            let mut bin = NewBinary::new(env, v.len());
+            bin.as_mut_slice().copy_from_slice(v); // copy the bytes into the new binary
+            let binary: rustler::Binary = bin.into();
+            Ok(binary.encode(env))
+        }
+        DataType::Binary(bt) => {
+            let v = row
+                .get_binary(pos, bt.length())
+                .map_err(|e| e.to_string())?;
+            let mut bin = NewBinary::new(env, v.len());
+            bin.as_mut_slice().copy_from_slice(v); // same copy as the `Bytes` arm
+            let binary: rustler::Binary = bin.into();
+            Ok(binary.encode(env))
+        }
+        DataType::Date(_) => {
+            let v = row.get_date(pos).map_err(|e| e.to_string())?;
+            Ok(v.get_inner().encode(env)) // the wrapped inner value is sent as-is
+        }
+        DataType::Time(_) => {
+            let v = row.get_time(pos).map_err(|e| e.to_string())?;
+            Ok(v.get_inner().encode(env)) // the wrapped inner value is sent as-is
+        }
+        DataType::Timestamp(ts) => {
+            let v = row
+                .get_timestamp_ntz(pos, ts.precision())
+                .map_err(|e| e.to_string())?;
+            Ok((v.get_millisecond(), v.get_nano_of_millisecond()).encode(env)) // 2-tuple
+        }
+        DataType::TimestampLTz(ts) => {
+            let v = row
+                .get_timestamp_ltz(pos, ts.precision())
+                .map_err(|e| e.to_string())?;
+            Ok((v.get_epoch_millisecond(), v.get_nano_of_millisecond()).encode(env)) // 2-tuple
+        }
+        DataType::Decimal(dt) => {
+            let v = row
+                .get_decimal(pos, dt.precision() as usize, dt.scale() as usize)
+                .map_err(|e| e.to_string())?;
+            Ok(v.to_string().encode(env)) // decimals are sent in their string form
+        }
+        _ => Err(format!("unsupported data type: {data_type:?}")), // any other variant
+    }
+}
+
+/// Decode an Elixir list into a `GenericRow`, one element per column, in order.
+/// A `nil` element is skipped and its field left as null; a list whose length
+/// differs from the column count is rejected.
+pub fn term_to_row<'a>(
+    env: Env<'a>,
+    values: Term<'a>,
+    columns: &[Column],
+) -> Result<GenericRow<'static>, String> {
+    let terms = values
+        .decode::<Vec<Term<'a>>>()
+        .map_err(|_| "expected a list of values".to_string())?;
+    let (expected, actual) = (columns.len(), terms.len());
+    if actual != expected {
+        return Err(format!("expected {} values, got {}", expected, actual));
+    }
+
+    let mut row = GenericRow::new(expected);
+    for (pos, (&term, column)) in terms.iter().zip(columns).enumerate() {
+        // Only the `nil` atom is skipped; every other term must decode.
+        let is_nil = term
+            .decode::<rustler::Atom>()
+            .is_ok_and(|atom| atom == atoms::nil());
+        if !is_nil {
+            set_field_from_term(env, &mut row, pos, term, column.data_type())?;
+        }
+    }
+    Ok(row)
+}
+
+fn set_field_from_term<'a>(
+    _env: Env<'a>, // currently unused
+    row: &mut GenericRow<'static>,
+    pos: usize,
+    term: Term<'a>,
+    data_type: &DataType,
+) -> Result<(), String> { // decodes `term` into field `pos` of `row` as dictated by `data_type`
+    match data_type {
+        DataType::Boolean(_) => {
+            let v: bool = term.decode().map_err(|_| "expected boolean")?;
+            row.set_field(pos, v);
+        }
+        DataType::TinyInt(_) => {
+            let v: i8 = term
+                .decode()
+                .map_err(|_| "expected integer in range -128..127 for tinyint")?;
+            row.set_field(pos, v);
+        }
+        DataType::SmallInt(_) => {
+            let v: i16 = term
+                .decode()
+                .map_err(|_| "expected integer in range -32768..32767 for smallint")?;
+            row.set_field(pos, v);
+        }
+        DataType::Int(_) => {
+            let v: i32 = term.decode().map_err(|_| "expected integer")?;
+            row.set_field(pos, v);
+        }
+        DataType::BigInt(_) => {
+            let v: i64 = term.decode().map_err(|_| "expected integer")?;
+            row.set_field(pos, v);
+        }
+        DataType::Date(_) => {
+            let v: i32 = term
+                .decode()
+                .map_err(|_| "expected integer (days since epoch)")?;
+            row.set_field(pos, Date::new(v));
+        }
+        DataType::Time(_) => {
+            let v: i32 = term
+                .decode()
+                .map_err(|_| "expected integer (millis since midnight)")?;
+            row.set_field(pos, Time::new(v));
+        }
+        DataType::Timestamp(_) => {
+            let (millis, nanos): (i64, i32) = term
+                .decode()
+                .map_err(|_| "expected {millis, nanos} tuple for timestamp")?;
+            let ts = TimestampNtz::from_millis_nanos(millis, nanos).map_err(|e| e.to_string())?;
+            row.set_field(pos, ts);
+        }
+        DataType::TimestampLTz(_) => {
+            let (millis, nanos): (i64, i32) = term
+                .decode()
+                .map_err(|_| "expected {millis, nanos} tuple for timestamp_ltz")?;
+            let ts = TimestampLtz::from_millis_nanos(millis, nanos).map_err(|e| e.to_string())?;
+            row.set_field(pos, ts);
+        }
+        DataType::Float(_) => {
+            let v: f32 = term.decode().map_err(|_| "expected number for float")?;
+            row.set_field(pos, v); // f32 decoding rejects doubles that would overflow to infinity
+        }
+        DataType::Double(_) => {
+            let v: f64 = term.decode().map_err(|_| "expected number for double")?;
+            row.set_field(pos, v);
+        }
+        DataType::String(_) | DataType::Char(_) => {
+            let v: String = term.decode().map_err(|_| "expected string")?;
+            row.set_field(pos, v);
+        }
+        DataType::Decimal(dt) => {
+            let v: String = term.decode().map_err(|_| "expected string for decimal")?;
+            let bd = bigdecimal::BigDecimal::from_str(&v)
+                .map_err(|e| format!("failed to parse decimal '{v}': {e}"))?;
+            let decimal = Decimal::from_big_decimal(bd, dt.precision(), dt.scale())
+                .map_err(|e| e.to_string())?;
+            row.set_field(pos, decimal);
+        }
+        DataType::Bytes(_) | DataType::Binary(_) => {
+            let bin: rustler::Binary = term.decode().map_err(|_| "expected binary")?;
+            row.set_field(pos, bin.as_slice().to_vec()); // copy out of the BEAM binary
+        }
+        _ => return Err(format!("unsupported data type for writing: {data_type:?}")),
+    }
+    Ok(())
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/schema.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/schema.rs
new file mode 100644
index 0000000000..5d61d29daf
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/schema.rs
@@ -0,0 +1,110 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::atoms::to_nif_err;
+use fluss::metadata::{self, DataTypes, Schema, TableDescriptor};
+use rustler::{NifStruct, NifTaggedEnum, ResourceArc};
+
+pub struct TableDescriptorResource {
+    pub inner: TableDescriptor, // the descriptor produced by `table_descriptor_new`
+}
+
+impl std::panic::RefUnwindSafe for TableDescriptorResource {}
+
+#[rustler::resource_impl]
+impl rustler::Resource for TableDescriptorResource {}
+
+/// Fluss data type for NIF interop.
+///
+/// Simple types map to atoms: `:int`, `:string`, etc.
+/// Parameterized types map to tuples: `{:decimal, 10, 2}`, `{:char, 20}`, `{:binary, 16}`.
+#[derive(NifTaggedEnum)]
+pub enum DataType {
+    Boolean,
+    Tinyint,
+    Smallint,
+    Int,
+    Bigint,
+    Float,
+    Double,
+    String,
+    Bytes,
+    Date,
+    Time,
+    Timestamp,
+    TimestampLtz,
+    Decimal(u32, u32), // (precision, scale)
+    Char(u32), // length
+    Binary(usize), // length
+}
+
+fn to_fluss_type(dt: &DataType) -> metadata::DataType { // NIF enum -> `DataTypes` constructor
+    match dt {
+        DataType::Boolean => DataTypes::boolean(),
+        DataType::Tinyint => DataTypes::tinyint(),
+        DataType::Smallint => DataTypes::smallint(),
+        DataType::Int => DataTypes::int(),
+        DataType::Bigint => DataTypes::bigint(),
+        DataType::Float => DataTypes::float(),
+        DataType::Double => DataTypes::double(),
+        DataType::String => DataTypes::string(),
+        DataType::Bytes => DataTypes::bytes(),
+        DataType::Date => DataTypes::date(),
+        DataType::Time => DataTypes::time(),
+        DataType::Timestamp => DataTypes::timestamp(), // no precision argument is passed
+        DataType::TimestampLtz => DataTypes::timestamp_ltz(), // no precision argument is passed
+        DataType::Decimal(precision, scale) => DataTypes::decimal(*precision, *scale),
+        DataType::Char(length) => DataTypes::char(*length),
+        DataType::Binary(length) => DataTypes::binary(*length),
+    }
+}
+
+/// Decoded from `%Fluss.Schema{}` Elixir struct.
+#[derive(NifStruct)]
+#[module = "Fluss.Schema"]
+pub struct NifSchema {
+    pub columns: Vec<(String, DataType)>, // (name, type) pairs, added to the builder in order
+    pub primary_key: Vec<String>, // an empty list means no primary key is set
+}
+
+/// Build a `TableDescriptor` resource from a decoded schema, an optional bucket
+/// count and a list of string properties; builder errors map through `to_nif_err`.
+#[rustler::nif]
+fn table_descriptor_new(
+    schema: NifSchema,
+    bucket_count: Option<i32>,
+    properties: Vec<(String, String)>,
+) -> Result<ResourceArc<TableDescriptorResource>, rustler::Error> {
+    let NifSchema { columns, primary_key } = schema;
+    let mut schema_builder = columns
+        .iter()
+        .fold(Schema::builder(), |b, (name, dt)| b.column(name, to_fluss_type(dt)));
+    if !primary_key.is_empty() {
+        schema_builder = schema_builder.primary_key(primary_key);
+    }
+    let built_schema = schema_builder.build().map_err(to_nif_err)?;
+
+    let mut builder = TableDescriptor::builder().schema(built_schema);
+    if let Some(count) = bucket_count {
+        builder = builder.distributed_by(Some(count), vec![]);
+    }
+    for (key, value) in properties {
+        builder = builder.property(&key, &value);
+    }
+    let inner = builder.build().map_err(to_nif_err)?;
+    Ok(ResourceArc::new(TableDescriptorResource { inner }))
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/table.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/table.rs
new file mode 100644
index 0000000000..d48ff7ab29
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/table.rs
@@ -0,0 +1,89 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::async_nif;
+use crate::connection::ConnectionResource;
+use fluss::client::{FlussConnection, FlussTable, Metadata};
+use fluss::error::Error;
+use fluss::metadata::{Column, TableInfo, TablePath};
+use rustler::{Env, ResourceArc, Term};
+use std::sync::Arc;
+
+/// Holds the data needed to reconstruct `FlussTable` (which has a lifetime
+/// tied to `FlussConnection`). We store the `Arc<FlussConnection>` to keep
+/// it alive and reconstruct short-lived `FlussTable` instances on demand.
+pub struct TableResource {
+    pub connection: Arc<FlussConnection>, // borrowed by every rebuilt `FlussTable`
+    pub metadata: Arc<Metadata>, // cloned into each rebuilt `FlussTable`
+    pub table_info: TableInfo, // cloned into each rebuilt `FlussTable`
+}
+
+impl std::panic::RefUnwindSafe for TableResource {}
+
+#[rustler::resource_impl]
+impl rustler::Resource for TableResource {}
+
+impl TableResource {
+    /// Columns of the schema held in `table_info`.
+    pub fn columns(&self) -> &[Column] {
+        self.table_info.schema.columns()
+    }
+
+    /// Build a `FlussTable` from the stored connection and clones of the metadata
+    /// and table info, hand it to `f`, and return whatever `f` produces. The table
+    /// is dropped when the call returns.
+    pub fn with_table<T>(&self, f: impl FnOnce(&FlussTable<'_>) -> T) -> T {
+        let (metadata, info) = (self.metadata.clone(), self.table_info.clone());
+        f(&FlussTable::new(&self.connection, metadata, info))
+    }
+}
+
+#[rustler::nif]
+fn table_get<'a>(
+    env: Env<'a>,
+    conn: ResourceArc<ConnectionResource>,
+    database_name: String,
+    table_name: String,
+) -> Term<'a> {
+    let conn_arc = conn.inner.clone(); // owned handle that the `async move` block can take
+    async_nif::spawn_task_with_result(env, async move {
+        let path = TablePath::new(&database_name, &table_name);
+        // Inner scope: presumably ends `table`'s borrow of `conn_arc` before it is moved below.
+        let (metadata, table_info) = {
+            let table = conn_arc.get_table(&path).await?;
+            (table.metadata().clone(), table.get_table_info().clone())
+        };
+        Ok::<_, Error>(ResourceArc::new(TableResource {
+            connection: conn_arc, metadata, table_info,
+        }))
+    })
+}
+
+#[rustler::nif]
+fn table_has_primary_key(table: ResourceArc<TableResource>) -> bool {
+    table.table_info.has_primary_key() // answered from the stored `TableInfo`
+}
+
+#[rustler::nif]
+fn table_column_names(table: ResourceArc<TableResource>) -> Vec<String> {
+    // Copy the names out in the order `columns()` yields them.
+    let columns = table.columns();
+    let mut names = Vec::with_capacity(columns.len());
+    names.extend(columns.iter().map(|column| column.name().to_owned()));
+    names
+}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/write_handle.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/write_handle.rs
new file mode 100644
index 0000000000..e3b325d0bf
--- /dev/null
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/write_handle.rs
@@ -0,0 +1,47 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::async_nif;
+use fluss::client::WriteResultFuture;
+use rustler::{Env, ResourceArc, Term};
+use std::sync::Mutex;
+
+pub struct WriteHandleResource {
+    inner: Mutex<Option<WriteResultFuture>>, // `None` once `write_handle_wait` has taken it
+}
+
+impl std::panic::RefUnwindSafe for WriteHandleResource {}
+
+#[rustler::resource_impl]
+impl rustler::Resource for WriteHandleResource {}
+
+impl WriteHandleResource {
+    pub fn new(future: WriteResultFuture) -> Self { // wraps the not-yet-awaited future
+        Self {
+            inner: Mutex::new(Some(future)),
+        }
+    }
+}
+
+#[rustler::nif]
+fn write_handle_wait<'a>(env: Env<'a>, handle: ResourceArc<WriteHandleResource>) -> Term<'a> {
+    let pending = handle.inner.lock().unwrap().take(); // guard dropped here, before spawning
+    let Some(write_future) = pending else {
+        return async_nif::send_error(env, "WriteHandle already consumed");
+    };
+    async_nif::spawn_task(env, write_future)
+}
diff --git a/fluss-rust/bindings/elixir/test/fluss_test.exs b/fluss-rust/bindings/elixir/test/fluss_test.exs
new file mode 100644
index 0000000000..3eee273482
--- /dev/null
+++ b/fluss-rust/bindings/elixir/test/fluss_test.exs
@@ -0,0 +1,66 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule FlussTest do
+  use ExUnit.Case
+
+  describe "TableDescriptor" do # no explicit assertions; presumably new! raises on failure
+    test "creates descriptor from schema" do
+      Fluss.Schema.new()
+      |> Fluss.Schema.column("id", :int)
+      |> Fluss.TableDescriptor.new!()
+    end
+
+    test "creates descriptor with bucket count" do
+      Fluss.Schema.new()
+      |> Fluss.Schema.column("id", :int)
+      |> Fluss.TableDescriptor.new!(bucket_count: 3)
+    end
+
+    test "accepts all simple data types" do # one column per atom-named type
+      Fluss.Schema.new()
+      |> Fluss.Schema.column("a", :boolean)
+      |> Fluss.Schema.column("b", :tinyint)
+      |> Fluss.Schema.column("c", :smallint)
+      |> Fluss.Schema.column("d", :int)
+      |> Fluss.Schema.column("e", :bigint)
+      |> Fluss.Schema.column("f", :float)
+      |> Fluss.Schema.column("g", :double)
+      |> Fluss.Schema.column("h", :string)
+      |> Fluss.Schema.column("i", :bytes)
+      |> Fluss.Schema.column("j", :date)
+      |> Fluss.Schema.column("k", :time)
+      |> Fluss.Schema.column("l", :timestamp)
+      |> Fluss.Schema.column("m", :timestamp_ltz)
+      |> Fluss.TableDescriptor.new!()
+    end
+
+    test "accepts parameterized data types" do # tuple-shaped types carry their parameters
+      Fluss.Schema.new()
+      |> Fluss.Schema.column("amount", {:decimal, 10, 2})
+      |> Fluss.Schema.column("code", {:char, 5})
+      |> Fluss.Schema.column("data", {:binary, 16})
+      |> Fluss.TableDescriptor.new!()
+    end
+  end
+
+  describe "earliest_offset/0" do
+    test "returns -2" do
+      assert Fluss.earliest_offset() == -2
+    end
+  end
+end
diff --git a/fluss-rust/bindings/elixir/test/integration/log_table_test.exs b/fluss-rust/bindings/elixir/test/integration/log_table_test.exs
new file mode 100644
index 0000000000..b3041b9587
--- /dev/null
+++ b/fluss-rust/bindings/elixir/test/integration/log_table_test.exs
@@ -0,0 +1,413 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.Integration.LogTableTest do
+  use ExUnit.Case, async: false
+
+  alias Fluss.Test.Cluster
+
+  @moduletag :integration
+
+  @database "fluss"
+
+  setup_all do
+    case Cluster.ensure_started() do
+      {:ok, servers} ->
+        config = Fluss.Config.new(servers)
+
+        # Wait for cluster to be fully ready (connection + admin working)
+        {conn, admin} = connect_with_retry(config, 90)
+
+        %{conn: conn, admin: admin, config: config}
+
+      {:error, reason} ->
+        raise "Failed to start Fluss cluster: #{reason}"
+    end
+  end
+
+  describe "append and scan" do
+    test "append rows and scan with log scanner", %{conn: conn, admin: admin} do
+      table_name = "ex_test_append_and_scan_#{:rand.uniform(100_000)}"
+      cleanup_table(admin, table_name)
+
+      schema =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("c1", :int)
+        |> Fluss.Schema.column("c2", :string)
+
+      descriptor = Fluss.TableDescriptor.new!(schema)
+      :ok = Fluss.Admin.create_table(admin, @database, table_name, descriptor, false)
+
+      table = Fluss.Table.get!(conn, @database, table_name)
+      writer = Fluss.AppendWriter.new!(table)
+
+      # Append 6 rows
+      for {c1, c2} <- [{1, "a1"}, {2, "a2"}, {3, "a3"}, {4, "a4"}, {5, "a5"}, {6, "a6"}] do
+        {:ok, _} = Fluss.AppendWriter.append(writer, [c1, c2])
+      end
+
+      :ok = Fluss.AppendWriter.flush(writer)
+
+      # Scan all records
+      scanner = Fluss.LogScanner.new!(table)
+      :ok = Fluss.LogScanner.subscribe(scanner, 0, Fluss.earliest_offset())
+
+      records = poll_records(scanner, 6)
+
+      assert length(records) == 6
+
+      sorted = Enum.sort_by(records, fn r -> r[:row][:c1] end)
+
+      for {record, i} <- Enum.with_index(sorted, 1) do
+        assert record[:row][:c1] == i
+        assert record[:row][:c2] == "a#{i}"
+        assert record[:change_type] == :append_only
+      end
+
+      # Unsubscribe should not error
+      :ok = Fluss.LogScanner.unsubscribe(scanner, 0)
+
+      cleanup_table(admin, table_name)
+    end
+
+    test "append with nil values", %{conn: conn, admin: admin} do
+      table_name = "ex_test_append_nil_#{:rand.uniform(100_000)}"
+      cleanup_table(admin, table_name)
+
+      schema =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("id", :int)
+        |> Fluss.Schema.column("name", :string)
+
+      descriptor = Fluss.TableDescriptor.new!(schema)
+      :ok = Fluss.Admin.create_table(admin, @database, table_name, descriptor, false)
+
+      table = Fluss.Table.get!(conn, @database, table_name)
+      writer = Fluss.AppendWriter.new!(table)
+
+      {:ok, _} = Fluss.AppendWriter.append(writer, [1, nil])
+      {:ok, _} = Fluss.AppendWriter.append(writer, [2, "present"])
+      :ok = Fluss.AppendWriter.flush(writer)
+
+      scanner = Fluss.LogScanner.new!(table)
+      :ok = Fluss.LogScanner.subscribe(scanner, 0, Fluss.earliest_offset())
+
+      records = poll_records(scanner, 2)
+      assert length(records) == 2
+
+      sorted = Enum.sort_by(records, fn r -> r[:row][:id] end)
+      assert Enum.at(sorted, 0)[:row][:name] == nil
+      assert Enum.at(sorted, 1)[:row][:name] == "present"
+
+      cleanup_table(admin, table_name)
+    end
+  end
+
+  describe "multiple data types" do
+    test "tinyint, smallint, int, bigint, float, double, string, boolean", %{
+      conn: conn,
+      admin: admin
+    } do
+      table_name = "ex_test_data_types_#{:rand.uniform(100_000)}"
+      cleanup_table(admin, table_name)
+
+      schema =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("a_tinyint", :tinyint)
+        |> Fluss.Schema.column("b_smallint", :smallint)
+        |> Fluss.Schema.column("c_int", :int)
+        |> Fluss.Schema.column("d_bigint", :bigint)
+        |> Fluss.Schema.column("e_float", :float)
+        |> Fluss.Schema.column("f_double", :double)
+        |> Fluss.Schema.column("g_string", :string)
+        |> Fluss.Schema.column("h_bool", :boolean)
+
+      descriptor = Fluss.TableDescriptor.new!(schema)
+      :ok = Fluss.Admin.create_table(admin, @database, table_name, descriptor, false)
+
+      table = Fluss.Table.get!(conn, @database, table_name)
+      writer = Fluss.AppendWriter.new!(table)
+
+      {:ok, _} =
+        Fluss.AppendWriter.append(writer, [
+          127,
+          32_000,
+          42,
+          1_000_000_000_000,
+          3.14,
+          2.718281828,
+          "hello",
+          true
+        ])
+
+      {:ok, _} =
+        Fluss.AppendWriter.append(writer, [-128, -32_000, -1, -999, 0.0, -1.5, "", false])
+
+      :ok = Fluss.AppendWriter.flush(writer)
+
+      scanner = Fluss.LogScanner.new!(table)
+      :ok = Fluss.LogScanner.subscribe(scanner, 0, Fluss.earliest_offset())
+
+      records = poll_records(scanner, 2)
+      assert length(records) == 2
+
+      sorted = Enum.sort_by(records, fn r -> r[:row][:c_int] end)
+      row1 = Enum.at(sorted, 0)[:row]
+      row2 = Enum.at(sorted, 1)[:row]
+
+      assert row1[:a_tinyint] == -128
+      assert row1[:b_smallint] == -32_000
+      assert row1[:c_int] == -1
+      assert row1[:d_bigint] == -999
+      assert row1[:g_string] == ""
+      assert row1[:h_bool] == false
+
+      assert row2[:a_tinyint] == 127
+      assert row2[:b_smallint] == 32_000
+      assert row2[:c_int] == 42
+      assert row2[:d_bigint] == 1_000_000_000_000
+      assert row2[:g_string] == "hello"
+      assert row2[:h_bool] == true
+
+      cleanup_table(admin, table_name)
+    end
+  end
+
+  describe "subscribe_buckets" do
+    test "subscribe to multiple buckets at once", %{conn: conn, admin: admin} do
+      table_name = "ex_test_subscribe_buckets_#{:rand.uniform(100_000)}"
+      cleanup_table(admin, table_name)
+
+      schema =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("id", :int)
+        |> Fluss.Schema.column("val", :string)
+
+      descriptor = Fluss.TableDescriptor.new!(schema, bucket_count: 3)
+      :ok = Fluss.Admin.create_table(admin, @database, table_name, descriptor, false)
+
+      table = Fluss.Table.get!(conn, @database, table_name)
+      writer = Fluss.AppendWriter.new!(table)
+
+      for i <- 1..9 do
+        {:ok, _} = Fluss.AppendWriter.append(writer, [i, "v#{i}"])
+      end
+
+      :ok = Fluss.AppendWriter.flush(writer)
+
+      scanner = Fluss.LogScanner.new!(table)
+      earliest = Fluss.earliest_offset()
+
+      :ok =
+        Fluss.LogScanner.subscribe_buckets(scanner, [
+          {0, earliest},
+          {1, earliest},
+          {2, earliest}
+        ])
+
+      records = poll_records(scanner, 9)
+      assert length(records) == 9
+
+      ids = records |> Enum.map(fn r -> r[:row][:id] end) |> Enum.sort()
+      assert ids == Enum.to_list(1..9)
+
+      cleanup_table(admin, table_name)
+    end
+  end
+
+  describe "admin operations" do
+    test "create and drop database", %{admin: admin} do
+      db_name = "ex_test_db_#{:rand.uniform(100_000)}"
+      :ok = Fluss.Admin.create_database(admin, db_name, true)
+
+      {:ok, databases} = Fluss.Admin.list_databases(admin)
+      assert db_name in databases
+
+      :ok = Fluss.Admin.drop_database(admin, db_name, true)
+    end
+
+    test "list tables", %{admin: admin} do
+      table_name = "ex_test_list_tables_#{:rand.uniform(100_000)}"
+      cleanup_table(admin, table_name)
+
+      schema =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("id", :int)
+
+      descriptor = Fluss.TableDescriptor.new!(schema)
+      :ok = Fluss.Admin.create_table(admin, @database, table_name, descriptor, false)
+
+      {:ok, tables} = Fluss.Admin.list_tables(admin, @database)
+      assert table_name in tables
+
+      cleanup_table(admin, table_name)
+    end
+
+    test "table metadata", %{conn: conn, admin: admin} do
+      table_name = "ex_test_table_meta_#{:rand.uniform(100_000)}"
+      cleanup_table(admin, table_name)
+
+      schema =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("id", :int)
+        |> Fluss.Schema.column("name", :string)
+
+      descriptor = Fluss.TableDescriptor.new!(schema)
+      :ok = Fluss.Admin.create_table(admin, @database, table_name, descriptor, false)
+
+      table = Fluss.Table.get!(conn, @database, table_name)
+      assert Fluss.Table.has_primary_key?(table) == false
+      assert Fluss.Table.column_names(table) == ["id", "name"]
+
+      cleanup_table(admin, table_name)
+    end
+  end
+
+  describe "scan from offset" do
+    test "subscribe from specific offset skips earlier records", %{conn: conn, admin: admin} do
+      table_name = "ex_test_scan_offset_#{:rand.uniform(100_000)}"
+      cleanup_table(admin, table_name)
+
+      schema =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("id", :int)
+
+      descriptor = Fluss.TableDescriptor.new!(schema)
+      :ok = Fluss.Admin.create_table(admin, @database, table_name, descriptor, false)
+
+      table = Fluss.Table.get!(conn, @database, table_name)
+      writer = Fluss.AppendWriter.new!(table)
+      # Append five rows with ids 1..5, then flush them in one go.
+      for i <- 1..5 do
+        {:ok, _} = Fluss.AppendWriter.append(writer, [i])
+      end
+
+      :ok = Fluss.AppendWriter.flush(writer)
+
+      # Subscribe from offset 3 (the 0 is presumably the bucket id), skipping the first 3 records
+      scanner = Fluss.LogScanner.new!(table)
+      :ok = Fluss.LogScanner.subscribe(scanner, 0, 3)
+
+      records = poll_records(scanner, 2)
+      assert length(records) == 2
+      # Only the rows with ids 4 and 5 are expected back.
+      ids = records |> Enum.map(fn r -> r[:row][:id] end) |> Enum.sort()
+      assert ids == [4, 5]
+
+      cleanup_table(admin, table_name)
+    end
+  end
+
+  describe "multiple flushes" do
+    test "append, flush, append more, flush, scan all", %{conn: conn, admin: admin} do
+      table_name = "ex_test_multi_flush_#{:rand.uniform(100_000)}"
+      cleanup_table(admin, table_name)
+
+      # Rows carry an id plus a label naming the flush round they were written in.
+      descriptor =
+        Fluss.Schema.new()
+        |> Fluss.Schema.column("id", :int)
+        |> Fluss.Schema.column("batch", :string)
+        |> Fluss.TableDescriptor.new!()
+
+      :ok = Fluss.Admin.create_table(admin, @database, table_name, descriptor, false)
+
+      table = Fluss.Table.get!(conn, @database, table_name)
+      writer = Fluss.AppendWriter.new!(table)
+
+      # Round one: ids 1 and 2, flushed on their own.
+      {:ok, _} = Fluss.AppendWriter.append(writer, [1, "first"])
+      {:ok, _} = Fluss.AppendWriter.append(writer, [2, "first"])
+      :ok = Fluss.AppendWriter.flush(writer)
+
+      # Round two: ids 3 and 4, flushed separately.
+      {:ok, _} = Fluss.AppendWriter.append(writer, [3, "second"])
+      {:ok, _} = Fluss.AppendWriter.append(writer, [4, "second"])
+      :ok = Fluss.AppendWriter.flush(writer)
+
+      # Scan from the earliest offset so rows from both flushes are read back.
+      scanner = Fluss.LogScanner.new!(table)
+      :ok = Fluss.LogScanner.subscribe(scanner, 0, Fluss.earliest_offset())
+
+      rows = poll_records(scanner, 4)
+      assert length(rows) == 4
+
+      # Ordered by id, each label must match the round that wrote the row.
+      labels = rows |> Enum.sort_by(& &1[:row][:id]) |> Enum.map(& &1[:row][:batch])
+      assert labels == ["first", "first", "second", "second"]
+
+      cleanup_table(admin, table_name)
+    end
+  end
+
+  # Gathers records from `scanner` until `expected_count` have arrived or `timeout_ms` runs out.
+  defp poll_records(scanner, expected_count, timeout_ms \\ 10_000) do
+    do_poll(scanner, expected_count, System.monotonic_time(:millisecond) + timeout_ms, [])
+  end
+
+  # Recursive worker behind poll_records/3: returns `acc` once it holds at least
+  # `expected_count` records, the deadline has passed, or no poll reply arrives in time.
+  defp do_poll(_scanner, expected_count, _deadline, acc) when length(acc) >= expected_count,
+    do: acc
+
+  defp do_poll(scanner, expected_count, deadline, acc) do
+    time_left = deadline - System.monotonic_time(:millisecond)
+
+    if time_left > 0 do
+      :ok = Fluss.LogScanner.poll(scanner, min(5_000, time_left))
+
+      receive do
+        {:fluss_poll_error, reason} ->
+          IO.warn("poll error during test: #{inspect(reason)}")
+          do_poll(scanner, expected_count, deadline, acc)
+
+        {:fluss_records, batch} ->
+          do_poll(scanner, expected_count, deadline, acc ++ batch)
+      after
+        min(6_000, time_left) -> acc
+      end
+    else
+      acc
+    end
+  end
+
+  # Drops `table_name` from the test database; the result is deliberately left unmatched.
+  defp cleanup_table(admin, table_name),
+    do: Fluss.Admin.drop_table(admin, @database, table_name, true)
+
+  # Connects to the cluster, retrying until `timeout_s` seconds have passed.
+  defp connect_with_retry(config, timeout_s) do
+    do_connect_retry(config, System.monotonic_time(:second) + timeout_s, nil)
+  end
+
+  # Tries to connect; on any exception sleeps 2s and retries until `deadline`, then raises.
+  defp do_connect_retry(config, deadline, last_error) do
+    if System.monotonic_time(:second) >= deadline,
+      do: raise("Could not connect to Fluss cluster: #{inspect(last_error)}")
+
+    try do
+      conn = Fluss.Connection.new!(config)
+      admin = Fluss.Admin.new!(conn)
+      {:ok, _databases} = Fluss.Admin.list_databases(admin)
+      {conn, admin}
+    rescue
+      error ->
+        Process.sleep(2_000)
+        do_connect_retry(config, deadline, error)
+    end
+  end
+end
diff --git a/fluss-rust/bindings/elixir/test/support/cluster.ex b/fluss-rust/bindings/elixir/test/support/cluster.ex
new file mode 100644
index 0000000000..59598b4ebd
--- /dev/null
+++ b/fluss-rust/bindings/elixir/test/support/cluster.ex
@@ -0,0 +1,211 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.Test.Cluster do
+  @moduledoc false
+  # Test-only helper that starts and stops a Docker-based Fluss cluster (ZooKeeper, coordinator, tablet server).
+  @fluss_image "apache/fluss"
+  @fluss_version "0.9.0-incubating"
+
+  @network_name "fluss-elixir-test-network"
+  @zookeeper_name "zookeeper-elixir-test"
+  @coordinator_name "coordinator-server-elixir-test"
+  @tablet_server_name "tablet-server-elixir-test"
+
+  # Fixed host ports published by the containers (same ports as the Python/C++ integration tests).
+  @coordinator_sasl_port 9123
+  @coordinator_plain_port 9223
+  @tablet_sasl_port 9124
+  @tablet_plain_port 9224
+  # Plaintext bootstrap address of the locally started cluster.
+  def bootstrap_servers, do: "127.0.0.1:#{@coordinator_plain_port}"
+  # Returns {:ok, servers}, taken from FLUSS_BOOTSTRAP_SERVERS when set, else from a local cluster ({:error, msg} if it fails to come up).
+  def ensure_started do
+    case System.get_env("FLUSS_BOOTSTRAP_SERVERS") do
+      nil -> start_cluster()
+      servers -> {:ok, servers}
+    end
+  end
+  # Force-removes the three containers and the network; docker output and exit codes are ignored.
+  def stop do
+    for name <- [@tablet_server_name, @coordinator_name, @zookeeper_name] do
+      System.cmd("docker", ["rm", "-f", name], stderr_to_stdout: true)
+    end
+
+    System.cmd("docker", ["network", "rm", @network_name], stderr_to_stdout: true)
+    :ok
+  end
+  # Reuses whatever already listens on the coordinator's plaintext port, otherwise starts a cluster.
+  defp start_cluster do
+    if port_open?(@coordinator_plain_port) do
+      IO.puts("Reusing existing Fluss cluster on port #{@coordinator_plain_port}")
+      {:ok, bootstrap_servers()}
+    else
+      do_start_cluster()
+    end
+  end
+  # Launches ZooKeeper, the coordinator and one tablet server, then waits for the plaintext ports.
+  defp do_start_cluster do
+    IO.puts("Starting Fluss cluster via Docker...")
+
+    # Remove any leftover containers from previous runs
+    for name <- [@tablet_server_name, @coordinator_name, @zookeeper_name] do
+      System.cmd("docker", ["rm", "-f", name], stderr_to_stdout: true)
+    end
+
+    System.cmd("docker", ["network", "create", @network_name], stderr_to_stdout: true)
+    # JAAS configuration defining two SASL/PLAIN users: admin and alice.
+    sasl_jaas =
+      ~s(org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required user_admin="admin-secret" user_alice="alice-secret";)
+    # Inside the containers CLIENT (SASL) binds 9123 and PLAIN_CLIENT binds 9223; advertised listeners use the host ports.
+    coordinator_props =
+      Enum.join(
+        [
+          "zookeeper.address: #{@zookeeper_name}:2181",
+          "bind.listeners: INTERNAL://#{@coordinator_name}:0, CLIENT://#{@coordinator_name}:9123, PLAIN_CLIENT://#{@coordinator_name}:9223",
+          "advertised.listeners: CLIENT://localhost:#{@coordinator_sasl_port}, PLAIN_CLIENT://localhost:#{@coordinator_plain_port}",
+          "internal.listener.name: INTERNAL",
+          "security.protocol.map: CLIENT:sasl",
+          "security.sasl.enabled.mechanisms: plain",
+          "security.sasl.plain.jaas.config: #{sasl_jaas}",
+          "netty.server.num-network-threads: 1",
+          "netty.server.num-worker-threads: 3"
+        ],
+        "\n"
+      )
+
+    tablet_props =
+      Enum.join(
+        [
+          "zookeeper.address: #{@zookeeper_name}:2181",
+          "bind.listeners: INTERNAL://#{@tablet_server_name}:0, CLIENT://#{@tablet_server_name}:9123, PLAIN_CLIENT://#{@tablet_server_name}:9223",
+          "advertised.listeners: CLIENT://localhost:#{@tablet_sasl_port}, PLAIN_CLIENT://localhost:#{@tablet_plain_port}",
+          "internal.listener.name: INTERNAL",
+          "security.protocol.map: CLIENT:sasl",
+          "security.sasl.enabled.mechanisms: plain",
+          "security.sasl.plain.jaas.config: #{sasl_jaas}",
+          "tablet-server.id: 0",
+          "netty.server.num-network-threads: 1",
+          "netty.server.num-worker-threads: 3"
+        ],
+        "\n"
+      )
+
+    docker_run([
+      "--name",
+      @zookeeper_name,
+      "--network",
+      @network_name,
+      "-d",
+      "zookeeper:3.9.2"
+    ])
+
+    docker_run([
+      "--name",
+      @coordinator_name,
+      "--network",
+      @network_name,
+      "-p",
+      "#{@coordinator_sasl_port}:9123",
+      "-p",
+      "#{@coordinator_plain_port}:9223",
+      "-e",
+      "FLUSS_PROPERTIES=#{coordinator_props}",
+      "-d",
+      "#{@fluss_image}:#{@fluss_version}",
+      "coordinatorServer"
+    ])
+
+    docker_run([
+      "--name",
+      @tablet_server_name,
+      "--network",
+      @network_name,
+      "-p",
+      "#{@tablet_sasl_port}:9123",
+      "-p",
+      "#{@tablet_plain_port}:9223",
+      "-e",
+      "FLUSS_PROPERTIES=#{tablet_props}",
+      "-d",
+      "#{@fluss_image}:#{@fluss_version}",
+      "tabletServer"
+    ])
+    # Readiness is judged only by the two plaintext ports accepting TCP connections (90s budget).
+    all_ports = [@coordinator_plain_port, @tablet_plain_port]
+
+    if wait_for_ports(all_ports, 90) do
+      IO.puts("Fluss cluster started successfully.")
+      {:ok, bootstrap_servers()}
+    else
+      {:error, "Cluster ports did not become ready within timeout"}
+    end
+  end
+  # Runs `docker run` with `args`; a non-zero exit code is only printed, never raised.
+  defp docker_run(args) do
+    {output, code} = System.cmd("docker", ["run" | args], stderr_to_stdout: true)
+
+    if code != 0 do
+      IO.puts("Docker run warning (code #{code}): #{output}")
+    end
+  end
+  # Waits for each port in turn under one shared deadline; true only if all of them opened in time.
+  defp wait_for_ports(ports, timeout_s) do
+    deadline = System.monotonic_time(:second) + timeout_s
+
+    Enum.all?(ports, fn port ->
+      remaining = deadline - System.monotonic_time(:second)
+      remaining > 0 and wait_for_port(port, remaining)
+    end)
+  end
+  # Retries a TCP connect to localhost:`port`, sleeping 1s after each failure, until success or `timeout_s` elapses.
+  defp wait_for_port(port, timeout_s) do
+    deadline = System.monotonic_time(:second) + timeout_s
+
+    Stream.repeatedly(fn ->
+      case :gen_tcp.connect(~c"localhost", port, [], 1000) do
+        {:ok, socket} ->
+          :gen_tcp.close(socket)
+          :ok
+
+        {:error, _} ->
+          Process.sleep(1000)
+          :retry
+      end
+    end)
+    |> Enum.reduce_while(false, fn
+      :ok, _acc ->
+        {:halt, true}
+
+      :retry, _acc ->
+        if System.monotonic_time(:second) >= deadline,
+          do: {:halt, false},
+          else: {:cont, false}
+    end)
+  end
+  # Single connect attempt (1s timeout): true if something accepts connections on localhost:`port`.
+  defp port_open?(port) do
+    case :gen_tcp.connect(~c"localhost", port, [], 1000) do
+      {:ok, socket} ->
+        :gen_tcp.close(socket)
+        true
+
+      {:error, _} ->
+        false
+    end
+  end
+end
diff --git a/fluss-rust/bindings/elixir/test/test_helper.exs b/fluss-rust/bindings/elixir/test/test_helper.exs
new file mode 100644
index 0000000000..b15b1f44a8
--- /dev/null
+++ b/fluss-rust/bindings/elixir/test/test_helper.exs
@@ -0,0 +1,27 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+# Exclude integration tests by default (they need a Docker cluster).
+# Run with: mix test --include integration
+ExUnit.start(exclude: [:integration])
+
+# Stop Docker containers after all tests finish (matches Python's pytest_unconfigure); skipped when docker is not installed.
+ExUnit.after_suite(fn _ ->
+  if is_nil(System.get_env("FLUSS_BOOTSTRAP_SERVERS")) and System.find_executable("docker") do
+    Fluss.Test.Cluster.stop()
+  end
+end)

From ce1d440fd93f52e9e8251f0779527ba92e721bb1 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Fri, 17 Apr 2026 12:24:30 +0100
Subject: [PATCH 235/287] [ci/cd] fix python tests with more strict scoping
 (#494)

---
 fluss-rust/bindings/python/pyproject.toml   |  4 ++--
 fluss-rust/bindings/python/test/conftest.py | 16 ++++++++++------
 2 files changed, 12 insertions(+), 8 deletions(-)

diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index 9163835fe3..22e641881b 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -95,8 +95,8 @@ known-first-party = ["fluss"]
 
 [tool.pytest.ini_options]
 asyncio_mode = "auto"
-asyncio_default_fixture_loop_scope = "session"
-timeout = 30
+asyncio_default_fixture_loop_scope = "function"
+timeout = 120
 
 [tool.mypy]
 python_version = "3.9"
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
index 7da0f3d978..47c928077a 100644
--- a/fluss-rust/bindings/python/test/conftest.py
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -124,12 +124,16 @@ def fluss_cluster():
     yield (plaintext_addr, sasl_addr or plaintext_addr)
 
 
-@pytest_asyncio.fixture(scope="session")
+_cached_connection = None
+
+
+@pytest_asyncio.fixture
 async def connection(fluss_cluster):
-    plaintext_addr, _sasl_addr = fluss_cluster
-    conn = await _connect(plaintext_addr)
-    yield conn
-    conn.close()
+    global _cached_connection
+    if _cached_connection is None:
+        plaintext_addr, _sasl_addr = fluss_cluster
+        _cached_connection = await _connect(plaintext_addr)
+    yield _cached_connection
 
 
 @pytest.fixture(scope="session")
@@ -144,6 +148,6 @@ def plaintext_bootstrap_servers(fluss_cluster):
     return plaintext_addr
 
 
-@pytest_asyncio.fixture(scope="session")
+@pytest_asyncio.fixture
 async def admin(connection):
     return connection.get_admin()

From 5e13f46fccf406e565bdb4c478a41a4538b93f90 Mon Sep 17 00:00:00 2001
From: SkylerLin <44233950+linguoxuan@users.noreply.github.com>
Date: Fri, 17 Apr 2026 22:23:44 +0800
Subject: [PATCH 236/287] feat: support batch lookup (#216)

---------

Co-authored-by: Anton Borisov <anton.borisov@fresha.com>
Co-authored-by: Keith Lee <leekei@apache.org>
---
 fluss-rust/bindings/cpp/include/fluss.hpp     |  10 +
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |   5 +
 fluss-rust/bindings/cpp/src/lib.rs            |  10 +
 fluss-rust/bindings/python/src/lookup.rs      |  21 +-
 .../crates/fluss/src/client/connection.rs     |  27 +
 .../fluss/src/client/lookup/lookup_client.rs  | 203 +++++++
 .../fluss/src/client/lookup/lookup_query.rs   |  91 +++
 .../fluss/src/client/lookup/lookup_queue.rs   | 138 +++++
 .../fluss/src/client/lookup/lookup_sender.rs  | 548 ++++++++++++++++++
 .../crates/fluss/src/client/lookup/mod.rs     |  39 ++
 fluss-rust/crates/fluss/src/client/mod.rs     |   2 +
 .../crates/fluss/src/client/table/lookup.rs   |  87 +--
 .../crates/fluss/src/client/table/mod.rs      |   3 +-
 fluss-rust/crates/fluss/src/config.rs         |  37 ++
 .../crates/fluss/src/rpc/message/lookup.rs    |  24 +
 .../fluss/tests/integration/kv_table.rs       | 245 ++++++++
 16 files changed, 1423 insertions(+), 67 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/lookup/lookup_client.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/lookup/lookup_query.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/lookup/lookup_queue.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
 create mode 100644 fluss-rust/crates/fluss/src/client/lookup/mod.rs

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 768db0f740..1937cf276a 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -1039,6 +1039,16 @@ struct Configuration {
     std::string security_sasl_username;
     // SASL password (required when security_protocol is "sasl")
     std::string security_sasl_password;
+    // Maximum number of pending lookup operations
+    size_t lookup_queue_size{25600};
+    // Maximum number of lookup operations merged into one lookup request
+    size_t lookup_max_batch_size{128};
+    // Maximum time to wait for the lookup batch to fill (in milliseconds)
+    uint64_t lookup_batch_timeout_ms{100};
+    // Maximum number of unacknowledged lookup requests
+    size_t lookup_max_inflight_requests{128};
+    // Maximum number of lookup retries
+    int32_t lookup_max_retries{std::numeric_limits<int32_t>::max()};
 };
 
 class Connection {
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index fcd4e1dcae..3fe4532a62 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -79,6 +79,11 @@ inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi_config.security_sasl_mechanism = rust::String(config.security_sasl_mechanism);
     ffi_config.security_sasl_username = rust::String(config.security_sasl_username);
     ffi_config.security_sasl_password = rust::String(config.security_sasl_password);
+    ffi_config.lookup_queue_size = config.lookup_queue_size;
+    ffi_config.lookup_max_batch_size = config.lookup_max_batch_size;
+    ffi_config.lookup_batch_timeout_ms = config.lookup_batch_timeout_ms;
+    ffi_config.lookup_max_inflight_requests = config.lookup_max_inflight_requests;
+    ffi_config.lookup_max_retries = config.lookup_max_retries;
     return ffi_config;
 }
 
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 778fef30e2..51efb3c157 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -62,6 +62,11 @@ mod ffi {
         security_sasl_mechanism: String,
         security_sasl_username: String,
         security_sasl_password: String,
+        lookup_queue_size: usize,
+        lookup_max_batch_size: usize,
+        lookup_batch_timeout_ms: u64,
+        lookup_max_inflight_requests: usize,
+        lookup_max_retries: i32,
     }
 
     struct FfiResult {
@@ -689,6 +694,11 @@ fn new_connection(config: &ffi::FfiConfig) -> ffi::FfiPtrResult {
         security_sasl_mechanism: config.security_sasl_mechanism.to_string(),
         security_sasl_username: config.security_sasl_username.to_string(),
         security_sasl_password: config.security_sasl_password.to_string(),
+        lookup_queue_size: config.lookup_queue_size,
+        lookup_max_batch_size: config.lookup_max_batch_size,
+        lookup_batch_timeout_ms: config.lookup_batch_timeout_ms,
+        lookup_max_inflight_requests: config.lookup_max_inflight_requests,
+        lookup_max_retries: config.lookup_max_retries,
     };
 
     let conn = RUNTIME.block_on(async { fcore::client::FlussConnection::new(config_core).await });
diff --git a/fluss-rust/bindings/python/src/lookup.rs b/fluss-rust/bindings/python/src/lookup.rs
index e2edbf415a..09465263b5 100644
--- a/fluss-rust/bindings/python/src/lookup.rs
+++ b/fluss-rust/bindings/python/src/lookup.rs
@@ -94,15 +94,18 @@ impl Lookuper {
         metadata: Arc<fcore::client::Metadata>,
         table_info: fcore::metadata::TableInfo,
     ) -> PyResult<Self> {
-        let fluss_table = fcore::client::FlussTable::new(connection, metadata, table_info.clone());
-
-        let table_lookup = fluss_table
-            .new_lookup()
-            .map_err(|e| FlussError::from_core_error(&e))?;
-
-        let lookuper = table_lookup
-            .create_lookuper()
-            .map_err(|e| FlussError::from_core_error(&e))?;
+        // Run inside tokio runtime context because new_lookup()
+        // spawns a background task via tokio::spawn() in LookupClient::new().
+        let lookuper = TOKIO_RUNTIME.block_on(async {
+            let fluss_table =
+                fcore::client::FlussTable::new(connection, metadata, table_info.clone());
+            let table_lookup = fluss_table
+                .new_lookup()
+                .map_err(|e| FlussError::from_core_error(&e))?;
+            table_lookup
+                .create_lookuper()
+                .map_err(|e| FlussError::from_core_error(&e))
+        })?;
 
         Ok(Self {
             inner: Arc::new(Mutex::new(lookuper)),
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 88f87e4c43..62d440bed5 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -17,6 +17,7 @@
 
 use crate::client::WriterClient;
 use crate::client::admin::FlussAdmin;
+use crate::client::lookup::LookupClient;
 use crate::client::metadata::Metadata;
 use crate::client::table::FlussTable;
 use crate::config::Config;
@@ -37,6 +38,7 @@ pub struct FlussConnection {
     args: Config,
     writer_client: RwLock<Option<Arc<WriterClient>>>,
     admin_client: RwLock<Option<Arc<FlussAdmin>>>,
+    lookup_client: RwLock<Option<Arc<LookupClient>>>,
 }
 
 impl FlussConnection {
@@ -67,6 +69,7 @@ impl FlussConnection {
             args: arg.clone(),
             writer_client: Default::default(),
             admin_client: RwLock::new(None),
+            lookup_client: Default::default(),
         })
     }
 
@@ -128,6 +131,30 @@ impl FlussConnection {
         Ok(new_client)
     }
 
+    /// Gets or creates the connection-wide lookup client used for batched lookup operations.
+    pub fn get_or_create_lookup_client(&self) -> Result<Arc<LookupClient>> {
+        // 1. Fast path: Attempt to acquire a read lock to check if the client already exists.
+        if let Some(client) = self.lookup_client.read().as_ref() {
+            return Ok(client.clone());
+        }
+
+        // 2. Slow path: Acquire the write lock.
+        let mut lookup_guard = self.lookup_client.write();
+
+        // 3. Double-check: Another thread might have initialized the client
+        // while this thread was waiting for the write lock.
+        if let Some(client) = lookup_guard.as_ref() {
+            return Ok(client.clone());
+        }
+
+        // 4. Still absent: create it. `LookupClient::new` calls `tokio::spawn`, so a Tokio runtime must be active.
+        let new_client = Arc::new(LookupClient::new(&self.args, self.metadata.clone()));
+
+        // 5. Store and return the newly created client.
+        *lookup_guard = Some(new_client.clone());
+        Ok(new_client)
+    }
+
     pub async fn get_table(&self, table_path: &TablePath) -> Result<FlussTable<'_>> {
         self.metadata.update_table_metadata(table_path).await?;
         let table_info = self
diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_client.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_client.rs
new file mode 100644
index 0000000000..f80170415a
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_client.rs
@@ -0,0 +1,203 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Lookup client that batches multiple lookups together for improved throughput.
+//!
+//! This client achieves parity with the Java client by:
+//! - Queuing lookup operations instead of sending them immediately
+//! - Batching multiple lookups to the same server/bucket
+//! - Running a background sender task to process batches
+
+use super::{LookupQuery, LookupQueue};
+use crate::client::lookup::lookup_sender::LookupSender;
+use crate::client::metadata::Metadata;
+use crate::config::Config;
+use crate::error::{Error, Result};
+use crate::metadata::{TableBucket, TablePath};
+use bytes::Bytes;
+use log::{debug, error};
+use std::sync::Arc;
+use std::sync::atomic::{AtomicBool, Ordering};
+use std::time::Duration;
+use tokio::sync::{mpsc, watch};
+use tokio::task::JoinHandle;
+
+/// A client that looks up values from the server with batching support.
+///
+/// The lookup client uses a queue and background sender to batch multiple
+/// lookup operations together, reducing network round trips and improving
+/// throughput.
+///
+/// # Example
+///
+/// ```ignore
+/// let lookup_client = LookupClient::new(&config, metadata);
+/// let result = lookup_client.lookup(table_path, table_bucket, key_bytes).await?;
+/// ```
+pub struct LookupClient {
+    /// Sending half of the channel that feeds lookup queries into the queue
+    lookup_tx: mpsc::Sender<LookupQuery>,
+    /// Handle to the spawned sender task; `None` once `close()` has taken it
+    sender_handle: Option<JoinHandle<()>>,
+    /// Watch channel on which `close()` publishes `true` to request shutdown
+    shutdown_tx: watch::Sender<bool>,
+    /// Set by `close()`; `lookup()` rejects new requests while it is `true`
+    closed: AtomicBool,
+}
+
+impl LookupClient {
+    /// Creates a new lookup client and spawns its sender task; must be called inside a Tokio runtime.
+    pub fn new(config: &Config, metadata: Arc<Metadata>) -> Self {
+        // Extract configuration values
+        let queue_size = config.lookup_queue_size;
+        let max_batch_size = config.lookup_max_batch_size;
+        let batch_timeout_ms = config.lookup_batch_timeout_ms;
+        let max_inflight = config.lookup_max_inflight_requests;
+        let max_retries = config.lookup_max_retries;
+
+        // Create the queue plus its two senders: one for new lookups, one handed to the sender for re-enqueueing
+        let (queue, lookup_tx, re_enqueue_tx) =
+            LookupQueue::new(queue_size, max_batch_size, batch_timeout_ms);
+
+        // Create shutdown channel (initial value `false`; `close()` sends `true`)
+        let (shutdown_tx, shutdown_rx) = watch::channel(false);
+
+        // Create sender with shutdown receiver
+        let mut sender = LookupSender::new(
+            metadata,
+            queue,
+            re_enqueue_tx,
+            max_inflight,
+            max_retries,
+            shutdown_rx,
+        );
+
+        // Spawn sender task - sender handles shutdown internally
+        let sender_handle = tokio::spawn(async move {
+            sender.run().await;
+            debug!("Lookup sender completed");
+        });
+
+        Self {
+            lookup_tx,
+            sender_handle: Some(sender_handle),
+            shutdown_tx,
+            closed: AtomicBool::new(false),
+        }
+    }
+
+    /// Looks up a value by its primary key.
+    ///
+    /// This method queues the lookup operation and returns a future that will
+    /// complete when the server responds. Multiple lookups may be batched together
+    /// for improved throughput.
+    ///
+    /// # Arguments
+    /// * `table_path` - The table path
+    /// * `table_bucket` - The table bucket
+    /// * `key_bytes` - The encoded primary key bytes
+    ///
+    /// # Returns
+    /// * `Ok(Some(bytes))` - The value bytes if found
+    /// * `Ok(None)` - If the key was not found
+    /// * `Err(Error)` - If the client is closed, a channel is closed, or the lookup itself fails
+    pub async fn lookup(
+        &self,
+        table_path: TablePath,
+        table_bucket: TableBucket,
+        key_bytes: Bytes,
+    ) -> Result<Option<Vec<u8>>> {
+        // Reject new lookups once `close()` has set the flag
+        if self.closed.load(Ordering::Acquire) {
+            return Err(Error::UnexpectedError {
+                message: "Lookup client is closed".to_string(),
+                source: None,
+            });
+        }
+
+        let (result_tx, result_rx) = tokio::sync::oneshot::channel();
+
+        let query = LookupQuery::new(table_path, table_bucket, key_bytes, result_tx);
+
+        // Send to queue; a send error hands the query back (`e.0`), which is logged before failing
+        self.lookup_tx
+            .send(query)
+            .await
+            .map_err(|e| {
+                let failed_query = e.0;
+                error!(
+                    "Failed to queue lookup: channel closed. table_path: {}, table_bucket: {:?}, key_len: {}",
+                    failed_query.table_path(),
+                    failed_query.table_bucket(),
+                    failed_query.key().len()
+                );
+                Error::UnexpectedError {
+                    message: "Failed to queue lookup: channel closed".to_string(),
+                    source: None,
+                }
+            })?;
+
+        // Wait for result: `?` handles a dropped result sender; the remaining `Result` is the lookup outcome
+        result_rx.await.map_err(|_| Error::UnexpectedError {
+            message: "Lookup result channel closed".to_string(),
+            source: None,
+        })?
+    }
+
+    /// Closes the lookup client: signals shutdown, waits up to `timeout` for the sender task, then aborts it.
+    pub async fn close(mut self, timeout: Duration) {
+        debug!("Closing lookup client");
+
+        // Mark as closed to reject new lookups
+        self.closed.store(true, Ordering::Release);
+
+        // Send shutdown signal via watch channel (a send error is ignored)
+        let _ = self.shutdown_tx.send(true);
+
+        // Wait for sender to complete with timeout
+        if let Some(handle) = self.sender_handle.take() {
+            debug!("Waiting for sender task to complete...");
+            let abort_handle = handle.abort_handle();
+            // `handle` is moved into `timeout` below, so the abort handle is kept for the elapsed branch.
+            match tokio::time::timeout(timeout, handle).await {
+                Ok(Ok(())) => {
+                    debug!("Lookup sender task completed gracefully.");
+                }
+                Ok(Err(join_error)) => {
+                    error!("Lookup sender task panicked: {:?}", join_error);
+                }
+                Err(_elapsed) => {
+                    error!("Lookup sender task did not complete within timeout. Forcing shutdown.");
+                    abort_handle.abort();
+                }
+            }
+        } else {
+            debug!("Lookup client was already closed or never initialized properly.");
+        }
+
+        debug!("Lookup client closed");
+    }
+}
+
+impl Drop for LookupClient {
+    fn drop(&mut self) {
+        // If close() has not already taken the handle, abort the sender task; no shutdown signal is sent here.
+        if let Some(handle) = self.sender_handle.take() {
+            handle.abort();
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_query.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_query.rs
new file mode 100644
index 0000000000..2da9f7c932
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_query.rs
@@ -0,0 +1,91 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Lookup query representation for batching lookup operations.
+
+use crate::metadata::{TableBucket, TablePath};
+use bytes::Bytes;
+use tokio::sync::oneshot;
+
+/// A single pending lookup: the key, its target bucket and the channel for its result.
+pub struct LookupQuery {
+    /// Path of the table this lookup is for
+    table_path: TablePath,
+    /// Table bucket this lookup is addressed to
+    table_bucket: TableBucket,
+    /// The encoded primary key bytes
+    key: Bytes,
+    /// One-shot channel back to the caller; becomes `None` once `complete` has used it
+    result_tx: Option<oneshot::Sender<Result<Option<Vec<u8>>, crate::error::Error>>>,
+    /// Number of retry attempts recorded so far; starts at 0
+    retries: i32,
+}
+
+impl LookupQuery {
+    /// Builds a query with a zero retry count and `result_tx` as its reply channel.
+    pub fn new(
+        table_path: TablePath,
+        table_bucket: TableBucket,
+        key: Bytes,
+        result_tx: oneshot::Sender<Result<Option<Vec<u8>>, crate::error::Error>>,
+    ) -> Self {
+        Self {
+            retries: 0,
+            result_tx: Some(result_tx),
+            key,
+            table_bucket,
+            table_path,
+        }
+    }
+
+    /// Path of the table being looked up.
+    pub fn table_path(&self) -> &TablePath {
+        &self.table_path
+    }
+
+    /// Table bucket this lookup is addressed to.
+    pub fn table_bucket(&self) -> &TableBucket {
+        &self.table_bucket
+    }
+
+    /// Encoded key bytes to look up.
+    pub fn key(&self) -> &Bytes {
+        &self.key
+    }
+
+    /// Number of retries recorded so far.
+    pub fn retries(&self) -> i32 {
+        self.retries
+    }
+
+    /// Records one more retry attempt.
+    pub fn increment_retries(&mut self) {
+        self.retries += 1;
+    }
+
+    /// Delivers `result` to the caller; only the first call has any effect.
+    pub fn complete(&mut self, result: Result<Option<Vec<u8>>, crate::error::Error>) {
+        if let Some(reply_to) = self.result_tx.take() {
+            let _ = reply_to.send(result);
+        }
+    }
+
+    /// True once `complete` has consumed the reply channel.
+    pub fn is_done(&self) -> bool {
+        self.result_tx.is_none()
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_queue.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_queue.rs
new file mode 100644
index 0000000000..0531913e18
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_queue.rs
@@ -0,0 +1,138 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Lookup queue for buffering pending lookup operations.
+//!
+//! This queue buffers lookup operations and provides batched draining
+//! to improve throughput by reducing network round trips.
+
+use super::LookupQuery;
+use std::time::Duration;
+use tokio::sync::mpsc;
+use tokio::time::timeout;
+
+/// A queue that buffers pending lookup operations and provides batched draining.
+///
+/// The queue supports two types of entries:
+/// - New lookups from client calls
+/// - Re-enqueued lookups from retry logic
+///
+/// Re-enqueued lookups are prioritized over new lookups to ensure fair processing.
+pub struct LookupQueue {
+    /// Receiving half of the bounded channel that carries new lookup requests
+    lookup_rx: mpsc::Receiver<LookupQuery>,
+    /// Receiving half of the unbounded channel that carries re-enqueued lookups
+    re_enqueue_rx: mpsc::UnboundedReceiver<LookupQuery>,
+    /// Maximum number of lookups collected by one `drain` call
+    max_batch_size: usize,
+    /// Time budget of one `drain` call for collecting a batch
+    batch_timeout: Duration,
+}
+
+impl LookupQueue {
+    /// Builds the queue together with the sending halves of its two channels.
+    pub fn new(
+        queue_size: usize,
+        max_batch_size: usize,
+        batch_timeout_ms: u64,
+    ) -> (
+        Self,
+        mpsc::Sender<LookupQuery>,
+        mpsc::UnboundedSender<LookupQuery>,
+    ) {
+        // Retries use an unbounded channel; new lookups are capped at `queue_size`
+        let (retry_sender, re_enqueue_rx) = mpsc::unbounded_channel();
+        let (new_lookup_sender, lookup_rx) = mpsc::channel(queue_size);
+        let batch_timeout = Duration::from_millis(batch_timeout_ms);
+        let this = Self {
+            batch_timeout,
+            max_batch_size,
+            re_enqueue_rx,
+            lookup_rx,
+        };
+        (this, new_lookup_sender, retry_sender)
+    }
+
+    /// Drains a batch of lookup queries from the queue.
+    ///
+    /// Waits at most `batch_timeout` and returns at most `max_batch_size` lookups.
+    pub async fn drain(&mut self) -> Vec<LookupQuery> {
+        let mut lookups = Vec::with_capacity(self.max_batch_size);
+        let deadline = tokio::time::Instant::now() + self.batch_timeout;
+
+        loop {
+            // First drain re-enqueued lookups (prioritized)
+            while lookups.len() < self.max_batch_size {
+                match self.re_enqueue_rx.try_recv() {
+                    Ok(lookup) => lookups.push(lookup),
+                    Err(_) => break,
+                }
+            }
+
+            if lookups.len() >= self.max_batch_size {
+                break;
+            }
+
+            // Then wait on the main queue for the time left. The deadline is only
+            // enforced after this poll so that a zero `batch_timeout` (or an expired
+            // deadline) still picks up lookups that are already queued.
+            let remaining = deadline.saturating_duration_since(tokio::time::Instant::now());
+            match timeout(remaining, self.lookup_rx.recv()).await {
+                Ok(Some(lookup)) => {
+                    lookups.push(lookup);
+                    // Try to drain more without waiting
+                    while lookups.len() < self.max_batch_size {
+                        match self.lookup_rx.try_recv() {
+                            Ok(lookup) => lookups.push(lookup),
+                            Err(_) => break,
+                        }
+                    }
+                }
+                Ok(None) => break, // Channel closed
+                Err(_) => break,   // Timeout
+            }
+
+            if lookups.len() >= self.max_batch_size || remaining.is_zero() {
+                break;
+            }
+        }
+
+        lookups
+    }
+
+    /// Drains all remaining lookups from the queue.
+    ///
+    /// Never waits: only lookups that are already queued are returned.
+    pub fn drain_all(&mut self) -> Vec<LookupQuery> {
+        let mut drained = Vec::new();
+
+        // Re-enqueued lookups come first
+        let retried = std::iter::from_fn(|| self.re_enqueue_rx.try_recv().ok());
+        drained.extend(retried);
+
+        // Followed by whatever is still sitting in the main queue
+        let fresh = std::iter::from_fn(|| self.lookup_rx.try_recv().ok());
+        drained.extend(fresh);
+
+        drained
+    }
+
+    /// Reports whether either channel still holds lookups that were not drained.
+    pub fn has_undrained(&self) -> bool {
+        !(self.lookup_rx.is_empty() && self.re_enqueue_rx.is_empty())
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
new file mode 100644
index 0000000000..4abb9d7eb7
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
@@ -0,0 +1,548 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Lookup sender that processes batched lookup requests.
+//!
+//! The sender runs as a background task, draining lookups from the queue,
+//! grouping them by destination server, and sending batched requests.
+
+use super::{LookupQuery, LookupQueue};
+use crate::client::metadata::Metadata;
+use crate::error::{Error, FlussError, Result};
+use crate::metadata::{TableBucket, TablePath};
+use crate::proto::LookupResponse;
+use crate::rpc::ServerConnection;
+use crate::rpc::message::LookupRequest;
+use crate::{BucketId, PartitionId, TableId};
+use bytes::Bytes;
+use futures::stream::{FuturesUnordered, StreamExt};
+use log::{debug, error, warn};
+use std::collections::{HashMap, HashSet};
+use std::sync::Arc;
+use std::sync::atomic::{AtomicBool, Ordering};
+use std::time::Duration;
+use tokio::sync::{Semaphore, mpsc, watch};
+
+/// Numeric ID of a server; used as the key when lookups are grouped by leader.
+type ServerId = i32;
+
+/// Lookup batches per leader server ID, each keyed by the table bucket it targets.
+type BatchesByLeader = HashMap<ServerId, HashMap<TableBucket, LookupBatch>>;
+
+/// Outcome of `group_by_leader`: sendable batches plus what needs a metadata refresh.
+struct GroupByLeaderResult {
+    /// Lookups whose bucket has a known leader, grouped by that leader's server ID.
+    batches_by_leader: BatchesByLeader,
+    /// Paths of tables that had at least one lookup whose bucket has no known leader.
+    unknown_leader_tables: HashSet<TablePath>,
+    /// Partition IDs of those leaderless buckets (only buckets that have a partition ID).
+    unknown_leader_partition_ids: HashSet<PartitionId>,
+}
+
+/// Lookup sender that batches and sends lookup requests.
+pub struct LookupSender {
+    /// Cluster metadata, used to find bucket leaders and to obtain server connections
+    metadata: Arc<Metadata>,
+    /// The lookup queue to drain from
+    queue: LookupQueue,
+    /// Sending half of the retry channel; lookups sent here come back through `queue`
+    re_enqueue_tx: mpsc::UnboundedSender<LookupQuery>,
+    /// Limits concurrently in-flight requests; one permit is held per request
+    inflight_semaphore: Arc<Semaphore>,
+    /// Maximum number of retries before a retriable error fails the lookup
+    max_retries: i32,
+    /// Loop flag: `run` keeps iterating while this is true
+    running: AtomicBool,
+    /// When set, `run` skips the final flush of lookups that are still queued
+    force_close: AtomicBool,
+    /// Shutdown signal receiver; a value of `true` requests shutdown
+    shutdown_rx: watch::Receiver<bool>,
+}
+
+/// Lookups for one table bucket; `add_lookup` pushes each lookup's key into `keys` alongside it.
+struct LookupBatch {
+    table_bucket: TableBucket,
+    lookups: Vec<LookupQuery>,
+    keys: Vec<Bytes>,
+}
+
+impl LookupBatch {
+    /// Creates an empty batch bound to `table_bucket`.
+    fn new(table_bucket: TableBucket) -> Self {
+        Self {
+            keys: Vec::new(),
+            lookups: Vec::new(),
+            table_bucket,
+        }
+    }
+
+    /// Appends `lookup` and records a copy of its key at the same index.
+    fn add_lookup(&mut self, lookup: LookupQuery) {
+        self.keys.push(lookup.key().clone());
+        self.lookups.push(lookup);
+    }
+
+    /// Completes the lookups with `values`, matched by position.
+    fn complete(&mut self, values: Vec<Option<Vec<u8>>>) {
+        if values.len() == self.lookups.len() {
+            for (lookup, value) in self.lookups.iter_mut().zip(values) {
+                lookup.complete(Ok(value));
+            }
+            return;
+        }
+
+        // A length mismatch makes the pairing unknown, so every lookup fails
+        let err_msg = format!(
+            "The number of return values ({}) does not match the number of lookups ({})",
+            values.len(),
+            self.lookups.len()
+        );
+        self.complete_exceptionally(&err_msg);
+    }
+
+    /// Fails every lookup in the batch with `error_msg`.
+    fn complete_exceptionally(&mut self, error_msg: &str) {
+        self.lookups.iter_mut().for_each(|lookup| {
+            lookup.complete(Err(Error::UnexpectedError {
+                message: error_msg.to_string(),
+                source: None,
+            }));
+        });
+    }
+}
+
+impl LookupSender {
+    /// Builds a sender that starts in the running state with force-close disabled.
+    pub fn new(
+        metadata: Arc<Metadata>,
+        queue: LookupQueue,
+        re_enqueue_tx: mpsc::UnboundedSender<LookupQuery>,
+        max_inflight_requests: usize,
+        max_retries: i32,
+        shutdown_rx: watch::Receiver<bool>,
+    ) -> Self {
+        Self {
+            running: AtomicBool::new(true),
+            force_close: AtomicBool::new(false),
+            inflight_semaphore: Arc::new(Semaphore::new(max_inflight_requests)),
+            shutdown_rx,
+            max_retries,
+            re_enqueue_tx,
+            queue,
+            metadata,
+        }
+    }
+
+    /// Runs the sender loop until shutdown, then flushes queued lookups once unless force-closed.
+    pub async fn run(&mut self) {
+        debug!("Starting Fluss lookup sender");
+
+        let mut shutdown_rx = self.shutdown_rx.clone();
+
+        while self.running.load(Ordering::Acquire) {
+            // Check for shutdown signal before entering select
+            if *shutdown_rx.borrow() {
+                debug!("Lookup sender received shutdown signal");
+                self.initiate_close();
+                break;
+            }
+
+            tokio::select! {
+                biased;
+
+                // Shutdown signal; `Err` means the watch sender was dropped, so stop as well
+                changed = shutdown_rx.changed() => {
+                    if changed.is_err() || *shutdown_rx.borrow() {
+                        debug!("Lookup sender received shutdown signal during select");
+                        self.initiate_close();
+                    }
+                }
+
+                // Process lookups
+                result = self.run_once(false) => {
+                    if let Err(e) = result {
+                        error!("Error in lookup sender: {}", e);
+                    }
+                }
+            }
+        }
+
+        debug!("Beginning shutdown of lookup sender, sending remaining lookups");
+
+        // Process remaining lookups during shutdown
+        // TODO: Check the in flight request count in the accumulator.
+        if !self.force_close.load(Ordering::Acquire) && self.queue.has_undrained() {
+            if let Err(e) = self.run_once(true).await {
+                error!("Error during lookup sender shutdown: {}", e);
+            }
+        }
+
+        // TODO: If force close failed, add logic to abort incomplete lookup requests.
+        debug!("Lookup sender shutdown complete");
+    }
+
+    /// Takes one batch from the queue (everything queued if `drain_all`) and sends it.
+    async fn run_once(&mut self, drain_all: bool) -> Result<()> {
+        let batch = match drain_all {
+            true => self.queue.drain_all(),
+            false => self.queue.drain().await,
+        };
+
+        // The result of sending is handed back to the caller unchanged
+        self.send_lookups(batch).await
+    }
+
+    /// Groups lookups by leader, refreshes metadata for unknown leaders, then sends the batches.
+    async fn send_lookups(&self, lookups: Vec<LookupQuery>) -> Result<()> {
+        if lookups.is_empty() {
+            return Ok(());
+        }
+
+        // Group by leader; lookups without a known leader are re-enqueued by this call
+        let GroupByLeaderResult {
+            batches_by_leader: lookup_batches,
+            unknown_leader_tables,
+            unknown_leader_partition_ids,
+        } = self.group_by_leader(lookups);
+
+        // Refresh metadata for tables with unknown leaders; a failure is only logged
+        if !unknown_leader_tables.is_empty() {
+            let table_paths_refs: HashSet<&TablePath> = unknown_leader_tables.iter().collect();
+            let partition_ids: Vec<PartitionId> =
+                unknown_leader_partition_ids.into_iter().collect();
+            if let Err(e) = self
+                .metadata
+                .update_tables_metadata(&table_paths_refs, &HashSet::new(), partition_ids)
+                .await
+            {
+                warn!("Failed to update metadata for unknown leader tables: {}", e);
+            } else {
+                debug!(
+                    "Updated metadata due to unknown leader tables during lookup: {:?}",
+                    unknown_leader_tables
+                );
+            }
+        }
+
+        // If nothing could be grouped and nothing is queued, sleep briefly to avoid a busy loop.
+        // NOTE(review): leaderless lookups were re-enqueued above; confirm this can still trigger.
+        if lookup_batches.is_empty() && !self.queue.has_undrained() {
+            // TODO: May use wait/notify mechanism to avoid active sleep, and use a dynamic sleep time based on the request waited time.
+            tokio::time::sleep(Duration::from_millis(100)).await;
+            return Ok(());
+        }
+
+        // Start one send per destination server and wait until all of them have finished
+        let mut pending = FuturesUnordered::new();
+        for (destination, batches) in lookup_batches {
+            pending.push(self.send_lookup_request(destination, batches));
+        }
+        while let Some(()) = pending.next().await {}
+
+        Ok(())
+    }
+
+    /// Groups lookups by the leader of their bucket; leaderless lookups are re-enqueued.
+    fn group_by_leader(&self, lookups: Vec<LookupQuery>) -> GroupByLeaderResult {
+        let cluster = self.metadata.get_cluster();
+        let mut batches_by_leader: BatchesByLeader = HashMap::new();
+        let mut unknown_leader_tables: HashSet<TablePath> = HashSet::new();
+        let mut unknown_leader_partition_ids: HashSet<PartitionId> = HashSet::new();
+
+        for lookup in lookups {
+            let table_bucket = lookup.table_bucket().clone();
+
+            let leader = match cluster.leader_for(&table_bucket) {
+                Some(leader) => leader.id(),
+                None => {
+                    warn!(
+                        "No leader found for table bucket {} during lookup",
+                        table_bucket
+                    );
+                    // Remember the table (and partition, if any) so the caller can refresh metadata
+                    unknown_leader_tables.insert(lookup.table_path().clone());
+                    if let Some(partition_id) = table_bucket.partition_id() {
+                        unknown_leader_partition_ids.insert(partition_id);
+                    }
+                    self.re_enqueue_lookup(lookup); // retry count is not incremented here
+                    continue;
+                }
+            };
+
+            batches_by_leader
+                .entry(leader)
+                .or_default()
+                .entry(table_bucket.clone())
+                .or_insert_with(|| LookupBatch::new(table_bucket))
+                .add_lookup(lookup);
+        }
+
+        GroupByLeaderResult {
+            batches_by_leader,
+            unknown_leader_tables,
+            unknown_leader_partition_ids,
+        }
+    }
+
+    /// Sends the batches destined for one server, using one request per table.
+    async fn send_lookup_request(
+        &self,
+        destination: i32,
+        batches_by_bucket: HashMap<TableBucket, LookupBatch>,
+    ) {
+        // Regroup by table ID: each table gets a single request covering all its buckets
+        let mut batches_by_table: HashMap<TableId, Vec<LookupBatch>> = HashMap::new();
+        for (table_bucket, batch) in batches_by_bucket {
+            batches_by_table
+                .entry(table_bucket.table_id())
+                .or_default()
+                .push(batch);
+        }
+
+        let cluster = self.metadata.get_cluster();
+        let tablet_server = match cluster.get_tablet_server(destination) {
+            Some(server) => server.clone(),
+            None => {
+                let err_msg = format!("Server {} is not found in metadata cache", destination);
+                for batches in batches_by_table.into_values() {
+                    for mut batch in batches {
+                        self.handle_lookup_error(&err_msg, true, &mut batch); // retriable
+                    }
+                }
+                return;
+            }
+        };
+
+        let connection = match self.metadata.get_connection(&tablet_server).await {
+            Ok(conn) => conn,
+            Err(e) => {
+                let err_msg = format!("Failed to get connection to server {}: {}", destination, e);
+                for batches in batches_by_table.into_values() {
+                    for mut batch in batches {
+                        self.handle_lookup_error(&err_msg, true, &mut batch); // retriable
+                    }
+                }
+                return;
+            }
+        };
+
+        let mut pending = FuturesUnordered::new();
+        for (table_id, mut batches) in batches_by_table {
+            let mut all_keys_by_bucket: Vec<(BucketId, Option<PartitionId>, Vec<Bytes>)> =
+                Vec::new();
+            for batch in &mut batches {
+                all_keys_by_bucket.push((
+                    batch.table_bucket.bucket_id(),
+                    batch.table_bucket.partition_id(),
+                    std::mem::take(&mut batch.keys), // moves the keys out, leaving `keys` empty
+                ));
+            }
+
+            let request = LookupRequest::new_batched(table_id, all_keys_by_bucket);
+            let conn = connection.clone();
+            pending.push(self.send_single_table_lookup(
+                table_id,
+                destination,
+                conn,
+                request,
+                batches,
+            ));
+        }
+
+        while let Some(()) = pending.next().await {}
+    }
+
+    /// Sends one table's lookup request under an in-flight permit and dispatches the outcome.
+    async fn send_single_table_lookup(
+        &self,
+        table_id: TableId,
+        destination: i32,
+        connection: ServerConnection,
+        request: LookupRequest,
+        mut batches: Vec<LookupBatch>,
+    ) {
+        // The acquired permit lives in `permit` until this function returns
+        let permit = self.inflight_semaphore.clone().acquire_owned().await;
+        if permit.is_err() {
+            error!("Semaphore closed during lookup");
+            for batch in batches.iter_mut() {
+                batch.complete_exceptionally("Lookup sender shutdown");
+            }
+            return;
+        }
+
+        // A transport failure is routed through the retry logic, batch by batch
+        match connection.request(request).await {
+            Err(e) => {
+                let is_retriable = e.is_retriable();
+                let err_msg = format!("Lookup request failed: {}", e);
+                for batch in batches.iter_mut() {
+                    self.handle_lookup_error(&err_msg, is_retriable, batch);
+                }
+            }
+            Ok(response) => {
+                self.handle_lookup_response(table_id, destination, response, &mut batches);
+            }
+        }
+    }
+
+    /// Matches each bucket in `response` to its batch and completes, retries or fails it.
+    fn handle_lookup_response(
+        &self,
+        table_id: TableId,
+        destination: i32,
+        response: LookupResponse,
+        batches: &mut [LookupBatch],
+    ) {
+        let bucket_to_index: HashMap<TableBucket, usize> = batches
+            .iter()
+            .enumerate()
+            .map(|(idx, batch)| (batch.table_bucket.clone(), idx))
+            .collect();
+
+        // One flag per batch, set once the response mentions that batch's bucket
+        let mut processed_batches = vec![false; batches.len()];
+
+        for bucket_resp in response.buckets_resp {
+            let table_bucket = TableBucket::new_with_partition(
+                table_id,
+                bucket_resp.partition_id,
+                bucket_resp.bucket_id,
+            );
+            if let Some(&batch_idx) = bucket_to_index.get(&table_bucket) {
+                processed_batches[batch_idx] = true;
+                let batch = &mut batches[batch_idx];
+
+                // An error code other than `FlussError::None` sends the whole batch to error handling
+                if let Some(error_code) = bucket_resp.error_code {
+                    let fluss_error = FlussError::for_code(error_code);
+                    if fluss_error != FlussError::None {
+                        let err_msg = format!(
+                            "Lookup error for bucket {}: code={}, message={}",
+                            table_bucket,
+                            error_code,
+                            bucket_resp.error_message.unwrap_or_default()
+                        );
+                        let is_retriable = fluss_error.is_retriable();
+                        self.handle_lookup_error(&err_msg, is_retriable, batch);
+                        continue;
+                    }
+                }
+
+                // Unwrap the returned values; `batch.complete` checks their count against the lookups
+                let values: Vec<Option<Vec<u8>>> = bucket_resp
+                    .values
+                    .into_iter()
+                    .map(|pb_value| pb_value.values)
+                    .collect();
+
+                batch.complete(values);
+            } else {
+                error!(
+                    "Received response for unknown bucket {} from server {}",
+                    table_bucket, destination
+                );
+            }
+        }
+
+        // Handle any batches that were not included in the response
+        for (idx, processed) in processed_batches.iter().enumerate() {
+            if !processed {
+                let batch = &mut batches[idx];
+                // Only batches that still hold lookups need handling
+                if !batch.lookups.is_empty() {
+                    let err_msg = format!(
+                        "Bucket {} response missing from server {}",
+                        batch.table_bucket.bucket_id(),
+                        destination
+                    );
+                    // Treat missing bucket response as retriable
+                    self.handle_lookup_error(&err_msg, true, batch);
+                }
+            }
+        }
+    }
+
+    /// Handles lookup errors with retry logic.
+    ///
+    /// Retriable lookups go back to the queue with their retry count bumped;
+    /// all others are completed with an `UnexpectedError` carrying `error_msg`.
+    fn handle_lookup_error(&self, error_msg: &str, is_retriable: bool, batch: &mut LookupBatch) {
+        // A lookup is retried only if the error allows it, it has retries left
+        // and its result has not been delivered yet. The batch is emptied in
+        // the process.
+        let (to_retry, to_fail): (Vec<LookupQuery>, Vec<LookupQuery>) =
+            batch.lookups.drain(..).partition(|lookup| {
+                is_retriable && lookup.retries() < self.max_retries && !lookup.is_done()
+            });
+
+        // Re-enqueue retriable lookups
+        if !to_retry.is_empty() {
+            warn!(
+                "Lookup error for bucket {}, retrying {} lookups: {}",
+                batch.table_bucket,
+                to_retry.len(),
+                error_msg
+            );
+            for mut lookup in to_retry {
+                lookup.increment_retries();
+                self.re_enqueue_lookup(lookup);
+            }
+        }
+
+        // Complete non-retriable lookups with error
+        if !to_fail.is_empty() {
+            warn!(
+                "Lookup failed for bucket {} ({} lookups): {}",
+                batch.table_bucket,
+                to_fail.len(),
+                error_msg
+            );
+            for mut lookup in to_fail {
+                lookup.complete(Err(Error::UnexpectedError {
+                    message: error_msg.to_string(),
+                    source: None,
+                }));
+            }
+        }
+    }
+
+    /// Puts `lookup` back on the retry channel, failing it if the channel is closed.
+    fn re_enqueue_lookup(&self, lookup: LookupQuery) {
+        if let Err(send_error) = self.re_enqueue_tx.send(lookup) {
+            error!("Failed to re-enqueue lookup: {}", send_error);
+            // The send error hands the lookup back; fail it so the caller does not hang.
+            let mut rejected = send_error.0;
+            rejected.complete(Err(Error::UnexpectedError {
+                message: "Failed to re-enqueue lookup: channel closed".to_string(),
+                source: None,
+            }));
+        }
+    }
+
+    /// Clears the `running` flag so the `while` loop in `run` stops at its next check.
+    pub fn initiate_close(&mut self) {
+        self.running.store(false, Ordering::Release);
+    }
+
+    /// Stops the loop like `initiate_close` and also makes `run` skip its final flush.
+    #[allow(dead_code)]
+    pub fn force_close(&mut self) {
+        self.force_close.store(true, Ordering::Release);
+        self.initiate_close();
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/lookup/mod.rs b/fluss-rust/crates/fluss/src/client/lookup/mod.rs
new file mode 100644
index 0000000000..f96aa2ed33
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/lookup/mod.rs
@@ -0,0 +1,39 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Lookup client implementation with batching and queuing support.
+//!
+//! This module provides a high-throughput lookup client that batches multiple
+//! lookup operations together to reduce network round trips, achieving parity
+//! with the Java client implementation.
+//!
+//! # Example
+//!
+//! ```ignore
+//! let lookup_client = LookupClient::new(config, metadata);
+//! let future = lookup_client.lookup(table_path, table_bucket, key_bytes);
+//! let result = future.await?;
+//! ```
+
+mod lookup_client;
+mod lookup_query;
+mod lookup_queue;
+mod lookup_sender;
+
+pub use lookup_client::LookupClient;
+pub(crate) use lookup_query::LookupQuery;
+pub(crate) use lookup_queue::LookupQueue;
diff --git a/fluss-rust/crates/fluss/src/client/mod.rs b/fluss-rust/crates/fluss/src/client/mod.rs
index cff218b345..77c30203bc 100644
--- a/fluss-rust/crates/fluss/src/client/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/mod.rs
@@ -18,6 +18,7 @@
 mod admin;
 mod connection;
 mod credentials;
+pub mod lookup;
 mod metadata;
 mod table;
 mod write;
@@ -25,6 +26,7 @@ mod write;
 pub use admin::*;
 pub use connection::*;
 pub use credentials::*;
+pub use lookup::LookupClient;
 pub use metadata::*;
 pub use table::*;
 pub use write::*;
diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index aa29ea693e..add79210dc 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 use crate::bucketing::BucketingFunction;
+use crate::client::lookup::LookupClient;
 use crate::client::metadata::Metadata;
 use crate::client::table::partition_getter::PartitionGetter;
 use crate::error::{Error, Result};
@@ -25,9 +26,6 @@ use crate::record::kv::SCHEMA_ID_LENGTH;
 use crate::row::InternalRow;
 use crate::row::compacted::CompactedRow;
 use crate::row::encode::{KeyEncoder, KeyEncoderFactory};
-use crate::rpc::ApiError;
-use crate::rpc::RpcClient;
-use crate::rpc::message::LookupRequest;
 use arrow::array::RecordBatch;
 use std::sync::Arc;
 
@@ -148,19 +146,19 @@ impl LookupResult {
 // TODO: Add lookup_by(column_names) for prefix key lookups (PrefixKeyLookuper)
 // TODO: Add create_typed_lookuper<T>() for typed lookups with POJO mapping
 pub struct TableLookup {
-    rpc_client: Arc<RpcClient>,
+    lookup_client: Arc<LookupClient>,
     table_info: TableInfo,
     metadata: Arc<Metadata>,
 }
 
 impl TableLookup {
     pub(super) fn new(
-        rpc_client: Arc<RpcClient>,
+        lookup_client: Arc<LookupClient>,
         table_info: TableInfo,
         metadata: Arc<Metadata>,
     ) -> Self {
         Self {
-            rpc_client,
+            lookup_client,
             table_info,
             metadata,
         }
@@ -170,6 +168,10 @@ impl TableLookup {
     ///
     /// The lookuper will automatically encode the key and compute the bucket
     /// for each lookup using the appropriate bucketing function.
+    ///
+    /// The lookuper uses a shared `LookupClient` that batches multiple lookup
+    /// operations together to reduce network round trips. This achieves parity
+    /// with the Java client implementation for improved throughput.
     pub fn create_lookuper(self) -> Result<Lookuper> {
         let num_buckets = self.table_info.get_num_buckets();
 
@@ -206,12 +208,13 @@ impl TableLookup {
         };
 
         let row_type = Arc::new(self.table_info.row_type().clone());
+
         Ok(Lookuper {
-            rpc_client: self.rpc_client,
             table_path: Arc::new(self.table_info.table_path.clone()),
             row_type,
             table_info: self.table_info,
             metadata: self.metadata,
+            lookup_client: self.lookup_client,
             bucketing_function,
             primary_key_encoder,
             bucket_key_encoder,
@@ -224,7 +227,7 @@ impl TableLookup {
 /// Performs key-based lookups against a primary key table.
 ///
 /// The `Lookuper` automatically encodes the lookup key, computes the target
-/// bucket, finds the appropriate tablet server, and retrieves the value.
+/// bucket, and retrieves the value using the batched `LookupClient`.
 ///
 /// # Example
 /// ```ignore
@@ -233,11 +236,11 @@ impl TableLookup {
 /// let result = lookuper.lookup(&row).await?;
 /// ```
 pub struct Lookuper {
-    rpc_client: Arc<RpcClient>,
+    table_path: Arc<TablePath>,
     table_info: TableInfo,
     row_type: Arc<RowType>,
-    table_path: Arc<TablePath>,
     metadata: Arc<Metadata>,
+    lookup_client: Arc<LookupClient>,
     bucketing_function: Box<dyn BucketingFunction>,
     primary_key_encoder: Box<dyn KeyEncoder>,
     bucket_key_encoder: Option<Box<dyn KeyEncoder>>,
@@ -249,7 +252,8 @@ impl Lookuper {
     /// Looks up a value by its primary key.
     ///
     /// The key is encoded and the bucket is automatically computed using
-    /// the table's bucketing function.
+    /// the table's bucketing function. The lookup is queued and batched
+    /// with other lookups for improved throughput.
     ///
     /// # Arguments
     /// * `row` - The row containing the primary key field values
@@ -258,12 +262,10 @@ impl Lookuper {
     /// * `Ok(LookupResult)` - The lookup result (may be empty if key not found)
     /// * `Err(Error)` - If the lookup fails
     pub async fn lookup(&mut self, row: &dyn InternalRow) -> Result<LookupResult> {
-        // todo: support batch lookup
         let pk_bytes = self.primary_key_encoder.encode_key(row)?;
-        let pk_bytes_vec = pk_bytes.to_vec();
         let bk_bytes = match &mut self.bucket_key_encoder {
-            Some(encoder) => &encoder.encode_key(row)?,
-            None => &pk_bytes,
+            Some(encoder) => encoder.encode_key(row)?,
+            None => pk_bytes.clone(),
         };
 
         let partition_id = if let Some(ref partition_getter) = self.partition_getter {
@@ -286,53 +288,24 @@ impl Lookuper {
 
         let bucket_id = self
             .bucketing_function
-            .bucketing(bk_bytes, self.num_buckets)?;
+            .bucketing(&bk_bytes, self.num_buckets)?;
 
         let table_id = self.table_info.get_table_id();
         let table_bucket = TableBucket::new_with_partition(table_id, partition_id, bucket_id);
 
-        // Find the leader for this bucket
-        let leader = self
-            .metadata
-            .leader_for(self.table_path.as_ref(), &table_bucket)
-            .await?
-            .ok_or_else(|| {
-                Error::leader_not_available(format!(
-                    "No leader found for table bucket: {table_bucket}"
-                ))
-            })?;
-
-        let connection = self.rpc_client.get_connection(&leader).await?;
-
-        // Send lookup request
-        let request = LookupRequest::new(table_id, partition_id, bucket_id, vec![pk_bytes_vec]);
-        let response = connection.request(request).await?;
-
-        // Extract the values from response
-        if let Some(bucket_resp) = response.buckets_resp.into_iter().next() {
-            // Check for errors
-            if let Some(error_code) = bucket_resp.error_code {
-                if error_code != 0 {
-                    return Err(Error::FlussAPIError {
-                        api_error: ApiError {
-                            code: error_code,
-                            message: bucket_resp.error_message.unwrap_or_default(),
-                        },
-                    });
-                }
-            }
-
-            // Collect all values
-            let rows: Vec<Vec<u8>> = bucket_resp
-                .values
-                .into_iter()
-                .filter_map(|pb_value| pb_value.values)
-                .collect();
-
-            return Ok(LookupResult::new(rows, Arc::clone(&self.row_type)));
+        // Use the batched lookup client
+        let result = self
+            .lookup_client
+            .lookup(self.table_path.as_ref().clone(), table_bucket, pk_bytes)
+            .await?;
+
+        match result {
+            Some(value_bytes) => Ok(LookupResult::new(
+                vec![value_bytes],
+                Arc::clone(&self.row_type),
+            )),
+            None => Ok(LookupResult::empty(Arc::clone(&self.row_type))),
         }
-
-        Ok(LookupResult::empty(Arc::clone(&self.row_type)))
     }
 
     /// Returns a reference to the table info.
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 4c3dfe2ddc..12807988d8 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -120,8 +120,9 @@ impl<'a> FlussTable<'a> {
                 message: "Lookup is only supported for primary key tables".to_string(),
             });
         }
+        let lookup_client = self.conn.get_or_create_lookup_client()?;
         Ok(TableLookup::new(
-            self.conn.get_connections(),
+            lookup_client,
             self.table_info.clone(),
             self.metadata.clone(),
         ))
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 32db44f6a5..2900e2f4bf 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -165,6 +165,30 @@ pub struct Config {
     #[arg(long, default_value_t = String::new())]
     #[serde(skip_serializing)]
     pub security_sasl_password: String,
+    /// Maximum number of pending lookup operations
+    /// Default: 25600 (matching Java CLIENT_LOOKUP_QUEUE_SIZE)
+    #[arg(long, default_value_t = 25600)]
+    pub lookup_queue_size: usize,
+
+    /// Maximum batch size of merging lookup operations to one lookup request
+    /// Default: 128 (matching Java CLIENT_LOOKUP_MAX_BATCH_SIZE)
+    #[arg(long, default_value_t = 128)]
+    pub lookup_max_batch_size: usize,
+
+    /// Maximum time to wait for the lookup batch to fill (in milliseconds)
+    /// Default: 100 (matching Java CLIENT_LOOKUP_BATCH_TIMEOUT)
+    #[arg(long, default_value_t = 100)]
+    pub lookup_batch_timeout_ms: u64,
+
+    /// Maximum number of unacknowledged lookup requests
+    /// Default: 128 (matching Java CLIENT_LOOKUP_MAX_INFLIGHT_SIZE)
+    #[arg(long, default_value_t = 128)]
+    pub lookup_max_inflight_requests: usize,
+
+    /// Maximum number of lookup retries
+    /// Default: i32::MAX (matching Java CLIENT_LOOKUP_MAX_RETRIES)
+    #[arg(long, default_value_t = i32::MAX)]
+    pub lookup_max_retries: i32,
 }
 
 impl std::fmt::Debug for Config {
@@ -223,6 +247,14 @@ impl std::fmt::Debug for Config {
             .field("security_sasl_mechanism", &self.security_sasl_mechanism)
             .field("security_sasl_username", &self.security_sasl_username)
             .field("security_sasl_password", &"[REDACTED]")
+            .field("lookup_queue_size", &self.lookup_queue_size)
+            .field("lookup_max_batch_size", &self.lookup_max_batch_size)
+            .field("lookup_batch_timeout_ms", &self.lookup_batch_timeout_ms)
+            .field(
+                "lookup_max_inflight_requests",
+                &self.lookup_max_inflight_requests,
+            )
+            .field("lookup_max_retries", &self.lookup_max_retries)
             .finish()
     }
 }
@@ -255,6 +287,11 @@ impl Default for Config {
             security_sasl_mechanism: String::from(DEFAULT_SASL_MECHANISM),
             security_sasl_username: String::new(),
             security_sasl_password: String::new(),
+            lookup_queue_size: 25600,
+            lookup_max_batch_size: 128,
+            lookup_batch_timeout_ms: 100,
+            lookup_max_inflight_requests: 128,
+            lookup_max_retries: i32::MAX,
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/rpc/message/lookup.rs b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
index 3de47d64dd..e181c5c62a 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
@@ -23,6 +23,7 @@ use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
 use crate::{impl_read_version_type, impl_write_version_type, proto};
+use bytes::Bytes;
 use prost::Message;
 
 use bytes::{Buf, BufMut};
@@ -53,6 +54,29 @@ impl LookupRequest {
             inner_request: request,
         }
     }
+
+    /// Creates a new batched lookup request with multiple buckets.
+    pub fn new_batched(table_id: i64, buckets: Vec<(i32, Option<i64>, Vec<Bytes>)>) -> Self {
+        let buckets_req: Vec<proto::PbLookupReqForBucket> = buckets
+            .into_iter()
+            .map(
+                |(bucket_id, partition_id, keys)| proto::PbLookupReqForBucket {
+                    partition_id,
+                    bucket_id,
+                    key: keys.into_iter().map(|b| b.to_vec()).collect(),
+                },
+            )
+            .collect();
+
+        let request = proto::LookupRequest {
+            table_id,
+            buckets_req,
+        };
+
+        Self {
+            inner_request: request,
+        }
+    }
 }
 
 impl RequestBody for LookupRequest {
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index f35e507bd6..e2dbf4d172 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -886,4 +886,249 @@ mod kv_table_test {
             .await
             .expect("Failed to drop table");
     }
+
+    /// Integration test for concurrent batched lookups across partitions.
+    #[tokio::test]
+    async fn batched_concurrent_lookups_partitioned() {
+        use futures::stream::{FuturesUnordered, StreamExt};
+
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_batched_lookups_partitioned");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("region", DataTypes::string())
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .primary_key(vec!["region", "id"])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .partitioned_by(vec!["region"])
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+        create_partitions(&admin, &table_path, "region", &["US", "EU", "APAC"]).await;
+
+        let connection = cluster.get_fluss_connection().await;
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        // Insert records across all partitions
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+        let writer = table_upsert
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let regions = ["US", "EU", "APAC"];
+        for region in &regions {
+            for id in 0..5i32 {
+                let mut row = GenericRow::new(3);
+                row.set_field(0, *region);
+                row.set_field(1, id);
+                row.set_field(2, format!("{}-{}", region, id));
+                writer.upsert(&row).expect("Failed to upsert");
+            }
+        }
+        writer.flush().await.expect("Failed to flush");
+
+        let mut lookupers: Vec<_> = (0..regions.len() * 5)
+            .map(|_| {
+                table
+                    .new_lookup()
+                    .expect("Failed to create lookup")
+                    .create_lookuper()
+                    .expect("Failed to create lookuper")
+            })
+            .collect();
+
+        let mut futures = FuturesUnordered::new();
+        for (i, lookuper) in lookupers.iter_mut().enumerate() {
+            let region = regions[i / 5];
+            let id = (i % 5) as i32;
+
+            futures.push(async move {
+                let mut key = GenericRow::new(3);
+                key.set_field(0, region);
+                key.set_field(1, id);
+
+                let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+                let row = result
+                    .get_single_row()
+                    .expect("Failed to get row")
+                    .expect("Row should exist");
+
+                let actual_region = row.get_string(0).unwrap();
+                let actual_id = row.get_int(1).unwrap();
+                let actual_name = row.get_string(2).unwrap();
+
+                assert_eq!(actual_region, region, "region mismatch");
+                assert_eq!(actual_id, id, "id mismatch");
+                assert_eq!(actual_name, format!("{}-{}", region, id), "name mismatch");
+
+                (region.to_string(), id)
+            });
+        }
+
+        let mut results = Vec::new();
+        while let Some(result) = futures.next().await {
+            results.push(result);
+        }
+
+        assert_eq!(
+            results.len(),
+            regions.len() * 5,
+            "Not all lookups completed"
+        );
+
+        // Verify we got results from all partitions
+        for region in &regions {
+            let count = results.iter().filter(|(r, _)| r == region).count();
+            assert_eq!(count, 5, "Expected 5 results for region {}", region);
+        }
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    /// Integration test for concurrent batched lookups.
+    #[tokio::test]
+    async fn batched_concurrent_lookups() {
+        use futures::stream::{FuturesUnordered, StreamExt};
+
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss".to_string(), "test_batched_lookups".to_string());
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .column("value", DataTypes::bigint())
+                    .primary_key(vec!["id".to_string()])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+
+        // Insert only even-numbered records (0, 2, 4, ..., 98) in parallel
+        let num_records = 100i32;
+        let mut upsert_futures = FuturesUnordered::new();
+        for i in (0..num_records).step_by(2) {
+            let writer = table_upsert
+                .create_writer()
+                .expect("Failed to create writer");
+            upsert_futures.push(async move {
+                let mut row = GenericRow::new(3);
+                row.set_field(0, i);
+                row.set_field(1, format!("name_{}", i));
+                row.set_field(2, (i * 100) as i64);
+                writer
+                    .upsert(&row)
+                    .expect("Failed to upsert")
+                    .await
+                    .expect("Failed to await upsert ack");
+            });
+        }
+        // Wait for all upserts to be acknowledged
+        while upsert_futures.next().await.is_some() {}
+
+        // Create multiple lookupers for concurrent lookups
+        let num_lookupers = 50i32;
+        let mut lookupers: Vec<_> = (0..num_lookupers)
+            .map(|_| {
+                table
+                    .new_lookup()
+                    .expect("Failed to create lookup")
+                    .create_lookuper()
+                    .expect("Failed to create lookuper")
+            })
+            .collect();
+
+        // Run concurrent lookups
+        let mut futures = FuturesUnordered::new();
+        for (i, lookuper) in lookupers.iter_mut().enumerate() {
+            // First 10 lookupers all look up id=0 (same key multiple times)
+            let id = if i < 10 { 0 } else { i as i32 };
+            let expects_result = id % 2 == 0; // Even IDs exist
+
+            futures.push(async move {
+                let key = make_key(id);
+                let result = lookuper.lookup(&key).await.expect("Failed to lookup");
+                let row_opt = result.get_single_row().expect("Failed to get row");
+
+                if expects_result {
+                    let row = row_opt.unwrap_or_else(|| panic!("Row {} should exist", id));
+                    assert_eq!(row.get_int(0).unwrap(), id, "id mismatch for key {}", id);
+                    assert_eq!(
+                        row.get_string(1).unwrap(),
+                        format!("name_{}", id),
+                        "name mismatch for key {}",
+                        id
+                    );
+                    assert_eq!(
+                        row.get_long(2).unwrap(),
+                        (id * 100) as i64,
+                        "value mismatch for key {}",
+                        id
+                    );
+                } else {
+                    assert!(row_opt.is_none(), "Row {} should not exist", id);
+                }
+                (id, expects_result)
+            });
+        }
+
+        // Collect all results and verify
+        let mut results = Vec::with_capacity(num_lookupers as usize);
+        while let Some(result) = futures.next().await {
+            results.push(result);
+        }
+
+        // Verify all lookups completed successfully
+        assert_eq!(
+            results.len(),
+            num_lookupers as usize,
+            "Not all lookups completed"
+        );
+
+        // Verify we had the expected mix of scenarios
+        let same_key_lookups = results.iter().filter(|(id, _)| *id == 0).count();
+        assert_eq!(same_key_lookups, 10, "Should have 10 lookups for same key");
+
+        let non_existing_lookups = results.iter().filter(|(_, exists)| !exists).count();
+        assert!(
+            non_existing_lookups > 0,
+            "Should have some non-existing key lookups"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
 }

From a7c40133797c8c694ca1c2d58e78c18eedc2c58a Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 19 Apr 2026 02:38:51 +0100
Subject: [PATCH 237/287] [ci] optimize check_license_and_formatting (#503)

---
 fluss-rust/.github/workflows/build_and_test_cpp.yml |  4 +++-
 .../.github/workflows/build_and_test_python.yml     |  4 +++-
 .../.github/workflows/build_and_test_rust.yml       | 13 ++++++-------
 .../workflows/check_license_and_formatting.yml      | 12 ++++++++++--
 4 files changed, 22 insertions(+), 11 deletions(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
index 7d30b8f7c5..d32425ab19 100644
--- a/fluss-rust/.github/workflows/build_and_test_cpp.yml
+++ b/fluss-rust/.github/workflows/build_and_test_cpp.yml
@@ -47,7 +47,9 @@ jobs:
       - uses: actions/checkout@v6
 
       - name: Install protoc
-        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
+        with:
+          repo-token: ${{ secrets.GITHUB_TOKEN }}
 
       - name: Install Apache Arrow C++
         run: |
diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index 69202c03e6..eb392d1d2d 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -58,7 +58,9 @@ jobs:
         uses: astral-sh/setup-uv@37802adc94f370d6bfd71619e3f0bf239e1f3b78
 
       - name: Install protoc
-        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
+        with:
+          repo-token: ${{ secrets.GITHUB_TOKEN }}
 
       - name: Rust Cache
         uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
index 9b763b3eb5..ed007f941f 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -51,12 +51,9 @@ jobs:
       - uses: actions/checkout@v6
 
       - name: Install protoc
-        run: |
-          if [ "$RUNNER_OS" = "Linux" ]; then
-            sudo apt-get update && sudo apt-get install -y protobuf-compiler
-          elif [ "$RUNNER_OS" = "macOS" ]; then
-            brew install protobuf
-          fi
+        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
+        with:
+          repo-token: ${{ secrets.GITHUB_TOKEN }}
 
       - name: Rust Cache
         uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
@@ -78,7 +75,9 @@ jobs:
       - uses: actions/checkout@v6
 
       - name: Install protoc
-        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
+        with:
+          repo-token: ${{ secrets.GITHUB_TOKEN }}
 
       - name: Rust Cache
         uses: actions/cache@v4
diff --git a/fluss-rust/.github/workflows/check_license_and_formatting.yml b/fluss-rust/.github/workflows/check_license_and_formatting.yml
index 1108c20ad5..784e778e51 100644
--- a/fluss-rust/.github/workflows/check_license_and_formatting.yml
+++ b/fluss-rust/.github/workflows/check_license_and_formatting.yml
@@ -27,6 +27,9 @@ on:
   pull_request:
     branches:
       - main
+    paths-ignore:
+      - 'website/**'
+      - '**/*.md'
   workflow_dispatch:
 
 concurrency:
@@ -40,7 +43,7 @@ jobs:
       - uses: actions/checkout@v6
 
       - name: Check License Header
-        uses: apache/skywalking-eyes/header@v0.6.0
+        uses: apache/skywalking-eyes/header@61275cc80d0798a405cb070f7d3a8aaf7cf2c2c1 # v0.8.0
 
       - name: Install cargo-deny
         uses: taiki-e/install-action@v2
@@ -51,7 +54,12 @@ jobs:
         run: cargo deny check licenses
 
       - name: Install protoc
-        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
+        with:
+          repo-token: ${{ secrets.GITHUB_TOKEN }}
+
+      - name: Rust Cache
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
 
       - name: Format
         run: cargo fmt --all -- --check

From 16c895851ce83ffca01830678d3863e6c62336e8 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 19 Apr 2026 03:32:00 +0100
Subject: [PATCH 238/287] [ci] cache C++ build with sccache (#505)

---
 fluss-rust/.github/workflows/build_and_test_cpp.yml | 12 +++++++++++-
 1 file changed, 11 insertions(+), 1 deletion(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
index d32425ab19..c411076045 100644
--- a/fluss-rust/.github/workflows/build_and_test_cpp.yml
+++ b/fluss-rust/.github/workflows/build_and_test_cpp.yml
@@ -62,14 +62,24 @@ jobs:
       - name: Rust Cache
         uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
 
+      - name: Setup sccache
+        uses: mozilla-actions/sccache-action@7d986dd989559c6ecdb630a3fd2557667be217ad # v0.0.9
+
       - name: Build fluss-test-cluster binary
         run: cargo build -p fluss-test-cluster
 
       - name: Build C++ bindings and tests
         working-directory: bindings/cpp
+        env:
+          SCCACHE_GHA_ENABLED: "true"
         run: |
-          cmake -B build -DFLUSS_ENABLE_TESTING=ON -DCMAKE_BUILD_TYPE=Debug
+          cmake -B build \
+            -DFLUSS_ENABLE_TESTING=ON \
+            -DCMAKE_BUILD_TYPE=Debug \
+            -DCMAKE_C_COMPILER_LAUNCHER=sccache \
+            -DCMAKE_CXX_COMPILER_LAUNCHER=sccache
           cmake --build build --parallel
+          sccache --show-stats
 
       - name: Run C++ integration tests (parallel)
         working-directory: bindings/cpp

From e6f95e62c9568db672ab996fe91ec9e722dfa570 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 19 Apr 2026 20:44:01 +0100
Subject: [PATCH 239/287] [rust][chore] fix unknown error code lost for forward
 compatibility path (#509)

---
 .../crates/fluss/src/rpc/fluss_api_error.rs   | 31 +++++++++++++++++--
 1 file changed, 29 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs b/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
index 95a39c6945..418f5443dc 100644
--- a/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
+++ b/fluss-rust/crates/fluss/src/rpc/fluss_api_error.rs
@@ -385,8 +385,11 @@ impl Display for FlussError {
 
 impl From<ErrorResponse> for ApiError {
     fn from(error_response: ErrorResponse) -> Self {
-        let fluss_error = FlussError::for_code(error_response.error_code);
-        fluss_error.to_api_error(error_response.error_message)
+        let code = error_response.error_code;
+        let message = error_response
+            .error_message
+            .unwrap_or_else(|| FlussError::for_code(code).message().to_string());
+        ApiError { code, message }
     }
 }
 
@@ -430,6 +433,30 @@ mod tests {
         assert_eq!(fluss_error, FlussError::TableNotExist);
     }
 
+    #[test]
+    fn error_response_preserves_unknown_wire_code() {
+        let response = ErrorResponse {
+            error_code: 9999,
+            error_message: Some("NewException: forward compat".to_string()),
+        };
+        let api_error = ApiError::from(response);
+        assert_eq!(api_error.code, 9999);
+        assert_eq!(api_error.message, "NewException: forward compat");
+        assert_eq!(FlussError::from(api_error), FlussError::UnknownServerError);
+    }
+
+    #[test]
+    fn error_response_falls_back_to_default_message_for_unknown_code() {
+        let response = ErrorResponse {
+            error_code: 9999,
+            error_message: None,
+        };
+        let api_error = ApiError::from(response);
+        assert_eq!(api_error.code, 9999);
+        assert_eq!(api_error.message, FlussError::UnknownServerError.message());
+        assert!(!api_error.is_retriable());
+    }
+
     #[test]
     fn is_retriable_known_retriable_errors() {
         let retriable = [

From 7b4d711ab3765da5e29d7dae84945ec424c5cc63 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 19 Apr 2026 20:55:15 +0100
Subject: [PATCH 240/287] feat: [rust] prefix lookup support (#500)

* [rust] prefix lookup support

* fix fmt

* address comments

* address comments

* Address comments 2
---
 fluss-rust/crates/examples/Cargo.toml         |   8 +
 .../src/example_partitioned_prefix_lookup.rs  | 144 ++++
 .../examples/src/example_prefix_lookup.rs     | 120 ++++
 fluss-rust/crates/fluss/build.rs              |   2 +
 .../fluss/src/client/lookup/lookup_client.rs  |  95 ++-
 .../fluss/src/client/lookup/lookup_query.rs   |  87 ++-
 .../fluss/src/client/lookup/lookup_queue.rs   |  56 +-
 .../fluss/src/client/lookup/lookup_sender.rs  | 675 +++++++++++-------
 .../crates/fluss/src/client/lookup/mod.rs     |   2 +-
 .../crates/fluss/src/client/metadata.rs       |  70 +-
 .../crates/fluss/src/client/table/lookup.rs   | 241 ++++++-
 .../crates/fluss/src/client/table/mod.rs      |   2 +-
 .../crates/fluss/src/proto/fluss_api.proto    |  28 +
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |   4 +
 .../crates/fluss/src/rpc/message/lookup.rs    |  32 +-
 .../crates/fluss/src/rpc/message/mod.rs       |   2 +
 .../fluss/src/rpc/message/prefix_lookup.rs    |  73 ++
 .../fluss/tests/integration/kv_table.rs       | 273 +++++++
 .../rust/example/partitioned-tables.md        |   4 +
 .../user-guide/rust/example/prefix-lookup.md  | 110 +++
 .../rust/example/primary-key-tables.md        |   4 +
 21 files changed, 1641 insertions(+), 391 deletions(-)
 create mode 100644 fluss-rust/crates/examples/src/example_partitioned_prefix_lookup.rs
 create mode 100644 fluss-rust/crates/examples/src/example_prefix_lookup.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/prefix_lookup.rs
 create mode 100644 fluss-rust/website/docs/user-guide/rust/example/prefix-lookup.md

diff --git a/fluss-rust/crates/examples/Cargo.toml b/fluss-rust/crates/examples/Cargo.toml
index b9187395a4..45f029ee8c 100644
--- a/fluss-rust/crates/examples/Cargo.toml
+++ b/fluss-rust/crates/examples/Cargo.toml
@@ -42,3 +42,11 @@ path = "src/example_kv_table.rs"
 [[example]]
 name = "example-partitioned-upsert-lookup"
 path = "src/example_partitioned_kv_table.rs"
+
+[[example]]
+name = "example-prefix-lookup"
+path = "src/example_prefix_lookup.rs"
+
+[[example]]
+name = "example-partitioned-prefix-lookup"
+path = "src/example_partitioned_prefix_lookup.rs"
diff --git a/fluss-rust/crates/examples/src/example_partitioned_prefix_lookup.rs b/fluss-rust/crates/examples/src/example_partitioned_prefix_lookup.rs
new file mode 100644
index 0000000000..b212b0fd45
--- /dev/null
+++ b/fluss-rust/crates/examples/src/example_partitioned_prefix_lookup.rs
@@ -0,0 +1,144 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use clap::Parser;
+use fluss::client::{FlussAdmin, FlussConnection};
+use fluss::config::Config;
+use fluss::error::Result;
+use fluss::metadata::{DataTypes, PartitionSpec, Schema, TableDescriptor, TablePath};
+use fluss::row::{GenericRow, InternalRow};
+use std::collections::HashMap;
+
+#[tokio::main]
+#[allow(dead_code)]
+pub async fn main() -> Result<()> {
+    let mut config = Config::parse();
+    config.bootstrap_servers = "127.0.0.1:9123".to_string();
+    // NOTE: the fixed address above replaces whatever `Config::parse()` set for that field.
+    let conn = FlussConnection::new(config).await?;
+
+    // Partitioned schema: pk is (region, user_id, session_id, event_seq),
+    // `region` is the partition key, and the bucket key (user_id, session_id)
+    // is a prefix of the *non-partition* portion of the primary key — which is
+    // the condition for prefix lookup on a partitioned table. The lookup
+    // key must include the partition column(s) in addition to the bucket
+    // prefix, so we look up by (region, user_id, session_id).
+    let table_descriptor = TableDescriptor::builder()
+        .schema(
+            Schema::builder()
+                .column("region", DataTypes::string())
+                .column("user_id", DataTypes::int())
+                .column("session_id", DataTypes::string())
+                .column("event_seq", DataTypes::bigint())
+                .column("event_data", DataTypes::string())
+                .primary_key(vec!["region", "user_id", "session_id", "event_seq"])
+                .build()?,
+        )
+        .partitioned_by(vec!["region"])
+        .distributed_by(
+            Some(3),
+            vec!["user_id".to_string(), "session_id".to_string()],
+        )
+        .build()?;
+
+    let table_path = TablePath::new("fluss", "rust_partitioned_prefix_lookup_example");
+
+    let admin = conn.get_admin()?;
+    admin
+        .create_table(&table_path, &table_descriptor, true)
+        .await?;
+    println!(
+        "Created partitioned KV Table:\n {}\n",
+        admin.get_table_info(&table_path).await?
+    );
+
+    create_partition(&table_path, &admin, "US").await;
+    create_partition(&table_path, &admin, "EU").await;
+
+    let table = conn.get_table(&table_path).await?;
+    let table_upsert = table.new_upsert()?;
+    let upsert_writer = table_upsert.create_writer()?;
+
+    println!("\n=== Upserting session events ===");
+    for (region, user_id, session_id, event_seq, event_data) in [
+        ("US", 1, "sess-a", 1i64, "open"),
+        ("US", 1, "sess-a", 2, "click"),
+        ("US", 1, "sess-a", 3, "close"),
+        ("US", 2, "sess-b", 1, "open"),
+        ("EU", 1, "sess-a", 1, "open"),
+    ] {
+        let mut row = GenericRow::new(5);
+        row.set_field(0, region);
+        row.set_field(1, user_id);
+        row.set_field(2, session_id);
+        row.set_field(3, event_seq);
+        row.set_field(4, event_data);
+        upsert_writer.upsert(&row)?;
+        println!("Upserted: {row:?}");
+    }
+    upsert_writer.flush().await?;
+
+    println!("\n=== Prefix lookup by (region, user_id, session_id) ===");
+    let mut prefix_lookuper = table
+        .new_lookup()?
+        .lookup_by(vec![
+            "region".to_string(),
+            "user_id".to_string(),
+            "session_id".to_string(),
+        ])
+        .create_lookuper()?;
+    // The last probe below uses a session id that was never upserted above.
+    for (region, user_id, session_id) in [
+        ("US", 1, "sess-a"),
+        ("US", 2, "sess-b"),
+        ("EU", 1, "sess-a"),
+        ("EU", 1, "sess-missing"),
+    ] {
+        let result = prefix_lookuper
+            .lookup(&make_prefix(region, user_id, session_id))
+            .await?;
+        let rows = result.get_rows()?;
+        println!(
+            "region={region}, user_id={user_id}, session_id={session_id}: {} event(s)",
+            rows.len()
+        );
+        for row in &rows {
+            println!("  seq={}, data={}", row.get_long(3)?, row.get_string(4)?);
+        }
+    }
+
+    Ok(())
+}
+
+/// Creates the partition whose `region` column equals `region`; panics with the region and
+/// error if the admin call fails. The `true` flag is presumably ignore-if-exists (confirm).
+async fn create_partition(table_path: &TablePath, admin: &FlussAdmin, region: &str) {
+    let partition_values = HashMap::from([("region".to_string(), region.to_string())]);
+    let partition_spec = PartitionSpec::new(partition_values);
+    admin
+        .create_partition(table_path, &partition_spec, true)
+        .await
+        .unwrap_or_else(|e| panic!("failed to create partition region={region}: {e:?}"));
+}
+
+fn make_prefix(region: &str, user_id: i32, session_id: &str) -> GenericRow<'static> {
+    let mut key = GenericRow::new(3); // fields: (region, user_id, session_id)
+    key.set_field(0, region.to_owned());
+    key.set_field(1, user_id);
+    key.set_field(2, session_id.to_owned());
+    key
+}
diff --git a/fluss-rust/crates/examples/src/example_prefix_lookup.rs b/fluss-rust/crates/examples/src/example_prefix_lookup.rs
new file mode 100644
index 0000000000..12fc76dc13
--- /dev/null
+++ b/fluss-rust/crates/examples/src/example_prefix_lookup.rs
@@ -0,0 +1,120 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use clap::Parser;
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+use fluss::error::Result;
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+use fluss::row::{GenericRow, InternalRow};
+
+#[tokio::main]
+#[allow(dead_code)]
+pub async fn main() -> Result<()> {
+    let mut config = Config::parse();
+    config.bootstrap_servers = "127.0.0.1:9123".to_string();
+    // NOTE: the fixed address above replaces whatever `Config::parse()` set for that field.
+    let conn = FlussConnection::new(config).await?;
+
+    // Schema: primary key is (user_id, session_id, event_seq); the bucket key
+    // (user_id, session_id) is a strict prefix of the primary key, which is
+    // what enables prefix lookup.
+    let table_descriptor = TableDescriptor::builder()
+        .schema(
+            Schema::builder()
+                .column("user_id", DataTypes::int())
+                .column("session_id", DataTypes::string())
+                .column("event_seq", DataTypes::bigint())
+                .column("event_data", DataTypes::string())
+                .primary_key(vec!["user_id", "session_id", "event_seq"])
+                .build()?,
+        )
+        .distributed_by(
+            Some(3),
+            vec!["user_id".to_string(), "session_id".to_string()],
+        )
+        .build()?;
+
+    let table_path = TablePath::new("fluss", "rust_prefix_lookup_example");
+
+    let admin = conn.get_admin()?;
+    admin
+        .create_table(&table_path, &table_descriptor, true)
+        .await?;
+    println!(
+        "Created KV Table:\n {}\n",
+        admin.get_table_info(&table_path).await?
+    );
+
+    let table = conn.get_table(&table_path).await?;
+    let table_upsert = table.new_upsert()?;
+    let upsert_writer = table_upsert.create_writer()?;
+
+    println!("\n=== Upserting session events ===");
+    for (user_id, session_id, event_seq, event_data) in [
+        (1, "sess-a", 1i64, "open"),
+        (1, "sess-a", 2, "click"),
+        (1, "sess-a", 3, "close"),
+        (1, "sess-b", 1, "open"),
+        (2, "sess-c", 1, "open"),
+    ] {
+        let mut row = GenericRow::new(4);
+        row.set_field(0, user_id);
+        row.set_field(1, session_id);
+        row.set_field(2, event_seq);
+        row.set_field(3, event_data);
+        upsert_writer.upsert(&row)?;
+        println!("Upserted: {row:?}");
+    }
+    upsert_writer.flush().await?;
+
+    println!("\n=== Prefix lookup by (user_id, session_id) ===");
+    // `lookup_by` names the prefix columns. The resulting lookuper returns all
+    // rows whose primary key starts with the given prefix.
+    let mut prefix_lookuper = table
+        .new_lookup()?
+        .lookup_by(vec!["user_id".to_string(), "session_id".to_string()])
+        .create_lookuper()?;
+    // The last probe below uses a session id that was never upserted above.
+    for (user_id, session_id) in [
+        (1, "sess-a"),
+        (1, "sess-b"),
+        (2, "sess-c"),
+        (2, "sess-missing"),
+    ] {
+        let result = prefix_lookuper
+            .lookup(&make_prefix(user_id, session_id))
+            .await?;
+        let rows = result.get_rows()?;
+        println!(
+            "user_id={user_id}, session_id={session_id}: {} event(s)",
+            rows.len()
+        );
+        for row in &rows {
+            println!("  seq={}, data={}", row.get_long(2)?, row.get_string(3)?);
+        }
+    }
+
+    Ok(())
+}
+
+fn make_prefix(user_id: i32, session_id: &str) -> GenericRow<'static> {
+    let mut key = GenericRow::new(2); // fields: (user_id, session_id)
+    key.set_field(0, user_id);
+    key.set_field(1, session_id.to_owned());
+    key
+}
diff --git a/fluss-rust/crates/fluss/build.rs b/fluss-rust/crates/fluss/build.rs
index 265208a7c3..040ee52179 100644
--- a/fluss-rust/crates/fluss/build.rs
+++ b/fluss-rust/crates/fluss/build.rs
@@ -22,6 +22,8 @@ fn main() -> Result<()> {
     config.bytes([
         ".proto.PbProduceLogReqForBucket.records",
         ".proto.PbPutKvReqForBucket.records",
+        ".proto.PbLookupReqForBucket.key",
+        ".proto.PbPrefixLookupReqForBucket.keys",
     ]);
     config.compile_protos(&["src/proto/fluss_api.proto"], &["src/proto"])?;
     Ok(())
diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_client.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_client.rs
index f80170415a..4d507aa9bf 100644
--- a/fluss-rust/crates/fluss/src/client/lookup/lookup_client.rs
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_client.rs
@@ -22,7 +22,7 @@
 //! - Batching multiple lookups to the same server/bucket
 //! - Running a background sender task to process batches
 
-use super::{LookupQuery, LookupQueue};
+use super::{LookupQueue, PrefixLookupQuery, PrimaryLookupQuery, QueuedLookup};
 use crate::client::lookup::lookup_sender::LookupSender;
 use crate::client::metadata::Metadata;
 use crate::config::Config;
@@ -50,7 +50,7 @@ use tokio::task::JoinHandle;
 /// ```
 pub struct LookupClient {
     /// Channel to send lookup requests to the queue
-    lookup_tx: mpsc::Sender<LookupQuery>,
+    lookup_tx: mpsc::Sender<QueuedLookup>,
     /// Handle to the sender task
     sender_handle: Option<JoinHandle<()>>,
     /// Watch channel for internal shutdown handling
@@ -70,8 +70,9 @@ impl LookupClient {
         let max_retries = config.lookup_max_retries;
 
         // Create queue and channels
+        let cluster_rx = metadata.subscribe_cluster_changes();
         let (queue, lookup_tx, re_enqueue_tx) =
-            LookupQueue::new(queue_size, max_batch_size, batch_timeout_ms);
+            LookupQueue::new(queue_size, max_batch_size, batch_timeout_ms, cluster_rx);
 
         // Create shutdown channel
         let (shutdown_tx, shutdown_rx) = watch::channel(false);
@@ -121,7 +122,6 @@ impl LookupClient {
         table_bucket: TableBucket,
         key_bytes: Bytes,
     ) -> Result<Option<Vec<u8>>> {
-        // Check if the client is closed
         if self.closed.load(Ordering::Acquire) {
             return Err(Error::UnexpectedError {
                 message: "Lookup client is closed".to_string(),
@@ -130,34 +130,81 @@ impl LookupClient {
         }
 
         let (result_tx, result_rx) = tokio::sync::oneshot::channel();
+        let query = QueuedLookup::Primary(PrimaryLookupQuery::new(
+            table_path,
+            table_bucket,
+            key_bytes,
+            result_tx,
+        ));
 
-        let query = LookupQuery::new(table_path, table_bucket, key_bytes, result_tx);
-
-        // Send to queue
-        self.lookup_tx
-            .send(query)
-            .await
-            .map_err(|e| {
-                let failed_query = e.0;
-                error!(
-                    "Failed to queue lookup: channel closed. table_path: {}, table_bucket: {:?}, key_len: {}",
-                    failed_query.table_path(),
-                    failed_query.table_bucket(),
-                    failed_query.key().len()
-                );
-                Error::UnexpectedError {
-                    message: "Failed to queue lookup: channel closed".to_string(),
-                    source: None,
-                }
-            })?;
+        self.enqueue(query).await?;
+
+        result_rx.await.map_err(|_| Error::UnexpectedError {
+            message: "Lookup result channel closed".to_string(),
+            source: None,
+        })?
+    }
+
+    /// Looks up all values matching a prefix key.
+    ///
+    /// The prefix key must be a prefix subset of the table's primary key
+    /// (specifically, the bucket keys). Returns every row whose primary key
+    /// starts with the supplied prefix. Queries are batched together with
+    /// other lookups going to the same server for improved throughput.
+    ///
+    /// # Arguments
+    /// * `table_path` - The table path
+    /// * `table_bucket` - The table bucket computed from the bucket key part of the prefix
+    /// * `key_bytes` - The encoded prefix key bytes
+    ///
+    /// # Returns
+    /// * `Ok(rows)` - Every row matching the prefix (possibly empty)
+    /// * `Err(Error)` - If the lookup fails
+    pub async fn prefix_lookup(
+        &self,
+        table_path: TablePath,
+        table_bucket: TableBucket,
+        key_bytes: Bytes,
+    ) -> Result<Vec<Vec<u8>>> {
+        if self.closed.load(Ordering::Acquire) {
+            return Err(Error::UnexpectedError {
+                message: "Lookup client is closed".to_string(),
+                source: None,
+            });
+        }
+
+        let (result_tx, result_rx) = tokio::sync::oneshot::channel();
+        let query = QueuedLookup::Prefix(PrefixLookupQuery::new(
+            table_path,
+            table_bucket,
+            key_bytes,
+            result_tx,
+        ));
+
+        self.enqueue(query).await?;
 
-        // Wait for result
         result_rx.await.map_err(|_| Error::UnexpectedError {
             message: "Lookup result channel closed".to_string(),
             source: None,
         })?
     }
 
+    async fn enqueue(&self, query: QueuedLookup) -> Result<()> {
+        let Err(mpsc::error::SendError(rejected)) = self.lookup_tx.send(query).await else {
+            return Ok(()); // the channel accepted the query
+        };
+        error!(
+            "Failed to queue lookup: channel closed. table_path: {}, table_bucket: {:?}, key_len: {}",
+            rejected.table_path(),
+            rejected.table_bucket(),
+            rejected.key().len()
+        );
+        Err(Error::UnexpectedError {
+            message: "Failed to queue lookup: channel closed".to_string(),
+            source: None,
+        })
+    }
+
     /// Closes the lookup client gracefully.
     pub async fn close(mut self, timeout: Duration) {
         debug!("Closing lookup client");
diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_query.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_query.rs
index 2da9f7c932..19830aefa5 100644
--- a/fluss-rust/crates/fluss/src/client/lookup/lookup_query.rs
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_query.rs
@@ -15,77 +15,116 @@
 // specific language governing permissions and limitations
 // under the License.
 
-//! Lookup query representation for batching lookup operations.
-
+use crate::error::{Error, Result};
 use crate::metadata::{TableBucket, TablePath};
 use bytes::Bytes;
 use tokio::sync::oneshot;
 
-/// Represents a single lookup query that will be batched and sent to the server.
-pub struct LookupQuery {
-    /// The table path for this lookup
+pub struct LookupQuery<T> {
     table_path: TablePath,
-    /// The table bucket for this lookup
     table_bucket: TableBucket,
-    /// The encoded primary key bytes
     key: Bytes,
-    /// Channel to send the result back to the caller
-    result_tx: Option<oneshot::Sender<Result<Option<Vec<u8>>, crate::error::Error>>>,
-    /// Number of retry attempts
     retries: i32,
+    result_tx: Option<oneshot::Sender<Result<T>>>,
 }
 
-impl LookupQuery {
-    /// Creates a new lookup query.
+impl<T> LookupQuery<T> {
     pub fn new(
         table_path: TablePath,
         table_bucket: TableBucket,
         key: Bytes,
-        result_tx: oneshot::Sender<Result<Option<Vec<u8>>, crate::error::Error>>,
+        result_tx: oneshot::Sender<Result<T>>,
     ) -> Self {
         Self {
             table_path,
             table_bucket,
             key,
-            result_tx: Some(result_tx),
             retries: 0,
+            result_tx: Some(result_tx),
         }
     }
 
-    /// Returns the table path.
     pub fn table_path(&self) -> &TablePath {
         &self.table_path
     }
 
-    /// Returns the table bucket.
     pub fn table_bucket(&self) -> &TableBucket {
         &self.table_bucket
     }
 
-    /// Returns the encoded key bytes.
     pub fn key(&self) -> &Bytes {
         &self.key
     }
 
-    /// Returns the current retry count.
     pub fn retries(&self) -> i32 {
         self.retries
     }
 
-    /// Increments the retry counter.
     pub fn increment_retries(&mut self) {
         self.retries += 1;
     }
 
-    /// Completes the lookup with a result.
-    pub fn complete(&mut self, result: Result<Option<Vec<u8>>, crate::error::Error>) {
+    pub fn is_done(&self) -> bool {
+        self.result_tx.is_none()
+    }
+
+    pub fn complete(&mut self, result: Result<T>) {
         if let Some(tx) = self.result_tx.take() {
             let _ = tx.send(result);
         }
     }
 
-    /// Returns true if the result has already been sent.
-    pub fn is_done(&self) -> bool {
-        self.result_tx.is_none()
+    pub fn complete_with_error(&mut self, error: Error) {
+        self.complete(Err(error));
+    }
+}
+
+pub type PrimaryLookupQuery = LookupQuery<Option<Vec<u8>>>;
+pub type PrefixLookupQuery = LookupQuery<Vec<Vec<u8>>>;
+
+pub enum QueuedLookup {
+    Primary(PrimaryLookupQuery),
+    Prefix(PrefixLookupQuery),
+}
+
+impl QueuedLookup {
+    pub fn table_path(&self) -> &TablePath {
+        match self {
+            Self::Primary(q) => q.table_path(),
+            Self::Prefix(q) => q.table_path(),
+        }
+    }
+
+    pub fn table_bucket(&self) -> &TableBucket {
+        match self {
+            Self::Primary(q) => q.table_bucket(),
+            Self::Prefix(q) => q.table_bucket(),
+        }
+    }
+
+    pub fn key(&self) -> &Bytes {
+        match self {
+            Self::Primary(q) => q.key(),
+            Self::Prefix(q) => q.key(),
+        }
+    }
+
+    pub fn complete_with_error(&mut self, error: Error) {
+        match self {
+            Self::Primary(q) => q.complete_with_error(error),
+            Self::Prefix(q) => q.complete_with_error(error),
+        }
+    }
+}
+
+impl From<PrimaryLookupQuery> for QueuedLookup {
+    fn from(q: PrimaryLookupQuery) -> Self {
+        QueuedLookup::Primary(q)
+    }
+}
+
+impl From<PrefixLookupQuery> for QueuedLookup {
+    fn from(q: PrefixLookupQuery) -> Self {
+        QueuedLookup::Prefix(q)
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_queue.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_queue.rs
index 0531913e18..295ec93d8c 100644
--- a/fluss-rust/crates/fluss/src/client/lookup/lookup_queue.rs
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_queue.rs
@@ -20,10 +20,9 @@
 //! This queue buffers lookup operations and provides batched draining
 //! to improve throughput by reducing network round trips.
 
-use super::LookupQuery;
+use super::QueuedLookup;
 use std::time::Duration;
-use tokio::sync::mpsc;
-use tokio::time::timeout;
+use tokio::sync::{mpsc, watch};
 
 /// A queue that buffers pending lookup operations and provides batched draining.
 ///
@@ -34,25 +33,27 @@ use tokio::time::timeout;
 /// Re-enqueued lookups are prioritized over new lookups to ensure fair processing.
 pub struct LookupQueue {
     /// Channel for receiving lookup requests
-    lookup_rx: mpsc::Receiver<LookupQuery>,
+    lookup_rx: mpsc::Receiver<QueuedLookup>,
     /// Channel for receiving re-enqueued lookups
-    re_enqueue_rx: mpsc::UnboundedReceiver<LookupQuery>,
+    re_enqueue_rx: mpsc::UnboundedReceiver<QueuedLookup>,
     /// Maximum batch size for draining
     max_batch_size: usize,
     /// Timeout for batch collection
     batch_timeout: Duration,
+    /// Wakes `drain()` early when the cluster changes.
+    cluster_rx: watch::Receiver<u64>,
 }
 
 impl LookupQueue {
-    /// Creates a new lookup queue with the specified configuration.
     pub fn new(
         queue_size: usize,
         max_batch_size: usize,
         batch_timeout_ms: u64,
+        cluster_rx: watch::Receiver<u64>,
     ) -> (
         Self,
-        mpsc::Sender<LookupQuery>,
-        mpsc::UnboundedSender<LookupQuery>,
+        mpsc::Sender<QueuedLookup>,
+        mpsc::UnboundedSender<QueuedLookup>,
     ) {
         let (lookup_tx, lookup_rx) = mpsc::channel(queue_size);
         let (re_enqueue_tx, re_enqueue_rx) = mpsc::unbounded_channel();
@@ -62,13 +63,14 @@ impl LookupQueue {
             re_enqueue_rx,
             max_batch_size,
             batch_timeout: Duration::from_millis(batch_timeout_ms),
+            cluster_rx,
         };
 
         (queue, lookup_tx, re_enqueue_tx)
     }
 
     /// Drains a batch of lookup queries from the queue.
-    pub async fn drain(&mut self) -> Vec<LookupQuery> {
+    pub async fn drain(&mut self) -> Vec<QueuedLookup> {
         let mut lookups = Vec::with_capacity(self.max_batch_size);
         let deadline = tokio::time::Instant::now() + self.batch_timeout;
 
@@ -78,32 +80,40 @@ impl LookupQueue {
                 break;
             }
 
-            // First drain re-enqueued lookups (prioritized)
+            // Prioritize re-enqueued lookups.
             while lookups.len() < self.max_batch_size {
                 match self.re_enqueue_rx.try_recv() {
                     Ok(lookup) => lookups.push(lookup),
                     Err(_) => break,
                 }
             }
-
             if lookups.len() >= self.max_batch_size {
                 break;
             }
 
-            // Then try to get from main queue with timeout
-            match timeout(remaining, self.lookup_rx.recv()).await {
-                Ok(Some(lookup)) => {
-                    lookups.push(lookup);
-                    // Try to drain more without waiting
-                    while lookups.len() < self.max_batch_size {
-                        match self.lookup_rx.try_recv() {
-                            Ok(lookup) => lookups.push(lookup),
-                            Err(_) => break,
+            let sleep = tokio::time::sleep(remaining);
+            tokio::select! {
+                biased;
+                maybe = self.lookup_rx.recv() => {
+                    match maybe {
+                        Some(lookup) => {
+                            lookups.push(lookup);
+                            while lookups.len() < self.max_batch_size {
+                                match self.lookup_rx.try_recv() {
+                                    Ok(lookup) => lookups.push(lookup),
+                                    Err(_) => break,
+                                }
+                            }
                         }
+                        None => break,
+                    }
+                }
+                _ = self.cluster_rx.changed() => {
+                    if !lookups.is_empty() {
+                        break;
                     }
                 }
-                Ok(None) => break, // Channel closed
-                Err(_) => break,   // Timeout
+                _ = sleep => break,
             }
 
             if lookups.len() >= self.max_batch_size {
@@ -115,7 +125,7 @@ impl LookupQueue {
     }
 
     /// Drains all remaining lookups from the queue.
-    pub fn drain_all(&mut self) -> Vec<LookupQuery> {
+    pub fn drain_all(&mut self) -> Vec<QueuedLookup> {
         let mut lookups = Vec::new();
 
         // Drain re-enqueued lookups
diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
index 4abb9d7eb7..efcd68538f 100644
--- a/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
@@ -15,72 +15,161 @@
 // specific language governing permissions and limitations
 // under the License.
 
-//! Lookup sender that processes batched lookup requests.
-//!
-//! The sender runs as a background task, draining lookups from the queue,
-//! grouping them by destination server, and sending batched requests.
-
-use super::{LookupQuery, LookupQueue};
+use super::{LookupQueue, QueuedLookup};
+use crate::client::lookup::lookup_query::LookupQuery;
 use crate::client::metadata::Metadata;
 use crate::error::{Error, FlussError, Result};
 use crate::metadata::{TableBucket, TablePath};
-use crate::proto::LookupResponse;
+use crate::proto::{LookupResponse, PrefixLookupResponse};
 use crate::rpc::ServerConnection;
-use crate::rpc::message::LookupRequest;
+use crate::rpc::message::{
+    LookupRequest, PrefixLookupRequest, ReadVersionedType, RequestBody, WriteVersionedType,
+};
 use crate::{BucketId, PartitionId, TableId};
 use bytes::Bytes;
 use futures::stream::{FuturesUnordered, StreamExt};
 use log::{debug, error, warn};
 use std::collections::{HashMap, HashSet};
+use std::io::Cursor;
 use std::sync::Arc;
 use std::sync::atomic::{AtomicBool, Ordering};
 use std::time::Duration;
-use tokio::sync::{Semaphore, mpsc, watch};
+use tokio::sync::{OwnedSemaphorePermit, Semaphore, mpsc, watch};
 
-/// Server ID type alias for clarity.
 type ServerId = i32;
 
-/// Batches grouped by table bucket, keyed by server.
-type BatchesByLeader = HashMap<ServerId, HashMap<TableBucket, LookupBatch>>;
+type BatchesByLeader<T> = HashMap<ServerId, HashMap<TableBucket, LookupBatch<T>>>;
+type PrimaryBatches = BatchesByLeader<Option<Vec<u8>>>;
+type PrefixBatches = BatchesByLeader<Vec<Vec<u8>>>;
+
+struct BucketResponse<V> {
+    partition_id: Option<PartitionId>,
+    bucket_id: BucketId,
+    error_code: Option<i32>,
+    error_message: Option<String>,
+    values: Vec<V>,
+}
+
+trait LookupProtocol {
+    type Request: RequestBody<ResponseBody = Self::Response> + Send + WriteVersionedType<Vec<u8>>;
+    type Response: ReadVersionedType<Cursor<Vec<u8>>> + Send;
+    type Value: Send;
+
+    const OP_NAME: &'static str;
+
+    fn build_request(
+        table_id: TableId,
+        keys_by_bucket: Vec<(BucketId, Option<PartitionId>, Vec<Bytes>)>,
+    ) -> Self::Request;
+
+    fn decode_buckets(
+        response: Self::Response,
+    ) -> impl Iterator<Item = BucketResponse<Self::Value>>;
+}
+
+struct Primary;
+impl LookupProtocol for Primary {
+    type Request = LookupRequest;
+    type Response = LookupResponse;
+    type Value = Option<Vec<u8>>;
+
+    const OP_NAME: &'static str = "Lookup";
+
+    fn build_request(
+        table_id: TableId,
+        keys_by_bucket: Vec<(BucketId, Option<PartitionId>, Vec<Bytes>)>,
+    ) -> Self::Request {
+        LookupRequest::new_batched(table_id, keys_by_bucket)
+    }
+
+    fn decode_buckets(
+        response: Self::Response,
+    ) -> impl Iterator<Item = BucketResponse<Self::Value>> {
+        response.buckets_resp.into_iter().map(|r| BucketResponse {
+            partition_id: r.partition_id,
+            bucket_id: r.bucket_id,
+            error_code: r.error_code,
+            error_message: r.error_message,
+            values: r.values.into_iter().map(|pb| pb.values).collect(),
+        })
+    }
+}
+
+struct Prefix;
+impl LookupProtocol for Prefix {
+    type Request = PrefixLookupRequest;
+    type Response = PrefixLookupResponse;
+    type Value = Vec<Vec<u8>>;
+
+    const OP_NAME: &'static str = "Prefix lookup";
+
+    fn build_request(
+        table_id: TableId,
+        keys_by_bucket: Vec<(BucketId, Option<PartitionId>, Vec<Bytes>)>,
+    ) -> Self::Request {
+        PrefixLookupRequest::new_batched(table_id, keys_by_bucket)
+    }
+
+    fn decode_buckets(
+        response: Self::Response,
+    ) -> impl Iterator<Item = BucketResponse<Self::Value>> {
+        response.buckets_resp.into_iter().map(|r| BucketResponse {
+            partition_id: r.partition_id,
+            bucket_id: r.bucket_id,
+            error_code: r.error_code,
+            error_message: r.error_message,
+            values: r.value_lists.into_iter().map(|pb| pb.values).collect(),
+        })
+    }
+}
 
-/// Result of grouping lookups by leader.
 struct GroupByLeaderResult {
-    /// Lookup batches grouped by leader server.
-    batches_by_leader: BatchesByLeader,
-    /// Tables with unknown leaders that need metadata refresh.
+    primary: PrimaryBatches,
+    prefix: PrefixBatches,
     unknown_leader_tables: HashSet<TablePath>,
-    /// Partition IDs with unknown leaders.
     unknown_leader_partition_ids: HashSet<PartitionId>,
 }
 
-/// Lookup sender that batches and sends lookup requests.
+impl GroupByLeaderResult {
+    fn is_empty(&self) -> bool {
+        self.primary.is_empty() && self.prefix.is_empty()
+    }
+
+    /// Merges `other`'s batches (not its unknown sets). A `(server, bucket)` overlap would be
+    /// overwritten by `extend`; assumed absent: the second pass only re-groups first-pass unknowns.
+    fn merge_batches(&mut self, other: GroupByLeaderResult) {
+        for (server, inner) in other.primary {
+            self.primary.entry(server).or_default().extend(inner);
+        }
+        for (server, inner) in other.prefix {
+            self.prefix.entry(server).or_default().extend(inner);
+        }
+    }
+}
+
+struct GroupingResult {
+    groups: GroupByLeaderResult,
+    unknowns: Vec<QueuedLookup>,
+}
+
 pub struct LookupSender {
-    /// Metadata for leader lookup
     metadata: Arc<Metadata>,
-    /// The lookup queue to drain from
     queue: LookupQueue,
-    /// Channel to re-enqueue failed lookups
-    re_enqueue_tx: mpsc::UnboundedSender<LookupQuery>,
-    /// Semaphore to limit in-flight requests
+    re_enqueue_tx: mpsc::UnboundedSender<QueuedLookup>,
     inflight_semaphore: Arc<Semaphore>,
-    /// Maximum number of retries
     max_retries: i32,
-    /// Whether the sender is running
     running: AtomicBool,
-    /// Whether to force close (abandon pending lookups)
     force_close: AtomicBool,
-    /// Shutdown signal receiver
     shutdown_rx: watch::Receiver<bool>,
 }
 
-/// A batch of lookups going to the same table bucket.
-struct LookupBatch {
+struct LookupBatch<T> {
     table_bucket: TableBucket,
-    lookups: Vec<LookupQuery>,
+    lookups: Vec<LookupQuery<T>>,
     keys: Vec<Bytes>,
 }
 
-impl LookupBatch {
+impl<T> LookupBatch<T> {
     fn new(table_bucket: TableBucket) -> Self {
         Self {
             table_bucket,
@@ -89,12 +178,12 @@ impl LookupBatch {
         }
     }
 
-    fn add_lookup(&mut self, lookup: LookupQuery) {
+    fn add_lookup(&mut self, lookup: LookupQuery<T>) {
         self.keys.push(lookup.key().clone());
         self.lookups.push(lookup);
     }
 
-    fn complete(&mut self, values: Vec<Option<Vec<u8>>>) {
+    fn complete(&mut self, values: Vec<T>) {
         if values.len() != self.lookups.len() {
             let err_msg = format!(
                 "The number of return values ({}) does not match the number of lookups ({})",
@@ -102,10 +191,10 @@ impl LookupBatch {
                 self.lookups.len()
             );
             for lookup in &mut self.lookups {
-                lookup.complete(Err(Error::UnexpectedError {
+                lookup.complete_with_error(Error::UnexpectedError {
                     message: err_msg.clone(),
                     source: None,
-                }));
+                });
             }
             return;
         }
@@ -115,22 +204,29 @@ impl LookupBatch {
         }
     }
 
-    fn complete_exceptionally(&mut self, error_msg: &str) {
+    fn complete_all_with_error(&mut self, error_msg: &str) {
         for lookup in &mut self.lookups {
-            lookup.complete(Err(Error::UnexpectedError {
+            lookup.complete_with_error(Error::UnexpectedError {
                 message: error_msg.to_string(),
                 source: None,
-            }));
+            });
         }
     }
+
+    fn keys_tuple(&mut self) -> (BucketId, Option<PartitionId>, Vec<Bytes>) {
+        (
+            self.table_bucket.bucket_id(),
+            self.table_bucket.partition_id(),
+            std::mem::take(&mut self.keys),
+        )
+    }
 }
 
 impl LookupSender {
-    /// Creates a new lookup sender.
     pub fn new(
         metadata: Arc<Metadata>,
         queue: LookupQueue,
-        re_enqueue_tx: mpsc::UnboundedSender<LookupQuery>,
+        re_enqueue_tx: mpsc::UnboundedSender<QueuedLookup>,
         max_inflight_requests: usize,
         max_retries: i32,
         shutdown_rx: watch::Receiver<bool>,
@@ -147,14 +243,12 @@ impl LookupSender {
         }
     }
 
-    /// Runs the sender loop.
     pub async fn run(&mut self) {
         debug!("Starting Fluss lookup sender");
 
         let mut shutdown_rx = self.shutdown_rx.clone();
 
         while self.running.load(Ordering::Acquire) {
-            // Check for shutdown signal before entering select
             if *shutdown_rx.borrow() {
                 debug!("Lookup sender received shutdown signal");
                 self.initiate_close();
@@ -163,16 +257,12 @@ impl LookupSender {
 
             tokio::select! {
                 biased;
-
-                // Check shutdown signal
                 _ = shutdown_rx.changed() => {
                     if *shutdown_rx.borrow() {
                         debug!("Lookup sender received shutdown signal during select");
                         self.initiate_close();
                     }
                 }
-
-                // Process lookups
                 result = self.run_once(false) => {
                     if let Err(e) = result {
                         error!("Error in lookup sender: {}", e);
@@ -183,8 +273,7 @@ impl LookupSender {
 
         debug!("Beginning shutdown of lookup sender, sending remaining lookups");
 
-        // Process remaining lookups during shutdown
-        // TODO: Check the in flight request count in the accumulator.
+        // TODO: Check the in-flight request count in the accumulator.
         if !self.force_close.load(Ordering::Acquire) && self.queue.has_undrained() {
             if let Err(e) = self.run_once(true).await {
                 error!("Error during lookup sender shutdown: {}", e);
@@ -195,7 +284,6 @@ impl LookupSender {
         debug!("Lookup sender shutdown complete");
     }
 
-    /// Runs a single iteration of the sender loop.
     async fn run_once(&mut self, drain_all: bool) -> Result<()> {
         let lookups = if drain_all {
             self.queue.drain_all()
@@ -206,24 +294,24 @@ impl LookupSender {
         self.send_lookups(lookups).await
     }
 
-    /// Groups and sends lookups to appropriate servers.
-    async fn send_lookups(&self, lookups: Vec<LookupQuery>) -> Result<()> {
+    async fn send_lookups(&self, lookups: Vec<QueuedLookup>) -> Result<()> {
         if lookups.is_empty() {
             return Ok(());
         }
 
-        // Group by leader
-        let GroupByLeaderResult {
-            batches_by_leader: lookup_batches,
-            unknown_leader_tables,
-            unknown_leader_partition_ids,
+        let GroupingResult {
+            mut groups,
+            unknowns,
         } = self.group_by_leader(lookups);
 
-        // Update metadata for tables with unknown leaders
-        if !unknown_leader_tables.is_empty() {
-            let table_paths_refs: HashSet<&TablePath> = unknown_leader_tables.iter().collect();
-            let partition_ids: Vec<PartitionId> =
-                unknown_leader_partition_ids.into_iter().collect();
+        if !unknowns.is_empty() {
+            let table_paths_refs: HashSet<&TablePath> =
+                groups.unknown_leader_tables.iter().collect();
+            let partition_ids: Vec<PartitionId> = groups
+                .unknown_leader_partition_ids
+                .iter()
+                .copied()
+                .collect();
             if let Err(e) = self
                 .metadata
                 .update_tables_metadata(&table_paths_refs, &HashSet::new(), partition_ids)
@@ -233,38 +321,57 @@ impl LookupSender {
             } else {
                 debug!(
                     "Updated metadata due to unknown leader tables during lookup: {:?}",
-                    unknown_leader_tables
+                    groups.unknown_leader_tables
                 );
             }
-        }
 
-        // If no lookup batches, sleep a bit to avoid busy loop. This case will happen when there is
-        // no leader for all the lookup request in queue.
-        if lookup_batches.is_empty() && !self.queue.has_undrained() {
-            // TODO: May use wait/notify mechanism to avoid active sleep, and use a dynamic sleep time based on the request waited time.
-            tokio::time::sleep(Duration::from_millis(100)).await;
-            return Ok(());
-        }
+            // Re-group with fresh cluster state; dispatch what resolved, re-enqueue the rest.
+            let retry = self.group_by_leader(unknowns);
+            groups.merge_batches(retry.groups);
+            for item in retry.unknowns {
+                self.re_enqueue_lookup(item);
+            }
 
-        // Send batches to each destination
-        let mut pending = FuturesUnordered::new();
-        for (destination, batches) in lookup_batches {
-            pending.push(self.send_lookup_request(destination, batches));
+            // Nothing to dispatch even after refresh — back off to avoid a tight RPC loop.
+            if groups.is_empty() {
+                let mut cluster_rx = self.metadata.subscribe_cluster_changes();
+                tokio::select! {
+                    _ = cluster_rx.changed() => {}
+                    _ = tokio::time::sleep(Duration::from_millis(100)) => {}
+                }
+                return Ok(());
+            }
         }
-        while let Some(()) = pending.next().await {}
+
+        let primary_fut = async {
+            let mut pending = FuturesUnordered::new();
+            for (server, batches) in groups.primary {
+                pending.push(self.send_request::<Primary>(server, batches));
+            }
+            while pending.next().await.is_some() {}
+        };
+        let prefix_fut = async {
+            let mut pending = FuturesUnordered::new();
+            for (server, batches) in groups.prefix {
+                pending.push(self.send_request::<Prefix>(server, batches));
+            }
+            while pending.next().await.is_some() {}
+        };
+        tokio::join!(primary_fut, prefix_fut);
 
         Ok(())
     }
 
-    /// Groups lookups by leader server.
-    fn group_by_leader(&self, lookups: Vec<LookupQuery>) -> GroupByLeaderResult {
+    fn group_by_leader(&self, lookups: Vec<QueuedLookup>) -> GroupingResult {
         let cluster = self.metadata.get_cluster();
-        let mut batches_by_leader: BatchesByLeader = HashMap::new();
+        let mut primary: PrimaryBatches = HashMap::new();
+        let mut prefix: PrefixBatches = HashMap::new();
         let mut unknown_leader_tables: HashSet<TablePath> = HashSet::new();
         let mut unknown_leader_partition_ids: HashSet<PartitionId> = HashSet::new();
+        let mut unknowns: Vec<QueuedLookup> = Vec::new();
 
-        for lookup in lookups {
-            let table_bucket = lookup.table_bucket().clone();
+        for query in lookups {
+            let table_bucket = query.table_bucket().clone();
 
             let leader = match cluster.leader_for(&table_bucket) {
                 Some(leader) => leader.id(),
@@ -273,276 +380,334 @@ impl LookupSender {
                         "No leader found for table bucket {} during lookup",
                         table_bucket
                     );
-                    // Collect tables with unknown leaders for metadata update
-                    unknown_leader_tables.insert(lookup.table_path().clone());
+                    unknown_leader_tables.insert(query.table_path().clone());
                     if let Some(partition_id) = table_bucket.partition_id() {
                         unknown_leader_partition_ids.insert(partition_id);
                     }
-                    self.re_enqueue_lookup(lookup);
+                    unknowns.push(query);
                     continue;
                 }
             };
 
-            batches_by_leader
-                .entry(leader)
-                .or_default()
-                .entry(table_bucket.clone())
-                .or_insert_with(|| LookupBatch::new(table_bucket))
-                .add_lookup(lookup);
+            match query {
+                QueuedLookup::Primary(q) => {
+                    primary
+                        .entry(leader)
+                        .or_default()
+                        .entry(table_bucket.clone())
+                        .or_insert_with(|| LookupBatch::new(table_bucket))
+                        .add_lookup(q);
+                }
+                QueuedLookup::Prefix(q) => {
+                    prefix
+                        .entry(leader)
+                        .or_default()
+                        .entry(table_bucket.clone())
+                        .or_insert_with(|| LookupBatch::new(table_bucket))
+                        .add_lookup(q);
+                }
+            }
         }
 
-        GroupByLeaderResult {
-            batches_by_leader,
-            unknown_leader_tables,
-            unknown_leader_partition_ids,
+        GroupingResult {
+            groups: GroupByLeaderResult {
+                primary,
+                prefix,
+                unknown_leader_tables,
+                unknown_leader_partition_ids,
+            },
+            unknowns,
         }
     }
 
-    /// Sends lookup requests to a specific destination server.
-    async fn send_lookup_request(
+    async fn send_request<P: LookupProtocol>(
         &self,
-        destination: i32,
-        batches_by_bucket: HashMap<TableBucket, LookupBatch>,
-    ) {
-        // Group by table_id for request batching
-        let mut batches_by_table: HashMap<TableId, Vec<LookupBatch>> = HashMap::new();
-        for (table_bucket, batch) in batches_by_bucket {
-            batches_by_table
-                .entry(table_bucket.table_id())
-                .or_default()
-                .push(batch);
+        destination: ServerId,
+        batches_by_bucket: HashMap<TableBucket, LookupBatch<P::Value>>,
+    ) where
+        LookupQuery<P::Value>: Into<QueuedLookup>,
+    {
+        let mut batches_by_table = group_by_table(batches_by_bucket);
+        let connection = match self
+            .connect_or_fail(destination, &mut batches_by_table)
+            .await
+        {
+            Some(conn) => conn,
+            None => return,
+        };
+
+        let mut pending = FuturesUnordered::new();
+        for (table_id, mut batches) in batches_by_table {
+            let keys_by_bucket: Vec<_> = batches.iter_mut().map(|b| b.keys_tuple()).collect();
+            let request = P::build_request(table_id, keys_by_bucket);
+            pending.push(self.send_single_table_lookup::<P>(
+                table_id,
+                destination,
+                connection.clone(),
+                request,
+                batches,
+            ));
         }
+        while pending.next().await.is_some() {}
+    }
 
+    async fn connect_or_fail<T>(
+        &self,
+        destination: ServerId,
+        batches_by_table: &mut HashMap<TableId, Vec<LookupBatch<T>>>,
+    ) -> Option<ServerConnection>
+    where
+        LookupQuery<T>: Into<QueuedLookup>,
+    {
         let cluster = self.metadata.get_cluster();
         let tablet_server = match cluster.get_tablet_server(destination) {
             Some(server) => server.clone(),
             None => {
                 let err_msg = format!("Server {} is not found in metadata cache", destination);
-                for batches in batches_by_table.into_values() {
-                    for mut batch in batches {
-                        self.handle_lookup_error(&err_msg, true, &mut batch);
-                    }
-                }
-                return;
+                self.fail_all_batches(&err_msg, true, batches_by_table);
+                return None;
             }
         };
 
-        let connection = match self.metadata.get_connection(&tablet_server).await {
-            Ok(conn) => conn,
+        match self.metadata.get_connection(&tablet_server).await {
+            Ok(conn) => Some(conn),
             Err(e) => {
                 let err_msg = format!("Failed to get connection to server {}: {}", destination, e);
-                for batches in batches_by_table.into_values() {
-                    for mut batch in batches {
-                        self.handle_lookup_error(&err_msg, true, &mut batch);
-                    }
-                }
-                return;
+                self.fail_all_batches(&err_msg, true, batches_by_table);
+                None
             }
-        };
+        }
+    }
 
-        let mut pending = FuturesUnordered::new();
-        for (table_id, mut batches) in batches_by_table {
-            let mut all_keys_by_bucket: Vec<(BucketId, Option<PartitionId>, Vec<Bytes>)> =
-                Vec::new();
-            for batch in &mut batches {
-                all_keys_by_bucket.push((
-                    batch.table_bucket.bucket_id(),
-                    batch.table_bucket.partition_id(),
-                    std::mem::take(&mut batch.keys),
-                ));
+    fn fail_all_batches<T>(
+        &self,
+        err_msg: &str,
+        is_retriable: bool,
+        batches_by_table: &mut HashMap<TableId, Vec<LookupBatch<T>>>,
+    ) where
+        LookupQuery<T>: Into<QueuedLookup>,
+    {
+        for batches in batches_by_table.values_mut() {
+            for batch in batches.iter_mut() {
+                self.handle_batch_error(err_msg, is_retriable, batch);
             }
-
-            let request = LookupRequest::new_batched(table_id, all_keys_by_bucket);
-            let conn = connection.clone();
-            pending.push(self.send_single_table_lookup(
-                table_id,
-                destination,
-                conn,
-                request,
-                batches,
-            ));
         }
-
-        while let Some(()) = pending.next().await {}
     }
 
-    /// Sends a single lookup request for one table and handles the response.
-    async fn send_single_table_lookup(
+    async fn send_single_table_lookup<P: LookupProtocol>(
         &self,
         table_id: TableId,
-        destination: i32,
+        destination: ServerId,
         connection: ServerConnection,
-        request: LookupRequest,
-        mut batches: Vec<LookupBatch>,
-    ) {
-        let _permit = match self.inflight_semaphore.clone().acquire_owned().await {
-            Ok(permit) => permit,
-            Err(_) => {
-                error!("Semaphore closed during lookup");
-                for batch in &mut batches {
-                    batch.complete_exceptionally("Lookup sender shutdown");
-                }
-                return;
-            }
+        request: P::Request,
+        mut batches: Vec<LookupBatch<P::Value>>,
+    ) where
+        LookupQuery<P::Value>: Into<QueuedLookup>,
+    {
+        let _permit = match self.acquire_inflight_permit(&mut batches).await {
+            Some(p) => p,
+            None => return,
         };
 
         match connection.request(request).await {
             Ok(response) => {
-                self.handle_lookup_response(table_id, destination, response, &mut batches);
+                self.handle_response::<P>(table_id, destination, response, &mut batches);
             }
             Err(e) => {
-                let err_msg = format!("Lookup request failed: {}", e);
+                let err_msg = format!("{} request failed: {}", P::OP_NAME, e);
                 let is_retriable = e.is_retriable();
                 for batch in &mut batches {
-                    self.handle_lookup_error(&err_msg, is_retriable, batch);
+                    self.handle_batch_error(&err_msg, is_retriable, batch);
+                }
+            }
+        }
+    }
+
+    async fn acquire_inflight_permit<T>(
+        &self,
+        batches: &mut [LookupBatch<T>],
+    ) -> Option<OwnedSemaphorePermit> {
+        match self.inflight_semaphore.clone().acquire_owned().await {
+            Ok(p) => Some(p),
+            Err(_) => {
+                error!("Semaphore closed during lookup");
+                for batch in batches.iter_mut() {
+                    batch.complete_all_with_error("Lookup sender shutdown");
                 }
+                None
             }
         }
     }
 
-    /// Handles the lookup response.
-    fn handle_lookup_response(
+    fn handle_response<P: LookupProtocol>(
         &self,
         table_id: TableId,
-        destination: i32,
-        response: LookupResponse,
-        batches: &mut [LookupBatch],
-    ) {
-        let bucket_to_index: HashMap<TableBucket, usize> = batches
-            .iter()
-            .enumerate()
-            .map(|(idx, batch)| (batch.table_bucket.clone(), idx))
-            .collect();
-
-        // Track which batches have been processed
-        let mut processed_batches = vec![false; batches.len()];
-
-        for bucket_resp in response.buckets_resp {
+        destination: ServerId,
+        response: P::Response,
+        batches: &mut [LookupBatch<P::Value>],
+    ) where
+        LookupQuery<P::Value>: Into<QueuedLookup>,
+    {
+        let bucket_to_index = build_bucket_index(batches);
+        let mut processed = vec![false; batches.len()];
+
+        for bucket_resp in P::decode_buckets(response) {
             let table_bucket = TableBucket::new_with_partition(
                 table_id,
                 bucket_resp.partition_id,
                 bucket_resp.bucket_id,
             );
-            if let Some(&batch_idx) = bucket_to_index.get(&table_bucket) {
-                processed_batches[batch_idx] = true;
-                let batch = &mut batches[batch_idx];
-
-                // Check for errors
-                if let Some(error_code) = bucket_resp.error_code {
-                    let fluss_error = FlussError::for_code(error_code);
-                    if fluss_error != FlussError::None {
-                        let err_msg = format!(
-                            "Lookup error for bucket {}: code={}, message={}",
-                            table_bucket,
-                            error_code,
-                            bucket_resp.error_message.unwrap_or_default()
-                        );
-                        let is_retriable = fluss_error.is_retriable();
-                        self.handle_lookup_error(&err_msg, is_retriable, batch);
-                        continue;
-                    }
-                }
-
-                // Extract values
-                let values: Vec<Option<Vec<u8>>> = bucket_resp
-                    .values
-                    .into_iter()
-                    .map(|pb_value| pb_value.values)
-                    .collect();
-
-                batch.complete(values);
-            } else {
+            let Some(&idx) = bucket_to_index.get(&table_bucket) else {
                 error!(
-                    "Received response for unknown bucket {} from server {}",
-                    table_bucket, destination
+                    "Received {} response for unknown bucket {} from server {}",
+                    P::OP_NAME,
+                    table_bucket,
+                    destination
                 );
+                continue;
+            };
+            processed[idx] = true;
+            let batch = &mut batches[idx];
+
+            if let Some(err) = extract_bucket_error(
+                bucket_resp.error_code,
+                bucket_resp.error_message,
+                &table_bucket,
+                P::OP_NAME,
+            ) {
+                self.handle_batch_error(&err.message, err.is_retriable, batch);
+                continue;
             }
+
+            batch.complete(bucket_resp.values);
         }
 
-        // Handle any batches that were not included in the response
-        for (idx, processed) in processed_batches.iter().enumerate() {
-            if !processed {
+        self.fail_unprocessed_batches(&processed, batches, destination, P::OP_NAME);
+    }
+
+    fn fail_unprocessed_batches<T>(
+        &self,
+        processed: &[bool],
+        batches: &mut [LookupBatch<T>],
+        destination: ServerId,
+        op_name: &'static str,
+    ) where
+        LookupQuery<T>: Into<QueuedLookup>,
+    {
+        for (idx, was_processed) in processed.iter().enumerate() {
+            if !was_processed {
                 let batch = &mut batches[idx];
-                // If the batch has lookups that haven't been processed, retry them
-                if !batch.lookups.is_empty() {
-                    let err_msg = format!(
-                        "Bucket {} response missing from server {}",
-                        batch.table_bucket.bucket_id(),
-                        destination
-                    );
-                    // Treat missing bucket response as retriable
-                    self.handle_lookup_error(&err_msg, true, batch);
-                }
+                let err_msg = format!(
+                    "Bucket {} {} response missing from server {}",
+                    batch.table_bucket.bucket_id(),
+                    op_name,
+                    destination
+                );
+                self.handle_batch_error(&err_msg, true, batch);
             }
         }
     }
 
-    /// Handles lookup errors with retry logic.
-    fn handle_lookup_error(&self, error_msg: &str, is_retriable: bool, batch: &mut LookupBatch) {
-        let mut lookups_to_retry = Vec::new();
-        let mut lookups_to_complete = Vec::new();
+    fn handle_batch_error<T>(&self, error_msg: &str, is_retriable: bool, batch: &mut LookupBatch<T>)
+    where
+        LookupQuery<T>: Into<QueuedLookup>,
+    {
+        let mut retried = 0usize;
+        let mut failed = 0usize;
+        let table_bucket = batch.table_bucket.clone();
 
-        for lookup in batch.lookups.drain(..) {
+        for mut lookup in batch.lookups.drain(..) {
             if is_retriable && lookup.retries() < self.max_retries && !lookup.is_done() {
-                lookups_to_retry.push(lookup);
+                lookup.increment_retries();
+                self.re_enqueue_lookup(lookup.into());
+                retried += 1;
             } else {
-                lookups_to_complete.push(lookup);
+                lookup.complete_with_error(Error::UnexpectedError {
+                    message: error_msg.to_string(),
+                    source: None,
+                });
+                failed += 1;
             }
         }
 
-        // Re-enqueue retriable lookups
-        if !lookups_to_retry.is_empty() {
+        if retried > 0 {
             warn!(
                 "Lookup error for bucket {}, retrying {} lookups: {}",
-                batch.table_bucket,
-                lookups_to_retry.len(),
-                error_msg
+                table_bucket, retried, error_msg
             );
-            for mut lookup in lookups_to_retry {
-                lookup.increment_retries();
-                self.re_enqueue_lookup(lookup);
-            }
         }
-
-        // Complete non-retriable lookups with error
-        if !lookups_to_complete.is_empty() {
+        if failed > 0 {
             warn!(
                 "Lookup failed for bucket {} ({} lookups): {}",
-                batch.table_bucket,
-                lookups_to_complete.len(),
-                error_msg
+                table_bucket, failed, error_msg
             );
-            for mut lookup in lookups_to_complete {
-                lookup.complete(Err(Error::UnexpectedError {
-                    message: error_msg.to_string(),
-                    source: None,
-                }));
-            }
         }
     }
 
-    /// Re-enqueues a lookup for retry.
-    fn re_enqueue_lookup(&self, lookup: LookupQuery) {
+    fn re_enqueue_lookup(&self, lookup: QueuedLookup) {
         if let Err(e) = self.re_enqueue_tx.send(lookup) {
-            // Ensure the caller does not hang by completing the lookup with an error.
             error!("Failed to re-enqueue lookup: {}", e);
             let mut failed_lookup = e.0;
-            failed_lookup.complete(Err(Error::UnexpectedError {
+            failed_lookup.complete_with_error(Error::UnexpectedError {
                 message: "Failed to re-enqueue lookup: channel closed".to_string(),
                 source: None,
-            }));
+            });
         }
     }
 
-    /// Initiates graceful shutdown of the sender.
     pub fn initiate_close(&mut self) {
         self.running.store(false, Ordering::Release);
     }
 
-    /// Forces immediate shutdown, abandoning pending lookups.
     #[allow(dead_code)]
     pub fn force_close(&mut self) {
         self.force_close.store(true, Ordering::Release);
         self.initiate_close();
     }
 }
+
+fn group_by_table<T>(
+    batches_by_bucket: HashMap<TableBucket, LookupBatch<T>>,
+) -> HashMap<TableId, Vec<LookupBatch<T>>> {
+    let mut out: HashMap<TableId, Vec<LookupBatch<T>>> = HashMap::new();
+    for (table_bucket, batch) in batches_by_bucket {
+        out.entry(table_bucket.table_id()).or_default().push(batch);
+    }
+    out
+}
+
+fn build_bucket_index<T>(batches: &[LookupBatch<T>]) -> HashMap<TableBucket, usize> {
+    batches
+        .iter()
+        .enumerate()
+        .map(|(idx, batch)| (batch.table_bucket.clone(), idx))
+        .collect()
+}
+
+struct BucketError {
+    message: String,
+    is_retriable: bool,
+}
+
+fn extract_bucket_error(
+    error_code: Option<i32>,
+    error_message: Option<String>,
+    table_bucket: &TableBucket,
+    op: &str,
+) -> Option<BucketError> {
+    let code = error_code?;
+    let fluss_error = FlussError::for_code(code);
+    if fluss_error == FlussError::None {
+        return None;
+    }
+    Some(BucketError {
+        message: format!(
+            "{} error for bucket {}: code={}, message={}",
+            op,
+            table_bucket,
+            code,
+            error_message.unwrap_or_default()
+        ),
+        is_retriable: fluss_error.is_retriable(),
+    })
+}
diff --git a/fluss-rust/crates/fluss/src/client/lookup/mod.rs b/fluss-rust/crates/fluss/src/client/lookup/mod.rs
index f96aa2ed33..ac2446a9e4 100644
--- a/fluss-rust/crates/fluss/src/client/lookup/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/lookup/mod.rs
@@ -35,5 +35,5 @@ mod lookup_queue;
 mod lookup_sender;
 
 pub use lookup_client::LookupClient;
-pub(crate) use lookup_query::LookupQuery;
+pub(crate) use lookup_query::{PrefixLookupQuery, PrimaryLookupQuery, QueuedLookup};
 pub(crate) use lookup_queue::LookupQueue;
diff --git a/fluss-rust/crates/fluss/src/client/metadata.rs b/fluss-rust/crates/fluss/src/client/metadata.rs
index 8581464733..1e3ee7fe1c 100644
--- a/fluss-rust/crates/fluss/src/client/metadata.rs
+++ b/fluss-rust/crates/fluss/src/client/metadata.rs
@@ -15,8 +15,9 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::PartitionId;
 use crate::cluster::{Cluster, ServerNode, ServerType};
-use crate::error::{Error, Result};
+use crate::error::{Error, FlussError, Result};
 use crate::metadata::{PhysicalTablePath, TableBucket, TablePath};
 use crate::proto::MetadataResponse;
 use crate::rpc::message::UpdateMetadataRequest;
@@ -26,24 +27,36 @@ use parking_lot::RwLock;
 use std::collections::HashSet;
 use std::net::{SocketAddr, ToSocketAddrs};
 use std::sync::Arc;
+use tokio::sync::watch;
 
-#[derive(Default)]
 pub struct Metadata {
     cluster: RwLock<Arc<Cluster>>,
     connections: Arc<RpcClient>,
     bootstrap: Arc<str>,
+    cluster_version_tx: watch::Sender<u64>,
 }
 
 impl Metadata {
     pub async fn new(bootstrap: &str, connections: Arc<RpcClient>) -> Result<Self> {
         let cluster = Self::init_cluster(bootstrap, connections.clone()).await?;
+        let (cluster_version_tx, _) = watch::channel(0);
         Ok(Metadata {
             cluster: RwLock::new(Arc::new(cluster)),
             connections,
             bootstrap: bootstrap.into(),
+            cluster_version_tx,
         })
     }
 
+    pub fn subscribe_cluster_changes(&self) -> watch::Receiver<u64> {
+        self.cluster_version_tx.subscribe()
+    }
+
+    fn notify_cluster_changed(&self) {
+        self.cluster_version_tx
+            .send_modify(|v| *v = v.wrapping_add(1));
+    }
+
     fn parse_bootstrap(boot_strap: &str) -> Result<SocketAddr> {
         // Resolve all socket addresses and deterministically choose one.
         let addrs = boot_strap
@@ -92,33 +105,41 @@ impl Metadata {
     pub(crate) async fn reinit_cluster(&self) -> Result<()> {
         let cluster = Self::init_cluster(&self.bootstrap, self.connections.clone()).await?;
         *self.cluster.write() = cluster.into();
+        self.notify_cluster_changed();
         Ok(())
     }
 
     pub fn invalidate_server(&self, server_id: &i32, table_ids: Vec<i64>) {
-        // Take a write lock for the entire operation to avoid races between
-        // reading the current cluster state and writing back the updated one.
-        let mut cluster_guard = self.cluster.write();
-        let updated_cluster = cluster_guard.invalidate_server(server_id, table_ids);
-        *cluster_guard = Arc::new(updated_cluster);
+        {
+            let mut cluster_guard = self.cluster.write();
+            let updated_cluster = cluster_guard.invalidate_server(server_id, table_ids);
+            *cluster_guard = Arc::new(updated_cluster);
+        }
+        self.notify_cluster_changed();
     }
 
     pub fn invalidate_physical_table_meta(
         &self,
         physical_tables_to_invalid: &HashSet<PhysicalTablePath>,
     ) {
-        let mut cluster_guard = self.cluster.write();
-        let updated_cluster =
-            cluster_guard.invalidate_physical_table_meta(physical_tables_to_invalid);
-        *cluster_guard = Arc::new(updated_cluster);
+        {
+            let mut cluster_guard = self.cluster.write();
+            let updated_cluster =
+                cluster_guard.invalidate_physical_table_meta(physical_tables_to_invalid);
+            *cluster_guard = Arc::new(updated_cluster);
+        }
+        self.notify_cluster_changed();
     }
 
     pub async fn update(&self, metadata_response: MetadataResponse) -> Result<()> {
         let origin_cluster = self.cluster.read().clone();
         let new_cluster =
             Cluster::from_metadata_response(metadata_response, Some(&origin_cluster))?;
-        let mut cluster = self.cluster.write();
-        *cluster = Arc::new(new_cluster);
+        {
+            let mut cluster = self.cluster.write();
+            *cluster = Arc::new(new_cluster);
+        }
+        self.notify_cluster_changed();
         Ok(())
     }
 
@@ -197,6 +218,27 @@ impl Metadata {
         Ok(())
     }
 
+    /// Looks up the partition id for `physical_table_path`: the cached cluster is
+    /// consulted first and, on a miss, metadata is refreshed once and re-checked.
+    /// A `PartitionNotExists` server error yields `Ok(None)`; other errors propagate.
+    pub async fn check_and_update_partition_metadata(
+        &self,
+        physical_table_path: &PhysicalTablePath,
+    ) -> Result<Option<PartitionId>> {
+        let cached = self.get_cluster().get_partition_id(physical_table_path);
+        if cached.is_some() {
+            return Ok(cached);
+        }
+        let target = Arc::new(physical_table_path.clone());
+        if let Err(err) = self.update_physical_table_metadata(&[target]).await {
+            if matches!(err.api_error(), Some(FlussError::PartitionNotExists)) {
+                return Ok(None);
+            }
+            return Err(err);
+        }
+        Ok(self.get_cluster().get_partition_id(physical_table_path))
+    }
+
     pub async fn get_connection(&self, server_node: &ServerNode) -> Result<ServerConnection> {
         let result = self.connections.get_connection(server_node).await?;
         Ok(result)
@@ -257,10 +299,12 @@ impl Metadata {
 #[cfg(test)]
 impl Metadata {
     pub(crate) fn new_for_test(cluster: Arc<Cluster>) -> Self {
+        let (cluster_version_tx, _) = watch::channel(0); // starts at 0; receiver half is discarded
         Metadata {
             cluster: RwLock::new(cluster),
             connections: Arc::new(RpcClient::new()),
             bootstrap: Arc::from(""),
+            cluster_version_tx,
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index add79210dc..2adb53e4c6 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -31,9 +31,9 @@ use std::sync::Arc;
 
 /// The result of a lookup operation.
 ///
-/// Contains the rows returned from a lookup. For primary key lookups,
-/// this will contain at most one row. For prefix key lookups (future),
-/// this may contain multiple rows.
+/// Contains the rows returned from a lookup. For primary-key lookups,
+/// this will contain at most one row. For prefix-key lookups, it may
+/// contain multiple rows.
 pub struct LookupResult {
     rows: Vec<Vec<u8>>,
     row_type: Arc<RowType>,
@@ -128,22 +128,9 @@ impl LookupResult {
     }
 }
 
-/// Configuration and factory struct for creating lookup operations.
-///
-/// `TableLookup` follows the same pattern as `TableScan` and `TableAppend`,
-/// providing a builder-style API for configuring lookup operations before
-/// creating the actual `Lookuper`.
-///
-/// # Example
-/// ```ignore
-/// let table = conn.get_table(&table_path).await?;
-/// let lookuper = table.new_lookup()?.create_lookuper()?;
-/// let result = lookuper.lookup(&row).await?;
-/// if let Some(value) = result.get_single_row() {
-///     println!("Found: {:?}", value);
-/// }
-/// ```
-// TODO: Add lookup_by(column_names) for prefix key lookups (PrefixKeyLookuper)
+/// Builder for lookup operations. `create_lookuper()` builds a primary-key
+/// `Lookuper`; `lookup_by(columns).create_lookuper()` builds a
+/// `PrefixKeyLookuper` for prefix scans.
 // TODO: Add create_typed_lookuper<T>() for typed lookups with POJO mapping
 pub struct TableLookup {
     lookup_client: Arc<LookupClient>,
@@ -164,6 +151,20 @@ impl TableLookup {
         }
     }
 
+    /// Switches the builder into prefix-scan mode, consuming `self` and handing
+    /// its client, table info and metadata to the returned `TablePrefixLookup`.
+    /// `lookup_column_names` should list the table's partition keys (if any)
+    /// followed by the bucket keys — a **bucket-key prefix** scan, not an
+    /// arbitrary primary-key prefix. Validation is deferred to `create_lookuper()`.
+    pub fn lookup_by(self, lookup_column_names: Vec<String>) -> TablePrefixLookup {
+        TablePrefixLookup {
+            lookup_client: self.lookup_client,
+            table_info: self.table_info,
+            metadata: self.metadata,
+            lookup_column_names,
+        }
+    }
+
     /// Creates a `Lookuper` for performing key-based lookups.
     ///
     /// The lookuper will automatically encode the key and compute the bucket
@@ -274,13 +275,13 @@ impl Lookuper {
                 Arc::clone(&self.table_path),
                 Some(partition_name),
             );
-            let cluster = self.metadata.get_cluster();
-            match cluster.get_partition_id(&physical_table_path) {
+            match self
+                .metadata
+                .check_and_update_partition_metadata(&physical_table_path)
+                .await?
+            {
                 Some(id) => Some(id),
-                None => {
-                    // Partition doesn't exist, return empty result (like Java)
-                    return Ok(LookupResult::empty(Arc::clone(&self.row_type)));
-                }
+                None => return Ok(LookupResult::empty(Arc::clone(&self.row_type))),
             }
         } else {
             None
@@ -314,6 +315,196 @@ impl Lookuper {
     }
 }
 
+/// Prefix-lookup builder returned by `TableLookup::lookup_by`; finish with `create_lookuper()`.
+pub struct TablePrefixLookup {
+    lookup_client: Arc<LookupClient>,
+    table_info: TableInfo,
+    metadata: Arc<Metadata>,
+    lookup_column_names: Vec<String>,
+}
+
+impl TablePrefixLookup {
+    /// Validates the lookup columns, then wires up a `PrefixKeyLookuper`.
+    pub fn create_lookuper(self) -> Result<PrefixKeyLookuper> {
+        validate_prefix_lookup(&self.table_info, &self.lookup_column_names)?;
+
+        // The bucketing function is chosen from the table's datalake format.
+        let data_lake_format = self.table_info.get_table_config().get_datalake_format()?;
+        let bucketing_function = <dyn BucketingFunction>::of(data_lake_format.as_ref());
+
+        // Keys are encoded from rows shaped like the lookup columns, not full rows.
+        let full_schema = self.table_info.row_type();
+        let lookup_row_type = full_schema.project_with_field_names(&self.lookup_column_names)?;
+        let bucket_key_names = self.table_info.get_bucket_keys().to_vec();
+        let prefix_key_encoder =
+            KeyEncoderFactory::of(&lookup_row_type, &bucket_key_names, &data_lake_format)?;
+
+        let partition_getter = self
+            .table_info
+            .is_partitioned()
+            .then(|| {
+                let partition_keys = Arc::clone(self.table_info.get_partition_keys());
+                PartitionGetter::new(&lookup_row_type, partition_keys)
+            })
+            .transpose()?;
+
+        Ok(PrefixKeyLookuper {
+            table_path: Arc::new(self.table_info.table_path.clone()),
+            row_type: Arc::new(self.table_info.row_type().clone()),
+            num_buckets: self.table_info.get_num_buckets(),
+            table_info: self.table_info,
+            metadata: self.metadata,
+            lookup_client: self.lookup_client,
+            bucketing_function,
+            prefix_key_encoder,
+            partition_getter,
+        })
+    }
+}
+
+/// Verifies that `lookup_columns` describe a valid prefix lookup on `table_info`.
+///
+/// The checks run in a fixed order and the first one that fails is returned as
+/// `Error::IllegalArgument`:
+///
+/// 1. the table has a primary key;
+/// 2. the table has at least one bucket key;
+/// 3. the bucket keys are a leading run of the physical primary keys;
+/// 4. on partitioned tables, every partition key is among the lookup columns;
+/// 5. the lookup columns minus the partition keys equal the bucket keys, in order;
+/// 6. the bucket keys are not the entire physical primary key.
+fn validate_prefix_lookup(table_info: &TableInfo, lookup_columns: &[String]) -> Result<()> {
+    // Every rejection below uses the same error variant; only the message differs.
+    let reject = |message: String| -> Result<()> { Err(Error::IllegalArgument { message }) };
+
+    // 1. Tables without a primary key are rejected outright.
+    if !table_info.has_primary_key() {
+        return reject(format!(
+            "Log table {} doesn't support prefix lookup",
+            table_info.get_table_path()
+        ));
+    }
+
+    let primary_keys = table_info.get_physical_primary_keys();
+    let bucket_keys = table_info.get_bucket_keys();
+
+    // 2. Without bucket keys there is no prefix to look up by.
+    if bucket_keys.is_empty() {
+        return reject(format!(
+            "Can not perform prefix lookup on table '{}', because it has no bucket keys.",
+            table_info.get_table_path()
+        ));
+    }
+
+    // 3. The bucket keys have to open the physical primary key.
+    if !primary_keys.starts_with(bucket_keys) {
+        return reject(format!(
+            "Can not perform prefix lookup on table '{}', because the bucket keys {:?} \
+             is not a prefix subset of the physical primary keys {:?} \
+             (excluded partition fields if present).",
+            table_info.get_table_path(),
+            bucket_keys,
+            primary_keys,
+        ));
+    }
+
+    // 4. Partitioned tables need every partition key among the lookup columns.
+    let partition_keys: &[String] = table_info.get_partition_keys();
+    if table_info.is_partitioned()
+        && !partition_keys.iter().all(|pk| lookup_columns.contains(pk))
+    {
+        return reject(format!(
+            "Can not perform prefix lookup on table '{}', because the lookup columns \
+             {:?} must contain all partition fields {:?}.",
+            table_info.get_table_path(),
+            lookup_columns,
+            partition_keys,
+        ));
+    }
+
+    // 5. What remains after dropping partition keys must be exactly the bucket keys.
+    let physical_lookup_columns = lookup_columns
+        .iter()
+        .filter(|c| !partition_keys.contains(*c));
+    if !physical_lookup_columns.eq(bucket_keys.iter()) {
+        return reject(format!(
+            "Can not perform prefix lookup on table '{}', because the lookup columns {:?} \
+             must contain all bucket keys {:?} in order.",
+            table_info.get_table_path(),
+            lookup_columns,
+            bucket_keys,
+        ));
+    }
+
+    // 6. A "prefix" covering the whole key is an ordinary primary-key lookup.
+    if bucket_keys == primary_keys {
+        return reject(format!(
+            "Can not perform prefix lookup on table '{}', because the lookup columns {:?} \
+             equals the physical primary keys {:?}. \
+             Please use primary key lookup (Lookuper without lookup_by) instead.",
+            table_info.get_table_path(),
+            lookup_columns,
+            primary_keys,
+        ));
+    }
+
+    Ok(())
+}
+
+/// Runs prefix lookups for one table; built by `TablePrefixLookup::create_lookuper`.
+pub struct PrefixKeyLookuper {
+    table_path: Arc<TablePath>,
+    table_info: TableInfo,
+    row_type: Arc<RowType>,
+    metadata: Arc<Metadata>,
+    lookup_client: Arc<LookupClient>,
+    bucketing_function: Box<dyn BucketingFunction>,
+    prefix_key_encoder: Box<dyn KeyEncoder>,
+    partition_getter: Option<PartitionGetter>,
+    num_buckets: i32,
+}
+
+impl PrefixKeyLookuper {
+    /// Encodes `row` as a prefix key, resolves its partition (if the table is
+    /// partitioned) and bucket, and returns the rows found by the prefix lookup.
+    pub async fn lookup(&mut self, row: &dyn InternalRow) -> Result<LookupResult> {
+        let prefix_bytes = self.prefix_key_encoder.encode_key(row)?;
+
+        let mut partition_id = None;
+        if let Some(partition_getter) = self.partition_getter.as_ref() {
+            let partition_name = partition_getter.get_partition(row)?;
+            let physical_table_path = PhysicalTablePath::of_partitioned(
+                Arc::clone(&self.table_path),
+                Some(partition_name),
+            );
+            partition_id = self
+                .metadata
+                .check_and_update_partition_metadata(&physical_table_path)
+                .await?;
+            if partition_id.is_none() {
+                return Ok(LookupResult::empty(Arc::clone(&self.row_type)));
+            }
+        }
+
+        let bucket_id = self
+            .bucketing_function
+            .bucketing(&prefix_bytes, self.num_buckets)?;
+
+        let table_id = self.table_info.get_table_id();
+        let target_bucket = TableBucket::new_with_partition(table_id, partition_id, bucket_id);
+        let rows = self
+            .lookup_client
+            .prefix_lookup(self.table_path.as_ref().clone(), target_bucket, prefix_bytes)
+            .await?;
+        Ok(LookupResult::new(rows, Arc::clone(&self.row_type)))
+    }
+
+    /// Returns the table info this lookuper was created with.
+    pub fn table_info(&self) -> &TableInfo {
+        &self.table_info
+    }
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 12807988d8..2d3d01712d 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -33,7 +33,7 @@ mod scanner;
 mod upsert;
 
 pub use append::{AppendWriter, TableAppend};
-pub use lookup::{LookupResult, Lookuper, TableLookup};
+pub use lookup::{LookupResult, Lookuper, PrefixKeyLookuper, TableLookup, TablePrefixLookup};
 pub use remote_log::{
     DEFAULT_REMOTE_FILE_DOWNLOAD_THREAD_NUM, DEFAULT_SCANNER_REMOTE_LOG_PREFETCH_NUM,
 };
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index 8f081c2d3b..f32d6b2434 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -376,6 +376,34 @@ message PbValue {
   optional bytes values = 1;
 }
 
+// Prefix lookup request and response (the Rust client sends it under API key 1034).
+message PrefixLookupRequest {
+  required int64 table_id = 1;
+  repeated PbPrefixLookupReqForBucket buckets_req = 2; // one entry per targeted bucket
+}
+
+message PrefixLookupResponse {
+  repeated PbPrefixLookupRespForBucket buckets_resp = 1; // per-bucket results
+}
+
+message PbPrefixLookupReqForBucket {
+  optional int64 partition_id = 1; // left unset by the Rust client for non-partitioned tables
+  required int32 bucket_id = 2;
+  repeated bytes keys = 3; // encoded prefix keys to look up in this bucket
+}
+
+message PbPrefixLookupRespForBucket {
+  optional int64 partition_id = 1;
+  required int32 bucket_id = 2;
+  optional int32 error_code = 3; // NOTE(review): presumably set only when this bucket failed — confirm
+  optional string error_message = 4;
+  repeated PbValueList value_lists = 5; // NOTE(review): presumably one list per requested key — confirm
+}
+
+message PbValueList {
+  repeated bytes values = 1; // NOTE(review): presumably the encoded rows matching one prefix key — confirm
+}
+
 message PbPartitionSpec {
   repeated PbKeyValue partition_key_values = 1;
 }
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index 5e4fddfe52..d52497837d 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -39,6 +39,7 @@ pub enum ApiKey {
     InitWriter,                 // 1026
     GetLatestLakeSnapshot,      // 1032
     LimitScan,                  // 1033
+    PrefixLookup,               // 1034
     GetDatabaseInfo,            // 1035
     CreatePartition,            // 1036
     DropPartition,              // 1037
@@ -69,6 +70,7 @@ impl From<i16> for ApiKey {
             1026 => ApiKey::InitWriter,
             1032 => ApiKey::GetLatestLakeSnapshot,
             1033 => ApiKey::LimitScan,
+            1034 => ApiKey::PrefixLookup,
             1035 => ApiKey::GetDatabaseInfo,
             1036 => ApiKey::CreatePartition,
             1037 => ApiKey::DropPartition,
@@ -102,6 +104,7 @@ impl From<ApiKey> for i16 {
             ApiKey::InitWriter => 1026,
             ApiKey::GetLatestLakeSnapshot => 1032,
             ApiKey::LimitScan => 1033,
+            ApiKey::PrefixLookup => 1034,
             ApiKey::GetDatabaseInfo => 1035,
             ApiKey::CreatePartition => 1036,
             ApiKey::DropPartition => 1037,
@@ -138,6 +141,7 @@ mod tests {
             (1026, ApiKey::InitWriter),
             (1032, ApiKey::GetLatestLakeSnapshot),
             (1033, ApiKey::LimitScan),
+            (1034, ApiKey::PrefixLookup),
             (1035, ApiKey::GetDatabaseInfo),
             (1036, ApiKey::CreatePartition),
             (1037, ApiKey::DropPartition),
diff --git a/fluss-rust/crates/fluss/src/rpc/message/lookup.rs b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
index e181c5c62a..07f8e06ce7 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
@@ -22,7 +22,9 @@ use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
 use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::{
+    BucketId, PartitionId, TableId, impl_read_version_type, impl_write_version_type, proto,
+};
 use bytes::Bytes;
 use prost::Message;
 
@@ -33,37 +35,17 @@ pub struct LookupRequest {
 }
 
 impl LookupRequest {
-    pub fn new(
-        table_id: i64,
-        partition_id: Option<i64>,
-        bucket_id: i32,
-        keys: Vec<Vec<u8>>,
+    pub fn new_batched(
+        table_id: TableId,
+        buckets: Vec<(BucketId, Option<PartitionId>, Vec<Bytes>)>,
     ) -> Self {
-        let bucket_req = proto::PbLookupReqForBucket {
-            partition_id,
-            bucket_id,
-            key: keys,
-        };
-
-        let request = proto::LookupRequest {
-            table_id,
-            buckets_req: vec![bucket_req],
-        };
-
-        Self {
-            inner_request: request,
-        }
-    }
-
-    /// Creates a new batched lookup request with multiple buckets.
-    pub fn new_batched(table_id: i64, buckets: Vec<(i32, Option<i64>, Vec<Bytes>)>) -> Self {
         let buckets_req: Vec<proto::PbLookupReqForBucket> = buckets
             .into_iter()
             .map(
                 |(bucket_id, partition_id, keys)| proto::PbLookupReqForBucket {
                     partition_id,
                     bucket_id,
-                    key: keys.into_iter().map(|b| b.to_vec()).collect(),
+                    key: keys,
                 },
             )
             .collect();
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 10808021d4..d4739dc632 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -41,6 +41,7 @@ mod list_offsets;
 mod list_partition_infos;
 mod list_tables;
 mod lookup;
+mod prefix_lookup;
 mod produce_log;
 mod put_kv;
 mod table_exists;
@@ -68,6 +69,7 @@ pub use list_offsets::*;
 pub use list_partition_infos::*;
 pub use list_tables::*;
 pub use lookup::*;
+pub use prefix_lookup::*;
 pub use produce_log::*;
 pub use put_kv::*;
 pub use table_exists::*;
diff --git a/fluss-rust/crates/fluss/src/rpc/message/prefix_lookup.rs b/fluss-rust/crates/fluss/src/rpc/message/prefix_lookup.rs
new file mode 100644
index 0000000000..5ee44d2519
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/prefix_lookup.rs
@@ -0,0 +1,73 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::PrefixLookupResponse;
+use crate::rpc::frame::ReadError;
+
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::WriteError;
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::{
+    BucketId, PartitionId, TableId, impl_read_version_type, impl_write_version_type, proto,
+};
+use bytes::Bytes;
+use prost::Message;
+
+use bytes::{Buf, BufMut};
+
+/// RPC request wrapper around the protobuf `PrefixLookupRequest` message.
+pub struct PrefixLookupRequest {
+    pub inner_request: proto::PrefixLookupRequest,
+}
+
+impl PrefixLookupRequest {
+    /// Builds one request for `table_id` from `(bucket id, partition id, keys)`
+    /// tuples. Each tuple becomes one per-bucket sub-request, kept in the order
+    /// in which the tuples were supplied.
+    pub fn new_batched(
+        table_id: TableId,
+        buckets: Vec<(BucketId, Option<PartitionId>, Vec<Bytes>)>,
+    ) -> Self {
+        let mut buckets_req = Vec::with_capacity(buckets.len());
+        for (bucket_id, partition_id, keys) in buckets {
+            buckets_req.push(proto::PbPrefixLookupReqForBucket {
+                partition_id,
+                bucket_id,
+                keys,
+            });
+        }
+
+        Self {
+            inner_request: proto::PrefixLookupRequest {
+                table_id,
+                buckets_req,
+            },
+        }
+    }
+}
+
+impl RequestBody for PrefixLookupRequest {
+    type ResponseBody = PrefixLookupResponse;
+    // `ApiKey::PrefixLookup` converts to wire id 1034 (see `rpc/api_key.rs`).
+    const API_KEY: ApiKey = ApiKey::PrefixLookup;
+    // This client sends version 0 of the request.
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(PrefixLookupRequest);
+impl_read_version_type!(PrefixLookupResponse);
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index e2dbf4d172..62e206b6f8 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -1001,6 +1001,279 @@ mod kv_table_test {
             .expect("Failed to drop table");
     }
 
+    // Strings >7 chars for `b` force the encoder's variable-length area,
+    // which is where prefix-key / primary-key byte layouts diverge.
+    #[tokio::test]
+    async fn prefix_lookup() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_prefix_lookup");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("a", DataTypes::int())
+                    .column("b", DataTypes::string())
+                    .column("c", DataTypes::bigint())
+                    .column("d", DataTypes::string())
+                    .primary_key(vec!["a", "b", "c"])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .distributed_by(Some(3), vec!["a".to_string(), "b".to_string()])
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+        let writer = table_upsert
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let test_data: &[(i32, &str, i64, &str)] = &[
+            (1, "aaaaaaaaa", 1, "value1"),
+            (1, "aaaaaaaaa", 2, "value2"),
+            (1, "aaaaaaaaa", 3, "value3"),
+            (2, "aaaaaaaaa", 4, "value4"),
+        ];
+        for (a, b, c, d) in test_data {
+            let mut row = GenericRow::new(4);
+            row.set_field(0, *a);
+            row.set_field(1, *b);
+            row.set_field(2, *c);
+            row.set_field(3, *d);
+            writer.upsert(&row).expect("Failed to upsert");
+        }
+        writer.flush().await.expect("Failed to flush");
+
+        let mut prefix_lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .lookup_by(vec!["a".to_string(), "b".to_string()])
+            .create_lookuper()
+            .expect("Failed to create prefix lookuper");
+
+        let mut prefix = GenericRow::new(2); // prefix (1, "aaaaaaaaa"): the rows with c = 1, 2, 3
+        prefix.set_field(0, 1);
+        prefix.set_field(1, "aaaaaaaaa");
+        let result = prefix_lookuper
+            .lookup(&prefix)
+            .await
+            .expect("Failed to prefix lookup");
+        let rows = result.get_rows().expect("Failed to decode rows");
+        assert_eq!(rows.len(), 3, "Prefix (1, 'aaaaaaaaa') should match 3 rows");
+        for (i, row) in rows.iter().enumerate() {
+            assert_eq!(row.get_int(0).unwrap(), 1);
+            assert_eq!(row.get_string(1).unwrap(), "aaaaaaaaa");
+            assert_eq!(row.get_long(2).unwrap(), (i as i64) + 1); // relies on ascending `c` order
+            assert_eq!(row.get_string(3).unwrap(), format!("value{}", i + 1));
+        }
+
+        let mut prefix = GenericRow::new(2); // prefix (2, "aaaaaaaaa"): the single row with c = 4
+        prefix.set_field(0, 2);
+        prefix.set_field(1, "aaaaaaaaa");
+        let result = prefix_lookuper
+            .lookup(&prefix)
+            .await
+            .expect("Failed to prefix lookup");
+        let rows = result.get_rows().expect("Failed to decode rows");
+        assert_eq!(rows.len(), 1);
+        assert_eq!(rows[0].get_int(0).unwrap(), 2);
+        assert_eq!(rows[0].get_string(1).unwrap(), "aaaaaaaaa");
+        assert_eq!(rows[0].get_long(2).unwrap(), 4);
+        assert_eq!(rows[0].get_string(3).unwrap(), "value4");
+
+        let mut prefix = GenericRow::new(2); // prefix (3, "a") was never written: no rows expected
+        prefix.set_field(0, 3);
+        prefix.set_field(1, "a");
+        let result = prefix_lookuper
+            .lookup(&prefix)
+            .await
+            .expect("Failed to prefix lookup");
+        let rows = result.get_rows().expect("Failed to decode rows");
+        assert_eq!(rows.len(), 0);
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn prefix_lookup_partitioned() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_prefix_lookup_partitioned");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("region", DataTypes::string())
+                    .column("a", DataTypes::int())
+                    .column("b", DataTypes::string())
+                    .column("c", DataTypes::bigint())
+                    .column("d", DataTypes::string())
+                    .primary_key(vec!["region", "a", "b", "c"])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .partitioned_by(vec!["region"])
+            .distributed_by(Some(3), vec!["a".to_string(), "b".to_string()])
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+        create_partitions(&admin, &table_path, "region", &["US", "EU"]).await; // only US and EU
+
+        let connection = cluster.get_fluss_connection().await;
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+        let writer = table_upsert
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let test_data: &[(&str, i32, &str, i64, &str)] = &[
+            ("US", 1, "aaaaaaaaa", 1, "us-1"),
+            ("US", 1, "aaaaaaaaa", 2, "us-2"),
+            ("US", 2, "aaaaaaaaa", 3, "us-3"),
+            ("EU", 1, "aaaaaaaaa", 4, "eu-1"),
+            ("EU", 1, "bbbbbbbbb", 5, "eu-2"),
+        ];
+        for (region, a, b, c, d) in test_data {
+            let mut row = GenericRow::new(5);
+            row.set_field(0, *region);
+            row.set_field(1, *a);
+            row.set_field(2, *b);
+            row.set_field(3, *c);
+            row.set_field(4, *d);
+            writer.upsert(&row).expect("Failed to upsert");
+        }
+        writer.flush().await.expect("Failed to flush");
+
+        let mut prefix_lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .lookup_by(vec!["region".to_string(), "a".to_string(), "b".to_string()])
+            .create_lookuper()
+            .expect("Failed to create prefix lookuper");
+
+        // Prefix (US, 1, "aaaaaaaaa") — 2 rows.
+        let mut prefix = GenericRow::new(3);
+        prefix.set_field(0, "US");
+        prefix.set_field(1, 1);
+        prefix.set_field(2, "aaaaaaaaa");
+        let result = prefix_lookuper
+            .lookup(&prefix)
+            .await
+            .expect("Failed to prefix lookup");
+        let rows = result.get_rows().expect("Failed to decode rows");
+        assert_eq!(rows.len(), 2);
+        for row in &rows {
+            assert_eq!(row.get_string(0).unwrap(), "US");
+            assert_eq!(row.get_int(1).unwrap(), 1);
+            assert_eq!(row.get_string(2).unwrap(), "aaaaaaaaa");
+        }
+
+        // Prefix (EU, 1, "bbbbbbbbb") — 1 row.
+        let mut prefix = GenericRow::new(3);
+        prefix.set_field(0, "EU");
+        prefix.set_field(1, 1);
+        prefix.set_field(2, "bbbbbbbbb");
+        let result = prefix_lookuper
+            .lookup(&prefix)
+            .await
+            .expect("Failed to prefix lookup");
+        let rows = result.get_rows().expect("Failed to decode rows");
+        assert_eq!(rows.len(), 1);
+        assert_eq!(rows[0].get_string(4).unwrap(), "eu-2");
+
+        let mut prefix = GenericRow::new(3); // "APAC" partition was never created: empty result
+        prefix.set_field(0, "APAC");
+        prefix.set_field(1, 1);
+        prefix.set_field(2, "aaaaaaaaa");
+        let result = prefix_lookuper
+            .lookup(&prefix)
+            .await
+            .expect("Failed to prefix lookup");
+        let rows = result.get_rows().expect("Failed to decode rows");
+        assert_eq!(rows.len(), 0);
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn prefix_lookup_validation_errors() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_prefix_lookup_validation");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("a", DataTypes::int())
+                    .column("b", DataTypes::string())
+                    .column("c", DataTypes::bigint())
+                    .primary_key(vec!["a", "b", "c"])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .distributed_by(Some(3), vec!["a".to_string(), "b".to_string()])
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let err = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .lookup_by(vec!["b".to_string(), "a".to_string()]) // bucket keys in the wrong order
+            .create_lookuper()
+            .err()
+            .expect("Expected validation error for wrong order");
+        assert!(err.to_string().contains("must contain all bucket keys"));
+
+        let err = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .lookup_by(vec!["a".to_string(), "b".to_string(), "c".to_string()]) // extra column `c`
+            .create_lookuper()
+            .err()
+            .expect("Expected validation error for extra lookup columns");
+        assert!(err.to_string().contains("must contain all bucket keys"));
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
     /// Integration test for concurrent batched lookups.
     #[tokio::test]
     async fn batched_concurrent_lookups() {
diff --git a/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md b/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
index 38517e165d..e583e06ead 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/partitioned-tables.md
@@ -212,4 +212,8 @@ if let Some(row) = result.get_single_row()? {
 }
 ```
 
+### Prefix Lookup on Partitioned Tables
+
+See [Prefix Lookup — Partitioned Table](./prefix-lookup.md#partitioned-table) for details and example code.
+
 > **Note:** Scanning partitioned primary key tables is not supported. Use lookup operations instead.
diff --git a/fluss-rust/website/docs/user-guide/rust/example/prefix-lookup.md b/fluss-rust/website/docs/user-guide/rust/example/prefix-lookup.md
new file mode 100644
index 0000000000..619ba8341d
--- /dev/null
+++ b/fluss-rust/website/docs/user-guide/rust/example/prefix-lookup.md
@@ -0,0 +1,110 @@
+---
+sidebar_position: 7
+---
+# Prefix Lookup
+
+Prefix lookup returns all rows whose primary key starts with a given prefix. It's enabled by choosing a **bucket key that is a strict prefix of the primary key** — rows sharing the same bucket-key prefix land in the same bucket, so one bucket lookup returns them all.
+
+## Table Requirements
+
+- The table must have a primary key.
+- The bucket key must be a strict prefix of the primary key (on partitioned tables, of the *non-partition* portion of the primary key).
+- The bucket key cannot equal the full primary key — that's a normal primary-key lookup, use [`Lookuper`](./primary-key-tables.md#looking-up-records) instead.
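+- The `lookup_by` columns passed to the client must equal `partition_keys ++ bucket_key` — the partition keys (if the table is partitioned) followed by the bucket key columns, in exactly that order; reordered or extra columns are rejected.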
+
+`create_lookuper()` validates these rules and returns `Err(Error::IllegalArgument { .. })` on mismatch, with a message describing the violation.
+
+## Non-Partitioned Table
+
+Pick a schema where the bucket key is a prefix of the primary key:
+
+```rust
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("user_id", DataTypes::int())
+            .column("session_id", DataTypes::string())
+            .column("event_seq", DataTypes::bigint())
+            .column("event_data", DataTypes::string())
+            .primary_key(vec!["user_id", "session_id", "event_seq"])
+            .build()?,
+    )
+    // Bucket key (user_id, session_id) is a prefix of the primary key.
+    .distributed_by(Some(3), vec!["user_id".to_string(), "session_id".to_string()])
+    .build()?;
+```
+
+Create the lookuper with `lookup_by(columns)` naming the prefix columns, then call `lookup(prefix_row)`:
+
+```rust
+use fluss::row::{GenericRow, InternalRow};
+
+let mut prefix_lookuper = table
+    .new_lookup()?
+    .lookup_by(vec!["user_id".to_string(), "session_id".to_string()])
+    .create_lookuper()?;
+
+let mut prefix = GenericRow::new(2);
+prefix.set_field(0, 1);                // user_id
+prefix.set_field(1, "sess-a");         // session_id
+
+let result = prefix_lookuper.lookup(&prefix).await?;
+for row in result.get_rows()? {
+    println!(
+        "seq={}, data={}",
+        row.get_long(2)?,
+        row.get_string(3)?,
+    );
+}
+```
+
+Unlike primary-key lookup (which uses `get_single_row()`), prefix lookup returns zero or more rows via `get_rows()`.
+
+## Partitioned Table
+
+On a partitioned table, the partition columns are stripped from the primary key before the bucket-prefix rule is evaluated. The lookup key, though, must still carry the partition values so the client can route the request to the right partition — so the `lookup_by` columns are `partition_keys ++ bucket_key`.
+
+```rust
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("region", DataTypes::string())
+            .column("user_id", DataTypes::int())
+            .column("session_id", DataTypes::string())
+            .column("event_seq", DataTypes::bigint())
+            .column("event_data", DataTypes::string())
+            .primary_key(vec!["region", "user_id", "session_id", "event_seq"])
+            .build()?,
+    )
+    .partitioned_by(vec!["region"])
+    // Bucket key (user_id, session_id) is a prefix of the pk minus partition cols.
+    .distributed_by(Some(3), vec!["user_id".to_string(), "session_id".to_string()])
+    .build()?;
+```
+
+```rust
+let mut prefix_lookuper = table
+    .new_lookup()?
+    .lookup_by(vec![
+        "region".to_string(),
+        "user_id".to_string(),
+        "session_id".to_string(),
+    ])
+    .create_lookuper()?;
+
+let mut prefix = GenericRow::new(3);
+prefix.set_field(0, "US");             // region (partition column)
+prefix.set_field(1, 1);                // user_id
+prefix.set_field(2, "sess-a");         // session_id
+
+let result = prefix_lookuper.lookup(&prefix).await?;
+for row in result.get_rows()? {
+    println!(
+        "seq={}, data={}",
+        row.get_long(3)?,
+        row.get_string(4)?,
+    );
+}
+```
diff --git a/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
index 7fe8a553ff..82a07c4cba 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
@@ -120,3 +120,7 @@ let result = lookuper.lookup(&key).await?;
 let batch = result.to_record_batch()?;
 println!("Rows: {}", batch.num_rows());
 ```
+
+## Prefix Lookup
+
+To fetch all rows that share a common primary-key prefix, define the table with a bucket key that is a strict prefix of the primary key; see [Prefix Lookup](./prefix-lookup.md) for details.

From 61db34e665a01fbc4258957c8b93579f76b56706 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 20 Apr 2026 00:40:59 +0100
Subject: [PATCH 241/287] chore: use the same cache in rust integration tests
 (#506)

* [ci] chore: use the same cache in rust integration tests

* further optimizations
---
 .../.github/workflows/build_and_test_rust.yml    | 16 ++++------------
 fluss-rust/Cargo.toml                            |  2 +-
 2 files changed, 5 insertions(+), 13 deletions(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
index ed007f941f..4615575dd7 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -59,10 +59,10 @@ jobs:
         uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
 
       - name: Build
-        run: cargo build --workspace --all-targets --exclude fluss_python --exclude fluss-cpp
+        run: cargo build --workspace --all-targets --exclude fluss_python --exclude fluss-cpp --exclude fluss_nif
 
       - name: Unit Test
-        run: cargo test --all-targets --workspace --exclude fluss_python --exclude fluss-cpp
+        run: cargo test --all-targets --workspace --exclude fluss_python --exclude fluss-cpp --exclude fluss_nif
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
@@ -80,18 +80,10 @@ jobs:
           repo-token: ${{ secrets.GITHUB_TOKEN }}
 
       - name: Rust Cache
-        uses: actions/cache@v4
-        with:
-          path: |
-            ~/.cargo/registry
-            ~/.cargo/git
-            target
-          key: rust-${{ runner.os }}-${{ hashFiles('**/Cargo.lock') }}
-          restore-keys: |
-            rust-${{ runner.os }}-
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
 
       - name: Integration Test
-        run: cargo test --features integration_tests --all-targets --workspace --exclude fluss_python --exclude fluss-cpp
+        run: cargo test --features integration_tests --all-targets --workspace --exclude fluss_python --exclude fluss-cpp --exclude fluss_nif
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index b625ab3485..0aa7e9cfa7 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -34,7 +34,7 @@ members = ["crates/fluss", "crates/fluss-test-cluster", "crates/examples", "bind
 fluss = { package = "fluss-rs", version = "0.2.0", path = "crates/fluss", features = ["storage-all"] }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
-arrow = { version = "57.0.0", features = ["ipc_compression"] }
+arrow = { version = "57.0.0", features = ["ipc_compression", "ffi"] }
 bigdecimal = "0.4"
 serde = { version = "1.0", features = ["derive"] }
 serde_json = "1.0"

From afce91246484b6b4f6c96a02f683e7268954f51c Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Fri, 24 Apr 2026 01:15:46 +0200
Subject: [PATCH 242/287] [c++] Add c++ support for Array data type (#501)

---
 fluss-rust/bindings/cpp/include/fluss.hpp     |  223 +++
 fluss-rust/bindings/cpp/src/admin.cpp         |    7 +-
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |  127 +-
 fluss-rust/bindings/cpp/src/lib.rs            | 1260 +++++++++++++++++
 fluss-rust/bindings/cpp/src/table.cpp         |  388 +++++
 fluss-rust/bindings/cpp/src/types.rs          |  169 ++-
 .../bindings/cpp/test/test_ffi_converter.cpp  |   64 +
 .../bindings/cpp/test/test_kv_table.cpp       |  159 +++
 .../bindings/cpp/test/test_log_table.cpp      |  629 ++++++++
 .../docs/user-guide/cpp/api-reference.md      |   85 +-
 .../website/docs/user-guide/cpp/data-types.md |   57 +
 11 files changed, 3126 insertions(+), 42 deletions(-)
 create mode 100644 fluss-rust/bindings/cpp/test/test_ffi_converter.cpp

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 1937cf276a..f222166d35 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -50,6 +50,8 @@ struct Lookuper;
 struct ScanResultInner;
 struct GenericRowInner;
 struct LookupResultInner;
+struct ArrayWriterInner;
+struct ArrayViewInner;
 }  // namespace ffi
 
 /// Named constants for Fluss API error codes.
@@ -276,6 +278,7 @@ enum class TypeId {
     Decimal = 14,
     Char = 15,
     Binary = 16,
+    Array = 17,
 };
 
 class DataType {
@@ -305,15 +308,29 @@ class DataType {
     }
     static DataType Char(int32_t length) { return DataType(TypeId::Char, length, 0); }
     static DataType Binary(int32_t length) { return DataType(TypeId::Binary, length, 0); }
+    /// Constructs an `ARRAY<element>` type. The element DataType (possibly
+    /// itself an array) is moved into a shared owning handle, so copies of
+    /// the outer DataType share that element instead of duplicating it, and
+    /// the element lives as long as any copy referencing it exists.
+    static DataType Array(DataType element) {
+        DataType dt(TypeId::Array, 0, 0);
+        dt.element_type_ = std::make_shared<DataType>(std::move(element));
+        return dt;
+    }
 
     TypeId id() const { return id_; }
     int32_t precision() const { return precision_; }
     int32_t scale() const { return scale_; }
+    /// Returns the element type of an ARRAY. Returns `nullptr` for non-array
+    /// types. The returned pointer is valid as long as this DataType (or a
+    /// copy holding the same shared element) is alive.
+    const DataType* element_type() const { return element_type_.get(); }
 
    private:
     TypeId id_;
     int32_t precision_{0};
     int32_t scale_{0};
+    std::shared_ptr<DataType> element_type_;
 };
 
 constexpr int64_t EARLIEST_OFFSET = -2;
@@ -493,6 +510,12 @@ inline size_t ResolveColumn(const ColumnMap& map, const std::string& name) {
     return it->second.index;
 }
 
+// Forward declaration so NamedGetters can declare GetArrayView(...) even
+// though the concrete class is defined further down.
+}  // namespace detail
+class ArrayView;
+namespace detail {
+
 /// CRTP mixin that adds name-based getters to any class with index-based getters.
 /// Derived must provide: `size_t Resolve(const std::string&) const`
 /// and all the index-based getters (IsNull(idx), GetBool(idx), etc.).
@@ -518,6 +541,51 @@ struct NamedGetters {
     std::string GetDecimalString(const std::string& n) const {
         return Self().GetDecimalString(Self().Resolve(n));
     }
+    size_t GetArraySize(const std::string& n) const {
+        return Self().GetArraySize(Self().Resolve(n));
+    }
+    TypeId GetArrayElementType(const std::string& n) const {
+        return Self().GetArrayElementType(Self().Resolve(n));
+    }
+    bool IsArrayElementNull(const std::string& n, size_t element) const {
+        return Self().IsArrayElementNull(Self().Resolve(n), element);
+    }
+    bool GetArrayBool(const std::string& n, size_t element) const {
+        return Self().GetArrayBool(Self().Resolve(n), element);
+    }
+    int32_t GetArrayInt32(const std::string& n, size_t element) const {
+        return Self().GetArrayInt32(Self().Resolve(n), element);
+    }
+    int64_t GetArrayInt64(const std::string& n, size_t element) const {
+        return Self().GetArrayInt64(Self().Resolve(n), element);
+    }
+    float GetArrayFloat32(const std::string& n, size_t element) const {
+        return Self().GetArrayFloat32(Self().Resolve(n), element);
+    }
+    double GetArrayFloat64(const std::string& n, size_t element) const {
+        return Self().GetArrayFloat64(Self().Resolve(n), element);
+    }
+    std::string GetArrayString(const std::string& n, size_t element) const {
+        return Self().GetArrayString(Self().Resolve(n), element);
+    }
+    std::vector<uint8_t> GetArrayBytes(const std::string& n, size_t element) const {
+        return Self().GetArrayBytes(Self().Resolve(n), element);
+    }
+    fluss::Date GetArrayDate(const std::string& n, size_t element) const {
+        return Self().GetArrayDate(Self().Resolve(n), element);
+    }
+    fluss::Time GetArrayTime(const std::string& n, size_t element) const {
+        return Self().GetArrayTime(Self().Resolve(n), element);
+    }
+    fluss::Timestamp GetArrayTimestamp(const std::string& n, size_t element) const {
+        return Self().GetArrayTimestamp(Self().Resolve(n), element);
+    }
+    std::string GetArrayDecimalString(const std::string& n, size_t element) const {
+        return Self().GetArrayDecimalString(Self().Resolve(n), element);
+    }
+    // Definition appears below the ArrayView class; return-by-value requires
+    // the complete type so we cannot inline the body here.
+    ArrayView GetArrayView(const std::string& n) const;
 
    private:
     const Derived& Self() const { return static_cast<const Derived&>(*this); }
@@ -535,6 +603,91 @@ struct ScanData {
 };
 }  // namespace detail
 
+/**
+ * @brief Read-only view over a FlussArray column value.
+ *
+ * Obtained from RowView::GetArrayView() / LookupResult::GetArrayView(), and
+ * recursively from ArrayView::GetArray() for nested `ARRAY<ARRAY<...>>`
+ * columns. Owns an opaque Rust handle (FlussArray + element DataType) that
+ * is released on destruction. Move-only.
+ */
+class ArrayView {
+   public:
+    ~ArrayView() noexcept;
+
+    ArrayView(const ArrayView&) = delete;
+    ArrayView& operator=(const ArrayView&) = delete;
+    ArrayView(ArrayView&& other) noexcept;
+    ArrayView& operator=(ArrayView&& other) noexcept;
+
+    size_t Size() const noexcept;
+    TypeId ElementType() const noexcept;
+    bool IsNull(size_t element) const;
+
+    bool GetBool(size_t element) const;
+    int32_t GetInt32(size_t element) const;
+    int64_t GetInt64(size_t element) const;
+    float GetFloat32(size_t element) const;
+    double GetFloat64(size_t element) const;
+    std::string GetString(size_t element) const;
+    std::vector<uint8_t> GetBytes(size_t element) const;
+    fluss::Date GetDate(size_t element) const;
+    fluss::Time GetTime(size_t element) const;
+    fluss::Timestamp GetTimestampNtz(size_t element) const;
+    fluss::Timestamp GetTimestampLtz(size_t element) const;
+    std::string GetDecimalString(size_t element) const;
+    ArrayView GetArray(size_t element) const;
+
+   private:
+    friend class RowView;
+    friend class LookupResult;
+    explicit ArrayView(ffi::ArrayViewInner* inner) : inner_(inner) {}
+    void Destroy() noexcept;
+    ffi::ArrayViewInner* inner_{nullptr};
+};
+
+namespace detail {
+template <typename Derived>
+inline ArrayView NamedGetters<Derived>::GetArrayView(const std::string& n) const {
+    return Self().GetArrayView(Self().Resolve(n));
+}
+}  // namespace detail
+
+class ArrayWriter {
+   public:
+    ArrayWriter(size_t size, DataType element_type);
+    ~ArrayWriter() noexcept;
+
+    ArrayWriter(const ArrayWriter&) = delete;
+    ArrayWriter& operator=(const ArrayWriter&) = delete;
+    ArrayWriter(ArrayWriter&& other) noexcept;
+    ArrayWriter& operator=(ArrayWriter&& other) noexcept;
+
+    bool Available() const;
+    size_t Size() const noexcept;
+
+    void SetNull(size_t idx);
+    void SetBool(size_t idx, bool v);
+    void SetInt32(size_t idx, int32_t v);
+    void SetInt64(size_t idx, int64_t v);
+    void SetFloat32(size_t idx, float v);
+    void SetFloat64(size_t idx, double v);
+    void SetString(size_t idx, const std::string& v);
+    void SetBytes(size_t idx, const std::vector<uint8_t>& v);
+    void SetDate(size_t idx, fluss::Date d);
+    void SetTime(size_t idx, fluss::Time t);
+    void SetTimestampNtz(size_t idx, fluss::Timestamp ts);
+    void SetTimestampLtz(size_t idx, fluss::Timestamp ts);
+    void SetDecimal(size_t idx, const std::string& value);
+    void SetArray(size_t idx, ArrayWriter&& nested);
+
+   private:
+    friend class GenericRow;
+    void Destroy() noexcept;
+    ffi::ArrayWriterInner* inner_{nullptr};
+    DataType element_type_;
+};
+
 class GenericRow {
    public:
     GenericRow();
@@ -563,6 +716,7 @@ class GenericRow {
     void SetTimestampNtz(size_t idx, fluss::Timestamp ts);
     void SetTimestampLtz(size_t idx, fluss::Timestamp ts);
     void SetDecimal(size_t idx, const std::string& value);
+    void SetArray(size_t idx, ArrayWriter&& writer);
 
     // ── Name-based setters (require schema — see Table::NewRow()) ───
     void Set(const std::string& name, std::nullptr_t) { SetNull(Resolve(name)); }
@@ -610,6 +764,7 @@ class GenericRow {
                                      "' is not a timestamp column");
         }
     }
+    void Set(const std::string& name, ArrayWriter&& writer) { SetArray(Resolve(name), std::move(writer)); }
 
    private:
     friend class Table;
@@ -669,6 +824,26 @@ class RowView : public detail::NamedGetters<RowView> {
     bool IsDecimal(size_t idx) const;
     std::string GetDecimalString(size_t idx) const;
 
+    // ── Array getters ────────────────────────────────────────────────
+    size_t GetArraySize(size_t idx) const;
+    TypeId GetArrayElementType(size_t idx) const;
+    bool IsArrayElementNull(size_t idx, size_t element) const;
+    bool GetArrayBool(size_t idx, size_t element) const;
+    int32_t GetArrayInt32(size_t idx, size_t element) const;
+    int64_t GetArrayInt64(size_t idx, size_t element) const;
+    float GetArrayFloat32(size_t idx, size_t element) const;
+    double GetArrayFloat64(size_t idx, size_t element) const;
+    std::string GetArrayString(size_t idx, size_t element) const;
+    std::vector<uint8_t> GetArrayBytes(size_t idx, size_t element) const;
+    fluss::Date GetArrayDate(size_t idx, size_t element) const;
+    fluss::Time GetArrayTime(size_t idx, size_t element) const;
+    fluss::Timestamp GetArrayTimestamp(size_t idx, size_t element) const;
+    std::string GetArrayDecimalString(size_t idx, size_t element) const;
+    /// Returns an owning ArrayView over the array column at `idx`. Nested
+    /// arrays are reached via ArrayView::GetArray(), mirroring the recursive
+    /// list that the Python binding returns from `row.get_array(i)`.
+    ArrayView GetArrayView(size_t idx) const;
+
     // Name-based getters inherited from detail::NamedGetters<RowView>
     using detail::NamedGetters<RowView>::IsNull;
     using detail::NamedGetters<RowView>::GetBool;
@@ -682,6 +857,21 @@ class RowView : public detail::NamedGetters<RowView> {
     using detail::NamedGetters<RowView>::GetTime;
     using detail::NamedGetters<RowView>::GetTimestamp;
     using detail::NamedGetters<RowView>::GetDecimalString;
+    using detail::NamedGetters<RowView>::GetArraySize;
+    using detail::NamedGetters<RowView>::GetArrayElementType;
+    using detail::NamedGetters<RowView>::IsArrayElementNull;
+    using detail::NamedGetters<RowView>::GetArrayBool;
+    using detail::NamedGetters<RowView>::GetArrayInt32;
+    using detail::NamedGetters<RowView>::GetArrayInt64;
+    using detail::NamedGetters<RowView>::GetArrayFloat32;
+    using detail::NamedGetters<RowView>::GetArrayFloat64;
+    using detail::NamedGetters<RowView>::GetArrayString;
+    using detail::NamedGetters<RowView>::GetArrayBytes;
+    using detail::NamedGetters<RowView>::GetArrayDate;
+    using detail::NamedGetters<RowView>::GetArrayTime;
+    using detail::NamedGetters<RowView>::GetArrayTimestamp;
+    using detail::NamedGetters<RowView>::GetArrayDecimalString;
+    using detail::NamedGetters<RowView>::GetArrayView;
 
    private:
     size_t Resolve(const std::string& name) const {
@@ -951,6 +1141,24 @@ class LookupResult : public detail::NamedGetters<LookupResult> {
     bool IsDecimal(size_t idx) const;
     std::string GetDecimalString(size_t idx) const;
 
+    // ── Array getters ────────────────────────────────────────────────
+    size_t GetArraySize(size_t idx) const;
+    TypeId GetArrayElementType(size_t idx) const;
+    bool IsArrayElementNull(size_t idx, size_t element) const;
+    bool GetArrayBool(size_t idx, size_t element) const;
+    int32_t GetArrayInt32(size_t idx, size_t element) const;
+    int64_t GetArrayInt64(size_t idx, size_t element) const;
+    float GetArrayFloat32(size_t idx, size_t element) const;
+    double GetArrayFloat64(size_t idx, size_t element) const;
+    std::string GetArrayString(size_t idx, size_t element) const;
+    std::vector<uint8_t> GetArrayBytes(size_t idx, size_t element) const;
+    fluss::Date GetArrayDate(size_t idx, size_t element) const;
+    fluss::Time GetArrayTime(size_t idx, size_t element) const;
+    fluss::Timestamp GetArrayTimestamp(size_t idx, size_t element) const;
+    std::string GetArrayDecimalString(size_t idx, size_t element) const;
+    /// See RowView::GetArrayView for semantics. Supports nested arrays.
+    ArrayView GetArrayView(size_t idx) const;
+
     // Name-based getters inherited from detail::NamedGetters<LookupResult>
     using detail::NamedGetters<LookupResult>::IsNull;
     using detail::NamedGetters<LookupResult>::GetBool;
@@ -964,6 +1172,21 @@ class LookupResult : public detail::NamedGetters<LookupResult> {
     using detail::NamedGetters<LookupResult>::GetTime;
     using detail::NamedGetters<LookupResult>::GetTimestamp;
     using detail::NamedGetters<LookupResult>::GetDecimalString;
+    using detail::NamedGetters<LookupResult>::GetArraySize;
+    using detail::NamedGetters<LookupResult>::GetArrayElementType;
+    using detail::NamedGetters<LookupResult>::IsArrayElementNull;
+    using detail::NamedGetters<LookupResult>::GetArrayBool;
+    using detail::NamedGetters<LookupResult>::GetArrayInt32;
+    using detail::NamedGetters<LookupResult>::GetArrayInt64;
+    using detail::NamedGetters<LookupResult>::GetArrayFloat32;
+    using detail::NamedGetters<LookupResult>::GetArrayFloat64;
+    using detail::NamedGetters<LookupResult>::GetArrayString;
+    using detail::NamedGetters<LookupResult>::GetArrayBytes;
+    using detail::NamedGetters<LookupResult>::GetArrayDate;
+    using detail::NamedGetters<LookupResult>::GetArrayTime;
+    using detail::NamedGetters<LookupResult>::GetArrayTimestamp;
+    using detail::NamedGetters<LookupResult>::GetArrayDecimalString;
+    using detail::NamedGetters<LookupResult>::GetArrayView;
 
    private:
     friend class Lookuper;
diff --git a/fluss-rust/bindings/cpp/src/admin.cpp b/fluss-rust/bindings/cpp/src/admin.cpp
index 49300c156b..a689c6143a 100644
--- a/fluss-rust/bindings/cpp/src/admin.cpp
+++ b/fluss-rust/bindings/cpp/src/admin.cpp
@@ -21,6 +21,7 @@
 #include "fluss.hpp"
 #include "lib.rs.h"
 #include "rust/cxx.h"
+#include <exception>
 
 namespace fluss {
 
@@ -83,7 +84,11 @@ Result Admin::GetTableInfo(const TablePath& table_path, TableInfo& out) {
 
     auto result = utils::from_ffi_result(ffi_result.result);
     if (result.Ok()) {
-        out = utils::from_ffi_table_info(ffi_result.table_info);
+        try {
+            out = utils::from_ffi_table_info(ffi_result.table_info);
+        } catch (const std::exception& e) {
+            return utils::make_client_error(std::string("Failed to parse table metadata: ") + e.what());
+        }
     }
 
     return result;
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 3fe4532a62..0ef1487a7d 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -20,6 +20,7 @@
 #pragma once
 
 #include <cassert>
+#include <stdexcept>
 
 #include "fluss.hpp"
 #include "lib.rs.h"
@@ -27,6 +28,64 @@
 namespace fluss {
 namespace utils {
 
+/// Compact FFI representation of a (possibly nested) array type.
+///
+/// `nesting` counts the number of ARRAY wrappers stripped to reach the leaf
+/// element type. `leaf_type`/`leaf_precision`/`leaf_scale` describe that leaf
+/// scalar. A non-array input produces a zero-initialised value (nesting == 0).
+///
+/// Using a flat representation — rather than serialising a recursive
+/// `DataType` — keeps the cxx bridge contract small (four `i32`s inside
+/// `FfiColumn`) while preserving full schema fidelity across the FFI boundary
+/// when paired with rebuild_array_type().
+struct FlattenedArrayType {
+    int32_t nesting{0};
+    int32_t leaf_type{0};
+    int32_t leaf_precision{0};
+    int32_t leaf_scale{0};
+};
+
+/// Flattens an `ARRAY<ARRAY<...<leaf>>>` DataType into a FlattenedArrayType.
+///
+/// Contract:
+///   - If `data_type` is not an ARRAY, returns a zero-valued FlattenedArrayType
+///     and callers must use the column's own `id/precision/scale` instead.
+///   - If `data_type` is an ARRAY but has a null element_type() chain (which
+///     should only happen on malformed input), returns a zero-valued result to
+///     signal the caller to reject the schema.
+///   - Otherwise, `nesting >= 1` and leaf_* describe the innermost scalar.
+inline FlattenedArrayType flatten_array_type(const DataType& data_type) {
+    FlattenedArrayType out;
+    if (data_type.id() != TypeId::Array) {
+        return out;
+    }
+
+    const DataType* current = &data_type;
+    while (current && current->id() == TypeId::Array) {
+        out.nesting += 1;
+        current = current->element_type();
+    }
+    if (!current) {
+        return FlattenedArrayType{};
+    }
+
+    out.leaf_type = static_cast<int32_t>(current->id());
+    out.leaf_precision = current->precision();
+    out.leaf_scale = current->scale();
+    return out;
+}
+
+/// Inverse of flatten_array_type: rebuilds an `ARRAY<ARRAY<...<leaf>>>` type
+/// from the compact flat form. Requires `flat.nesting >= 1`; callers handle
+/// the `nesting == 0` case by using a plain scalar DataType directly.
+inline DataType rebuild_array_type(const FlattenedArrayType& flat) {
+    DataType dt(static_cast<TypeId>(flat.leaf_type), flat.leaf_precision, flat.leaf_scale);
+    for (int32_t i = 0; i < flat.nesting; ++i) {
+        dt = DataType::Array(std::move(dt));
+    }
+    return dt;
+}
+
 inline Result make_error(int32_t code, std::string msg) { return Result{code, std::move(msg)}; }
 
 inline Result make_client_error(std::string msg) {
@@ -94,6 +153,17 @@ inline ffi::FfiColumn to_ffi_column(const Column& col) {
     ffi_col.comment = rust::String(col.comment);
     ffi_col.precision = col.data_type.precision();
     ffi_col.scale = col.data_type.scale();
+    auto flat = flatten_array_type(col.data_type);
+    ffi_col.array_nesting = flat.nesting;
+    if (flat.nesting > 0 && flat.leaf_type != 0) {
+        ffi_col.element_data_type = flat.leaf_type;
+        ffi_col.element_precision = flat.leaf_precision;
+        ffi_col.element_scale = flat.leaf_scale;
+    } else {
+        ffi_col.element_data_type = 0;
+        ffi_col.element_precision = 0;
+        ffi_col.element_scale = 0;
+    }
     return ffi_col;
 }
 
@@ -158,10 +228,59 @@ inline ffi::FfiTableDescriptor to_ffi_table_descriptor(const TableDescriptor& de
 }
 
 inline Column from_ffi_column(const ffi::FfiColumn& ffi_col) {
-    return Column{
-        std::string(ffi_col.name),
-        DataType(static_cast<TypeId>(ffi_col.data_type), ffi_col.precision, ffi_col.scale),
-        std::string(ffi_col.comment)};
+    auto type_id = static_cast<TypeId>(ffi_col.data_type);
+    DataType dt(type_id, ffi_col.precision, ffi_col.scale);
+    if (type_id == TypeId::Array) {
+        if (ffi_col.element_data_type == 0) {
+            throw std::runtime_error("Malformed ARRAY column '" + std::string(ffi_col.name) +
+                                     "': missing element_data_type");
+        }
+        if (ffi_col.array_nesting < 0) {
+            throw std::runtime_error("Malformed ARRAY column '" + std::string(ffi_col.name) +
+                                     "': array_nesting must be non-negative");
+        }
+        if (ffi_col.element_data_type == static_cast<int32_t>(TypeId::Array)) {
+            throw std::runtime_error("Malformed ARRAY column '" + std::string(ffi_col.name) +
+                                     "': leaf element_data_type cannot be ARRAY");
+        }
+        auto is_supported_leaf_type = [](int32_t leaf_type) {
+            switch (static_cast<TypeId>(leaf_type)) {
+                case TypeId::Boolean:
+                case TypeId::TinyInt:
+                case TypeId::SmallInt:
+                case TypeId::Int:
+                case TypeId::BigInt:
+                case TypeId::Float:
+                case TypeId::Double:
+                case TypeId::String:
+                case TypeId::Bytes:
+                case TypeId::Date:
+                case TypeId::Time:
+                case TypeId::Timestamp:
+                case TypeId::TimestampLtz:
+                case TypeId::Decimal:
+                case TypeId::Char:
+                case TypeId::Binary:
+                    return true;
+                default:
+                    return false;
+            }
+        };
+        if (!is_supported_leaf_type(ffi_col.element_data_type)) {
+            throw std::runtime_error("Malformed ARRAY column '" + std::string(ffi_col.name) +
+                                     "': unsupported leaf element_data_type " +
+                                     std::to_string(ffi_col.element_data_type));
+        }
+
+        int32_t nesting = ffi_col.array_nesting > 0 ? ffi_col.array_nesting : 1;
+        dt = rebuild_array_type(FlattenedArrayType{
+            nesting,
+            ffi_col.element_data_type,
+            ffi_col.element_precision,
+            ffi_col.element_scale,
+        });
+    }
+    return Column{std::string(ffi_col.name), std::move(dt), std::string(ffi_col.comment)};
 }
 
 inline Schema from_ffi_schema(const ffi::FfiSchema& ffi_schema) {
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 51efb3c157..facb0e3198 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -17,6 +17,7 @@
 
 mod types;
 
+use std::str::FromStr;
 use std::sync::{Arc, LazyLock};
 use std::time::Duration;
 
@@ -85,6 +86,10 @@ mod ffi {
         comment: String,
         precision: i32,
         scale: i32,
+        array_nesting: i32,
+        element_data_type: i32,
+        element_precision: i32,
+        element_scale: i32,
     }
 
     struct FfiSchema {
@@ -279,6 +284,8 @@ mod ffi {
         type ScanResultInner;
         type GenericRowInner;
         type LookupResultInner;
+        type ArrayWriterInner;
+        type ArrayViewInner;
 
         // Connection
         fn new_connection(config: &FfiConfig) -> FfiPtrResult;
@@ -383,6 +390,49 @@ mod ffi {
         fn gr_set_ts_ntz(self: &mut GenericRowInner, idx: usize, millis: i64, nanos: i32);
         fn gr_set_ts_ltz(self: &mut GenericRowInner, idx: usize, millis: i64, nanos: i32);
         fn gr_set_decimal_str(self: &mut GenericRowInner, idx: usize, val: &str);
+        fn gr_set_array(
+            self: &mut GenericRowInner,
+            idx: usize,
+            writer: &mut ArrayWriterInner,
+        ) -> Result<()>;
+
+        // ArrayWriterInner — opaque array builder for writes
+        fn new_array_writer(
+            size: usize,
+            element_leaf_type_id: i32,
+            precision: u32,
+            scale: u32,
+            array_nesting: u32,
+        ) -> Result<Box<ArrayWriterInner>>;
+        fn aw_size(self: &ArrayWriterInner) -> usize;
+        fn aw_set_null(self: &mut ArrayWriterInner, idx: usize) -> Result<()>;
+        fn aw_set_bool(self: &mut ArrayWriterInner, idx: usize, val: bool) -> Result<()>;
+        fn aw_set_i32(self: &mut ArrayWriterInner, idx: usize, val: i32) -> Result<()>;
+        fn aw_set_i64(self: &mut ArrayWriterInner, idx: usize, val: i64) -> Result<()>;
+        fn aw_set_f32(self: &mut ArrayWriterInner, idx: usize, val: f32) -> Result<()>;
+        fn aw_set_f64(self: &mut ArrayWriterInner, idx: usize, val: f64) -> Result<()>;
+        fn aw_set_str(self: &mut ArrayWriterInner, idx: usize, val: &str) -> Result<()>;
+        fn aw_set_bytes(self: &mut ArrayWriterInner, idx: usize, val: &[u8]) -> Result<()>;
+        fn aw_set_date(self: &mut ArrayWriterInner, idx: usize, days: i32) -> Result<()>;
+        fn aw_set_time(self: &mut ArrayWriterInner, idx: usize, millis: i32) -> Result<()>;
+        fn aw_set_ts_ntz(
+            self: &mut ArrayWriterInner,
+            idx: usize,
+            millis: i64,
+            nanos: i32,
+        ) -> Result<()>;
+        fn aw_set_ts_ltz(
+            self: &mut ArrayWriterInner,
+            idx: usize,
+            millis: i64,
+            nanos: i32,
+        ) -> Result<()>;
+        fn aw_set_decimal_str(self: &mut ArrayWriterInner, idx: usize, val: &str) -> Result<()>;
+        fn aw_set_array(
+            self: &mut ArrayWriterInner,
+            idx: usize,
+            nested: &mut ArrayWriterInner,
+        ) -> Result<()>;
 
         // AppendWriter
         unsafe fn delete_append_writer(writer: *mut AppendWriter);
@@ -431,6 +481,78 @@ mod ffi {
         fn lv_is_ts_ltz(self: &LookupResultInner, field: usize) -> Result<bool>;
         fn lv_get_decimal_str(self: &LookupResultInner, field: usize) -> Result<String>;
 
+        fn lv_get_array_size(self: &LookupResultInner, field: usize) -> Result<usize>;
+        fn lv_get_array_is_null(
+            self: &LookupResultInner,
+            field: usize,
+            element: usize,
+        ) -> Result<bool>;
+        fn lv_get_array_bool(
+            self: &LookupResultInner,
+            field: usize,
+            element: usize,
+        ) -> Result<bool>;
+        fn lv_get_array_i32(self: &LookupResultInner, field: usize, element: usize) -> Result<i32>;
+        fn lv_get_array_i64(self: &LookupResultInner, field: usize, element: usize) -> Result<i64>;
+        fn lv_get_array_f32(self: &LookupResultInner, field: usize, element: usize) -> Result<f32>;
+        fn lv_get_array_f64(self: &LookupResultInner, field: usize, element: usize) -> Result<f64>;
+        fn lv_get_array_str(
+            self: &LookupResultInner,
+            field: usize,
+            element: usize,
+        ) -> Result<String>;
+        fn lv_get_array_bytes(
+            self: &LookupResultInner,
+            field: usize,
+            element: usize,
+        ) -> Result<Vec<u8>>;
+        fn lv_get_array_date_days(
+            self: &LookupResultInner,
+            field: usize,
+            element: usize,
+        ) -> Result<i32>;
+        fn lv_get_array_time_millis(
+            self: &LookupResultInner,
+            field: usize,
+            element: usize,
+        ) -> Result<i32>;
+        fn lv_get_array_ts_millis(
+            self: &LookupResultInner,
+            field: usize,
+            element: usize,
+        ) -> Result<i64>;
+        fn lv_get_array_ts_nanos(
+            self: &LookupResultInner,
+            field: usize,
+            element: usize,
+        ) -> Result<i32>;
+        fn lv_get_array_decimal_str(
+            self: &LookupResultInner,
+            field: usize,
+            element: usize,
+        ) -> Result<String>;
+        fn lv_get_array_element_type(self: &LookupResultInner, field: usize) -> Result<i32>;
+        fn lv_get_array_view(self: &LookupResultInner, field: usize)
+        -> Result<Box<ArrayViewInner>>;
+
+        // ArrayViewInner — opaque recursive array reader for C++ bindings
+        fn av_size(self: &ArrayViewInner) -> usize;
+        fn av_element_type_id(self: &ArrayViewInner) -> i32;
+        fn av_is_null(self: &ArrayViewInner, element: usize) -> Result<bool>;
+        fn av_get_bool(self: &ArrayViewInner, element: usize) -> Result<bool>;
+        fn av_get_i32(self: &ArrayViewInner, element: usize) -> Result<i32>;
+        fn av_get_i64(self: &ArrayViewInner, element: usize) -> Result<i64>;
+        fn av_get_f32(self: &ArrayViewInner, element: usize) -> Result<f32>;
+        fn av_get_f64(self: &ArrayViewInner, element: usize) -> Result<f64>;
+        fn av_get_str(self: &ArrayViewInner, element: usize) -> Result<String>;
+        fn av_get_bytes(self: &ArrayViewInner, element: usize) -> Result<Vec<u8>>;
+        fn av_get_date_days(self: &ArrayViewInner, element: usize) -> Result<i32>;
+        fn av_get_time_millis(self: &ArrayViewInner, element: usize) -> Result<i32>;
+        fn av_get_ts_millis(self: &ArrayViewInner, element: usize) -> Result<i64>;
+        fn av_get_ts_nanos(self: &ArrayViewInner, element: usize) -> Result<i32>;
+        fn av_get_decimal_str(self: &ArrayViewInner, element: usize) -> Result<String>;
+        fn av_get_nested(self: &ArrayViewInner, element: usize) -> Result<Box<ArrayViewInner>>;
+
         // LogScanner
         unsafe fn delete_log_scanner(scanner: *mut LogScanner);
         fn subscribe(self: &LogScanner, bucket_id: i32, start_offset: i64) -> FfiResult;
@@ -552,6 +674,111 @@ mod ffi {
             field: usize,
         ) -> Result<String>;
 
+        fn sv_get_array_size(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<usize>;
+        fn sv_get_array_is_null(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<bool>;
+        fn sv_get_array_bool(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<bool>;
+        fn sv_get_array_i32(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<i32>;
+        fn sv_get_array_i64(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<i64>;
+        fn sv_get_array_f32(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<f32>;
+        fn sv_get_array_f64(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<f64>;
+        fn sv_get_array_str(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<String>;
+        fn sv_get_array_bytes(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<Vec<u8>>;
+        fn sv_get_array_date_days(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<i32>;
+        fn sv_get_array_time_millis(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<i32>;
+        fn sv_get_array_ts_millis(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<i64>;
+        fn sv_get_array_ts_nanos(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<i32>;
+        fn sv_get_array_decimal_str(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+            element: usize,
+        ) -> Result<String>;
+        fn sv_get_array_element_type(self: &ScanResultInner, field: usize) -> Result<i32>;
+        fn sv_get_array_view(
+            self: &ScanResultInner,
+            bucket: usize,
+            rec: usize,
+            field: usize,
+        ) -> Result<Box<ArrayViewInner>>;
+
         fn sv_bucket_infos(self: &ScanResultInner) -> &Vec<FfiBucketInfo>;
     }
 }
@@ -1864,6 +2091,16 @@ impl GenericRowInner {
         );
     }
 
+    fn gr_set_array(&mut self, idx: usize, writer: &mut ArrayWriterInner) -> Result<(), String> {
+        writer.complete_if_needed()?; // finalize first: on failure the row stays untouched
+        let arr = writer.completed.take().ok_or_else(|| {
+            "ArrayWriter invariant violation: completed array missing after finalize".to_string()
+        })?; // `take()` moves the finished array out of the writer
+        self.ensure_size(idx); // grow the row only once the array is actually in hand
+        self.row.set_field(idx, fcore::row::Datum::Array(arr));
+        Ok(())
+    }
+
     fn ensure_size(&mut self, idx: usize) {
         if self.row.values.len() <= idx {
             self.row.values.resize(idx + 1, fcore::row::Datum::Null);
@@ -1876,6 +2113,7 @@ impl GenericRowInner {
 // ============================================================================
 
 mod row_reader {
+    use super::array_reader;
     use fcore::row::InternalRow;
     use fluss as fcore;
 
@@ -2144,6 +2382,555 @@ mod row_reader {
             dt => Err(format!("get_decimal_str: unexpected type {dt}")),
         }
     }
+
+    fn get_fluss_array(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<fcore::row::binary_array::FlussArray, String> {
+        validate(row, columns, field, "get_array", |dt| {
+            matches!(dt, fcore::metadata::DataType::Array(_)) // accept ARRAY columns only
+        })?; // `validate` lives outside this hunk (its other checks are not shown here)
+        row.get_array(field).map_err(|e| e.to_string()) // core error -> String
+    }
+
+    pub fn get_array_element_type(
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<&fcore::metadata::DataType, String> {
+        let declared = get_column(columns, field)?.data_type();
+        if let fcore::metadata::DataType::Array(array_ty) = declared {
+            return Ok(array_ty.get_element_type()); // borrowed from the column schema
+        }
+        Err(format!("get_array: column {field} is not Array, got {declared}"))
+    }
+
+    pub fn get_array_size(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<usize, String> {
+        // Element count of the ARRAY stored in `field`; lookup errors pass through.
+        get_fluss_array(row, columns, field).map(|array| array.size())
+    }
+
+    pub fn get_array_and_elem_type<'a>(
+        row: &dyn InternalRow,
+        columns: &'a [fcore::metadata::Column],
+        field: usize,
+    ) -> Result<
+        (
+            fcore::row::binary_array::FlussArray,
+            &'a fcore::metadata::DataType,
+        ),
+        String,
+    > {
+        // The value is fetched first, so its errors surface before element-type errors.
+        let array = get_fluss_array(row, columns, field)?;
+        get_array_element_type(columns, field).map(|elem_ty| (array, elem_ty))
+    }
+
+    pub fn get_array_is_null(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<bool, String> {
+        get_fluss_array(row, columns, field) // the element type is not needed for a null probe
+            .and_then(|array| array_reader::is_null(&array, element))
+    }
+
+    pub fn get_array_bool(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<bool, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_bool(&array, elem_ty, element))
+    }
+
+    pub fn get_array_i32(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<i32, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_i32(&array, elem_ty, element))
+    }
+
+    pub fn get_array_i64(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<i64, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_i64(&array, elem_ty, element))
+    }
+
+    pub fn get_array_f32(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<f32, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_f32(&array, elem_ty, element))
+    }
+
+    pub fn get_array_f64(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<f64, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_f64(&array, elem_ty, element))
+    }
+
+    pub fn get_array_str(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<String, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_str(&array, elem_ty, element))
+    }
+
+    pub fn get_array_bytes(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<Vec<u8>, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_bytes(&array, elem_ty, element))
+    }
+
+    pub fn get_array_date_days(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<i32, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_date_days(&array, elem_ty, element))
+    }
+
+    pub fn get_array_time_millis(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<i32, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_time_millis(&array, elem_ty, element))
+    }
+
+    pub fn get_array_ts_millis(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<i64, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_ts_millis(&array, elem_ty, element))
+    }
+
+    pub fn get_array_ts_nanos(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<i32, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_ts_nanos(&array, elem_ty, element))
+    }
+
+    pub fn get_array_decimal_str(
+        row: &dyn InternalRow,
+        columns: &[fcore::metadata::Column],
+        field: usize,
+        element: usize,
+    ) -> Result<String, String> {
+        get_array_and_elem_type(row, columns, field) // array value + declared element type
+            .and_then(|(array, elem_ty)| array_reader::get_decimal_str(&array, elem_ty, element))
+    }
+
+    pub fn get_array_element_type_id(
+        columns: &[fcore::metadata::Column],
+        field: usize,
+    ) -> Result<i32, String> {
+        // Translate the column's declared element type into its integer FFI id.
+        get_array_element_type(columns, field).map(crate::types::core_data_type_to_ffi)
+    }
+}
+
+// ============================================================================
+// array_reader — low-level accessors over an already-resolved FlussArray
+//
+// Shared by the top-level `row_reader::get_array_*` wrappers and by
+// `ArrayViewInner` (which exposes recursive/nested access to C++). Keeping
+// one implementation here guarantees identical bounds-checking, null
+// validation, type checking, and type dispatch across flat and nested reads.
+// ============================================================================
+
+mod array_reader {
+    use super::fcore;
+
+    fn validate_index(
+        arr: &fcore::row::binary_array::FlussArray,
+        element: usize,
+        op: &str,
+    ) -> Result<(), String> {
+        // Guard clause: any index at or past `arr.size()` is rejected, tagged with `op`.
+        if element >= arr.size() {
+            return Err(format!(
+                "{op}: element index out of bounds: element={element}, size={}",
+                arr.size()
+            ));
+        }
+        Ok(())
+    }
+
+    fn ensure_non_null(
+        arr: &fcore::row::binary_array::FlussArray,
+        element: usize,
+        op: &str,
+    ) -> Result<(), String> {
+        // A null slot is reported as an error; callers are pointed at array_is_null.
+        if !arr.is_null_at(element) {
+            return Ok(());
+        }
+        Err(format!(
+            "{op}: element at index {element} is null; call array_is_null first"
+        ))
+    }
+
+    fn ensure_type(
+        elem_type: &fcore::metadata::DataType,
+        op: &str,
+        expected: &str,
+        allowed: impl FnOnce(&fcore::metadata::DataType) -> bool,
+    ) -> Result<(), String> {
+        // `allowed` is the caller-supplied predicate naming the acceptable element types.
+        if !allowed(elem_type) {
+            return Err(format!(
+                "{op}: element type is {elem_type}, expected {expected}"
+            ));
+        }
+        Ok(())
+    }
+
+    fn ensure_readable(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+        op: &str,
+        expected: &str,
+        allowed: impl FnOnce(&fcore::metadata::DataType) -> bool,
+    ) -> Result<(), String> {
+        validate_index(arr, element, op) // check order: bounds, then type, then nullness
+            .and_then(|()| ensure_type(elem_type, op, expected, allowed))
+            .and_then(|()| ensure_non_null(arr, element, op))
+    }
+
+    pub fn is_null(
+        arr: &fcore::row::binary_array::FlussArray,
+        element: usize,
+    ) -> Result<bool, String> {
+        // Out-of-range indices are errors rather than being reported as null.
+        validate_index(arr, element, "array_is_null").map(|()| arr.is_null_at(element))
+    }
+
+    pub fn get_bool(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<bool, String> {
+        ensure_readable(arr, elem_type, element, "array_bool", "BOOLEAN", |dt| {
+            matches!(dt, fcore::metadata::DataType::Boolean(_)) // BOOLEAN elements only
+        })?; // bounds, type and null checks run before the read
+        arr.get_boolean(element).map_err(|e| e.to_string())
+    }
+
+    pub fn get_i32(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<i32, String> {
+        ensure_readable(
+            arr,
+            elem_type,
+            element,
+            "array_i32",
+            "TINYINT/SMALLINT/INT",
+            |dt| {
+                matches!(
+                    dt,
+                    fcore::metadata::DataType::TinyInt(_)
+                        | fcore::metadata::DataType::SmallInt(_)
+                        | fcore::metadata::DataType::Int(_)
+                )
+            },
+        )?; // bounds, type and null checks run before the read
+        match elem_type { // pick the accessor that matches the declared element width
+            fcore::metadata::DataType::TinyInt(_) => arr
+                .get_byte(element)
+                .map(|v| v as i32) // widen to the single i32 return type
+                .map_err(|e| e.to_string()),
+            fcore::metadata::DataType::SmallInt(_) => arr
+                .get_short(element)
+                .map(|v| v as i32) // widen to the single i32 return type
+                .map_err(|e| e.to_string()),
+            fcore::metadata::DataType::Int(_) => arr.get_int(element).map_err(|e| e.to_string()),
+            _ => unreachable!("type validated by ensure_readable"),
+        }
+    }
+
+    pub fn get_i64(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<i64, String> {
+        ensure_readable(arr, elem_type, element, "array_i64", "BIGINT", |dt| {
+            matches!(dt, fcore::metadata::DataType::BigInt(_)) // BIGINT elements only
+        })?; // bounds, type and null checks run before the read
+        arr.get_long(element).map_err(|e| e.to_string())
+    }
+
+    pub fn get_f32(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<f32, String> {
+        ensure_readable(arr, elem_type, element, "array_f32", "FLOAT", |dt| {
+            matches!(dt, fcore::metadata::DataType::Float(_)) // FLOAT elements only
+        })?; // bounds, type and null checks run before the read
+        arr.get_float(element).map_err(|e| e.to_string())
+    }
+
+    pub fn get_f64(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<f64, String> {
+        ensure_readable(arr, elem_type, element, "array_f64", "DOUBLE", |dt| {
+            matches!(dt, fcore::metadata::DataType::Double(_)) // DOUBLE elements only
+        })?; // bounds, type and null checks run before the read
+        arr.get_double(element).map_err(|e| e.to_string())
+    }
+
+    pub fn get_str(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<String, String> {
+        ensure_readable(arr, elem_type, element, "array_str", "STRING/CHAR", |dt| {
+            matches!(
+                dt, // STRING and CHAR share the same accessor below
+                fcore::metadata::DataType::String(_) | fcore::metadata::DataType::Char(_)
+            )
+        })?; // bounds, type and null checks run before the read
+        arr.get_string(element)
+            .map(|s| s.to_string()) // return an owned String
+            .map_err(|e| e.to_string())
+    }
+
+    pub fn get_bytes(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<Vec<u8>, String> {
+        ensure_readable(
+            arr,
+            elem_type,
+            element,
+            "array_bytes",
+            "BYTES/BINARY",
+            |dt| {
+                matches!(
+                    dt, // BYTES and BINARY share the same accessor below
+                    fcore::metadata::DataType::Bytes(_) | fcore::metadata::DataType::Binary(_)
+                )
+            },
+        )?; // bounds, type and null checks run before the read
+        arr.get_binary(element)
+            .map(|b| b.to_vec()) // return an owned Vec<u8>
+            .map_err(|e| e.to_string())
+    }
+
+    pub fn get_date_days(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<i32, String> {
+        ensure_readable(arr, elem_type, element, "array_date", "DATE", |dt| {
+            matches!(dt, fcore::metadata::DataType::Date(_)) // DATE elements only
+        })?; // bounds, type and null checks run before the read
+        arr.get_date(element)
+            .map(|d| d.get_inner()) // unwrap to the raw i32 held by the date value
+            .map_err(|e| e.to_string())
+    }
+
+    pub fn get_time_millis(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<i32, String> {
+        ensure_readable(arr, elem_type, element, "array_time", "TIME", |dt| {
+            matches!(dt, fcore::metadata::DataType::Time(_)) // TIME elements only
+        })?; // bounds, type and null checks run before the read
+        arr.get_time(element)
+            .map(|t| t.get_inner()) // unwrap to the raw i32 held by the time value
+            .map_err(|e| e.to_string())
+    }
+
+    pub fn get_ts_millis(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<i64, String> {
+        ensure_readable(
+            arr,
+            elem_type,
+            element,
+            "array_ts_millis",
+            "TIMESTAMP/TIMESTAMP_LTZ",
+            |dt| {
+                matches!(
+                    dt,
+                    fcore::metadata::DataType::Timestamp(_)
+                        | fcore::metadata::DataType::TimestampLTz(_)
+                )
+            },
+        )?; // bounds, type and null checks run before the read
+        match elem_type { // the declared precision is passed to the matching accessor
+            fcore::metadata::DataType::TimestampLTz(ts) => arr
+                .get_timestamp_ltz(element, ts.precision())
+                .map(|v| v.get_epoch_millisecond()) // LTZ: millisecond component
+                .map_err(|e| e.to_string()),
+            fcore::metadata::DataType::Timestamp(ts) => arr
+                .get_timestamp_ntz(element, ts.precision())
+                .map(|v| v.get_millisecond()) // NTZ: millisecond component
+                .map_err(|e| e.to_string()),
+            _ => unreachable!("type validated by ensure_readable"),
+        }
+    }
+
+    pub fn get_ts_nanos(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<i32, String> {
+        ensure_readable(
+            arr,
+            elem_type,
+            element,
+            "array_ts_nanos",
+            "TIMESTAMP/TIMESTAMP_LTZ",
+            |dt| {
+                matches!(
+                    dt,
+                    fcore::metadata::DataType::Timestamp(_)
+                        | fcore::metadata::DataType::TimestampLTz(_)
+                )
+            },
+        )?; // bounds, type and null checks run before the read
+        match elem_type { // the declared precision is passed to the matching accessor
+            fcore::metadata::DataType::TimestampLTz(ts) => arr
+                .get_timestamp_ltz(element, ts.precision())
+                .map(|v| v.get_nano_of_millisecond()) // sub-millisecond component
+                .map_err(|e| e.to_string()),
+            fcore::metadata::DataType::Timestamp(ts) => arr
+                .get_timestamp_ntz(element, ts.precision())
+                .map(|v| v.get_nano_of_millisecond()) // sub-millisecond component
+                .map_err(|e| e.to_string()),
+            _ => unreachable!("type validated by ensure_readable"),
+        }
+    }
+
+    pub fn get_decimal_str(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<String, String> {
+        ensure_readable(arr, elem_type, element, "array_decimal", "DECIMAL", |dt| {
+            matches!(dt, fcore::metadata::DataType::Decimal(_)) // DECIMAL elements only
+        })?; // bounds, type and null checks run before the read
+        match elem_type {
+            fcore::metadata::DataType::Decimal(dd) => {
+                let decimal = arr // decoded with the declared precision and scale
+                    .get_decimal(element, dd.precision(), dd.scale())
+                    .map_err(|e| e.to_string())?;
+                Ok(decimal.to_big_decimal().to_string()) // decimals cross the FFI as text
+            }
+            _ => unreachable!("type validated by ensure_readable"),
+        }
+    }
+
+    pub fn get_nested_array(
+        arr: &fcore::row::binary_array::FlussArray,
+        elem_type: &fcore::metadata::DataType,
+        element: usize,
+    ) -> Result<
+        (
+            fcore::row::binary_array::FlussArray,
+            fcore::metadata::DataType,
+        ),
+        String,
+    > {
+        ensure_readable(arr, elem_type, element, "array_nested", "ARRAY", |dt| {
+            matches!(dt, fcore::metadata::DataType::Array(_)) // only ARRAY elements can nest
+        })?; // bounds, type and null checks run before the read
+        match elem_type {
+            fcore::metadata::DataType::Array(at) => {
+                let nested = arr.get_array(element).map_err(|e| e.to_string())?;
+                Ok((nested, at.get_element_type().clone())) // inner element type is cloned
+            }
+            _ => unreachable!("type validated by ensure_readable"),
+        }
+    }
+}
+
+// ============================================================================
+// Macros that generate uniform sv_/lv_ array element getters (thin wrappers
+// that only forward to `row_reader::get_array_*`).
+// ============================================================================
+
+macro_rules! sv_array_element_getters {
+    ($( $method:ident, $reader_fn:ident, $ret:ty; )+) => {
+        $( // one method per `method, reader_fn, return_type;` entry
+            fn $method(
+                &self,
+                bucket: usize,
+                rec: usize,
+                field: usize,
+                element: usize,
+            ) -> Result<$ret, String> {
+                row_reader::$reader_fn( // forwards unchanged; no logic of its own
+                    self.resolve(bucket, rec).row(), // record addressed by (bucket, rec)
+                    &self.columns,
+                    field,
+                    element,
+                )
+            }
+        )+
+    };
+}
+
+macro_rules! lv_array_element_getters {
+    ($( $method:ident, $reader_fn:ident, $ret:ty; )+) => {
+        $( // one method per `method, reader_fn, return_type;` entry
+            fn $method(&self, field: usize, element: usize) -> Result<$ret, String> {
+                let r = self.lv_row()?; // propagate the error when no row can be obtained
+                row_reader::$reader_fn(r, &self.columns, field, element)
+            }
+        )+
+    };
 }
 
 // ============================================================================
@@ -2261,6 +3048,44 @@ impl ScanResultInner {
         row_reader::get_decimal_str(self.resolve(bucket, rec).row(), &self.columns, field)
     }
 
+    fn sv_get_array_size(&self, bucket: usize, rec: usize, field: usize) -> Result<usize, String> {
+        row_reader::get_array_size(self.resolve(bucket, rec).row(), &self.columns, field)
+    }
+    sv_array_element_getters! {
+        sv_get_array_is_null, get_array_is_null, bool;
+        sv_get_array_bool,    get_array_bool,    bool;
+        sv_get_array_i32,     get_array_i32,     i32;
+        sv_get_array_i64,     get_array_i64,     i64;
+        sv_get_array_f32,     get_array_f32,     f32;
+        sv_get_array_f64,     get_array_f64,     f64;
+        sv_get_array_str,     get_array_str,     String;
+        sv_get_array_bytes,   get_array_bytes,   Vec<u8>;
+        sv_get_array_date_days,   get_array_date_days,   i32;
+        sv_get_array_time_millis, get_array_time_millis, i32;
+        sv_get_array_ts_millis,   get_array_ts_millis,   i64;
+        sv_get_array_ts_nanos,    get_array_ts_nanos,    i32;
+        sv_get_array_decimal_str, get_array_decimal_str, String;
+    }
+    fn sv_get_array_element_type(&self, field: usize) -> Result<i32, String> {
+        row_reader::get_array_element_type_id(&self.columns, field) // schema-only; no row read
+    }
+    fn sv_get_array_view(
+        &self,
+        bucket: usize,
+        rec: usize,
+        field: usize,
+    ) -> Result<Box<ArrayViewInner>, String> {
+        let record = self.resolve(bucket, rec);
+        let (array, elem_ty) =
+            row_reader::get_array_and_elem_type(record.row(), &self.columns, field)?;
+        // The element type is cloned out of the schema so the view holds owned data.
+        let view = ArrayViewInner {
+            array,
+            element_type: elem_ty.clone(),
+        };
+        Ok(Box::new(view))
+    }
+
     fn sv_bucket_infos(&self) -> &Vec<ffi::FfiBucketInfo> {
         &self.bucket_infos
     }
@@ -2377,4 +3202,439 @@ impl LookupResultInner {
         let r = self.lv_row()?;
         row_reader::get_decimal_str(r, &self.columns, field)
     }
+    fn lv_get_array_size(&self, field: usize) -> Result<usize, String> {
+        let r = self.lv_row()?;
+        row_reader::get_array_size(r, &self.columns, field)
+    }
+    lv_array_element_getters! {
+        lv_get_array_is_null, get_array_is_null, bool;
+        lv_get_array_bool,    get_array_bool,    bool;
+        lv_get_array_i32,     get_array_i32,     i32;
+        lv_get_array_i64,     get_array_i64,     i64;
+        lv_get_array_f32,     get_array_f32,     f32;
+        lv_get_array_f64,     get_array_f64,     f64;
+        lv_get_array_str,     get_array_str,     String;
+        lv_get_array_bytes,   get_array_bytes,   Vec<u8>;
+        lv_get_array_date_days,   get_array_date_days,   i32;
+        lv_get_array_time_millis, get_array_time_millis, i32;
+        lv_get_array_ts_millis,   get_array_ts_millis,   i64;
+        lv_get_array_ts_nanos,    get_array_ts_nanos,    i32;
+        lv_get_array_decimal_str, get_array_decimal_str, String;
+    }
+    fn lv_get_array_element_type(&self, field: usize) -> Result<i32, String> {
+        row_reader::get_array_element_type_id(&self.columns, field)
+    }
+    fn lv_get_array_view(&self, field: usize) -> Result<Box<ArrayViewInner>, String> {
+        let r = self.lv_row()?;
+        let (arr, elem) = row_reader::get_array_and_elem_type(r, &self.columns, field)?;
+        Ok(Box::new(ArrayViewInner {
+            array: arr,
+            element_type: elem.clone(),
+        }))
+    }
+}
+
+// ============================================================================
+// Opaque types: ArrayViewInner (recursive array reader)
+//
+// Wraps an owned `FlussArray` plus its element `DataType` and exposes the
+// same accessors as `row_reader::get_array_*`, delegating to the shared
+// `array_reader` primitives. Enables C++ bindings to recurse into nested
+// arrays without per-level FFI scaffolding.
+// ============================================================================
+
+pub struct ArrayViewInner {
+    array: fcore::row::binary_array::FlussArray,
+    element_type: fcore::metadata::DataType,
+}
+
+impl ArrayViewInner {
+    fn av_size(&self) -> usize {
+        self.array.size()
+    }
+
+    fn av_element_type_id(&self) -> i32 {
+        crate::types::core_data_type_to_ffi(&self.element_type)
+    }
+
+    fn av_is_null(&self, element: usize) -> Result<bool, String> {
+        array_reader::is_null(&self.array, element)
+    }
+
+    fn av_get_bool(&self, element: usize) -> Result<bool, String> {
+        array_reader::get_bool(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_i32(&self, element: usize) -> Result<i32, String> {
+        array_reader::get_i32(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_i64(&self, element: usize) -> Result<i64, String> {
+        array_reader::get_i64(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_f32(&self, element: usize) -> Result<f32, String> {
+        array_reader::get_f32(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_f64(&self, element: usize) -> Result<f64, String> {
+        array_reader::get_f64(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_str(&self, element: usize) -> Result<String, String> {
+        array_reader::get_str(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_bytes(&self, element: usize) -> Result<Vec<u8>, String> {
+        array_reader::get_bytes(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_date_days(&self, element: usize) -> Result<i32, String> {
+        array_reader::get_date_days(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_time_millis(&self, element: usize) -> Result<i32, String> {
+        array_reader::get_time_millis(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_ts_millis(&self, element: usize) -> Result<i64, String> {
+        array_reader::get_ts_millis(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_ts_nanos(&self, element: usize) -> Result<i32, String> {
+        array_reader::get_ts_nanos(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_decimal_str(&self, element: usize) -> Result<String, String> {
+        array_reader::get_decimal_str(&self.array, &self.element_type, element)
+    }
+
+    fn av_get_nested(&self, element: usize) -> Result<Box<ArrayViewInner>, String> {
+        let (arr, elem) = array_reader::get_nested_array(&self.array, &self.element_type, element)?;
+        Ok(Box::new(ArrayViewInner {
+            array: arr,
+            element_type: elem,
+        }))
+    }
+}
+
+// ============================================================================
+// Opaque types: ArrayWriterInner (array builder for writes)
+// ============================================================================
+
+pub struct ArrayWriterInner {
+    writer: Option<fcore::row::binary_array::FlussArrayWriter>,
+    completed: Option<fcore::row::binary_array::FlussArray>,
+    element_type: fcore::metadata::DataType,
+    num_elements: usize,
+}
+
+fn new_array_writer(
+    size: usize,
+    element_leaf_type_id: i32,
+    precision: u32,
+    scale: u32,
+    array_nesting: u32,
+) -> Result<Box<ArrayWriterInner>, String> {
+    let element_type =
+        types::element_type_from_ffi(element_leaf_type_id, precision, scale, array_nesting)
+            .map_err(|e| e.to_string())?;
+    let writer = fcore::row::binary_array::FlussArrayWriter::new(size, &element_type);
+    Ok(Box::new(ArrayWriterInner {
+        writer: Some(writer),
+        completed: None,
+        element_type,
+        num_elements: size,
+    }))
+}
+
+impl ArrayWriterInner {
+    fn writer_mut(&mut self) -> Result<&mut fcore::row::binary_array::FlussArrayWriter, String> {
+        self.writer
+            .as_mut()
+            .ok_or_else(|| "ArrayWriter is already finalized".to_string())
+    }
+
+    fn validate_index(&self, idx: usize) -> Result<(), String> {
+        // Guard clause: reject any index at or beyond the declared size.
+        if idx >= self.num_elements {
+            return Err(format!(
+                "ArrayWriter index out of bounds: idx={idx}, size={}",
+                self.num_elements
+            ));
+        }
+        Ok(())
+    }
+
+    fn complete_if_needed(&mut self) -> Result<(), String> {
+        // Nothing to do when a completed array is already cached.
+        if self.completed.is_some() {
+            return Ok(());
+        }
+        let pending = self.writer.take();
+        let w = pending.ok_or_else(|| "ArrayWriter has already been finalized".to_string())?;
+        self.completed = Some(w.complete().map_err(|e| e.to_string())?);
+        Ok(())
+    }
+
+    /// Verifies that the writer is still live and that `idx` is in range.
+    /// The liveness check runs first so that a writer misused after
+    /// completion reports "already finalized" instead of an out-of-bounds
+    /// error.
+    fn ensure_writable(&self, idx: usize) -> Result<(), String> {
+        if self.writer.is_none() {
+            return Err("ArrayWriter is already finalized".to_string());
+        }
+        self.validate_index(idx)
+    }
+
+    fn aw_size(&self) -> usize {
+        self.num_elements
+    }
+
+    fn aw_set_null(&mut self, idx: usize) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        self.writer_mut()?.set_null_at(idx);
+        Ok(())
+    }
+
+    fn aw_set_bool(&mut self, idx: usize, val: bool) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        if !matches!(self.element_type, fcore::metadata::DataType::Boolean(_)) {
+            return Err(format!(
+                "ArrayWriter type mismatch: expected BOOLEAN element, got {}",
+                self.element_type
+            ));
+        }
+        self.writer_mut()?.write_boolean(idx, val);
+        Ok(())
+    }
+
+    fn aw_set_i32(&mut self, idx: usize, val: i32) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        match &self.element_type {
+            fcore::metadata::DataType::TinyInt(_) => {
+                let v = i8::try_from(val)
+                    .map_err(|_| format!("Value {val} does not fit TINYINT element"))?;
+                self.writer_mut()?.write_byte(idx, v);
+            }
+            fcore::metadata::DataType::SmallInt(_) => {
+                let v = i16::try_from(val)
+                    .map_err(|_| format!("Value {val} does not fit SMALLINT element"))?;
+                self.writer_mut()?.write_short(idx, v);
+            }
+            fcore::metadata::DataType::Int(_) => {
+                self.writer_mut()?.write_int(idx, val);
+            }
+            _ => {
+                return Err(format!(
+                    "ArrayWriter type mismatch: expected TINYINT/SMALLINT/INT element, got {}",
+                    self.element_type
+                ));
+            }
+        }
+        Ok(())
+    }
+
+    fn aw_set_i64(&mut self, idx: usize, val: i64) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        if !matches!(self.element_type, fcore::metadata::DataType::BigInt(_)) {
+            return Err(format!(
+                "ArrayWriter type mismatch: expected BIGINT element, got {}",
+                self.element_type
+            ));
+        }
+        self.writer_mut()?.write_long(idx, val);
+        Ok(())
+    }
+
+    fn aw_set_f32(&mut self, idx: usize, val: f32) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        if !matches!(self.element_type, fcore::metadata::DataType::Float(_)) {
+            return Err(format!(
+                "ArrayWriter type mismatch: expected FLOAT element, got {}",
+                self.element_type
+            ));
+        }
+        self.writer_mut()?.write_float(idx, val);
+        Ok(())
+    }
+
+    fn aw_set_f64(&mut self, idx: usize, val: f64) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        if !matches!(self.element_type, fcore::metadata::DataType::Double(_)) {
+            return Err(format!(
+                "ArrayWriter type mismatch: expected DOUBLE element, got {}",
+                self.element_type
+            ));
+        }
+        self.writer_mut()?.write_double(idx, val);
+        Ok(())
+    }
+
+    fn aw_set_str(&mut self, idx: usize, val: &str) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        if !matches!(
+            self.element_type,
+            fcore::metadata::DataType::String(_) | fcore::metadata::DataType::Char(_)
+        ) {
+            return Err(format!(
+                "ArrayWriter type mismatch: expected STRING/CHAR element, got {}",
+                self.element_type
+            ));
+        }
+        self.writer_mut()?.write_string(idx, val);
+        Ok(())
+    }
+
+    fn aw_set_bytes(&mut self, idx: usize, val: &[u8]) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        if !matches!(
+            self.element_type,
+            fcore::metadata::DataType::Bytes(_) | fcore::metadata::DataType::Binary(_)
+        ) {
+            return Err(format!(
+                "ArrayWriter type mismatch: expected BYTES/BINARY element, got {}",
+                self.element_type
+            ));
+        }
+        self.writer_mut()?.write_binary_bytes(idx, val);
+        Ok(())
+    }
+
+    fn aw_set_date(&mut self, idx: usize, days: i32) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        if !matches!(self.element_type, fcore::metadata::DataType::Date(_)) {
+            return Err(format!(
+                "ArrayWriter type mismatch: expected DATE element, got {}",
+                self.element_type
+            ));
+        }
+        self.writer_mut()?
+            .write_date(idx, fcore::row::Date::new(days));
+        Ok(())
+    }
+
+    fn aw_set_time(&mut self, idx: usize, millis: i32) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        if !matches!(self.element_type, fcore::metadata::DataType::Time(_)) {
+            return Err(format!(
+                "ArrayWriter type mismatch: expected TIME element, got {}",
+                self.element_type
+            ));
+        }
+        self.writer_mut()?
+            .write_time(idx, fcore::row::Time::new(millis));
+        Ok(())
+    }
+
+    fn aw_set_ts_ntz(&mut self, idx: usize, millis: i64, nanos: i32) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        let precision = match &self.element_type {
+            fcore::metadata::DataType::Timestamp(ts) => ts.precision(),
+            _ => {
+                return Err(format!(
+                    "ArrayWriter type mismatch: expected TIMESTAMP element, got {}",
+                    self.element_type
+                ));
+            }
+        };
+        let ts = fcore::row::TimestampNtz::from_millis_nanos(millis, nanos)
+            .map_err(|e| e.to_string())?;
+        self.writer_mut()?.write_timestamp_ntz(idx, &ts, precision);
+        Ok(())
+    }
+
+    fn aw_set_ts_ltz(&mut self, idx: usize, millis: i64, nanos: i32) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        let precision = match &self.element_type {
+            fcore::metadata::DataType::TimestampLTz(ts) => ts.precision(),
+            _ => {
+                return Err(format!(
+                    "ArrayWriter type mismatch: expected TIMESTAMP_LTZ element, got {}",
+                    self.element_type
+                ));
+            }
+        };
+        let ts = fcore::row::TimestampLtz::from_millis_nanos(millis, nanos)
+            .map_err(|e| e.to_string())?;
+        self.writer_mut()?.write_timestamp_ltz(idx, &ts, precision);
+        Ok(())
+    }
+
+    fn aw_set_decimal_str(&mut self, idx: usize, val: &str) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        let (precision, scale) = match &self.element_type {
+            fcore::metadata::DataType::Decimal(d) => (d.precision(), d.scale()),
+            _ => {
+                return Err(format!(
+                    "ArrayWriter type mismatch: expected DECIMAL element, got {}",
+                    self.element_type
+                ));
+            }
+        };
+        let bd = bigdecimal::BigDecimal::from_str(val).map_err(|e| e.to_string())?;
+        let decimal = fcore::row::Decimal::from_big_decimal(bd, precision, scale)
+            .map_err(|e| e.to_string())?;
+        self.writer_mut()?.write_decimal(idx, &decimal, precision);
+        Ok(())
+    }
+
+    fn aw_set_array(&mut self, idx: usize, nested: &mut ArrayWriterInner) -> Result<(), String> {
+        self.ensure_writable(idx)?;
+        let expected_inner = match &self.element_type {
+            fcore::metadata::DataType::Array(at) => at.get_element_type(),
+            _ => {
+                return Err(format!(
+                    "ArrayWriter type mismatch: expected ARRAY element, got {}",
+                    self.element_type
+                ));
+            }
+        };
+        if !structurally_compatible(expected_inner, &nested.element_type) {
+            return Err(format!(
+                "Nested ArrayWriter type mismatch: expected nested element type {}, got {}",
+                expected_inner, nested.element_type
+            ));
+        }
+        nested.complete_if_needed()?;
+        let arr = nested.completed.as_ref().ok_or_else(|| {
+            "ArrayWriter invariant violation: nested completed array missing after finalize"
+                .to_string()
+        })?;
+        self.writer_mut()?.write_array(idx, arr);
+        Ok(())
+    }
+}
+
+/// Structural type equivalence that ignores nullability flags but preserves
+/// variant, CHAR/BINARY length, and precision/scale semantics, recursing into
+/// ARRAY element types. Used to compare ArrayWriter element types on the
+/// binding boundary, where C++ callers never control nullability explicitly.
+fn structurally_compatible(a: &fcore::metadata::DataType, b: &fcore::metadata::DataType) -> bool {
+    use fcore::metadata::DataType;
+    match (a, b) {
+        (DataType::Boolean(_), DataType::Boolean(_))
+        | (DataType::TinyInt(_), DataType::TinyInt(_))
+        | (DataType::SmallInt(_), DataType::SmallInt(_))
+        | (DataType::Int(_), DataType::Int(_))
+        | (DataType::BigInt(_), DataType::BigInt(_))
+        | (DataType::Float(_), DataType::Float(_))
+        | (DataType::Double(_), DataType::Double(_))
+        | (DataType::String(_), DataType::String(_))
+        | (DataType::Bytes(_), DataType::Bytes(_))
+        | (DataType::Date(_), DataType::Date(_))
+        | (DataType::Time(_), DataType::Time(_)) => true,
+        (DataType::Timestamp(x), DataType::Timestamp(y)) => x.precision() == y.precision(),
+        (DataType::TimestampLTz(x), DataType::TimestampLTz(y)) => x.precision() == y.precision(),
+        (DataType::Char(x), DataType::Char(y)) => x.length() == y.length(),
+        (DataType::Binary(x), DataType::Binary(y)) => x.length() == y.length(),
+        (DataType::Decimal(x), DataType::Decimal(y)) => {
+            x.precision() == y.precision() && x.scale() == y.scale()
+        }
+        (DataType::Array(x), DataType::Array(y)) => {
+            structurally_compatible(x.get_element_type(), y.get_element_type())
+        }
+        _ => false,
+    }
 }
diff --git a/fluss-rust/bindings/cpp/src/table.cpp b/fluss-rust/bindings/cpp/src/table.cpp
index c49a64433b..f389f7ac90 100644
--- a/fluss-rust/bindings/cpp/src/table.cpp
+++ b/fluss-rust/bindings/cpp/src/table.cpp
@@ -19,6 +19,7 @@
 
 #include <arrow/c/bridge.h>
 
+#include <cassert>
 #include <ctime>
 
 #include "ffi_converter.hpp"
@@ -85,6 +86,226 @@ int Date::Day() const {
         if (!inner_) throw std::logic_error(name ": not available (moved-from or null)"); \
     } while (0)
 
+// ============================================================================
+// ArrayWriter — builder for array values backed by Rust ArrayWriterInner
+// ============================================================================
+
+ArrayWriter::ArrayWriter(size_t size, DataType element_type) : element_type_(std::move(element_type)) {
+    auto flat = utils::flatten_array_type(element_type_);
+    int32_t leaf_type_id = flat.nesting > 0 ? flat.leaf_type : static_cast<int32_t>(element_type_.id());
+    uint32_t leaf_precision = static_cast<uint32_t>(flat.nesting > 0 ? flat.leaf_precision
+                                                                      : element_type_.precision());
+    uint32_t leaf_scale = static_cast<uint32_t>(flat.nesting > 0 ? flat.leaf_scale : element_type_.scale());
+    uint32_t array_nesting = static_cast<uint32_t>(flat.nesting);
+
+    auto box = ffi::new_array_writer(size, leaf_type_id, leaf_precision, leaf_scale, array_nesting);
+    inner_ = box.into_raw();
+}
+
+ArrayWriter::~ArrayWriter() noexcept { Destroy(); }
+
+void ArrayWriter::Destroy() noexcept {
+    if (!inner_) return;
+    // Re-box the raw pointer; the discarded temporary Box releases the Rust object.
+    rust::Box<ffi::ArrayWriterInner>::from_raw(inner_);
+    inner_ = nullptr;
+}
+
+ArrayWriter::ArrayWriter(ArrayWriter&& other) noexcept
+    : inner_(other.inner_), element_type_(std::move(other.element_type_)) {
+    other.inner_ = nullptr;
+}
+
+ArrayWriter& ArrayWriter::operator=(ArrayWriter&& other) noexcept {
+    // Self-move is a no-op; otherwise release ours, then take over other's handle.
+    if (this == &other) return *this;
+    Destroy();
+    inner_ = other.inner_;
+    other.inner_ = nullptr;
+    element_type_ = std::move(other.element_type_);
+    return *this;
+}
+
+bool ArrayWriter::Available() const { return inner_ != nullptr; }
+
+size_t ArrayWriter::Size() const noexcept {
+    assert(inner_ && "ArrayWriter::Size called on moved-from instance");
+    return inner_->aw_size();
+}
+
+// NOLINTNEXTLINE(cppcoreguidelines-macro-usage)
+#define CHECK_AW(name)                                                                    \
+    do {                                                                                  \
+        if (!inner_) throw std::logic_error(name ": not available (moved-from or null)"); \
+    } while (0)
+
+void ArrayWriter::SetNull(size_t idx) { CHECK_AW("ArrayWriter"); inner_->aw_set_null(idx); }
+void ArrayWriter::SetBool(size_t idx, bool v) { CHECK_AW("ArrayWriter"); inner_->aw_set_bool(idx, v); }
+void ArrayWriter::SetInt32(size_t idx, int32_t v) { CHECK_AW("ArrayWriter"); inner_->aw_set_i32(idx, v); }
+void ArrayWriter::SetInt64(size_t idx, int64_t v) { CHECK_AW("ArrayWriter"); inner_->aw_set_i64(idx, v); }
+void ArrayWriter::SetFloat32(size_t idx, float v) { CHECK_AW("ArrayWriter"); inner_->aw_set_f32(idx, v); }
+void ArrayWriter::SetFloat64(size_t idx, double v) { CHECK_AW("ArrayWriter"); inner_->aw_set_f64(idx, v); }
+
+void ArrayWriter::SetString(size_t idx, const std::string& v) {
+    CHECK_AW("ArrayWriter");
+    inner_->aw_set_str(idx, v);
+}
+
+void ArrayWriter::SetBytes(size_t idx, const std::vector<uint8_t>& v) {
+    CHECK_AW("ArrayWriter");
+    inner_->aw_set_bytes(idx, rust::Slice<const uint8_t>(v.data(), v.size()));
+}
+
+void ArrayWriter::SetDate(size_t idx, fluss::Date d) {
+    CHECK_AW("ArrayWriter");
+    inner_->aw_set_date(idx, d.days_since_epoch);
+}
+
+void ArrayWriter::SetTime(size_t idx, fluss::Time t) {
+    CHECK_AW("ArrayWriter");
+    inner_->aw_set_time(idx, t.millis_since_midnight);
+}
+
+void ArrayWriter::SetTimestampNtz(size_t idx, fluss::Timestamp ts) {
+    CHECK_AW("ArrayWriter");
+    inner_->aw_set_ts_ntz(idx, ts.epoch_millis, ts.nano_of_millisecond);
+}
+
+void ArrayWriter::SetTimestampLtz(size_t idx, fluss::Timestamp ts) {
+    CHECK_AW("ArrayWriter");
+    inner_->aw_set_ts_ltz(idx, ts.epoch_millis, ts.nano_of_millisecond);
+}
+
+void ArrayWriter::SetDecimal(size_t idx, const std::string& value) {
+    CHECK_AW("ArrayWriter");
+    inner_->aw_set_decimal_str(idx, value);
+}
+
+void ArrayWriter::SetArray(size_t idx, ArrayWriter&& nested) {
+    CHECK_AW("ArrayWriter");
+    if (!nested.inner_) {
+        throw std::logic_error("ArrayWriter::SetArray: nested writer not available");
+    }
+    inner_->aw_set_array(idx, *nested.inner_);
+    nested.Destroy();
+}
+
+// ============================================================================
+// ArrayView — read-only recursive view into an array column value
+// ============================================================================
+
+ArrayView::~ArrayView() noexcept { Destroy(); }
+
+void ArrayView::Destroy() noexcept {
+    if (!inner_) return;
+    // Re-box the raw pointer; the discarded temporary Box releases the Rust object.
+    rust::Box<ffi::ArrayViewInner>::from_raw(inner_);
+    inner_ = nullptr;
+}
+
+ArrayView::ArrayView(ArrayView&& other) noexcept : inner_(other.inner_) { other.inner_ = nullptr; }
+
+ArrayView& ArrayView::operator=(ArrayView&& other) noexcept {
+    // Self-move is a no-op; otherwise release ours, then take over other's handle.
+    if (this == &other) return *this;
+    Destroy();
+    inner_ = other.inner_;
+    other.inner_ = nullptr;
+    return *this;
+}
+
+// NOLINTNEXTLINE(cppcoreguidelines-macro-usage)
+#define CHECK_AV()                                                                      \
+    do {                                                                                \
+        if (!inner_) throw std::logic_error("ArrayView: not available (moved-from)");  \
+    } while (0)
+
+size_t ArrayView::Size() const noexcept {
+    assert(inner_ && "ArrayView::Size called on moved-from instance");
+    return inner_->av_size();
+}
+
+TypeId ArrayView::ElementType() const noexcept {
+    assert(inner_ && "ArrayView::ElementType called on moved-from instance");
+    return static_cast<TypeId>(inner_->av_element_type_id());
+}
+
+bool ArrayView::IsNull(size_t element) const {
+    CHECK_AV();
+    return inner_->av_is_null(element);
+}
+
+bool ArrayView::GetBool(size_t element) const {
+    CHECK_AV();
+    return inner_->av_get_bool(element);
+}
+
+int32_t ArrayView::GetInt32(size_t element) const {
+    CHECK_AV();
+    return inner_->av_get_i32(element);
+}
+
+int64_t ArrayView::GetInt64(size_t element) const {
+    CHECK_AV();
+    return inner_->av_get_i64(element);
+}
+
+float ArrayView::GetFloat32(size_t element) const {
+    CHECK_AV();
+    return inner_->av_get_f32(element);
+}
+
+double ArrayView::GetFloat64(size_t element) const {
+    CHECK_AV();
+    return inner_->av_get_f64(element);
+}
+
+std::string ArrayView::GetString(size_t element) const {
+    CHECK_AV();
+    return std::string(inner_->av_get_str(element));
+}
+
+std::vector<uint8_t> ArrayView::GetBytes(size_t element) const {
+    CHECK_AV();
+    auto rv = inner_->av_get_bytes(element);
+    return {rv.data(), rv.data() + rv.size()};
+}
+
+fluss::Date ArrayView::GetDate(size_t element) const {
+    CHECK_AV();
+    return fluss::Date{inner_->av_get_date_days(element)};
+}
+
+fluss::Time ArrayView::GetTime(size_t element) const {
+    CHECK_AV();
+    return fluss::Time{inner_->av_get_time_millis(element)};
+}
+
+fluss::Timestamp ArrayView::GetTimestampNtz(size_t element) const {
+    CHECK_AV();
+    return fluss::Timestamp{inner_->av_get_ts_millis(element),
+                            inner_->av_get_ts_nanos(element)};
+}
+
+fluss::Timestamp ArrayView::GetTimestampLtz(size_t element) const {
+    CHECK_AV();
+    return fluss::Timestamp{inner_->av_get_ts_millis(element),
+                            inner_->av_get_ts_nanos(element)};
+}
+
+std::string ArrayView::GetDecimalString(size_t element) const {
+    CHECK_AV();
+    return std::string(inner_->av_get_decimal_str(element));
+}
+
+ArrayView ArrayView::GetArray(size_t element) const {
+    CHECK_AV();
+    auto box = inner_->av_get_nested(element);
+    return ArrayView(box.into_raw());
+}
+
+#undef CHECK_AV
+
 // ============================================================================
 // GenericRow — write-only row backed by opaque Rust GenericRowInner
 // ============================================================================
@@ -191,6 +412,15 @@ void GenericRow::SetDecimal(size_t idx, const std::string& value) {
     inner_->gr_set_decimal_str(idx, value);
 }
 
+void GenericRow::SetArray(size_t idx, ArrayWriter&& writer) {
+    CHECK_INNER("GenericRow");
+    if (!writer.inner_) {
+        throw std::logic_error("GenericRow::SetArray: ArrayWriter not available");
+    }
+    inner_->gr_set_array(idx, *writer.inner_);
+    writer.Destroy();
+}
+
 // ============================================================================
 // ScanData — destructor must live in .cpp where rust::Box is visible
 // ============================================================================
@@ -278,6 +508,85 @@ std::string RowView::GetDecimalString(size_t idx) const {
     return std::string(data_->raw->sv_get_decimal_str(bucket_idx_, rec_idx_, idx));
 }
 
+size_t RowView::GetArraySize(size_t idx) const {
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_array_size(bucket_idx_, rec_idx_, idx);
+}
+
+TypeId RowView::GetArrayElementType(size_t idx) const {
+    CHECK_DATA("RowView");
+    return static_cast<TypeId>(data_->raw->sv_get_array_element_type(idx));
+}
+
+bool RowView::IsArrayElementNull(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_array_is_null(bucket_idx_, rec_idx_, idx, element);
+}
+
+bool RowView::GetArrayBool(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_array_bool(bucket_idx_, rec_idx_, idx, element);
+}
+
+int32_t RowView::GetArrayInt32(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_array_i32(bucket_idx_, rec_idx_, idx, element);
+}
+
+int64_t RowView::GetArrayInt64(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_array_i64(bucket_idx_, rec_idx_, idx, element);
+}
+
+float RowView::GetArrayFloat32(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_array_f32(bucket_idx_, rec_idx_, idx, element);
+}
+
+double RowView::GetArrayFloat64(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return data_->raw->sv_get_array_f64(bucket_idx_, rec_idx_, idx, element);
+}
+
+std::string RowView::GetArrayString(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return std::string(data_->raw->sv_get_array_str(bucket_idx_, rec_idx_, idx, element));
+}
+
+std::vector<uint8_t> RowView::GetArrayBytes(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    auto rv = data_->raw->sv_get_array_bytes(bucket_idx_, rec_idx_, idx, element);
+    return {rv.data(), rv.data() + rv.size()};
+}
+
+fluss::Date RowView::GetArrayDate(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return fluss::Date{data_->raw->sv_get_array_date_days(bucket_idx_, rec_idx_, idx, element)};
+}
+
+fluss::Time RowView::GetArrayTime(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return fluss::Time{data_->raw->sv_get_array_time_millis(bucket_idx_, rec_idx_, idx, element)};
+}
+
+fluss::Timestamp RowView::GetArrayTimestamp(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    auto millis = data_->raw->sv_get_array_ts_millis(bucket_idx_, rec_idx_, idx, element);
+    auto nanos = data_->raw->sv_get_array_ts_nanos(bucket_idx_, rec_idx_, idx, element);
+    return fluss::Timestamp{millis, nanos};
+}
+
+std::string RowView::GetArrayDecimalString(size_t idx, size_t element) const {
+    CHECK_DATA("RowView");
+    return std::string(data_->raw->sv_get_array_decimal_str(bucket_idx_, rec_idx_, idx, element));
+}
+
+ArrayView RowView::GetArrayView(size_t idx) const {
+    CHECK_DATA("RowView");
+    auto box = data_->raw->sv_get_array_view(bucket_idx_, rec_idx_, idx);
+    return ArrayView(box.into_raw());
+}
+
 // ============================================================================
 // ScanRecords — backed by opaque Rust ScanResultInner
 // ============================================================================
@@ -484,6 +793,85 @@ std::string LookupResult::GetDecimalString(size_t idx) const {
     return std::string(inner_->lv_get_decimal_str(idx));
 }
 
+size_t LookupResult::GetArraySize(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_array_size(idx);
+}
+
+TypeId LookupResult::GetArrayElementType(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    return static_cast<TypeId>(inner_->lv_get_array_element_type(idx));
+}
+
+bool LookupResult::IsArrayElementNull(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_array_is_null(idx, element);
+}
+
+bool LookupResult::GetArrayBool(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_array_bool(idx, element);
+}
+
+int32_t LookupResult::GetArrayInt32(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_array_i32(idx, element);
+}
+
+int64_t LookupResult::GetArrayInt64(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_array_i64(idx, element);
+}
+
+float LookupResult::GetArrayFloat32(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_array_f32(idx, element);
+}
+
+double LookupResult::GetArrayFloat64(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return inner_->lv_get_array_f64(idx, element);
+}
+
+std::string LookupResult::GetArrayString(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return std::string(inner_->lv_get_array_str(idx, element));
+}
+
+std::vector<uint8_t> LookupResult::GetArrayBytes(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    auto rv = inner_->lv_get_array_bytes(idx, element);
+    return {rv.data(), rv.data() + rv.size()};
+}
+
+fluss::Date LookupResult::GetArrayDate(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return fluss::Date{inner_->lv_get_array_date_days(idx, element)};
+}
+
+fluss::Time LookupResult::GetArrayTime(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return fluss::Time{inner_->lv_get_array_time_millis(idx, element)};
+}
+
+fluss::Timestamp LookupResult::GetArrayTimestamp(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    auto millis = inner_->lv_get_array_ts_millis(idx, element);
+    auto nanos = inner_->lv_get_array_ts_nanos(idx, element);
+    return fluss::Timestamp{millis, nanos};
+}
+
+std::string LookupResult::GetArrayDecimalString(size_t idx, size_t element) const {
+    CHECK_INNER("LookupResult");
+    return std::string(inner_->lv_get_array_decimal_str(idx, element));
+}
+
+ArrayView LookupResult::GetArrayView(size_t idx) const {
+    CHECK_INNER("LookupResult");
+    auto box = inner_->lv_get_array_view(idx);
+    return ArrayView(box.into_raw());
+}
+
 // ============================================================================
 // Table
 // ============================================================================
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index f7aabe9424..c15aadc980 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -39,10 +39,76 @@ pub const DATA_TYPE_TIMESTAMP_LTZ: i32 = 13;
 pub const DATA_TYPE_DECIMAL: i32 = 14;
 pub const DATA_TYPE_CHAR: i32 = 15;
 pub const DATA_TYPE_BINARY: i32 = 16;
+pub const DATA_TYPE_ARRAY: i32 = 17;
+
+fn ffi_column_to_core_data_type(col: &ffi::FfiColumn) -> Result<fcore::metadata::DataType> {
+    ffi_data_type_to_core(
+        col.data_type,
+        col.precision as u32,
+        col.scale as u32,
+        col.element_data_type,
+        col.element_precision as u32,
+        col.element_scale as u32,
+        col.array_nesting.max(0) as u32, // negative nesting is clamped to 0
+    ) // NOTE(review): the other `as u32` casts wrap negative inputs; confirm callers validate
+}
 
-// DATUM_TYPE_* constants removed — no longer needed with opaque types.
+fn type_precision_scale(dt: &fcore::metadata::DataType) -> (i32, i32) {
+    match dt {
+        fcore::metadata::DataType::Decimal(d) => (d.precision() as i32, d.scale() as i32),
+        fcore::metadata::DataType::Timestamp(ts) => (ts.precision() as i32, 0),
+        fcore::metadata::DataType::TimestampLTz(ts) => (ts.precision() as i32, 0),
+        fcore::metadata::DataType::Char(ch) => (ch.length() as i32, 0), // length as precision
+        fcore::metadata::DataType::Binary(bin) => (bin.length() as i32, 0),
+        _ => (0, 0), // all remaining types report (0, 0)
+    }
+}
 
-fn ffi_data_type_to_core(dt: i32, precision: u32, scale: u32) -> Result<fcore::metadata::DataType> {
+fn flatten_array_leaf_type(dt: &fcore::metadata::DataType) -> Result<(i32, i32, i32, i32)> {
+    // Peel ARRAY layers off `dt`, counting them, until a non-array leaf remains.
+    let (mut depth, mut leaf) = (0_i32, dt);
+    while let fcore::metadata::DataType::Array(array_type) = leaf {
+        leaf = array_type.get_element_type();
+        depth += 1;
+    }
+    if depth == 0 {
+        return Err(anyhow!("Expected ARRAY data type, got {dt}"));
+    }
+    let tag = core_data_type_to_ffi(leaf); // 0 means the leaf has no FFI type tag
+    if tag == 0 {
+        return Err(anyhow!(
+            "Unsupported ARRAY leaf type for C++ bindings: {leaf}"
+        ));
+    }
+    let (precision, scale) = type_precision_scale(leaf);
+    Ok((depth, tag, precision, scale))
+}
+
+/// Builds an ARRAY type `nesting` levels deep around the leaf described by the
+/// `leaf_*` arguments; fails when `nesting` is 0 or the leaf cannot be converted.
+fn build_array_type_from_leaf(
+    leaf_dt: i32,
+    leaf_precision: u32,
+    leaf_scale: u32,
+    nesting: u32,
+) -> Result<fcore::metadata::DataType> {
+    if nesting == 0 {
+        return Err(anyhow!("ARRAY nesting must be >= 1"));
+    }
+    let leaf = ffi_data_type_to_core(leaf_dt, leaf_precision, leaf_scale, 0, 0, 0, 0)?;
+    // Each fold step adds one ARRAY layer around the type built so far.
+    Ok((0..nesting).fold(leaf, |inner, _| fcore::metadata::DataTypes::array(inner)))
+}
+
+fn ffi_data_type_to_core(
+    dt: i32,
+    precision: u32,
+    scale: u32,
+    element_dt: i32,
+    element_precision: u32,
+    element_scale: u32,
+    array_nesting: u32,
+) -> Result<fcore::metadata::DataType> {
     match dt {
         DATA_TYPE_BOOLEAN => Ok(fcore::metadata::DataTypes::boolean()),
         DATA_TYPE_TINYINT => Ok(fcore::metadata::DataTypes::tinyint()),
@@ -67,6 +133,31 @@ fn ffi_data_type_to_core(dt: i32, precision: u32, scale: u32) -> Result<fcore::m
         }
         DATA_TYPE_CHAR => Ok(fcore::metadata::DataTypes::char(precision)),
         DATA_TYPE_BINARY => Ok(fcore::metadata::DataTypes::binary(precision as usize)),
+        DATA_TYPE_ARRAY => {
+            if array_nesting > 0 {
+                build_array_type_from_leaf(
+                    element_dt,
+                    element_precision,
+                    element_scale,
+                    array_nesting,
+                )
+            } else {
+                // Backward compatibility for older one-level metadata.
+                if element_dt == 0 {
+                    return Err(anyhow!("ARRAY requires element type metadata"));
+                }
+                let element_type = ffi_data_type_to_core(
+                    element_dt,
+                    element_precision,
+                    element_scale,
+                    0,
+                    0,
+                    0,
+                    0,
+                )?;
+                Ok(fcore::metadata::DataTypes::array(element_type))
+            }
+        }
         _ => Err(anyhow!("Unknown data type: {dt}")),
     }
 }
@@ -89,23 +180,48 @@ pub fn core_data_type_to_ffi(dt: &fcore::metadata::DataType) -> i32 {
         fcore::metadata::DataType::Decimal(_) => DATA_TYPE_DECIMAL,
         fcore::metadata::DataType::Char(_) => DATA_TYPE_CHAR,
         fcore::metadata::DataType::Binary(_) => DATA_TYPE_BINARY,
+        fcore::metadata::DataType::Array(_) => DATA_TYPE_ARRAY,
         _ => 0,
     }
 }
 
+fn core_column_to_ffi(col: &fcore::metadata::Column) -> ffi::FfiColumn {
+    let dt = col.data_type();
+    let (precision, scale) = type_precision_scale(dt);
+    // Array metadata stays all-zero for non-arrays and when flattening reports an error.
+    let array_meta = if matches!(dt, fcore::metadata::DataType::Array(_)) {
+        flatten_array_leaf_type(dt).unwrap_or((0, 0, 0, 0))
+    } else {
+        (0, 0, 0, 0)
+    };
+    let (array_nesting, element_data_type, element_precision, element_scale) = array_meta;
+
+    ffi::FfiColumn {
+        name: col.name().to_string(),
+        data_type: core_data_type_to_ffi(dt),
+        comment: col.comment().unwrap_or("").to_string(),
+        precision,
+        scale,
+        array_nesting,
+        element_data_type,
+        element_precision,
+        element_scale,
+    }
+}
+
 pub fn ffi_descriptor_to_core(
     descriptor: &ffi::FfiTableDescriptor,
 ) -> Result<fcore::metadata::TableDescriptor> {
     let mut schema_builder = fcore::metadata::Schema::builder();
 
     for col in &descriptor.schema.columns {
-        if col.precision < 0 || col.scale < 0 {
+        if col.precision < 0 || col.scale < 0 || col.array_nesting < 0 {
             return Err(anyhow!(
-                "Column '{}': precision and scale must be non-negative",
+                "Column '{}': precision, scale, and array_nesting must be non-negative",
                 col.name
             ));
         }
-        let dt = ffi_data_type_to_core(col.data_type, col.precision as u32, col.scale as u32)?;
+        let dt = ffi_column_to_core_data_type(col)?;
         schema_builder = schema_builder.column(&col.name, dt);
         if !col.comment.is_empty() {
             schema_builder = schema_builder.with_comment(&col.comment);
@@ -153,29 +269,7 @@ pub fn ffi_descriptor_to_core(
 
 pub fn core_table_info_to_ffi(info: &fcore::metadata::TableInfo) -> ffi::FfiTableInfo {
     let schema = info.get_schema();
-    let columns: Vec<ffi::FfiColumn> = schema
-        .columns()
-        .iter()
-        .map(|col| {
-            let (precision, scale) = match col.data_type() {
-                fcore::metadata::DataType::Decimal(dt) => {
-                    (dt.precision() as i32, dt.scale() as i32)
-                }
-                fcore::metadata::DataType::Timestamp(dt) => (dt.precision() as i32, 0),
-                fcore::metadata::DataType::TimestampLTz(dt) => (dt.precision() as i32, 0),
-                fcore::metadata::DataType::Char(dt) => (dt.length() as i32, 0),
-                fcore::metadata::DataType::Binary(dt) => (dt.length() as i32, 0),
-                _ => (0, 0),
-            };
-            ffi::FfiColumn {
-                name: col.name().to_string(),
-                data_type: core_data_type_to_ffi(col.data_type()),
-                comment: col.comment().unwrap_or("").to_string(),
-                precision,
-                scale,
-            }
-        })
-        .collect();
+    let columns: Vec<ffi::FfiColumn> = schema.columns().iter().map(core_column_to_ffi).collect();
 
     let primary_keys: Vec<String> = schema
         .primary_key()
@@ -251,6 +345,21 @@ pub fn empty_table_info() -> ffi::FfiTableInfo {
     }
 }
 
+/// Builds the core `DataType` for an array element described by FFI scalars.
+/// With `array_nesting == 0` the leaf tag is converted directly; otherwise the leaf is
+/// wrapped in `array_nesting` ARRAY levels. Used by ArrayWriterInner construction from C++.
+pub fn element_type_from_ffi(
+    leaf_dt: i32,
+    precision: u32,
+    scale: u32,
+    array_nesting: u32,
+) -> Result<fcore::metadata::DataType> {
+    match array_nesting {
+        0 => ffi_data_type_to_core(leaf_dt, precision, scale, 0, 0, 0, 0),
+        depth => build_array_type_from_leaf(leaf_dt, precision, scale, depth),
+    }
+}
+
 /// Convert FFI database descriptor to core. Returns None if descriptor is effectively empty
 /// (no comment and no properties), so create_database can pass Option::None to core.
 pub fn ffi_database_descriptor_to_core(
@@ -351,8 +460,6 @@ pub fn resolve_row_types(
             Datum::Time(t) => Datum::Time(*t),
             Datum::TimestampNtz(ts) => Datum::TimestampNtz(*ts),
             Datum::TimestampLtz(ts) => Datum::TimestampLtz(*ts),
-            // TODO: C++ bindings need proper CXX wrapper types for FlussArray
-            // before C++ users can construct or inspect array values through FFI.
             Datum::Array(a) => Datum::Array(a.clone()),
         };
         out.set_field(idx, resolved);
@@ -411,8 +518,6 @@ pub fn compacted_row_to_owned(
             fcore::metadata::DataType::Binary(dt) => {
                 Datum::Blob(Cow::Owned(row.get_binary(i, dt.length())?.to_vec()))
             }
-            // TODO: C++ bindings need proper CXX wrapper types for FlussArray
-            // before C++ users can construct or inspect array values through FFI.
             fcore::metadata::DataType::Array(_) => Datum::Array(row.get_array(i)?),
             other => return Err(anyhow!("Unsupported data type for column {i}: {other:?}")),
         };
diff --git a/fluss-rust/bindings/cpp/test/test_ffi_converter.cpp b/fluss-rust/bindings/cpp/test/test_ffi_converter.cpp
new file mode 100644
index 0000000000..4bbe3ebbaf
--- /dev/null
+++ b/fluss-rust/bindings/cpp/test/test_ffi_converter.cpp
@@ -0,0 +1,64 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#include <gtest/gtest.h>
+#include <stdexcept>
+
+#include "ffi_converter.hpp"
+
+namespace {
+
+fluss::ffi::FfiColumn MakeArrayColumn(int32_t nesting, int32_t element_type) {
+    fluss::ffi::FfiColumn col;
+    col.name = rust::String("bad_array");
+    col.data_type = static_cast<int32_t>(fluss::TypeId::Array);  // always an ARRAY column
+    col.comment = rust::String("");
+    col.precision = 0;
+    col.scale = 0;
+    col.array_nesting = nesting;  // the two fields each test varies: nesting and leaf tag
+    col.element_data_type = element_type;
+    col.element_precision = 0;
+    col.element_scale = 0;
+    return col;
+}
+
+}  // namespace
+
+TEST(FfiConverterTest, RejectsArrayWithoutElementType) {
+    auto col = MakeArrayColumn(1, 0);  // nesting 1, element type tag 0
+    EXPECT_THROW((void)fluss::utils::from_ffi_column(col), std::runtime_error);
+}
+
+TEST(FfiConverterTest, RejectsArrayWithArrayLeafType) {
+    auto col = MakeArrayColumn(2, static_cast<int32_t>(fluss::TypeId::Array));  // leaf is ARRAY
+    EXPECT_THROW((void)fluss::utils::from_ffi_column(col), std::runtime_error);
+}
+
+TEST(FfiConverterTest, RejectsArrayWithUnknownLeafType) {
+    auto col = MakeArrayColumn(1, 999);  // 999 is used here as an unrecognised type tag
+    EXPECT_THROW((void)fluss::utils::from_ffi_column(col), std::runtime_error);
+}
+
+TEST(FfiConverterTest, SupportsLegacyOneLevelArrayMetadata) {
+    auto col = MakeArrayColumn(0, static_cast<int32_t>(fluss::TypeId::Int));  // nesting 0
+    auto converted = fluss::utils::from_ffi_column(col);
+    EXPECT_EQ(converted.data_type.id(), fluss::TypeId::Array);  // still decoded as ARRAY<INT>
+    ASSERT_NE(converted.data_type.element_type(), nullptr);
+    EXPECT_EQ(converted.data_type.element_type()->id(), fluss::TypeId::Int);
+}
diff --git a/fluss-rust/bindings/cpp/test/test_kv_table.cpp b/fluss-rust/bindings/cpp/test/test_kv_table.cpp
index 9c4f7a02fb..5cc8f79d23 100644
--- a/fluss-rust/bindings/cpp/test/test_kv_table.cpp
+++ b/fluss-rust/bindings/cpp/test/test_kv_table.cpp
@@ -155,6 +155,165 @@ TEST_F(KvTableTest, UpsertDeleteAndLookup) {
     ASSERT_OK(adm.DropTable(table_path, false));
 }
 
+TEST_F(KvTableTest, LookupWithNestedArrayArrayView) {  // ARRAY<ARRAY<INT>> via lookup
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_lookup_nested_array_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("matrix",
+                                 fluss::DataType::Array(fluss::DataType::Array(fluss::DataType::Int())))
+                      .SetPrimaryKeys({"id"})
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    auto upsert = table.NewUpsert();
+    fluss::UpsertWriter writer;
+    ASSERT_OK(upsert.CreateWriter(writer));
+
+    {
+        auto row = table.NewRow();
+        row.Set("id", 1);
+
+        fluss::ArrayWriter inner1(2, fluss::DataType::Int());  // first inner array: {11, 12}
+        inner1.SetInt32(0, 11);
+        inner1.SetInt32(1, 12);
+
+        fluss::ArrayWriter inner2(2, fluss::DataType::Int());  // second inner array: {21, 22}
+        inner2.SetInt32(0, 21);
+        inner2.SetInt32(1, 22);
+
+        fluss::ArrayWriter outer(2, fluss::DataType::Array(fluss::DataType::Int()));
+        outer.SetArray(0, std::move(inner1));
+        outer.SetArray(1, std::move(inner2));
+        row.Set("matrix", std::move(outer));
+
+        ASSERT_OK(writer.Upsert(row));
+        ASSERT_OK(writer.Flush());
+    }
+
+    fluss::Lookuper lookuper;
+    ASSERT_OK(table.NewLookup().CreateLookuper(lookuper));
+
+    auto key = table.NewRow();
+    key.Set("id", 1);
+
+    fluss::LookupResult result;
+    ASSERT_OK(lookuper.Lookup(key, result));
+    ASSERT_TRUE(result.Found());
+    EXPECT_EQ(result.GetArraySize("matrix"), 2u);
+    EXPECT_EQ(result.GetArrayElementType("matrix"), fluss::TypeId::Array);
+
+    auto outer = result.GetArrayView("matrix");  // view over the outer array
+    ASSERT_EQ(outer.Size(), 2u);
+    EXPECT_EQ(outer.ElementType(), fluss::TypeId::Array);
+
+    auto first = outer.GetArray(0);  // expected to hold {11, 12}
+    ASSERT_EQ(first.Size(), 2u);
+    EXPECT_EQ(first.ElementType(), fluss::TypeId::Int);
+    EXPECT_EQ(first.GetInt32(0), 11);
+    EXPECT_EQ(first.GetInt32(1), 12);
+
+    auto second = outer.GetArray(1);  // expected to hold {21, 22}
+    ASSERT_EQ(second.Size(), 2u);
+    EXPECT_EQ(second.ElementType(), fluss::TypeId::Int);
+    EXPECT_EQ(second.GetInt32(0), 21);
+    EXPECT_EQ(second.GetInt32(1), 22);
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(KvTableTest, LookupArrayValidationErrors) {  // typed array getters throw on misuse
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_lookup_array_validation_errors_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("vals", fluss::DataType::Array(fluss::DataType::Int()))
+                      .SetPrimaryKeys({"id"})
+                      .Build();
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+    auto upsert = table.NewUpsert();
+    fluss::UpsertWriter writer;
+    ASSERT_OK(upsert.CreateWriter(writer));
+
+    auto row = table.NewRow();
+    row.Set("id", 1);
+    fluss::ArrayWriter vals(2, fluss::DataType::Int());
+    vals.SetInt32(0, 99);
+    vals.SetNull(1);  // element 1 is NULL so the null-element getters can be exercised
+    row.Set("vals", std::move(vals));
+    ASSERT_OK(writer.Upsert(row));
+    ASSERT_OK(writer.Flush());
+
+    fluss::Lookuper lookuper;
+    ASSERT_OK(table.NewLookup().CreateLookuper(lookuper));
+
+    auto key = table.NewRow();
+    key.Set("id", 1);
+    fluss::LookupResult result;
+    ASSERT_OK(lookuper.Lookup(key, result));
+    ASSERT_TRUE(result.Found());
+
+    bool wrong_type_threw = false;
+    try {
+        (void)result.GetArrayInt64("vals", 0);  // INT array read through the INT64 getter
+    } catch (const std::exception&) {
+        wrong_type_threw = true;
+    }
+    EXPECT_TRUE(wrong_type_threw);
+
+    bool null_typed_getter_threw = false;
+    try {
+        (void)result.GetArrayInt32("vals", 1);  // matching getter, but element 1 is NULL
+    } catch (const std::exception&) {
+        null_typed_getter_threw = true;
+    }
+    EXPECT_TRUE(null_typed_getter_threw);
+
+    auto view = result.GetArrayView("vals");  // repeat both checks through ArrayView
+    EXPECT_EQ(view.Size(), 2u);
+    EXPECT_TRUE(view.IsNull(1));
+
+    bool view_wrong_type_threw = false;
+    try {
+        (void)view.GetInt64(0);
+    } catch (const std::exception&) {
+        view_wrong_type_threw = true;
+    }
+    EXPECT_TRUE(view_wrong_type_threw);
+
+    bool view_null_typed_getter_threw = false;
+    try {
+        (void)view.GetInt32(1);
+    } catch (const std::exception&) {
+        view_null_typed_getter_threw = true;
+    }
+    EXPECT_TRUE(view_null_typed_getter_threw);
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
 TEST_F(KvTableTest, CompositePrimaryKeys) {
     auto& adm = admin();
     auto& conn = connection();
diff --git a/fluss-rust/bindings/cpp/test/test_log_table.cpp b/fluss-rust/bindings/cpp/test/test_log_table.cpp
index 7d316faf34..f36c870766 100644
--- a/fluss-rust/bindings/cpp/test/test_log_table.cpp
+++ b/fluss-rust/bindings/cpp/test/test_log_table.cpp
@@ -22,6 +22,8 @@
 
 #include <algorithm>
 #include <chrono>
+#include <cmath>
+#include <limits>
 #include <thread>
 #include <tuple>
 
@@ -829,3 +831,630 @@ TEST_F(LogTableTest, PartitionedTableAppendScan) {
 
     ASSERT_OK(adm.DropTable(table_path, false));
 }
+
+// ============================================================================
+// Array data type tests
+// ============================================================================
+
+TEST_F(LogTableTest, AppendAndScanWithArray) {  // ARRAY<STRING> / ARRAY<INT> round trip
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_append_scan_with_array_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("tags", fluss::DataType::Array(fluss::DataType::String()))
+                      .AddColumn("scores", fluss::DataType::Array(fluss::DataType::Int()))
+                      .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetBucketCount(1)
+                                .SetBucketKeys({"id"})
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    auto info = table.GetTableInfo();  // check the array element types in the table info
+    ASSERT_GE(info.schema.columns.size(), 3u);
+    const auto& tags_type = info.schema.columns[1].data_type;
+    ASSERT_EQ(tags_type.id(), fluss::TypeId::Array);
+    ASSERT_NE(tags_type.element_type(), nullptr);
+    ASSERT_EQ(tags_type.element_type()->id(), fluss::TypeId::String);
+    const auto& scores_type = info.schema.columns[2].data_type;
+    ASSERT_EQ(scores_type.id(), fluss::TypeId::Array);
+    ASSERT_NE(scores_type.element_type(), nullptr);
+    ASSERT_EQ(scores_type.element_type()->id(), fluss::TypeId::Int);
+
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table.NewAppend().CreateWriter(append_writer));
+
+    {
+        auto row = table.NewRow();
+        row.Set("id", 1);
+
+        fluss::ArrayWriter tags(2, fluss::DataType::String());
+        tags.SetString(0, "hello");
+        tags.SetString(1, "world");
+        row.SetArray(1, std::move(tags));
+
+        fluss::ArrayWriter scores(3, fluss::DataType::Int());
+        scores.SetInt32(0, 10);
+        scores.SetInt32(1, 20);
+        scores.SetInt32(2, 30);
+        row.SetArray(2, std::move(scores));
+
+        ASSERT_OK(append_writer.Append(row));
+    }
+    {
+        auto row = table.NewRow();
+        row.Set("id", 2);
+
+        fluss::ArrayWriter tags(1, fluss::DataType::String());
+        tags.SetNull(0);  // one-element array whose only element is NULL
+        row.SetArray(1, std::move(tags));
+
+        fluss::ArrayWriter scores(0, fluss::DataType::Int());  // zero-length array
+        row.SetArray(2, std::move(scores));
+
+        ASSERT_OK(append_writer.Append(row));
+    }
+
+    ASSERT_OK(append_writer.Flush());
+
+    auto scan = table.NewScan();
+    fluss::LogScanner scanner;
+    ASSERT_OK(scan.CreateLogScanner(scanner));
+    ASSERT_OK(scanner.Subscribe(0, 0));
+
+    struct Record {
+        int32_t id;
+        size_t tag_count;
+        std::vector<std::string> tags;
+        size_t score_count;
+        std::vector<int32_t> scores;
+    };
+
+    std::vector<Record> collected;
+    auto extract = [](const fluss::ScanRecord& scan_rec) {
+        const auto& rv = scan_rec.row;
+        Record rec;
+        rec.id = rv.GetInt32(0);
+
+        rec.tag_count = rv.GetArraySize(1);
+        for (size_t i = 0; i < rec.tag_count; ++i) {
+            if (rv.IsArrayElementNull(1, i)) {
+                rec.tags.push_back("<null>");  // placeholder so NULLs can be asserted on
+            } else {
+                rec.tags.push_back(rv.GetArrayString(1, i));
+            }
+        }
+
+        rec.score_count = rv.GetArraySize(2);
+        for (size_t i = 0; i < rec.score_count; ++i) {
+            rec.scores.push_back(rv.GetArrayInt32(2, i));
+        }
+
+        return rec;
+    };
+
+    fluss_test::PollRecords(scanner, 2, extract, collected);
+
+    ASSERT_EQ(collected.size(), 2u);
+
+    std::sort(collected.begin(), collected.end(),
+              [](const Record& a, const Record& b) { return a.id < b.id; });
+
+    EXPECT_EQ(collected[0].id, 1);
+    ASSERT_EQ(collected[0].tag_count, 2u);
+    EXPECT_EQ(collected[0].tags[0], "hello");
+    EXPECT_EQ(collected[0].tags[1], "world");
+    ASSERT_EQ(collected[0].score_count, 3u);
+    EXPECT_EQ(collected[0].scores[0], 10);
+    EXPECT_EQ(collected[0].scores[1], 20);
+    EXPECT_EQ(collected[0].scores[2], 30);
+
+    EXPECT_EQ(collected[1].id, 2);
+    ASSERT_EQ(collected[1].tag_count, 1u);
+    EXPECT_EQ(collected[1].tags[0], "<null>");
+    ASSERT_EQ(collected[1].score_count, 0u);
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, AppendAndScanWithNestedArray) {  // ARRAY<ARRAY<INT>> append + scan
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_append_scan_nested_array_cpp");
+
+    auto schema =
+        fluss::Schema::NewBuilder()
+            .AddColumn("id", fluss::DataType::Int())
+            .AddColumn("matrix",
+                        fluss::DataType::Array(fluss::DataType::Array(fluss::DataType::Int())))
+            .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetBucketCount(1)
+                                .SetBucketKeys({"id"})
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table.NewAppend().CreateWriter(append_writer));
+
+    {
+        auto row = table.NewRow();
+        row.Set("id", 1);
+
+        fluss::ArrayWriter inner1(2, fluss::DataType::Int());  // first inner array: {1, 2}
+        inner1.SetInt32(0, 1);
+        inner1.SetInt32(1, 2);
+
+        fluss::ArrayWriter inner2(2, fluss::DataType::Int());  // second inner array: {3, 4}
+        inner2.SetInt32(0, 3);
+        inner2.SetInt32(1, 4);
+
+        fluss::ArrayWriter outer(2, fluss::DataType::Array(fluss::DataType::Int()));
+        outer.SetArray(0, std::move(inner1));
+        outer.SetArray(1, std::move(inner2));
+
+        row.SetArray(1, std::move(outer));
+        ASSERT_OK(append_writer.Append(row));
+    }
+
+    ASSERT_OK(append_writer.Flush());
+
+    auto scan = table.NewScan();
+    fluss::LogScanner scanner;
+    ASSERT_OK(scan.CreateLogScanner(scanner));
+    ASSERT_OK(scanner.Subscribe(0, 0));
+
+    struct Record {
+        int32_t id;
+        size_t outer_count;
+        fluss::TypeId element_type;
+        std::vector<std::vector<int32_t>> values;
+    };
+
+    std::vector<Record> collected;
+    auto extract = [](const fluss::ScanRecord& scan_rec) {
+        const auto& rv = scan_rec.row;
+        Record rec;
+        rec.id = rv.GetInt32(0);
+        rec.outer_count = rv.GetArraySize(1);
+        rec.element_type = rv.GetArrayElementType(1);
+        auto outer = rv.GetArrayView(1);  // copy both levels out into plain vectors
+        rec.values.reserve(outer.Size());
+        for (size_t i = 0; i < outer.Size(); ++i) {
+            auto inner = outer.GetArray(i);
+            std::vector<int32_t> row;
+            row.reserve(inner.Size());
+            for (size_t j = 0; j < inner.Size(); ++j) {
+                row.push_back(inner.GetInt32(j));
+            }
+            rec.values.push_back(std::move(row));
+        }
+        return rec;
+    };
+
+    fluss_test::PollRecords(scanner, 1, extract, collected);
+    ASSERT_EQ(collected.size(), 1u);
+    EXPECT_EQ(collected[0].id, 1);
+    EXPECT_EQ(collected[0].outer_count, 2u);
+    EXPECT_EQ(collected[0].element_type, fluss::TypeId::Array);
+    ASSERT_EQ(collected[0].values.size(), 2u);
+    EXPECT_EQ(collected[0].values[0], (std::vector<int32_t>{1, 2}));
+    EXPECT_EQ(collected[0].values[1], (std::vector<int32_t>{3, 4}));
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, AppendAndScanWithArrayRichTypes) {  // bytes/date/time/ts/decimal arrays
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_append_scan_array_rich_types_cpp");
+
+    auto schema =
+        fluss::Schema::NewBuilder()
+            .AddColumn("id", fluss::DataType::Int())
+            .AddColumn("arr_bytes", fluss::DataType::Array(fluss::DataType::Bytes()))
+            .AddColumn("arr_date", fluss::DataType::Array(fluss::DataType::Date()))
+            .AddColumn("arr_time", fluss::DataType::Array(fluss::DataType::Time()))
+            .AddColumn("arr_ts", fluss::DataType::Array(fluss::DataType::Timestamp(6)))
+            .AddColumn("arr_decimal", fluss::DataType::Array(fluss::DataType::Decimal(10, 2)))
+            .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetBucketCount(1)
+                                .SetBucketKeys({"id"})
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table.NewAppend().CreateWriter(append_writer));
+
+    {
+        auto row = table.NewRow();
+        row.Set("id", 1);
+
+        fluss::ArrayWriter arr_bytes(2, fluss::DataType::Bytes());
+        arr_bytes.SetBytes(0, std::vector<uint8_t>{0x10, 0x20, 0x30});
+        arr_bytes.SetNull(1);
+        row.SetArray(1, std::move(arr_bytes));
+
+        fluss::ArrayWriter arr_date(2, fluss::DataType::Date());
+        auto d0 = fluss::Date::FromDays(20000);
+        arr_date.SetDate(0, d0);
+        arr_date.SetNull(1);
+        row.SetArray(2, std::move(arr_date));
+
+        fluss::ArrayWriter arr_time(1, fluss::DataType::Time());
+        auto t0 = fluss::Time::FromMillis(3600000);
+        arr_time.SetTime(0, t0);
+        row.SetArray(3, std::move(arr_time));
+
+        fluss::ArrayWriter arr_ts(1, fluss::DataType::Timestamp(6));
+        auto ts0 = fluss::Timestamp::FromMillisNanos(1769163227123, 456000);
+        arr_ts.SetTimestampNtz(0, ts0);
+        row.SetArray(4, std::move(arr_ts));
+
+        fluss::ArrayWriter arr_decimal(2, fluss::DataType::Decimal(10, 2));
+        arr_decimal.SetDecimal(0, "123.45");
+        arr_decimal.SetNull(1);
+        row.SetArray(5, std::move(arr_decimal));
+
+        ASSERT_OK(append_writer.Append(row));
+    }
+
+    ASSERT_OK(append_writer.Flush());
+
+    auto scan = table.NewScan();
+    fluss::LogScanner scanner;
+    ASSERT_OK(scan.CreateLogScanner(scanner));
+    ASSERT_OK(scanner.Subscribe(0, 0));
+
+    fluss::ScanRecords records;
+    ASSERT_OK(scanner.Poll(10000, records));  // NOTE(review): one poll, no retry; confirm OK
+    ASSERT_EQ(records.Count(), 1u);
+
+    auto it = records.begin();
+    ASSERT_TRUE(it != records.end());
+    auto rec = *it;
+    const auto& rv = rec.row;
+
+    EXPECT_EQ(rv.GetArraySize(1), 2u);
+    auto bytes0 = rv.GetArrayBytes(1, 0);
+    ASSERT_EQ(bytes0.size(), 3u);
+    EXPECT_EQ(bytes0[0], 0x10);
+    EXPECT_EQ(bytes0[1], 0x20);
+    EXPECT_EQ(bytes0[2], 0x30);
+    EXPECT_TRUE(rv.IsArrayElementNull(1, 1));
+
+    EXPECT_EQ(rv.GetArraySize(2), 2u);
+    EXPECT_EQ(rv.GetArrayDate(2, 0).days_since_epoch, fluss::Date::FromDays(20000).days_since_epoch);
+    EXPECT_TRUE(rv.IsArrayElementNull(2, 1));
+
+    EXPECT_EQ(rv.GetArraySize(3), 1u);
+    EXPECT_EQ(rv.GetArrayTime(3, 0).millis_since_midnight, fluss::Time::FromMillis(3600000).millis_since_midnight);
+
+    EXPECT_EQ(rv.GetArraySize(4), 1u);
+    auto ts = rv.GetArrayTimestamp(4, 0);  // both timestamp components must survive
+    EXPECT_EQ(ts.epoch_millis, 1769163227123);
+    EXPECT_EQ(ts.nano_of_millisecond, 456000);
+
+    EXPECT_EQ(rv.GetArraySize(5), 2u);
+    EXPECT_EQ(rv.GetArrayDecimalString(5, 0), "123.45");
+    EXPECT_TRUE(rv.IsArrayElementNull(5, 1));
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, ArrayApiValidationErrors) {  // misuse of array setters/getters throws
+    // Type mismatch setter should fail through FFI Result propagation.
+    {
+        fluss::ArrayWriter bool_array(1, fluss::DataType::Boolean());
+        bool threw = false;
+        try {
+            bool_array.SetInt32(0, 42);  // INT setter on a BOOLEAN array
+        } catch (const std::exception&) {
+            threw = true;
+        }
+        EXPECT_TRUE(threw);
+    }
+
+    auto& adm = admin();
+    auto& conn = connection();
+    fluss::TablePath table_path("fluss", "test_array_api_validation_errors_cpp");
+
+    auto schema = fluss::Schema::NewBuilder()
+                      .AddColumn("id", fluss::DataType::Int())
+                      .AddColumn("vals", fluss::DataType::Array(fluss::DataType::Int()))
+                      .Build();
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetBucketCount(1)
+                                .SetBucketKeys({"id"})
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table.NewAppend().CreateWriter(append_writer));
+    auto row = table.NewRow();
+    row.Set("id", 1);
+    fluss::ArrayWriter vals(2, fluss::DataType::Int());
+    vals.SetInt32(0, 7);
+    vals.SetNull(1);  // element 1 is NULL so the null-element getters can be exercised
+    row.SetArray(1, std::move(vals));
+    ASSERT_OK(append_writer.Append(row));
+    ASSERT_OK(append_writer.Flush());
+
+    auto scan = table.NewScan();
+    fluss::LogScanner scanner;
+    ASSERT_OK(scan.CreateLogScanner(scanner));
+    ASSERT_OK(scanner.Subscribe(0, 0));
+    fluss::ScanRecords records;
+    ASSERT_OK(scanner.Poll(10000, records));  // NOTE(review): one poll, no retry; confirm OK
+    ASSERT_EQ(records.Count(), 1u);
+    auto it = records.begin();
+    ASSERT_TRUE(it != records.end());
+    auto rec = *it;
+
+    bool oob_threw = false;
+    try {
+        (void)rec.row.GetArrayInt32(1, 5);  // index 5 in a two-element array
+    } catch (const std::exception&) {
+        oob_threw = true;
+    }
+    EXPECT_TRUE(oob_threw);
+
+    bool wrong_type_threw = false;
+    try {
+        (void)rec.row.GetArrayInt64(1, 0);  // INT array read through the INT64 getter
+    } catch (const std::exception&) {
+        wrong_type_threw = true;
+    }
+    EXPECT_TRUE(wrong_type_threw);
+
+    bool null_typed_getter_threw = false;
+    try {
+        (void)rec.row.GetArrayInt32(1, 1);  // matching getter, but element 1 is NULL
+    } catch (const std::exception&) {
+        null_typed_getter_threw = true;
+    }
+    EXPECT_TRUE(null_typed_getter_threw);
+
+    auto view = rec.row.GetArrayView(1);  // repeat the checks through ArrayView
+    EXPECT_EQ(view.Size(), 2u);
+    EXPECT_TRUE(view.IsNull(1));
+
+    bool view_wrong_type_threw = false;
+    try {
+        (void)view.GetInt64(0);
+    } catch (const std::exception&) {
+        view_wrong_type_threw = true;
+    }
+    EXPECT_TRUE(view_wrong_type_threw);
+
+    bool view_null_typed_getter_threw = false;
+    try {
+        (void)view.GetInt32(1);
+    } catch (const std::exception&) {
+        view_null_typed_getter_threw = true;
+    }
+    EXPECT_TRUE(view_null_typed_getter_threw);
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, AppendAndScanWithArrayEncodingEdgeCases) {
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_array_encoding_edge_cases_cpp");
+
+    auto schema =
+        fluss::Schema::NewBuilder()
+            .AddColumn("id", fluss::DataType::Int())
+            .AddColumn("arr_long_str", fluss::DataType::Array(fluss::DataType::String()))
+            .AddColumn("arr_big_decimal", fluss::DataType::Array(fluss::DataType::Decimal(22, 5)))
+            .AddColumn("arr_ts_nano", fluss::DataType::Array(fluss::DataType::Timestamp(9)))
+            .AddColumn("arr_float", fluss::DataType::Array(fluss::DataType::Float()))
+            .AddColumn("arr_double", fluss::DataType::Array(fluss::DataType::Double()))
+            .AddColumn("arr_binary", fluss::DataType::Array(fluss::DataType::Binary(4)))
+            .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetBucketCount(1)
+                                .SetBucketKeys({"id"})
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+    fluss::AppendWriter append_writer;
+    ASSERT_OK(table.NewAppend().CreateWriter(append_writer));
+
+    {
+        auto row = table.NewRow();
+        row.Set("id", 1);
+
+        // >= 8 bytes forces the heap-pointer variable-length path (threshold: 7)
+        fluss::ArrayWriter arr_long_str(2, fluss::DataType::String());
+        arr_long_str.SetString(0, "abcdefgh");  // exactly 8 bytes
+        arr_long_str.SetString(1, "this is a much longer string that definitely exceeds inline");
+        row.SetArray(1, std::move(arr_long_str));
+
+        // precision > 18 forces non-compact decimal encoding
+        fluss::ArrayWriter arr_big_decimal(2, fluss::DataType::Decimal(22, 5));
+        arr_big_decimal.SetDecimal(0, "12345678901234567.12345");
+        arr_big_decimal.SetDecimal(1, "-99999999999999999.99999");
+        row.SetArray(2, std::move(arr_big_decimal));
+
+        // precision > 3 forces non-compact timestamp (millis + nanos-of-millis)
+        fluss::ArrayWriter arr_ts_nano(1, fluss::DataType::Timestamp(9));
+        auto ts_nano = fluss::Timestamp::FromMillisNanos(1769163227123, 456789);
+        arr_ts_nano.SetTimestampNtz(0, ts_nano);
+        row.SetArray(3, std::move(arr_ts_nano));
+
+        // IEEE 754 special values: NaN, +Infinity, -Infinity
+        fluss::ArrayWriter arr_float(3, fluss::DataType::Float());
+        arr_float.SetFloat32(0, std::numeric_limits<float>::quiet_NaN());
+        arr_float.SetFloat32(1, std::numeric_limits<float>::infinity());
+        arr_float.SetFloat32(2, -std::numeric_limits<float>::infinity());
+        row.SetArray(4, std::move(arr_float));
+
+        fluss::ArrayWriter arr_double(3, fluss::DataType::Double());
+        arr_double.SetFloat64(0, std::numeric_limits<double>::quiet_NaN());
+        arr_double.SetFloat64(1, std::numeric_limits<double>::infinity());
+        arr_double.SetFloat64(2, -std::numeric_limits<double>::infinity());
+        row.SetArray(5, std::move(arr_double));
+
+        // Fixed-length binary: one 4-byte value plus a null element
+        fluss::ArrayWriter arr_binary(2, fluss::DataType::Binary(4));
+        arr_binary.SetBytes(0, std::vector<uint8_t>{0xDE, 0xAD, 0xBE, 0xEF});
+        arr_binary.SetNull(1);
+        row.SetArray(6, std::move(arr_binary));
+
+        ASSERT_OK(append_writer.Append(row));
+    }
+
+    ASSERT_OK(append_writer.Flush());
+
+    auto scan = table.NewScan();
+    fluss::LogScanner scanner;
+    ASSERT_OK(scan.CreateLogScanner(scanner));
+    ASSERT_OK(scanner.Subscribe(0, 0));
+
+    fluss::ScanRecords records;
+    ASSERT_OK(scanner.Poll(10000, records));
+    ASSERT_EQ(records.Count(), 1u);
+
+    auto it = records.begin();
+    ASSERT_TRUE(it != records.end());
+    auto rec = *it;
+    const auto& rv = rec.row;
+
+    // Long strings: heap-encoded variable-length round-trip
+    EXPECT_EQ(rv.GetArraySize(1), 2u);
+    EXPECT_EQ(rv.GetArrayString(1, 0), "abcdefgh");
+    EXPECT_EQ(rv.GetArrayString(1, 1), "this is a much longer string that definitely exceeds inline");
+
+    // Non-compact decimal (precision 22 > MAX_COMPACT_PRECISION 18)
+    EXPECT_EQ(rv.GetArraySize(2), 2u);
+    EXPECT_EQ(rv.GetArrayDecimalString(2, 0), "12345678901234567.12345");
+    EXPECT_EQ(rv.GetArrayDecimalString(2, 1), "-99999999999999999.99999");
+
+    // Non-compact timestamp (precision 9 > MAX_COMPACT_TIMESTAMP_PRECISION 3)
+    EXPECT_EQ(rv.GetArraySize(3), 1u);
+    auto ts = rv.GetArrayTimestamp(3, 0);
+    EXPECT_EQ(ts.epoch_millis, 1769163227123);
+    EXPECT_EQ(ts.nano_of_millisecond, 456789);
+
+    // Float NaN / Infinity round-trip (NaN != NaN, so use isnan; sign is checked separately)
+    EXPECT_EQ(rv.GetArraySize(4), 3u);
+    EXPECT_TRUE(std::isnan(rv.GetArrayFloat32(4, 0)));
+    EXPECT_TRUE(std::isinf(rv.GetArrayFloat32(4, 1)));
+    EXPECT_GT(rv.GetArrayFloat32(4, 1), 0.0f);
+    EXPECT_TRUE(std::isinf(rv.GetArrayFloat32(4, 2)));
+    EXPECT_LT(rv.GetArrayFloat32(4, 2), 0.0f);
+
+    // Double NaN / Infinity round-trip (NaN != NaN, so use isnan; sign is checked separately)
+    EXPECT_EQ(rv.GetArraySize(5), 3u);
+    EXPECT_TRUE(std::isnan(rv.GetArrayFloat64(5, 0)));
+    EXPECT_TRUE(std::isinf(rv.GetArrayFloat64(5, 1)));
+    EXPECT_GT(rv.GetArrayFloat64(5, 1), 0.0);
+    EXPECT_TRUE(std::isinf(rv.GetArrayFloat64(5, 2)));
+    EXPECT_LT(rv.GetArrayFloat64(5, 2), 0.0);
+
+    // Fixed-length binary round-trip, including the null element
+    EXPECT_EQ(rv.GetArraySize(6), 2u);
+    auto bin = rv.GetArrayBytes(6, 0);
+    ASSERT_EQ(bin.size(), 4u);
+    EXPECT_EQ(bin[0], 0xDE);
+    EXPECT_EQ(bin[1], 0xAD);
+    EXPECT_EQ(bin[2], 0xBE);
+    EXPECT_EQ(bin[3], 0xEF);
+    EXPECT_TRUE(rv.IsArrayElementNull(6, 1));
+
+    ASSERT_OK(adm.DropTable(table_path, false));
+}
+
+TEST_F(LogTableTest, ArrayWriterOverflowDetection) {
+    // SetInt32 on TINYINT array must throw when value overflows i8 range (-128..127)
+    {
+        fluss::ArrayWriter tinyint_arr(1, fluss::DataType::TinyInt());
+        EXPECT_EQ(tinyint_arr.Size(), 1u);
+        bool threw = false;
+        try {
+            tinyint_arr.SetInt32(0, 1000);
+        } catch (const std::exception& e) {
+            threw = true;
+            std::string msg(e.what());
+            EXPECT_NE(msg.find("TINYINT"), std::string::npos);  // error must name the type
+        }
+        EXPECT_TRUE(threw);
+    }
+
+    // SetInt32 on SMALLINT array must throw when value overflows i16 range (-32768..32767)
+    {
+        fluss::ArrayWriter smallint_arr(1, fluss::DataType::SmallInt());
+        bool threw = false;
+        try {
+            smallint_arr.SetInt32(0, 40000);
+        } catch (const std::exception& e) {
+            threw = true;
+            std::string msg(e.what());
+            EXPECT_NE(msg.find("SMALLINT"), std::string::npos);  // error must name the type
+        }
+        EXPECT_TRUE(threw);
+    }
+
+    // Negative overflow: -200 doesn't fit TINYINT
+    {
+        fluss::ArrayWriter tinyint_arr(1, fluss::DataType::TinyInt());
+        bool threw = false;
+        try {
+            tinyint_arr.SetInt32(0, -200);
+        } catch (const std::exception&) {
+            threw = true;
+        }
+        EXPECT_TRUE(threw);
+    }
+
+    // Boundary values within range must succeed (TINYINT 127 and -128, SMALLINT 32767)
+    {
+        fluss::ArrayWriter tinyint_arr(1, fluss::DataType::TinyInt());
+        EXPECT_NO_THROW(tinyint_arr.SetInt32(0, 127));
+    }
+    {
+        fluss::ArrayWriter tinyint_arr(1, fluss::DataType::TinyInt());
+        EXPECT_NO_THROW(tinyint_arr.SetInt32(0, -128));
+    }
+    {
+        fluss::ArrayWriter smallint_arr(1, fluss::DataType::SmallInt());
+        EXPECT_NO_THROW(smallint_arr.SetInt32(0, 32767));
+    }
+}
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index d14cf16d13..c50d40cda2 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -212,6 +212,7 @@ Complete API reference for the Fluss C++ client.
 | `SetTimestampNtz(size_t idx, const Timestamp& value)`     | Set timestamp without timezone |
 | `SetTimestampLtz(size_t idx, const Timestamp& value)`     | Set timestamp with timezone    |
 | `SetDecimal(size_t idx, const std::string& value)`        | Set decimal from string        |
+| `SetArray(size_t idx, ArrayWriter&& writer)`              | Set array value (consumes the writer) |
 
 ### Name-Based Setters
 
@@ -258,6 +259,28 @@ Read-only row view for scan results. Provides zero-copy access to string and byt
 | `IsDecimal(size_t idx) -> bool`                            | Check if field is a decimal type|
 | `GetDecimalString(size_t idx) -> std::string`              | Get decimal as string at index |
 
+### Array Getters (Index-Based)
+
+| Method                                                             |  Description                              |
+|--------------------------------------------------------------------|-------------------------------------------|
+| `GetArraySize(size_t idx) -> size_t`                               | Get element count of array at index       |
+| `GetArrayElementType(size_t idx) -> TypeId`                        | Get element type of array at index        |
+| `IsArrayElementNull(size_t idx, size_t element) -> bool`           | Check if array element is null            |
+| `GetArrayBool(size_t idx, size_t element) -> bool`                 | Get boolean array element                 |
+| `GetArrayInt32(size_t idx, size_t element) -> int32_t`             | Get 32-bit integer array element          |
+| `GetArrayInt64(size_t idx, size_t element) -> int64_t`             | Get 64-bit integer array element          |
+| `GetArrayFloat32(size_t idx, size_t element) -> float`             | Get 32-bit float array element            |
+| `GetArrayFloat64(size_t idx, size_t element) -> double`            | Get 64-bit float array element            |
+| `GetArrayString(size_t idx, size_t element) -> std::string`        | Get string array element                  |
+| `GetArrayBytes(size_t idx, size_t element) -> std::vector<uint8_t>`| Get binary array element                  |
+| `GetArrayDate(size_t idx, size_t element) -> Date`                 | Get date array element                    |
+| `GetArrayTime(size_t idx, size_t element) -> Time`                 | Get time array element                    |
+| `GetArrayTimestamp(size_t idx, size_t element) -> Timestamp`       | Get timestamp array element               |
+| `GetArrayDecimalString(size_t idx, size_t element) -> std::string` | Get decimal array element as string       |
+| `GetArrayView(size_t idx) -> ArrayView`                            | Get owning ArrayView for nested access    |
+
+All array getters are also available by column name (e.g., `GetArraySize("col")`, `GetArrayView("col")`).
+
 ### Name-Based Getters
 
 | Method                                                  |  Description                       |
@@ -364,6 +387,10 @@ Read-only result for lookup operations. Provides zero-copy access to field value
 | `IsDecimal(size_t idx) -> bool`                            | Check if field is a decimal type|
 | `GetDecimalString(size_t idx) -> std::string`              | Get decimal as string at index |
 
+### Array Getters (Index-Based)
+
+Same array getters as [`RowView`](#array-getters-index-based) — `GetArraySize`, `GetArrayInt32`, `GetArrayView`, etc. Also available by column name.
+
 ### Name-Based Getters
 
 | Method                                                  |  Description                       |
@@ -456,14 +483,61 @@ Read-only result for lookup operations. Provides zero-copy access to field value
 | `DataType::Timestamp(int precision)`          | Timestamp without timezone         |
 | `DataType::TimestampLtz(int precision)`       | Timestamp with timezone            |
 | `DataType::Decimal(int precision, int scale)` | Decimal with precision and scale   |
+| `DataType::Array(DataType element)`           | Array of the given element type    |
 
 ### Accessors
 
-| Method               |  Description                                |
-|----------------------|---------------------------------------------|
-| `id() -> TypeId`     | Get the type ID                             |
-| `precision() -> int` | Get precision (for Decimal/Timestamp types) |
-| `scale() -> int`     | Get scale (for Decimal type)                |
+| Method                              |  Description                                |
+|-------------------------------------|---------------------------------------------|
+| `id() -> TypeId`                    | Get the type ID                             |
+| `precision() -> int`               | Get precision (for Decimal/Timestamp types) |
+| `scale() -> int`                   | Get scale (for Decimal type)                |
+| `element_type() -> const DataType*` | Get element type (for Array type, nullptr otherwise) |
+
+## `ArrayWriter`
+
+Write-only builder for array column values. Constructed with a fixed size and element type, then populated element-by-element. Move-only — consumed by `GenericRow::SetArray()` or `ArrayWriter::SetArray()` for nested arrays.
+
+| Method                                                    |  Description                              |
+|-----------------------------------------------------------|-------------------------------------------|
+| `ArrayWriter(size_t size, DataType element_type)`         | Create an array writer                    |
+| `SetNull(size_t idx)`                                     | Set element to null                       |
+| `SetBool(size_t idx, bool value)`                         | Set boolean element                       |
+| `SetInt32(size_t idx, int32_t value)`                     | Set 32-bit integer element                |
+| `SetInt64(size_t idx, int64_t value)`                     | Set 64-bit integer element                |
+| `SetFloat32(size_t idx, float value)`                     | Set 32-bit float element                  |
+| `SetFloat64(size_t idx, double value)`                    | Set 64-bit float element                  |
+| `SetString(size_t idx, const std::string& value)`         | Set string element                        |
+| `SetBytes(size_t idx, const std::vector<uint8_t>& value)` | Set binary element                        |
+| `SetDate(size_t idx, const Date& value)`                  | Set date element                          |
+| `SetTime(size_t idx, const Time& value)`                  | Set time element                          |
+| `SetTimestampNtz(size_t idx, const Timestamp& value)`     | Set timestamp without timezone element    |
+| `SetTimestampLtz(size_t idx, const Timestamp& value)`     | Set timestamp with timezone element       |
+| `SetDecimal(size_t idx, const std::string& value)`        | Set decimal element from string           |
+| `SetArray(size_t idx, ArrayWriter&& nested)`              | Set nested array element (consumes nested)|
+
+## `ArrayView`
+
+Read-only view over an array column value. Obtained from `RowView::GetArrayView()` or `LookupResult::GetArrayView()`, and recursively from `ArrayView::GetArray()` for nested `ARRAY<ARRAY<...>>` columns. Move-only.
+
+| Method                                                  |  Description                              |
+|---------------------------------------------------------|-------------------------------------------|
+| `Size() -> size_t`                                      | Get element count                         |
+| `ElementType() -> TypeId`                               | Get element type                          |
+| `IsNull(size_t element) -> bool`                        | Check if element is null                  |
+| `GetBool(size_t element) -> bool`                       | Get boolean element                       |
+| `GetInt32(size_t element) -> int32_t`                   | Get 32-bit integer element                |
+| `GetInt64(size_t element) -> int64_t`                   | Get 64-bit integer element                |
+| `GetFloat32(size_t element) -> float`                   | Get 32-bit float element                  |
+| `GetFloat64(size_t element) -> double`                  | Get 64-bit float element                  |
+| `GetString(size_t element) -> std::string`              | Get string element                        |
+| `GetBytes(size_t element) -> std::vector<uint8_t>`      | Get binary element                        |
+| `GetDate(size_t element) -> Date`                       | Get date element                          |
+| `GetTime(size_t element) -> Time`                       | Get time element                          |
+| `GetTimestamp(size_t element) -> Timestamp`              | Get timestamp element                     |
+| `GetTimestampLtz(size_t element) -> Timestamp`          | Get timestamp with timezone element       |
+| `GetDecimalString(size_t element) -> std::string`       | Get decimal element as string             |
+| `GetArray(size_t element) -> ArrayView`                 | Get nested array as child ArrayView       |
 
 ## `TablePath`
 
@@ -632,6 +706,7 @@ inline const char* ChangeTypeShortString(ChangeType ct) {
 | `Timestamp`    | Timestamp without timezone |
 | `TimestampLtz` | Timestamp with timezone    |
 | `Decimal`      | Decimal                    |
+| `Array`        | Array of elements          |
 
 ### `ChangeType`
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/data-types.md b/fluss-rust/website/docs/user-guide/cpp/data-types.md
index bfb296f2b9..400b2ecf07 100644
--- a/fluss-rust/website/docs/user-guide/cpp/data-types.md
+++ b/fluss-rust/website/docs/user-guide/cpp/data-types.md
@@ -21,6 +21,7 @@ sidebar_position: 3
 | `DataType::Timestamp()`    | Timestamp without timezone (default precision 6, microseconds) |
 | `DataType::TimestampLtz()` | Timestamp with timezone (default precision 6, microseconds)    |
 | `DataType::Decimal(p, s)`  | Decimal with precision and scale                               |
+| `DataType::Array(element)` | Array of the given element type (supports nesting)             |
 
 ## GenericRow Setters
 
@@ -38,6 +39,30 @@ row.SetString(6, "hello");
 row.SetBytes(7, {0x01, 0x02, 0x03});
 ```
 
+### Array Columns
+
+Array values are built element-by-element using `ArrayWriter`, then attached to the row via `SetArray`:
+
+```cpp
+fluss::ArrayWriter aw(3, fluss::DataType::Int());
+aw.SetInt32(0, 10);
+aw.SetInt32(1, 20);
+aw.SetNull(2);
+row.SetArray(8, std::move(aw));
+```
+
+For nested arrays (e.g., `ARRAY<ARRAY<INT>>`), build inner arrays first:
+
+```cpp
+fluss::ArrayWriter inner(2, fluss::DataType::Int());
+inner.SetInt32(0, 1);
+inner.SetInt32(1, 2);
+
+fluss::ArrayWriter outer(1, fluss::DataType::Array(fluss::DataType::Int()));
+outer.SetArray(0, std::move(inner));
+row.SetArray(9, std::move(outer));
+```
+
 ## Name-Based Setters
 
 When using `table.NewRow()`, you can set fields by column name. The setter automatically routes to the correct type based on the schema:
@@ -109,6 +134,37 @@ if (result.Found()) {
 }
 ```
 
+### Reading Array Columns
+
+Array columns can be read element-by-element using index-based getters, or via an `ArrayView` for recursive access:
+
+```cpp
+// Element-by-element access (flat arrays)
+size_t len = rec.row.GetArraySize(8);
+for (size_t i = 0; i < len; i++) {
+    if (!rec.row.IsArrayElementNull(8, i)) {
+        int32_t val = rec.row.GetArrayInt32(8, i);
+    }
+}
+
+// ArrayView for nested arrays or when you need a standalone handle
+fluss::ArrayView av = rec.row.GetArrayView(8);
+for (size_t i = 0; i < av.Size(); i++) {
+    if (!av.IsNull(i)) {
+        int32_t val = av.GetInt32(i);
+    }
+}
+
+// Nested arrays: ArrayView::GetArray() returns a child ArrayView
+fluss::ArrayView outer = rec.row.GetArrayView(9);
+for (size_t i = 0; i < outer.Size(); i++) {
+    fluss::ArrayView inner = outer.GetArray(i);
+    for (size_t j = 0; j < inner.Size(); j++) {
+        int32_t val = inner.GetInt32(j);  // throws on a null element; check inner.IsNull(j) first
+    }
+}
+```
+
 ## TypeId Enum
 
 `TinyInt` and `SmallInt` values are widened to `int32_t` on read.
@@ -129,6 +185,7 @@ if (result.Found()) {
 | `Timestamp`     | `Timestamp`                                 | `GetTimestamp(idx)`       |
 | `TimestampLtz`  | `Timestamp`                                 | `GetTimestamp(idx)`       |
 | `Decimal`       | `std::string`                               | `GetDecimalString(idx)`   |
+| `Array`         | `ArrayView`                                 | `GetArrayView(idx)`       |
 
 ## Type Checking
 

From 746391317152936a7fcd8201c48444b9e9b6ae48 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Sat, 25 Apr 2026 10:37:02 +0800
Subject: [PATCH 243/287] build(deps): bump actions/download-artifact from 4 to
 8 (#408)

---
 fluss-rust/.github/workflows/release_python.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fluss-rust/.github/workflows/release_python.yml b/fluss-rust/.github/workflows/release_python.yml
index 9aaaf6f348..5a5ae7a72d 100644
--- a/fluss-rust/.github/workflows/release_python.yml
+++ b/fluss-rust/.github/workflows/release_python.yml
@@ -151,7 +151,7 @@ jobs:
     needs: [version-check, sdist, wheels]
     if: startsWith(github.ref, 'refs/tags/')
     steps:
-      - uses: actions/download-artifact@v4
+      - uses: actions/download-artifact@v8
         with:
           pattern: wheels-*
           merge-multiple: true

From 035fcfa4b50029d654173f218ec738f2ef526ed1 Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sun, 26 Apr 2026 04:00:58 +0200
Subject: [PATCH 244/287] feat: [metrics] Create metrics framework and add
 connection metrics (#407)

---
 fluss-rust/Cargo.toml                         |   1 +
 fluss-rust/crates/fluss/Cargo.toml            |   2 +
 fluss-rust/crates/fluss/src/lib.rs            |   1 +
 fluss-rust/crates/fluss/src/metrics.rs        | 270 ++++++++++
 .../crates/fluss/src/rpc/message/header.rs    |   3 +-
 fluss-rust/crates/fluss/src/rpc/mod.rs        |   1 +
 .../crates/fluss/src/rpc/server_connection.rs | 484 +++++++++++++++++-
 7 files changed, 753 insertions(+), 9 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/metrics.rs

diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 0aa7e9cfa7..8f811c82ce 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -38,5 +38,6 @@ arrow = { version = "57.0.0", features = ["ipc_compression", "ffi"] }
 bigdecimal = "0.4"
 serde = { version = "1.0", features = ["derive"] }
 serde_json = "1.0"
+metrics = "0.24"
 opendal = "0.53"
 jiff = { version = "0.2" }
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index 040599ed06..a47fc238f2 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -57,6 +57,7 @@ serde = { workspace = true, features = ["rc"] }
 serde_json = { workspace = true }
 thiserror = "1.0"
 log = { version = "0.4", features = ["kv_std"] }
+metrics = { workspace = true }
 tokio = { workspace = true }
 parking_lot = "0.12"
 bytes = "1.10.1"
@@ -79,6 +80,7 @@ strum_macros = "0.26"
 jiff = { workspace = true, features = ["js"] }
 
 [dev-dependencies]
+metrics-util = "0.20"
 fluss-test-cluster = { path = "../fluss-test-cluster" }
 
 [build-dependencies]
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index 6537189e61..0266e0de6e 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -132,6 +132,7 @@ pub use cluster::{ServerNode, ServerType};
 
 pub mod config;
 pub mod error;
+pub mod metrics;
 
 mod bucketing;
 mod compression;
diff --git a/fluss-rust/crates/fluss/src/metrics.rs b/fluss-rust/crates/fluss/src/metrics.rs
new file mode 100644
index 0000000000..756e2db561
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/metrics.rs
@@ -0,0 +1,270 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Metric name constants and helpers for fluss-rust client instrumentation.
+//!
+//! Uses the [`metrics`] crate facade pattern: library code emits metrics via
+//! `counter!`/`gauge!`/`histogram!` macros, and the application installs a
+//! recorder (e.g. `metrics-exporter-prometheus`) to collect them. When no
+//! recorder is installed, all metric calls are no-ops with negligible overhead.
+
+use crate::rpc::ApiKey;
+
+// ---------------------------------------------------------------------------
+// Label keys
+// ---------------------------------------------------------------------------
+
+pub const LABEL_API_KEY: &str = "api_key";
+
+// ---------------------------------------------------------------------------
+// Connection / RPC metrics
+//
+// Java reference: ConnectionMetrics.java, ClientMetricGroup.java, MetricNames.java
+//
+// Byte counting matches Java semantics: both sides count only the API message
+// body, excluding the protocol header and framing.
+// Java: rawRequest.totalSize() / response.totalSize() (see MessageCodec.java).
+// Rust: buf.len() - REQUEST_HEADER_LENGTH for sent bytes,
+//       buffer.len() - cursor.position() for received bytes.
+// ---------------------------------------------------------------------------
+
+pub const CLIENT_REQUESTS_TOTAL: &str = "fluss.client.requests.total";
+pub const CLIENT_RESPONSES_TOTAL: &str = "fluss.client.responses.total";
+pub const CLIENT_BYTES_SENT_TOTAL: &str = "fluss.client.bytes_sent.total";
+pub const CLIENT_BYTES_RECEIVED_TOTAL: &str = "fluss.client.bytes_received.total";
+pub const CLIENT_REQUEST_LATENCY_MS: &str = "fluss.client.request_latency_ms";
+pub const CLIENT_REQUESTS_IN_FLIGHT: &str = "fluss.client.requests_in_flight";
+
+/// Maps an [`ApiKey`] to its `api_key` metric label value. Only the keys in
+/// Java's `ConnectionMetrics.REPORT_API_KEYS` filter (`ProduceLog`, `FetchLog`,
+/// `PutKv`, `Lookup`) get a label; every other key (admin/metadata/auth calls)
+/// returns `None` to avoid metric cardinality bloat.
+pub(crate) fn api_key_label(api_key: ApiKey) -> Option<&'static str> {
+    match api_key {
+        ApiKey::ProduceLog => Some("produce_log"),
+        ApiKey::FetchLog => Some("fetch_log"),
+        ApiKey::PutKv => Some("put_kv"),
+        ApiKey::Lookup => Some("lookup"),
+        _ => None,
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use metrics_util::debugging::DebuggingRecorder;
+
+    macro_rules! find_counter {
+        ($entries:expr, $name:expr) => {
+            $entries.iter().find_map(|(key, _, _, val)| {
+                if key.key().name() == $name {
+                    match val {
+                        metrics_util::debugging::DebugValue::Counter(v) => Some(*v),
+                        _ => None,
+                    }
+                } else {
+                    None
+                }
+            })
+        };
+    }
+
+    macro_rules! find_histogram {
+        ($entries:expr, $name:expr) => {
+            $entries.iter().find_map(|(key, _, _, val)| {
+                if key.key().name() == $name {
+                    match val {
+                        metrics_util::debugging::DebugValue::Histogram(v) => {
+                            Some(v.iter().map(|f| f.into_inner()).collect::<Vec<_>>())
+                        }
+                        _ => None,
+                    }
+                } else {
+                    None
+                }
+            })
+        };
+    }
+
+    macro_rules! find_gauge {
+        ($entries:expr, $name:expr) => {
+            $entries.iter().find_map(|(key, _, _, val)| {
+                if key.key().name() == $name {
+                    match val {
+                        metrics_util::debugging::DebugValue::Gauge(g) => Some(g.into_inner()),
+                        _ => None,
+                    }
+                } else {
+                    None
+                }
+            })
+        };
+    }
+
+    #[test]
+    fn reportable_api_keys_return_label() {
+        assert_eq!(api_key_label(ApiKey::ProduceLog), Some("produce_log"));
+        assert_eq!(api_key_label(ApiKey::FetchLog), Some("fetch_log"));
+        assert_eq!(api_key_label(ApiKey::PutKv), Some("put_kv"));
+        assert_eq!(api_key_label(ApiKey::Lookup), Some("lookup"));
+    }
+
+    #[test]
+    fn non_reportable_api_keys_return_none() {
+        assert_eq!(api_key_label(ApiKey::MetaData), None);
+        assert_eq!(api_key_label(ApiKey::CreateTable), None);
+        assert_eq!(api_key_label(ApiKey::Authenticate), None);
+        assert_eq!(api_key_label(ApiKey::ListDatabases), None);
+        assert_eq!(api_key_label(ApiKey::GetTable), None);
+    }
+
+    #[test]
+    fn reportable_request_records_all_connection_metrics() {
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            let label = api_key_label(ApiKey::ProduceLog).unwrap();
+
+            metrics::counter!(CLIENT_REQUESTS_TOTAL, LABEL_API_KEY => label).increment(1);
+            metrics::counter!(CLIENT_BYTES_SENT_TOTAL, LABEL_API_KEY => label).increment(256);
+            metrics::gauge!(CLIENT_REQUESTS_IN_FLIGHT, LABEL_API_KEY => label).increment(1.0);
+
+            metrics::counter!(CLIENT_RESPONSES_TOTAL, LABEL_API_KEY => label).increment(1);
+            metrics::counter!(CLIENT_BYTES_RECEIVED_TOTAL, LABEL_API_KEY => label).increment(128);
+            metrics::histogram!(CLIENT_REQUEST_LATENCY_MS, LABEL_API_KEY => label).record(42.5);
+            metrics::gauge!(CLIENT_REQUESTS_IN_FLIGHT, LABEL_API_KEY => label).decrement(1.0);
+        });
+
+        let snapshot = snapshotter.snapshot();
+        let entries: Vec<_> = snapshot.into_vec();
+
+        assert_eq!(find_counter!(entries, CLIENT_REQUESTS_TOTAL), Some(1));
+        assert_eq!(find_counter!(entries, CLIENT_RESPONSES_TOTAL), Some(1));
+        assert_eq!(find_counter!(entries, CLIENT_BYTES_SENT_TOTAL), Some(256));
+        assert_eq!(
+            find_counter!(entries, CLIENT_BYTES_RECEIVED_TOTAL),
+            Some(128)
+        );
+        assert_eq!(
+            find_histogram!(entries, CLIENT_REQUEST_LATENCY_MS),
+            Some(vec![42.5])
+        );
+        assert_eq!(find_gauge!(entries, CLIENT_REQUESTS_IN_FLIGHT), Some(0.0));
+
+        let has_label = entries.iter().all(|(key, _, _, _)| {
+            key.key()
+                .labels()
+                .any(|l| l.key() == LABEL_API_KEY && l.value() == "produce_log")
+        });
+        assert!(has_label, "all metrics must carry the api_key label");
+    }
+
+    #[test]
+    fn non_reportable_request_records_no_metrics() {
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            let label = api_key_label(ApiKey::MetaData);
+            assert!(label.is_none());
+            // When label is None, no metrics calls are made (matching request() logic).
+        });
+
+        let snapshot = snapshotter.snapshot();
+        assert!(
+            snapshot.into_vec().is_empty(),
+            "non-reportable API keys must not produce metrics"
+        );
+    }
+
+    #[test]
+    fn inflight_gauge_nets_to_zero_after_balanced_calls() {
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            let label = api_key_label(ApiKey::FetchLog).unwrap();
+
+            // Simulate 3 concurrent requests completing
+            for _ in 0..3 {
+                metrics::gauge!(CLIENT_REQUESTS_IN_FLIGHT, LABEL_API_KEY => label).increment(1.0);
+            }
+            for _ in 0..3 {
+                metrics::gauge!(CLIENT_REQUESTS_IN_FLIGHT, LABEL_API_KEY => label).decrement(1.0);
+            }
+        });
+
+        let snapshot = snapshotter.snapshot();
+        let entries: Vec<_> = snapshot.into_vec();
+        assert_eq!(
+            find_gauge!(entries, CLIENT_REQUESTS_IN_FLIGHT),
+            Some(0.0),
+            "in-flight gauge should be 0 after balanced inc/dec"
+        );
+    }
+
+    #[test]
+    fn different_api_keys_produce_separate_metric_series() {
+        use std::collections::HashMap;
+
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            let produce_label = api_key_label(ApiKey::ProduceLog).unwrap();
+            let fetch_label = api_key_label(ApiKey::FetchLog).unwrap();
+
+            metrics::counter!(CLIENT_REQUESTS_TOTAL, LABEL_API_KEY => produce_label).increment(5);
+            metrics::counter!(CLIENT_REQUESTS_TOTAL, LABEL_API_KEY => fetch_label).increment(3);
+        });
+
+        let snapshot = snapshotter.snapshot();
+        let entries: Vec<_> = snapshot.into_vec();
+
+        let request_entries: Vec<_> = entries
+            .iter()
+            .filter(|(key, _, _, _)| key.key().name() == CLIENT_REQUESTS_TOTAL)
+            .collect();
+
+        assert_eq!(
+            request_entries.len(),
+            2,
+            "produce_log and fetch_log should be separate metric series"
+        );
+
+        let mut counter_by_api_key: HashMap<String, u64> = HashMap::new();
+        for (key, _, _, val) in request_entries {
+            let api_key = key
+                .key()
+                .labels()
+                .find(|label| label.key() == LABEL_API_KEY)
+                .map(|label| label.value())
+                .expect("requests total metric must include api_key label");
+
+            let counter_value = match val {
+                metrics_util::debugging::DebugValue::Counter(v) => *v,
+                other => panic!("expected Counter, got {other:?}"),
+            };
+
+            counter_by_api_key.insert(api_key.to_string(), counter_value);
+        }
+
+        assert_eq!(counter_by_api_key.get("produce_log"), Some(&5));
+        assert_eq!(counter_by_api_key.get("fetch_log"), Some(&3));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/message/header.rs b/fluss-rust/crates/fluss/src/rpc/message/header.rs
index 77bda7c78c..2f5848aa28 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/header.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/header.rs
@@ -23,8 +23,7 @@ use crate::rpc::message::{ReadVersionedType, WriteVersionedType};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
-#[allow(dead_code)]
-const REQUEST_HEADER_LENGTH: i32 = 8;
+pub(crate) const REQUEST_HEADER_LENGTH: usize = 8;
 const SUCCESS_RESPONSE: u8 = 0;
 #[allow(dead_code)]
 const ERROR_RESPONSE: u8 = 1;
diff --git a/fluss-rust/crates/fluss/src/rpc/mod.rs b/fluss-rust/crates/fluss/src/rpc/mod.rs
index 86e13b1c4c..6f3a88d1ba 100644
--- a/fluss-rust/crates/fluss/src/rpc/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/mod.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 mod api_key;
+pub(crate) use api_key::ApiKey;
 mod api_version;
 pub mod error;
 mod fluss_api_error;
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index 13c5d9ca09..46d99c0d27 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -17,12 +17,18 @@
 
 use crate::cluster::ServerNode;
 use crate::error::Error;
+use crate::metrics::{
+    CLIENT_BYTES_RECEIVED_TOTAL, CLIENT_BYTES_SENT_TOTAL, CLIENT_REQUEST_LATENCY_MS,
+    CLIENT_REQUESTS_IN_FLIGHT, CLIENT_REQUESTS_TOTAL, CLIENT_RESPONSES_TOTAL, LABEL_API_KEY,
+    api_key_label,
+};
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::error::RpcError;
 use crate::rpc::error::RpcError::ConnectionError;
 use crate::rpc::frame::{AsyncMessageRead, AsyncMessageWrite};
 use crate::rpc::message::{
-    ReadVersionedType, RequestBody, RequestHeader, ResponseHeader, WriteVersionedType,
+    REQUEST_HEADER_LENGTH, ReadVersionedType, RequestBody, RequestHeader, ResponseHeader,
+    WriteVersionedType,
 };
 use crate::rpc::transport::Transport;
 use futures::future::BoxFuture;
@@ -35,7 +41,7 @@ use std::ops::DerefMut;
 use std::sync::Arc;
 use std::sync::atomic::{AtomicI32, Ordering};
 use std::task::Poll;
-use std::time::Duration;
+use std::time::{Duration, Instant};
 use tokio::io::{AsyncRead, AsyncWrite, AsyncWriteExt, BufStream, WriteHalf};
 use tokio::sync::Mutex as AsyncMutex;
 use tokio::sync::oneshot::{Sender, channel};
@@ -217,6 +223,59 @@ struct ActiveRequest {
     channel: Sender<Result<Response, RpcError>>,
 }
 
+/// Tracks per-request connection metrics and ensures in-flight gauge cleanup on drop.
+struct RequestMetricsLifecycle {
+    label: Option<&'static str>,
+    start: Instant,
+    completed: bool,
+}
+
+impl RequestMetricsLifecycle {
+    /// Records request-start metrics for reportable API keys and starts the latency clock.
+    fn begin(api_key: crate::rpc::ApiKey, request_bytes: u64) -> Self {
+        let label = api_key_label(api_key);
+        if let Some(api_label) = label {
+            metrics::counter!(CLIENT_REQUESTS_TOTAL, LABEL_API_KEY => api_label).increment(1);
+            metrics::counter!(CLIENT_BYTES_SENT_TOTAL, LABEL_API_KEY => api_label)
+                .increment(request_bytes);
+            metrics::gauge!(CLIENT_REQUESTS_IN_FLIGHT, LABEL_API_KEY => api_label).increment(1.0);
+        }
+        Self {
+            label,
+            start: Instant::now(),
+            completed: false,
+        }
+    }
+
+    /// Records response metrics once; a no-op for unlabeled requests and repeated calls.
+    fn complete(&mut self, response_bytes: u64) {
+        let label = match self.label {
+            Some(label) if !self.completed => label,
+            _ => return,
+        };
+
+        metrics::counter!(CLIENT_RESPONSES_TOTAL, LABEL_API_KEY => label).increment(1);
+        metrics::counter!(CLIENT_BYTES_RECEIVED_TOTAL, LABEL_API_KEY => label)
+            .increment(response_bytes);
+        metrics::gauge!(CLIENT_REQUESTS_IN_FLIGHT, LABEL_API_KEY => label).decrement(1.0);
+        metrics::histogram!(CLIENT_REQUEST_LATENCY_MS, LABEL_API_KEY => label)
+            .record(self.start.elapsed().as_secs_f64() * 1000.0);
+        self.completed = true;
+    }
+}
+
+impl Drop for RequestMetricsLifecycle {
+    /// Releases the in-flight slot when the lifecycle is dropped before
+    /// `complete` finished it, so the gauge is decremented exactly once.
+    fn drop(&mut self) {
+        let pending_label = if self.completed { None } else { self.label };
+        if let Some(label) = pending_label {
+            metrics::gauge!(CLIENT_REQUESTS_IN_FLIGHT, LABEL_API_KEY => label).decrement(1.0);
+            self.completed = true;
+        }
+    }
+}
+
 #[derive(Debug)]
 enum ConnectionState {
     /// Currently active requests by request ID.
@@ -386,12 +445,27 @@ where
             ConnectionState::Poison(e) => return Err(RpcError::Poisoned(Arc::clone(e)).into()),
         }
 
-        self.send_message(buf).await?;
+        // count only the API message body, excluding the protocol header.
+        let request_body_bytes = buf.len().saturating_sub(REQUEST_HEADER_LENGTH) as u64;
+        let mut request_metrics = RequestMetricsLifecycle::begin(R::API_KEY, request_body_bytes);
+
+        self.send_message(buf)
+            .await
+            .inspect_err(|_| request_metrics.complete(0))?;
         _cleanup_on_cancel.message_sent();
-        let mut response = rx.await.map_err(|e| Error::UnexpectedError {
-            message: "Got recvError, some one close the channel".to_string(),
-            source: Some(Box::new(e)),
-        })??;
+        let mut response = rx
+            .await
+            .map_err(|e| Error::UnexpectedError {
+                message: "Receive error: response channel closed".to_string(),
+                source: Some(Box::new(e)),
+            })
+            .and_then(|r| r.map_err(Error::from))
+            .inspect_err(|_| request_metrics.complete(0))?;
+
+        // count only the API message body, excluding the response header.
+        let response_bytes =
+            (response.data.get_ref().len() as u64).saturating_sub(response.data.position());
+        request_metrics.complete(response_bytes);
 
         if let Some(error_response) = response.header.error_response {
             return Err(Error::FlussAPIError {
@@ -561,3 +635,399 @@ impl Drop for CleanupRequestStateOnCancel {
         }
     }
 }
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::error::Error;
+    use crate::rpc::ApiKey;
+    use crate::rpc::api_version::ApiVersion;
+    use crate::rpc::frame::{ReadError, WriteError};
+    use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+    use metrics::{SharedString, Unit};
+    use metrics_util::CompositeKey;
+    use metrics_util::debugging::{DebugValue, DebuggingRecorder};
+    use std::sync::OnceLock;
+    use tokio::io::{AsyncReadExt, AsyncWriteExt, BufStream};
+    use tokio::sync::Mutex as AsyncMutex;
+
+    // -- Test-only request/response types --------------------------------
+
+    struct TestProduceRequest;
+    struct TestProduceResponse;
+
+    impl RequestBody for TestProduceRequest {
+        type ResponseBody = TestProduceResponse;
+        const API_KEY: ApiKey = ApiKey::ProduceLog;
+        const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+    }
+
+    impl WriteVersionedType<Vec<u8>> for TestProduceRequest {
+        fn write_versioned(&self, _w: &mut Vec<u8>, _v: ApiVersion) -> Result<(), WriteError> {
+            Ok(())
+        }
+    }
+
+    impl ReadVersionedType<Cursor<Vec<u8>>> for TestProduceResponse {
+        fn read_versioned(_r: &mut Cursor<Vec<u8>>, _v: ApiVersion) -> Result<Self, ReadError> {
+            Ok(TestProduceResponse)
+        }
+    }
+
+    struct TestMetadataRequest;
+    struct TestMetadataResponse;
+
+    impl RequestBody for TestMetadataRequest {
+        type ResponseBody = TestMetadataResponse;
+        const API_KEY: ApiKey = ApiKey::MetaData;
+        const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+    }
+
+    impl WriteVersionedType<Vec<u8>> for TestMetadataRequest {
+        fn write_versioned(&self, _w: &mut Vec<u8>, _v: ApiVersion) -> Result<(), WriteError> {
+            Ok(())
+        }
+    }
+
+    impl ReadVersionedType<Cursor<Vec<u8>>> for TestMetadataResponse {
+        fn read_versioned(_r: &mut Cursor<Vec<u8>>, _v: ApiVersion) -> Result<Self, ReadError> {
+            Ok(TestMetadataResponse)
+        }
+    }
+
+    // -- Mock server -----------------------------------------------------
+
+    /// Reads framed requests and echoes back minimal success responses.
+    async fn mock_echo_server(mut stream: tokio::io::DuplexStream) {
+        loop {
+            let mut len_buf = [0u8; 4];
+            if stream.read_exact(&mut len_buf).await.is_err() {
+                return;
+            }
+            let len = i32::from_be_bytes(len_buf) as usize;
+
+            let mut payload = vec![0u8; len];
+            if stream.read_exact(&mut payload).await.is_err() {
+                return;
+            }
+
+            // Header layout: api_key(2) + api_version(2) + request_id(4)
+            let request_id = i32::from_be_bytes([payload[4], payload[5], payload[6], payload[7]]);
+
+            // Response: resp_type(1, 0=success) + request_id(4)
+            let mut resp = Vec::with_capacity(5);
+            resp.push(0u8);
+            resp.extend_from_slice(&request_id.to_be_bytes());
+
+            let resp_len = (resp.len() as i32).to_be_bytes();
+            if stream.write_all(&resp_len).await.is_err()
+                || stream.write_all(&resp).await.is_err()
+                || stream.flush().await.is_err()
+            {
+                return;
+            }
+        }
+    }
+
+    /// Reads framed requests and echoes back error responses (resp_type=1).
+    async fn mock_error_server(mut stream: tokio::io::DuplexStream) {
+        use prost::Message;
+
+        loop {
+            let mut len_buf = [0u8; 4];
+            if stream.read_exact(&mut len_buf).await.is_err() {
+                return;
+            }
+            let len = i32::from_be_bytes(len_buf) as usize;
+
+            let mut payload = vec![0u8; len];
+            if stream.read_exact(&mut payload).await.is_err() {
+                return;
+            }
+
+            let request_id = i32::from_be_bytes([payload[4], payload[5], payload[6], payload[7]]);
+
+            let err = crate::proto::ErrorResponse {
+                error_code: 1,
+                error_message: Some("test error".to_string()),
+            };
+            let mut err_buf = Vec::new();
+            err.encode(&mut err_buf).expect("ErrorResponse encode");
+
+            let mut resp = Vec::with_capacity(5 + err_buf.len());
+            resp.push(1u8); // ERROR_RESPONSE
+            resp.extend_from_slice(&request_id.to_be_bytes());
+            resp.extend(err_buf);
+
+            let resp_len = (resp.len() as i32).to_be_bytes();
+            if stream.write_all(&resp_len).await.is_err()
+                || stream.write_all(&resp).await.is_err()
+                || stream.flush().await.is_err()
+            {
+                return;
+            }
+        }
+    }
+
+    // -- Recorder setup --------------------------------------------------
+
+    /// Shared test recorder (installed once per test binary).
+    static TEST_SNAPSHOTTER: OnceLock<metrics_util::debugging::Snapshotter> = OnceLock::new();
+    static TEST_LOCK: OnceLock<AsyncMutex<()>> = OnceLock::new();
+
+    fn test_snapshotter() -> &'static metrics_util::debugging::Snapshotter {
+        TEST_SNAPSHOTTER.get_or_init(|| {
+            let recorder = DebuggingRecorder::new();
+            let snapshotter = recorder.snapshotter();
+            recorder
+                .install()
+                .expect("debugging recorder install should succeed in this test binary");
+            snapshotter
+        })
+    }
+
+    fn test_lock() -> &'static AsyncMutex<()> {
+        TEST_LOCK.get_or_init(|| AsyncMutex::new(()))
+    }
+
+    type SnapshotEntry = (CompositeKey, Option<Unit>, Option<SharedString>, DebugValue);
+
+    /// True when `key` has a `LABEL_API_KEY` label whose value equals `label`.
+    fn has_api_label(key: &CompositeKey, label: &str) -> bool {
+        let mut labels = key.key().labels();
+        labels.any(|l| l.key() == LABEL_API_KEY && l.value() == label)
+    }
+
+    /// Returns the first counter sample named `metric_name` that carries the
+    /// `label` API-key label, or 0 when the snapshot has no such counter.
+    fn counter_for_label(entries: &[SnapshotEntry], metric_name: &str, label: &str) -> u64 {
+        for (key, _, _, value) in entries {
+            if key.key().name() != metric_name || !has_api_label(key, label) {
+                continue;
+            }
+            if let DebugValue::Counter(count) = value {
+                return *count;
+            }
+        }
+        // No matching series was recorded.
+        0
+    }
+
+    /// Returns the first gauge sample named `metric_name` that carries the
+    /// `label` API-key label, or 0.0 when the snapshot has no such gauge.
+    fn gauge_for_label(entries: &[SnapshotEntry], metric_name: &str, label: &str) -> f64 {
+        for (key, _, _, value) in entries {
+            if key.key().name() != metric_name || !has_api_label(key, label) {
+                continue;
+            }
+            if let DebugValue::Gauge(level) = value {
+                return level.into_inner();
+            }
+        }
+        // No matching series was recorded.
+        0.0
+    }
+
+    /// Adds up every counter sample named `metric_name`, across all label sets.
+    fn counter_sum(entries: &[SnapshotEntry], metric_name: &str) -> u64 {
+        let mut total = 0u64;
+        for (key, _, _, value) in entries {
+            if key.key().name() != metric_name {
+                continue;
+            }
+            // Non-counter samples sharing the name are ignored.
+            if let DebugValue::Counter(count) = value {
+                total += *count;
+            }
+        }
+        total
+    }
+
+    /// Returns how many samples the first histogram named `metric_name` with
+    /// the `label` API-key label holds, or 0 when there is no such histogram.
+    fn histogram_sample_count_for_label(
+        entries: &[SnapshotEntry],
+        metric_name: &str,
+        label: &str,
+    ) -> usize {
+        for (key, _, _, value) in entries {
+            if key.key().name() != metric_name || !has_api_label(key, label) {
+                continue;
+            }
+            if let DebugValue::Histogram(samples) = value {
+                return samples.len();
+            }
+        }
+        // No matching series was recorded.
+        0
+    }
+
+    // -- Tests -----------------------------------------------------------
+
+    #[tokio::test]
+    async fn request_records_metrics_for_reportable_api_key() {
+        let _test_guard = test_lock().lock().await;
+        let snapshotter = test_snapshotter();
+
+        let (client, server) = tokio::io::duplex(4096);
+        tokio::spawn(mock_echo_server(server));
+
+        let conn = ServerConnectionInner::new(BufStream::new(client), usize::MAX, Arc::from("t"));
+
+        let before: Vec<_> = snapshotter.snapshot().into_vec();
+        let request_before = counter_for_label(&before, CLIENT_REQUESTS_TOTAL, "produce_log");
+        let response_before = counter_for_label(&before, CLIENT_RESPONSES_TOTAL, "produce_log");
+        let latency_samples_before =
+            histogram_sample_count_for_label(&before, CLIENT_REQUEST_LATENCY_MS, "produce_log");
+
+        conn.request(TestProduceRequest).await.unwrap();
+
+        let after: Vec<_> = snapshotter.snapshot().into_vec();
+        let request_after = counter_for_label(&after, CLIENT_REQUESTS_TOTAL, "produce_log");
+        let response_after = counter_for_label(&after, CLIENT_RESPONSES_TOTAL, "produce_log");
+        let latency_samples_after =
+            histogram_sample_count_for_label(&after, CLIENT_REQUEST_LATENCY_MS, "produce_log");
+        assert_eq!(
+            request_after - request_before,
+            1,
+            "produce_log request counter should increment by 1"
+        );
+        assert_eq!(
+            response_after - response_before,
+            1,
+            "produce_log completion counter should increment by 1"
+        );
+        assert_eq!(
+            latency_samples_after - latency_samples_before,
+            1,
+            "request latency histogram sample count should increment by 1 for produce_log"
+        );
+    }
+
+    #[tokio::test]
+    async fn request_skips_metrics_for_non_reportable_api_key() {
+        let _test_guard = test_lock().lock().await;
+        let snapshotter = test_snapshotter();
+
+        let (client, server) = tokio::io::duplex(4096);
+        tokio::spawn(mock_echo_server(server));
+
+        let conn = ServerConnectionInner::new(BufStream::new(client), usize::MAX, Arc::from("t"));
+        let before: Vec<_> = snapshotter.snapshot().into_vec();
+        let request_sum_before = counter_sum(&before, CLIENT_REQUESTS_TOTAL);
+        let response_sum_before = counter_sum(&before, CLIENT_RESPONSES_TOTAL);
+
+        conn.request(TestMetadataRequest).await.unwrap();
+
+        let snapshot: Vec<_> = snapshotter.snapshot().into_vec();
+        let request_sum_after = counter_sum(&snapshot, CLIENT_REQUESTS_TOTAL);
+        let response_sum_after = counter_sum(&snapshot, CLIENT_RESPONSES_TOTAL);
+        assert_eq!(
+            request_sum_after, request_sum_before,
+            "non-reportable API keys must not change request counters"
+        );
+        assert_eq!(
+            response_sum_after, response_sum_before,
+            "non-reportable API keys must not change response counters"
+        );
+
+        // No metric entry should carry a non-reportable API key label.
+        let non_reportable = snapshot
+            .iter()
+            .any(|(key, _, _, _)| has_api_label(key, "metadata"));
+        assert!(
+            !non_reportable,
+            "non-reportable API keys must not appear in metrics"
+        );
+    }
+
+    #[tokio::test]
+    async fn request_records_completion_metrics_when_send_fails() {
+        let _test_guard = test_lock().lock().await;
+        let snapshotter = test_snapshotter();
+
+        let (client, server) = tokio::io::duplex(64);
+        drop(server); // force write failure on request path
+        let conn = ServerConnectionInner::new(BufStream::new(client), usize::MAX, Arc::from("t"));
+
+        let before: Vec<_> = snapshotter.snapshot().into_vec();
+        let request_before = counter_for_label(&before, CLIENT_REQUESTS_TOTAL, "produce_log");
+        let response_before = counter_for_label(&before, CLIENT_RESPONSES_TOTAL, "produce_log");
+        let bytes_received_before =
+            counter_for_label(&before, CLIENT_BYTES_RECEIVED_TOTAL, "produce_log");
+        let result = conn.request(TestProduceRequest).await;
+        assert!(
+            result.is_err(),
+            "request should fail when transport is closed"
+        );
+        let after: Vec<_> = snapshotter.snapshot().into_vec();
+        let request_after = counter_for_label(&after, CLIENT_REQUESTS_TOTAL, "produce_log");
+        let response_after = counter_for_label(&after, CLIENT_RESPONSES_TOTAL, "produce_log");
+        let bytes_received_after =
+            counter_for_label(&after, CLIENT_BYTES_RECEIVED_TOTAL, "produce_log");
+        let inflight_after = gauge_for_label(&after, CLIENT_REQUESTS_IN_FLIGHT, "produce_log");
+
+        assert_eq!(
+            request_after - request_before,
+            1,
+            "failed request should still count as request"
+        );
+        assert_eq!(
+            response_after - response_before,
+            1,
+            "failed request should still count as a completion like Java ConnectionMetrics"
+        );
+        assert_eq!(
+            bytes_received_after - bytes_received_before,
+            0,
+            "failed send should record zero received bytes"
+        );
+        assert_eq!(
+            inflight_after, 0.0,
+            "in-flight gauge must return to zero after failure"
+        );
+    }
+
+    #[tokio::test]
+    async fn request_records_completion_metrics_when_server_returns_api_error() {
+        let _test_guard = test_lock().lock().await;
+        let snapshotter = test_snapshotter();
+
+        let (client, server) = tokio::io::duplex(4096);
+        tokio::spawn(mock_error_server(server));
+
+        let conn = ServerConnectionInner::new(BufStream::new(client), usize::MAX, Arc::from("t"));
+
+        let before: Vec<_> = snapshotter.snapshot().into_vec();
+        let response_before = counter_for_label(&before, CLIENT_RESPONSES_TOTAL, "produce_log");
+        let bytes_received_before =
+            counter_for_label(&before, CLIENT_BYTES_RECEIVED_TOTAL, "produce_log");
+
+        let result = conn.request(TestProduceRequest).await;
+        assert!(
+            matches!(result, Err(Error::FlussAPIError { .. })),
+            "request should fail with FlussAPIError when server returns error_response"
+        );
+
+        let after: Vec<_> = snapshotter.snapshot().into_vec();
+        let response_after = counter_for_label(&after, CLIENT_RESPONSES_TOTAL, "produce_log");
+        let bytes_received_after =
+            counter_for_label(&after, CLIENT_BYTES_RECEIVED_TOTAL, "produce_log");
+        let inflight_after = gauge_for_label(&after, CLIENT_REQUESTS_IN_FLIGHT, "produce_log");
+
+        assert_eq!(
+            response_after - response_before,
+            1,
+            "API error response should count as completion like Java"
+        );
+        assert_eq!(
+            bytes_received_after - bytes_received_before,
+            0,
+            "API error response should record zero body bytes like Java onRequestFailure"
+        );
+        assert_eq!(
+            inflight_after, 0.0,
+            "in-flight gauge must return to zero after API error"
+        );
+    }
+}

From f6517e80097a7060b658a13394a1a3ffde5209b8 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 26 Apr 2026 20:43:04 +0200
Subject: [PATCH 245/287] feat: Basic CI/CD for elixir (#497)

* [elixir] Basic CI/CD for elixir

* plain install approach

* use now allowlisted action
---
 .../.github/workflows/build_and_test_cpp.yml  |   1 +
 .../workflows/build_and_test_elixir.yml       | 103 ++++++++
 .../workflows/build_and_test_python.yml       |   1 +
 .../.github/workflows/build_and_test_rust.yml |   1 +
 .../bindings/elixir/test/support/cluster.ex   | 229 ++++++------------
 5 files changed, 180 insertions(+), 155 deletions(-)
 create mode 100644 fluss-rust/.github/workflows/build_and_test_elixir.yml

diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
index c411076045..9ede0c3e3c 100644
--- a/fluss-rust/.github/workflows/build_and_test_cpp.yml
+++ b/fluss-rust/.github/workflows/build_and_test_cpp.yml
@@ -31,6 +31,7 @@ on:
       - 'website/**'
       - '**/*.md'
       - 'bindings/python/**'
+      - 'bindings/elixir/**'
   workflow_dispatch:
 
 concurrency:
diff --git a/fluss-rust/.github/workflows/build_and_test_elixir.yml b/fluss-rust/.github/workflows/build_and_test_elixir.yml
new file mode 100644
index 0000000000..03f3329e0f
--- /dev/null
+++ b/fluss-rust/.github/workflows/build_and_test_elixir.yml
@@ -0,0 +1,103 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+name: Elixir Build and Tests
+
+on:
+  push:
+    branches:
+      - main
+    paths-ignore:
+      - 'website/**'
+      - '**/*.md'
+  pull_request:
+    branches:
+      - main
+    paths-ignore:
+      - 'website/**'
+      - '**/*.md'
+      - 'bindings/cpp/**'
+      - 'bindings/python/**'
+  workflow_dispatch:
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
+  cancel-in-progress: true
+
+jobs:
+  build-and-test:
+    timeout-minutes: 60
+    runs-on: ubuntu-latest
+    env:
+      OTP_VERSION: "28.0.2"
+      ELIXIR_VERSION: "1.19.5"
+      FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/target/debug/fluss-test-cluster
+      MIX_ENV: test
+    steps:
+      - uses: actions/checkout@v6
+
+      - name: Set up BEAM
+        uses: erlef/setup-beam@fc68ffb90438ef2936bbb3251622353b3dcb2f93 # v1.24.0
+        with:
+          otp-version: ${{ env.OTP_VERSION }}
+          elixir-version: ${{ env.ELIXIR_VERSION }}
+
+      - name: Install protoc
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+
+      - name: Rust Cache
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
+
+      - name: Cache Mix deps and build
+        uses: actions/cache@v4
+        with:
+          path: |
+            bindings/elixir/deps
+            bindings/elixir/_build
+          key: ${{ runner.os }}-mix-otp${{ env.OTP_VERSION }}-elixir${{ env.ELIXIR_VERSION }}-${{ hashFiles('bindings/elixir/mix.lock') }}
+          restore-keys: |
+            ${{ runner.os }}-mix-otp${{ env.OTP_VERSION }}-elixir${{ env.ELIXIR_VERSION }}-
+
+      - name: Build fluss-test-cluster binary
+        run: cargo build -p fluss-test-cluster
+
+      - name: Fetch Elixir deps
+        working-directory: bindings/elixir
+        run: mix deps.get
+
+      - name: Check formatting
+        working-directory: bindings/elixir
+        run: mix format --check-formatted
+
+      - name: Compile (warnings as errors)
+        working-directory: bindings/elixir
+        run: mix compile --warnings-as-errors
+
+      - name: Credo
+        working-directory: bindings/elixir
+        run: mix credo
+
+      - name: Run unit tests
+        working-directory: bindings/elixir
+        run: mix test
+
+      - name: Run integration tests
+        working-directory: bindings/elixir
+        run: mix test --include integration --only integration
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index eb392d1d2d..88c1838ba5 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -31,6 +31,7 @@ on:
       - 'website/**'
       - '**/*.md'
       - 'bindings/cpp/**'
+      - 'bindings/elixir/**'
   workflow_dispatch:
 
 concurrency:
diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
index 4615575dd7..af108699cd 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -32,6 +32,7 @@ on:
       - '**/*.md'
       - 'bindings/python/**'
       - 'bindings/cpp/**'
+      - 'bindings/elixir/**'
   workflow_dispatch:
 
 concurrency:
diff --git a/fluss-rust/bindings/elixir/test/support/cluster.ex b/fluss-rust/bindings/elixir/test/support/cluster.ex
index 59598b4ebd..40f0f68d35 100644
--- a/fluss-rust/bindings/elixir/test/support/cluster.ex
+++ b/fluss-rust/bindings/elixir/test/support/cluster.ex
@@ -18,21 +18,11 @@
 defmodule Fluss.Test.Cluster do
   @moduledoc false
 
-  @fluss_image "apache/fluss"
-  @fluss_version "0.9.0-incubating"
+  # Shells out to the `fluss-test-cluster` CLI (from `crates/fluss-test-cluster`),
+  # the same binary used by the Python and C++ integration tests.
 
-  @network_name "fluss-elixir-test-network"
-  @zookeeper_name "zookeeper-elixir-test"
-  @coordinator_name "coordinator-server-elixir-test"
-  @tablet_server_name "tablet-server-elixir-test"
-
-  # Same fixed ports used by Python/C++ integration tests.
-  @coordinator_sasl_port 9123
-  @coordinator_plain_port 9223
-  @tablet_sasl_port 9124
-  @tablet_plain_port 9224
-
-  def bootstrap_servers, do: "127.0.0.1:#{@coordinator_plain_port}"
+  @cluster_name "shared-test"
+  @cluster_json_prefix "CLUSTER_JSON: "
 
   def ensure_started do
     case System.get_env("FLUSS_BOOTSTRAP_SERVERS") do
@@ -42,170 +32,99 @@ defmodule Fluss.Test.Cluster do
   end
 
   def stop do
-    for name <- [@tablet_server_name, @coordinator_name, @zookeeper_name] do
-      System.cmd("docker", ["rm", "-f", name], stderr_to_stdout: true)
-    end
+    if System.get_env("FLUSS_BOOTSTRAP_SERVERS") do
+      :ok
+    else
+      case find_cli_binary() do
+        {:ok, cli} ->
+          System.cmd(cli, ["stop", "--name", @cluster_name], stderr_to_stdout: true)
+          :ok
 
-    System.cmd("docker", ["network", "rm", @network_name], stderr_to_stdout: true)
-    :ok
+        {:error, _} ->
+          :ok
+      end
+    end
   end
 
   defp start_cluster do
-    if port_open?(@coordinator_plain_port) do
-      IO.puts("Reusing existing Fluss cluster on port #{@coordinator_plain_port}")
-      {:ok, bootstrap_servers()}
+    with {:ok, cli} <- find_cli_binary(),
+         {output, 0} <-
+           System.cmd(cli, ["start", "--sasl", "--name", @cluster_name], stderr_to_stdout: true),
+         {:ok, bootstrap} <- parse_cluster_json(output) do
+      {:ok, bootstrap}
     else
-      do_start_cluster()
+      {output, code} when is_binary(output) ->
+        {:error, "fluss-test-cluster start failed (exit #{code}):\n#{output}"}
+
+      {:error, _} = err ->
+        err
     end
   end
 
-  defp do_start_cluster do
-    IO.puts("Starting Fluss cluster via Docker...")
+  defp find_cli_binary do
+    case System.get_env("FLUSS_TEST_CLUSTER_BIN") do
+      bin when is_binary(bin) and bin != "" ->
+        if File.regular?(bin),
+          do: {:ok, bin},
+          else: {:error, "FLUSS_TEST_CLUSTER_BIN=#{bin} does not exist"}
 
-    # Remove any leftover containers from previous runs
-    for name <- [@tablet_server_name, @coordinator_name, @zookeeper_name] do
-      System.cmd("docker", ["rm", "-f", name], stderr_to_stdout: true)
-    end
-
-    System.cmd("docker", ["network", "create", @network_name], stderr_to_stdout: true)
-
-    sasl_jaas =
-      ~s(org.apache.fluss.security.auth.sasl.plain.PlainLoginModule required user_admin="admin-secret" user_alice="alice-secret";)
-
-    coordinator_props =
-      Enum.join(
-        [
-          "zookeeper.address: #{@zookeeper_name}:2181",
-          "bind.listeners: INTERNAL://#{@coordinator_name}:0, CLIENT://#{@coordinator_name}:9123, PLAIN_CLIENT://#{@coordinator_name}:9223",
-          "advertised.listeners: CLIENT://localhost:#{@coordinator_sasl_port}, PLAIN_CLIENT://localhost:#{@coordinator_plain_port}",
-          "internal.listener.name: INTERNAL",
-          "security.protocol.map: CLIENT:sasl",
-          "security.sasl.enabled.mechanisms: plain",
-          "security.sasl.plain.jaas.config: #{sasl_jaas}",
-          "netty.server.num-network-threads: 1",
-          "netty.server.num-worker-threads: 3"
-        ],
-        "\n"
-      )
-
-    tablet_props =
-      Enum.join(
-        [
-          "zookeeper.address: #{@zookeeper_name}:2181",
-          "bind.listeners: INTERNAL://#{@tablet_server_name}:0, CLIENT://#{@tablet_server_name}:9123, PLAIN_CLIENT://#{@tablet_server_name}:9223",
-          "advertised.listeners: CLIENT://localhost:#{@tablet_sasl_port}, PLAIN_CLIENT://localhost:#{@tablet_plain_port}",
-          "internal.listener.name: INTERNAL",
-          "security.protocol.map: CLIENT:sasl",
-          "security.sasl.enabled.mechanisms: plain",
-          "security.sasl.plain.jaas.config: #{sasl_jaas}",
-          "tablet-server.id: 0",
-          "netty.server.num-network-threads: 1",
-          "netty.server.num-worker-threads: 3"
-        ],
-        "\n"
-      )
-
-    docker_run([
-      "--name",
-      @zookeeper_name,
-      "--network",
-      @network_name,
-      "-d",
-      "zookeeper:3.9.2"
-    ])
-
-    docker_run([
-      "--name",
-      @coordinator_name,
-      "--network",
-      @network_name,
-      "-p",
-      "#{@coordinator_sasl_port}:9123",
-      "-p",
-      "#{@coordinator_plain_port}:9223",
-      "-e",
-      "FLUSS_PROPERTIES=#{coordinator_props}",
-      "-d",
-      "#{@fluss_image}:#{@fluss_version}",
-      "coordinatorServer"
-    ])
-
-    docker_run([
-      "--name",
-      @tablet_server_name,
-      "--network",
-      @network_name,
-      "-p",
-      "#{@tablet_sasl_port}:9123",
-      "-p",
-      "#{@tablet_plain_port}:9223",
-      "-e",
-      "FLUSS_PROPERTIES=#{tablet_props}",
-      "-d",
-      "#{@fluss_image}:#{@fluss_version}",
-      "tabletServer"
-    ])
-
-    all_ports = [@coordinator_plain_port, @tablet_plain_port]
-
-    if wait_for_ports(all_ports, 90) do
-      IO.puts("Fluss cluster started successfully.")
-      {:ok, bootstrap_servers()}
-    else
-      {:error, "Cluster ports did not become ready within timeout"}
+      _ ->
+        locate_via_cargo()
     end
   end
 
-  defp docker_run(args) do
-    {output, code} = System.cmd("docker", ["run" | args], stderr_to_stdout: true)
+  defp locate_via_cargo do
+    case System.cmd("cargo", ["locate-project", "--workspace", "--message-format", "plain"],
+           stderr_to_stdout: true
+         ) do
+      {output, 0} ->
+        output |> String.trim() |> Path.dirname() |> find_binary_in_target()
 
-    if code != 0 do
-      IO.puts("Docker run warning (code #{code}): #{output}")
+      {output, code} ->
+        {:error, "cargo locate-project failed (exit #{code}): #{output}"}
     end
   end
 
-  defp wait_for_ports(ports, timeout_s) do
-    deadline = System.monotonic_time(:second) + timeout_s
+  defp find_binary_in_target(root) do
+    Enum.find_value(
+      ["debug", "release"],
+      {:error, "fluss-test-cluster binary not found. Run: cargo build -p fluss-test-cluster"},
+      &check_binary(root, &1)
+    )
+  end
 
-    Enum.all?(ports, fn port ->
-      remaining = deadline - System.monotonic_time(:second)
-      remaining > 0 and wait_for_port(port, remaining)
-    end)
+  defp check_binary(root, profile) do
+    path = Path.join([root, "target", profile, "fluss-test-cluster"])
+    if File.regular?(path), do: {:ok, path}, else: nil
   end
 
-  defp wait_for_port(port, timeout_s) do
-    deadline = System.monotonic_time(:second) + timeout_s
+  defp parse_cluster_json(output) do
+    output
+    |> String.split("\n", trim: true)
+    |> Enum.find_value(
+      {:error, "No #{@cluster_json_prefix} token in output:\n#{output}"},
+      &extract_bootstrap/1
+    )
+  end
 
-    Stream.repeatedly(fn ->
-      case :gen_tcp.connect(~c"localhost", port, [], 1000) do
-        {:ok, socket} ->
-          :gen_tcp.close(socket)
-          :ok
+  defp extract_bootstrap(line) do
+    case String.split(line, @cluster_json_prefix, parts: 2) do
+      [_, json] ->
+        case decode_bootstrap(json) do
+          {:ok, bootstrap} -> {:ok, bootstrap}
+          _ -> nil
+        end
 
-        {:error, _} ->
-          Process.sleep(1000)
-          :retry
-      end
-    end)
-    |> Enum.reduce_while(false, fn
-      :ok, _acc ->
-        {:halt, true}
-
-      :retry, _acc ->
-        if System.monotonic_time(:second) >= deadline,
-          do: {:halt, false},
-          else: {:cont, false}
-    end)
+      _ ->
+        nil
+    end
   end
 
-  defp port_open?(port) do
-    case :gen_tcp.connect(~c"localhost", port, [], 1000) do
-      {:ok, socket} ->
-        :gen_tcp.close(socket)
-        true
-
-      {:error, _} ->
-        false
+  # Minimal JSON extractor for `bootstrap_servers`: avoids adding a JSON dep just for tests.
+  defp decode_bootstrap(json) do
+    case Regex.run(~r/"bootstrap_servers"\s*:\s*"([^"]+)"/, json) do
+      [_, servers] -> {:ok, servers}
+      _ -> {:error, "no bootstrap_servers in: #{json}"}
     end
   end
 end

From cb5908de0b978a1af60dc53abf2b8ee34ce08c6e Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Wed, 29 Apr 2026 20:14:58 +0100
Subject: [PATCH 246/287] feat: [elixir] fine-grained errors (#507)

---
 fluss-rust/bindings/elixir/lib/fluss/admin.ex |  20 +-
 .../elixir/lib/fluss/append_writer.ex         |   8 +-
 .../bindings/elixir/lib/fluss/connection.ex   |   4 +-
 fluss-rust/bindings/elixir/lib/fluss/error.ex | 127 ++++++++++++
 .../bindings/elixir/lib/fluss/log_scanner.ex  |  21 +-
 fluss-rust/bindings/elixir/lib/fluss/table.ex |   5 +-
 .../elixir/lib/fluss/table_descriptor.ex      |   2 +-
 .../bindings/elixir/lib/fluss/write_handle.ex |   4 +-
 .../native/fluss_nif/src/append_writer.rs     |   4 +-
 .../elixir/native/fluss_nif/src/async_nif.rs  |  35 ++--
 .../elixir/native/fluss_nif/src/atoms.rs      | 182 +++++++++++++++++-
 .../native/fluss_nif/src/log_scanner.rs       |   8 +-
 .../native/fluss_nif/src/write_handle.rs      |   2 +-
 .../bindings/elixir/test/error_test.exs       |  87 +++++++++
 14 files changed, 451 insertions(+), 58 deletions(-)
 create mode 100644 fluss-rust/bindings/elixir/lib/fluss/error.ex
 create mode 100644 fluss-rust/bindings/elixir/test/error_test.exs

diff --git a/fluss-rust/bindings/elixir/lib/fluss/admin.ex b/fluss-rust/bindings/elixir/lib/fluss/admin.ex
index a40f2d65f3..6dbdb3a9c1 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/admin.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/admin.ex
@@ -34,7 +34,7 @@ defmodule Fluss.Admin do
 
   @type t :: reference()
 
-  @spec new(Fluss.Connection.t()) :: {:ok, t()} | {:error, String.t()}
+  @spec new(Fluss.Connection.t()) :: {:ok, t()} | {:error, Fluss.Error.t()}
   def new(conn) do
     case Native.admin_new(conn) do
       {:error, _} = err -> err
@@ -46,25 +46,25 @@ defmodule Fluss.Admin do
   def new!(conn) do
     case new(conn) do
       {:ok, admin} -> admin
-      {:error, reason} -> raise "failed to create admin: #{reason}"
+      {:error, %Fluss.Error{} = err} -> raise err
     end
   end
 
-  @spec create_database(t(), String.t(), boolean()) :: :ok | {:error, String.t()}
+  @spec create_database(t(), String.t(), boolean()) :: :ok | {:error, Fluss.Error.t()}
   def create_database(admin, name, ignore_if_exists \\ true) do
     admin
     |> Native.admin_create_database(name, ignore_if_exists)
     |> Native.await_nif()
   end
 
-  @spec drop_database(t(), String.t(), boolean()) :: :ok | {:error, String.t()}
+  @spec drop_database(t(), String.t(), boolean()) :: :ok | {:error, Fluss.Error.t()}
   def drop_database(admin, name, ignore_if_not_exists \\ true) do
     admin
     |> Native.admin_drop_database(name, ignore_if_not_exists)
     |> Native.await_nif()
   end
 
-  @spec list_databases(t()) :: {:ok, [String.t()]} | {:error, String.t()}
+  @spec list_databases(t()) :: {:ok, [String.t()]} | {:error, Fluss.Error.t()}
   def list_databases(admin) do
     admin
     |> Native.admin_list_databases()
@@ -75,26 +75,26 @@ defmodule Fluss.Admin do
   def list_databases!(admin) do
     case list_databases(admin) do
       {:ok, dbs} -> dbs
-      {:error, reason} -> raise "failed to list databases: #{reason}"
+      {:error, %Fluss.Error{} = err} -> raise err
     end
   end
 
   @spec create_table(t(), String.t(), String.t(), Fluss.TableDescriptor.t(), boolean()) ::
-          :ok | {:error, String.t()}
+          :ok | {:error, Fluss.Error.t()}
   def create_table(admin, database, table, descriptor, ignore_if_exists \\ true) do
     admin
     |> Native.admin_create_table(database, table, descriptor, ignore_if_exists)
     |> Native.await_nif()
   end
 
-  @spec drop_table(t(), String.t(), String.t(), boolean()) :: :ok | {:error, String.t()}
+  @spec drop_table(t(), String.t(), String.t(), boolean()) :: :ok | {:error, Fluss.Error.t()}
   def drop_table(admin, database, table, ignore_if_not_exists \\ true) do
     admin
     |> Native.admin_drop_table(database, table, ignore_if_not_exists)
     |> Native.await_nif()
   end
 
-  @spec list_tables(t(), String.t()) :: {:ok, [String.t()]} | {:error, String.t()}
+  @spec list_tables(t(), String.t()) :: {:ok, [String.t()]} | {:error, Fluss.Error.t()}
   def list_tables(admin, database) do
     admin
     |> Native.admin_list_tables(database)
@@ -105,7 +105,7 @@ defmodule Fluss.Admin do
   def list_tables!(admin, database) do
     case list_tables(admin, database) do
       {:ok, tables} -> tables
-      {:error, reason} -> raise "failed to list tables: #{reason}"
+      {:error, %Fluss.Error{} = err} -> raise err
     end
   end
 end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/append_writer.ex b/fluss-rust/bindings/elixir/lib/fluss/append_writer.ex
index 767802ac02..5dddbf7b1d 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/append_writer.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/append_writer.ex
@@ -42,7 +42,7 @@ defmodule Fluss.AppendWriter do
 
   @type t :: reference()
 
-  @spec new(Fluss.Table.t()) :: {:ok, t()} | {:error, String.t()}
+  @spec new(Fluss.Table.t()) :: {:ok, t()} | {:error, Fluss.Error.t()}
   def new(table) do
     case Native.append_writer_new(table) do
       {:error, _} = err -> err
@@ -54,11 +54,11 @@ defmodule Fluss.AppendWriter do
   def new!(table) do
     case new(table) do
       {:ok, w} -> w
-      {:error, reason} -> raise "failed to create append writer: #{reason}"
+      {:error, %Fluss.Error{} = err} -> raise err
     end
   end
 
-  @spec append(t(), list()) :: {:ok, Fluss.WriteHandle.t()} | {:error, String.t()}
+  @spec append(t(), list()) :: {:ok, Fluss.WriteHandle.t()} | {:error, Fluss.Error.t()}
   def append(writer, values) when is_list(values) do
     case Native.append_writer_append(writer, values) do
       {:error, _} = err -> err
@@ -66,7 +66,7 @@ defmodule Fluss.AppendWriter do
     end
   end
 
-  @spec flush(t()) :: :ok | {:error, String.t()}
+  @spec flush(t()) :: :ok | {:error, Fluss.Error.t()}
   def flush(writer) do
     writer
     |> Native.append_writer_flush()
diff --git a/fluss-rust/bindings/elixir/lib/fluss/connection.ex b/fluss-rust/bindings/elixir/lib/fluss/connection.ex
index 0fd664682e..a56c72a664 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/connection.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/connection.ex
@@ -34,7 +34,7 @@ defmodule Fluss.Connection do
 
   @type t :: reference()
 
-  @spec new(Fluss.Config.t()) :: {:ok, t()} | {:error, String.t()}
+  @spec new(Fluss.Config.t()) :: {:ok, t()} | {:error, Fluss.Error.t()}
   def new(%Fluss.Config{} = config) do
     config
     |> Native.connection_new()
@@ -45,7 +45,7 @@ defmodule Fluss.Connection do
   def new!(%Fluss.Config{} = config) do
     case new(config) do
       {:ok, conn} -> conn
-      {:error, reason} -> raise "failed to connect to Fluss: #{reason}"
+      {:error, %Fluss.Error{} = err} -> raise err
     end
   end
 end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/error.ex b/fluss-rust/bindings/elixir/lib/fluss/error.ex
new file mode 100644
index 0000000000..fe5d1ca8b4
--- /dev/null
+++ b/fluss-rust/bindings/elixir/lib/fluss/error.ex
@@ -0,0 +1,127 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.Error do
+  @moduledoc """
+  Structured error returned from Fluss operations.
+
+  Fields:
+
+    * `:code` — stable atom for pattern matching.
+    * `:error_code` — raw integer code. Protocol codes `0..57`, `-1` for
+      `:unknown_server_error`, `-2` for `:client_error`.
+    * `:message` — human-readable description.
+
+  Also an exception, so `raise err` works.
+
+  `:client_error` covers any failure that didn't come from the server API
+  (bad input, transport, I/O, decode, consumed write handle, etc.) and is
+  not retriable, matching the Python and C++ bindings.
+  """
+
+  defexception [:code, :error_code, :message]
+
+  @typedoc "Error code atom."
+  @type code ::
+          :none
+          | :unknown_server_error
+          | :network_exception
+          | :unsupported_version
+          | :corrupt_message
+          | :database_not_exist
+          | :database_not_empty
+          | :database_already_exist
+          | :table_not_exist
+          | :table_already_exist
+          | :schema_not_exist
+          | :log_storage_exception
+          | :kv_storage_exception
+          | :not_leader_or_follower
+          | :record_too_large_exception
+          | :corrupt_record_exception
+          | :invalid_table_exception
+          | :invalid_database_exception
+          | :invalid_replication_factor
+          | :invalid_required_acks
+          | :log_offset_out_of_range_exception
+          | :non_primary_key_table_exception
+          | :unknown_table_or_bucket_exception
+          | :invalid_update_version_exception
+          | :invalid_coordinator_exception
+          | :fenced_leader_epoch_exception
+          | :request_time_out
+          | :storage_exception
+          | :operation_not_attempted_exception
+          | :not_enough_replicas_after_append_exception
+          | :not_enough_replicas_exception
+          | :security_token_exception
+          | :out_of_order_sequence_exception
+          | :duplicate_sequence_exception
+          | :unknown_writer_id_exception
+          | :invalid_column_projection
+          | :invalid_target_column
+          | :partition_not_exists
+          | :table_not_partitioned_exception
+          | :invalid_timestamp_exception
+          | :invalid_config_exception
+          | :lake_storage_not_configured_exception
+          | :kv_snapshot_not_exist
+          | :partition_already_exists
+          | :partition_spec_invalid_exception
+          | :leader_not_available_exception
+          | :partition_max_num_exception
+          | :authenticate_exception
+          | :security_disabled_exception
+          | :authorization_exception
+          | :bucket_max_num_exception
+          | :fenced_tiering_epoch_exception
+          | :retriable_authenticate_exception
+          | :invalid_server_rack_info_exception
+          | :lake_snapshot_not_exist
+          | :lake_table_already_exist
+          | :ineligible_replica_exception
+          | :invalid_alter_table_exception
+          | :deletion_disabled_exception
+          | :client_error
+
+  @type t :: %__MODULE__{code: code(), error_code: integer(), message: String.t()}
+
+  @retriable_codes [
+    :network_exception,
+    :corrupt_message,
+    :schema_not_exist,
+    :log_storage_exception,
+    :kv_storage_exception,
+    :not_leader_or_follower,
+    :corrupt_record_exception,
+    :unknown_table_or_bucket_exception,
+    :request_time_out,
+    :storage_exception,
+    :not_enough_replicas_after_append_exception,
+    :not_enough_replicas_exception,
+    :leader_not_available_exception
+  ]
+
+  @impl true
+  def message(%__MODULE__{code: code, message: msg}) do
+    "Fluss error [#{code}]: #{msg}"
+  end
+
+  @doc "Returns `true` if retrying the operation may succeed."
+  @spec retriable?(t()) :: boolean()
+  def retriable?(%__MODULE__{code: code}), do: code in @retriable_codes
+end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/log_scanner.ex b/fluss-rust/bindings/elixir/lib/fluss/log_scanner.ex
index a47ea92e6e..fca4168c3e 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/log_scanner.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/log_scanner.ex
@@ -20,8 +20,8 @@ defmodule Fluss.LogScanner do
   Scanner for reading records from a log table.
 
   `poll/2` is non-blocking — it returns `:ok` immediately and sends results
-  as `{:fluss_records, records}` or `{:fluss_poll_error, reason}` to the
-  calling process. No dirty scheduler threads are held during the wait.
+  as `{:fluss_records, records}` or `{:fluss_poll_error, %Fluss.Error{}}` to
+  the calling process. No dirty scheduler threads are held during the wait.
 
   Each record is an atom-keyed map: `:offset`, `:timestamp`, `:change_type`, `:row`.
   Row values are also atom-keyed (column names interned as atoms).
@@ -35,8 +35,8 @@ defmodule Fluss.LogScanner do
       receive do
         {:fluss_records, records} ->
           for record <- records, do: IO.inspect(record[:row])
-        {:fluss_poll_error, reason} ->
-          IO.puts("poll error: \#{reason}")
+        {:fluss_poll_error, %Fluss.Error{code: code, message: msg}} ->
+          IO.puts("poll error [\#{code}]: \#{msg}")
       end
 
   """
@@ -46,7 +46,7 @@ defmodule Fluss.LogScanner do
   @type t :: reference()
   @type record :: %{atom() => term()}
 
-  @spec new(Fluss.Table.t()) :: {:ok, t()} | {:error, String.t()}
+  @spec new(Fluss.Table.t()) :: {:ok, t()} | {:error, Fluss.Error.t()}
   def new(table) do
     case Native.log_scanner_new(table) do
       {:error, _} = err -> err
@@ -58,11 +58,11 @@ defmodule Fluss.LogScanner do
   def new!(table) do
     case new(table) do
       {:ok, s} -> s
-      {:error, reason} -> raise "failed to create log scanner: #{reason}"
+      {:error, %Fluss.Error{} = err} -> raise err
     end
   end
 
-  @spec subscribe(t(), integer(), integer()) :: :ok | {:error, String.t()}
+  @spec subscribe(t(), integer(), integer()) :: :ok | {:error, Fluss.Error.t()}
   def subscribe(scanner, bucket, offset) do
     scanner
     |> Native.log_scanner_subscribe(bucket, offset)
@@ -72,14 +72,14 @@ defmodule Fluss.LogScanner do
   @doc """
   Subscribes to multiple buckets. Takes a list of `{bucket_id, offset}` tuples.
   """
-  @spec subscribe_buckets(t(), [{integer(), integer()}]) :: :ok | {:error, String.t()}
+  @spec subscribe_buckets(t(), [{integer(), integer()}]) :: :ok | {:error, Fluss.Error.t()}
   def subscribe_buckets(scanner, bucket_offsets) when is_list(bucket_offsets) do
     scanner
     |> Native.log_scanner_subscribe_buckets(bucket_offsets)
     |> Native.await_nif()
   end
 
-  @spec unsubscribe(t(), integer()) :: :ok | {:error, String.t()}
+  @spec unsubscribe(t(), integer()) :: :ok | {:error, Fluss.Error.t()}
   def unsubscribe(scanner, bucket) do
     scanner
     |> Native.log_scanner_unsubscribe(bucket)
@@ -88,7 +88,8 @@ defmodule Fluss.LogScanner do
 
   @doc """
   Starts a non-blocking poll. Returns `:ok` immediately.
-  Results arrive as `{:fluss_records, [record]}` or `{:fluss_poll_error, reason}`.
+  Results arrive as `{:fluss_records, [record]}` or
+  `{:fluss_poll_error, %Fluss.Error{}}`.
   """
   @spec poll(t(), non_neg_integer()) :: :ok
   def poll(scanner, timeout_ms),
diff --git a/fluss-rust/bindings/elixir/lib/fluss/table.ex b/fluss-rust/bindings/elixir/lib/fluss/table.ex
index 59f864af94..c934fc0c01 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/table.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/table.ex
@@ -24,7 +24,8 @@ defmodule Fluss.Table do
 
   @type t :: reference()
 
-  @spec get(Fluss.Connection.t(), String.t(), String.t()) :: {:ok, t()} | {:error, String.t()}
+  @spec get(Fluss.Connection.t(), String.t(), String.t()) ::
+          {:ok, t()} | {:error, Fluss.Error.t()}
   def get(conn, database, table) do
     conn
     |> Native.table_get(database, table)
@@ -35,7 +36,7 @@ defmodule Fluss.Table do
   def get!(conn, database, table) do
     case get(conn, database, table) do
       {:ok, t} -> t
-      {:error, reason} -> raise "failed to get table: #{reason}"
+      {:error, %Fluss.Error{} = err} -> raise err
     end
   end
 
diff --git a/fluss-rust/bindings/elixir/lib/fluss/table_descriptor.ex b/fluss-rust/bindings/elixir/lib/fluss/table_descriptor.ex
index 96c3e1dfb3..b95b5a503b 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/table_descriptor.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/table_descriptor.ex
@@ -38,7 +38,7 @@ defmodule Fluss.TableDescriptor do
     properties = Keyword.get(opts, :properties, [])
 
     case Native.table_descriptor_new(schema, bucket_count, properties) do
-      {:error, reason} -> raise "failed to create table descriptor: #{reason}"
+      {:error, %Fluss.Error{} = err} -> raise err
       ref -> ref
     end
   end
diff --git a/fluss-rust/bindings/elixir/lib/fluss/write_handle.ex b/fluss-rust/bindings/elixir/lib/fluss/write_handle.ex
index f0ec295be0..f5f16591f4 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/write_handle.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/write_handle.ex
@@ -27,7 +27,7 @@ defmodule Fluss.WriteHandle do
 
   @type t :: reference()
 
-  @spec wait(t()) :: :ok | {:error, String.t()}
+  @spec wait(t()) :: :ok | {:error, Fluss.Error.t()}
   def wait(handle) do
     handle
     |> Native.write_handle_wait()
@@ -38,7 +38,7 @@ defmodule Fluss.WriteHandle do
   def wait!(handle) do
     case wait(handle) do
       :ok -> :ok
-      {:error, reason} -> raise "write failed: #{reason}"
+      {:error, %Fluss.Error{} = err} -> raise err
     end
   end
 end
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/append_writer.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/append_writer.rs
index d78f564e0c..f26884419e 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/append_writer.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/append_writer.rs
@@ -17,7 +17,7 @@
 
 use crate::RUNTIME;
 use crate::async_nif;
-use crate::atoms::to_nif_err;
+use crate::atoms::{client_err, to_nif_err};
 use crate::row_convert;
 use crate::table::TableResource;
 use crate::write_handle::WriteHandleResource;
@@ -58,7 +58,7 @@ fn append_writer_append<'a>(
     writer: ResourceArc<AppendWriterResource>,
     values: Term<'a>,
 ) -> Result<ResourceArc<WriteHandleResource>, rustler::Error> {
-    let row = row_convert::term_to_row(env, values, &writer.columns).map_err(to_nif_err)?;
+    let row = row_convert::term_to_row(env, values, &writer.columns).map_err(client_err)?;
     let future = writer.inner.append(&row).map_err(to_nif_err)?;
     Ok(ResourceArc::new(WriteHandleResource::new(future)))
 }
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/async_nif.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/async_nif.rs
index fd6e495be3..6b26eaaf8a 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/async_nif.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/async_nif.rs
@@ -15,20 +15,23 @@
 // specific language governing permissions and limitations
 // under the License.
 
-//! Async NIF helpers — spawn on tokio, send `{ref, result}` back
-//! as a BEAM message instead of blocking dirty schedulers.
+//! Async NIF helpers — spawn on tokio, send `{ref, result}` back as a BEAM
+//! message instead of blocking dirty schedulers.
 
 use crate::RUNTIME;
-use crate::atoms;
+use crate::atoms::{self, NifFlussError};
+use fluss::error::Error as CoreError;
 use rustler::env::OwnedEnv;
 use rustler::{Encoder, Env, Term};
 use std::future::Future;
 
-/// Sends `{ref, :ok}` or `{ref, {:error, reason}}` on completion.
-pub fn spawn_task<'a, F, E>(env: Env<'a>, future: F) -> Term<'a>
+fn encode_err<'a>(env: Env<'a>, err: CoreError) -> Term<'a> {
+    (atoms::error(), NifFlussError::from_core(&err)).encode(env)
+}
+
+pub fn spawn_task<'a, F>(env: Env<'a>, future: F) -> Term<'a>
 where
-    F: Future<Output = Result<(), E>> + Send + 'static,
-    E: std::fmt::Display + Send + 'static,
+    F: Future<Output = Result<(), CoreError>> + Send + 'static,
 {
     let pid = env.pid();
     let ref_term: Term<'a> = *env.make_ref();
@@ -41,7 +44,7 @@ where
             let r = saved_ref.load(env);
             match result {
                 Ok(()) => (r, atoms::ok()).encode(env),
-                Err(e) => (r, (atoms::error(), e.to_string())).encode(env),
+                Err(e) => (r, encode_err(env, e)).encode(env),
             }
         });
     });
@@ -49,12 +52,10 @@ where
     ref_term
 }
 
-/// Sends `{ref, {:ok, value}}` or `{ref, {:error, reason}}` on completion.
-pub fn spawn_task_with_result<'a, F, T, E>(env: Env<'a>, future: F) -> Term<'a>
+pub fn spawn_task_with_result<'a, F, T>(env: Env<'a>, future: F) -> Term<'a>
 where
-    F: Future<Output = Result<T, E>> + Send + 'static,
+    F: Future<Output = Result<T, CoreError>> + Send + 'static,
     T: Encoder + Send + 'static,
-    E: std::fmt::Display + Send + 'static,
 {
     let pid = env.pid();
     let ref_term: Term<'a> = *env.make_ref();
@@ -67,7 +68,7 @@ where
             let r = saved_ref.load(env);
             match result {
                 Ok(val) => (r, (atoms::ok(), val)).encode(env),
-                Err(e) => (r, (atoms::error(), e.to_string())).encode(env),
+                Err(e) => (r, encode_err(env, e)).encode(env),
             }
         });
     });
@@ -75,17 +76,17 @@ where
     ref_term
 }
 
-/// Sends `{ref, {:error, reason}}` immediately (no async work).
-pub fn send_error<'a>(env: Env<'a>, msg: &str) -> Term<'a> {
+pub fn send_client_error<'a>(env: Env<'a>, msg: &str) -> Term<'a> {
     let pid = env.pid();
     let ref_term: Term<'a> = *env.make_ref();
     let mut task_env = OwnedEnv::new();
     let saved_ref = task_env.save(ref_term);
-    let msg = msg.to_string();
+    let message = msg.to_string();
 
     let _ = task_env.send_and_clear(&pid, |env| {
         let r = saved_ref.load(env);
-        (r, (atoms::error(), msg)).encode(env)
+        let err = NifFlussError::client(message);
+        (r, (atoms::error(), err)).encode(env)
     });
 
     ref_term
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs
index 20beec7184..0a8e95b8b4 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs
@@ -15,6 +15,9 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use fluss::error::{Error as CoreError, FlussError};
+use rustler::{Atom, NifStruct};
+
 rustler::atoms! {
     ok,
     error,
@@ -36,10 +39,181 @@ rustler::atoms! {
     timestamp,
     change_type,
     row,
+
+    // Error code atoms: one per fluss::error::FlussError variant, plus the binding-only `client_error`.
+    none,
+    unknown_server_error,
+    network_exception,
+    unsupported_version,
+    corrupt_message,
+    database_not_exist,
+    database_not_empty,
+    database_already_exist,
+    table_not_exist,
+    table_already_exist,
+    schema_not_exist,
+    log_storage_exception,
+    kv_storage_exception,
+    not_leader_or_follower,
+    record_too_large_exception,
+    corrupt_record_exception,
+    invalid_table_exception,
+    invalid_database_exception,
+    invalid_replication_factor,
+    invalid_required_acks,
+    log_offset_out_of_range_exception,
+    non_primary_key_table_exception,
+    unknown_table_or_bucket_exception,
+    invalid_update_version_exception,
+    invalid_coordinator_exception,
+    fenced_leader_epoch_exception,
+    request_time_out,
+    storage_exception,
+    operation_not_attempted_exception,
+    not_enough_replicas_after_append_exception,
+    not_enough_replicas_exception,
+    security_token_exception,
+    out_of_order_sequence_exception,
+    duplicate_sequence_exception,
+    unknown_writer_id_exception,
+    invalid_column_projection,
+    invalid_target_column,
+    partition_not_exists,
+    table_not_partitioned_exception,
+    invalid_timestamp_exception,
+    invalid_config_exception,
+    lake_storage_not_configured_exception,
+    kv_snapshot_not_exist,
+    partition_already_exists,
+    partition_spec_invalid_exception,
+    leader_not_available_exception,
+    partition_max_num_exception,
+    authenticate_exception,
+    security_disabled_exception,
+    authorization_exception,
+    bucket_max_num_exception,
+    fenced_tiering_epoch_exception,
+    retriable_authenticate_exception,
+    invalid_server_rack_info_exception,
+    lake_snapshot_not_exist,
+    lake_table_already_exist,
+    ineligible_replica_exception,
+    invalid_alter_table_exception,
+    deletion_disabled_exception,
+    client_error,
+}
+
+pub const CLIENT_ERROR_CODE: i32 = -2;
+
+// Rust mirror of the `Fluss.Error` Elixir exception struct. `__exception__` is the
+// marker `defexception` sets; Rustler bypasses the Elixir constructor, so we must
+// serialize it explicitly or `raise err` rejects the struct on the Elixir side.
+#[derive(NifStruct)]
+#[module = "Fluss.Error"]
+pub struct NifFlussError {
+    pub code: Atom,
+    pub error_code: i32,
+    pub message: String,
+    #[allow(non_snake_case)]
+    pub __exception__: bool,
+}
+
+impl NifFlussError {
+    pub fn from_core(error: &CoreError) -> Self {
+        let (code, error_code) = match error {
+            CoreError::FlussAPIError { api_error } => {
+                (api_error_atom(api_error.code), api_error.code)
+            }
+            _ => (client_error(), CLIENT_ERROR_CODE),
+        };
+        Self {
+            code,
+            error_code,
+            message: error.to_string(),
+            __exception__: true,
+        }
+    }
+
+    pub fn client(message: String) -> Self {
+        Self {
+            code: client_error(),
+            error_code: CLIENT_ERROR_CODE,
+            message,
+            __exception__: true,
+        }
+    }
+}
+
+fn api_error_atom(code: i32) -> Atom {
+    match FlussError::for_code(code) {
+        FlussError::UnknownServerError => unknown_server_error(),
+        FlussError::None => none(),
+        FlussError::NetworkException => network_exception(),
+        FlussError::UnsupportedVersion => unsupported_version(),
+        FlussError::CorruptMessage => corrupt_message(),
+        FlussError::DatabaseNotExist => database_not_exist(),
+        FlussError::DatabaseNotEmpty => database_not_empty(),
+        FlussError::DatabaseAlreadyExist => database_already_exist(),
+        FlussError::TableNotExist => table_not_exist(),
+        FlussError::TableAlreadyExist => table_already_exist(),
+        FlussError::SchemaNotExist => schema_not_exist(),
+        FlussError::LogStorageException => log_storage_exception(),
+        FlussError::KvStorageException => kv_storage_exception(),
+        FlussError::NotLeaderOrFollower => not_leader_or_follower(),
+        FlussError::RecordTooLargeException => record_too_large_exception(),
+        FlussError::CorruptRecordException => corrupt_record_exception(),
+        FlussError::InvalidTableException => invalid_table_exception(),
+        FlussError::InvalidDatabaseException => invalid_database_exception(),
+        FlussError::InvalidReplicationFactor => invalid_replication_factor(),
+        FlussError::InvalidRequiredAcks => invalid_required_acks(),
+        FlussError::LogOffsetOutOfRangeException => log_offset_out_of_range_exception(),
+        FlussError::NonPrimaryKeyTableException => non_primary_key_table_exception(),
+        FlussError::UnknownTableOrBucketException => unknown_table_or_bucket_exception(),
+        FlussError::InvalidUpdateVersionException => invalid_update_version_exception(),
+        FlussError::InvalidCoordinatorException => invalid_coordinator_exception(),
+        FlussError::FencedLeaderEpochException => fenced_leader_epoch_exception(),
+        FlussError::RequestTimeOut => request_time_out(),
+        FlussError::StorageException => storage_exception(),
+        FlussError::OperationNotAttemptedException => operation_not_attempted_exception(),
+        FlussError::NotEnoughReplicasAfterAppendException => {
+            not_enough_replicas_after_append_exception()
+        }
+        FlussError::NotEnoughReplicasException => not_enough_replicas_exception(),
+        FlussError::SecurityTokenException => security_token_exception(),
+        FlussError::OutOfOrderSequenceException => out_of_order_sequence_exception(),
+        FlussError::DuplicateSequenceException => duplicate_sequence_exception(),
+        FlussError::UnknownWriterIdException => unknown_writer_id_exception(),
+        FlussError::InvalidColumnProjection => invalid_column_projection(),
+        FlussError::InvalidTargetColumn => invalid_target_column(),
+        FlussError::PartitionNotExists => partition_not_exists(),
+        FlussError::TableNotPartitionedException => table_not_partitioned_exception(),
+        FlussError::InvalidTimestampException => invalid_timestamp_exception(),
+        FlussError::InvalidConfigException => invalid_config_exception(),
+        FlussError::LakeStorageNotConfiguredException => lake_storage_not_configured_exception(),
+        FlussError::KvSnapshotNotExist => kv_snapshot_not_exist(),
+        FlussError::PartitionAlreadyExists => partition_already_exists(),
+        FlussError::PartitionSpecInvalidException => partition_spec_invalid_exception(),
+        FlussError::LeaderNotAvailableException => leader_not_available_exception(),
+        FlussError::PartitionMaxNumException => partition_max_num_exception(),
+        FlussError::AuthenticateException => authenticate_exception(),
+        FlussError::SecurityDisabledException => security_disabled_exception(),
+        FlussError::AuthorizationException => authorization_exception(),
+        FlussError::BucketMaxNumException => bucket_max_num_exception(),
+        FlussError::FencedTieringEpochException => fenced_tiering_epoch_exception(),
+        FlussError::RetriableAuthenticateException => retriable_authenticate_exception(),
+        FlussError::InvalidServerRackInfoException => invalid_server_rack_info_exception(),
+        FlussError::LakeSnapshotNotExist => lake_snapshot_not_exist(),
+        FlussError::LakeTableAlreadyExist => lake_table_already_exist(),
+        FlussError::IneligibleReplicaException => ineligible_replica_exception(),
+        FlussError::InvalidAlterTableException => invalid_alter_table_exception(),
+        FlussError::DeletionDisabledException => deletion_disabled_exception(),
+    }
+}
+
+pub fn to_nif_err(e: CoreError) -> rustler::Error {
+    rustler::Error::Term(Box::new(NifFlussError::from_core(&e)))
 }
 
-/// Convert any `Display` error into `rustler::Error::Term`, which the NIF
-/// framework encodes as `{:error, reason_string}`.
-pub fn to_nif_err(e: impl std::fmt::Display) -> rustler::Error {
-    rustler::Error::Term(Box::new(e.to_string()))
+pub fn client_err(msg: impl Into<String>) -> rustler::Error {
+    rustler::Error::Term(Box::new(NifFlussError::client(msg.into())))
 }
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/log_scanner.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/log_scanner.rs
index 93f1d04ed5..62614e0e67 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/log_scanner.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/log_scanner.rs
@@ -17,7 +17,7 @@
 
 use crate::RUNTIME;
 use crate::async_nif;
-use crate::atoms::{self, to_nif_err};
+use crate::atoms::{self, NifFlussError, to_nif_err};
 use crate::row_convert;
 use crate::table::TableResource;
 use fluss::client::{EARLIEST_OFFSET, LogScanner};
@@ -108,13 +108,15 @@ fn send_poll_result(pid: &LocalPid, result: Result<ScanRecords, Error>, columns:
             let _ = msg_env.send_and_clear(pid, |env| {
                 match encode_scan_records(env, scan_records, columns) {
                     Ok(records) => (atoms::fluss_records(), records).encode(env),
-                    Err(e) => (atoms::fluss_poll_error(), e).encode(env),
+                    Err(message) => {
+                        (atoms::fluss_poll_error(), NifFlussError::client(message)).encode(env)
+                    }
                 }
             });
         }
         Err(e) => {
             let _ = msg_env.send_and_clear(pid, |env| {
-                (atoms::fluss_poll_error(), e.to_string()).encode(env)
+                (atoms::fluss_poll_error(), NifFlussError::from_core(&e)).encode(env)
             });
         }
     }
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/write_handle.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/write_handle.rs
index e3b325d0bf..08046660bf 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/write_handle.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/write_handle.rs
@@ -42,6 +42,6 @@ fn write_handle_wait<'a>(env: Env<'a>, handle: ResourceArc<WriteHandleResource>)
     let future = handle.inner.lock().unwrap().take();
     match future {
         Some(f) => async_nif::spawn_task(env, f),
-        None => async_nif::send_error(env, "WriteHandle already consumed"),
+        None => async_nif::send_client_error(env, "WriteHandle already consumed"),
     }
 }
diff --git a/fluss-rust/bindings/elixir/test/error_test.exs b/fluss-rust/bindings/elixir/test/error_test.exs
new file mode 100644
index 0000000000..9294391cf1
--- /dev/null
+++ b/fluss-rust/bindings/elixir/test/error_test.exs
@@ -0,0 +1,87 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.ErrorTest do
+  use ExUnit.Case, async: true
+
+  @retriable_codes [
+    :network_exception,
+    :corrupt_message,
+    :schema_not_exist,
+    :log_storage_exception,
+    :kv_storage_exception,
+    :not_leader_or_follower,
+    :corrupt_record_exception,
+    :unknown_table_or_bucket_exception,
+    :request_time_out,
+    :storage_exception,
+    :not_enough_replicas_after_append_exception,
+    :not_enough_replicas_exception,
+    :leader_not_available_exception
+  ]
+
+  @non_retriable_codes [
+    :client_error,
+    :unknown_server_error,
+    :none,
+    :table_not_exist,
+    :authenticate_exception,
+    :authorization_exception,
+    :record_too_large_exception,
+    :deletion_disabled_exception,
+    :invalid_coordinator_exception,
+    :fenced_leader_epoch_exception,
+    :fenced_tiering_epoch_exception,
+    :retriable_authenticate_exception
+  ]
+
+  defp err(code), do: %Fluss.Error{code: code, error_code: 0, message: ""}
+
+  test "Exception.message/1 formats '[<code>]: <msg>'" do
+    err = %Fluss.Error{code: :network_exception, error_code: 1, message: "disconnected"}
+    assert Exception.message(err) == "Fluss error [network_exception]: disconnected"
+  end
+
+  test "retriable?/1 returns true for transient protocol codes" do
+    for code <- @retriable_codes do
+      assert Fluss.Error.retriable?(err(code)), "expected #{code} to be retriable"
+    end
+  end
+
+  test "retriable?/1 returns false for :client_error and permanent codes" do
+    for code <- @non_retriable_codes do
+      refute Fluss.Error.retriable?(err(code)), "expected #{code} to not be retriable"
+    end
+  end
+
+  describe "NIF error surface" do
+    test "unreachable server returns %Fluss.Error{code: :client_error, error_code: -2}" do
+      config = Fluss.Config.new("127.0.0.1:1")
+
+      assert {:error, %Fluss.Error{code: :client_error, error_code: -2}} =
+               Fluss.Connection.new(config)
+    end
+
+    test "bang variant raises %Fluss.Error{}" do
+      config = Fluss.Config.new("127.0.0.1:1")
+
+      assert_raise Fluss.Error, ~r/\[client_error\]/, fn ->
+        Fluss.Connection.new!(config)
+      end
+    end
+  end
+end

From 1257cc81f0b189435eefc65c00bbe0f89ae41d5f Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Jared=20Yu=20=28=E4=BD=99=E5=90=AF=E6=AD=A3=29?=
 <qzyu999@gmail.com>
Date: Thu, 30 Apr 2026 00:34:48 -0700
Subject: [PATCH 247/287] feat: (Python) Add async context manager (#487)

* feat: implement async context manager support for connection, writers, and scanners in Python bindings

* feat: expand python context manager test coverage for scanners and connections

* refactor: adjust indentation and clean up Python example code structure

* fix: Add self.close()?; to __aexit__ in connection.rs

* fix: Cleanup docstring

* feat: implement graceful connection shutdown with async close and update Python bindings accordingly

* feat: add optional timeout parameter to Python connection close method

* feat: revert python example indentation and add example for async context manager

* fix: revert changes to original example.py

* fix: revert changes to example.py (again)

* fix: always flush writers on context manager exit

* refactor: polish connection signature and clean up tests

* fix: prevent flush errors from masking in-flight exceptions

* fix: update dictionary in append to include all 9 fields in the schema

* refactor: update the __aexit__ to use is_exc_none for FlussConnection

* fix: move the async context manager demo to avoid the dropped table issue

* refactor: update is_exc_none to use is_none_or instead of map_or in compliance with clippy linting standards

* test: replace static sleep intervals with wait_for_table_ready fixture for robust table initialization

* docs: update Python examples and API reference to reflect async connection and context manager usage

* test: include "not leader or follower" in retryable error conditions within test suite
---
 fluss-rust/bindings/python/example/example.py |  24 +++-
 fluss-rust/bindings/python/fluss/__init__.pyi |  53 +++++++-
 fluss-rust/bindings/python/src/connection.rs  |  48 +++++++-
 fluss-rust/bindings/python/src/table.rs       |  29 +++++
 fluss-rust/bindings/python/src/upsert.rs      |  29 +++++
 fluss-rust/bindings/python/test/conftest.py   |  33 ++++-
 .../python/test/test_context_manager.py       | 116 ++++++++++++++++++
 .../bindings/python/test/test_log_table.py    |  19 ++-
 .../bindings/python/test/test_sasl_auth.py    |   4 +-
 .../crates/fluss/src/client/connection.rs     |  17 ++-
 .../docs/user-guide/python/api-reference.md   |   4 +-
 .../python/example/configuration.md           |   6 +-
 .../docs/user-guide/python/example/index.md   |   2 +-
 13 files changed, 354 insertions(+), 30 deletions(-)
 create mode 100644 fluss-rust/bindings/python/test/test_context_manager.py

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 52cefe1e6b..3498412303 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -667,6 +667,26 @@ async def main():
     except Exception as e:
         print(f"Error during projection: {e}")
 
+
+    print("\n--- New: async context manager demo ---")
+    async with await fluss.FlussConnection.create(config) as demo_conn:
+        demo_table = await demo_conn.get_table(table_path)
+        async with demo_table.new_append().create_writer() as writer:
+            writer.append(
+                {
+                    "id": 1,
+                    "name": "demo",
+                    "score": 1.0,
+                    "age": 25,
+                    "birth_date": date(2000, 1, 1),
+                    "check_in_time": dt_time(12, 0, 0),
+                    "created_at": datetime(2024, 1, 1, 12, 0, 0),
+                    "updated_at": datetime(2024, 1, 1, 12, 0, 0),
+                    "salary": Decimal("100.00"),
+                }
+            )
+            # auto-flushes on exit
+
     # Demo: Drop tables
     print("\n--- Testing drop_table() ---")
     try:
@@ -933,8 +953,10 @@ async def main():
         print(f"Error with partitioned KV table: {e}")
         traceback.print_exc()
 
+
+
     # Close connection
-    conn.close()
+    await conn.close()
     print("\nConnection closed")
 
 
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 02edcdb367..2f8daa0bc2 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -245,7 +245,7 @@ class FlussConnection:
     async def create(config: Config) -> FlussConnection: ...
     def get_admin(self) -> FlussAdmin: ...
     async def get_table(self, table_path: TablePath) -> FlussTable: ...
-    def close(self) -> None: ...
+    async def close(self) -> None: ...
     def __enter__(self) -> FlussConnection: ...
     def __exit__(
         self,
@@ -253,6 +253,13 @@ class FlussConnection:
         exc_value: Optional[BaseException],
         traceback: Optional[TracebackType],
     ) -> bool: ...
+    async def __aenter__(self) -> FlussConnection: ...
+    async def __aexit__(
+        self,
+        exc_type: Optional[type],
+        exc_value: Optional[BaseException],
+        traceback: Optional[TracebackType],
+    ) -> bool: ...
     def __repr__(self) -> str: ...
 
 class ServerNode:
@@ -611,6 +618,27 @@ class AppendWriter:
     def write_arrow_batch(self, batch: pa.RecordBatch) -> WriteResultHandle: ...
     def write_pandas(self, df: pd.DataFrame) -> None: ...
     async def flush(self) -> None: ...
+    async def __aenter__(self) -> AppendWriter:
+        """
+        Enter the async context manager.
+
+        Returns:
+            The AppendWriter instance.
+        """
+        ...
+    async def __aexit__(
+        self,
+        exc_type: Optional[type],
+        exc_value: Optional[BaseException],
+        traceback: Optional[TracebackType],
+    ) -> bool:
+        """
+        Exit the async context manager.
+
+        On exit, the writer is automatically flushed to ensure
+        all pending records are sent and acknowledged.
+        """
+        ...
     def __repr__(self) -> str: ...
 
 class UpsertWriter:
@@ -644,6 +672,27 @@ class UpsertWriter:
     async def flush(self) -> None:
         """Flush all pending upsert/delete operations to the server."""
         ...
+    async def __aenter__(self) -> UpsertWriter:
+        """
+        Enter the async context manager.
+
+        Returns:
+            The UpsertWriter instance.
+        """
+        ...
+    async def __aexit__(
+        self,
+        exc_type: Optional[type],
+        exc_value: Optional[BaseException],
+        traceback: Optional[TracebackType],
+    ) -> bool:
+        """
+        Exit the async context manager.
+
+        On exit, the writer is automatically flushed to ensure
+        all pending records are sent and acknowledged.
+        """
+        ...
     def __repr__(self) -> str: ...
 
 
@@ -807,6 +856,8 @@ class LogScanner:
 
         You must call subscribe(), subscribe_buckets(), or subscribe_partition() first.
         """
+        ...
+
     def __repr__(self) -> str: ...
     def __aiter__(self) -> AsyncIterator[Union[ScanRecord, RecordBatch]]: ...
 
diff --git a/fluss-rust/bindings/python/src/connection.rs b/fluss-rust/bindings/python/src/connection.rs
index a8d2d9e37d..3853896ce4 100644
--- a/fluss-rust/bindings/python/src/connection.rs
+++ b/fluss-rust/bindings/python/src/connection.rs
@@ -18,6 +18,7 @@
 use crate::*;
 use pyo3_async_runtimes::tokio::future_into_py;
 use std::sync::Arc;
+use std::time::Duration;
 
 /// Connection to a Fluss cluster
 #[pyclass]
@@ -82,9 +83,19 @@ impl FlussConnection {
         })
     }
 
-    // Close the connection
-    fn close(&mut self) -> PyResult<()> {
-        Ok(())
+    /// Close the connection (async).
+    ///
+    /// Gracefully shuts down the connection by draining any pending write batches.
+    /// This method is awaitable; a failure of the core `close` is raised as `FlussError`.
+    fn close<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let inner = self.inner.clone();
+
+        future_into_py(py, async move {
+            inner
+                .close(Duration::MAX)
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))
+        })
     }
 
     // Enter the runtime context (for 'with' statement)
@@ -100,10 +111,39 @@ impl FlussConnection {
         _exc_value: Option<Bound<'_, PyAny>>,
         _traceback: Option<Bound<'_, PyAny>>,
     ) -> PyResult<bool> {
-        self.close()?;
+        // Sync exit cannot await the graceful drain, so it's a no-op here.
+        // Users should use 'async with' for graceful shutdown.
         Ok(false)
     }
 
+    // Enter for 'async with': returns an awaitable that resolves to this same connection object.
+    fn __aenter__<'py>(slf: PyRef<'py, Self>, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let py_slf = slf.into_pyobject(py)?.unbind();
+        future_into_py(py, async move { Ok(py_slf) })
+    }
+
+    // Exit for 'async with': awaits close(); its error is raised only when the body raised nothing.
+    #[pyo3(signature = (exc_type=None, _exc_value=None, _traceback=None))]
+    fn __aexit__<'py>(
+        &self,
+        py: Python<'py>,
+        exc_type: Option<Bound<'py, PyAny>>,
+        _exc_value: Option<Bound<'py, PyAny>>,
+        _traceback: Option<Bound<'py, PyAny>>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let inner = self.inner.clone();
+        let is_exc_none = exc_type.as_ref().is_none_or(|e| e.is_none());
+        future_into_py(py, async move {
+            let res = inner.close(Duration::MAX).await;
+            if let Err(e) = res {
+                if is_exc_none {
+                    return Err(FlussError::from_core_error(&e));
+                }
+            }
+            Ok(false)
+        })
+    }
+
     fn __repr__(&self) -> String {
         "FlussConnection()".to_string()
     }
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index c1b467343e..7d6a6af4d2 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -989,6 +989,35 @@ impl AppendWriter {
         })
     }
 
+    // Enter for 'async with': returns an awaitable that resolves to this same writer object.
+    fn __aenter__<'py>(slf: PyRef<'py, Self>, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let py_slf = slf.into_pyobject(py)?.unbind();
+        future_into_py(py, async move { Ok(py_slf) })
+    }
+
+    // Exit for 'async with': awaits flush(); its error is raised only when the body raised nothing.
+    /// On exit, the writer is automatically flushed.
+    #[pyo3(signature = (exc_type=None, _exc_value=None, _traceback=None))]
+    fn __aexit__<'py>(
+        &self,
+        py: Python<'py>,
+        exc_type: Option<Bound<'py, PyAny>>,
+        _exc_value: Option<Bound<'py, PyAny>>,
+        _traceback: Option<Bound<'py, PyAny>>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let inner = self.inner.clone();
+        let is_exc_none = exc_type.as_ref().is_none_or(|e| e.is_none());
+        future_into_py(py, async move {
+            let res = inner.flush().await;
+            if let Err(e) = res {
+                if is_exc_none {
+                    return Err(FlussError::from_core_error(&e));
+                }
+            }
+            Ok(false)
+        })
+    }
+
     fn __repr__(&self) -> String {
         "AppendWriter()".to_string()
     }
diff --git a/fluss-rust/bindings/python/src/upsert.rs b/fluss-rust/bindings/python/src/upsert.rs
index 02ad7fa4bb..45244225f6 100644
--- a/fluss-rust/bindings/python/src/upsert.rs
+++ b/fluss-rust/bindings/python/src/upsert.rs
@@ -108,6 +108,35 @@ impl UpsertWriter {
         })
     }
 
+    // Enter for 'async with': returns an awaitable that resolves to this same writer object.
+    fn __aenter__<'py>(slf: PyRef<'py, Self>, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let py_slf = slf.into_pyobject(py)?.unbind();
+        future_into_py(py, async move { Ok(py_slf) })
+    }
+
+    // Exit for 'async with': awaits flush(); its error is raised only when the body raised nothing.
+    /// On exit, the writer is automatically flushed.
+    #[pyo3(signature = (exc_type=None, _exc_value=None, _traceback=None))]
+    fn __aexit__<'py>(
+        &self,
+        py: Python<'py>,
+        exc_type: Option<Bound<'py, PyAny>>,
+        _exc_value: Option<Bound<'py, PyAny>>,
+        _traceback: Option<Bound<'py, PyAny>>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let writer = self.writer.clone();
+        let is_exc_none = exc_type.as_ref().is_none_or(|e| e.is_none());
+        future_into_py(py, async move {
+            let res = writer.flush().await;
+            if let Err(e) = res {
+                if is_exc_none {
+                    return Err(FlussError::from_core_error(&e));
+                }
+            }
+            Ok(false)
+        })
+    }
+
     fn __repr__(&self) -> String {
         "UpsertWriter()".to_string()
     }
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
index 47c928077a..00119b76a3 100644
--- a/fluss-rust/bindings/python/test/conftest.py
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -96,7 +96,7 @@ async def _connect(bootstrap_servers):
             nodes = await admin.get_server_nodes()
             if any(n.server_type == "TabletServer" for n in nodes):
                 return conn
-            conn.close()
+            await conn.close()
             last_err = RuntimeError("No TabletServer available yet")
         except Exception as e:
             last_err = e
@@ -151,3 +151,34 @@ def plaintext_bootstrap_servers(fluss_cluster):
 @pytest_asyncio.fixture
 async def admin(connection):
     return connection.get_admin()
+
+
+@pytest_asyncio.fixture
+async def wait_for_table_ready(admin):
+    """
+    Fixture that returns a helper function to wait for a table or partition to be ready.
+    """
+    async def _wait(table_path, timeout=15, partition_name=None):
+        start_time = time.monotonic()
+        while time.monotonic() - start_time < timeout:
+            try:
+                if partition_name:
+                    await admin.list_partition_offsets(
+                        table_path, partition_name, [0], fluss.OffsetSpec.earliest()
+                    )
+                else:
+                    await admin.list_offsets(table_path, [0], fluss.OffsetSpec.earliest())
+                return
+            except (fluss.FlussError, Exception) as e:
+                # Catch "No leader found" or other errors that indicate the table/partition is still initializing
+                err_msg = str(e)
+                if any(msg in err_msg for msg in ["No leader found", "Table not ready", "Metadata not ready", "not leader or follower"]):
+                    await asyncio.sleep(1)
+                    continue
+                raise
+        raise TimeoutError(
+            f"Table/Partition {table_path} ({partition_name or 'standard'}) "
+            f"did not become ready within {timeout}s"
+        )
+
+    return _wait
diff --git a/fluss-rust/bindings/python/test/test_context_manager.py b/fluss-rust/bindings/python/test/test_context_manager.py
new file mode 100644
index 0000000000..f0dcc36f0f
--- /dev/null
+++ b/fluss-rust/bindings/python/test/test_context_manager.py
@@ -0,0 +1,116 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+import pytest
+import pyarrow as pa
+import time
+import fluss
+
+def _poll_records(scanner, expected_count, timeout_s=10):
+    """Poll a record-based scanner until expected_count records are collected."""
+    collected = []
+    deadline = time.monotonic() + timeout_s
+    while len(collected) < expected_count and time.monotonic() < deadline:
+        records = scanner.poll(5000)
+        collected.extend(records)
+    return collected
+
+@pytest.mark.asyncio
+async def test_connection_context_manager(plaintext_bootstrap_servers):
+    config = fluss.Config({"bootstrap.servers": plaintext_bootstrap_servers})
+    async with await fluss.FlussConnection.create(config) as conn:
+        admin = conn.get_admin()
+        nodes = await admin.get_server_nodes()
+        assert len(nodes) > 0
+
+
+@pytest.mark.asyncio
+async def test_append_writer_success_flush(connection, admin):
+    table_path = fluss.TablePath("fluss", "test_append_ctx_success")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+    
+    schema = fluss.Schema(pa.schema([pa.field("a", pa.int32())]))
+    await admin.create_table(table_path, fluss.TableDescriptor(schema))
+    
+    table = await connection.get_table(table_path)
+    
+    async with table.new_append().create_writer() as writer:
+        writer.append({"a": 1})
+        writer.append({"a": 2})
+        # No explicit flush here
+        
+    # After context exit, data should be flushed
+    scanner = await table.new_scan().create_log_scanner()
+    scanner.subscribe(0, fluss.EARLIEST_OFFSET)
+    records = _poll_records(scanner, expected_count=2)
+    assert len(records) == 2
+    assert sorted([r.row["a"] for r in records]) == [1, 2]
+
+@pytest.mark.asyncio
+async def test_connection_drain_on_close(plaintext_bootstrap_servers, admin):
+    table_path = fluss.TablePath("fluss", "test_conn_drain")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+    schema = fluss.Schema(pa.schema([pa.field("a", pa.int32())]))
+    await admin.create_table(table_path, fluss.TableDescriptor(schema))
+
+    config = fluss.Config({"bootstrap.servers": plaintext_bootstrap_servers})
+    async with await fluss.FlussConnection.create(config) as conn:
+        table = await conn.get_table(table_path)
+        writer = table.new_append().create_writer()
+        writer.append({"a": 123})
+        # No explicit flush, no writer context exit. 
+        # Rely on connection.__aexit__ -> close() to drain.
+    
+    # Re-connect with a new connection to verify data arrived
+    async with await fluss.FlussConnection.create(config) as conn2:
+        table2 = await conn2.get_table(table_path)
+        scanner = await table2.new_scan().create_log_scanner()
+        scanner.subscribe(0, fluss.EARLIEST_OFFSET)
+        records = _poll_records(scanner, expected_count=1)
+        assert len(records) == 1
+        assert records[0].row["a"] == 123
+
+@pytest.mark.asyncio
+async def test_upsert_writer_context_manager(connection, admin):
+    table_path = fluss.TablePath("fluss", "test_upsert_ctx")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+    
+    schema = fluss.Schema(pa.schema([pa.field("id", pa.int32()), pa.field("v", pa.string())]), primary_keys=["id"])
+    await admin.create_table(table_path, fluss.TableDescriptor(schema))
+    
+    table = await connection.get_table(table_path)
+    
+    # Success path: verify it flushes
+    async with table.new_upsert().create_writer() as writer:
+        writer.upsert({"id": 1, "v": "a"})
+        
+    lookuper = table.new_lookup().create_lookuper()
+    res = await lookuper.lookup({"id": 1})
+    assert res is not None
+    assert res["v"] == "a"
+    
+@pytest.mark.asyncio
+async def test_connection_context_manager_exception(plaintext_bootstrap_servers):
+    config = fluss.Config({"bootstrap.servers": plaintext_bootstrap_servers})
+    class TestException(Exception): pass
+    
+    try:
+        async with await fluss.FlussConnection.create(config) as conn:
+            raise TestException("connection error")
+    except TestException:
+        pass
+    # If we reach here without hanging, the connection __aexit__ gracefully handled the error
\ No newline at end of file
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
index 5708a93cdd..86e9a707c9 100644
--- a/fluss-rust/bindings/python/test/test_log_table.py
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -118,7 +118,7 @@ async def test_append_dict_rows(connection, admin):
     await admin.drop_table(table_path, ignore_if_not_exists=False)
 
 
-async def test_list_offsets(connection, admin):
+async def test_list_offsets(connection, admin, wait_for_table_ready):
     """Test listing earliest, latest, and timestamp-based offsets."""
     table_path = fluss.TablePath("fluss", "py_test_list_offsets")
     await admin.drop_table(table_path, ignore_if_not_exists=True)
@@ -129,7 +129,7 @@ async def test_list_offsets(connection, admin):
     table_descriptor = fluss.TableDescriptor(schema)
     await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
 
-    await asyncio.sleep(2)  # Wait for table initialization
+    await wait_for_table_ready(table_path)
 
     # Earliest offset should be 0 for empty table
     earliest = await admin.list_offsets(
@@ -266,7 +266,7 @@ async def test_project(connection, admin):
     await admin.drop_table(table_path, ignore_if_not_exists=False)
 
 
-async def test_poll_batches(connection, admin):
+async def test_poll_batches(connection, admin, wait_for_table_ready):
     """Test batch-based scanning with poll_arrow and poll_record_batch."""
     table_path = fluss.TablePath("fluss", "py_test_poll_batches")
     await admin.drop_table(table_path, ignore_if_not_exists=True)
@@ -277,7 +277,7 @@ async def test_poll_batches(connection, admin):
     table_descriptor = fluss.TableDescriptor(schema)
     await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
 
-    await asyncio.sleep(1)
+    await wait_for_table_ready(table_path)
 
     table = await connection.get_table(table_path)
     scanner = await table.new_scan().create_record_batch_log_scanner()
@@ -388,7 +388,7 @@ async def test_to_arrow_and_to_pandas(connection, admin):
     await admin.drop_table(table_path, ignore_if_not_exists=False)
 
 
-async def test_partitioned_table_append_scan(connection, admin):
+async def test_partitioned_table_append_scan(connection, admin, wait_for_table_ready):
     """Test append and scan on a partitioned log table."""
     table_path = fluss.TablePath("fluss", "py_test_partitioned_log_append")
     await admin.drop_table(table_path, ignore_if_not_exists=True)
@@ -413,9 +413,7 @@ async def test_partitioned_table_append_scan(connection, admin):
         await admin.create_partition(
             table_path, {"region": region}, ignore_if_exists=True
         )
-
-    await asyncio.sleep(2)  # Wait for partitions to be available
-
+        await wait_for_table_ready(table_path, partition_name=region)
     table = await connection.get_table(table_path)
     append_writer = table.new_append().create_writer()
 
@@ -625,7 +623,7 @@ async def test_write_pandas(connection, admin):
     await admin.drop_table(table_path, ignore_if_not_exists=False)
 
 
-async def test_partitioned_table_to_arrow(connection, admin):
+async def test_partitioned_table_to_arrow(connection, admin, wait_for_table_ready):
     """Test to_arrow() on partitioned tables."""
     table_path = fluss.TablePath("fluss", "py_test_partitioned_to_arrow")
     await admin.drop_table(table_path, ignore_if_not_exists=True)
@@ -646,8 +644,7 @@ async def test_partitioned_table_to_arrow(connection, admin):
         await admin.create_partition(
             table_path, {"region": region}, ignore_if_exists=True
         )
-
-    await asyncio.sleep(2)
+        await wait_for_table_ready(table_path, partition_name=region)
 
     table = await connection.get_table(table_path)
     writer = table.new_append().create_writer()
diff --git a/fluss-rust/bindings/python/test/test_sasl_auth.py b/fluss-rust/bindings/python/test/test_sasl_auth.py
index 9dd2ddda3f..6889f1ab67 100644
--- a/fluss-rust/bindings/python/test/test_sasl_auth.py
+++ b/fluss-rust/bindings/python/test/test_sasl_auth.py
@@ -45,7 +45,7 @@ async def test_sasl_connect_with_valid_credentials(sasl_bootstrap_servers):
 
     # Cleanup
     await admin.drop_database(db_name, ignore_if_not_exists=True, cascade=True)
-    conn.close()
+    await conn.close()
 
 
 async def test_sasl_connect_with_second_user(sasl_bootstrap_servers):
@@ -62,7 +62,7 @@ async def test_sasl_connect_with_second_user(sasl_bootstrap_servers):
 
     # Basic operation to confirm functional connection
     assert not await admin.database_exists("some_nonexistent_db_alice")
-    conn.close()
+    await conn.close()
 
 
 async def test_sasl_connect_with_wrong_password(sasl_bootstrap_servers):
diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index 62d440bed5..a3ffd7557e 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -28,10 +28,6 @@ use parking_lot::RwLock;
 use std::sync::Arc;
 use std::time::Duration;
 
-// TODO: implement `close(&self, timeout: Duration)` to gracefully shut down the
-// writer client (drain pending batches, then force-close on timeout).
-// Java's FlussConnection.close() calls writerClient.close(Long.MAX_VALUE).
-// WriterClient::close() already exists but is never called from the public API.
 pub struct FlussConnection {
     metadata: Arc<Metadata>,
     network_connects: Arc<RpcClient>,
@@ -73,6 +69,19 @@ impl FlussConnection {
         })
     }
 
+    /// Gracefully shut down the connection, draining any pending write batches.
+    ///
+    /// If a writer client has been created, this method will signal it to drain
+    /// its buffers and wait for the background sender task to complete, bounded
+    /// by the provided timeout.
+    pub async fn close(&self, timeout: Duration) -> Result<()> {
+        let writer_client = self.writer_client.write().take();
+        if let Some(client) = writer_client {
+            client.close(timeout).await?;
+        }
+        Ok(())
+    }
+
     pub fn get_metadata(&self) -> Arc<Metadata> {
         self.metadata.clone()
     }
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index 1268d37f9f..73b9a8fe7c 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -38,9 +38,9 @@ Complete API reference for the Fluss Python client.
 | `await FlussConnection.create(config) -> FlussConnection` | Connect to a Fluss cluster            |
 | `conn.get_admin() -> FlussAdmin`                        | Get admin interface                   |
 | `await conn.get_table(table_path) -> FlussTable`          | Get a table for read/write operations |
-| `conn.close()`                                            | Close the connection                  |
+| `await conn.close()`                                      | Close the connection                  |
 
-Supports `with` statement (context manager).
+Supports `async with` statement (async context manager).
 
 ## `FlussAdmin`
 
diff --git a/fluss-rust/website/docs/user-guide/python/example/configuration.md b/fluss-rust/website/docs/user-guide/python/example/configuration.md
index 995a81cc33..448ae029ac 100644
--- a/fluss-rust/website/docs/user-guide/python/example/configuration.md
+++ b/fluss-rust/website/docs/user-guide/python/example/configuration.md
@@ -12,10 +12,10 @@ config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
 conn = await fluss.FlussConnection.create(config)
 ```
 
-The connection also supports context managers:
+The connection also supports async context managers:
 
 ```python
-with await fluss.FlussConnection.create(config) as conn:
+async with await fluss.FlussConnection.create(config) as conn:
     ...
 ```
 
@@ -45,5 +45,5 @@ conn = await fluss.FlussConnection.create(config)
 Remember to close the connection when done:
 
 ```python
-conn.close()
+await conn.close()
 ```
diff --git a/fluss-rust/website/docs/user-guide/python/example/index.md b/fluss-rust/website/docs/user-guide/python/example/index.md
index ec9fa78f45..21768a1d06 100644
--- a/fluss-rust/website/docs/user-guide/python/example/index.md
+++ b/fluss-rust/website/docs/user-guide/python/example/index.md
@@ -40,7 +40,7 @@ async def main():
 
     # Cleanup
     await admin.drop_table(table_path, ignore_if_not_exists=True)
-    conn.close()
+    await conn.close()
 
 asyncio.run(main())
 ```

From 4888f49eff67078bd1b798477155240418276207 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 2 May 2026 18:38:05 +0100
Subject: [PATCH 248/287] chore: regenerate Cargo.lock for declared metrics
 deps (#518)

---
 fluss-rust/Cargo.lock | 118 ++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 118 insertions(+)

diff --git a/fluss-rust/Cargo.lock b/fluss-rust/Cargo.lock
index ac5b27f883..72a861808d 100644
--- a/fluss-rust/Cargo.lock
+++ b/fluss-rust/Cargo.lock
@@ -746,6 +746,15 @@ dependencies = [
  "rustc_version",
 ]
 
+[[package]]
+name = "crossbeam-epoch"
+version = "0.9.18"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "5b82ac4a3c2ca9c3460964f020e1402edd5753411d7737aa39c3714ad1b5420e"
+dependencies = [
+ "crossbeam-utils",
+]
+
 [[package]]
 name = "crossbeam-utils"
 version = "0.8.21"
@@ -975,6 +984,12 @@ version = "1.15.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "48c757948c5ede0e46177b7add2e67155f70e33c07fea8284df6576da70b3719"
 
+[[package]]
+name = "endian-type"
+version = "0.1.2"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c34f04666d835ff5d62e058c3995147c06f42fe86ff053337632bca83e42702d"
+
 [[package]]
 name = "equivalent"
 version = "1.0.2"
@@ -1104,6 +1119,8 @@ dependencies = [
  "jiff",
  "linked-hash-map",
  "log",
+ "metrics",
+ "metrics-util",
  "opendal",
  "ordered-float",
  "parking_lot",
@@ -1403,6 +1420,9 @@ name = "hashbrown"
 version = "0.16.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "841d1cc9bed7f9236f321df977030373f4a4163ae1a7dbfe1a51a2c1a51d9100"
+dependencies = [
+ "foldhash 0.2.0",
+]
 
 [[package]]
 name = "heck"
@@ -2054,6 +2074,37 @@ dependencies = [
  "autocfg",
 ]
 
+[[package]]
+name = "metrics"
+version = "0.24.5"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "ff56c2e7dce6bd462e3b8919986a617027481b1dcc703175b58cf9dd98a2f071"
+dependencies = [
+ "portable-atomic",
+ "rapidhash",
+]
+
+[[package]]
+name = "metrics-util"
+version = "0.20.3"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "9e56997f084e57b045edf17c3ed8ba7f9f779c670df8206dfd1c736f4c02dc4a"
+dependencies = [
+ "aho-corasick",
+ "crossbeam-epoch",
+ "crossbeam-utils",
+ "hashbrown 0.16.1",
+ "indexmap 2.13.1",
+ "metrics",
+ "ordered-float",
+ "quanta",
+ "radix_trie",
+ "rand 0.9.2",
+ "rand_xoshiro",
+ "rapidhash",
+ "sketches-ddsketch",
+]
+
 [[package]]
 name = "mime"
 version = "0.3.17"
@@ -2077,6 +2128,15 @@ version = "0.10.1"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "1d87ecb2933e8aeadb3e3a02b828fed80a7528047e68b4f424523a0981a3a084"
 
+[[package]]
+name = "nibble_vec"
+version = "0.1.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "77a5d83df9f36fe23f0c3648c6bbb8b0298bb5f1939c8f2704431371f4b84d43"
+dependencies = [
+ "smallvec",
+]
+
 [[package]]
 name = "num"
 version = "0.4.3"
@@ -2546,6 +2606,21 @@ dependencies = [
  "cc",
 ]
 
+[[package]]
+name = "quanta"
+version = "0.12.6"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f3ab5a9d756f0d97bdc89019bd2e4ea098cf9cde50ee7564dde6b81ccc8f06c7"
+dependencies = [
+ "crossbeam-utils",
+ "libc",
+ "once_cell",
+ "raw-cpuid",
+ "wasi",
+ "web-sys",
+ "winapi",
+]
+
 [[package]]
 name = "quick-xml"
 version = "0.37.5"
@@ -2648,6 +2723,16 @@ version = "0.7.0"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "dc33ff2d4973d518d823d61aa239014831e521c75da58e3df4840d3f47749d09"
 
+[[package]]
+name = "radix_trie"
+version = "0.2.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "c069c179fcdc6a2fe24d8d18305cf085fdbd4f922c041943e203685d6a1c58fd"
+dependencies = [
+ "endian-type",
+ "nibble_vec",
+]
+
 [[package]]
 name = "rand"
 version = "0.8.5"
@@ -2709,6 +2794,33 @@ dependencies = [
  "getrandom 0.3.4",
 ]
 
+[[package]]
+name = "rand_xoshiro"
+version = "0.7.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "f703f4665700daf5512dcca5f43afa6af89f09db47fb56be587f80636bda2d41"
+dependencies = [
+ "rand_core 0.9.5",
+]
+
+[[package]]
+name = "rapidhash"
+version = "4.4.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "b5e48930979c155e2f33aa36ab3119b5ee81332beb6482199a8ecd6029b80b59"
+dependencies = [
+ "rustversion",
+]
+
+[[package]]
+name = "raw-cpuid"
+version = "11.6.0"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "498cd0dc59d73224351ee52a95fee0f1a617a2eae0e7d9d720cc622c73a54186"
+dependencies = [
+ "bitflags",
+]
+
 [[package]]
 name = "redox_syscall"
 version = "0.5.18"
@@ -3214,6 +3326,12 @@ version = "0.1.5"
 source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "e3a9fe34e3e7a50316060351f37187a3f546bce95496156754b601a5fa71b76e"
 
+[[package]]
+name = "sketches-ddsketch"
+version = "0.3.1"
+source = "registry+https://github.com/rust-lang/crates.io-index"
+checksum = "0c6f73aeb92d671e0cc4dca167e59b2deb6387c375391bc99ee743f326994a2b"
+
 [[package]]
 name = "slab"
 version = "0.4.12"

From 00382876333302c8c1b97b01aede70a10ef1e90a Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Sun, 3 May 2026 11:52:41 +0100
Subject: [PATCH 249/287] chore: bump rand from 0.9.2 to 0.9.3 (#512)

Bumps [rand](https://github.com/rust-random/rand) from 0.9.2 to 0.9.3.
- [Release notes](https://github.com/rust-random/rand/releases)
- [Changelog](https://github.com/rust-random/rand/blob/0.9.3/CHANGELOG.md)
- [Commits](https://github.com/rust-random/rand/compare/rand_core-0.9.2...0.9.3)

---
updated-dependencies:
- dependency-name: rand
  dependency-version: 0.9.3
  dependency-type: direct:production
...

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 fluss-rust/Cargo.lock              | 14 +++++++-------
 fluss-rust/crates/fluss/Cargo.toml |  2 +-
 2 files changed, 8 insertions(+), 8 deletions(-)

diff --git a/fluss-rust/Cargo.lock b/fluss-rust/Cargo.lock
index 72a861808d..94a38e109a 100644
--- a/fluss-rust/Cargo.lock
+++ b/fluss-rust/Cargo.lock
@@ -525,7 +525,7 @@ dependencies = [
  "log",
  "num",
  "pin-project-lite",
- "rand 0.9.2",
+ "rand 0.9.3",
  "rustls",
  "rustls-native-certs",
  "rustls-pki-types",
@@ -1040,7 +1040,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
 checksum = "bb330bbd4cb7a5b9f559427f06f98a4f853a137c8298f3bd3f8ca57663e21986"
 dependencies = [
  "portable-atomic",
- "rand 0.9.2",
+ "rand 0.9.3",
  "web-time",
 ]
 
@@ -1127,7 +1127,7 @@ dependencies = [
  "parse-display 0.10.0",
  "prost",
  "prost-build",
- "rand 0.9.2",
+ "rand 0.9.3",
  "scopeguard",
  "serde",
  "serde_json",
@@ -2099,7 +2099,7 @@ dependencies = [
  "ordered-float",
  "quanta",
  "radix_trie",
- "rand 0.9.2",
+ "rand 0.9.3",
  "rand_xoshiro",
  "rapidhash",
  "sketches-ddsketch",
@@ -2670,7 +2670,7 @@ dependencies = [
  "bytes",
  "getrandom 0.3.4",
  "lru-slab",
- "rand 0.9.2",
+ "rand 0.9.3",
  "ring",
  "rustc-hash",
  "rustls",
@@ -2747,9 +2747,9 @@ dependencies = [
 
 [[package]]
 name = "rand"
-version = "0.9.2"
+version = "0.9.3"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "6db2770f06117d490610c7488547d543617b21bfa07796d7a12f6f1bd53850d1"
+checksum = "7ec095654a25171c2124e9e3393a930bddbffdc939556c914957a4c3e0a87166"
 dependencies = [
  "rand_chacha 0.9.0",
  "rand_core 0.9.5",
diff --git a/fluss-rust/crates/fluss/Cargo.toml b/fluss-rust/crates/fluss/Cargo.toml
index a47fc238f2..feac8309f1 100644
--- a/fluss-rust/crates/fluss/Cargo.toml
+++ b/fluss-rust/crates/fluss/Cargo.toml
@@ -52,7 +52,7 @@ clap = { workspace = true }
 crc32c = "0.6.8"
 linked-hash-map = "0.5.6"
 prost = "0.14"
-rand = "0.9.1"
+rand = "0.9.3"
 serde = { workspace = true, features = ["rc"] }
 serde_json = { workspace = true }
 thiserror = "1.0"

From 93c28cc152e29a20bf400f284e9d3987c964158c Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Sun, 3 May 2026 11:53:36 +0100
Subject: [PATCH 250/287] chore: bump actions/upload-artifact from 4 to 7
 (#521)

Bumps [actions/upload-artifact](https://github.com/actions/upload-artifact) from 4 to 7.
- [Release notes](https://github.com/actions/upload-artifact/releases)
- [Commits](https://github.com/actions/upload-artifact/compare/v4...v7)

---
updated-dependencies:
- dependency-name: actions/upload-artifact
  dependency-version: '7'
  dependency-type: direct:production
  update-type: version-update:semver-major
...

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 fluss-rust/.github/workflows/release_python.yml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/.github/workflows/release_python.yml b/fluss-rust/.github/workflows/release_python.yml
index 5a5ae7a72d..c2fed15556 100644
--- a/fluss-rust/.github/workflows/release_python.yml
+++ b/fluss-rust/.github/workflows/release_python.yml
@@ -58,7 +58,7 @@ jobs:
           args: -o dist
 
       - name: Upload sdist
-        uses: actions/upload-artifact@v4
+        uses: actions/upload-artifact@v7
         with:
           name: wheels-sdist
           path: bindings/python/dist
@@ -138,7 +138,7 @@ jobs:
           before-script-linux: *protoc-install
 
       - name: Upload wheels
-        uses: actions/upload-artifact@v4
+        uses: actions/upload-artifact@v7
         with:
           name: wheels-${{ matrix.os }}-${{ matrix.target || 'native' }}
           path: bindings/python/dist

From 142f9ccb2951be470142924ac0ccfdb3175d29b6 Mon Sep 17 00:00:00 2001
From: "dependabot[bot]" <49699333+dependabot[bot]@users.noreply.github.com>
Date: Sun, 3 May 2026 11:54:37 +0100
Subject: [PATCH 251/287] chore: bump rustls-webpki from 0.103.10 to 0.103.13
 (#513)

Bumps [rustls-webpki](https://github.com/rustls/webpki) from 0.103.10 to 0.103.13.
- [Release notes](https://github.com/rustls/webpki/releases)
- [Commits](https://github.com/rustls/webpki/compare/v/0.103.10...v/0.103.13)

---
updated-dependencies:
- dependency-name: rustls-webpki
  dependency-version: 0.103.13
  dependency-type: indirect
...

Signed-off-by: dependabot[bot] <support@github.com>
Co-authored-by: dependabot[bot] <49699333+dependabot[bot]@users.noreply.github.com>
---
 fluss-rust/Cargo.lock | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/fluss-rust/Cargo.lock b/fluss-rust/Cargo.lock
index 94a38e109a..f409723ed2 100644
--- a/fluss-rust/Cargo.lock
+++ b/fluss-rust/Cargo.lock
@@ -3081,9 +3081,9 @@ dependencies = [
 
 [[package]]
 name = "rustls-webpki"
-version = "0.103.10"
+version = "0.103.13"
 source = "registry+https://github.com/rust-lang/crates.io-index"
-checksum = "df33b2b81ac578cabaf06b89b0631153a3f416b0a886e8a7a1707fb51abbd1ef"
+checksum = "61c429a8649f110dddef65e2a5ad240f747e85f7758a6bccc7e5777bd33f756e"
 dependencies = [
  "ring",
  "rustls-pki-types",

From 273c238c72a9c6c9749a12a9ccb8999a96cdbc1c Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 3 May 2026 12:58:55 +0100
Subject: [PATCH 252/287] fix: [bindings] map RpcError to NetworkException for
 Java parity (#519)

---
 fluss-rust/bindings/cpp/src/lib.rs                  | 13 ++++++++-----
 .../bindings/elixir/native/fluss_nif/src/atoms.rs   |  5 +++++
 fluss-rust/bindings/elixir/test/error_test.exs      |  6 +++---
 fluss-rust/bindings/python/src/error.rs             | 12 ++++++------
 4 files changed, 22 insertions(+), 14 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index facb0e3198..875373bcec 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -23,6 +23,8 @@ use std::time::Duration;
 
 use fluss as fcore;
 use fluss::PartitionId;
+use fluss::error::Error;
+use fluss::rpc::FlussError as CoreFlussError;
 
 static RUNTIME: LazyLock<tokio::runtime::Runtime> = LazyLock::new(|| {
     tokio::runtime::Builder::new_multi_thread()
@@ -855,13 +857,14 @@ fn client_err(msg: String) -> ffi::FfiResult {
     err_result(CLIENT_ERROR_CODE, msg)
 }
 
-/// Convert a core Error to FfiResult.
-/// `FlussAPIError` variants carry the server protocol error code directly.
-/// All other error kinds are client-side and use CLIENT_ERROR_CODE.
-fn err_from_core_error(e: &fcore::error::Error) -> ffi::FfiResult {
-    use fcore::error::Error;
+fn err_from_core_error(e: &Error) -> ffi::FfiResult {
+    // Transport failures map to `NetworkException` (Java parity,
+    // retriable).
     match e {
         Error::FlussAPIError { api_error } => err_result(api_error.code, api_error.message.clone()),
+        Error::RpcError { .. } => {
+            err_result(CoreFlussError::NetworkException.code(), e.to_string())
+        }
         _ => client_err(e.to_string()),
     }
 }
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs
index 0a8e95b8b4..45d5aa303a 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/atoms.rs
@@ -120,10 +120,15 @@ pub struct NifFlussError {
 
 impl NifFlussError {
     pub fn from_core(error: &CoreError) -> Self {
+        // Transport failures map to `:network_exception` (Java parity,
+        // retriable).
         let (code, error_code) = match error {
             CoreError::FlussAPIError { api_error } => {
                 (api_error_atom(api_error.code), api_error.code)
             }
+            CoreError::RpcError { .. } => {
+                (network_exception(), FlussError::NetworkException.code())
+            }
             _ => (client_error(), CLIENT_ERROR_CODE),
         };
         Self {
diff --git a/fluss-rust/bindings/elixir/test/error_test.exs b/fluss-rust/bindings/elixir/test/error_test.exs
index 9294391cf1..d6d4017597 100644
--- a/fluss-rust/bindings/elixir/test/error_test.exs
+++ b/fluss-rust/bindings/elixir/test/error_test.exs
@@ -69,17 +69,17 @@ defmodule Fluss.ErrorTest do
   end
 
   describe "NIF error surface" do
-    test "unreachable server returns %Fluss.Error{code: :client_error, error_code: -2}" do
+    test "unreachable server returns %Fluss.Error{code: :network_exception, error_code: 1}" do
       config = Fluss.Config.new("127.0.0.1:1")
 
-      assert {:error, %Fluss.Error{code: :client_error, error_code: -2}} =
+      assert {:error, %Fluss.Error{code: :network_exception, error_code: 1}} =
                Fluss.Connection.new(config)
     end
 
     test "bang variant raises %Fluss.Error{}" do
       config = Fluss.Config.new("127.0.0.1:1")
 
-      assert_raise Fluss.Error, ~r/\[client_error\]/, fn ->
+      assert_raise Fluss.Error, ~r/\[network_exception\]/, fn ->
         Fluss.Connection.new!(config)
       end
     end
diff --git a/fluss-rust/bindings/python/src/error.rs b/fluss-rust/bindings/python/src/error.rs
index 10c6cfa0ec..9d718aa66e 100644
--- a/fluss-rust/bindings/python/src/error.rs
+++ b/fluss-rust/bindings/python/src/error.rs
@@ -15,6 +15,8 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use fluss::error::Error;
+use fluss::rpc::FlussError as CoreFlussError;
 use pyo3::exceptions::PyException;
 use pyo3::prelude::*;
 
@@ -55,7 +57,6 @@ impl FlussError {
     /// Returns ``True`` if retrying the request may succeed. Client-side errors always return ``False``.
     #[getter]
     fn is_retriable(&self) -> bool {
-        use fluss::rpc::FlussError as CoreFlussError;
         if self.error_code == CLIENT_ERROR_CODE {
             return false;
         }
@@ -68,13 +69,12 @@ impl FlussError {
         PyErr::new::<FlussError, _>((message.to_string(), CLIENT_ERROR_CODE))
     }
 
-    /// Create a PyErr from a core Error.
-    /// `FlussAPIError` variants carry the server protocol error code directly.
-    /// All other error kinds are client-side and use CLIENT_ERROR_CODE.
-    pub fn from_core_error(error: &fluss::error::Error) -> PyErr {
-        use fluss::error::Error;
+    pub fn from_core_error(error: &Error) -> PyErr {
+        // Transport failures map to `NetworkException` (Java parity,
+        // retriable).
         let (msg, code) = match error {
             Error::FlussAPIError { api_error } => (api_error.message.clone(), api_error.code),
+            Error::RpcError { .. } => (error.to_string(), CoreFlussError::NetworkException.code()),
             _ => (error.to_string(), CLIENT_ERROR_CODE),
         };
         PyErr::new::<FlussError, _>((msg, code))

From f433709a943d0e696688bac1eb78dfb72bc9e5cb Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 3 May 2026 13:13:58 +0100
Subject: [PATCH 253/287] feat: make LogScanner poll methods async to prevent
 event loop blocking (#495)

Convert poll(), poll_record_batch(), poll_arrow(), to_arrow(), and
to_pandas() from sync (py.detach + block_on) to async (future_into_py).

The sync methods blocked the asyncio event loop thread, preventing
concurrent future_into_py tasks from delivering results. This caused
deadlocks when users ran multiple async operations simultaneously.

Breaking change: these methods now return awaitables instead of direct
values, so existing callers must `await` them.
---
 fluss-rust/bindings/python/example/example.py |  26 +-
 fluss-rust/bindings/python/fluss/__init__.pyi |  10 +-
 fluss-rust/bindings/python/pyproject.toml     |   2 +-
 fluss-rust/bindings/python/src/table.rs       | 547 +++++++-----------
 fluss-rust/bindings/python/test/conftest.py   |  16 +-
 .../bindings/python/test/test_log_table.py    |  56 +-
 .../docs/user-guide/python/api-reference.md   |  12 +-
 .../docs/user-guide/python/data-types.md      |   2 +-
 .../docs/user-guide/python/example/index.md   |   2 +-
 .../user-guide/python/example/log-tables.md   |   8 +-
 .../python/example/partitioned-tables.md      |   2 +-
 11 files changed, 286 insertions(+), 397 deletions(-)

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 3498412303..0149996cd5 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -278,7 +278,7 @@ async def main():
 
         # Try to get as PyArrow Table
         try:
-            pa_table_result = batch_scanner.to_arrow()
+            pa_table_result = await batch_scanner.to_arrow()
             print(f"\nAs PyArrow Table: {pa_table_result}")
         except Exception as e:
             print(f"Could not convert to PyArrow: {e}")
@@ -289,7 +289,7 @@ async def main():
 
         # Try to get as Pandas DataFrame
         try:
-            df_result = batch_scanner2.to_pandas()
+            df_result = await batch_scanner2.to_pandas()
             print(f"\nAs Pandas DataFrame:\n{df_result}")
         except Exception as e:
             print(f"Could not convert to Pandas: {e}")
@@ -308,7 +308,7 @@ async def main():
         # Poll with a timeout of 5000ms (5 seconds)
         # Note: poll_arrow() returns an empty table (not an error) on timeout
         try:
-            poll_result = batch_scanner3.poll_arrow(5000)
+            poll_result = await batch_scanner3.poll_arrow(5000)
             print(f"Number of rows: {poll_result.num_rows}")
 
             if poll_result.num_rows > 0:
@@ -328,7 +328,7 @@ async def main():
         batch_scanner4.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
         try:
-            batches = batch_scanner4.poll_record_batch(5000)
+            batches = await batch_scanner4.poll_record_batch(5000)
             print(f"Number of batches: {len(batches)}")
 
             for i, batch in enumerate(batches):
@@ -354,7 +354,7 @@ async def main():
         # Poll returns ScanRecords — records grouped by bucket
         print("\n--- Testing poll() method (record-by-record) ---")
         try:
-            scan_records = record_scanner.poll(5000)
+            scan_records = await record_scanner.poll(5000)
             print(f"Total records: {scan_records.count()}, buckets: {len(scan_records.buckets())}")
 
             # Flat iteration over all records (regardless of bucket)
@@ -387,7 +387,7 @@ async def main():
         # Unsubscribe from bucket 0 — future polls will skip this bucket
         unsub_scanner.unsubscribe(bucket_id=0)
         print("Unsubscribed from bucket 0")
-        remaining = unsub_scanner.poll_arrow(5000)
+        remaining = await unsub_scanner.poll_arrow(5000)
         print(f"After unsubscribe, got {remaining.num_rows} records (from remaining buckets)")
     except Exception as e:
         print(f"Error during unsubscribe test: {e}")
@@ -640,7 +640,7 @@ async def main():
         print("\n1. Projection by index [0, 1] (id, name):")
         scanner_index = await table.new_scan().project([0, 1]).create_record_batch_log_scanner()
         scanner_index.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
-        df_projected = scanner_index.to_pandas()
+        df_projected = await scanner_index.to_pandas()
         print(df_projected.head())
         print(
             f"   Projected {df_projected.shape[1]} columns: {list(df_projected.columns)}"
@@ -652,7 +652,7 @@ async def main():
             .project_by_name(["name", "score"]) \
             .create_record_batch_log_scanner()
         scanner_names.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
-        df_named = scanner_names.to_pandas()
+        df_named = await scanner_names.to_pandas()
         print(df_named.head())
         print(f"   Projected {df_named.shape[1]} columns: {list(df_named.columns)}")
 
@@ -661,7 +661,7 @@ async def main():
         scanner_proj = await table.new_scan().project([0, 2]).create_record_batch_log_scanner()
         scanner_proj.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
         # Quick poll that may return empty
-        result = scanner_proj.poll_arrow(100)
+        result = await scanner_proj.poll_arrow(100)
         print(f"   Schema columns: {result.schema.names}")
 
     except Exception as e:
@@ -801,7 +801,7 @@ async def main():
             print(f"Subscribed to partition {p.partition_name} (id={p.partition_id})")
 
         # Use to_arrow() - now works for partitioned tables!
-        partitioned_arrow = partitioned_scanner.to_arrow()
+        partitioned_arrow = await partitioned_scanner.to_arrow()
         print(f"\nto_arrow() returned {partitioned_arrow.num_rows} records from partitioned table:")
         print(partitioned_arrow.to_pandas())
 
@@ -813,7 +813,7 @@ async def main():
         }
         partitioned_scanner_batch.subscribe_partition_buckets(partition_bucket_offsets)
         print(f"Batch subscribed to {len(partition_bucket_offsets)} partition+bucket combinations")
-        partitioned_batch_arrow = partitioned_scanner_batch.to_arrow()
+        partitioned_batch_arrow = await partitioned_scanner_batch.to_arrow()
         print(f"to_arrow() returned {partitioned_batch_arrow.num_rows} records:")
         print(partitioned_batch_arrow.to_pandas())
 
@@ -826,7 +826,7 @@ async def main():
         first_partition = partition_infos[0]
         partitioned_scanner3.unsubscribe_partition(first_partition.partition_id, 0)
         print(f"Unsubscribed from partition {first_partition.partition_name} (id={first_partition.partition_id})")
-        remaining_arrow = partitioned_scanner3.to_arrow()
+        remaining_arrow = await partitioned_scanner3.to_arrow()
         print(f"After unsubscribe, to_arrow() returned {remaining_arrow.num_rows} records (from remaining partitions):")
         print(remaining_arrow.to_pandas())
 
@@ -835,7 +835,7 @@ async def main():
         partitioned_scanner2 = await partitioned_table.new_scan().create_record_batch_log_scanner()
         for p in partition_infos:
             partitioned_scanner2.subscribe_partition(p.partition_id, 0, fluss.EARLIEST_OFFSET)
-        partitioned_df = partitioned_scanner2.to_pandas()
+        partitioned_df = await partitioned_scanner2.to_pandas()
         print(f"to_pandas() returned {len(partitioned_df)} records:")
         print(partitioned_df)
 
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 2f8daa0bc2..fc71397386 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -790,7 +790,7 @@ class LogScanner:
             bucket_id: The bucket ID within the partition
         """
         ...
-    def poll(self, timeout_ms: int) -> ScanRecords:
+    async def poll(self, timeout_ms: int) -> ScanRecords:
         """Poll for individual records with metadata.
 
         Requires a record-based scanner (created with new_scan().create_log_scanner()).
@@ -807,7 +807,7 @@ class LogScanner:
             Returns an empty ScanRecords if no records are available or timeout expires.
         """
         ...
-    def poll_record_batch(self, timeout_ms: int) -> List[RecordBatch]:
+    async def poll_record_batch(self, timeout_ms: int) -> List[RecordBatch]:
         """Poll for batches with metadata.
 
         Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner()).
@@ -823,7 +823,7 @@ class LogScanner:
             Returns an empty list if no batches are available or timeout expires.
         """
         ...
-    def poll_arrow(self, timeout_ms: int) -> pa.Table:
+    async def poll_arrow(self, timeout_ms: int) -> pa.Table:
         """Poll for records as an Arrow Table.
 
         Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner()).
@@ -839,7 +839,7 @@ class LogScanner:
             or timeout expires.
         """
         ...
-    def to_pandas(self) -> pd.DataFrame:
+    async def to_pandas(self) -> pd.DataFrame:
         """Convert all data to Pandas DataFrame.
 
         Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner()).
@@ -848,7 +848,7 @@ class LogScanner:
         You must call subscribe(), subscribe_buckets(), or subscribe_partition() first.
         """
         ...
-    def to_arrow(self) -> pa.Table:
+    async def to_arrow(self) -> pa.Table:
         """Convert all data to Arrow Table.
 
         Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner()).
diff --git a/fluss-rust/bindings/python/pyproject.toml b/fluss-rust/bindings/python/pyproject.toml
index 22e641881b..56a059c9d4 100644
--- a/fluss-rust/bindings/python/pyproject.toml
+++ b/fluss-rust/bindings/python/pyproject.toml
@@ -95,7 +95,7 @@ known-first-party = ["fluss"]
 
 [tool.pytest.ini_options]
 asyncio_mode = "auto"
-asyncio_default_fixture_loop_scope = "function"
+asyncio_default_fixture_loop_scope = "session"
 timeout = 120
 
 [tool.mypy]
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 7d6a6af4d2..98aee5e3c6 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -535,7 +535,7 @@ impl TableScan {
                 admin,
                 table_info,
                 projected_schema,
-                projected_row_type,
+                Arc::new(projected_row_type),
             );
 
             Python::attach(|py| Py::new(py, py_scanner))
@@ -2013,9 +2013,9 @@ pub struct LogScanner {
     /// The projected Arrow schema to use for empty table creation
     projected_schema: SchemaRef,
     /// The projected row type to use for record-based scanning
-    projected_row_type: fcore::metadata::RowType,
+    projected_row_type: Arc<fcore::metadata::RowType>,
     /// Cache for partition_id -> partition_name mapping (avoids repeated list_partition_infos calls)
-    partition_name_cache: std::sync::RwLock<Option<HashMap<i64, String>>>,
+    partition_name_cache: Arc<std::sync::RwLock<Option<HashMap<i64, String>>>>,
 }
 
 #[pymethods]
@@ -2132,9 +2132,7 @@ impl LogScanner {
     ///     - Requires a record-based scanner (created with new_scan().create_log_scanner())
     ///     - Returns an empty ScanRecords if no records are available
     ///     - When timeout expires, returns an empty ScanRecords (NOT an error)
-    fn poll(&self, py: Python, timeout_ms: i64) -> PyResult<ScanRecords> {
-        let scanner = self.kind.as_record()?;
-
+    fn poll<'py>(&self, py: Python<'py>, timeout_ms: i64) -> PyResult<Bound<'py, PyAny>> {
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
                 "timeout_ms must be non-negative, got: {timeout_ms}"
@@ -2142,29 +2140,36 @@ impl LogScanner {
         }
 
         let timeout = Duration::from_millis(timeout_ms as u64);
-        let scan_records = py
-            .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
-            .map_err(|e| FlussError::from_core_error(&e))?;
+        let scanner = Arc::clone(&self.kind);
+        let projected_row_type = self.projected_row_type.clone();
 
-        // Convert core ScanRecords to Python ScanRecords grouped by bucket
-        let row_type = &self.projected_row_type;
-        let mut records_by_bucket = IndexMap::new();
-        let mut total_count = 0usize;
-
-        for (bucket, records) in scan_records.into_records_by_buckets() {
-            let py_bucket = TableBucket::from_core(bucket);
-            let mut py_records = Vec::with_capacity(records.len());
-            for record in &records {
-                let scan_record = ScanRecord::from_core(py, record, row_type)?;
-                py_records.push(Py::new(py, scan_record)?);
-                total_count += 1;
-            }
-            records_by_bucket.insert(py_bucket, py_records);
-        }
+        future_into_py(py, async move {
+            let scan_records = scanner
+                .as_record()?
+                .poll(timeout)
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
-        Ok(ScanRecords {
-            records_by_bucket,
-            total_count,
+            Python::attach(|py| {
+                let mut records_by_bucket = IndexMap::new();
+                let mut total_count = 0usize;
+
+                for (bucket, records) in scan_records.into_records_by_buckets() {
+                    let py_bucket = TableBucket::from_core(bucket);
+                    let mut py_records = Vec::with_capacity(records.len());
+                    for record in &records {
+                        let scan_record = ScanRecord::from_core(py, record, &projected_row_type)?;
+                        py_records.push(Py::new(py, scan_record)?);
+                        total_count += 1;
+                    }
+                    records_by_bucket.insert(py_bucket, py_records);
+                }
+
+                Ok(ScanRecords {
+                    records_by_bucket,
+                    total_count,
+                })
+            })
         })
     }
 
@@ -2181,9 +2186,11 @@ impl LogScanner {
     ///     - Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner())
     ///     - Returns an empty list if no batches are available
     ///     - When timeout expires, returns an empty list (NOT an error)
-    fn poll_record_batch(&self, py: Python, timeout_ms: i64) -> PyResult<Vec<RecordBatch>> {
-        let scanner = self.kind.as_batch()?;
-
+    fn poll_record_batch<'py>(
+        &self,
+        py: Python<'py>,
+        timeout_ms: i64,
+    ) -> PyResult<Bound<'py, PyAny>> {
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
                 "timeout_ms must be non-negative, got: {timeout_ms}"
@@ -2191,17 +2198,22 @@ impl LogScanner {
         }
 
         let timeout = Duration::from_millis(timeout_ms as u64);
-        let scan_batches = py
-            .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
-            .map_err(|e| FlussError::from_core_error(&e))?;
+        let scanner = Arc::clone(&self.kind);
 
-        // Convert ScanBatch to RecordBatch with metadata
-        let result = scan_batches
-            .into_iter()
-            .map(RecordBatch::from_scan_batch)
-            .collect();
+        future_into_py(py, async move {
+            let scan_batches = scanner
+                .as_batch()?
+                .poll(timeout)
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
-        Ok(result)
+            Python::attach(|py| {
+                scan_batches
+                    .into_iter()
+                    .map(|sb| Py::new(py, RecordBatch::from_scan_batch(sb)))
+                    .collect::<PyResult<Vec<_>>>()
+            })
+        })
     }
 
     /// Poll for new records as an Arrow Table.
@@ -2216,9 +2228,7 @@ impl LogScanner {
     ///     - Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner())
     ///     - Returns an empty table (with correct schema) if no records are available
     ///     - When timeout expires, returns an empty table (NOT an error)
-    fn poll_arrow(&self, py: Python, timeout_ms: i64) -> PyResult<Py<PyAny>> {
-        let scanner = self.kind.as_batch()?;
-
+    fn poll_arrow<'py>(&self, py: Python<'py>, timeout_ms: i64) -> PyResult<Bound<'py, PyAny>> {
         if timeout_ms < 0 {
             return Err(FlussError::new_err(format!(
                 "timeout_ms must be non-negative, got: {timeout_ms}"
@@ -2226,38 +2236,23 @@ impl LogScanner {
         }
 
         let timeout = Duration::from_millis(timeout_ms as u64);
-        let scan_batches = py
-            .detach(|| TOKIO_RUNTIME.block_on(async { scanner.poll(timeout).await }))
-            .map_err(|e| FlussError::from_core_error(&e))?;
-
-        // Convert ScanBatch to Arrow batches
-        if scan_batches.is_empty() {
-            return self.create_empty_table(py);
-        }
-
-        let arrow_batches: Vec<_> = scan_batches
-            .into_iter()
-            .map(|scan_batch| Arc::new(scan_batch.into_batch()))
-            .collect();
-
-        Utils::combine_batches_to_table(py, arrow_batches)
-    }
+        let scanner = Arc::clone(&self.kind);
+        let projected_schema = self.projected_schema.clone();
 
-    /// Create an empty PyArrow table with the correct (projected) schema
-    fn create_empty_table(&self, py: Python) -> PyResult<Py<PyAny>> {
-        // Use the projected schema stored in the scanner
-        let py_schema = self
-            .projected_schema
-            .as_ref()
-            .to_pyarrow(py)
-            .map_err(|e| FlussError::new_err(format!("Failed to convert schema: {e}")))?;
+        future_into_py(py, async move {
+            let scan_batches = scanner
+                .as_batch()?
+                .poll(timeout)
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
-        let pyarrow = py.import("pyarrow")?;
-        let empty_table = pyarrow
-            .getattr("Table")?
-            .call_method1("from_batches", (vec![] as Vec<Py<PyAny>>, py_schema))?;
+            let arrow_batches = scan_batches
+                .into_iter()
+                .map(|sb| Arc::new(sb.into_batch()))
+                .collect();
 
-        Ok(empty_table.into())
+            Python::attach(|py| Self::batches_to_arrow_table(py, arrow_batches, &projected_schema))
+        })
     }
 
     /// Convert all data to Arrow Table.
@@ -2269,21 +2264,33 @@ impl LogScanner {
     ///
     /// Returns:
     ///     PyArrow Table containing all data from subscribed buckets
-    fn to_arrow(&self, py: Python) -> PyResult<Py<PyAny>> {
-        let scanner = self.kind.as_batch()?;
-        let subscribed = scanner.get_subscribed_buckets();
+    fn to_arrow<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let kind = Arc::clone(&self.kind);
+        let admin = Arc::clone(&self.admin);
+        let table_info = self.table_info.clone();
+        let projected_schema = self.projected_schema.clone();
+        let partition_name_cache = Arc::clone(&self.partition_name_cache);
 
-        if subscribed.is_empty() {
-            return Err(FlussError::new_err(
-                "No buckets subscribed. Call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.",
-            ));
-        }
+        future_into_py(py, async move {
+            let scanner = kind.as_batch()?;
+            let subscribed = scanner.get_subscribed_buckets();
+            if subscribed.is_empty() {
+                return Err(FlussError::new_err(
+                    "No buckets subscribed. Call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.",
+                ));
+            }
 
-        // 2. Query latest offsets for all subscribed buckets
-        let stopping_offsets = self.query_latest_offsets(py, &subscribed)?;
+            let all_batches = Self::collect_all_batches(
+                scanner,
+                &admin,
+                &table_info,
+                &subscribed,
+                &partition_name_cache,
+            )
+            .await?;
 
-        // 3. Poll until all buckets reach their stopping offsets
-        self.poll_until_offsets(py, stopping_offsets)
+            Python::attach(|py| Self::batches_to_arrow_table(py, all_batches, &projected_schema))
+        })
     }
 
     /// Convert all data to Pandas DataFrame.
@@ -2295,12 +2302,36 @@ impl LogScanner {
     ///
     /// Returns:
     ///     Pandas DataFrame containing all data from subscribed buckets
-    fn to_pandas(&self, py: Python) -> PyResult<Py<PyAny>> {
-        let arrow_table = self.to_arrow(py)?;
+    fn to_pandas<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
+        let kind = Arc::clone(&self.kind);
+        let admin = Arc::clone(&self.admin);
+        let table_info = self.table_info.clone();
+        let projected_schema = self.projected_schema.clone();
+        let partition_name_cache = Arc::clone(&self.partition_name_cache);
+
+        future_into_py(py, async move {
+            let scanner = kind.as_batch()?;
+            let subscribed = scanner.get_subscribed_buckets();
+            if subscribed.is_empty() {
+                return Err(FlussError::new_err(
+                    "No buckets subscribed. Call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.",
+                ));
+            }
+
+            let all_batches = Self::collect_all_batches(
+                scanner,
+                &admin,
+                &table_info,
+                &subscribed,
+                &partition_name_cache,
+            )
+            .await?;
 
-        // Convert Arrow Table to Pandas DataFrame using pyarrow
-        let df = arrow_table.call_method0(py, "to_pandas")?;
-        Ok(df)
+            Python::attach(|py| {
+                let arrow_table = Self::batches_to_arrow_table(py, all_batches, &projected_schema)?;
+                arrow_table.call_method0(py, "to_pandas")
+            })
+        })
     }
 
     fn __aiter__<'py>(slf: PyRef<'py, Self>) -> PyResult<Bound<'py, PyAny>> {
@@ -2312,14 +2343,11 @@ impl LogScanner {
         let gen_fn = ASYNC_GEN_FN.get_or_init(py, || {
             let code = pyo3::ffi::c_str!(
                 r#"
-async def _async_scan_generic(scanner, method_name):
-    # Dynamically resolve the polling method (e.g., _async_poll or _async_poll_batches)
+async def _async_scan_generic(scanner, method_name, timeout_ms):
     poll_method = getattr(scanner, method_name)
     while True:
-        items = await poll_method()
-        if items:
-            for item in items:
-                yield item
+        for item in await poll_method(timeout_ms):
+            yield item
 "#
             );
             let globals = pyo3::types::PyDict::new(py);
@@ -2331,106 +2359,16 @@ async def _async_scan_generic(scanner, method_name):
                 .unbind()
         });
 
-        // Determine which internal method to call based on the scanner kind
         let method_name = match slf.kind.as_ref() {
-            ScannerKind::Record(_) => "_async_poll",
-            ScannerKind::Batch(_) => "_async_poll_batches",
+            ScannerKind::Record(_) => "poll",
+            ScannerKind::Batch(_) => "poll_record_batch",
         };
 
-        // Instantiate the generator with the scanner instance and the target method name
-        gen_fn
-            .bind(py)
-            .call1((slf.into_bound_py_any(py)?, method_name))
-    }
-
-    /// Perform a single bounded poll and return a list of ScanRecord objects.
-    ///
-    /// This is the async building block used by `__aiter__` (record mode) to
-    /// implement `async for`. Each call does exactly one network poll (bounded
-    /// by `DEFAULT_POLL_INTERVAL_MS`), converts any results to Python ScanRecord objects,
-    /// and returns them as a list. An empty list signals a timeout (no data yet), not
-    /// end-of-stream.
-    ///
-    /// Returns:
-    ///     Awaitable that resolves to a list of ScanRecord objects
-    fn _async_poll<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        let timeout = Duration::from_millis(DEFAULT_POLL_INTERVAL_MS as u64);
-
-        let scanner = Arc::clone(&self.kind);
-        let projected_row_type = self.projected_row_type.clone();
-
-        future_into_py(py, async move {
-            let core_scanner = match scanner.as_ref() {
-                ScannerKind::Record(s) => s,
-                ScannerKind::Batch(_) => {
-                    return Err(PyTypeError::new_err(
-                        "This internal method only supports record-based scanners. \
-                         For batch-based scanners, use 'async for' or 'poll_record_batch' instead.",
-                    ));
-                }
-            };
-
-            let scan_records = core_scanner
-                .poll(timeout)
-                .await
-                .map_err(|e| FlussError::from_core_error(&e))?;
-
-            // Convert to Python list
-            Python::attach(|py| {
-                let mut result: Vec<Py<ScanRecord>> = Vec::new();
-                for (_, records) in scan_records.into_records_by_buckets() {
-                    for core_record in records {
-                        let scan_record =
-                            ScanRecord::from_core(py, &core_record, &projected_row_type)?;
-                        result.push(Py::new(py, scan_record)?);
-                    }
-                }
-                Ok(result)
-            })
-        })
-    }
-
-    /// Perform a single bounded poll and return a list of RecordBatch objects.
-    ///
-    /// This is the async building block used by `__aiter__` (batch mode) to
-    /// implement `async for`. Each call does exactly one network poll (bounded
-    /// by `DEFAULT_POLL_INTERVAL_MS`), converts any results to Python RecordBatch objects,
-    /// and returns them as a list. An empty list signals a timeout (no data
-    /// yet), not end-of-stream.
-    ///
-    /// Returns:
-    ///     Awaitable that resolves to a list of RecordBatch objects
-    fn _async_poll_batches<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
-        let timeout = Duration::from_millis(DEFAULT_POLL_INTERVAL_MS as u64);
-
-        let scanner = Arc::clone(&self.kind);
-
-        future_into_py(py, async move {
-            let core_scanner = match scanner.as_ref() {
-                ScannerKind::Batch(s) => s,
-                ScannerKind::Record(_) => {
-                    return Err(PyTypeError::new_err(
-                        "This internal method only supports batch-based scanners. \
-                         For record-based scanners, use 'async for' or 'poll' instead.",
-                    ));
-                }
-            };
-
-            let scan_batches = core_scanner
-                .poll(timeout)
-                .await
-                .map_err(|e| FlussError::from_core_error(&e))?;
-
-            // Convert to Python list of RecordBatch objects
-            Python::attach(|py| {
-                let mut result: Vec<Py<RecordBatch>> = Vec::new();
-                for scan_batch in scan_batches {
-                    let rb = RecordBatch::from_scan_batch(scan_batch);
-                    result.push(Py::new(py, rb)?);
-                }
-                Ok(result)
-            })
-        })
+        gen_fn.bind(py).call1((
+            slf.into_bound_py_any(py)?,
+            method_name,
+            DEFAULT_POLL_INTERVAL_MS,
+        ))
     }
 
     fn __repr__(&self) -> String {
@@ -2444,7 +2382,7 @@ impl LogScanner {
         admin: Arc<fcore::client::FlussAdmin>,
         table_info: fcore::metadata::TableInfo,
         projected_schema: SchemaRef,
-        projected_row_type: fcore::metadata::RowType,
+        projected_row_type: Arc<fcore::metadata::RowType>,
     ) -> Self {
         Self {
             kind: Arc::new(scanner),
@@ -2452,73 +2390,52 @@ impl LogScanner {
             table_info,
             projected_schema,
             projected_row_type,
-            partition_name_cache: std::sync::RwLock::new(None),
+            partition_name_cache: Arc::new(std::sync::RwLock::new(None)),
         }
     }
 
-    /// Get partition_id -> partition_name mapping, using cache if available
-    fn get_partition_name_map(
-        &self,
-        py: Python,
-        table_path: &fcore::metadata::TablePath,
-    ) -> PyResult<HashMap<i64, String>> {
-        // Check cache first (read lock)
-        {
-            let cache = self.partition_name_cache.read().unwrap();
-            if let Some(map) = cache.as_ref() {
-                return Ok(map.clone());
-            }
-        }
-
-        // Fetch partition infos (releases GIL during async call)
-        let partition_infos: Vec<fcore::metadata::PartitionInfo> = py
-            .detach(|| {
-                TOKIO_RUNTIME.block_on(async { self.admin.list_partition_infos(table_path).await })
-            })
-            .map_err(|e| FlussError::from_core_error(&e))?;
-
-        // Build and cache the mapping
-        let map: HashMap<i64, String> = partition_infos
-            .into_iter()
-            .map(|info| (info.get_partition_id(), info.get_partition_name()))
-            .collect();
-
-        // Store in cache (write lock)
-        {
-            let mut cache = self.partition_name_cache.write().unwrap();
-            *cache = Some(map.clone());
+    /// Convert Arrow record batches to a PyArrow Table (or empty table if no batches).
+    fn batches_to_arrow_table(
+        py: Python<'_>,
+        batches: Vec<Arc<ArrowRecordBatch>>,
+        projected_schema: &SchemaRef,
+    ) -> PyResult<Py<PyAny>> {
+        if batches.is_empty() {
+            let py_schema = projected_schema
+                .as_ref()
+                .to_pyarrow(py)
+                .map_err(|e| FlussError::new_err(format!("Failed to convert schema: {e}")))?;
+            let pyarrow = py.import("pyarrow")?;
+            let empty_table = pyarrow
+                .getattr("Table")?
+                .call_method1("from_batches", (vec![] as Vec<Py<PyAny>>, py_schema))?;
+            Ok(empty_table.into())
+        } else {
+            Utils::combine_batches_to_table(py, batches)
         }
-
-        Ok(map)
     }
 
-    /// Query latest offsets for subscribed buckets (handles both partitioned and non-partitioned)
-    fn query_latest_offsets(
-        &self,
-        py: Python,
+    /// Query stopping offsets and poll until all subscribed buckets are fully read.
+    /// Returns collected Arrow record batches.
+    async fn collect_all_batches(
+        scanner: &fcore::client::RecordBatchLogScanner,
+        admin: &fcore::client::FlussAdmin,
+        table_info: &fcore::metadata::TableInfo,
         subscribed: &[(fcore::metadata::TableBucket, i64)],
-    ) -> PyResult<HashMap<fcore::metadata::TableBucket, i64>> {
-        let scanner = self.kind.as_batch()?;
+        partition_name_cache: &std::sync::RwLock<Option<HashMap<i64, String>>>,
+    ) -> PyResult<Vec<Arc<ArrowRecordBatch>>> {
         let is_partitioned = scanner.is_partitioned();
-        let table_path = &self.table_info.table_path;
+        let table_path = &table_info.table_path;
+        let table_id = table_info.table_id;
 
-        if !is_partitioned {
-            // Non-partitioned: simple case - just query all bucket IDs
+        // 1. Query latest offsets
+        let mut stopping_offsets: HashMap<fcore::metadata::TableBucket, i64> = if !is_partitioned {
             let bucket_ids: Vec<i32> = subscribed.iter().map(|(tb, _)| tb.bucket_id()).collect();
-
-            let offsets: HashMap<i32, i64> = py
-                .detach(|| {
-                    TOKIO_RUNTIME.block_on(async {
-                        self.admin
-                            .list_offsets(table_path, &bucket_ids, OffsetSpec::Latest)
-                            .await
-                    })
-                })
+            let offsets = admin
+                .list_offsets(table_path, &bucket_ids, OffsetSpec::Latest)
+                .await
                 .map_err(|e| FlussError::from_core_error(&e))?;
-
-            // Convert to TableBucket-keyed map
-            let table_id = self.table_info.table_id;
-            Ok(offsets
+            offsets
                 .into_iter()
                 .filter(|(_, offset)| *offset > 0)
                 .map(|(bucket_id, offset)| {
@@ -2527,88 +2444,69 @@ impl LogScanner {
                         offset,
                     )
                 })
-                .collect())
+                .collect()
         } else {
-            // Partitioned: need to query per partition
-            self.query_partitioned_offsets(py, subscribed)
-        }
-    }
+            let cached = partition_name_cache.read().unwrap().clone();
+            let partition_id_to_name = match cached {
+                Some(map) => map,
+                None => {
+                    let infos = admin
+                        .list_partition_infos(table_path)
+                        .await
+                        .map_err(|e| FlussError::from_core_error(&e))?;
+                    let map: HashMap<i64, String> = infos
+                        .into_iter()
+                        .map(|info| (info.get_partition_id(), info.get_partition_name()))
+                        .collect();
+                    *partition_name_cache.write().unwrap() = Some(map.clone());
+                    map
+                }
+            };
 
-    /// Query offsets for partitioned table subscriptions
-    fn query_partitioned_offsets(
-        &self,
-        py: Python,
-        subscribed: &[(fcore::metadata::TableBucket, i64)],
-    ) -> PyResult<HashMap<fcore::metadata::TableBucket, i64>> {
-        let table_path = &self.table_info.table_path;
-
-        // Get partition_id -> partition_name mapping (cached)
-        let partition_id_to_name = self.get_partition_name_map(py, table_path)?;
-
-        // Group subscribed buckets by partition_id
-        let mut by_partition: HashMap<i64, Vec<i32>> = HashMap::new();
-        for (tb, _) in subscribed {
-            if let Some(partition_id) = tb.partition_id() {
-                by_partition
-                    .entry(partition_id)
-                    .or_default()
-                    .push(tb.bucket_id());
+            let mut by_partition: HashMap<i64, Vec<i32>> = HashMap::new();
+            for (tb, _) in subscribed {
+                if let Some(partition_id) = tb.partition_id() {
+                    by_partition
+                        .entry(partition_id)
+                        .or_default()
+                        .push(tb.bucket_id());
+                }
             }
-        }
 
-        // Query offsets for each partition
-        let mut result: HashMap<fcore::metadata::TableBucket, i64> = HashMap::new();
-        let table_id = self.table_info.table_id;
-
-        for (partition_id, bucket_ids) in by_partition {
-            let partition_name = partition_id_to_name.get(&partition_id).ok_or_else(|| {
-                FlussError::new_err(format!("Unknown partition_id: {partition_id}"))
-            })?;
-
-            let offsets: HashMap<i32, i64> = py
-                .detach(|| {
-                    TOKIO_RUNTIME.block_on(async {
-                        self.admin
-                            .list_partition_offsets(
-                                table_path,
-                                partition_name,
-                                &bucket_ids,
-                                OffsetSpec::Latest,
-                            )
-                            .await
-                    })
-                })
-                .map_err(|e| FlussError::from_core_error(&e))?;
-
-            for (bucket_id, offset) in offsets {
-                if offset > 0 {
-                    let tb = fcore::metadata::TableBucket::new_with_partition(
-                        table_id,
-                        Some(partition_id),
-                        bucket_id,
-                    );
-                    result.insert(tb, offset);
+            let mut result = HashMap::new();
+            for (partition_id, bucket_ids) in by_partition {
+                let partition_name = partition_id_to_name.get(&partition_id).ok_or_else(|| {
+                    FlussError::new_err(format!("Unknown partition_id: {partition_id}"))
+                })?;
+                let offsets = admin
+                    .list_partition_offsets(
+                        table_path,
+                        partition_name,
+                        &bucket_ids,
+                        OffsetSpec::Latest,
+                    )
+                    .await
+                    .map_err(|e| FlussError::from_core_error(&e))?;
+                for (bucket_id, offset) in offsets {
+                    if offset > 0 {
+                        let tb = fcore::metadata::TableBucket::new_with_partition(
+                            table_id,
+                            Some(partition_id),
+                            bucket_id,
+                        );
+                        result.insert(tb, offset);
+                    }
                 }
             }
-        }
-
-        Ok(result)
-    }
+            result
+        };
 
-    /// Poll until all buckets reach their stopping offsets
-    fn poll_until_offsets(
-        &self,
-        py: Python,
-        mut stopping_offsets: HashMap<fcore::metadata::TableBucket, i64>,
-    ) -> PyResult<Py<PyAny>> {
-        let scanner = self.kind.as_batch()?;
+        // 2. Poll until all buckets reach their stopping offsets
         let mut all_batches = Vec::new();
-
         while !stopping_offsets.is_empty() {
-            let scan_batches = py
-                .detach(|| {
-                    TOKIO_RUNTIME.block_on(async { scanner.poll(Duration::from_millis(500)).await })
-                })
+            let scan_batches = scanner
+                .poll(Duration::from_millis(500))
+                .await
                 .map_err(|e| FlussError::from_core_error(&e))?;
 
             if scan_batches.is_empty() {
@@ -2617,8 +2515,6 @@ impl LogScanner {
 
             for scan_batch in scan_batches {
                 let table_bucket = scan_batch.bucket().clone();
-
-                // Check if this bucket is still being tracked
                 let Some(&stop_at) = stopping_offsets.get(&table_bucket) else {
                     continue;
                 };
@@ -2626,14 +2522,12 @@ impl LogScanner {
                 let base_offset = scan_batch.base_offset();
                 let last_offset = scan_batch.last_offset();
 
-                // If the batch starts at or after the stop_at offset, the bucket is exhausted
                 if base_offset >= stop_at {
                     stopping_offsets.remove(&table_bucket);
                     continue;
                 }
 
                 let batch = if last_offset >= stop_at {
-                    // Slice batch to keep only records where offset < stop_at
                     let num_to_keep = (stop_at - base_offset) as usize;
                     let b = scan_batch.into_batch();
                     let limit = num_to_keep.min(b.num_rows());
@@ -2644,14 +2538,13 @@ impl LogScanner {
 
                 all_batches.push(Arc::new(batch));
 
-                // Check if we're done with this bucket
                 if last_offset >= stop_at - 1 {
                     stopping_offsets.remove(&table_bucket);
                 }
             }
         }
 
-        Utils::combine_batches_to_table(py, all_batches)
+        Ok(all_batches)
     }
 }
 
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
index 00119b76a3..52773c9e86 100644
--- a/fluss-rust/bindings/python/test/conftest.py
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -124,16 +124,12 @@ def fluss_cluster():
     yield (plaintext_addr, sasl_addr or plaintext_addr)
 
 
-_cached_connection = None
-
-
-@pytest_asyncio.fixture
+@pytest_asyncio.fixture(scope="session")
 async def connection(fluss_cluster):
-    global _cached_connection
-    if _cached_connection is None:
-        plaintext_addr, _sasl_addr = fluss_cluster
-        _cached_connection = await _connect(plaintext_addr)
-    yield _cached_connection
+    plaintext_addr, _sasl_addr = fluss_cluster
+    conn = await _connect(plaintext_addr)
+    yield conn
+    conn.close()
 
 
 @pytest.fixture(scope="session")
@@ -148,7 +144,7 @@ def plaintext_bootstrap_servers(fluss_cluster):
     return plaintext_addr
 
 
-@pytest_asyncio.fixture
+@pytest_asyncio.fixture(scope="session")
 async def admin(connection):
     return connection.get_admin()
 
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
index 86e9a707c9..2f560bcf2c 100644
--- a/fluss-rust/bindings/python/test/test_log_table.py
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -64,7 +64,7 @@ async def test_append_and_scan(connection, admin):
     num_buckets = (await admin.get_table_info(table_path)).num_buckets
     scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
-    records = _poll_records(scanner, expected_count=6)
+    records = await _poll_records(scanner, expected_count=6)
 
     assert len(records) == 6, f"Expected 6 records, got {len(records)}"
 
@@ -107,7 +107,7 @@ async def test_append_dict_rows(connection, admin):
     num_buckets = (await admin.get_table_info(table_path)).num_buckets
     scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
-    records = _poll_records(scanner, expected_count=3)
+    records = await _poll_records(scanner, expected_count=3)
     assert len(records) == 3
 
     rows = sorted([r.row for r in records], key=lambda r: r["id"])
@@ -238,7 +238,7 @@ async def test_project(connection, admin):
     scanner = await scan.create_log_scanner()
     scanner.subscribe_buckets({0: 0})
 
-    records = _poll_records(scanner, expected_count=3)
+    records = await _poll_records(scanner, expected_count=3)
     assert len(records) == 3
 
     records.sort(key=lambda r: r.row["col_c"])
@@ -254,7 +254,7 @@ async def test_project(connection, admin):
     scanner2 = await table.new_scan().project([1, 0]).create_log_scanner()
     scanner2.subscribe_buckets({0: 0})
 
-    records2 = _poll_records(scanner2, expected_count=3)
+    records2 = await _poll_records(scanner2, expected_count=3)
     assert len(records2) == 3
 
     records2.sort(key=lambda r: r.row["col_a"])
@@ -284,7 +284,7 @@ async def test_poll_batches(connection, admin, wait_for_table_ready):
     scanner.subscribe(bucket_id=0, start_offset=0)
 
     # Empty table should return empty result
-    result = scanner.poll_arrow(500)
+    result = await scanner.poll_arrow(500)
     assert result.num_rows == 0
 
     writer = table.new_append().create_writer()
@@ -310,7 +310,7 @@ async def test_poll_batches(connection, admin, wait_for_table_ready):
     await writer.flush()
 
     # Poll until we get all 6 records
-    all_ids = _poll_arrow_ids(scanner, expected_count=6)
+    all_ids = await _poll_arrow_ids(scanner, expected_count=6)
     assert all_ids == [1, 2, 3, 4, 5, 6]
 
     # Append more and verify offset continuation (no duplicates)
@@ -322,14 +322,14 @@ async def test_poll_batches(connection, admin, wait_for_table_ready):
     )
     await writer.flush()
 
-    new_ids = _poll_arrow_ids(scanner, expected_count=2)
+    new_ids = await _poll_arrow_ids(scanner, expected_count=2)
     assert new_ids == [7, 8]
 
     # Subscribe from mid-offset should truncate (skip earlier records)
     trunc_scanner = await table.new_scan().create_record_batch_log_scanner()
     trunc_scanner.subscribe(bucket_id=0, start_offset=3)
 
-    trunc_ids = _poll_arrow_ids(trunc_scanner, expected_count=5)
+    trunc_ids = await _poll_arrow_ids(trunc_scanner, expected_count=5)
     assert trunc_ids == [4, 5, 6, 7, 8]
 
     # Projection with batch scanner
@@ -339,7 +339,7 @@ async def test_poll_batches(connection, admin, wait_for_table_ready):
         .create_record_batch_log_scanner()
     )
     proj_scanner.subscribe(bucket_id=0, start_offset=0)
-    batches = proj_scanner.poll_record_batch(10000)
+    batches = await proj_scanner.poll_record_batch(10000)
     assert len(batches) > 0
     assert batches[0].batch.num_columns == 1
 
@@ -374,14 +374,14 @@ async def test_to_arrow_and_to_pandas(connection, admin):
     # to_arrow()
     scanner = await table.new_scan().create_record_batch_log_scanner()
     scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
-    arrow_table = scanner.to_arrow()
+    arrow_table = await scanner.to_arrow()
     assert arrow_table.num_rows == 3
     assert arrow_table.schema.names == ["id", "name"]
 
     # to_pandas()
     scanner2 = await table.new_scan().create_record_batch_log_scanner()
     scanner2.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
-    df = scanner2.to_pandas()
+    df = await scanner2.to_pandas()
     assert len(df) == 3
     assert list(df.columns) == ["id", "name"]
 
@@ -497,7 +497,7 @@ async def test_partitioned_table_append_scan(connection, admin, wait_for_table_r
     all_records = []
     deadline = time.monotonic() + 10
     while len(all_records) < 8 and time.monotonic() < deadline:
-        scan_records = scanner.poll(5000)
+        scan_records = await scanner.poll(5000)
         for bucket, bucket_records in scan_records.items():
             assert bucket.partition_id is not None, "Partitioned table should have partition_id"
             # All records in a bucket should belong to the same partition
@@ -522,7 +522,7 @@ async def test_partitioned_table_append_scan(connection, admin, wait_for_table_r
         unsub_scanner.subscribe_partition(p.partition_id, 0, 0)
     unsub_scanner.unsubscribe_partition(eu_partition_id, 0)
 
-    remaining = _poll_records(unsub_scanner, expected_count=4, timeout_s=5)
+    remaining = await _poll_records(unsub_scanner, expected_count=4, timeout_s=5)
     assert len(remaining) == 4
     assert all(r.row["region"] == "US" for r in remaining)
 
@@ -533,7 +533,7 @@ async def test_partitioned_table_append_scan(connection, admin, wait_for_table_r
     }
     batch_scanner.subscribe_partition_buckets(partition_bucket_offsets)
 
-    batch_records = _poll_records(batch_scanner, expected_count=8)
+    batch_records = await _poll_records(batch_scanner, expected_count=8)
     assert len(batch_records) == 8
     batch_collected = sorted(
         [(r.row["id"], r.row["region"], r.row["value"]) for r in batch_records],
@@ -573,7 +573,7 @@ async def test_write_arrow(connection, admin):
     scanner = await table.new_scan().create_record_batch_log_scanner()
     scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
-    result = scanner.to_arrow()
+    result = await scanner.to_arrow()
     assert result.num_rows == 5
 
     ids = sorted(result.column("id").to_pylist())
@@ -613,7 +613,7 @@ async def test_write_pandas(connection, admin):
     scanner = await table.new_scan().create_record_batch_log_scanner()
     scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
-    result = scanner.to_pandas()
+    result = await scanner.to_pandas()
     assert len(result) == 3
 
     result_sorted = result.sort_values("id").reset_index(drop=True)
@@ -657,7 +657,7 @@ async def test_partitioned_table_to_arrow(connection, admin, wait_for_table_read
     for p in partition_infos:
         scanner.subscribe_partition(p.partition_id, 0, fluss.EARLIEST_OFFSET)
 
-    arrow_table = scanner.to_arrow()
+    arrow_table = await scanner.to_arrow()
     assert arrow_table.num_rows == 2
 
     await admin.drop_table(table_path, ignore_if_not_exists=False)
@@ -692,7 +692,7 @@ async def test_scan_records_indexing_and_slicing(connection, admin):
     sr = None
     deadline = time.monotonic() + 10
     while time.monotonic() < deadline:
-        sr = scanner.poll(5000)
+        sr = await scanner.poll(5000)
         if len(sr) >= 2:
             break
     assert sr is not None and len(sr) >= 2, "Expected at least 2 records"
@@ -831,7 +831,7 @@ async def consume_and_break():
     # records in one batch. After break, the un-yielded records from that
     # batch are lost. So sync poll may return 0 records — the key assertion
     # is that poll() completes without deadlock (returns within timeout).
-    remaining = scanner.poll(2000)
+    remaining = await scanner.poll(2000)
     assert remaining is not None, "poll() should return (not deadlock)"
 
     # If we got records, verify no duplicates
@@ -1037,7 +1037,7 @@ async def consume_and_break():
     assert first_batch.batch.num_rows > 0
 
     # Phase 2: sync poll_record_batch() must still work — proves no leak
-    remaining = batch_scanner.poll_record_batch(2000)
+    remaining = await batch_scanner.poll_record_batch(2000)
     assert remaining is not None, "poll_record_batch() should return (not deadlock)"
 
     await admin.drop_table(table_path, ignore_if_not_exists=False)
@@ -1107,22 +1107,22 @@ async def consume_all():
 # ---------------------------------------------------------------------------
 
 
-def _poll_records(scanner, expected_count, timeout_s=10):
+async def _poll_records(scanner, expected_count, timeout_s=10):
     """Poll a record-based scanner until expected_count records are collected."""
     collected = []
     deadline = time.monotonic() + timeout_s
     while len(collected) < expected_count and time.monotonic() < deadline:
-        records = scanner.poll(5000)
+        records = await scanner.poll(5000)
         collected.extend(records)
     return collected
 
 
-def _poll_arrow_ids(scanner, expected_count, timeout_s=10):
+async def _poll_arrow_ids(scanner, expected_count, timeout_s=10):
     """Poll a batch scanner and extract 'id' column values."""
     all_ids = []
     deadline = time.monotonic() + timeout_s
     while len(all_ids) < expected_count and time.monotonic() < deadline:
-        arrow_table = scanner.poll_arrow(5000)
+        arrow_table = await scanner.poll_arrow(5000)
         if arrow_table.num_rows > 0:
             all_ids.extend(arrow_table.column("id").to_pylist())
     return all_ids
@@ -1173,7 +1173,7 @@ async def test_append_and_scan_with_array(connection, admin):
     # Verify via LogScanner (record-by-record)
     scanner = await table.new_scan().create_log_scanner()
     scanner.subscribe_buckets({0: fluss.EARLIEST_OFFSET})
-    records = _poll_records(scanner, expected_count=6)
+    records = await _poll_records(scanner, expected_count=6)
 
     assert len(records) == 6
     records.sort(key=lambda r: r.row["id"])
@@ -1197,7 +1197,7 @@ async def test_append_and_scan_with_array(connection, admin):
     # Verify via to_arrow (batch-based)
     scanner2 = await table.new_scan().create_record_batch_log_scanner()
     scanner2.subscribe_buckets({0: fluss.EARLIEST_OFFSET})
-    result_table = scanner2.to_arrow()
+    result_table = await scanner2.to_arrow()
 
     assert result_table.num_rows == 6
     assert result_table.column("tags").to_pylist() == [
@@ -1251,7 +1251,7 @@ async def test_append_rows_with_array(connection, admin):
     num_buckets = (await admin.get_table_info(table_path)).num_buckets
     scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
-    records = _poll_records(scanner, expected_count=3)
+    records = await _poll_records(scanner, expected_count=3)
     assert len(records) == 3
 
     rows = sorted([r.row for r in records], key=lambda r: r["id"])
@@ -1293,7 +1293,7 @@ async def test_append_rows_with_nested_array(connection, admin):
     num_buckets = (await admin.get_table_info(table_path)).num_buckets
     scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
-    records = _poll_records(scanner, expected_count=5)
+    records = await _poll_records(scanner, expected_count=5)
     assert len(records) == 5
 
     rows = sorted([r.row for r in records], key=lambda r: r["id"])
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index 73b9a8fe7c..317aee74e4 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -161,11 +161,11 @@ Builder for creating a `Lookuper`. Obtain via `FlussTable.new_lookup()`.
 | `.subscribe_partition_buckets(partition_bucket_offsets)`      | Subscribe to multiple partition+bucket combos (`{(part_id, bucket_id): offset}`) |
 | `.unsubscribe(bucket_id)`                                     | Unsubscribe from a bucket (non-partitioned tables)                               |
 | `.unsubscribe_partition(partition_id, bucket_id)`             | Unsubscribe from a partition bucket                                              |
-| `.poll(timeout_ms) -> ScanRecords`                            | Poll individual records (record scanner only)                                    |
-| `.poll_arrow(timeout_ms) -> pa.Table`                         | Poll as Arrow Table (batch scanner only)                                         |
-| `.poll_record_batch(timeout_ms) -> list[RecordBatch]`         | Poll batches with metadata (batch scanner only)                                  |
-| `.to_arrow() -> pa.Table`                                     | Read all subscribed data as Arrow Table (batch scanner only)                     |
-| `.to_pandas() -> pd.DataFrame`                                | Read all subscribed data as DataFrame (batch scanner only)                       |
+| `await .poll(timeout_ms) -> ScanRecords`                      | Poll individual records (record scanner only)                                    |
+| `await .poll_arrow(timeout_ms) -> pa.Table`                   | Poll as Arrow Table (batch scanner only)                                         |
+| `await .poll_record_batch(timeout_ms) -> list[RecordBatch]`   | Poll batches with metadata (batch scanner only)                                  |
+| `await .to_arrow() -> pa.Table`                               | Read all subscribed data as Arrow Table (batch scanner only)                     |
+| `await .to_pandas() -> pd.DataFrame`                          | Read all subscribed data as DataFrame (batch scanner only)                       |
 
 ## `ScanRecords`
 
@@ -174,7 +174,7 @@ Returned by `LogScanner.poll()`. Records are grouped by bucket.
 > **Note:** Flat iteration and integer indexing traverse buckets in an arbitrary order that is consistent within a single `ScanRecords` instance but may differ between `poll()` calls. Use per-bucket access (`.items()`, `.records(bucket)`) when bucket ordering matters.
 
 ```python
-scan_records = scanner.poll(timeout_ms=5000)
+scan_records = await scanner.poll(timeout_ms=5000)
 
 # Sequence access
 scan_records[0]                              # first record
diff --git a/fluss-rust/website/docs/user-guide/python/data-types.md b/fluss-rust/website/docs/user-guide/python/data-types.md
index c0acb4c7ea..df8165f0f6 100644
--- a/fluss-rust/website/docs/user-guide/python/data-types.md
+++ b/fluss-rust/website/docs/user-guide/python/data-types.md
@@ -55,7 +55,7 @@ handle = writer.append(row)
 ## Reading Data
 
 ```python
-records = scanner.poll(timeout_ms=1000)
+records = await scanner.poll(timeout_ms=1000)
 for record in records:
     row = record.row  # dict[str, Any]
     print(row["user_id"])     # int
diff --git a/fluss-rust/website/docs/user-guide/python/example/index.md b/fluss-rust/website/docs/user-guide/python/example/index.md
index 21768a1d06..ecbdc84685 100644
--- a/fluss-rust/website/docs/user-guide/python/example/index.md
+++ b/fluss-rust/website/docs/user-guide/python/example/index.md
@@ -36,7 +36,7 @@ async def main():
     num_buckets = (await admin.get_table_info(table_path)).num_buckets
     scanner = await table.new_scan().create_record_batch_log_scanner()
     scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
-    print(scanner.to_pandas())
+    print(await scanner.to_pandas())
 
     # Cleanup
     await admin.drop_table(table_path, ignore_if_not_exists=True)
diff --git a/fluss-rust/website/docs/user-guide/python/example/log-tables.md b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
index c320bf4813..4dbe256781 100644
--- a/fluss-rust/website/docs/user-guide/python/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/python/example/log-tables.md
@@ -65,8 +65,8 @@ scanner = await table.new_scan().create_record_batch_log_scanner()
 scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
 # Reads everything up to current latest offset, then returns
-arrow_table = scanner.to_arrow()
-df = scanner.to_pandas()
+arrow_table = await scanner.to_arrow()
+df = await scanner.to_pandas()
 ```
 
 ### Continuous Polling
@@ -79,7 +79,7 @@ scanner = await table.new_scan().create_record_batch_log_scanner()
 scanner.subscribe(bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
 
 while True:
-    result = scanner.poll_arrow(timeout_ms=5000)
+    result = await scanner.poll_arrow(timeout_ms=5000)
     if result.num_rows > 0:
         print(result.to_pandas())
 
@@ -88,7 +88,7 @@ scanner = await table.new_scan().create_log_scanner()
 scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
 
 while True:
-    scan_records = scanner.poll(timeout_ms=5000)
+    scan_records = await scanner.poll(timeout_ms=5000)
 
     for record in scan_records:
         print(f"offset={record.offset}, change={record.change_type.short_string()}, row={record.row}")
diff --git a/fluss-rust/website/docs/user-guide/python/example/partitioned-tables.md b/fluss-rust/website/docs/user-guide/python/example/partitioned-tables.md
index f82809201b..894bb519db 100644
--- a/fluss-rust/website/docs/user-guide/python/example/partitioned-tables.md
+++ b/fluss-rust/website/docs/user-guide/python/example/partitioned-tables.md
@@ -59,7 +59,7 @@ scanner.subscribe_partition_buckets({
     (p.partition_id, 0): fluss.EARLIEST_OFFSET for p in partition_infos
 })
 
-print(scanner.to_pandas())
+print(await scanner.to_pandas())
 ```
 
 ### Unsubscribing

From cb367e83dba2772a4b306a996246a073429684fa Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 3 May 2026 14:14:22 +0100
Subject: [PATCH 254/287] chore: fix context_manager in python for async
 handling (#527)

---
 fluss-rust/bindings/python/test/test_context_manager.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/fluss-rust/bindings/python/test/test_context_manager.py b/fluss-rust/bindings/python/test/test_context_manager.py
index f0dcc36f0f..5dcb5a4c31 100644
--- a/fluss-rust/bindings/python/test/test_context_manager.py
+++ b/fluss-rust/bindings/python/test/test_context_manager.py
@@ -20,12 +20,12 @@
 import time
 import fluss
 
-def _poll_records(scanner, expected_count, timeout_s=10):
+async def _poll_records(scanner, expected_count, timeout_s=10):
     """Poll a record-based scanner until expected_count records are collected."""
     collected = []
     deadline = time.monotonic() + timeout_s
     while len(collected) < expected_count and time.monotonic() < deadline:
-        records = scanner.poll(5000)
+        records = await scanner.poll(5000)
         collected.extend(records)
     return collected
 
@@ -56,7 +56,7 @@ async def test_append_writer_success_flush(connection, admin):
     # After context exit, data should be flushed
     scanner = await table.new_scan().create_log_scanner()
     scanner.subscribe(0, fluss.EARLIEST_OFFSET)
-    records = _poll_records(scanner, expected_count=2)
+    records = await _poll_records(scanner, expected_count=2)
     assert len(records) == 2
     assert sorted([r.row["a"] for r in records]) == [1, 2]
 
@@ -80,7 +80,7 @@ async def test_connection_drain_on_close(plaintext_bootstrap_servers, admin):
         table2 = await conn2.get_table(table_path)
         scanner = await table2.new_scan().create_log_scanner()
         scanner.subscribe(0, fluss.EARLIEST_OFFSET)
-        records = _poll_records(scanner, expected_count=1)
+        records = await _poll_records(scanner, expected_count=1)
         assert len(records) == 1
         assert records[0].row["a"] == 123
 

From 024aebb41197ba54483932a9473370e643f88330 Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sun, 3 May 2026 15:29:35 +0200
Subject: [PATCH 255/287] feat: Add nullability support in python (#522)

---
 fluss-rust/bindings/python/src/metadata.rs    |  2 +-
 fluss-rust/bindings/python/src/utils.rs       | 34 +++++++++-----
 .../bindings/python/test/test_schema.py       | 47 +++++++++++++++++++
 .../docs/user-guide/python/api-reference.md   |  6 +--
 .../docs/user-guide/python/data-types.md      | 25 ++++++++++
 5 files changed, 99 insertions(+), 15 deletions(-)

diff --git a/fluss-rust/bindings/python/src/metadata.rs b/fluss-rust/bindings/python/src/metadata.rs
index 02ef121dda..7b6129a489 100644
--- a/fluss-rust/bindings/python/src/metadata.rs
+++ b/fluss-rust/bindings/python/src/metadata.rs
@@ -165,7 +165,7 @@ impl Schema {
         let mut builder = fcore::metadata::Schema::builder();
 
         for field in arrow_schema.fields() {
-            let fluss_data_type = crate::utils::Utils::arrow_type_to_fluss_type(field.data_type())?;
+            let fluss_data_type = crate::utils::Utils::arrow_field_to_fluss_type(field)?;
             builder = builder.column(field.name(), fluss_data_type);
 
             if let Some(comment) = field.metadata().get("comment") {
diff --git a/fluss-rust/bindings/python/src/utils.rs b/fluss-rust/bindings/python/src/utils.rs
index 76b95f7a9f..5efcf5e799 100644
--- a/fluss-rust/bindings/python/src/utils.rs
+++ b/fluss-rust/bindings/python/src/utils.rs
@@ -36,14 +36,14 @@ impl Utils {
         })
     }
 
-    /// Convert Arrow DataType to Fluss DataType
-    pub fn arrow_type_to_fluss_type(
-        arrow_type: &arrow::datatypes::DataType,
+    /// Convert an Arrow Field to a Fluss DataType, preserving nullability.
+    pub fn arrow_field_to_fluss_type(
+        field: &arrow::datatypes::Field,
     ) -> PyResult<fcore::metadata::DataType> {
         use arrow::datatypes::DataType as ArrowDataType;
         use fcore::metadata::DataTypes;
 
-        let fluss_type = match arrow_type {
+        let fluss_type = match field.data_type() {
             ArrowDataType::Boolean => DataTypes::boolean(),
             ArrowDataType::Int8 => DataTypes::tinyint(),
             ArrowDataType::Int16 => DataTypes::smallint(),
@@ -95,23 +95,29 @@ impl Utils {
             ArrowDataType::Decimal128(precision, scale) => {
                 DataTypes::decimal(*precision as u32, *scale as u32)
             }
-            ArrowDataType::List(field) => {
-                let element_type = Utils::arrow_type_to_fluss_type(field.data_type())?;
+            ArrowDataType::List(element_field) => {
+                let element_type = Utils::arrow_field_to_fluss_type(element_field)?;
                 DataTypes::array(element_type)
             }
-            _ => {
+            other => {
                 return Err(FlussError::new_err(format!(
-                    "Unsupported Arrow data type: {arrow_type:?}"
+                    "Unsupported Arrow data type: {other:?}"
                 )));
             }
         };
 
-        Ok(fluss_type)
+        if field.is_nullable() {
+            Ok(fluss_type)
+        } else {
+            Ok(fluss_type.as_non_nullable())
+        }
     }
 
-    /// Convert Fluss DataType to string representation
+    /// Convert Fluss DataType to string representation, appending " NOT NULL"
+    /// for non-nullable types (matches Java's `withNullability` and Rust core's
+    /// `Display` impl).
     pub fn datatype_to_string(data_type: &fcore::metadata::DataType) -> String {
-        match data_type {
+        let type_str = match data_type {
             fcore::metadata::DataType::Boolean(_) => "boolean".to_string(),
             fcore::metadata::DataType::TinyInt(_) => "tinyint".to_string(),
             fcore::metadata::DataType::SmallInt(_) => "smallint".to_string(),
@@ -171,6 +177,12 @@ impl Utils {
                     .collect();
                 format!("row<{}>", fields.join(", "))
             }
+        };
+
+        if data_type.is_nullable() {
+            type_str
+        } else {
+            format!("{type_str} NOT NULL")
         }
     }
 
diff --git a/fluss-rust/bindings/python/test/test_schema.py b/fluss-rust/bindings/python/test/test_schema.py
index ab2d1ab447..dfd9cf5619 100644
--- a/fluss-rust/bindings/python/test/test_schema.py
+++ b/fluss-rust/bindings/python/test/test_schema.py
@@ -48,3 +48,50 @@ def test_schema_with_array():
     assert schema.get_column_types() == ["int", "array<string>"]
 
 
+def test_nullable_fields():
+    fields = pa.schema(
+        [
+            pa.field("id", pa.int32(), nullable=False),
+            pa.field("name", pa.string()),
+        ]
+    )
+    schema = fluss.Schema(fields)
+    assert schema.get_column_types() == ["int NOT NULL", "string"]
+    assert schema.get_columns() == [("id", "int NOT NULL"), ("name", "string")]
+
+
+def test_pk_forces_non_nullable():
+    fields = pa.schema(
+        [
+            pa.field("id", pa.int32()),
+            pa.field("name", pa.string()),
+        ]
+    )
+    schema = fluss.Schema(fields, primary_keys=["id"])
+    types = schema.get_column_types()
+    assert types[0] == "int NOT NULL"
+    assert types[1] == "string"
+
+
+def test_nested_list_nullability():
+    fields = pa.schema(
+        [
+            pa.field(
+                "tags",
+                pa.list_(pa.field("item", pa.string(), nullable=False)),
+            ),
+            pa.field("ids", pa.list_(pa.int32()), nullable=False),
+            pa.field(
+                "strict_ids",
+                pa.list_(pa.field("item", pa.int32(), nullable=False)),
+                nullable=False,
+            ),
+        ]
+    )
+    schema = fluss.Schema(fields)
+    types = schema.get_column_types()
+    assert types[0] == "array<string NOT NULL>"
+    assert types[1] == "array<int> NOT NULL"
+    assert types[2] == "array<int NOT NULL> NOT NULL"
+
+
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index 317aee74e4..32f23a59f7 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -242,10 +242,10 @@ for record in scan_records:
 
 | Method                                         |  Description               |
 |------------------------------------------------|----------------------------|
-| `Schema(schema: pa.Schema, primary_keys=None)` | Create from PyArrow schema |
+| `Schema(schema: pa.Schema, primary_keys=None)` | Create from PyArrow schema. Field nullability (`pa.field(..., nullable=False)`) is preserved. |
 | `.get_column_names() -> list[str]`             | Get column names           |
-| `.get_column_types() -> list[str]`             | Get column type names      |
-| `.get_columns() -> list[tuple[str, str]]`      | Get `(name, type)` pairs   |
+| `.get_column_types() -> list[str]`             | Get column type names. Non-nullable types include a `" NOT NULL"` suffix (e.g., `"int NOT NULL"`). |
+| `.get_columns() -> list[tuple[str, str]]`      | Get `(name, type)` pairs. Type strings follow the same nullability formatting as `.get_column_types()`. |
 | `.get_primary_keys() -> list[str]`             | Get primary key columns    |
 
 ## `TableDescriptor`
diff --git a/fluss-rust/website/docs/user-guide/python/data-types.md b/fluss-rust/website/docs/user-guide/python/data-types.md
index df8165f0f6..996770388e 100644
--- a/fluss-rust/website/docs/user-guide/python/data-types.md
+++ b/fluss-rust/website/docs/user-guide/python/data-types.md
@@ -21,6 +21,31 @@ The Python client uses PyArrow types for schema definitions:
 
 All Python native types (`date`, `time`, `datetime`, `Decimal`) work when appending rows via dicts.
 
+## Nullability
+
+PyArrow field nullability is preserved when constructing Fluss schemas. By default, fields are nullable. Use `nullable=False` on `pa.field()` to create a `NOT NULL` column:
+
+```python
+schema = pa.schema([
+    pa.field("id", pa.int32(), nullable=False),
+    pa.field("name", pa.string()),          # nullable by default
+])
+fluss_schema = fluss.Schema(schema)
+fluss_schema.get_column_types()  # ["int NOT NULL", "string"]
+```
+
+Primary key columns are automatically forced `NOT NULL` regardless of the PyArrow field setting.
+
+For nested types, element nullability is also preserved:
+
+```python
+schema = pa.schema([
+    pa.field("tags", pa.list_(pa.field("item", pa.string(), nullable=False))),
+])
+fluss_schema = fluss.Schema(schema)
+fluss_schema.get_column_types()  # ["array<string NOT NULL>"]
+```
+
 ## Writing Data
 
 Rows can be dicts, lists, or tuples:

From 01c9a221c24b03651c3b6ea549a5720cc78b9b2f Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 3 May 2026 15:25:10 +0100
Subject: [PATCH 256/287] [rust] lookup decoding schema id (#517)

---
 fluss-rust/bindings/python/src/lookup.rs      |   2 +-
 fluss-rust/crates/fluss/src/client/admin.rs   |  27 +-
 fluss-rust/crates/fluss/src/client/mod.rs     |   2 +
 .../crates/fluss/src/client/schema_getter.rs  |  76 ++++
 .../crates/fluss/src/client/table/lookup.rs   | 413 +++++++++++++-----
 .../crates/fluss/src/client/table/mod.rs      |  15 +-
 .../crates/fluss/src/metadata/datatype.rs     | 157 +++++++
 .../crates/fluss/src/metadata/json_serde.rs   | 102 +++++
 fluss-rust/crates/fluss/src/metadata/mod.rs   |   2 +
 .../crates/fluss/src/metadata/schema_util.rs  | 204 +++++++++
 fluss-rust/crates/fluss/src/metadata/table.rs |  81 +++-
 .../crates/fluss/src/proto/fluss_api.proto    |  12 +
 .../src/record/kv/kv_record_read_context.rs   |   2 +-
 .../crates/fluss/src/record/kv/test_util.rs   |   2 +-
 .../fluss/src/row/fixed_schema_decoder.rs     | 196 +++++++++
 fluss-rust/crates/fluss/src/row/lookup_row.rs | 122 ++++++
 fluss-rust/crates/fluss/src/row/mod.rs        |   6 +
 .../crates/fluss/src/row/projected_row.rs     | 276 ++++++++++++
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |   4 +
 .../fluss/src/rpc/message/get_table_schema.rs |  57 +++
 .../crates/fluss/src/rpc/message/mod.rs       |   2 +
 .../docs/user-guide/rust/api-reference.md     |  26 +-
 22 files changed, 1666 insertions(+), 120 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/schema_getter.rs
 create mode 100644 fluss-rust/crates/fluss/src/metadata/schema_util.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/fixed_schema_decoder.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/lookup_row.rs
 create mode 100644 fluss-rust/crates/fluss/src/row/projected_row.rs
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/get_table_schema.rs

diff --git a/fluss-rust/bindings/python/src/lookup.rs b/fluss-rust/bindings/python/src/lookup.rs
index 09465263b5..f7bd09a505 100644
--- a/fluss-rust/bindings/python/src/lookup.rs
+++ b/fluss-rust/bindings/python/src/lookup.rs
@@ -74,7 +74,7 @@ impl Lookuper {
 
             // Convert to Python with GIL
             Python::attach(|py| match row_opt {
-                Some(compacted_row) => internal_row_to_dict(py, &compacted_row, &table_info),
+                Some(row) => internal_row_to_dict(py, &row, &table_info),
                 None => Ok(py.None()),
             })
         })
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 7f1f64efca..0828b83bfe 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -19,13 +19,13 @@ use crate::client::metadata::Metadata;
 use crate::cluster::ServerNode;
 use crate::metadata::{
     DatabaseDescriptor, DatabaseInfo, JsonSerde, LakeSnapshot, PartitionInfo, PartitionSpec,
-    PhysicalTablePath, TableBucket, TableDescriptor, TableInfo, TablePath,
+    PhysicalTablePath, Schema, SchemaInfo, TableBucket, TableDescriptor, TableInfo, TablePath,
 };
 use crate::rpc::message::{
     CreateDatabaseRequest, CreatePartitionRequest, CreateTableRequest, DatabaseExistsRequest,
     DropDatabaseRequest, DropPartitionRequest, DropTableRequest, GetDatabaseInfoRequest,
-    GetLatestLakeSnapshotRequest, GetTableRequest, ListDatabasesRequest, ListPartitionInfosRequest,
-    ListTablesRequest, TableExistsRequest,
+    GetLatestLakeSnapshotRequest, GetTableRequest, GetTableSchemaRequestMsg, ListDatabasesRequest,
+    ListPartitionInfosRequest, ListTablesRequest, TableExistsRequest,
 };
 use crate::rpc::message::{ListOffsetsRequest, OffsetSpec};
 use crate::rpc::{RpcClient, ServerConnection};
@@ -111,6 +111,27 @@ impl FlussAdmin {
         Ok(())
     }
 
+    /// Fetches the schema of `table_path` for `schema_id` (`None` requests the latest) and
+    /// returns it with the id the server reported; errors on RPC or JSON decoding failure.
+    pub async fn get_table_schema(
+        &self,
+        table_path: &TablePath,
+        schema_id: Option<i32>,
+    ) -> Result<SchemaInfo> {
+        let response = self
+            .admin_gateway()
+            .await?
+            .request(GetTableSchemaRequestMsg::new(table_path, schema_id))
+            .await?;
+
+        let schema_node: serde_json::Value = serde_json::from_slice(&response.schema_json)
+            .map_err(|e| Error::JsonSerdeError {
+                message: format!("Failed to parse schema_json: {e}"),
+            })?;
+        let schema = Schema::deserialize_json(&schema_node)?;
+        Ok(SchemaInfo::new(schema, response.schema_id))
+    }
+
     pub async fn get_table_info(&self, table_path: &TablePath) -> Result<TableInfo> {
         let response = self
             .admin_gateway()
diff --git a/fluss-rust/crates/fluss/src/client/mod.rs b/fluss-rust/crates/fluss/src/client/mod.rs
index 77c30203bc..f8027948ae 100644
--- a/fluss-rust/crates/fluss/src/client/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/mod.rs
@@ -20,6 +20,7 @@ mod connection;
 mod credentials;
 pub mod lookup;
 mod metadata;
+mod schema_getter;
 mod table;
 mod write;
 
@@ -28,5 +29,6 @@ pub use connection::*;
 pub use credentials::*;
 pub use lookup::LookupClient;
 pub use metadata::*;
+pub(crate) use schema_getter::ClientSchemaGetter;
 pub use table::*;
 pub use write::*;
diff --git a/fluss-rust/crates/fluss/src/client/schema_getter.rs b/fluss-rust/crates/fluss/src/client/schema_getter.rs
new file mode 100644
index 0000000000..4b643c0bec
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/schema_getter.rs
@@ -0,0 +1,76 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Per-table schema cache that lazily fetches missing schema versions
+//! from the coordinator. Used by the lookup path to decode rows that
+//! predate the table's current schema.
+
+use crate::client::admin::FlussAdmin;
+use crate::error::{Error, Result};
+use crate::metadata::{Schema, SchemaInfo, TablePath};
+use parking_lot::RwLock;
+use std::collections::HashMap;
+use std::sync::Arc;
+
+pub(crate) struct ClientSchemaGetter {
+    table_path: TablePath,
+    admin: Arc<FlussAdmin>,
+    /// Schemas keyed by schema id. Pre-seeded with the schema passed to `new` so the
+    /// dominant case (every row written under the latest schema) needs zero RPCs.
+    cache: RwLock<HashMap<i32, Arc<Schema>>>,
+}
+
+impl ClientSchemaGetter {
+    pub fn new(table_path: TablePath, admin: Arc<FlussAdmin>, latest: SchemaInfo) -> Self {
+        let mut map = HashMap::new();
+        let (schema, schema_id) = latest.into_parts();
+        map.insert(schema_id, Arc::new(schema));
+        Self {
+            table_path,
+            admin,
+            cache: RwLock::new(map),
+        }
+    }
+
+    /// Returns the schema for `schema_id`: served from the cache when present, otherwise
+    /// fetched through `admin` and cached. Errors if the fetch fails or the reply carries a
+    /// different schema id. Concurrent misses for one id are not deduplicated (one redundant
+    /// RPC, no `tokio::sync`); schemas are immutable per id, so last-write-wins is correct.
+    pub async fn get_schema(&self, schema_id: i32) -> Result<Arc<Schema>> {
+        if let Some(schema) = self.cache.read().get(&schema_id).cloned() {
+            return Ok(schema);
+        }
+
+        let info = self
+            .admin
+            .get_table_schema(&self.table_path, Some(schema_id))
+            .await?;
+        let (schema, fetched_id) = info.into_parts();
+        if fetched_id != schema_id {
+            return Err(Error::UnexpectedError {
+                message: format!(
+                    "Requested schema id {schema_id}, but server returned schema id {fetched_id}"
+                ),
+                source: None,
+            });
+        }
+        let schema = Arc::new(schema);
+
+        self.cache.write().insert(schema_id, Arc::clone(&schema));
+        Ok(schema)
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/lookup.rs b/fluss-rust/crates/fluss/src/client/table/lookup.rs
index 2adb53e4c6..51a0a0714d 100644
--- a/fluss-rust/crates/fluss/src/client/table/lookup.rs
+++ b/fluss-rust/crates/fluss/src/client/table/lookup.rs
@@ -16,73 +16,126 @@
 // under the License.
 
 use crate::bucketing::BucketingFunction;
+use crate::client::ClientSchemaGetter;
 use crate::client::lookup::LookupClient;
 use crate::client::metadata::Metadata;
 use crate::client::table::partition_getter::PartitionGetter;
 use crate::error::{Error, Result};
-use crate::metadata::{PhysicalTablePath, RowType, TableBucket, TableInfo, TablePath};
+use crate::metadata::{
+    KvFormat, PhysicalTablePath, RowType, Schema, TableBucket, TableInfo, TablePath,
+};
 use crate::record::RowAppendRecordBatchBuilder;
 use crate::record::kv::SCHEMA_ID_LENGTH;
-use crate::row::InternalRow;
-use crate::row::compacted::CompactedRow;
 use crate::row::encode::{KeyEncoder, KeyEncoderFactory};
+use crate::row::{FixedSchemaDecoder, InternalRow, LookupRow};
 use arrow::array::RecordBatch;
+use byteorder::{ByteOrder, LittleEndian};
+use futures::future::try_join_all;
+use parking_lot::RwLock;
+use std::collections::HashMap;
 use std::sync::Arc;
 
-/// The result of a lookup operation.
-///
-/// Contains the rows returned from a lookup. For primary-key lookups,
-/// this will contain at most one row. For prefix-key lookups, it may
-/// contain multiple rows.
+/// Per-Lookuper decoder cache keyed by schema id. The target-schema decoder is
+/// held directly so the dominant decode path takes no lock; decoders for older
+/// schemas live in `others` and are populated lazily on first observation.
+struct DecoderCache {
+    target_id: i16,
+    target_decoder: Arc<FixedSchemaDecoder>,
+    others: RwLock<HashMap<i16, Arc<FixedSchemaDecoder>>>,
+}
+
+impl DecoderCache {
+    fn new(target_id: i16, target_decoder: Arc<FixedSchemaDecoder>) -> Self {
+        Self {
+            target_id,
+            target_decoder,
+            others: RwLock::new(HashMap::new()),
+        }
+    }
+
+    fn decode<'a>(&self, schema_id: i16, bytes: &'a [u8]) -> Result<LookupRow<'a>> {
+        if schema_id == self.target_id {
+            return self.target_decoder.decode(bytes);
+        }
+        let decoder =
+            self.others
+                .read()
+                .get(&schema_id)
+                .cloned()
+                .ok_or_else(|| Error::RowConvertError {
+                    message: format!("No decoder available for schema id {schema_id}"),
+                })?;
+        decoder.decode(bytes)
+    }
+
+    fn contains(&self, schema_id: i16) -> bool {
+        schema_id == self.target_id || self.others.read().contains_key(&schema_id)
+    }
+
+    fn insert(&self, schema_id: i16, decoder: Arc<FixedSchemaDecoder>) {
+        self.others.write().insert(schema_id, decoder);
+    }
+
+    #[cfg(test)]
+    fn get(&self, schema_id: i16) -> Option<Arc<FixedSchemaDecoder>> {
+        if schema_id == self.target_id {
+            return Some(Arc::clone(&self.target_decoder));
+        }
+        self.others.read().get(&schema_id).cloned()
+    }
+}
+
+/// Rows returned from a lookup. Primary-key lookups produce at most one
+/// row; prefix-key lookups may produce many. Rows written under older
+/// schemas are decoded with their original schema and projected to the
+/// schema captured when the `Lookuper` was created — schema evolutions
+/// that land after that point are not picked up by an existing
+/// `Lookuper`; create a new one to see them.
 pub struct LookupResult {
     rows: Vec<Vec<u8>>,
-    row_type: Arc<RowType>,
+    target_row_type: Arc<RowType>,
+    decoders: Arc<DecoderCache>,
 }
 
 impl LookupResult {
-    /// Creates a new LookupResult from a list of row bytes.
-    fn new(rows: Vec<Vec<u8>>, row_type: Arc<RowType>) -> Self {
-        Self { rows, row_type }
-    }
-
-    /// Creates an empty LookupResult.
-    fn empty(row_type: Arc<RowType>) -> Self {
+    fn new(rows: Vec<Vec<u8>>, target_row_type: Arc<RowType>, decoders: Arc<DecoderCache>) -> Self {
         Self {
-            rows: Vec::new(),
-            row_type,
+            rows,
+            target_row_type,
+            decoders,
         }
     }
 
-    /// Extracts the row payload by stripping the schema id prefix.
-    fn extract_payload(bytes: &[u8]) -> Result<&[u8]> {
-        bytes
-            .get(SCHEMA_ID_LENGTH..)
-            .ok_or_else(|| Error::RowConvertError {
+    fn read_schema_id(bytes: &[u8]) -> Result<i16> {
+        if bytes.len() < SCHEMA_ID_LENGTH {
+            return Err(Error::RowConvertError {
                 message: format!(
                     "Row payload too short: {} bytes, need at least {} for schema id",
                     bytes.len(),
                     SCHEMA_ID_LENGTH
                 ),
-            })
+            });
+        }
+        let schema_id = LittleEndian::read_i16(&bytes[..SCHEMA_ID_LENGTH]);
+        if schema_id < 0 {
+            return Err(Error::RowConvertError {
+                message: format!("Invalid negative schema id {schema_id}; row prefix is corrupt"),
+            });
+        }
+        Ok(schema_id)
     }
 
-    /// Returns the only row in the result set as a [`CompactedRow`].
-    ///
-    /// This method provides a zero-copy view of the row data, which means the returned
-    /// `CompactedRow` borrows from this result set and cannot outlive it.
-    ///
-    /// # Returns
-    /// - `Ok(Some(row))`: If exactly one row exists.
-    /// - `Ok(None)`: If the result set is empty.
-    /// - `Err(Error::UnexpectedError)`: If the result set contains more than one row.
-    /// - `Err(Error)`: If the row payload is too short to contain a schema id.
-    pub fn get_single_row(&self) -> Result<Option<CompactedRow<'_>>> {
+    fn decode<'a>(&self, bytes: &'a [u8]) -> Result<LookupRow<'a>> {
+        let schema_id = Self::read_schema_id(bytes)?;
+        self.decoders.decode(schema_id, bytes)
+    }
+
+    /// Returns the single row when exactly one is present, `None` for
+    /// empty, or an error if the result holds more than one row.
+    pub fn get_single_row(&self) -> Result<Option<LookupRow<'_>>> {
         match self.rows.len() {
             0 => Ok(None),
-            1 => {
-                let payload = Self::extract_payload(&self.rows[0])?;
-                Ok(Some(CompactedRow::from_bytes(&self.row_type, payload)))
-            }
+            1 => Ok(Some(self.decode(&self.rows[0])?)),
             _ => Err(Error::UnexpectedError {
                 message: "LookupResult contains multiple rows, use get_rows() instead".to_string(),
                 source: None,
@@ -90,44 +143,105 @@ impl LookupResult {
         }
     }
 
-    /// Returns all rows in the result set as [`CompactedRow`]s.
-    ///
-    /// # Returns
-    /// - `Ok(rows)` - All rows in the result set.
-    /// - `Err(Error)` - If any row payload is too short to contain a schema id.
-    pub fn get_rows(&self) -> Result<Vec<CompactedRow<'_>>> {
-        self.rows
-            .iter()
-            // TODO Add schema id check and fetch when implementing prefix lookup
-            .map(|bytes| {
-                let payload = Self::extract_payload(bytes)?;
-                Ok(CompactedRow::from_bytes(&self.row_type, payload))
-            })
-            .collect()
+    pub fn get_rows(&self) -> Result<Vec<LookupRow<'_>>> {
+        self.rows.iter().map(|bytes| self.decode(bytes)).collect()
     }
 
-    /// Converts all rows in this result into an Arrow [`RecordBatch`].
-    ///
-    /// This is useful for integration with DataFusion or other Arrow-based tools.
-    ///
-    /// # Returns
-    /// - `Ok(RecordBatch)` - All rows in columnar Arrow format. Returns an empty
-    ///   batch (with the correct schema) if the result set is empty.
-    /// - `Err(Error)` - If the conversion fails.
     pub fn to_record_batch(&self) -> Result<RecordBatch> {
-        let mut builder = RowAppendRecordBatchBuilder::new(&self.row_type)?;
-
+        let mut builder = RowAppendRecordBatchBuilder::new(&self.target_row_type)?;
         for bytes in &self.rows {
-            let payload = Self::extract_payload(bytes)?;
-
-            let row = CompactedRow::from_bytes(&self.row_type, payload);
+            let row = self.decode(bytes)?;
             builder.append(&row)?;
         }
-
         builder.build_arrow_record_batch().map(Arc::unwrap_or_clone)
     }
 }
 
+struct LookupSchemaCtx {
+    target_schema: Arc<Schema>,
+    target_row_type: Arc<RowType>,
+    kv_format: KvFormat,
+    schema_getter: Arc<ClientSchemaGetter>,
+    decoders: Arc<DecoderCache>,
+}
+
+impl LookupSchemaCtx {
+    fn new(table_info: &TableInfo, schema_getter: Arc<ClientSchemaGetter>) -> Result<Self> {
+        let target_schema_i32 = table_info.get_schema_id(); // i32 here; rows carry it as an i16 prefix
+        if !(0..=i16::MAX as i32).contains(&target_schema_i32) {
+            return Err(Error::UnexpectedError {
+                message: format!(
+                    "Schema id {target_schema_i32} does not fit in 16 bits — wire format violated"
+                ),
+                source: None,
+            });
+        }
+        let target_schema = Arc::new(table_info.get_schema().clone());
+        let target_row_type = Arc::new(table_info.row_type().clone());
+        let kv_format = table_info.get_table_config().get_kv_format()?;
+        let target_decoder = Arc::new(FixedSchemaDecoder::new_no_projection(
+            kv_format,
+            target_schema.as_ref(),
+        )?);
+        let decoders = Arc::new(DecoderCache::new(target_schema_i32 as i16, target_decoder));
+        Ok(Self {
+            target_schema,
+            target_row_type,
+            kv_format,
+            schema_getter,
+            decoders,
+        })
+    }
+
+    async fn ensure_decoders(&self, rows: &[Vec<u8>]) -> Result<()> {
+        let mut missing: Vec<i16> = Vec::new(); // distinct schema ids with no cached decoder
+        for bytes in rows {
+            let schema_id = LookupResult::read_schema_id(bytes)?;
+            if !self.decoders.contains(schema_id) && !missing.contains(&schema_id) {
+                missing.push(schema_id);
+            }
+        }
+        if missing.is_empty() {
+            return Ok(());
+        }
+
+        let fetches = missing.into_iter().map(|schema_id| {
+            let cache = Arc::clone(&self.decoders);
+            let schema_getter = Arc::clone(&self.schema_getter);
+            let target_schema = Arc::clone(&self.target_schema);
+            let kv_format = self.kv_format;
+            async move {
+                let source = schema_getter.get_schema(schema_id as i32).await?;
+                let decoder =
+                    FixedSchemaDecoder::new(kv_format, source.as_ref(), target_schema.as_ref())?;
+                cache.insert(schema_id, Arc::new(decoder));
+                Ok::<_, Error>(())
+            }
+        });
+        try_join_all(fetches).await?; // run the fetches concurrently; fail on the first error
+        Ok(())
+    }
+
+    async fn build_result(&self, rows: Vec<Vec<u8>>) -> Result<LookupResult> {
+        if !rows.is_empty() {
+            self.ensure_decoders(&rows).await?;
+        }
+        Ok(LookupResult::new(
+            rows,
+            Arc::clone(&self.target_row_type),
+            Arc::clone(&self.decoders),
+        ))
+    }
+
+    fn empty_result(&self) -> LookupResult {
+        LookupResult::new(
+            Vec::new(),
+            Arc::clone(&self.target_row_type),
+            Arc::clone(&self.decoders),
+        )
+    }
+}
+
 /// Builder for lookup operations. `create_lookuper()` builds a primary-key
 /// `Lookuper`; `lookup_by(columns).create_lookuper()` builds a
 /// `PrefixKeyLookuper` for prefix scans.
@@ -136,6 +250,7 @@ pub struct TableLookup {
     lookup_client: Arc<LookupClient>,
     table_info: TableInfo,
     metadata: Arc<Metadata>,
+    schema_getter: Arc<ClientSchemaGetter>,
 }
 
 impl TableLookup {
@@ -143,11 +258,13 @@ impl TableLookup {
         lookup_client: Arc<LookupClient>,
         table_info: TableInfo,
         metadata: Arc<Metadata>,
+        schema_getter: Arc<ClientSchemaGetter>,
     ) -> Self {
         Self {
             lookup_client,
             table_info,
             metadata,
+            schema_getter,
         }
     }
 
@@ -161,6 +278,7 @@ impl TableLookup {
             lookup_client: self.lookup_client,
             table_info: self.table_info,
             metadata: self.metadata,
+            schema_getter: self.schema_getter,
             lookup_column_names,
         }
     }
@@ -208,11 +326,10 @@ impl TableLookup {
             None
         };
 
-        let row_type = Arc::new(self.table_info.row_type().clone());
+        let schema_ctx = LookupSchemaCtx::new(&self.table_info, self.schema_getter)?;
 
         Ok(Lookuper {
             table_path: Arc::new(self.table_info.table_path.clone()),
-            row_type,
             table_info: self.table_info,
             metadata: self.metadata,
             lookup_client: self.lookup_client,
@@ -221,6 +338,7 @@ impl TableLookup {
             bucket_key_encoder,
             partition_getter,
             num_buckets,
+            schema_ctx,
         })
     }
 }
@@ -239,7 +357,6 @@ impl TableLookup {
 pub struct Lookuper {
     table_path: Arc<TablePath>,
     table_info: TableInfo,
-    row_type: Arc<RowType>,
     metadata: Arc<Metadata>,
     lookup_client: Arc<LookupClient>,
     bucketing_function: Box<dyn BucketingFunction>,
@@ -247,6 +364,7 @@ pub struct Lookuper {
     bucket_key_encoder: Option<Box<dyn KeyEncoder>>,
     partition_getter: Option<PartitionGetter>,
     num_buckets: i32,
+    schema_ctx: LookupSchemaCtx,
 }
 
 impl Lookuper {
@@ -281,7 +399,7 @@ impl Lookuper {
                 .await?
             {
                 Some(id) => Some(id),
-                None => return Ok(LookupResult::empty(Arc::clone(&self.row_type))),
+                None => return Ok(self.schema_ctx.empty_result()),
             }
         } else {
             None
@@ -300,13 +418,11 @@ impl Lookuper {
             .lookup(self.table_path.as_ref().clone(), table_bucket, pk_bytes)
             .await?;
 
-        match result {
-            Some(value_bytes) => Ok(LookupResult::new(
-                vec![value_bytes],
-                Arc::clone(&self.row_type),
-            )),
-            None => Ok(LookupResult::empty(Arc::clone(&self.row_type))),
-        }
+        let rows = match result {
+            Some(value_bytes) => vec![value_bytes],
+            None => Vec::new(),
+        };
+        self.schema_ctx.build_result(rows).await
     }
 
     /// Returns a reference to the table info.
@@ -319,6 +435,7 @@ pub struct TablePrefixLookup {
     lookup_client: Arc<LookupClient>,
     table_info: TableInfo,
     metadata: Arc<Metadata>,
+    schema_getter: Arc<ClientSchemaGetter>,
     lookup_column_names: Vec<String>,
 }
 
@@ -346,11 +463,10 @@ impl TablePrefixLookup {
             None
         };
 
-        let full_row_type = Arc::new(self.table_info.row_type().clone());
+        let schema_ctx = LookupSchemaCtx::new(&self.table_info, self.schema_getter)?;
 
         Ok(PrefixKeyLookuper {
             table_path: Arc::new(self.table_info.table_path.clone()),
-            row_type: full_row_type,
             table_info: self.table_info,
             metadata: self.metadata,
             lookup_client: self.lookup_client,
@@ -358,6 +474,7 @@ impl TablePrefixLookup {
             prefix_key_encoder,
             partition_getter,
             num_buckets,
+            schema_ctx,
         })
     }
 }
@@ -454,13 +571,13 @@ fn validate_prefix_lookup(table_info: &TableInfo, lookup_columns: &[String]) ->
 pub struct PrefixKeyLookuper {
     table_path: Arc<TablePath>,
     table_info: TableInfo,
-    row_type: Arc<RowType>,
     metadata: Arc<Metadata>,
     lookup_client: Arc<LookupClient>,
     bucketing_function: Box<dyn BucketingFunction>,
     prefix_key_encoder: Box<dyn KeyEncoder>,
     partition_getter: Option<PartitionGetter>,
     num_buckets: i32,
+    schema_ctx: LookupSchemaCtx,
 }
 
 impl PrefixKeyLookuper {
@@ -479,7 +596,7 @@ impl PrefixKeyLookuper {
                 .await?
             {
                 Some(id) => Some(id),
-                None => return Ok(LookupResult::empty(Arc::clone(&self.row_type))),
+                None => return Ok(self.schema_ctx.empty_result()),
             }
         } else {
             None
@@ -497,7 +614,7 @@ impl PrefixKeyLookuper {
             .prefix_lookup(self.table_path.as_ref().clone(), table_bucket, prefix_bytes)
             .await?;
 
-        Ok(LookupResult::new(rows, Arc::clone(&self.row_type)))
+        self.schema_ctx.build_result(rows).await
     }
 
     pub fn table_info(&self) -> &TableInfo {
@@ -508,7 +625,7 @@ impl PrefixKeyLookuper {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::{DataField, DataTypes};
+    use crate::metadata::{Column, DataTypes, Schema};
     use crate::row::binary::BinaryWriter;
     use crate::row::compacted::CompactedRowWriter;
     use arrow::array::Int32Array;
@@ -520,34 +637,56 @@ mod tests {
         bytes
     }
 
+    fn schema_with_ids(columns: &[(i32, &str, crate::metadata::DataType)]) -> Schema {
+        let cols: Vec<Column> = columns
+            .iter()
+            .map(|(id, name, dt)| Column::new(*name, dt.clone()).with_id(*id))
+            .collect();
+        Schema::builder().with_columns(cols).build().unwrap()
+    }
+
+    fn cache_with(
+        target_id: i16,
+        target_decoder: FixedSchemaDecoder,
+        others: Vec<(i16, FixedSchemaDecoder)>,
+    ) -> Arc<DecoderCache> {
+        let cache = DecoderCache::new(target_id, Arc::new(target_decoder));
+        for (id, decoder) in others {
+            cache.insert(id, Arc::new(decoder));
+        }
+        Arc::new(cache)
+    }
+
+    fn lookup_result_from(
+        rows: Vec<Vec<u8>>,
+        target_schema: &Schema,
+        decoders: Arc<DecoderCache>,
+    ) -> LookupResult {
+        LookupResult::new(rows, Arc::new(target_schema.row_type().clone()), decoders)
+    }
+
     #[test]
     fn test_to_record_batch_empty() {
-        let row_type = Arc::new(RowType::new(vec![DataField::new(
-            "id",
-            DataTypes::int(),
-            None,
-        )]));
-        let result = LookupResult::empty(row_type);
+        let target = schema_with_ids(&[(0, "id", DataTypes::int())]);
+        let decoder = FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &target).unwrap();
+        let result = lookup_result_from(Vec::new(), &target, cache_with(0, decoder, vec![]));
         let batch = result.to_record_batch().unwrap();
         assert_eq!(batch.num_rows(), 0);
         assert_eq!(batch.num_columns(), 1);
     }
 
     #[test]
-    fn test_to_record_batch_with_row() {
-        let row_type = Arc::new(RowType::new(vec![DataField::new(
-            "id",
-            DataTypes::int(),
-            None,
-        )]));
+    fn test_to_record_batch_with_row_at_target_schema() {
+        let target = schema_with_ids(&[(0, "id", DataTypes::int())]);
 
         let mut writer = CompactedRowWriter::new(1);
         writer.write_int(42);
         let row_bytes = make_row_bytes(0, writer.buffer());
 
-        let result = LookupResult::new(vec![row_bytes], Arc::clone(&row_type));
-        let batch = result.to_record_batch().unwrap();
+        let decoder = FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &target).unwrap();
+        let result = lookup_result_from(vec![row_bytes], &target, cache_with(0, decoder, vec![]));
 
+        let batch = result.to_record_batch().unwrap();
         assert_eq!(batch.num_rows(), 1);
         let col = batch
             .column(0)
@@ -557,15 +696,79 @@ mod tests {
         assert_eq!(col.value(0), 42);
     }
 
+    #[test]
+    fn test_get_rows_decodes_per_row_schema_id_with_projection() {
+        let source = schema_with_ids(&[(0, "a", DataTypes::int())]);
+        let target = schema_with_ids(&[(0, "a", DataTypes::int()), (1, "b", DataTypes::string())]);
+
+        let mut w = CompactedRowWriter::new(1);
+        w.write_int(7);
+        let old_row = make_row_bytes(3, w.buffer());
+
+        let mut w = CompactedRowWriter::new(2);
+        w.write_int(8);
+        w.write_string("eight");
+        let new_row = make_row_bytes(7, w.buffer());
+
+        let target_decoder =
+            FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &target).unwrap();
+        let projection_decoder =
+            FixedSchemaDecoder::new(KvFormat::COMPACTED, &source, &target).unwrap();
+        let cache = cache_with(7, target_decoder, vec![(3, projection_decoder)]);
+        let result = lookup_result_from(vec![old_row, new_row], &target, cache);
+
+        let rows = result.get_rows().unwrap();
+        assert_eq!(rows.len(), 2);
+        assert_eq!(rows[0].get_int(0).unwrap(), 7);
+        assert!(rows[0].is_null_at(1).unwrap());
+        assert_eq!(rows[1].get_int(0).unwrap(), 8);
+        assert_eq!(rows[1].get_string(1).unwrap(), "eight");
+    }
+
     #[test]
     fn test_to_record_batch_payload_too_short() {
-        let row_type = Arc::new(RowType::new(vec![DataField::new(
-            "id",
-            DataTypes::int(),
-            None,
-        )]));
-        // Only 1 byte — shorter than SCHEMA_ID_LENGTH (2)
-        let result = LookupResult::new(vec![vec![0u8]], Arc::clone(&row_type));
+        let target = schema_with_ids(&[(0, "id", DataTypes::int())]);
+        let decoder = FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &target).unwrap();
+        let result = lookup_result_from(vec![vec![0u8]], &target, cache_with(0, decoder, vec![]));
         assert!(result.to_record_batch().is_err());
     }
+
+    #[test]
+    fn test_get_rows_errors_when_no_decoder_for_schema_id() {
+        let target = schema_with_ids(&[(0, "id", DataTypes::int())]);
+        let decoder = FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &target).unwrap();
+        let mut w = CompactedRowWriter::new(1);
+        w.write_int(1);
+        let row = make_row_bytes(99, w.buffer());
+        let result = lookup_result_from(vec![row], &target, cache_with(0, decoder, vec![]));
+
+        let err = result
+            .get_rows()
+            .map(|_| ())
+            .map_err(|e| e.to_string())
+            .unwrap_err();
+        assert!(err.contains("schema id 99"), "{err}");
+    }
+
+    #[test]
+    fn test_read_schema_id_rejects_negative() {
+        let bytes = [0xFFu8, 0xFFu8, 0u8];
+        let err = LookupResult::read_schema_id(&bytes).unwrap_err();
+        assert!(
+            err.to_string().contains("Invalid negative schema id"),
+            "{err}"
+        );
+    }
+
+    #[test]
+    fn test_decoder_cache_target_lookup_skips_lock() {
+        let target = schema_with_ids(&[(0, "a", DataTypes::int())]);
+        let target_decoder =
+            Arc::new(FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &target).unwrap());
+        let cache = DecoderCache::new(7, Arc::clone(&target_decoder));
+
+        let returned = cache.get(7).expect("target id must hit the cache");
+        assert!(Arc::ptr_eq(&returned, &target_decoder));
+        assert!(cache.get(99).is_none());
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 2d3d01712d..ba1edd2fb0 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -17,8 +17,9 @@
 
 use crate::client::connection::FlussConnection;
 use crate::client::metadata::Metadata;
+use crate::client::schema_getter::ClientSchemaGetter;
 use crate::error::{Error, Result};
-use crate::metadata::{TableInfo, TablePath};
+use crate::metadata::{SchemaInfo, TableInfo, TablePath};
 use std::sync::Arc;
 
 pub const EARLIEST_OFFSET: i64 = -2;
@@ -121,10 +122,22 @@ impl<'a> FlussTable<'a> {
             });
         }
         let lookup_client = self.conn.get_or_create_lookup_client()?;
+        // Pre-seed the schema getter with the table's current schema —
+        // rows written under it (the dominant case) never trigger an RPC.
+        let latest = SchemaInfo::new(
+            self.table_info.get_schema().clone(),
+            self.table_info.get_schema_id(),
+        );
+        let schema_getter = Arc::new(ClientSchemaGetter::new(
+            self.table_path.clone(),
+            self.conn.get_admin()?,
+            latest,
+        ));
         Ok(TableLookup::new(
             lookup_client,
             self.table_info.clone(),
             self.metadata.clone(),
+            schema_getter,
         ))
     }
 
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index d9eb56b503..4103aa3df0 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -93,6 +93,60 @@ impl DataType {
             DataType::Bytes(v) => DataType::Bytes(v.as_non_nullable()),
         }
     }
+
+    /// Structural equality that ignores the nullability flag at every nesting
+    /// level; type parameters and row field names must still match. Equivalent
+    /// to comparing `as_non_nullable()` on both sides, minus the recursive clone.
+    pub(crate) fn eq_ignore_nullable(&self, other: &DataType) -> bool {
+        match self {
+            DataType::Boolean(_) => matches!(other, DataType::Boolean(_)),
+            DataType::TinyInt(_) => matches!(other, DataType::TinyInt(_)),
+            DataType::SmallInt(_) => matches!(other, DataType::SmallInt(_)),
+            DataType::Int(_) => matches!(other, DataType::Int(_)),
+            DataType::BigInt(_) => matches!(other, DataType::BigInt(_)),
+            DataType::Float(_) => matches!(other, DataType::Float(_)),
+            DataType::Double(_) => matches!(other, DataType::Double(_)),
+            DataType::Date(_) => matches!(other, DataType::Date(_)),
+            DataType::String(_) => matches!(other, DataType::String(_)),
+            DataType::Bytes(_) => matches!(other, DataType::Bytes(_)),
+            DataType::Char(a) => {
+                matches!(other, DataType::Char(b) if a.length() == b.length())
+            }
+            DataType::Binary(a) => {
+                matches!(other, DataType::Binary(b) if a.length() == b.length())
+            }
+            DataType::Decimal(a) => matches!(
+                other,
+                DataType::Decimal(b) if a.precision() == b.precision() && a.scale() == b.scale()
+            ),
+            DataType::Time(a) => {
+                matches!(other, DataType::Time(b) if a.precision() == b.precision())
+            }
+            DataType::Timestamp(a) => {
+                matches!(other, DataType::Timestamp(b) if a.precision() == b.precision())
+            }
+            DataType::TimestampLTz(a) => {
+                matches!(other, DataType::TimestampLTz(b) if a.precision() == b.precision())
+            }
+            DataType::Array(a) => matches!(
+                other,
+                DataType::Array(b) if a.get_element_type().eq_ignore_nullable(b.get_element_type())
+            ),
+            DataType::Map(a) => matches!(
+                other,
+                DataType::Map(b)
+                    if a.key_type().eq_ignore_nullable(b.key_type())
+                        && a.value_type().eq_ignore_nullable(b.value_type())
+            ),
+            DataType::Row(a) => matches!(
+                other,
+                DataType::Row(b) if a.fields().len() == b.fields().len()
+                    && a.fields().iter().zip(b.fields().iter()).all(|(x, y)| {
+                        x.name() == y.name() && x.data_type().eq_ignore_nullable(y.data_type())
+                    })
+            ),
+        }
+    }
 }
 
 impl Display for DataType {
@@ -1695,3 +1749,106 @@ fn test_row_type_project_duplicate_indices() {
     assert_eq!(projected.fields()[1].name, "id");
     assert_eq!(projected.fields()[2].name, "name");
 }
+
+#[cfg(test)]
+mod eq_ignore_nullable_tests {
+    use super::*;
+
+    #[test]
+    fn ignores_nullability_at_top_level() {
+        let nullable = DataType::Int(IntType::new());
+        let non_nullable = DataType::Int(IntType::with_nullable(false));
+        assert_ne!(nullable, non_nullable, "PartialEq still distinguishes");
+        assert!(nullable.eq_ignore_nullable(&non_nullable));
+        assert!(non_nullable.eq_ignore_nullable(&nullable));
+    }
+
+    #[test]
+    fn rejects_different_kinds() {
+        assert!(
+            !DataType::Int(IntType::new()).eq_ignore_nullable(&DataType::BigInt(BigIntType::new()))
+        );
+    }
+
+    #[test]
+    fn compares_parameterized_types() {
+        // Char length must match.
+        assert!(
+            DataType::Char(CharType::with_nullable(10, true))
+                .eq_ignore_nullable(&DataType::Char(CharType::with_nullable(10, false)))
+        );
+        assert!(
+            !DataType::Char(CharType::with_nullable(10, true))
+                .eq_ignore_nullable(&DataType::Char(CharType::with_nullable(11, true)))
+        );
+
+        // Decimal precision + scale must match.
+        let a = DataType::Decimal(DecimalType::with_nullable(true, 10, 2).unwrap());
+        let b = DataType::Decimal(DecimalType::with_nullable(false, 10, 2).unwrap());
+        let c = DataType::Decimal(DecimalType::with_nullable(true, 10, 3).unwrap());
+        assert!(a.eq_ignore_nullable(&b));
+        assert!(!a.eq_ignore_nullable(&c));
+    }
+
+    #[test]
+    fn recurses_into_array_and_map() {
+        // Array<Int NULL> ~ Array<Int NOT NULL>
+        let a = DataType::Array(ArrayType::with_nullable(
+            true,
+            DataType::Int(IntType::new()),
+        ));
+        let b = DataType::Array(ArrayType::with_nullable(
+            false,
+            DataType::Int(IntType::with_nullable(false)),
+        ));
+        assert!(a.eq_ignore_nullable(&b));
+
+        // Map<String, Int> on both sides, mixed nullability.
+        let m1 = DataType::Map(MapType::with_nullable(
+            true,
+            DataType::String(StringType::new()),
+            DataType::Int(IntType::new()),
+        ));
+        let m2 = DataType::Map(MapType::with_nullable(
+            false,
+            DataType::String(StringType::with_nullable(false)),
+            DataType::Int(IntType::with_nullable(false)),
+        ));
+        assert!(m1.eq_ignore_nullable(&m2));
+
+        // Map element-type mismatch is still caught.
+        let m3 = DataType::Map(MapType::with_nullable(
+            true,
+            DataType::String(StringType::new()),
+            DataType::BigInt(BigIntType::new()),
+        ));
+        assert!(!m1.eq_ignore_nullable(&m3));
+    }
+
+    #[test]
+    fn recurses_into_row_fields() {
+        let r1 = DataType::Row(RowType::new(vec![
+            DataField::new("a", DataType::Int(IntType::new()), None),
+            DataField::new("b", DataType::String(StringType::new()), None),
+        ]));
+        let r2 = DataType::Row(RowType::with_nullable(
+            false,
+            vec![
+                DataField::new("a", DataType::Int(IntType::with_nullable(false)), None),
+                DataField::new(
+                    "b",
+                    DataType::String(StringType::with_nullable(false)),
+                    None,
+                ),
+            ],
+        ));
+        assert!(r1.eq_ignore_nullable(&r2));
+
+        // Field name mismatch must fail.
+        let r3 = DataType::Row(RowType::new(vec![
+            DataField::new("renamed_a", DataType::Int(IntType::new()), None),
+            DataField::new("b", DataType::String(StringType::new()), None),
+        ]));
+        assert!(!r1.eq_ignore_nullable(&r3));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/metadata/json_serde.rs b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
index 20f5d09757..efbce84d65 100644
--- a/fluss-rust/crates/fluss/src/metadata/json_serde.rs
+++ b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
@@ -377,6 +377,7 @@ impl Column {
     const NAME: &'static str = "name";
     const DATA_TYPE: &'static str = "data_type";
     const COMMENT: &'static str = "comment";
+    const ID: &'static str = "id";
 }
 
 impl JsonSerde for Column {
@@ -394,6 +395,9 @@ impl JsonSerde for Column {
             obj.insert(Self::COMMENT.to_string(), json!(comment));
         }
 
+        // The Java client requires `id` on input.
+        obj.insert(Self::ID.to_string(), json!(self.id()));
+
         Ok(Value::Object(obj))
     }
 
@@ -419,6 +423,15 @@ impl JsonSerde for Column {
             column = column.with_comment(comment);
         }
 
+        // Pre-id JSON is treated as unassigned; SchemaBuilder will
+        // auto-assign on build.
+        if let Some(id) = node.get(Self::ID).and_then(|v| v.as_i64()) {
+            let id = i32::try_from(id).map_err(|_| Error::JsonSerdeError {
+                message: format!("Column id {id} does not fit in i32"),
+            })?;
+            column = column.with_id(id);
+        }
+
         Ok(column)
     }
 }
@@ -671,6 +684,95 @@ mod tests {
     use super::*;
     use crate::metadata::DataTypes;
 
+    #[test]
+    fn column_id_round_trip_through_json() {
+        use crate::metadata::Column;
+
+        let col = Column::new("a", DataTypes::int())
+            .with_id(7)
+            .with_comment("desc");
+        let json = col.serialize_json().unwrap();
+        assert_eq!(json.get("id").and_then(|v| v.as_i64()), Some(7));
+        let round_tripped = Column::deserialize_json(&json).unwrap();
+        assert_eq!(round_tripped, col);
+    }
+
+    #[test]
+    fn schema_assigns_ids_when_absent_and_preserves_when_present() {
+        use crate::metadata::{Column, Schema};
+
+        let auto = Schema::builder()
+            .column("a", DataTypes::int())
+            .column("b", DataTypes::string())
+            .build()
+            .unwrap();
+        let ids: Vec<i32> = auto.columns().iter().map(|c| c.id()).collect();
+        assert_eq!(ids, vec![0, 1]);
+
+        let preserved = Schema::builder()
+            .with_columns(vec![
+                Column::new("a", DataTypes::int()).with_id(3),
+                Column::new("b", DataTypes::string()).with_id(7),
+            ])
+            .build()
+            .unwrap();
+        let ids: Vec<i32> = preserved.columns().iter().map(|c| c.id()).collect();
+        assert_eq!(ids, vec![3, 7]);
+    }
+
+    #[test]
+    fn schema_rejects_duplicate_ids() {
+        use crate::metadata::Column;
+        let err = Schema::builder()
+            .with_columns(vec![
+                Column::new("a", DataTypes::int()).with_id(7),
+                Column::new("b", DataTypes::string()).with_id(7),
+            ])
+            .build()
+            .unwrap_err();
+        assert!(err.to_string().contains("Duplicate column id 7"), "{err}");
+    }
+
+    #[test]
+    fn schema_rejects_negative_non_sentinel_ids() {
+        use crate::metadata::Column;
+        let err = Schema::builder()
+            .with_columns(vec![Column::new("a", DataTypes::int()).with_id(-7)])
+            .build()
+            .unwrap_err();
+        assert!(err.to_string().contains("invalid id -7"), "{err}");
+    }
+
+    #[test]
+    fn column_json_id_overflow_errors() {
+        use crate::metadata::Column;
+        let json = serde_json::json!({
+            "name": "a",
+            "data_type": Column::new("a", DataTypes::int()).serialize_json().unwrap()
+                .get("data_type").unwrap(),
+            "id": (i32::MAX as i64) + 1,
+        });
+        let err = Column::deserialize_json(&json).unwrap_err();
+        assert!(err.to_string().contains("does not fit in i32"), "{err}");
+    }
+
+    #[test]
+    fn schema_rejects_partially_assigned_ids() {
+        use crate::metadata::Column;
+
+        let err = Schema::builder()
+            .with_columns(vec![
+                Column::new("a", DataTypes::int()).with_id(0),
+                Column::new("b", DataTypes::string()),
+            ])
+            .build()
+            .unwrap_err();
+        assert!(
+            err.to_string().contains("All columns must have an id"),
+            "{err}"
+        );
+    }
+
     #[test]
     fn test_datatype_json_serde() {
         let data_types = vec![
diff --git a/fluss-rust/crates/fluss/src/metadata/mod.rs b/fluss-rust/crates/fluss/src/metadata/mod.rs
index 0ca654a6b1..c1d1b72c69 100644
--- a/fluss-rust/crates/fluss/src/metadata/mod.rs
+++ b/fluss-rust/crates/fluss/src/metadata/mod.rs
@@ -20,6 +20,7 @@ mod database;
 mod datatype;
 mod json_serde;
 mod partition;
+mod schema_util;
 mod table;
 
 pub use data_lake_format::*;
@@ -27,4 +28,5 @@ pub use database::*;
 pub use datatype::*;
 pub use json_serde::*;
 pub use partition::*;
+pub(crate) use schema_util::{UNEXIST_MAPPING, index_mapping};
 pub use table::*;
diff --git a/fluss-rust/crates/fluss/src/metadata/schema_util.rs b/fluss-rust/crates/fluss/src/metadata/schema_util.rs
new file mode 100644
index 0000000000..498a526eae
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/metadata/schema_util.rs
@@ -0,0 +1,204 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::error::{Error, Result};
+use crate::metadata::{Schema, UNKNOWN_COLUMN_ID};
+use std::collections::{HashMap, HashSet};
+
+/// Sentinel for an expected column that does not exist in the origin
+/// schema. Used by [`index_mapping`] and [`crate::row::ProjectedRow`].
+pub(crate) const UNEXIST_MAPPING: i32 = -1;
+
+/// Maps every column of `expected_schema` to its index in `origin_schema`,
+/// pairing columns by id (not name) so the mapping survives `ALTER TABLE … RENAME`.
+/// An expected id that is absent from the origin yields [`UNEXIST_MAPPING`].
+/// Fails with `RowConvertError` when a column has no assigned id, an id repeats
+/// within one schema, or a matched pair differs in type (nullability aside).
+pub(crate) fn index_mapping(origin_schema: &Schema, expected_schema: &Schema) -> Result<Vec<i32>> {
+    let origin_columns = origin_schema.columns();
+    let mut position_by_id: HashMap<i32, usize> = HashMap::with_capacity(origin_columns.len());
+    for (position, column) in origin_columns.iter().enumerate() {
+        let id = column.id();
+        if id == UNKNOWN_COLUMN_ID {
+            return Err(Error::RowConvertError {
+                message: format!(
+                    "origin schema column '{}' has no assigned id; cannot build index mapping",
+                    column.name()
+                ),
+            });
+        }
+        if position_by_id.insert(id, position).is_some() {
+            let message = format!("duplicate column id {id} in origin schema");
+            return Err(Error::RowConvertError { message });
+        }
+    }
+
+    let expected_columns = expected_schema.columns();
+    let mut seen_ids: HashSet<i32> = HashSet::with_capacity(expected_columns.len());
+    expected_columns
+        .iter()
+        .map(|wanted| {
+            let id = wanted.id();
+            if id == UNKNOWN_COLUMN_ID {
+                return Err(Error::RowConvertError {
+                    message: format!(
+                        "expected schema column '{}' has no assigned id; cannot build index mapping",
+                        wanted.name()
+                    ),
+                });
+            }
+            if !seen_ids.insert(id) {
+                let message = format!("duplicate column id {id} in expected schema");
+                return Err(Error::RowConvertError { message });
+            }
+            let position = match position_by_id.get(&id) {
+                Some(&position) => position,
+                None => return Ok(UNEXIST_MAPPING),
+            };
+            let found = &origin_columns[position];
+            if found.data_type().eq_ignore_nullable(wanted.data_type()) {
+                return Ok(position as i32);
+            }
+            Err(Error::RowConvertError {
+                message: format!(
+                    "Expected datatype of column(id={},name={}) is [{}], while the actual datatype is [{}]",
+                    id,
+                    wanted.name(),
+                    wanted.data_type(),
+                    found.data_type()
+                ),
+            })
+        })
+        .collect()
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{Column, DataType, DataTypes};
+
+    fn schema_auto(columns: &[(&str, DataType)]) -> Schema {
+        let mut b = Schema::builder();
+        for (name, dt) in columns {
+            b = b.column(*name, dt.clone());
+        }
+        b.build().expect("schema build")
+    }
+
+    fn schema_with_ids(columns: &[(i32, &str, DataType)]) -> Schema {
+        let cols: Vec<Column> = columns
+            .iter()
+            .map(|(id, name, dt)| Column::new(*name, dt.clone()).with_id(*id))
+            .collect();
+        Schema::builder()
+            .with_columns(cols)
+            .build()
+            .expect("schema build")
+    }
+
+    #[test]
+    fn identity_mapping_when_schemas_equal() {
+        let s = schema_auto(&[
+            ("a", DataTypes::bigint()),
+            ("b", DataTypes::string()),
+            ("c", DataTypes::int()),
+        ]);
+        assert_eq!(index_mapping(&s, &s).unwrap(), vec![0, 1, 2]);
+    }
+
+    #[test]
+    fn projection_subset_in_order() {
+        let origin = schema_auto(&[
+            ("a", DataTypes::bigint()),
+            ("b", DataTypes::string()),
+            ("c", DataTypes::int()),
+        ]);
+        let expected =
+            schema_with_ids(&[(0, "a", DataTypes::bigint()), (2, "c", DataTypes::int())]);
+        assert_eq!(index_mapping(&origin, &expected).unwrap(), vec![0, 2]);
+    }
+
+    #[test]
+    fn reorder_mapping() {
+        let origin = schema_auto(&[
+            ("a", DataTypes::bigint()),
+            ("b", DataTypes::string()),
+            ("c", DataTypes::int()),
+        ]);
+        let expected = schema_with_ids(&[
+            (2, "c", DataTypes::int()),
+            (0, "a", DataTypes::bigint()),
+            (1, "b", DataTypes::string()),
+        ]);
+        assert_eq!(index_mapping(&origin, &expected).unwrap(), vec![2, 0, 1]);
+    }
+
+    #[test]
+    fn missing_column_returns_sentinel() {
+        let origin = schema_auto(&[("a", DataTypes::bigint())]);
+        let expected = schema_with_ids(&[
+            (0, "a", DataTypes::bigint()),
+            (1, "new_col", DataTypes::string()),
+        ]);
+        assert_eq!(
+            index_mapping(&origin, &expected).unwrap(),
+            vec![0, UNEXIST_MAPPING]
+        );
+    }
+
+    #[test]
+    fn rename_preserves_mapping_when_id_matches() {
+        let origin = schema_with_ids(&[(0, "old_name", DataTypes::int())]);
+        let expected = schema_with_ids(&[(0, "new_name", DataTypes::int())]);
+        assert_eq!(index_mapping(&origin, &expected).unwrap(), vec![0]);
+    }
+
+    #[test]
+    fn drop_then_add_with_same_name_does_not_alias() {
+        let origin = schema_with_ids(&[(0, "a", DataTypes::int())]);
+        let expected = schema_with_ids(&[(5, "a", DataTypes::int())]);
+        assert_eq!(
+            index_mapping(&origin, &expected).unwrap(),
+            vec![UNEXIST_MAPPING]
+        );
+    }
+
+    #[test]
+    fn datatype_mismatch_returns_error() {
+        let origin = schema_auto(&[("a", DataTypes::bigint())]);
+        let expected = schema_with_ids(&[(0, "a", DataTypes::int())]);
+        let err = index_mapping(&origin, &expected).unwrap_err();
+        let msg = err.to_string();
+        assert!(msg.contains("id=0"), "{msg}");
+        assert!(msg.contains("name=a"), "{msg}");
+        assert!(msg.contains("INT"), "{msg}");
+        assert!(msg.contains("BIGINT"), "{msg}");
+    }
+
+    #[test]
+    fn nullability_difference_does_not_error() {
+        // Primary-key normalization makes the origin non-nullable while
+        // the expected is nullable.
+        let origin = Schema::builder()
+            .column("a", DataTypes::int())
+            .primary_key(["a"])
+            .build()
+            .unwrap();
+        let expected = schema_with_ids(&[(0, "a", DataTypes::int())]);
+        assert_eq!(index_mapping(&origin, &expected).unwrap(), vec![0]);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index dba9a5230d..ebaf085e21 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -28,11 +28,15 @@ use std::fmt::{Display, Formatter};
 use std::sync::Arc;
 use strum_macros::EnumString;
 
+/// Sentinel for a column whose stable id has not yet been assigned.
+pub const UNKNOWN_COLUMN_ID: i32 = -1;
+
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
 pub struct Column {
     name: String,
     data_type: DataType,
     comment: Option<String>,
+    id: i32,
 }
 
 impl Column {
@@ -41,6 +45,7 @@ impl Column {
             name: name.into(),
             data_type,
             comment: None,
+            id: UNKNOWN_COLUMN_ID,
         }
     }
 
@@ -54,9 +59,15 @@ impl Column {
             name: self.name.clone(),
             data_type: data_type.clone(),
             comment: self.comment.clone(),
+            id: self.id,
         }
     }
 
+    /// Returns the column with its stable id replaced by `id`.
+    pub fn with_id(self, id: i32) -> Self {
+        Self { id, ..self }
+    }
+
     // Getters...
     pub fn name(&self) -> &str {
         &self.name
@@ -69,6 +80,12 @@ impl Column {
     pub fn comment(&self) -> Option<&str> {
         self.comment.as_deref()
     }
+
+    /// Returns the stable column id, or [`UNKNOWN_COLUMN_ID`] when the
+    /// id has not yet been assigned by a [`SchemaBuilder`].
+    pub fn id(&self) -> i32 {
+        self.id
+    }
 }
 
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
@@ -152,6 +169,31 @@ impl Schema {
     }
 }
 
+/// A schema together with its server-assigned version id.
+#[derive(Debug, Clone, PartialEq, Eq)]
+pub struct SchemaInfo {
+    schema: Schema,
+    schema_id: i32,
+}
+
+impl SchemaInfo {
+    pub fn new(schema: Schema, schema_id: i32) -> Self {
+        Self { schema, schema_id }
+    }
+
+    pub fn schema(&self) -> &Schema {
+        &self.schema
+    }
+
+    pub fn schema_id(&self) -> i32 {
+        self.schema_id
+    }
+
+    pub fn into_parts(self) -> (Schema, i32) {
+        (self.schema, self.schema_id)
+    }
+}
+
 #[derive(Debug, Default)]
 pub struct SchemaBuilder {
     columns: Vec<Column>,
@@ -236,6 +278,7 @@ impl SchemaBuilder {
 
     pub fn build(&self) -> Result<Schema> {
         let columns = Self::normalize_columns(&self.columns, self.primary_key.as_ref())?;
+        let columns = Self::assign_column_ids(columns)?;
 
         let column_names: HashSet<_> = columns.iter().map(|c| &c.name).collect();
         for auto_inc_col in &self.auto_increment_col_names {
@@ -265,6 +308,42 @@ impl SchemaBuilder {
         })
     }
 
+    /// Applies the all-or-none id rule. If no column carries an id, ids `0..N-1`
+    /// are assigned in column order. If every column carries one, the ids are
+    /// kept after rejecting negative values and duplicates. Input where only
+    /// some columns carry an id is an error.
+    fn assign_column_ids(columns: Vec<Column>) -> Result<Vec<Column>> {
+        let unassigned = columns.iter().filter(|c| c.id == UNKNOWN_COLUMN_ID).count();
+        if unassigned == columns.len() {
+            let mut numbered = Vec::with_capacity(columns.len());
+            for (position, column) in columns.into_iter().enumerate() {
+                numbered.push(column.with_id(position as i32));
+            }
+            return Ok(numbered);
+        }
+        if unassigned > 0 {
+            return Err(IllegalArgument {
+                message: "All columns must have an id assigned, or none of them must.".to_string(),
+            });
+        }
+        let mut seen_ids: HashSet<i32> = HashSet::with_capacity(columns.len());
+        for Column { name, id, .. } in &columns {
+            if *id < 0 {
+                return Err(IllegalArgument {
+                    message: format!(
+                        "Column '{name}' has invalid id {id}; ids must be non-negative"
+                    ),
+                });
+            }
+            if !seen_ids.insert(*id) {
+                return Err(IllegalArgument {
+                    message: format!("Duplicate column id {id} in schema"),
+                });
+            }
+        }
+        Ok(columns)
+    }
+
     fn normalize_columns(
         columns: &[Column],
         primary_key: Option<&PrimaryKey>,
@@ -662,7 +741,7 @@ impl LogFormat {
     }
 }
 
-#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, EnumString)]
+#[derive(Debug, Clone, Copy, Serialize, Deserialize, PartialEq, Eq, EnumString)]
 pub enum KvFormat {
     INDEXED,
     COMPACTED,
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index f32d6b2434..a544906b1b 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -184,6 +184,18 @@ message GetTableInfoResponse {
   required int64 modified_time = 5;
 }
 
+// get table schema request and response. Mirrors the Java RPC at api key 1011.
+// Omitting `schema_id` requests the latest schema.
+message GetTableSchemaRequest {
+  required PbTablePath table_path = 1;
+  optional int32 schema_id = 2;
+}
+
+message GetTableSchemaResponse {
+  required int32 schema_id = 1;
+  required bytes schema_json = 2;
+}
+
 message ListTablesRequest {
   required string database_name = 1;
 }
diff --git a/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
index 77cdbcb1b7..4200e044b3 100644
--- a/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/kv_record_read_context.rs
@@ -88,7 +88,7 @@ impl ReadContext for KvRecordReadContext {
         let row_type = schema.row_type().clone();
 
         // Create decoder outside lock
-        let decoder = RowDecoderFactory::create(self.kv_format.clone(), row_type)?;
+        let decoder = RowDecoderFactory::create(self.kv_format, row_type)?;
 
         // Second check: insert only if another thread didn't beat us to it
         {
diff --git a/fluss-rust/crates/fluss/src/record/kv/test_util.rs b/fluss-rust/crates/fluss/src/record/kv/test_util.rs
index 50ab911db2..54eaac8f3d 100644
--- a/fluss-rust/crates/fluss/src/record/kv/test_util.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/test_util.rs
@@ -45,6 +45,6 @@ impl ReadContext for TestReadContext {
     fn get_row_decoder(&self, _schema_id: i16) -> Result<Arc<dyn RowDecoder>> {
         // Directly create decoder from data types - no Schema needed!
         let row_type = RowType::with_data_types(self.data_types.clone());
-        RowDecoderFactory::create(self.kv_format.clone(), row_type)
+        RowDecoderFactory::create(self.kv_format, row_type)
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/fixed_schema_decoder.rs b/fluss-rust/crates/fluss/src/row/fixed_schema_decoder.rs
new file mode 100644
index 0000000000..eec83f3d39
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/fixed_schema_decoder.rs
@@ -0,0 +1,196 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Decode a `[schema_id (2 bytes) | row]` value into an [`InternalRow`]
+//! conforming to a fixed target schema, projecting across schema
+//! versions when needed.
+
+use crate::error::{Error, Result};
+use crate::metadata::{KvFormat, Schema, index_mapping};
+use crate::record::kv::SCHEMA_ID_LENGTH;
+use crate::row::{LookupRow, ProjectedRow, RowDecoder, RowDecoderFactory};
+use std::sync::Arc;
+
+/// Decodes stored values into rows shaped like one fixed target schema.
+pub(crate) struct FixedSchemaDecoder {
+    row_decoder: Arc<dyn RowDecoder>,
+    index_mapping: Option<Arc<[i32]>>,
+}
+
+impl FixedSchemaDecoder {
+    /// Decoder for values already written under `schema`; rows are returned raw.
+    pub fn new_no_projection(kv_format: KvFormat, schema: &Schema) -> Result<Self> {
+        Ok(Self {
+            row_decoder: RowDecoderFactory::create(kv_format, schema.row_type().clone())?,
+            index_mapping: None,
+        })
+    }
+
+    /// Decoder for `source_schema` values, projected onto `target_schema` by column id.
+    pub fn new(
+        kv_format: KvFormat,
+        source_schema: &Schema,
+        target_schema: &Schema,
+    ) -> Result<Self> {
+        let mapping: Arc<[i32]> = index_mapping(source_schema, target_schema)?.into();
+        Ok(Self {
+            row_decoder: RowDecoderFactory::create(kv_format, source_schema.row_type().clone())?,
+            index_mapping: Some(mapping),
+        })
+    }
+
+    /// Skips the leading schema-id bytes of `value_bytes` and decodes the rest,
+    /// wrapping the row in a projection when an index mapping is present.
+    /// Fails with `RowConvertError` if the value is shorter than the schema id.
+    pub fn decode<'a>(&self, value_bytes: &'a [u8]) -> Result<LookupRow<'a>> {
+        if value_bytes.len() < SCHEMA_ID_LENGTH {
+            return Err(Error::RowConvertError {
+                message: format!(
+                    "Row payload too short: {} bytes, need at least {} for schema id",
+                    value_bytes.len(),
+                    SCHEMA_ID_LENGTH
+                ),
+            });
+        }
+        let row = self.row_decoder.decode(&value_bytes[SCHEMA_ID_LENGTH..]);
+        Ok(match self.index_mapping.as_ref() {
+            Some(mapping) => LookupRow::projected(ProjectedRow::new(row, Arc::clone(mapping))),
+            None => LookupRow::raw(row),
+        })
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::{Column, DataTypes, Schema};
+    use crate::record::kv::SCHEMA_ID_LENGTH;
+    use crate::row::InternalRow;
+    use crate::row::binary::BinaryWriter;
+    use crate::row::compacted::CompactedRowWriter;
+
+    fn schema_with_ids(columns: &[(i32, &str, crate::metadata::DataType)]) -> Schema {
+        let cols: Vec<Column> = columns
+            .iter()
+            .map(|(id, name, dt)| Column::new(*name, dt.clone()).with_id(*id))
+            .collect();
+        Schema::builder().with_columns(cols).build().unwrap()
+    }
+
+    fn write_value(schema_id: i16, writer: CompactedRowWriter) -> Vec<u8> {
+        let row_bytes = writer.to_bytes();
+        let mut out = Vec::with_capacity(SCHEMA_ID_LENGTH + row_bytes.len());
+        out.extend_from_slice(&schema_id.to_le_bytes());
+        out.extend_from_slice(row_bytes.as_ref());
+        out
+    }
+
+    #[test]
+    fn decode_no_projection_strips_schema_id_and_returns_row() {
+        let schema = schema_with_ids(&[(0, "a", DataTypes::int()), (1, "b", DataTypes::string())]);
+        let decoder = FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &schema).unwrap();
+
+        let mut writer = CompactedRowWriter::new(2);
+        writer.write_int(42);
+        writer.write_string("hi");
+        let value = write_value(7, writer);
+
+        let row = decoder.decode(&value).unwrap();
+        assert_eq!(row.get_field_count(), 2);
+        assert_eq!(row.get_int(0).unwrap(), 42);
+        assert_eq!(row.get_string(1).unwrap(), "hi");
+    }
+
+    #[test]
+    fn decode_with_projection_pads_missing_field_with_null() {
+        // Source schema (older): [a:int, b:string]
+        let source = schema_with_ids(&[(0, "a", DataTypes::int()), (1, "b", DataTypes::string())]);
+        // Target schema (newer): added column c at id=2
+        let target = schema_with_ids(&[
+            (0, "a", DataTypes::int()),
+            (1, "b", DataTypes::string()),
+            (2, "c", DataTypes::bigint()),
+        ]);
+        let decoder = FixedSchemaDecoder::new(KvFormat::COMPACTED, &source, &target).unwrap();
+
+        let mut writer = CompactedRowWriter::new(2);
+        writer.write_int(7);
+        writer.write_string("seven");
+        let value = write_value(0, writer);
+
+        let row = decoder.decode(&value).unwrap();
+        assert_eq!(row.get_field_count(), 3);
+        assert_eq!(row.get_int(0).unwrap(), 7);
+        assert_eq!(row.get_string(1).unwrap(), "seven");
+        assert!(
+            row.is_null_at(2).unwrap(),
+            "added-but-missing column must read as null"
+        );
+    }
+
+    #[test]
+    fn decode_with_projection_drops_removed_field() {
+        // Source schema (older): [a, b, c]
+        let source = schema_with_ids(&[
+            (0, "a", DataTypes::int()),
+            (1, "b", DataTypes::string()),
+            (2, "c", DataTypes::bigint()),
+        ]);
+        // Target schema (newer): dropped b
+        let target = schema_with_ids(&[(0, "a", DataTypes::int()), (2, "c", DataTypes::bigint())]);
+        let decoder = FixedSchemaDecoder::new(KvFormat::COMPACTED, &source, &target).unwrap();
+
+        let mut writer = CompactedRowWriter::new(3);
+        writer.write_int(1);
+        writer.write_string("dropped");
+        writer.write_long(99);
+        let value = write_value(0, writer);
+
+        let row = decoder.decode(&value).unwrap();
+        assert_eq!(row.get_field_count(), 2);
+        assert_eq!(row.get_int(0).unwrap(), 1);
+        assert_eq!(row.get_long(1).unwrap(), 99);
+    }
+
+    #[test]
+    fn decode_with_projection_reorders_fields() {
+        let source = schema_with_ids(&[(0, "a", DataTypes::int()), (1, "b", DataTypes::string())]);
+        // Target reorders: b first, then a.
+        let target = schema_with_ids(&[(1, "b", DataTypes::string()), (0, "a", DataTypes::int())]);
+        let decoder = FixedSchemaDecoder::new(KvFormat::COMPACTED, &source, &target).unwrap();
+
+        let mut writer = CompactedRowWriter::new(2);
+        writer.write_int(123);
+        writer.write_string("xyz");
+        let value = write_value(0, writer);
+
+        let row = decoder.decode(&value).unwrap();
+        assert_eq!(row.get_string(0).unwrap(), "xyz");
+        assert_eq!(row.get_int(1).unwrap(), 123);
+    }
+
+    #[test]
+    fn decode_payload_too_short_errors() {
+        let schema = schema_with_ids(&[(0, "a", DataTypes::int())]);
+        let decoder = FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &schema).unwrap();
+        // Only 1 byte — short of the schema id.
+        match decoder.decode(&[0u8]) {
+            Ok(_) => panic!("expected error for short payload"),
+            Err(e) => assert!(e.to_string().contains("too short"), "got: {e}"),
+        }
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/lookup_row.rs b/fluss-rust/crates/fluss/src/row/lookup_row.rs
new file mode 100644
index 0000000000..c002369d13
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/lookup_row.rs
@@ -0,0 +1,122 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Return type of [`crate::client::table::LookupResult`] getters: a row
+//! decoded under the table's current schema, possibly via projection
+//! over an older schema's bytes.
+
+use crate::client::WriteFormat;
+use crate::error::Result;
+use crate::row::compacted::CompactedRow;
+use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
+use crate::row::projected_row::ProjectedRow;
+use crate::row::{Decimal, FlussArray, InternalRow};
+
+pub struct LookupRow<'a> {
+    inner: Inner<'a>,
+}
+
+enum Inner<'a> {
+    Raw(CompactedRow<'a>),
+    Projected(ProjectedRow<CompactedRow<'a>>),
+}
+
+impl<'a> LookupRow<'a> {
+    pub(crate) fn raw(row: CompactedRow<'a>) -> Self {
+        Self {
+            inner: Inner::Raw(row),
+        }
+    }
+
+    pub(crate) fn projected(row: ProjectedRow<CompactedRow<'a>>) -> Self {
+        Self {
+            inner: Inner::Projected(row),
+        }
+    }
+}
+
+macro_rules! delegate {
+    ($self:ident, $method:ident $(, $arg:expr)*) => {
+        match &$self.inner {
+            Inner::Raw(r) => r.$method($($arg),*),
+            Inner::Projected(r) => r.$method($($arg),*),
+        }
+    };
+}
+
+impl<'a> InternalRow for LookupRow<'a> {
+    fn get_field_count(&self) -> usize {
+        delegate!(self, get_field_count)
+    }
+    fn is_null_at(&self, pos: usize) -> Result<bool> {
+        delegate!(self, is_null_at, pos)
+    }
+    fn get_boolean(&self, pos: usize) -> Result<bool> {
+        delegate!(self, get_boolean, pos)
+    }
+    fn get_byte(&self, pos: usize) -> Result<i8> {
+        delegate!(self, get_byte, pos)
+    }
+    fn get_short(&self, pos: usize) -> Result<i16> {
+        delegate!(self, get_short, pos)
+    }
+    fn get_int(&self, pos: usize) -> Result<i32> {
+        delegate!(self, get_int, pos)
+    }
+    fn get_long(&self, pos: usize) -> Result<i64> {
+        delegate!(self, get_long, pos)
+    }
+    fn get_float(&self, pos: usize) -> Result<f32> {
+        delegate!(self, get_float, pos)
+    }
+    fn get_double(&self, pos: usize) -> Result<f64> {
+        delegate!(self, get_double, pos)
+    }
+    fn get_char(&self, pos: usize, length: usize) -> Result<&str> {
+        delegate!(self, get_char, pos, length)
+    }
+    fn get_string(&self, pos: usize) -> Result<&str> {
+        delegate!(self, get_string, pos)
+    }
+    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Result<Decimal> {
+        delegate!(self, get_decimal, pos, precision, scale)
+    }
+    fn get_date(&self, pos: usize) -> Result<Date> {
+        delegate!(self, get_date, pos)
+    }
+    fn get_time(&self, pos: usize) -> Result<Time> {
+        delegate!(self, get_time, pos)
+    }
+    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> Result<TimestampNtz> {
+        delegate!(self, get_timestamp_ntz, pos, precision)
+    }
+    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> Result<TimestampLtz> {
+        delegate!(self, get_timestamp_ltz, pos, precision)
+    }
+    fn get_binary(&self, pos: usize, length: usize) -> Result<&[u8]> {
+        delegate!(self, get_binary, pos, length)
+    }
+    fn get_bytes(&self, pos: usize) -> Result<&[u8]> {
+        delegate!(self, get_bytes, pos)
+    }
+    fn get_array(&self, pos: usize) -> Result<FlussArray> {
+        delegate!(self, get_array, pos)
+    }
+    fn as_encoded_bytes(&self, write_format: WriteFormat) -> Option<&[u8]> {
+        delegate!(self, as_encoded_bytes, write_format)
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 359a9a5885..c6bdd7c540 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -26,6 +26,9 @@ pub(crate) mod column_writer;
 pub mod compacted;
 pub mod encode;
 pub mod field_getter;
+mod fixed_schema_decoder;
+mod lookup_row;
+mod projected_row;
 mod row_decoder;
 
 use crate::client::WriteFormat;
@@ -36,6 +39,9 @@ pub use compacted::CompactedRow;
 pub use datum::*;
 pub use decimal::{Decimal, MAX_COMPACT_PRECISION};
 pub use encode::KeyEncoder;
+pub(crate) use fixed_schema_decoder::FixedSchemaDecoder;
+pub use lookup_row::LookupRow;
+pub(crate) use projected_row::ProjectedRow;
 pub use row_decoder::{CompactedRowDecoder, RowDecoder, RowDecoderFactory};
 
 pub struct BinaryRow<'a> {
diff --git a/fluss-rust/crates/fluss/src/row/projected_row.rs b/fluss-rust/crates/fluss/src/row/projected_row.rs
new file mode 100644
index 0000000000..cdd946a5fc
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/projected_row.rs
@@ -0,0 +1,276 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! View over an [`InternalRow`] that re-orders, drops, and null-pads
+//! fields according to a target→source index mapping.
+
+use crate::client::WriteFormat;
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::UNEXIST_MAPPING;
+use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
+use crate::row::{Decimal, FlussArray, InternalRow};
+use std::sync::Arc;
+
+pub(crate) struct ProjectedRow<R> {
+    index_mapping: Arc<[i32]>,
+    inner: R,
+}
+
+impl<R> ProjectedRow<R> {
+    /// Wraps `inner`; slot `i` of `index_mapping` is the source index for field `i`.
+    pub fn new(inner: R, index_mapping: Arc<[i32]>) -> Self {
+        Self {
+            index_mapping,
+            inner,
+        }
+    }
+
+    /// Resolves projected position `pos` to an index into the inner row. Errors
+    /// if `pos` is out of bounds or its slot has no backing source field.
+    fn source_index(&self, pos: usize) -> Result<usize> {
+        match self.index_mapping.get(pos).copied() {
+            None => Err(IllegalArgument {
+                message: format!(
+                    "position {pos} out of bounds (projected row has {} fields)",
+                    self.index_mapping.len()
+                ),
+            }),
+            // A negative slot would wrap to a huge index under `as usize`: reject it.
+            Some(slot) if slot == UNEXIST_MAPPING || slot < 0 => Err(IllegalArgument {
+                message: format!(
+                    "field at position {pos} does not exist in the source row \
+                     (caller should check is_null_at first)"
+                ),
+            }),
+            Some(slot) => Ok(slot as usize),
+        }
+    }
+}
+
+macro_rules! project {
+    ($self:ident, $method:ident, $pos:expr $(, $arg:expr)*) => {
+        $self.inner.$method($self.source_index($pos)?, $($arg),*)
+    };
+}
+
+impl<R: InternalRow> InternalRow for ProjectedRow<R> {
+    fn get_field_count(&self) -> usize {
+        self.index_mapping.len()
+    }
+
+    fn is_null_at(&self, pos: usize) -> Result<bool> {
+        let mapped = self
+            .index_mapping
+            .get(pos)
+            .copied()
+            .ok_or_else(|| IllegalArgument {
+                message: format!(
+                    "position {pos} out of bounds (projected row has {} fields)",
+                    self.index_mapping.len()
+                ),
+            })?;
+        if mapped == UNEXIST_MAPPING {
+            return Ok(true);
+        }
+        self.inner.is_null_at(mapped as usize)
+    }
+
+    fn get_boolean(&self, pos: usize) -> Result<bool> {
+        project!(self, get_boolean, pos)
+    }
+    fn get_byte(&self, pos: usize) -> Result<i8> {
+        project!(self, get_byte, pos)
+    }
+    fn get_short(&self, pos: usize) -> Result<i16> {
+        project!(self, get_short, pos)
+    }
+    fn get_int(&self, pos: usize) -> Result<i32> {
+        project!(self, get_int, pos)
+    }
+    fn get_long(&self, pos: usize) -> Result<i64> {
+        project!(self, get_long, pos)
+    }
+    fn get_float(&self, pos: usize) -> Result<f32> {
+        project!(self, get_float, pos)
+    }
+    fn get_double(&self, pos: usize) -> Result<f64> {
+        project!(self, get_double, pos)
+    }
+    fn get_char(&self, pos: usize, length: usize) -> Result<&str> {
+        project!(self, get_char, pos, length)
+    }
+    fn get_string(&self, pos: usize) -> Result<&str> {
+        project!(self, get_string, pos)
+    }
+    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Result<Decimal> {
+        project!(self, get_decimal, pos, precision, scale)
+    }
+    fn get_date(&self, pos: usize) -> Result<Date> {
+        project!(self, get_date, pos)
+    }
+    fn get_time(&self, pos: usize) -> Result<Time> {
+        project!(self, get_time, pos)
+    }
+    fn get_timestamp_ntz(&self, pos: usize, precision: u32) -> Result<TimestampNtz> {
+        project!(self, get_timestamp_ntz, pos, precision)
+    }
+    fn get_timestamp_ltz(&self, pos: usize, precision: u32) -> Result<TimestampLtz> {
+        project!(self, get_timestamp_ltz, pos, precision)
+    }
+    fn get_binary(&self, pos: usize, length: usize) -> Result<&[u8]> {
+        project!(self, get_binary, pos, length)
+    }
+    fn get_bytes(&self, pos: usize) -> Result<&[u8]> {
+        project!(self, get_bytes, pos)
+    }
+    fn get_array(&self, pos: usize) -> Result<FlussArray> {
+        project!(self, get_array, pos)
+    }
+
+    fn as_encoded_bytes(&self, _write_format: WriteFormat) -> Option<&[u8]> {
+        // Projection changes the field layout, so the inner row's
+        // encoded form no longer matches.
+        None
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::row::{Datum, GenericRow};
+
+    fn mapping(slots: &[i32]) -> Arc<[i32]> {
+        Arc::from(slots.to_vec().into_boxed_slice())
+    }
+
+    fn row_of<'a>(values: Vec<Datum<'a>>) -> GenericRow<'a> {
+        GenericRow { values }
+    }
+
+    #[test]
+    fn projects_and_reorders_longs() {
+        let mapping = mapping(&[2, 0, 1, 4]);
+        let inner = row_of(vec![
+            Datum::Int64(0),
+            Datum::Int64(1),
+            Datum::Int64(2),
+            Datum::Int64(3),
+            Datum::Int64(4),
+        ]);
+        let projected = ProjectedRow::new(inner, mapping);
+
+        assert_eq!(projected.get_field_count(), 4);
+        assert_eq!(projected.get_long(0).unwrap(), 2);
+        assert_eq!(projected.get_long(1).unwrap(), 0);
+        assert_eq!(projected.get_long(2).unwrap(), 1);
+        assert_eq!(projected.get_long(3).unwrap(), 4);
+    }
+
+    #[test]
+    fn projects_strings_and_doubles() {
+        let mapping = mapping(&[2, 0, 1, 4]);
+
+        let strings = row_of(vec![
+            Datum::String("0".into()),
+            Datum::String("1".into()),
+            Datum::String("2".into()),
+            Datum::String("3".into()),
+            Datum::String("4".into()),
+        ]);
+        let projected = ProjectedRow::new(strings, Arc::clone(&mapping));
+        assert_eq!(projected.get_string(0).unwrap(), "2");
+        assert_eq!(projected.get_string(1).unwrap(), "0");
+        assert_eq!(projected.get_string(3).unwrap(), "4");
+
+        let doubles = row_of(vec![
+            Datum::Float64(0.5.into()),
+            Datum::Float64(0.6.into()),
+            Datum::Float64(0.7.into()),
+            Datum::Float64(0.8.into()),
+            Datum::Float64(0.9.into()),
+            Datum::Float64(1.0.into()),
+        ]);
+        let projected = ProjectedRow::new(doubles, Arc::clone(&mapping));
+        assert_eq!(projected.get_double(0).unwrap(), 0.7);
+        assert_eq!(projected.get_double(1).unwrap(), 0.5);
+        assert_eq!(projected.get_double(3).unwrap(), 0.9);
+    }
+
+    #[test]
+    fn null_handling_passes_through_inner_nulls() {
+        let mapping = mapping(&[2, 0, 1, 4]);
+        let inner = row_of(vec![
+            Datum::Int64(5),
+            Datum::Int64(6),
+            Datum::Null,
+            Datum::Int64(8),
+            Datum::Null,
+            Datum::Int64(10),
+        ]);
+        let projected = ProjectedRow::new(inner, mapping);
+
+        assert!(projected.is_null_at(0).unwrap());
+        assert!(!projected.is_null_at(1).unwrap());
+        assert!(!projected.is_null_at(2).unwrap());
+        assert!(projected.is_null_at(3).unwrap());
+    }
+
+    #[test]
+    fn unexist_mapping_reports_null_and_errors_on_get() {
+        let mapping = mapping(&[0, 1, UNEXIST_MAPPING, 2]);
+        let inner = row_of(vec![Datum::Int64(10), Datum::Int64(20), Datum::Int64(30)]);
+        let projected = ProjectedRow::new(inner, mapping);
+
+        assert_eq!(projected.get_field_count(), 4);
+        assert_eq!(projected.get_long(0).unwrap(), 10);
+        assert_eq!(projected.get_long(1).unwrap(), 20);
+        assert!(projected.is_null_at(2).unwrap());
+        let err = projected.get_long(2).unwrap_err();
+        assert!(err.to_string().contains("does not exist"), "got: {err}");
+        assert_eq!(projected.get_long(3).unwrap(), 30);
+    }
+
+    #[test]
+    fn out_of_bounds_position_returns_error() {
+        let mapping = mapping(&[0, 1]);
+        let inner = row_of(vec![Datum::Int64(1), Datum::Int64(2)]);
+        let projected = ProjectedRow::new(inner, mapping);
+
+        let err = projected.is_null_at(5).unwrap_err();
+        assert!(err.to_string().contains("out of bounds"), "got: {err}");
+        let err = projected.get_long(5).unwrap_err();
+        assert!(err.to_string().contains("out of bounds"), "got: {err}");
+    }
+
+    #[test]
+    fn shared_mapping_can_back_many_rows() {
+        let mapping = mapping(&[1, 0]);
+        let row_a = ProjectedRow::new(
+            row_of(vec![Datum::Int64(10), Datum::Int64(20)]),
+            Arc::clone(&mapping),
+        );
+        let row_b = ProjectedRow::new(
+            row_of(vec![Datum::Int64(30), Datum::Int64(40)]),
+            Arc::clone(&mapping),
+        );
+        assert_eq!(row_a.get_long(0).unwrap(), 20);
+        assert_eq!(row_a.get_long(1).unwrap(), 10);
+        assert_eq!(row_b.get_long(0).unwrap(), 40);
+        assert_eq!(row_b.get_long(1).unwrap(), 30);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index d52497837d..1ea0269d85 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -29,6 +29,7 @@ pub enum ApiKey {
     ListTables,                 // 1008
     ListPartitionInfos,         // 1009
     TableExists,                // 1010
+    GetTableSchema,             // 1011
     MetaData,                   // 1012
     ProduceLog,                 // 1014
     FetchLog,                   // 1015
@@ -60,6 +61,7 @@ impl From<i16> for ApiKey {
             1008 => ApiKey::ListTables,
             1009 => ApiKey::ListPartitionInfos,
             1010 => ApiKey::TableExists,
+            1011 => ApiKey::GetTableSchema,
             1012 => ApiKey::MetaData,
             1014 => ApiKey::ProduceLog,
             1015 => ApiKey::FetchLog,
@@ -94,6 +96,7 @@ impl From<ApiKey> for i16 {
             ApiKey::ListTables => 1008,
             ApiKey::ListPartitionInfos => 1009,
             ApiKey::TableExists => 1010,
+            ApiKey::GetTableSchema => 1011,
             ApiKey::MetaData => 1012,
             ApiKey::ProduceLog => 1014,
             ApiKey::FetchLog => 1015,
@@ -131,6 +134,7 @@ mod tests {
             (1008, ApiKey::ListTables),
             (1009, ApiKey::ListPartitionInfos),
             (1010, ApiKey::TableExists),
+            (1011, ApiKey::GetTableSchema),
             (1012, ApiKey::MetaData),
             (1014, ApiKey::ProduceLog),
             (1015, ApiKey::FetchLog),
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_table_schema.rs b/fluss-rust/crates/fluss/src/rpc/message/get_table_schema.rs
new file mode 100644
index 0000000000..ad7b23fb03
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_table_schema.rs
@@ -0,0 +1,57 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::{GetTableSchemaRequest, GetTableSchemaResponse, PbTablePath};
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::api_version::ApiVersion;
+use crate::rpc::frame::WriteError;
+use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+
+use crate::metadata::TablePath;
+use crate::rpc::frame::ReadError;
+
+use crate::{impl_read_version_type, impl_write_version_type};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+/// RPC request for a table's schema; `schema_id = None` requests the latest schema.
+#[derive(Debug)]
+pub struct GetTableSchemaRequestMsg {
+    pub inner_request: GetTableSchemaRequest,
+}
+
+impl GetTableSchemaRequestMsg {
+    pub fn new(table_path: &TablePath, schema_id: Option<i32>) -> Self {
+        let inner_request = GetTableSchemaRequest {
+            table_path: PbTablePath {
+                database_name: table_path.database().to_owned(),
+                table_name: table_path.table().to_owned(),
+            },
+            schema_id,
+        };
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for GetTableSchemaRequestMsg {
+    type ResponseBody = GetTableSchemaResponse;
+    const API_KEY: ApiKey = ApiKey::GetTableSchema;
+    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
+}
+
+impl_write_version_type!(GetTableSchemaRequestMsg);
+impl_read_version_type!(GetTableSchemaResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index d4739dc632..456f9cb894 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -33,6 +33,7 @@ mod get_database_info;
 mod get_latest_lake_snapshot;
 mod get_security_token;
 mod get_table;
+mod get_table_schema;
 mod header;
 mod init_writer;
 mod limit_scan;
@@ -61,6 +62,7 @@ pub use get_database_info::*;
 pub use get_latest_lake_snapshot::*;
 pub use get_security_token::*;
 pub use get_table::*;
+pub use get_table_schema::*;
 pub use header::*;
 pub use init_writer::*;
 pub use limit_scan::*;
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 15a62c1ce1..9f2994ad60 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -53,13 +53,14 @@ Complete API reference for the Fluss Rust client.
 
 ### Table Operations
 
-| Method                                                                                                                     | Description               |
-|----------------------------------------------------------------------------------------------------------------------------|---------------------------|
-| `async fn create_table(&self, table_path: &TablePath, descriptor: &TableDescriptor, ignore_if_exists: bool) -> Result<()>` | Create a table            |
-| `async fn drop_table(&self, table_path: &TablePath, ignore_if_not_exists: bool) -> Result<()>`                             | Drop a table              |
-| `async fn get_table_info(&self, table_path: &TablePath) -> Result<TableInfo>`                                              | Get table metadata        |
-| `async fn list_tables(&self, database_name: &str) -> Result<Vec<String>>`                                                  | List tables in a database |
-| `async fn table_exists(&self, table_path: &TablePath) -> Result<bool>`                                                     | Check if a table exists   |
+| Method                                                                                                                     | Description                                                                 |
+|----------------------------------------------------------------------------------------------------------------------------|-----------------------------------------------------------------------------|
+| `async fn create_table(&self, table_path: &TablePath, descriptor: &TableDescriptor, ignore_if_exists: bool) -> Result<()>` | Create a table                                                              |
+| `async fn drop_table(&self, table_path: &TablePath, ignore_if_not_exists: bool) -> Result<()>`                             | Drop a table                                                                |
+| `async fn get_table_info(&self, table_path: &TablePath) -> Result<TableInfo>`                                              | Get table metadata                                                          |
+| `async fn get_table_schema(&self, table_path: &TablePath, schema_id: Option<i32>) -> Result<SchemaInfo>`                   | Get a table's schema by id, or the latest schema when `schema_id` is `None` |
+| `async fn list_tables(&self, database_name: &str) -> Result<Vec<String>>`                                                  | List tables in a database                                                   |
+| `async fn table_exists(&self, table_path: &TablePath) -> Result<bool>`                                                     | Check if a table exists                                                     |
 
 ### Partition Operations
 
@@ -267,6 +268,17 @@ writer.append(&row)?.await?;
 | `fn primary_key(keys: Vec<&str>) -> Self`            | Set primary key columns |
 | `fn build() -> Result<Schema>`                       | Build the schema        |
 
+## `SchemaInfo`
+
+A schema together with its server-assigned version id. Returned by [`FlussAdmin::get_table_schema`](#flussadmin).
+
+| Method                                           | Description                              |
+|--------------------------------------------------|------------------------------------------|
+| `fn new(schema: Schema, schema_id: i32) -> Self` | Construct from a schema and id           |
+| `fn schema(&self) -> &Schema`                    | Borrow the schema                        |
+| `fn schema_id(&self) -> i32`                     | Get the server-assigned schema id        |
+| `fn into_parts(self) -> (Schema, i32)`           | Consume and return `(schema, schema_id)` |
+
 ## `TableDescriptor`
 
 | Method                                                    | Description                          |

From 47973d1b1eb34cbcec24a761865b359f44c43c4c Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sun, 3 May 2026 22:53:02 +0200
Subject: [PATCH 257/287] chore: fix python CI - reduce workers to 2 with
 loadfile distribution (#529)

---
 fluss-rust/.github/workflows/build_and_test_python.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index 88c1838ba5..93f2eedb52 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -77,7 +77,7 @@ jobs:
 
       - name: Run tests (parallel)
         working-directory: bindings/python
-        run: uv run --no-sync pytest test/ -v -n auto
+        run: uv run --no-sync pytest test/ -v -n 2 --dist=loadfile
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full

From 2356cf4e0bd0f29a036f10aecd2ad7eb9c64425f Mon Sep 17 00:00:00 2001
From: Prajwal banakar <prajwal.banakara@gmail.com>
Date: Wed, 6 May 2026 13:27:28 +0530
Subject: [PATCH 258/287] chore: Add validation for numeric config fields
 (#449)

* Add validation for numeric config fields

* improved

* Added issue comments

* fix: resolve clippy empty-line-after-doc-comments warning
---
 .../crates/fluss/src/client/connection.rs     |   6 +-
 .../fluss/src/client/table/remote_log.rs      |   2 +-
 .../fluss/src/client/write/writer_client.rs   |   4 -
 fluss-rust/crates/fluss/src/config.rs         | 213 ++++++++++++++----
 4 files changed, 172 insertions(+), 53 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/connection.rs b/fluss-rust/crates/fluss/src/client/connection.rs
index a3ffd7557e..c31104c469 100644
--- a/fluss-rust/crates/fluss/src/client/connection.rs
+++ b/fluss-rust/crates/fluss/src/client/connection.rs
@@ -41,10 +41,14 @@ impl FlussConnection {
     pub async fn new(arg: Config) -> Result<Self> {
         arg.validate_security()
             .map_err(|msg| Error::IllegalArgument { message: msg })?;
-        arg.validate_scanner_fetch()
+        arg.validate_scanner()
+            .map_err(|msg| Error::IllegalArgument { message: msg })?;
+        arg.validate_writer()
             .map_err(|msg| Error::IllegalArgument { message: msg })?;
 
         let timeout = Duration::from_millis(arg.connect_timeout_ms);
+        // `connect_timeout_ms` (read just above) has no lower-bound check, matching Java,
+        // which allows 0 — tracked in https://github.com/apache/fluss/issues/3068
         let connections = if arg.is_sasl_enabled() {
             Arc::new(
                 RpcClient::new()
diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index 6bc955125f..4d96ce96b2 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -778,7 +778,7 @@ impl RemoteLogDownloader {
         let fetcher = Arc::new(ProductionFetcher {
             credentials_rx,
             local_log_dir: Arc::new(local_log_dir),
-            remote_log_read_concurrency: remote_log_read_concurrency.max(1),
+            remote_log_read_concurrency,
         });
 
         Self::new_with_fetcher(fetcher, max_prefetch_segments, max_concurrent_downloads)
diff --git a/fluss-rust/crates/fluss/src/client/write/writer_client.rs b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
index aee6bcd91d..ffdf96b1df 100644
--- a/fluss-rust/crates/fluss/src/client/write/writer_client.rs
+++ b/fluss-rust/crates/fluss/src/client/write/writer_client.rs
@@ -54,10 +54,6 @@ impl WriterClient {
     pub fn new(config: Config, metadata: Arc<Metadata>) -> Result<Self> {
         let ack = Self::get_ack(&config)?;
 
-        config
-            .validate_idempotence()
-            .map_err(|message| Error::IllegalArgument { message })?;
-
         let idempotence_manager = Arc::new(IdempotenceManager::new(
             config.writer_enable_idempotence,
             config.writer_max_inflight_requests_per_bucket,
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 2900e2f4bf..09a17f830d 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -303,39 +303,6 @@ impl Config {
     pub fn is_sasl_enabled(&self) -> bool {
         self.security_protocol.eq_ignore_ascii_case("sasl")
     }
-
-    /// Validates idempotence configuration. Returns `Ok(())` when the config is
-    /// consistent, or an error message when idempotence is enabled but other
-    /// settings are incompatible.
-    pub fn validate_idempotence(&self) -> Result<(), String> {
-        if !self.writer_enable_idempotence {
-            return Ok(());
-        }
-        let acks_is_all = self.writer_acks.eq_ignore_ascii_case("all") || self.writer_acks == "-1";
-        if !acks_is_all {
-            return Err(format!(
-                "Idempotent writes require acks='all' (-1), but got acks='{}'",
-                self.writer_acks
-            ));
-        }
-        if self.writer_retries <= 0 {
-            return Err(format!(
-                "Idempotent writes require retries > 0, but got retries={}",
-                self.writer_retries
-            ));
-        }
-        if self.writer_max_inflight_requests_per_bucket
-            > MAX_IN_FLIGHT_REQUESTS_PER_BUCKET_FOR_IDEMPOTENCE
-        {
-            return Err(format!(
-                "Idempotent writes require max-inflight-requests-per-bucket <= {}, but got {}",
-                MAX_IN_FLIGHT_REQUESTS_PER_BUCKET_FOR_IDEMPOTENCE,
-                self.writer_max_inflight_requests_per_bucket
-            ));
-        }
-        Ok(())
-    }
-
     /// Validates security configuration. Returns `Ok(())` when the config is
     /// consistent, or an error message when SASL is enabled but the config is
     /// incomplete or uses an unsupported mechanism.
@@ -361,7 +328,18 @@ impl Config {
         }
         Ok(())
     }
-    pub fn validate_scanner_fetch(&self) -> Result<(), String> {
+    pub fn validate_scanner(&self) -> Result<(), String> {
+        if self.scanner_remote_log_prefetch_num == 0 {
+            return Err("scanner_remote_log_prefetch_num must be > 0".to_string());
+        }
+        if self.scanner_remote_log_read_concurrency == 0 {
+            return Err("scanner_remote_log_read_concurrency must be > 0".to_string());
+        }
+        if self.remote_file_download_thread_num == 0 {
+            return Err("remote_file_download_thread_num must be > 0".to_string());
+        }
+        // scanner_log_max_poll_records: validation intentionally omitted to match Java behavior.
+        // Java allows 0 — tracked in https://github.com/apache/fluss/issues/3068
         if self.scanner_log_fetch_min_bytes <= 0 {
             return Err("scanner_log_fetch_min_bytes must be > 0".to_string());
         }
@@ -387,6 +365,57 @@ impl Config {
         }
         Ok(())
     }
+
+    pub fn validate_writer(&self) -> Result<(), String> {
+        if self.writer_request_max_size <= 0 {
+            return Err("writer_request_max_size must be > 0".to_string());
+        }
+        if self.writer_batch_size <= 0 {
+            return Err("writer_batch_size must be > 0".to_string());
+        }
+        if self.writer_batch_timeout_ms < 0 {
+            return Err("writer_batch_timeout_ms must be >= 0".to_string());
+        }
+        if self.writer_max_inflight_requests_per_bucket == 0 {
+            return Err("writer_max_inflight_requests_per_bucket must be > 0".to_string());
+        }
+        if self.writer_buffer_memory_size == 0 {
+            return Err("writer_buffer_memory_size must be > 0".to_string());
+        }
+        if self.writer_batch_size > self.writer_request_max_size {
+            return Err("writer_batch_size must be <= writer_request_max_size".to_string());
+        }
+        if self.writer_batch_size as usize > self.writer_buffer_memory_size {
+            return Err("writer_batch_size must be <= writer_buffer_memory_size".to_string());
+        }
+        // idempotence checks
+        if !self.writer_enable_idempotence {
+            return Ok(());
+        }
+        let acks_is_all = self.writer_acks.eq_ignore_ascii_case("all") || self.writer_acks == "-1";
+        if !acks_is_all {
+            return Err(format!(
+                "Idempotent writes require acks='all' (-1), but got acks='{}'",
+                self.writer_acks
+            ));
+        }
+        if self.writer_retries <= 0 {
+            return Err(format!(
+                "Idempotent writes require retries > 0, but got retries={}",
+                self.writer_retries
+            ));
+        }
+        if self.writer_max_inflight_requests_per_bucket
+            > MAX_IN_FLIGHT_REQUESTS_PER_BUCKET_FOR_IDEMPOTENCE
+        {
+            return Err(format!(
+                "Idempotent writes require max-inflight-requests-per-bucket <= {}, but got {}",
+                MAX_IN_FLIGHT_REQUESTS_PER_BUCKET_FOR_IDEMPOTENCE,
+                self.writer_max_inflight_requests_per_bucket
+            ));
+        }
+        Ok(())
+    }
 }
 
 #[cfg(test)]
@@ -456,13 +485,38 @@ mod tests {
         };
         assert!(config.validate_security().is_err());
     }
+
     #[test]
-    fn test_scanner_fetch_defaults_valid() {
+    fn test_scanner_defaults_valid() {
         let config = Config::default();
-        assert!(config.validate_scanner_fetch().is_ok());
-        assert_eq!(config.scanner_log_fetch_max_bytes, 16 * 1024 * 1024);
-        assert_eq!(config.scanner_log_fetch_min_bytes, 1);
-        assert_eq!(config.scanner_log_fetch_wait_max_time_ms, 500);
+        assert!(config.validate_scanner().is_ok());
+    }
+
+    #[test]
+    fn test_scanner_remote_log_prefetch_num_zero() {
+        let config = Config {
+            scanner_remote_log_prefetch_num: 0,
+            ..Config::default()
+        };
+        assert!(config.validate_scanner().is_err());
+    }
+
+    #[test]
+    fn test_scanner_remote_log_read_concurrency_zero() {
+        let config = Config {
+            scanner_remote_log_read_concurrency: 0,
+            ..Config::default()
+        };
+        assert!(config.validate_scanner().is_err());
+    }
+
+    #[test]
+    fn test_remote_file_download_thread_num_zero() {
+        let config = Config {
+            remote_file_download_thread_num: 0,
+            ..Config::default()
+        };
+        assert!(config.validate_scanner().is_err());
     }
 
     #[test]
@@ -472,7 +526,7 @@ mod tests {
             scanner_log_fetch_max_bytes: 1,
             ..Config::default()
         };
-        assert!(config.validate_scanner_fetch().is_err());
+        assert!(config.validate_scanner().is_err());
     }
 
     #[test]
@@ -481,13 +535,78 @@ mod tests {
             scanner_log_fetch_wait_max_time_ms: -1,
             ..Config::default()
         };
-        assert!(config.validate_scanner_fetch().is_err());
+        assert!(config.validate_scanner().is_err());
     }
 
     #[test]
-    fn test_idempotence_default_is_valid() {
+    fn test_writer_defaults_valid() {
         let config = Config::default();
-        assert!(config.validate_idempotence().is_ok());
+        assert!(config.validate_writer().is_ok());
+    }
+
+    #[test]
+    fn test_writer_request_max_size_zero() {
+        let config = Config {
+            writer_request_max_size: 0,
+            ..Config::default()
+        };
+        assert!(config.validate_writer().is_err());
+    }
+
+    #[test]
+    fn test_writer_batch_size_zero() {
+        let config = Config {
+            writer_batch_size: 0,
+            ..Config::default()
+        };
+        assert!(config.validate_writer().is_err());
+    }
+
+    #[test]
+    fn test_writer_batch_timeout_negative() {
+        let config = Config {
+            writer_batch_timeout_ms: -1,
+            ..Config::default()
+        };
+        assert!(config.validate_writer().is_err());
+    }
+
+    #[test]
+    fn test_writer_max_inflight_requests_per_bucket_zero() {
+        let config = Config {
+            writer_max_inflight_requests_per_bucket: 0,
+            ..Config::default()
+        };
+        assert!(config.validate_writer().is_err());
+    }
+
+    #[test]
+    fn test_writer_buffer_memory_size_zero() {
+        let config = Config {
+            writer_buffer_memory_size: 0,
+            ..Config::default()
+        };
+        assert!(config.validate_writer().is_err());
+    }
+
+    #[test]
+    fn test_writer_batch_size_exceeds_request_max_size() {
+        let config = Config {
+            writer_batch_size: 20 * 1024 * 1024,
+            writer_request_max_size: 10 * 1024 * 1024,
+            ..Config::default()
+        };
+        assert!(config.validate_writer().is_err());
+    }
+
+    #[test]
+    fn test_writer_batch_size_exceeds_buffer_memory_size() {
+        let config = Config {
+            writer_batch_size: 128 * 1024 * 1024,
+            writer_buffer_memory_size: 64 * 1024 * 1024,
+            ..Config::default()
+        };
+        assert!(config.validate_writer().is_err());
     }
 
     #[test]
@@ -499,7 +618,7 @@ mod tests {
             writer_max_inflight_requests_per_bucket: 100,
             ..Config::default()
         };
-        assert!(config.validate_idempotence().is_ok());
+        assert!(config.validate_writer().is_ok());
     }
 
     #[test]
@@ -509,7 +628,7 @@ mod tests {
             writer_acks: "1".to_string(),
             ..Config::default()
         };
-        assert!(config.validate_idempotence().is_err());
+        assert!(config.validate_writer().is_err());
     }
 
     #[test]
@@ -519,7 +638,7 @@ mod tests {
             writer_retries: 0,
             ..Config::default()
         };
-        assert!(config.validate_idempotence().is_err());
+        assert!(config.validate_writer().is_err());
     }
 
     #[test]
@@ -529,6 +648,6 @@ mod tests {
             writer_max_inflight_requests_per_bucket: 10,
             ..Config::default()
         };
-        assert!(config.validate_idempotence().is_err());
+        assert!(config.validate_writer().is_err());
     }
 }

From 1ff4eecd03e890d9955b423aba77ab5d7cf45033 Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Fri, 8 May 2026 13:52:45 +0200
Subject: [PATCH 259/287] [c++] Add nullability support for data type in c++
 (#525)

* Add nullability support for data type in c++

* add comment to explain nullability setup

* split scalar and array

* rephrase since behaviour changes after this PR

* rephrase since behaviour changes after this PR

* format
---
 fluss-rust/bindings/cpp/include/fluss.hpp     |  13 +-
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |  56 +++-
 fluss-rust/bindings/cpp/src/lib.rs            |   7 +-
 fluss-rust/bindings/cpp/src/types.rs          | 240 +++++++++++-------
 .../bindings/cpp/test/test_ffi_converter.cpp  | 178 ++++++++++++-
 .../bindings/cpp/test/test_log_table.cpp      |  63 +++++
 .../docs/user-guide/cpp/api-reference.md      |   2 +
 .../website/docs/user-guide/cpp/data-types.md |  34 +++
 8 files changed, 488 insertions(+), 105 deletions(-)

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index f222166d35..3d39783fd7 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -283,8 +283,8 @@ enum class TypeId {
 
 class DataType {
    public:
-    explicit DataType(TypeId id, int32_t p = 0, int32_t s = 0)
-        : id_(id), precision_(p), scale_(s) {}
+    explicit DataType(TypeId id, int32_t p = 0, int32_t s = 0, bool nullable = true)
+        : id_(id), precision_(p), scale_(s), nullable_(nullable) {}
 
     static DataType Boolean() { return DataType(TypeId::Boolean); }
     static DataType TinyInt() { return DataType(TypeId::TinyInt); }
@@ -321,15 +321,24 @@ class DataType {
     TypeId id() const { return id_; }
     int32_t precision() const { return precision_; }
     int32_t scale() const { return scale_; }
+    bool nullable() const { return nullable_; }
     /// Returns the element type of an ARRAY. Returns `nullptr` for non-array
     /// types. The returned pointer is valid as long as this DataType (or a
     /// copy holding the same shared element) is alive.
     const DataType* element_type() const { return element_type_.get(); }
 
+    /// Returns a copy of this DataType with nullable set to false.
+    DataType NotNull() const {
+        DataType dt(id_, precision_, scale_, false);
+        dt.element_type_ = element_type_;
+        return dt;
+    }
+
    private:
     TypeId id_;
     int32_t precision_{0};
     int32_t scale_{0};
+    bool nullable_{true};
     std::shared_ptr<DataType> element_type_;
 };
 
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 0ef1487a7d..430dd1991d 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -33,16 +33,18 @@ namespace utils {
 /// `nesting` counts the number of ARRAY wrappers stripped to reach the leaf
 /// element type. `leaf_type`/`leaf_precision`/`leaf_scale` describe that leaf
 /// scalar. A non-array input produces a zero-initialised value (nesting == 0).
+/// `array_nullability` has `nesting + 1` entries: one per ARRAY wrapper
+/// (outermost first) plus a trailing entry for the leaf scalar's nullability.
 ///
 /// Using a flat representation — rather than serialising a recursive
-/// `DataType` — keeps the cxx bridge contract small (four `i32`s inside
-/// `FfiColumn`) while preserving full schema fidelity across the FFI boundary
-/// when paired with rebuild_array_type().
+/// `DataType` — keeps the cxx bridge contract small while preserving schema
+/// fidelity across the FFI boundary when paired with rebuild_array_type().
 struct FlattenedArrayType {
     int32_t nesting{0};
     int32_t leaf_type{0};
     int32_t leaf_precision{0};
     int32_t leaf_scale{0};
+    std::vector<uint8_t> array_nullability;
 };
 
 /// Flattens an `ARRAY<ARRAY<...<leaf>>>` DataType into a FlattenedArrayType.
@@ -53,7 +55,8 @@ struct FlattenedArrayType {
 ///   - If `data_type` is an ARRAY but has a null element_type() chain (which
 ///     should only happen on malformed input), returns a zero-valued result to
 ///     signal the caller to reject the schema.
-///   - Otherwise, `nesting >= 1` and leaf_* describe the innermost scalar.
+///   - Otherwise, `nesting >= 1`, array_nullability has `nesting + 1` entries
+///     (last = leaf scalar nullability), and leaf_* describe the innermost scalar.
 inline FlattenedArrayType flatten_array_type(const DataType& data_type) {
     FlattenedArrayType out;
     if (data_type.id() != TypeId::Array) {
@@ -63,6 +66,7 @@ inline FlattenedArrayType flatten_array_type(const DataType& data_type) {
     const DataType* current = &data_type;
     while (current && current->id() == TypeId::Array) {
         out.nesting += 1;
+        out.array_nullability.push_back(current->nullable() ? 1 : 0);
         current = current->element_type();
     }
     if (!current) {
@@ -72,16 +76,29 @@ inline FlattenedArrayType flatten_array_type(const DataType& data_type) {
     out.leaf_type = static_cast<int32_t>(current->id());
     out.leaf_precision = current->precision();
     out.leaf_scale = current->scale();
+    out.array_nullability.push_back(current->nullable() ? 1 : 0);
     return out;
 }
 
 /// Inverse of flatten_array_type: rebuilds an `ARRAY<ARRAY<...<leaf>>>` type
 /// from the compact flat form. Requires `flat.nesting >= 1`; callers handle
 /// the `nesting == 0` case by using a plain scalar DataType directly.
+/// `array_nullability` must have `nesting + 1` entries (last = leaf).
 inline DataType rebuild_array_type(const FlattenedArrayType& flat) {
-    DataType dt(static_cast<TypeId>(flat.leaf_type), flat.leaf_precision, flat.leaf_scale);
-    for (int32_t i = 0; i < flat.nesting; ++i) {
-        dt = DataType::Array(std::move(dt));
+    bool leaf_nullable = (static_cast<size_t>(flat.nesting) < flat.array_nullability.size())
+                             ? (flat.array_nullability[static_cast<size_t>(flat.nesting)] != 0)
+                             : true;
+    DataType dt(static_cast<TypeId>(flat.leaf_type), flat.leaf_precision, flat.leaf_scale,
+                leaf_nullable);
+    for (int32_t i = flat.nesting - 1; i >= 0; --i) {
+        bool nullable = (static_cast<size_t>(i) < flat.array_nullability.size())
+                            ? (flat.array_nullability[static_cast<size_t>(i)] != 0)
+                            : true;
+        auto arr = DataType::Array(std::move(dt));
+        if (!nullable) {
+            arr = arr.NotNull();
+        }
+        dt = std::move(arr);
     }
     return dt;
 }
@@ -150,11 +167,15 @@ inline ffi::FfiColumn to_ffi_column(const Column& col) {
     ffi::FfiColumn ffi_col;
     ffi_col.name = rust::String(col.name);
     ffi_col.data_type = static_cast<int32_t>(col.data_type.id());
+    ffi_col.nullable = col.data_type.nullable();
     ffi_col.comment = rust::String(col.comment);
     ffi_col.precision = col.data_type.precision();
     ffi_col.scale = col.data_type.scale();
     auto flat = flatten_array_type(col.data_type);
     ffi_col.array_nesting = flat.nesting;
+    for (auto nullable : flat.array_nullability) {
+        ffi_col.array_nullability.push_back(nullable);
+    }
     if (flat.nesting > 0 && flat.leaf_type != 0) {
         ffi_col.element_data_type = flat.leaf_type;
         ffi_col.element_precision = flat.leaf_precision;
@@ -229,7 +250,6 @@ inline ffi::FfiTableDescriptor to_ffi_table_descriptor(const TableDescriptor& de
 
 inline Column from_ffi_column(const ffi::FfiColumn& ffi_col) {
     auto type_id = static_cast<TypeId>(ffi_col.data_type);
-    DataType dt(type_id, ffi_col.precision, ffi_col.scale);
     if (type_id == TypeId::Array) {
         if (ffi_col.element_data_type == 0) {
             throw std::runtime_error("Malformed ARRAY column '" + std::string(ffi_col.name) +
@@ -273,13 +293,21 @@ inline Column from_ffi_column(const ffi::FfiColumn& ffi_col) {
         }
 
         int32_t nesting = ffi_col.array_nesting > 0 ? ffi_col.array_nesting : 1;
-        dt = rebuild_array_type(FlattenedArrayType{
-            nesting,
-            ffi_col.element_data_type,
-            ffi_col.element_precision,
-            ffi_col.element_scale,
-        });
+        std::vector<uint8_t> array_nullability;
+        for (auto nullable : ffi_col.array_nullability) {
+            array_nullability.push_back(nullable);
+        }
+        auto dt = rebuild_array_type(
+            FlattenedArrayType{
+                nesting,
+                ffi_col.element_data_type,
+                ffi_col.element_precision,
+                ffi_col.element_scale,
+                std::move(array_nullability),
+            });
+        return Column{std::string(ffi_col.name), std::move(dt), std::string(ffi_col.comment)};
     }
+    DataType dt(type_id, ffi_col.precision, ffi_col.scale, ffi_col.nullable);
     return Column{std::string(ffi_col.name), std::move(dt), std::string(ffi_col.comment)};
 }
 
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 875373bcec..52df36869d 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -85,10 +85,12 @@ mod ffi {
     struct FfiColumn {
         name: String,
         data_type: i32,
+        nullable: bool,
         comment: String,
         precision: i32,
         scale: i32,
         array_nesting: i32,
+        array_nullability: Vec<u8>,
         element_data_type: i32,
         element_precision: i32,
         element_scale: i32,
@@ -3612,8 +3614,9 @@ impl ArrayWriterInner {
 
 /// Structural type equivalence that ignores nullability flags but preserves
 /// variant and precision/scale semantics. Used to compare ArrayWriter element
-/// types on the binding boundary, where C++ callers never control nullability
-/// explicitly.
+/// types on the binding boundary. Nullability is ignored in structural comparison
+/// because the Rust-side element type is always reconstructed as nullable
+/// (encoding doesn't depend on it).
 fn structurally_compatible(a: &fcore::metadata::DataType, b: &fcore::metadata::DataType) -> bool {
     use fcore::metadata::DataType;
     match (a, b) {
diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index c15aadc980..f61711b502 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -41,16 +41,43 @@ pub const DATA_TYPE_CHAR: i32 = 15;
 pub const DATA_TYPE_BINARY: i32 = 16;
 pub const DATA_TYPE_ARRAY: i32 = 17;
 
+/// Separates scalar and array type specs so each variant only carries
+/// the fields it actually needs — no zeroed-out placeholders.
+enum FfiDataTypeSpec {
+    Scalar {
+        data_type: i32,
+        precision: u32,
+        scale: u32,
+        nullable: bool,
+    },
+    Array {
+        element_data_type: i32,
+        element_precision: u32,
+        element_scale: u32,
+        array_nesting: u32,
+        /// `nesting` entries for each ARRAY wrapper (outermost first) plus
+        /// one trailing entry for the leaf scalar. Length = `nesting + 1`.
+        array_nullability: Vec<u8>,
+    },
+}
+
 fn ffi_column_to_core_data_type(col: &ffi::FfiColumn) -> Result<fcore::metadata::DataType> {
-    ffi_data_type_to_core(
-        col.data_type,
-        col.precision as u32,
-        col.scale as u32,
-        col.element_data_type,
-        col.element_precision as u32,
-        col.element_scale as u32,
-        col.array_nesting.max(0) as u32,
-    )
+    if col.data_type == DATA_TYPE_ARRAY {
+        ffi_data_type_to_core(FfiDataTypeSpec::Array {
+            element_data_type: col.element_data_type,
+            element_precision: col.element_precision as u32,
+            element_scale: col.element_scale as u32,
+            array_nesting: col.array_nesting.max(0) as u32,
+            array_nullability: col.array_nullability.clone(),
+        })
+    } else {
+        ffi_data_type_to_core(FfiDataTypeSpec::Scalar {
+            data_type: col.data_type,
+            precision: col.precision as u32,
+            scale: col.scale as u32,
+            nullable: col.nullable,
+        })
+    }
 }
 
 fn type_precision_scale(dt: &fcore::metadata::DataType) -> (i32, i32) {
@@ -64,11 +91,23 @@ fn type_precision_scale(dt: &fcore::metadata::DataType) -> (i32, i32) {
     }
 }
 
-fn flatten_array_leaf_type(dt: &fcore::metadata::DataType) -> Result<(i32, i32, i32, i32)> {
+struct FlattenedLeafType {
+    nesting: i32,
+    leaf_type: i32,
+    leaf_precision: i32,
+    leaf_scale: i32,
+    /// `nesting` entries for ARRAY wrappers (outermost first) plus one
+    /// trailing entry for the leaf scalar. Length = `nesting + 1`.
+    array_nullability: Vec<u8>,
+}
+
+fn flatten_array_leaf_type(dt: &fcore::metadata::DataType) -> Result<FlattenedLeafType> {
     let mut nesting = 0_i32;
     let mut leaf = dt;
+    let mut array_nullability = Vec::new();
     while let fcore::metadata::DataType::Array(at) = leaf {
         nesting += 1;
+        array_nullability.push(u8::from(leaf.is_nullable()));
         leaf = at.get_element_type();
     }
     if nesting == 0 {
@@ -80,85 +119,102 @@ fn flatten_array_leaf_type(dt: &fcore::metadata::DataType) -> Result<(i32, i32,
             "Unsupported ARRAY leaf type for C++ bindings: {leaf}"
         ));
     }
+    array_nullability.push(u8::from(leaf.is_nullable()));
     let (leaf_precision, leaf_scale) = type_precision_scale(leaf);
-    Ok((nesting, leaf_type, leaf_precision, leaf_scale))
+    Ok(FlattenedLeafType {
+        nesting,
+        leaf_type,
+        leaf_precision,
+        leaf_scale,
+        array_nullability,
+    })
 }
 
 fn build_array_type_from_leaf(
-    leaf_dt: i32,
-    leaf_precision: u32,
-    leaf_scale: u32,
-    nesting: u32,
+    element_data_type: i32,
+    element_precision: u32,
+    element_scale: u32,
+    array_nesting: u32,
+    array_nullability: &[u8],
 ) -> Result<fcore::metadata::DataType> {
-    if nesting == 0 {
+    if array_nesting == 0 {
         return Err(anyhow!("ARRAY nesting must be >= 1"));
     }
-    let mut dt = ffi_data_type_to_core(leaf_dt, leaf_precision, leaf_scale, 0, 0, 0, 0)?;
-    for _ in 0..nesting {
-        dt = fcore::metadata::DataTypes::array(dt);
+    let leaf_nullable = array_nullability
+        .get(array_nesting as usize)
+        .map(|v| *v != 0)
+        .unwrap_or(true);
+    let mut dt = ffi_data_type_to_core(FfiDataTypeSpec::Scalar {
+        data_type: element_data_type,
+        precision: element_precision,
+        scale: element_scale,
+        nullable: leaf_nullable,
+    })?;
+    for i in (0..array_nesting).rev() {
+        let nullable = array_nullability
+            .get(i as usize)
+            .map(|v| *v != 0)
+            .unwrap_or(true);
+        dt = fcore::metadata::DataType::Array(fcore::metadata::ArrayType::with_nullable(
+            nullable, dt,
+        ));
     }
     Ok(dt)
 }
 
-fn ffi_data_type_to_core(
-    dt: i32,
-    precision: u32,
-    scale: u32,
-    element_dt: i32,
-    element_precision: u32,
-    element_scale: u32,
-    array_nesting: u32,
-) -> Result<fcore::metadata::DataType> {
-    match dt {
-        DATA_TYPE_BOOLEAN => Ok(fcore::metadata::DataTypes::boolean()),
-        DATA_TYPE_TINYINT => Ok(fcore::metadata::DataTypes::tinyint()),
-        DATA_TYPE_SMALLINT => Ok(fcore::metadata::DataTypes::smallint()),
-        DATA_TYPE_INT => Ok(fcore::metadata::DataTypes::int()),
-        DATA_TYPE_BIGINT => Ok(fcore::metadata::DataTypes::bigint()),
-        DATA_TYPE_FLOAT => Ok(fcore::metadata::DataTypes::float()),
-        DATA_TYPE_DOUBLE => Ok(fcore::metadata::DataTypes::double()),
-        DATA_TYPE_STRING => Ok(fcore::metadata::DataTypes::string()),
-        DATA_TYPE_BYTES => Ok(fcore::metadata::DataTypes::bytes()),
-        DATA_TYPE_DATE => Ok(fcore::metadata::DataTypes::date()),
-        DATA_TYPE_TIME => Ok(fcore::metadata::DataTypes::time()),
-        DATA_TYPE_TIMESTAMP => Ok(fcore::metadata::DataTypes::timestamp_with_precision(
-            precision,
-        )),
-        DATA_TYPE_TIMESTAMP_LTZ => Ok(fcore::metadata::DataTypes::timestamp_ltz_with_precision(
+fn ffi_data_type_to_core(spec: FfiDataTypeSpec) -> Result<fcore::metadata::DataType> {
+    match spec {
+        FfiDataTypeSpec::Scalar {
+            data_type,
             precision,
-        )),
-        DATA_TYPE_DECIMAL => {
-            let dt = fcore::metadata::DecimalType::new(precision, scale)?;
-            Ok(fcore::metadata::DataType::Decimal(dt))
-        }
-        DATA_TYPE_CHAR => Ok(fcore::metadata::DataTypes::char(precision)),
-        DATA_TYPE_BINARY => Ok(fcore::metadata::DataTypes::binary(precision as usize)),
-        DATA_TYPE_ARRAY => {
-            if array_nesting > 0 {
-                build_array_type_from_leaf(
-                    element_dt,
-                    element_precision,
-                    element_scale,
-                    array_nesting,
-                )
-            } else {
-                // Backward compatibility for older one-level metadata.
-                if element_dt == 0 {
-                    return Err(anyhow!("ARRAY requires element type metadata"));
+            scale,
+            nullable,
+        } => {
+            let dt = match data_type {
+                DATA_TYPE_BOOLEAN => fcore::metadata::DataTypes::boolean(),
+                DATA_TYPE_TINYINT => fcore::metadata::DataTypes::tinyint(),
+                DATA_TYPE_SMALLINT => fcore::metadata::DataTypes::smallint(),
+                DATA_TYPE_INT => fcore::metadata::DataTypes::int(),
+                DATA_TYPE_BIGINT => fcore::metadata::DataTypes::bigint(),
+                DATA_TYPE_FLOAT => fcore::metadata::DataTypes::float(),
+                DATA_TYPE_DOUBLE => fcore::metadata::DataTypes::double(),
+                DATA_TYPE_STRING => fcore::metadata::DataTypes::string(),
+                DATA_TYPE_BYTES => fcore::metadata::DataTypes::bytes(),
+                DATA_TYPE_DATE => fcore::metadata::DataTypes::date(),
+                DATA_TYPE_TIME => fcore::metadata::DataTypes::time(),
+                DATA_TYPE_TIMESTAMP => {
+                    fcore::metadata::DataTypes::timestamp_with_precision(precision)
+                }
+                DATA_TYPE_TIMESTAMP_LTZ => {
+                    fcore::metadata::DataTypes::timestamp_ltz_with_precision(precision)
+                }
+                DATA_TYPE_DECIMAL => {
+                    let dt = fcore::metadata::DecimalType::new(precision, scale)?;
+                    fcore::metadata::DataType::Decimal(dt)
                 }
-                let element_type = ffi_data_type_to_core(
-                    element_dt,
-                    element_precision,
-                    element_scale,
-                    0,
-                    0,
-                    0,
-                    0,
-                )?;
-                Ok(fcore::metadata::DataTypes::array(element_type))
+                DATA_TYPE_CHAR => fcore::metadata::DataTypes::char(precision),
+                DATA_TYPE_BINARY => fcore::metadata::DataTypes::binary(precision as usize),
+                _ => return Err(anyhow!("Unknown data type: {}", data_type)),
+            };
+            if nullable {
+                Ok(dt)
+            } else {
+                Ok(dt.as_non_nullable())
             }
         }
-        _ => Err(anyhow!("Unknown data type: {dt}")),
+        FfiDataTypeSpec::Array {
+            element_data_type,
+            element_precision,
+            element_scale,
+            array_nesting,
+            ref array_nullability,
+        } => build_array_type_from_leaf(
+            element_data_type,
+            element_precision,
+            element_scale,
+            array_nesting,
+            array_nullability,
+        ),
     }
 }
 
@@ -188,24 +244,25 @@ pub fn core_data_type_to_ffi(dt: &fcore::metadata::DataType) -> i32 {
 fn core_column_to_ffi(col: &fcore::metadata::Column) -> ffi::FfiColumn {
     let (precision, scale) = type_precision_scale(col.data_type());
 
-    let (array_nesting, element_data_type, element_precision, element_scale) = match col.data_type()
-    {
-        fcore::metadata::DataType::Array(_) => {
-            flatten_array_leaf_type(col.data_type()).unwrap_or((0, 0, 0, 0))
-        }
-        _ => (0, 0, 0, 0),
+    let flat = match col.data_type() {
+        fcore::metadata::DataType::Array(_) => flatten_array_leaf_type(col.data_type()).ok(),
+        _ => None,
     };
 
     ffi::FfiColumn {
         name: col.name().to_string(),
         data_type: core_data_type_to_ffi(col.data_type()),
+        nullable: col.data_type().is_nullable(),
         comment: col.comment().unwrap_or("").to_string(),
         precision,
         scale,
-        array_nesting,
-        element_data_type,
-        element_precision,
-        element_scale,
+        array_nesting: flat.as_ref().map_or(0, |f| f.nesting),
+        array_nullability: flat
+            .as_ref()
+            .map_or_else(Vec::new, |f| f.array_nullability.clone()),
+        element_data_type: flat.as_ref().map_or(0, |f| f.leaf_type),
+        element_precision: flat.as_ref().map_or(0, |f| f.leaf_precision),
+        element_scale: flat.as_ref().map_or(0, |f| f.leaf_scale),
     }
 }
 
@@ -347,6 +404,11 @@ pub fn empty_table_info() -> ffi::FfiTableInfo {
 
 /// Convert element type tag + precision/scale to core DataType.
 /// Used by ArrayWriterInner construction from C++.
+///
+/// Nullability is hardcoded to `true` (the default) because `ArrayWriter`
+/// only needs the type for encoding — the binary array format does not
+/// vary based on nullability. Nullability is a schema-level constraint
+/// enforced elsewhere (column definition, primary key normalization).
 pub fn element_type_from_ffi(
     leaf_dt: i32,
     precision: u32,
@@ -354,9 +416,15 @@ pub fn element_type_from_ffi(
     array_nesting: u32,
 ) -> Result<fcore::metadata::DataType> {
     if array_nesting == 0 {
-        ffi_data_type_to_core(leaf_dt, precision, scale, 0, 0, 0, 0)
+        ffi_data_type_to_core(FfiDataTypeSpec::Scalar {
+            data_type: leaf_dt,
+            precision,
+            scale,
+            nullable: true,
+        })
     } else {
-        build_array_type_from_leaf(leaf_dt, precision, scale, array_nesting)
+        let array_nullability = vec![1u8; (array_nesting + 1) as usize];
+        build_array_type_from_leaf(leaf_dt, precision, scale, array_nesting, &array_nullability)
     }
 }
 
diff --git a/fluss-rust/bindings/cpp/test/test_ffi_converter.cpp b/fluss-rust/bindings/cpp/test/test_ffi_converter.cpp
index 4bbe3ebbaf..2078bdabb4 100644
--- a/fluss-rust/bindings/cpp/test/test_ffi_converter.cpp
+++ b/fluss-rust/bindings/cpp/test/test_ffi_converter.cpp
@@ -24,20 +24,50 @@
 
 namespace {
 
-fluss::ffi::FfiColumn MakeArrayColumn(int32_t nesting, int32_t element_type) {
+fluss::ffi::FfiColumn MakeArrayColumn(int32_t nesting, int32_t element_type,
+                                      bool nullable = true, bool leaf_nullable = true,
+                                      std::vector<uint8_t> per_level_nullability = {}) {
     fluss::ffi::FfiColumn col;
     col.name = rust::String("bad_array");
     col.data_type = static_cast<int32_t>(fluss::TypeId::Array);
+    col.nullable = nullable;
     col.comment = rust::String("");
     col.precision = 0;
     col.scale = 0;
     col.array_nesting = nesting;
+    if (!per_level_nullability.empty()) {
+        for (auto v : per_level_nullability) {
+            col.array_nullability.push_back(v);
+        }
+    } else {
+        for (int32_t i = 0; i < nesting; ++i) {
+            col.array_nullability.push_back((i == 0 ? nullable : true) ? 1 : 0);
+        }
+        col.array_nullability.push_back(leaf_nullable ? 1 : 0);
+    }
     col.element_data_type = element_type;
     col.element_precision = 0;
     col.element_scale = 0;
     return col;
 }
 
+fluss::ffi::FfiColumn MakeScalarColumn(const char* name, fluss::TypeId type_id,
+                                       bool nullable = true, int32_t precision = 0,
+                                       int32_t scale = 0) {
+    fluss::ffi::FfiColumn col;
+    col.name = rust::String(name);
+    col.data_type = static_cast<int32_t>(type_id);
+    col.nullable = nullable;
+    col.comment = rust::String("");
+    col.precision = precision;
+    col.scale = scale;
+    col.array_nesting = 0;
+    col.element_data_type = 0;
+    col.element_precision = 0;
+    col.element_scale = 0;
+    return col;
+}
+
 }  // namespace
 
 TEST(FfiConverterTest, RejectsArrayWithoutElementType) {
@@ -62,3 +92,149 @@ TEST(FfiConverterTest, SupportsLegacyOneLevelArrayMetadata) {
     ASSERT_NE(converted.data_type.element_type(), nullptr);
     EXPECT_EQ(converted.data_type.element_type()->id(), fluss::TypeId::Int);
 }
+
+// --- Nullability tests ---
+
+TEST(DataTypeTest, DefaultNullable) {
+    const auto int_type = fluss::DataType::Int();
+    EXPECT_TRUE(int_type.nullable());  // no NotNull() applied, so nullable is expected
+}
+
+TEST(DataTypeTest, NotNullMethod) {
+    const auto strict_int = fluss::DataType::Int().NotNull();
+    EXPECT_FALSE(strict_int.nullable());
+    EXPECT_EQ(strict_int.id(), fluss::TypeId::Int);  // type id must survive NotNull()
+}
+
+TEST(DataTypeTest, NotNullPreservesPrecisionScale) {
+    auto strict_decimal = fluss::DataType::Decimal(10, 2).NotNull();
+    EXPECT_FALSE(strict_decimal.nullable());
+    EXPECT_EQ(strict_decimal.precision(), 10);
+    EXPECT_EQ(strict_decimal.scale(), 2);
+}
+
+TEST(DataTypeTest, ArrayElementNullability) {
+    const auto array_type = fluss::DataType::Array(fluss::DataType::Int().NotNull());
+    EXPECT_TRUE(array_type.nullable());  // only the element was marked NOT NULL
+    ASSERT_NE(array_type.element_type(), nullptr);
+    EXPECT_FALSE(array_type.element_type()->nullable());
+}
+
+TEST(DataTypeTest, NotNullArrayNullableElement) {
+    const auto array_type = fluss::DataType::Array(fluss::DataType::Int()).NotNull();
+    EXPECT_FALSE(array_type.nullable());  // only the outer array was marked NOT NULL
+    ASSERT_NE(array_type.element_type(), nullptr);
+    EXPECT_TRUE(array_type.element_type()->nullable());
+}
+
+TEST(DataTypeTest, NotNullArrayNotNullElement) {
+    const auto strict = fluss::DataType::Array(fluss::DataType::Int().NotNull()).NotNull();
+    EXPECT_FALSE(strict.nullable());
+    ASSERT_NE(strict.element_type(), nullptr);
+    EXPECT_FALSE(strict.element_type()->nullable());
+}
+
+TEST(FfiConverterTest, ScalarNullableRoundTrip) {
+    fluss::Column src{"id", fluss::DataType::Int(), ""};
+    auto wire = fluss::utils::to_ffi_column(src);
+    EXPECT_TRUE(wire.nullable);
+    auto restored = fluss::utils::from_ffi_column(wire);
+    EXPECT_TRUE(restored.data_type.nullable());
+}
+
+TEST(FfiConverterTest, ScalarNotNullRoundTrip) {
+    fluss::Column src{"id", fluss::DataType::Int().NotNull(), ""};
+    auto wire = fluss::utils::to_ffi_column(src);
+    EXPECT_FALSE(wire.nullable);
+    auto restored = fluss::utils::from_ffi_column(wire);
+    EXPECT_FALSE(restored.data_type.nullable());
+}
+
+TEST(FfiConverterTest, ArrayNotNullElementRoundTrip) {
+    fluss::Column src{"tags", fluss::DataType::Array(fluss::DataType::String().NotNull()), ""};
+    auto wire = fluss::utils::to_ffi_column(src);
+    EXPECT_TRUE(wire.nullable);
+    ASSERT_EQ(wire.array_nullability.size(), 2u);  // one array level + the leaf
+    EXPECT_EQ(wire.array_nullability[1], 0);
+    auto restored = fluss::utils::from_ffi_column(wire);
+    EXPECT_TRUE(restored.data_type.nullable());
+    ASSERT_NE(restored.data_type.element_type(), nullptr);
+    EXPECT_FALSE(restored.data_type.element_type()->nullable());
+}
+
+TEST(FfiConverterTest, NotNullArrayNullableElementRoundTrip) {
+    fluss::Column src{"ids", fluss::DataType::Array(fluss::DataType::Int()).NotNull(), ""};
+    auto wire = fluss::utils::to_ffi_column(src);
+    EXPECT_FALSE(wire.nullable);
+    ASSERT_EQ(wire.array_nullability.size(), 2u);  // one array level + the leaf
+    EXPECT_EQ(wire.array_nullability[1], 1);
+    auto restored = fluss::utils::from_ffi_column(wire);
+    EXPECT_FALSE(restored.data_type.nullable());
+    ASSERT_NE(restored.data_type.element_type(), nullptr);
+    EXPECT_TRUE(restored.data_type.element_type()->nullable());
+}
+
+TEST(FfiConverterTest, NotNullArrayNotNullElementRoundTrip) {
+    fluss::Column src{
+        "strict_ids",
+        fluss::DataType::Array(fluss::DataType::Int().NotNull()).NotNull(),
+        "",
+    };
+    auto wire = fluss::utils::to_ffi_column(src);
+    EXPECT_FALSE(wire.nullable);
+    ASSERT_EQ(wire.array_nullability.size(), 2u);  // one array level + the leaf
+    EXPECT_EQ(wire.array_nullability[1], 0);
+    auto restored = fluss::utils::from_ffi_column(wire);
+    EXPECT_FALSE(restored.data_type.nullable());
+    ASSERT_NE(restored.data_type.element_type(), nullptr);
+    EXPECT_FALSE(restored.data_type.element_type()->nullable());
+}
+
+TEST(FfiConverterTest, NestedArrayIntermediateNullabilityRoundTrip) {
+    fluss::Column src{
+        "nested",
+        fluss::DataType::Array(fluss::DataType::Array(fluss::DataType::Int()).NotNull()),
+        "",
+    };
+    auto wire = fluss::utils::to_ffi_column(src);
+    auto restored = fluss::utils::from_ffi_column(wire);
+
+    EXPECT_TRUE(restored.data_type.nullable());
+    ASSERT_NE(restored.data_type.element_type(), nullptr);
+    EXPECT_FALSE(restored.data_type.element_type()->nullable());  // inner array is NOT NULL
+    ASSERT_NE(restored.data_type.element_type()->element_type(), nullptr);
+    EXPECT_TRUE(restored.data_type.element_type()->element_type()->nullable());
+}
+
+TEST(FfiConverterTest, NestedArrayAllLevelsNullabilityRoundTrip) {
+    fluss::Column src{
+        "strict_nested",
+        fluss::DataType::Array(
+            fluss::DataType::Array(fluss::DataType::Int().NotNull()).NotNull())
+            .NotNull(),
+        "",
+    };
+    auto wire = fluss::utils::to_ffi_column(src);
+    auto restored = fluss::utils::from_ffi_column(wire);
+
+    EXPECT_FALSE(restored.data_type.nullable());
+    ASSERT_NE(restored.data_type.element_type(), nullptr);
+    EXPECT_FALSE(restored.data_type.element_type()->nullable());
+    ASSERT_NE(restored.data_type.element_type()->element_type(), nullptr);
+    EXPECT_FALSE(restored.data_type.element_type()->element_type()->nullable());
+}
+
+TEST(FfiConverterTest, FfiColumnNonNullableScalarReconstructed) {
+    auto ffi_col = MakeScalarColumn("id", fluss::TypeId::Int, /*nullable=*/false);
+    auto column = fluss::utils::from_ffi_column(ffi_col);
+    EXPECT_FALSE(column.data_type.nullable());
+    EXPECT_EQ(column.data_type.id(), fluss::TypeId::Int);
+}
+
+TEST(FfiConverterTest, FfiColumnNonNullableArrayReconstructed) {
+    auto ffi_col = MakeArrayColumn(1, static_cast<int32_t>(fluss::TypeId::String), false, false);
+    auto column = fluss::utils::from_ffi_column(ffi_col);
+    EXPECT_FALSE(column.data_type.nullable());  // outer array flag
+    ASSERT_NE(column.data_type.element_type(), nullptr);
+    EXPECT_FALSE(column.data_type.element_type()->nullable());  // leaf flag
+}
diff --git a/fluss-rust/bindings/cpp/test/test_log_table.cpp b/fluss-rust/bindings/cpp/test/test_log_table.cpp
index f36c870766..5678e4bb10 100644
--- a/fluss-rust/bindings/cpp/test/test_log_table.cpp
+++ b/fluss-rust/bindings/cpp/test/test_log_table.cpp
@@ -1458,3 +1458,66 @@ TEST_F(LogTableTest, ArrayWriterOverflowDetection) {
         EXPECT_NO_THROW(smallint_arr.SetInt32(0, 32767));
     }
 }
+
+TEST_F(LogTableTest, NullabilityPreservedInTableInfo) {
+    auto& adm = admin();
+    auto& conn = connection();
+
+    fluss::TablePath table_path("fluss", "test_nullability_table_info_cpp");
+
+    auto schema =
+        fluss::Schema::NewBuilder()
+            .AddColumn("id", fluss::DataType::Int())  // declared nullable; it is the PK
+            .AddColumn("name", fluss::DataType::String())
+            .AddColumn("tags", fluss::DataType::Array(fluss::DataType::String().NotNull()))
+            .AddColumn("ids", fluss::DataType::Array(fluss::DataType::Int()).NotNull())
+            .AddColumn("nested",
+                       fluss::DataType::Array(
+                           fluss::DataType::Array(fluss::DataType::Int()).NotNull()))
+            .SetPrimaryKeys({"id"})
+            .Build();
+
+    auto table_descriptor = fluss::TableDescriptor::NewBuilder()
+                                .SetSchema(schema)
+                                .SetProperty("table.replication.factor", "1")
+                                .Build();
+
+    fluss_test::CreateTable(adm, table_path, table_descriptor);
+
+    fluss::Table table;
+    ASSERT_OK(conn.GetTable(table_path, table));
+    auto info = table.GetTableInfo();
+
+    ASSERT_EQ(info.schema.columns.size(), 5u);  // guards the columns[0..4] accesses below
+    EXPECT_EQ(info.primary_keys, std::vector<std::string>{"id"});
+
+    // "id" INT: declared nullable above, but primary key columns are forced NOT NULL.
+    EXPECT_EQ(info.schema.columns[0].data_type.id(), fluss::TypeId::Int);
+    EXPECT_FALSE(info.schema.columns[0].data_type.nullable());
+
+    // "name" STRING (nullable)
+    EXPECT_EQ(info.schema.columns[1].data_type.id(), fluss::TypeId::String);
+    EXPECT_TRUE(info.schema.columns[1].data_type.nullable());
+
+    // "tags" ARRAY<STRING NOT NULL> (outer nullable)
+    EXPECT_EQ(info.schema.columns[2].data_type.id(), fluss::TypeId::Array);
+    EXPECT_TRUE(info.schema.columns[2].data_type.nullable());
+    ASSERT_NE(info.schema.columns[2].data_type.element_type(), nullptr);
+    EXPECT_FALSE(info.schema.columns[2].data_type.element_type()->nullable());
+
+    // "ids" ARRAY<INT> NOT NULL (outer not null, element nullable)
+    EXPECT_EQ(info.schema.columns[3].data_type.id(), fluss::TypeId::Array);
+    EXPECT_FALSE(info.schema.columns[3].data_type.nullable());
+    ASSERT_NE(info.schema.columns[3].data_type.element_type(), nullptr);
+    EXPECT_TRUE(info.schema.columns[3].data_type.element_type()->nullable());
+
+    // "nested" ARRAY<ARRAY<INT> NOT NULL> (outer nullable, inner array not null)
+    EXPECT_EQ(info.schema.columns[4].data_type.id(), fluss::TypeId::Array);
+    EXPECT_TRUE(info.schema.columns[4].data_type.nullable());
+    ASSERT_NE(info.schema.columns[4].data_type.element_type(), nullptr);
+    EXPECT_FALSE(info.schema.columns[4].data_type.element_type()->nullable());
+    ASSERT_NE(info.schema.columns[4].data_type.element_type()->element_type(), nullptr);
+    EXPECT_TRUE(info.schema.columns[4].data_type.element_type()->element_type()->nullable());
+
+    ASSERT_OK(adm.DropTable(table_path, false));  // not reached if an ASSERT_* above fails
+}
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index c50d40cda2..ae4e9490a5 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -492,7 +492,9 @@ Same array getters as [`RowView`](#array-getters-index-based) — `GetArraySize`
 | `id() -> TypeId`                    | Get the type ID                             |
 | `precision() -> int`               | Get precision (for Decimal/Timestamp types) |
 | `scale() -> int`                   | Get scale (for Decimal type)                |
+| `nullable() -> bool`               | Returns `true` if this type is nullable (default), `false` if `NOT NULL` |
 | `element_type() -> const DataType*` | Get element type (for Array type, nullptr otherwise) |
+| `NotNull() -> DataType`            | Returns a copy of this type with nullable set to `false` |
 
 ## `ArrayWriter`
 
diff --git a/fluss-rust/website/docs/user-guide/cpp/data-types.md b/fluss-rust/website/docs/user-guide/cpp/data-types.md
index 400b2ecf07..cce40cefa1 100644
--- a/fluss-rust/website/docs/user-guide/cpp/data-types.md
+++ b/fluss-rust/website/docs/user-guide/cpp/data-types.md
@@ -23,6 +23,40 @@ sidebar_position: 3
 | `DataType::Decimal(p, s)`  | Decimal with precision and scale                               |
 | `DataType::Array(element)` | Array of the given element type (supports nesting)             |
 
+## Nullability
+
+All `DataType` values are nullable by default. Call `.NotNull()` on a type to get a `NOT NULL` copy of it:
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("id", fluss::DataType::Int().NotNull())
+    .AddColumn("name", fluss::DataType::String())          // nullable by default
+    .Build();
+```
+
+Primary key columns are automatically forced to `NOT NULL`, even if their `DataType` was declared nullable.
+
+For array types (including nested arrays), nullability is preserved separately for each array level and for the leaf element:
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("tags", fluss::DataType::Array(fluss::DataType::String().NotNull()))
+    .AddColumn("ids", fluss::DataType::Array(fluss::DataType::Int()).NotNull())
+    .AddColumn("nested", fluss::DataType::Array(
+        fluss::DataType::Array(fluss::DataType::Int()).NotNull()))
+    .Build();
+// "tags":   ARRAY<STRING NOT NULL>         (outer nullable, elements NOT NULL)
+// "ids":    ARRAY<INT> NOT NULL            (outer NOT NULL, elements nullable)
+// "nested": ARRAY<ARRAY<INT> NOT NULL>     (outer nullable, inner array NOT NULL)
+```
+
+You can query nullability at runtime:
+
+```cpp
+auto info = table.GetTableInfo();
+bool is_nullable = info.schema.columns[0].data_type.nullable();
+```
+
 ## GenericRow Setters
 
 `SetInt32` is used for `TinyInt`, `SmallInt`, and `Int` columns. For `TinyInt` and `SmallInt`, the value is validated at write time — an error is returned if it overflows the column's range (e.g., \[-128, 127\] for `TinyInt`, \[-32768, 32767\] for `SmallInt`).

From e274bd15607bbdc30b9b47f2d9cbc8fedea6b8ef Mon Sep 17 00:00:00 2001
From: Hongshun Wang <125648852+loserwang1024@users.noreply.github.com>
Date: Sat, 9 May 2026 16:53:13 +0800
Subject: [PATCH 260/287] [rust] Support API_VERSION in rust client. (#531)

* [rust] Support API_VERSION in rust client

* Remove the unused write_version_type and read_version_type, matching what the Java client does.

* Add test about kv_format_v2.

* return apiKey.highestSupportedVersion as default.

* Check for a server type mismatch.

* add test about unknown server type
---
 .../crates/fluss-test-cluster/test-images.env |   2 +-
 .../fluss/src/client/lookup/lookup_sender.rs  |   8 +-
 fluss-rust/crates/fluss/src/cluster/mod.rs    |  17 +
 fluss-rust/crates/fluss/src/error.rs          |  12 +
 .../crates/fluss/src/proto/fluss_api.proto    |  19 +-
 fluss-rust/crates/fluss/src/rpc/api_key.rs    |  45 +++
 .../fluss/src/rpc/message/api_versions.rs     |  50 +++
 .../fluss/src/rpc/message/authenticate.rs     |  10 +-
 .../fluss/src/rpc/message/create_database.rs  |  11 +-
 .../fluss/src/rpc/message/create_partition.rs |  11 +-
 .../fluss/src/rpc/message/create_table.rs     |  11 +-
 .../fluss/src/rpc/message/database_exists.rs  |  10 +-
 .../fluss/src/rpc/message/drop_database.rs    |  10 +-
 .../fluss/src/rpc/message/drop_partition.rs   |  11 +-
 .../fluss/src/rpc/message/drop_table.rs       |  11 +-
 .../crates/fluss/src/rpc/message/fetch.rs     |  11 +-
 .../src/rpc/message/get_database_info.rs      |  10 +-
 .../rpc/message/get_latest_lake_snapshot.rs   |  10 +-
 .../src/rpc/message/get_security_token.rs     |  10 +-
 .../crates/fluss/src/rpc/message/get_table.rs |  10 +-
 .../fluss/src/rpc/message/get_table_schema.rs |  10 +-
 .../crates/fluss/src/rpc/message/header.rs    |  10 +-
 .../fluss/src/rpc/message/init_writer.rs      |  11 +-
 .../fluss/src/rpc/message/limit_scan.rs       |  11 +-
 .../fluss/src/rpc/message/list_databases.rs   |  10 +-
 .../fluss/src/rpc/message/list_offsets.rs     |  13 +-
 .../src/rpc/message/list_partition_infos.rs   |  11 +-
 .../fluss/src/rpc/message/list_tables.rs      |  11 +-
 .../crates/fluss/src/rpc/message/lookup.rs    |  13 +-
 .../crates/fluss/src/rpc/message/mod.rs       |  31 +-
 .../fluss/src/rpc/message/prefix_lookup.rs    |  13 +-
 .../fluss/src/rpc/message/produce_log.rs      |  11 +-
 .../crates/fluss/src/rpc/message/put_kv.rs    |  11 +-
 .../fluss/src/rpc/message/table_exists.rs     |  11 +-
 .../fluss/src/rpc/message/update_metadata.rs  |  11 +-
 .../crates/fluss/src/rpc/server_connection.rs | 341 ++++++++++++++++--
 .../fluss/tests/integration/kv_table.rs       |  71 ++++
 37 files changed, 642 insertions(+), 247 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/rpc/message/api_versions.rs

diff --git a/fluss-rust/crates/fluss-test-cluster/test-images.env b/fluss-rust/crates/fluss-test-cluster/test-images.env
index 3aa8e735cf..5cd914172c 100644
--- a/fluss-rust/crates/fluss-test-cluster/test-images.env
+++ b/fluss-rust/crates/fluss-test-cluster/test-images.env
@@ -1,4 +1,4 @@
 FLUSS_IMAGE=apache/fluss
-FLUSS_VERSION=0.9.0-incubating
+FLUSS_VERSION=0.9.1-incubating
 ZOOKEEPER_IMAGE=zookeeper
 ZOOKEEPER_VERSION=3.9.2
diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
index efcd68538f..1e337f8395 100644
--- a/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
@@ -22,9 +22,7 @@ use crate::error::{Error, FlussError, Result};
 use crate::metadata::{TableBucket, TablePath};
 use crate::proto::{LookupResponse, PrefixLookupResponse};
 use crate::rpc::ServerConnection;
-use crate::rpc::message::{
-    LookupRequest, PrefixLookupRequest, ReadVersionedType, RequestBody, WriteVersionedType,
-};
+use crate::rpc::message::{LookupRequest, PrefixLookupRequest, ReadType, RequestBody, WriteType};
 use crate::{BucketId, PartitionId, TableId};
 use bytes::Bytes;
 use futures::stream::{FuturesUnordered, StreamExt};
@@ -51,8 +49,8 @@ struct BucketResponse<V> {
 }
 
 trait LookupProtocol {
-    type Request: RequestBody<ResponseBody = Self::Response> + Send + WriteVersionedType<Vec<u8>>;
-    type Response: ReadVersionedType<Cursor<Vec<u8>>> + Send;
+    type Request: RequestBody<ResponseBody = Self::Response> + Send + WriteType<Vec<u8>>;
+    type Response: ReadType<Cursor<Vec<u8>>> + Send;
     type Value: Send;
 
     const OP_NAME: &'static str;
diff --git a/fluss-rust/crates/fluss/src/cluster/mod.rs b/fluss-rust/crates/fluss/src/cluster/mod.rs
index 8b825eee20..863f8ed509 100644
--- a/fluss-rust/crates/fluss/src/cluster/mod.rs
+++ b/fluss-rust/crates/fluss/src/cluster/mod.rs
@@ -79,6 +79,23 @@ pub enum ServerType {
     CoordinatorServer,
 }
 
+impl ServerType {
+    pub fn to_type_id(&self) -> i32 {
+        match self {
+            Self::CoordinatorServer => 1,
+            Self::TabletServer => 2,
+        }
+    }
+
+    pub fn from_type_id(type_id: i32) -> Option<ServerType> {
+        match type_id {
+            1 => Some(Self::CoordinatorServer),
+            2 => Some(Self::TabletServer),
+            _ => None, // any other id is not a known server type
+        }
+    }
+}
+
 impl fmt::Display for ServerType {
     fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
         match self {
diff --git a/fluss-rust/crates/fluss/src/error.rs b/fluss-rust/crates/fluss/src/error.rs
index c2f72a74b0..4bd0690ead 100644
--- a/fluss-rust/crates/fluss/src/error.rs
+++ b/fluss-rust/crates/fluss/src/error.rs
@@ -115,6 +115,18 @@ pub enum Error {
 
     #[snafu(visibility(pub(crate)), display("Fluss API Error: {}.", api_error))]
     FlussAPIError { api_error: ApiError },
+
+    #[snafu(
+        visibility(pub(crate)),
+        display("Unsupported API version: {}.", message)
+    )]
+    UnsupportedVersion { message: String },
+
+    /// The server advertised a `server_type` that does not match the one expected
+    /// for the target `ServerNode` (e.g. connecting to a coordinator on a tablet
+    /// server address).
+    #[snafu(visibility(pub(crate)), display("Invalid server type: {}.", message))]
+    InvalidServerType { message: String },
 }
 
 /// Convenience constructors for API errors that may be raised client-side.
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
index a544906b1b..2add80d7f9 100644
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
@@ -24,6 +24,23 @@ message ErrorResponse {
   optional string error_message = 2;
 }
 
+// ApiVersions request and response: the client reports its name and version; the server replies with a version range per API key.
+message ApiVersionsRequest {
+  required string client_software_name = 1;
+  required string client_software_version = 2;
+}
+
+message ApiVersionsResponse {
+  repeated PbApiVersion api_versions = 1;
+  optional int32 server_type = 2; // NOTE(review): presumably a ServerType id (1 = coordinator, 2 = tablet); confirm
+}
+
+message PbApiVersion {
+  required int32 api_key = 1; // numeric API key (e.g. 1000 is the ApiVersion key itself)
+  required int32 min_version = 2; // NOTE(review): presumably inclusive bounds; confirm against the server
+  required int32 max_version = 3;
+}
+
 // metadata request and response, request send from client to each server.
 message MetadataRequest {
   repeated PbTablePath table_path = 1;
@@ -483,4 +500,4 @@ message InitWriterRequest {
 
 message InitWriterResponse {
   required int64 writer_id = 1;
-}
\ No newline at end of file
+}
diff --git a/fluss-rust/crates/fluss/src/rpc/api_key.rs b/fluss-rust/crates/fluss/src/rpc/api_key.rs
index 1ea0269d85..977b69d1d6 100644
--- a/fluss-rust/crates/fluss/src/rpc/api_key.rs
+++ b/fluss-rust/crates/fluss/src/rpc/api_key.rs
@@ -16,9 +16,11 @@
 // under the License.
 
 use crate::rpc::api_key::ApiKey::Unknown;
+use crate::rpc::api_version::{ApiVersion, ApiVersionRange};
 
 #[derive(Debug, PartialEq, Eq, PartialOrd, Ord, Hash, Clone, Copy)]
 pub enum ApiKey {
+    ApiVersion,                 // 1000
     CreateDatabase,             // 1001
     DropDatabase,               // 1002
     ListDatabases,              // 1003
@@ -48,9 +50,50 @@ pub enum ApiKey {
     Unknown(i16),
 }
 
+impl ApiKey {
+    /// Version range this client supports for the API key; `None` for `Unknown` keys.
+    pub fn supported_versions(&self) -> Option<ApiVersionRange> {
+        match self {
+            // Every known key currently maps to the same range: v0 only.
+            ApiKey::ApiVersion
+            | ApiKey::CreateDatabase
+            | ApiKey::DropDatabase
+            | ApiKey::ListDatabases
+            | ApiKey::DatabaseExists
+            | ApiKey::CreateTable
+            | ApiKey::DropTable
+            | ApiKey::GetTable
+            | ApiKey::ListTables
+            | ApiKey::ListPartitionInfos
+            | ApiKey::TableExists
+            | ApiKey::GetTableSchema
+            | ApiKey::MetaData
+            | ApiKey::ProduceLog
+            | ApiKey::FetchLog
+            | ApiKey::ListOffsets
+            | ApiKey::GetFileSystemSecurityToken
+            | ApiKey::InitWriter
+            | ApiKey::GetLatestLakeSnapshot
+            | ApiKey::LimitScan
+            | ApiKey::GetDatabaseInfo
+            | ApiKey::CreatePartition
+            | ApiKey::DropPartition
+            | ApiKey::Authenticate
+            // TODO(key-encoding-v1): The Java server supports v0..v1 for these
+            // APIs, but the Rust client has not yet implemented the v1 key
+            // encoding format. Pinned to v0 until that is done.
+            | ApiKey::PutKv | ApiKey::Lookup | ApiKey::PrefixLookup => {
+                Some(ApiVersionRange::new(ApiVersion(0), ApiVersion(0)))
+            }
+            Unknown(_) => None,
+        }
+    }
+}
+
 impl From<i16> for ApiKey {
     fn from(key: i16) -> Self {
         match key {
+            1000 => ApiKey::ApiVersion,
             1001 => ApiKey::CreateDatabase,
             1002 => ApiKey::DropDatabase,
             1003 => ApiKey::ListDatabases,
@@ -86,6 +129,7 @@ impl From<i16> for ApiKey {
 impl From<ApiKey> for i16 {
     fn from(key: ApiKey) -> Self {
         match key {
+            ApiKey::ApiVersion => 1000,
             ApiKey::CreateDatabase => 1001,
             ApiKey::DropDatabase => 1002,
             ApiKey::ListDatabases => 1003,
@@ -124,6 +168,7 @@ mod tests {
     #[test]
     fn api_key_round_trip() {
         let cases = [
+            (1000, ApiKey::ApiVersion),
             (1001, ApiKey::CreateDatabase),
             (1002, ApiKey::DropDatabase),
             (1003, ApiKey::ListDatabases),
diff --git a/fluss-rust/crates/fluss/src/rpc/message/api_versions.rs b/fluss-rust/crates/fluss/src/rpc/message/api_versions.rs
new file mode 100644
index 0000000000..579c66a7b1
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/rpc/message/api_versions.rs
@@ -0,0 +1,50 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+use crate::proto::{
+    ApiVersionsRequest as ProtoApiVersionsRequest, ApiVersionsResponse as ProtoApiVersionsResponse,
+};
+use crate::rpc::api_key::ApiKey;
+use crate::rpc::frame::{ReadError, WriteError};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type};
+use bytes::{Buf, BufMut};
+use prost::Message;
+
+#[derive(Debug, Clone)]
+pub struct ApiVersionsRequest {
+    pub inner_request: ProtoApiVersionsRequest, // protobuf message holding client name/version
+}
+
+impl ApiVersionsRequest {
+    pub fn new(client_name: &str, client_version: &str) -> Self {
+        let inner_request = ProtoApiVersionsRequest {
+            client_software_name: client_name.to_owned(),
+            client_software_version: client_version.to_owned(),
+        };
+
+        Self { inner_request }
+    }
+}
+
+impl RequestBody for ApiVersionsRequest {
+    type ResponseBody = ProtoApiVersionsResponse;
+    const API_KEY: ApiKey = ApiKey::ApiVersion; // numeric key 1000
+}
+
+impl_write_type!(ApiVersionsRequest);
+impl_read_type!(ProtoApiVersionsResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/authenticate.rs b/fluss-rust/crates/fluss/src/rpc/message/authenticate.rs
index 1292cdc919..1874b30463 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/authenticate.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/authenticate.rs
@@ -17,10 +17,9 @@
 
 use crate::proto::{AuthenticateRequest as ProtoAuthenticateRequest, AuthenticateResponse};
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::{ReadError, WriteError};
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -61,11 +60,10 @@ impl AuthenticateRequest {
 impl RequestBody for AuthenticateRequest {
     type ResponseBody = AuthenticateResponse;
     const API_KEY: ApiKey = ApiKey::Authenticate;
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(AuthenticateRequest);
-impl_read_version_type!(AuthenticateResponse);
+impl_write_type!(AuthenticateRequest);
+impl_read_type!(AuthenticateResponse);
 
 #[cfg(test)]
 mod tests {
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_database.rs b/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
index e03cd1ffa4..ed0868da6f 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_database.rs
@@ -16,15 +16,14 @@
 // under the License.
 
 use crate::metadata::DatabaseDescriptor;
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::{impl_read_type, impl_write_type, proto};
 
 use crate::error::Result as FlussResult;
 use crate::proto::CreateDatabaseResponse;
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::ReadError;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 
 use bytes::{Buf, BufMut};
 use prost::Message;
@@ -60,9 +59,7 @@ impl RequestBody for CreateDatabaseRequest {
     type ResponseBody = CreateDatabaseResponse;
 
     const API_KEY: ApiKey = ApiKey::CreateDatabase;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(CreateDatabaseRequest);
-impl_read_version_type!(CreateDatabaseResponse);
+impl_write_type!(CreateDatabaseRequest);
+impl_read_type!(CreateDatabaseResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs b/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs
index 93dbf70d3b..ad633655c0 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs
@@ -18,11 +18,10 @@
 use crate::metadata::{PartitionSpec, TablePath};
 use crate::proto::CreatePartitionResponse;
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::convert::to_table_path;
 use crate::rpc::frame::{ReadError, WriteError};
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -51,9 +50,7 @@ impl RequestBody for CreatePartitionRequest {
     type ResponseBody = CreatePartitionResponse;
 
     const API_KEY: ApiKey = ApiKey::CreatePartition;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(CreatePartitionRequest);
-impl_read_version_type!(CreatePartitionResponse);
+impl_write_type!(CreatePartitionRequest);
+impl_read_type!(CreatePartitionResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_table.rs b/fluss-rust/crates/fluss/src/rpc/message/create_table.rs
index 69865b8902..4647fec686 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/create_table.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_table.rs
@@ -16,16 +16,15 @@
 // under the License.
 
 use crate::metadata::{JsonSerde, TableDescriptor, TablePath};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::{impl_read_type, impl_write_type, proto};
 
 use crate::error::Result as FlussResult;
 use crate::proto::CreateTableResponse;
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::convert::to_table_path;
 use crate::rpc::frame::ReadError;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 
 use bytes::{Buf, BufMut};
 use prost::Message;
@@ -55,9 +54,7 @@ impl RequestBody for CreateTableRequest {
     type ResponseBody = CreateTableResponse;
 
     const API_KEY: ApiKey = ApiKey::CreateTable;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(CreateTableRequest);
-impl_read_version_type!(CreateTableResponse);
+impl_write_type!(CreateTableRequest);
+impl_read_type!(CreateTableResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs b/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs
index 7e717a4e7a..4a9588a209 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/database_exists.rs
@@ -18,10 +18,9 @@
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -44,8 +43,7 @@ impl RequestBody for DatabaseExistsRequest {
     type ResponseBody = proto::DatabaseExistsResponse;
 
     const API_KEY: ApiKey = ApiKey::DatabaseExists;
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(DatabaseExistsRequest);
-impl_read_version_type!(proto::DatabaseExistsResponse);
+impl_write_type!(DatabaseExistsRequest);
+impl_read_type!(proto::DatabaseExistsResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs b/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs
index 663e970a91..bf7477f311 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/drop_database.rs
@@ -18,10 +18,9 @@
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -46,8 +45,7 @@ impl RequestBody for DropDatabaseRequest {
     type ResponseBody = proto::DropDatabaseResponse;
 
     const API_KEY: ApiKey = ApiKey::DropDatabase;
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(DropDatabaseRequest);
-impl_read_version_type!(proto::DropDatabaseResponse);
+impl_write_type!(DropDatabaseRequest);
+impl_read_type!(proto::DropDatabaseResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/drop_partition.rs b/fluss-rust/crates/fluss/src/rpc/message/drop_partition.rs
index ddc97d8300..c7494acbac 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/drop_partition.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/drop_partition.rs
@@ -18,11 +18,10 @@
 use crate::metadata::{PartitionSpec, TablePath};
 use crate::proto::DropPartitionResponse;
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::convert::to_table_path;
 use crate::rpc::frame::{ReadError, WriteError};
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -51,9 +50,7 @@ impl RequestBody for DropPartitionRequest {
     type ResponseBody = DropPartitionResponse;
 
     const API_KEY: ApiKey = ApiKey::DropPartition;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(DropPartitionRequest);
-impl_read_version_type!(DropPartitionResponse);
+impl_write_type!(DropPartitionRequest);
+impl_read_type!(DropPartitionResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs b/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs
index a2b3f2d129..b452cf075e 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/drop_table.rs
@@ -16,16 +16,15 @@
 // under the License.
 
 use crate::metadata::TablePath;
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::{impl_read_type, impl_write_type, proto};
 
 use crate::proto::DropTableResponse;
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::convert::to_table_path;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 
 use bytes::{Buf, BufMut};
 use prost::Message;
@@ -50,9 +49,7 @@ impl RequestBody for DropTableRequest {
     type ResponseBody = DropTableResponse;
 
     const API_KEY: ApiKey = ApiKey::DropTable;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(DropTableRequest);
-impl_read_version_type!(DropTableResponse);
+impl_write_type!(DropTableRequest);
+impl_read_type!(DropTableResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/fetch.rs b/fluss-rust/crates/fluss/src/rpc/message/fetch.rs
index 15876069d7..67930f844f 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/fetch.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/fetch.rs
@@ -19,10 +19,9 @@ use crate::proto::FetchLogResponse;
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use prost::Message;
 
 use bytes::{Buf, BufMut};
@@ -50,9 +49,7 @@ impl RequestBody for FetchLogRequest {
     type ResponseBody = FetchLogResponse;
 
     const API_KEY: ApiKey = ApiKey::FetchLog;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(FetchLogRequest);
-impl_read_version_type!(FetchLogResponse);
+impl_write_type!(FetchLogRequest);
+impl_read_type!(FetchLogResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs b/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs
index 6468bebd5f..63647d5266 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_database_info.rs
@@ -18,10 +18,9 @@
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -44,8 +43,7 @@ impl RequestBody for GetDatabaseInfoRequest {
     type ResponseBody = proto::GetDatabaseInfoResponse;
 
     const API_KEY: ApiKey = ApiKey::GetDatabaseInfo;
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(GetDatabaseInfoRequest);
-impl_read_version_type!(proto::GetDatabaseInfoResponse);
+impl_write_type!(GetDatabaseInfoRequest);
+impl_read_type!(proto::GetDatabaseInfoResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs b/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
index a632a1596d..0b59384dfd 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
@@ -18,14 +18,13 @@
 use crate::proto;
 use crate::proto::PbTablePath;
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 
 use crate::metadata::TablePath;
 use crate::rpc::frame::ReadError;
 
-use crate::{impl_read_version_type, impl_write_version_type};
+use crate::{impl_read_type, impl_write_type};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -50,8 +49,7 @@ impl GetLatestLakeSnapshotRequest {
 impl RequestBody for GetLatestLakeSnapshotRequest {
     type ResponseBody = proto::GetLatestLakeSnapshotResponse;
     const API_KEY: ApiKey = ApiKey::GetLatestLakeSnapshot;
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(GetLatestLakeSnapshotRequest);
-impl_read_version_type!(proto::GetLatestLakeSnapshotResponse);
+impl_write_type!(GetLatestLakeSnapshotRequest);
+impl_read_type!(proto::GetLatestLakeSnapshotResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_security_token.rs b/fluss-rust/crates/fluss/src/rpc/message/get_security_token.rs
index 7995232d1a..741c8482f4 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/get_security_token.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_security_token.rs
@@ -17,10 +17,9 @@
 
 use crate::proto::{GetFileSystemSecurityTokenRequest, GetFileSystemSecurityTokenResponse};
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::{ReadError, WriteError};
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -46,8 +45,7 @@ impl Default for GetSecurityTokenRequest {
 impl RequestBody for GetSecurityTokenRequest {
     type ResponseBody = GetFileSystemSecurityTokenResponse;
     const API_KEY: ApiKey = ApiKey::GetFileSystemSecurityToken;
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(GetSecurityTokenRequest);
-impl_read_version_type!(GetFileSystemSecurityTokenResponse);
+impl_write_type!(GetSecurityTokenRequest);
+impl_read_type!(GetFileSystemSecurityTokenResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_table.rs b/fluss-rust/crates/fluss/src/rpc/message/get_table.rs
index 61657f7a7c..a7562f92ea 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/get_table.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_table.rs
@@ -17,14 +17,13 @@
 
 use crate::proto::{GetTableInfoRequest, GetTableInfoResponse, PbTablePath};
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 
 use crate::metadata::TablePath;
 use crate::rpc::frame::ReadError;
 
-use crate::{impl_read_version_type, impl_write_version_type};
+use crate::{impl_read_type, impl_write_type};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -49,8 +48,7 @@ impl GetTableRequest {
 impl RequestBody for GetTableRequest {
     type ResponseBody = GetTableInfoResponse;
     const API_KEY: ApiKey = ApiKey::GetTable;
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(GetTableRequest);
-impl_read_version_type!(GetTableInfoResponse);
+impl_write_type!(GetTableRequest);
+impl_read_type!(GetTableInfoResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_table_schema.rs b/fluss-rust/crates/fluss/src/rpc/message/get_table_schema.rs
index ad7b23fb03..1c7c00b7bd 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/get_table_schema.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_table_schema.rs
@@ -17,14 +17,13 @@
 
 use crate::proto::{GetTableSchemaRequest, GetTableSchemaResponse, PbTablePath};
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 
 use crate::metadata::TablePath;
 use crate::rpc::frame::ReadError;
 
-use crate::{impl_read_version_type, impl_write_version_type};
+use crate::{impl_read_type, impl_write_type};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -50,8 +49,7 @@ impl GetTableSchemaRequestMsg {
 impl RequestBody for GetTableSchemaRequestMsg {
     type ResponseBody = GetTableSchemaResponse;
     const API_KEY: ApiKey = ApiKey::GetTableSchema;
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(GetTableSchemaRequestMsg);
-impl_read_version_type!(GetTableSchemaResponse);
+impl_write_type!(GetTableSchemaRequestMsg);
+impl_read_type!(GetTableSchemaResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/header.rs b/fluss-rust/crates/fluss/src/rpc/message/header.rs
index 2f5848aa28..11155f6833 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/header.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/header.rs
@@ -19,7 +19,7 @@ use crate::proto::ErrorResponse;
 use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::{ReadError, WriteError};
-use crate::rpc::message::{ReadVersionedType, WriteVersionedType};
+use crate::rpc::message::{ReadType, WriteType};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -42,11 +42,11 @@ pub struct RequestHeader {
     pub client_id: Option<String>,
 }
 
-impl<W> WriteVersionedType<W> for RequestHeader
+impl<W> WriteType<W> for RequestHeader
 where
     W: BufMut,
 {
-    fn write_versioned(&self, writer: &mut W, _version: ApiVersion) -> Result<(), WriteError> {
+    fn write(&self, writer: &mut W) -> Result<(), WriteError> {
         writer.put_i16(self.request_api_key.into());
         writer.put_i16(self.request_api_version.0);
         writer.put_i32(self.request_id);
@@ -60,11 +60,11 @@ pub struct ResponseHeader {
     pub error_response: Option<ErrorResponse>,
 }
 
-impl<R> ReadVersionedType<R> for ResponseHeader
+impl<R> ReadType<R> for ResponseHeader
 where
     R: Buf,
 {
-    fn read_versioned(reader: &mut R, _version: ApiVersion) -> Result<Self, ReadError> {
+    fn read(reader: &mut R) -> Result<Self, ReadError> {
         let resp_type = reader.get_u8();
         let request_id = reader.get_i32();
         if resp_type != SUCCESS_RESPONSE {
diff --git a/fluss-rust/crates/fluss/src/rpc/message/init_writer.rs b/fluss-rust/crates/fluss/src/rpc/message/init_writer.rs
index 0bbb0dc56a..b2e64a5f89 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/init_writer.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/init_writer.rs
@@ -17,10 +17,9 @@
 
 use crate::proto::{InitWriterResponse, PbTablePath};
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::{ReadError, WriteError};
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -42,9 +41,7 @@ impl RequestBody for InitWriterRequest {
     type ResponseBody = InitWriterResponse;
 
     const API_KEY: ApiKey = ApiKey::InitWriter;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(InitWriterRequest);
-impl_read_version_type!(InitWriterResponse);
+impl_write_type!(InitWriterRequest);
+impl_read_type!(InitWriterResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/limit_scan.rs b/fluss-rust/crates/fluss/src/rpc/message/limit_scan.rs
index d83a2e8bf4..c71b03c350 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/limit_scan.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/limit_scan.rs
@@ -19,10 +19,9 @@ use crate::proto::LimitScanResponse;
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use prost::Message;
 
 use bytes::{Buf, BufMut};
@@ -50,9 +49,7 @@ impl RequestBody for LimitScanRequest {
     type ResponseBody = LimitScanResponse;
 
     const API_KEY: ApiKey = ApiKey::LimitScan;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(LimitScanRequest);
-impl_read_version_type!(LimitScanResponse);
+impl_write_type!(LimitScanRequest);
+impl_read_type!(LimitScanResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs b/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
index 83226ab1a9..21e1640000 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
@@ -18,10 +18,9 @@
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -42,8 +41,7 @@ impl RequestBody for ListDatabasesRequest {
     type ResponseBody = proto::ListDatabasesResponse;
 
     const API_KEY: ApiKey = ApiKey::ListDatabases;
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(ListDatabasesRequest);
-impl_read_version_type!(proto::ListDatabasesResponse);
+impl_write_type!(ListDatabasesRequest);
+impl_read_type!(proto::ListDatabasesResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
index 262645a6d9..2ec1437093 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_offsets.rs
@@ -15,9 +15,7 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::{
-    BucketId, PartitionId, TableId, impl_read_version_type, impl_write_version_type, proto,
-};
+use crate::{BucketId, PartitionId, TableId, impl_read_type, impl_write_type, proto};
 
 use crate::error::Result as FlussResult;
 use crate::error::{Error, FlussError};
@@ -25,9 +23,8 @@ use crate::proto::{ErrorResponse, ListOffsetsResponse};
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 use std::collections::HashMap;
 
 use bytes::{Buf, BufMut};
@@ -98,12 +95,10 @@ impl RequestBody for ListOffsetsRequest {
     type ResponseBody = ListOffsetsResponse;
 
     const API_KEY: ApiKey = ApiKey::ListOffsets;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(ListOffsetsRequest);
-impl_read_version_type!(ListOffsetsResponse);
+impl_write_type!(ListOffsetsRequest);
+impl_read_type!(ListOffsetsResponse);
 
 impl ListOffsetsResponse {
     pub fn offsets(&self) -> FlussResult<HashMap<i32, i64>> {
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_partition_infos.rs b/fluss-rust/crates/fluss/src/rpc/message/list_partition_infos.rs
index ab693671e5..cf24f466a0 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_partition_infos.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_partition_infos.rs
@@ -18,11 +18,10 @@
 use crate::metadata::{PartitionInfo, PartitionSpec, TablePath};
 use crate::proto::ListPartitionInfosResponse;
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::convert::to_table_path;
 use crate::rpc::frame::{ReadError, WriteError};
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -46,12 +45,10 @@ impl RequestBody for ListPartitionInfosRequest {
     type ResponseBody = ListPartitionInfosResponse;
 
     const API_KEY: ApiKey = ApiKey::ListPartitionInfos;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(ListPartitionInfosRequest);
-impl_read_version_type!(ListPartitionInfosResponse);
+impl_write_type!(ListPartitionInfosRequest);
+impl_read_type!(ListPartitionInfosResponse);
 
 impl ListPartitionInfosResponse {
     pub fn get_partitions_info(&self) -> Vec<PartitionInfo> {
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs b/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs
index ff2497a063..8ff72141cb 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_tables.rs
@@ -15,15 +15,14 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::{impl_read_type, impl_write_type, proto};
 
 use crate::proto::ListTablesResponse;
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 
 use bytes::{Buf, BufMut};
 use prost::Message;
@@ -47,9 +46,7 @@ impl RequestBody for ListTablesRequest {
     type ResponseBody = ListTablesResponse;
 
     const API_KEY: ApiKey = ApiKey::ListTables;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(ListTablesRequest);
-impl_read_version_type!(ListTablesResponse);
+impl_write_type!(ListTablesRequest);
+impl_read_type!(ListTablesResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/lookup.rs b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
index 07f8e06ce7..200d4bc8c0 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
@@ -19,12 +19,9 @@ use crate::proto::LookupResponse;
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{
-    BucketId, PartitionId, TableId, impl_read_version_type, impl_write_version_type, proto,
-};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{BucketId, PartitionId, TableId, impl_read_type, impl_write_type, proto};
 use bytes::Bytes;
 use prost::Message;
 
@@ -65,9 +62,7 @@ impl RequestBody for LookupRequest {
     type ResponseBody = LookupResponse;
 
     const API_KEY: ApiKey = ApiKey::Lookup;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(LookupRequest);
-impl_read_version_type!(LookupResponse);
+impl_write_type!(LookupRequest);
+impl_read_type!(LookupResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/mod.rs b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
index 456f9cb894..096066ed43 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/mod.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/mod.rs
@@ -16,10 +16,10 @@
 // under the License.
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::{ReadError, WriteError};
 use bytes::{Buf, BufMut};
 
+mod api_versions;
 mod authenticate;
 mod create_database;
 mod create_partition;
@@ -49,6 +49,7 @@ mod table_exists;
 mod update_metadata;
 
 pub use crate::rpc::RpcError;
+pub use api_versions::*;
 pub use authenticate::*;
 pub use create_database::*;
 pub use create_partition::*;
@@ -81,44 +82,36 @@ pub trait RequestBody {
     type ResponseBody;
 
     const API_KEY: ApiKey;
-
-    const REQUEST_VERSION: ApiVersion;
 }
 
 impl<T: RequestBody> RequestBody for &T {
     type ResponseBody = T::ResponseBody;
 
     const API_KEY: ApiKey = T::API_KEY;
-
-    const REQUEST_VERSION: ApiVersion = T::REQUEST_VERSION;
 }
 
-pub trait WriteVersionedType<W>: Sized
+pub trait WriteType<W>: Sized
 where
     W: BufMut,
 {
-    fn write_versioned(&self, writer: &mut W, version: ApiVersion) -> Result<(), WriteError>;
+    fn write(&self, writer: &mut W) -> Result<(), WriteError>;
 }
 
-pub trait ReadVersionedType<R>: Sized
+pub trait ReadType<R>: Sized
 where
     R: Buf,
 {
-    fn read_versioned(reader: &mut R, version: ApiVersion) -> Result<Self, ReadError>;
+    fn read(reader: &mut R) -> Result<Self, ReadError>;
 }
 
 #[macro_export]
-macro_rules! impl_write_version_type {
+macro_rules! impl_write_type {
     ($type:ty) => {
-        impl<W> WriteVersionedType<W> for $type
+        impl<W> WriteType<W> for $type
         where
             W: BufMut,
         {
-            fn write_versioned(
-                &self,
-                writer: &mut W,
-                _version: ApiVersion,
-            ) -> Result<(), WriteError> {
+            fn write(&self, writer: &mut W) -> Result<(), WriteError> {
                 Ok(self.inner_request.encode(writer).unwrap())
             }
         }
@@ -126,13 +119,13 @@ macro_rules! impl_write_version_type {
 }
 
 #[macro_export]
-macro_rules! impl_read_version_type {
+macro_rules! impl_read_type {
     ($type:ty) => {
-        impl<R> ReadVersionedType<R> for $type
+        impl<R> ReadType<R> for $type
         where
             R: Buf,
         {
-            fn read_versioned(reader: &mut R, _version: ApiVersion) -> Result<Self, ReadError> {
+            fn read(reader: &mut R) -> Result<Self, ReadError> {
                 Ok(<$type>::decode(reader).unwrap())
             }
         }
diff --git a/fluss-rust/crates/fluss/src/rpc/message/prefix_lookup.rs b/fluss-rust/crates/fluss/src/rpc/message/prefix_lookup.rs
index 5ee44d2519..e71ffe7c7b 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/prefix_lookup.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/prefix_lookup.rs
@@ -19,12 +19,9 @@ use crate::proto::PrefixLookupResponse;
 use crate::rpc::frame::ReadError;
 
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{
-    BucketId, PartitionId, TableId, impl_read_version_type, impl_write_version_type, proto,
-};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{BucketId, PartitionId, TableId, impl_read_type, impl_write_type, proto};
 use bytes::Bytes;
 use prost::Message;
 
@@ -65,9 +62,7 @@ impl RequestBody for PrefixLookupRequest {
     type ResponseBody = PrefixLookupResponse;
 
     const API_KEY: ApiKey = ApiKey::PrefixLookup;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(PrefixLookupRequest);
-impl_read_version_type!(PrefixLookupResponse);
+impl_write_type!(PrefixLookupRequest);
+impl_read_type!(PrefixLookupResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
index dab7ea9a57..8be2463832 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/produce_log.rs
@@ -21,10 +21,9 @@ use crate::rpc::frame::ReadError;
 
 use crate::client::ReadyWriteBatch;
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -63,9 +62,7 @@ impl RequestBody for ProduceLogRequest {
     type ResponseBody = ProduceLogResponse;
 
     const API_KEY: ApiKey = ApiKey::ProduceLog;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(ProduceLogRequest);
-impl_read_version_type!(ProduceLogResponse);
+impl_write_type!(ProduceLogRequest);
+impl_read_type!(ProduceLogResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/put_kv.rs b/fluss-rust/crates/fluss/src/rpc/message/put_kv.rs
index 983faa6646..e76496d123 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/put_kv.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/put_kv.rs
@@ -18,11 +18,10 @@
 use crate::client::ReadyWriteBatch;
 use crate::proto::{PbPutKvReqForBucket, PutKvResponse};
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::ReadError;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -65,9 +64,7 @@ impl RequestBody for PutKvRequest {
     type ResponseBody = PutKvResponse;
 
     const API_KEY: ApiKey = ApiKey::PutKv;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(PutKvRequest);
-impl_read_version_type!(PutKvResponse);
+impl_write_type!(PutKvRequest);
+impl_read_type!(PutKvResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs b/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs
index ec982116b4..5bc848e32a 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/table_exists.rs
@@ -16,14 +16,13 @@
 // under the License.
 
 use crate::metadata::TablePath;
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::{impl_read_type, impl_write_type, proto};
 
 use crate::proto::TableExistsResponse;
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::convert::to_table_path;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 
 use crate::rpc::frame::ReadError;
 
@@ -48,9 +47,7 @@ impl RequestBody for TableExistsRequest {
     type ResponseBody = TableExistsResponse;
 
     const API_KEY: ApiKey = ApiKey::TableExists;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(TableExistsRequest);
-impl_read_version_type!(TableExistsResponse);
+impl_write_type!(TableExistsRequest);
+impl_read_type!(TableExistsResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs b/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
index 1f0d88c2ae..fd96ca5e67 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/update_metadata.rs
@@ -18,14 +18,13 @@
 use crate::metadata::{PhysicalTablePath, TablePath};
 use crate::proto::{MetadataResponse, PbPhysicalTablePath, PbTablePath};
 use crate::rpc::api_key::ApiKey;
-use crate::rpc::api_version::ApiVersion;
 use crate::rpc::frame::ReadError;
 use crate::rpc::frame::WriteError;
-use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+use crate::rpc::message::{ReadType, RequestBody, WriteType};
 use std::collections::HashSet;
 use std::sync::Arc;
 
-use crate::{impl_read_version_type, impl_write_version_type, proto};
+use crate::{impl_read_type, impl_write_type, proto};
 use bytes::{Buf, BufMut};
 use prost::Message;
 
@@ -66,9 +65,7 @@ impl RequestBody for UpdateMetadataRequest {
     type ResponseBody = MetadataResponse;
 
     const API_KEY: ApiKey = ApiKey::MetaData;
-
-    const REQUEST_VERSION: ApiVersion = ApiVersion(0);
 }
 
-impl_write_version_type!(UpdateMetadataRequest);
-impl_read_version_type!(MetadataResponse);
+impl_write_type!(UpdateMetadataRequest);
+impl_read_type!(MetadataResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/server_connection.rs b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
index 46d99c0d27..e1148f9d06 100644
--- a/fluss-rust/crates/fluss/src/rpc/server_connection.rs
+++ b/fluss-rust/crates/fluss/src/rpc/server_connection.rs
@@ -15,20 +15,22 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::cluster::ServerNode;
+use crate::cluster::{ServerNode, ServerType};
 use crate::error::Error;
 use crate::metrics::{
     CLIENT_BYTES_RECEIVED_TOTAL, CLIENT_BYTES_SENT_TOTAL, CLIENT_REQUEST_LATENCY_MS,
     CLIENT_REQUESTS_IN_FLIGHT, CLIENT_REQUESTS_TOTAL, CLIENT_RESPONSES_TOTAL, LABEL_API_KEY,
     api_key_label,
 };
+use crate::proto::PbApiVersion;
+use crate::rpc::api_key::ApiKey;
 use crate::rpc::api_version::ApiVersion;
 use crate::rpc::error::RpcError;
 use crate::rpc::error::RpcError::ConnectionError;
 use crate::rpc::frame::{AsyncMessageRead, AsyncMessageWrite};
 use crate::rpc::message::{
-    REQUEST_HEADER_LENGTH, ReadVersionedType, RequestBody, RequestHeader, ResponseHeader,
-    WriteVersionedType,
+    ApiVersionsRequest, REQUEST_HEADER_LENGTH, ReadType, RequestBody, RequestHeader,
+    ResponseHeader, WriteType,
 };
 use crate::rpc::transport::Transport;
 use futures::future::BoxFuture;
@@ -72,6 +74,108 @@ impl fmt::Debug for SaslConfig {
     }
 }
 
+/// Represents the negotiated API versions between the client and a server node.
+/// Built from the server's `ApiVersionsResponse` by intersecting each API's
+/// client-supported range with the server-supported range, keeping the highest
+/// usable version.
+#[derive(Clone, Debug)]
+pub struct ServerApiVersions {
+    versions: HashMap<ApiKey, Result<ApiVersion, String>>,
+}
+
+impl ServerApiVersions {
+    /// Build from the server's advertised API version list.
+    pub fn new(server_versions: &[PbApiVersion]) -> Self {
+        let mut versions = HashMap::new();
+        for sv in server_versions {
+            let api_key = ApiKey::from(i16::try_from(sv.api_key).unwrap());
+            // Skip unknown API keys — the client does not support them.
+            let client_range = match api_key.supported_versions() {
+                Some(range) => range,
+                None => continue,
+            };
+            let server_min = i16::try_from(sv.min_version).unwrap();
+            let server_max = i16::try_from(sv.max_version).unwrap();
+            let min_version = client_range.min().0.max(server_min);
+            let max_version = client_range.max().0.min(server_max);
+            if min_version > max_version {
+                versions.insert(
+                    api_key,
+                    Err(format!(
+                        "The server does not support {:?} with version in range [{},{}]. \
+                         The supported range is [{},{}].",
+                        api_key,
+                        client_range.min(),
+                        client_range.max(),
+                        server_min,
+                        server_max,
+                    )),
+                );
+            } else {
+                versions.insert(api_key, Ok(ApiVersion(max_version)));
+            }
+        }
+        Self { versions }
+    }
+
+    /// Get the negotiated (highest usable) version for a given API key.
+    pub fn highest_available_version(&self, api_key: ApiKey) -> Result<ApiVersion, Error> {
+        match self.versions.get(&api_key) {
+            Some(Ok(version)) => Ok(*version),
+            Some(Err(msg)) => Err(Error::UnsupportedVersion {
+                message: msg.clone(),
+            }),
+            None => Err(Error::UnsupportedVersion {
+                message: format!("The server does not support {:?}", api_key),
+            }),
+        }
+    }
+}
+
+/// Resolve the API version to use for a given API key.
+fn resolve_api_version_for(
+    api_versions: Option<&ServerApiVersions>,
+    api_key: ApiKey,
+) -> Result<ApiVersion, Error> {
+    // Until the ApiVersions handshake has stored negotiated versions, fall back to the
+    // highest version the client supports; an unsupported key is an error, not a panic.
+    let Some(versions) = api_versions else {
+        return api_key
+            .supported_versions()
+            .map(|range| range.max())
+            .ok_or_else(|| Error::UnsupportedVersion {
+                message: format!("The client does not support {:?}", api_key),
+            });
+    };
+    versions.highest_available_version(api_key)
+}
+
+/// Validate that the server's advertised `server_type` matches the type we expect
+/// for the target `ServerNode`.
+fn validate_server_type(
+    expected: &ServerType,
+    response_server_type: Option<i32>,
+) -> Result<(), Error> {
+    // For forward-compat with servers that do not populate `server_type`, validation is skipped.
+    let Some(type_id) = response_server_type else {
+        return Ok(());
+    };
+    let actual = ServerType::from_type_id(type_id);
+    if actual.as_ref() == Some(expected) {
+        return Ok(());
+    }
+    let actual_desc = actual
+        .map(|t| t.to_string())
+        .unwrap_or_else(|| format!("Unknown(type_id={type_id})"));
+    Err(Error::InvalidServerType {
+        message: format!(
+            "Expected server type {expected} but the server advertised {actual_desc}. \
+             The client may be talking to the wrong endpoint \
+             (e.g. coordinator vs tablet server)."
+        ),
+    })
+}
+
 #[derive(Debug, Default)]
 pub struct RpcClient {
     connections: RwLock<HashMap<String, ServerConnection>>,
@@ -142,6 +246,9 @@ impl RpcClient {
         );
         let connection = ServerConnection::new(messenger);
 
+        // Negotiate API versions (must happen before authentication).
+        Self::check_api_versions(&connection, server_node.server_type()).await?;
+
         if let Some(ref sasl) = self.sasl_config {
             Self::authenticate(&connection, &sasl.username, &sasl.password).await?;
         }
@@ -149,6 +256,20 @@ impl RpcClient {
         Ok(connection)
     }
 
+    /// Send an `ApiVersionsRequest`, validate the advertised `server_type`, and
+    /// store the negotiated versions on the connection.
+    async fn check_api_versions(
+        connection: &ServerConnection,
+        expected_server_type: &ServerType,
+    ) -> Result<(), Error> {
+        let request = ApiVersionsRequest::new("fluss-rust", env!("CARGO_PKG_VERSION"));
+        let response = connection.request(request).await?;
+        validate_server_type(expected_server_type, response.server_type)?;
+        let api_versions = ServerApiVersions::new(&response.api_versions);
+        *connection.api_versions.lock() = Some(api_versions);
+        Ok(())
+    }
+
     /// Perform SASL/PLAIN authentication handshake.
     ///
     /// Retries on `RetriableAuthenticateException` with exponential backoff
@@ -325,6 +446,10 @@ pub struct ServerConnectionInner<RW> {
 
     state: Arc<Mutex<ConnectionState>>,
 
+    /// Negotiated API versions for this connection.
+    /// `None` until the ApiVersions handshake completes.
+    api_versions: Mutex<Option<ServerApiVersions>>,
+
     join_handle: JoinHandle<()>,
 }
 
@@ -344,16 +469,13 @@ where
                     Ok(msg) => {
                         // message was read, so all subsequent errors should not poison the whole stream
                         let mut cursor = Cursor::new(msg);
-                        let header =
-                            match ResponseHeader::read_versioned(&mut cursor, ApiVersion(0)) {
-                                Ok(header) => header,
-                                Err(err) => {
-                                    log::warn!(
-                                        "Cannot read message header, ignoring message: {err:?}"
-                                    );
-                                    continue;
-                                }
-                            };
+                        let header = match ResponseHeader::read(&mut cursor) {
+                            Ok(header) => header,
+                            Err(err) => {
+                                log::warn!("Cannot read message header, ignoring message: {err:?}");
+                                continue;
+                            }
+                        };
 
                         let active_request = match state_captured.lock().deref_mut() {
                             ConnectionState::RequestMap(map) => {
@@ -396,10 +518,16 @@ where
             client_id,
             request_id: AtomicI32::new(0),
             state,
+            api_versions: Mutex::new(None),
             join_handle,
         }
     }
 
+    fn resolve_api_version(&self, api_key: ApiKey) -> Result<ApiVersion, Error> {
+        let guard = self.api_versions.lock();
+        resolve_api_version_for(guard.as_ref(), api_key)
+    }
+
     fn is_poisoned(&self) -> bool {
         let guard = self.state.lock();
         matches!(*guard, ConnectionState::Poison(_))
@@ -407,29 +535,25 @@ where
 
     pub async fn request<R>(&self, msg: R) -> Result<R::ResponseBody, Error>
     where
-        R: RequestBody + Send + WriteVersionedType<Vec<u8>>,
-        R::ResponseBody: ReadVersionedType<Cursor<Vec<u8>>>,
+        R: RequestBody + Send + WriteType<Vec<u8>>,
+        R::ResponseBody: ReadType<Cursor<Vec<u8>>>,
     {
+        let api_version = self.resolve_api_version(R::API_KEY)?;
         let request_id = self.request_id.fetch_add(1, Ordering::SeqCst) & 0x7FFFFFFF;
         let header = RequestHeader {
             request_api_key: R::API_KEY,
-            request_api_version: ApiVersion(0),
+            request_api_version: api_version,
             request_id,
             client_id: Some(String::from(self.client_id.as_ref())),
         };
 
-        let header_version = ApiVersion(0);
-
-        let body_api_version = ApiVersion(0);
-
         let mut buf = Vec::new();
         // write header
         header
-            .write_versioned(&mut buf, header_version)
+            .write(&mut buf)
             .map_err(RpcError::WriteMessageError)?;
         // write message body
-        msg.write_versioned(&mut buf, body_api_version)
-            .map_err(RpcError::WriteMessageError)?;
+        msg.write(&mut buf).map_err(RpcError::WriteMessageError)?;
 
         let (tx, rx) = channel();
 
@@ -473,8 +597,7 @@ where
             });
         }
 
-        let body = R::ResponseBody::read_versioned(&mut response.data, body_api_version)
-            .map_err(RpcError::ReadMessageError)?;
+        let body = R::ResponseBody::read(&mut response.data).map_err(RpcError::ReadMessageError)?;
 
         let read_bytes = response.data.position();
         let message_bytes = response.data.into_inner().len() as u64;
@@ -483,7 +606,7 @@ where
                 message_size: message_bytes,
                 read: read_bytes,
                 api_key: R::API_KEY,
-                api_version: body_api_version,
+                api_version,
             }
             .into());
         }
@@ -643,7 +766,7 @@ mod tests {
     use crate::rpc::ApiKey;
     use crate::rpc::api_version::ApiVersion;
     use crate::rpc::frame::{ReadError, WriteError};
-    use crate::rpc::message::{ReadVersionedType, RequestBody, WriteVersionedType};
+    use crate::rpc::message::{ReadType, RequestBody, WriteType};
     use metrics::{SharedString, Unit};
     use metrics_util::CompositeKey;
     use metrics_util::debugging::{DebugValue, DebuggingRecorder};
@@ -659,17 +782,16 @@ mod tests {
     impl RequestBody for TestProduceRequest {
         type ResponseBody = TestProduceResponse;
         const API_KEY: ApiKey = ApiKey::ProduceLog;
-        const REQUEST_VERSION: ApiVersion = ApiVersion(0);
     }
 
-    impl WriteVersionedType<Vec<u8>> for TestProduceRequest {
-        fn write_versioned(&self, _w: &mut Vec<u8>, _v: ApiVersion) -> Result<(), WriteError> {
+    impl WriteType<Vec<u8>> for TestProduceRequest {
+        fn write(&self, _w: &mut Vec<u8>) -> Result<(), WriteError> {
             Ok(())
         }
     }
 
-    impl ReadVersionedType<Cursor<Vec<u8>>> for TestProduceResponse {
-        fn read_versioned(_r: &mut Cursor<Vec<u8>>, _v: ApiVersion) -> Result<Self, ReadError> {
+    impl ReadType<Cursor<Vec<u8>>> for TestProduceResponse {
+        fn read(_r: &mut Cursor<Vec<u8>>) -> Result<Self, ReadError> {
             Ok(TestProduceResponse)
         }
     }
@@ -680,17 +802,16 @@ mod tests {
     impl RequestBody for TestMetadataRequest {
         type ResponseBody = TestMetadataResponse;
         const API_KEY: ApiKey = ApiKey::MetaData;
-        const REQUEST_VERSION: ApiVersion = ApiVersion(0);
     }
 
-    impl WriteVersionedType<Vec<u8>> for TestMetadataRequest {
-        fn write_versioned(&self, _w: &mut Vec<u8>, _v: ApiVersion) -> Result<(), WriteError> {
+    impl WriteType<Vec<u8>> for TestMetadataRequest {
+        fn write(&self, _w: &mut Vec<u8>) -> Result<(), WriteError> {
             Ok(())
         }
     }
 
-    impl ReadVersionedType<Cursor<Vec<u8>>> for TestMetadataResponse {
-        fn read_versioned(_r: &mut Cursor<Vec<u8>>, _v: ApiVersion) -> Result<Self, ReadError> {
+    impl ReadType<Cursor<Vec<u8>>> for TestMetadataResponse {
+        fn read(_r: &mut Cursor<Vec<u8>>) -> Result<Self, ReadError> {
             Ok(TestMetadataResponse)
         }
     }
@@ -873,6 +994,11 @@ mod tests {
         tokio::spawn(mock_echo_server(server));
 
         let conn = ServerConnectionInner::new(BufStream::new(client), usize::MAX, Arc::from("t"));
+        *conn.api_versions.lock() = Some(ServerApiVersions::new(&[PbApiVersion {
+            api_key: 1014,
+            min_version: 0,
+            max_version: 0,
+        }]));
 
         let before: Vec<_> = snapshotter.snapshot().into_vec();
         let request_before = counter_for_label(&before, CLIENT_REQUESTS_TOTAL, "produce_log");
@@ -913,6 +1039,11 @@ mod tests {
         tokio::spawn(mock_echo_server(server));
 
         let conn = ServerConnectionInner::new(BufStream::new(client), usize::MAX, Arc::from("t"));
+        *conn.api_versions.lock() = Some(ServerApiVersions::new(&[PbApiVersion {
+            api_key: 1012,
+            min_version: 0,
+            max_version: 0,
+        }]));
         let before: Vec<_> = snapshotter.snapshot().into_vec();
         let request_sum_before = counter_sum(&before, CLIENT_REQUESTS_TOTAL);
         let response_sum_before = counter_sum(&before, CLIENT_RESPONSES_TOTAL);
@@ -949,6 +1080,11 @@ mod tests {
         let (client, server) = tokio::io::duplex(64);
         drop(server); // force write failure on request path
         let conn = ServerConnectionInner::new(BufStream::new(client), usize::MAX, Arc::from("t"));
+        *conn.api_versions.lock() = Some(ServerApiVersions::new(&[PbApiVersion {
+            api_key: 1014,
+            min_version: 0,
+            max_version: 0,
+        }]));
 
         let before: Vec<_> = snapshotter.snapshot().into_vec();
         let request_before = counter_for_label(&before, CLIENT_REQUESTS_TOTAL, "produce_log");
@@ -997,6 +1133,11 @@ mod tests {
         tokio::spawn(mock_error_server(server));
 
         let conn = ServerConnectionInner::new(BufStream::new(client), usize::MAX, Arc::from("t"));
+        *conn.api_versions.lock() = Some(ServerApiVersions::new(&[PbApiVersion {
+            api_key: 1014,
+            min_version: 0,
+            max_version: 0,
+        }]));
 
         let before: Vec<_> = snapshotter.snapshot().into_vec();
         let response_before = counter_for_label(&before, CLIENT_RESPONSES_TOTAL, "produce_log");
@@ -1030,4 +1171,130 @@ mod tests {
             "in-flight gauge must return to zero after API error"
         );
     }
+
+    #[test]
+    fn server_api_versions_negotiation() {
+        // Before negotiation (`None`), the client's highest supported version is used.
+        assert_eq!(
+            resolve_api_version_for(None, ApiKey::ApiVersion).unwrap(),
+            ApiVersion(0)
+        );
+
+        assert_eq!(
+            resolve_api_version_for(None, ApiKey::PutKv).unwrap(),
+            ApiVersion(0)
+        );
+
+        let server_versions = vec![
+            // PutKv: server v0..v3, client v0 only (v1 key encoding not yet implemented) → negotiated v0
+            PbApiVersion {
+                api_key: 1016,
+                min_version: 0,
+                max_version: 3,
+            },
+            // ProduceLog: server v0..v2, client v0 only → negotiated v0
+            PbApiVersion {
+                api_key: 1014,
+                min_version: 0,
+                max_version: 2,
+            },
+            // Disjoint: server v5..v7, client v0 only → error
+            PbApiVersion {
+                api_key: 1015,
+                min_version: 5,
+                max_version: 7,
+            },
+            // Unknown key (9999) → skipped
+            PbApiVersion {
+                api_key: 9999,
+                min_version: 0,
+                max_version: 5,
+            },
+        ];
+        let negotiated = ServerApiVersions::new(&server_versions);
+
+        // Successful negotiation cases
+        assert_eq!(
+            negotiated.highest_available_version(ApiKey::PutKv).unwrap(),
+            ApiVersion(0)
+        );
+        assert_eq!(
+            negotiated
+                .highest_available_version(ApiKey::ProduceLog)
+                .unwrap(),
+            ApiVersion(0)
+        );
+
+        // Disjoint range → error. Checking the advertised range distinguishes this from
+        // the "not advertised at all" error asserted at the end of this test.
+        let disjoint_err = negotiated
+            .highest_available_version(ApiKey::FetchLog)
+            .unwrap_err()
+            .to_string();
+        assert!(
+            disjoint_err.contains("The supported range is [5,7]."),
+            "unexpected error message: {disjoint_err}"
+        );
+
+        // Unknown key is skipped → not in map → error
+        assert!(
+            negotiated
+                .highest_available_version(ApiKey::Unknown(9999))
+                .is_err()
+        );
+
+        // Key not advertised by server → error
+        assert!(
+            ServerApiVersions::new(&[])
+                .highest_available_version(ApiKey::FetchLog)
+                .is_err()
+        );
+    }
+
+    #[test]
+    fn server_type_validation() {
+        // Happy path: server advertises the expected type.
+        assert!(
+            validate_server_type(
+                &ServerType::CoordinatorServer,
+                Some(ServerType::CoordinatorServer.to_type_id()),
+            )
+            .is_ok()
+        );
+        assert!(
+            validate_server_type(
+                &ServerType::TabletServer,
+                Some(ServerType::TabletServer.to_type_id()),
+            )
+            .is_ok()
+        );
+
+        // Mismatch: connected to a coordinator while expecting a tablet server
+        // (and vice versa).
+        let err = validate_server_type(
+            &ServerType::TabletServer,
+            Some(ServerType::CoordinatorServer.to_type_id()),
+        )
+        .unwrap_err();
+        assert!(
+            matches!(err, Error::InvalidServerType { .. }),
+            "expected InvalidServerType, got: {err:?}"
+        );
+        assert!(matches!(
+            validate_server_type(
+                &ServerType::CoordinatorServer,
+                Some(ServerType::TabletServer.to_type_id()),
+            ),
+            Err(Error::InvalidServerType { .. })
+        ));
+
+        // A response without `server_type` skips validation and must succeed.
+        assert!(validate_server_type(&ServerType::TabletServer, None).is_ok());
+        // Unknown / unmapped type id still fails, with the raw id surfaced so
+        // operators can diagnose protocol drift.
+        assert!(matches!(
+            validate_server_type(&ServerType::CoordinatorServer, Some(99)),
+            Err(Error::InvalidServerType { .. })
+        ));
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index 62e206b6f8..1979b973f2 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -1404,4 +1404,75 @@ mod kv_table_test {
             .await
             .expect("Failed to drop table");
     }
+
+    /// Test that KV format v2 tables with non-default bucket key reject v0 clients.
+    /// The Rust client currently only supports API version 0 for PutKv/Lookup/PrefixLookup.
+    /// When the server creates a table with kv_format_version=2 and a non-default bucket key,
+    /// it rejects v0 clients because CompactedKeyEncoder (v1) is required.
+    // TODO(key-encoding-v1): Once v1 key encoding is implemented and the client advertises
+    //  PutKv/Lookup/PrefixLookup v1, this test should be updated to verify that v1 clients
+    //  can successfully write to and read from kv_format_v2 tables with non-default bucket keys.
+    #[tokio::test]
+    async fn kv_format_v2_table_rejects_v0_client() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+
+        let admin = connection.get_admin().unwrap();
+
+        let table_path = TablePath::new("fluss", "test_kv_format_v2_reject_v0");
+
+        // Create a KV table with:
+        // 1. kv_format_version = 2
+        // 2. non-default bucket key ("a" is a subset of pk ("a", "b"))
+        // 3. a datalake format is configured.
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("a", DataTypes::int())
+                    .column("b", DataTypes::string())
+                    .column("c", DataTypes::string())
+                    .primary_key(vec!["a", "b"])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .distributed_by(Some(2), vec!["a".to_string()])
+            .property("table.kv.format-version", "2")
+            .property("table.datalake.format", "lance")
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection.get_table(&table_path).await.unwrap();
+
+        // Test PutKv with v0 client - should fail with UNSUPPORTED_VERSION
+        let table_upsert = table.new_upsert().expect("Failed to create upsert");
+        let upsert_writer = table_upsert
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let mut row = GenericRow::new(3);
+        row.set_field(0, 1);
+        row.set_field(1, "a");
+        row.set_field(2, "value1");
+        let upsert_result = upsert_writer
+            .upsert(&row)
+            .expect("Failed to upsert row")
+            .await;
+        assert!(
+            upsert_result.is_err(),
+            "PutKv with v0 client should be rejected for kv_format_v2 table with non-default bucket key"
+        );
+        let err_msg = upsert_result.unwrap_err().to_string();
+        assert!(
+            err_msg.contains("Client API version 0 is not supported"),
+            "Expected 'Client API version 0 is not supported' error, got: {}",
+            err_msg
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
 }

From d0bea1ebec17561281781753f631914fcfbc452d Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sat, 9 May 2026 22:46:53 +0200
Subject: [PATCH 261/287] Support FixedSizeBinary in python (#538)

---
 fluss-rust/bindings/python/src/utils.rs                 | 1 +
 fluss-rust/bindings/python/test/test_kv_table.py        | 3 +++
 fluss-rust/website/docs/user-guide/python/data-types.md | 1 +
 3 files changed, 5 insertions(+)

diff --git a/fluss-rust/bindings/python/src/utils.rs b/fluss-rust/bindings/python/src/utils.rs
index 5efcf5e799..e07713976e 100644
--- a/fluss-rust/bindings/python/src/utils.rs
+++ b/fluss-rust/bindings/python/src/utils.rs
@@ -57,6 +57,7 @@ impl Utils {
             ArrowDataType::Float64 => DataTypes::double(),
             ArrowDataType::Utf8 | ArrowDataType::LargeUtf8 => DataTypes::string(),
             ArrowDataType::Binary | ArrowDataType::LargeBinary => DataTypes::bytes(),
+            ArrowDataType::FixedSizeBinary(n) => DataTypes::binary(*n as usize),
             ArrowDataType::Date32 => DataTypes::date(),
             ArrowDataType::Date64 => DataTypes::date(),
             ArrowDataType::Time32(unit) => match unit {
diff --git a/fluss-rust/bindings/python/test/test_kv_table.py b/fluss-rust/bindings/python/test/test_kv_table.py
index 36aa3e463b..394073756e 100644
--- a/fluss-rust/bindings/python/test/test_kv_table.py
+++ b/fluss-rust/bindings/python/test/test_kv_table.py
@@ -358,6 +358,7 @@ async def test_all_supported_datatypes(connection, admin):
                 pa.field("col_timestamp_ntz", pa.timestamp("us")),
                 pa.field("col_timestamp_ltz", pa.timestamp("us", tz="UTC")),
                 pa.field("col_bytes", pa.binary()),
+                pa.field("col_binary", pa.binary(16)),
             ]
         ),
         primary_keys=["pk_int"],
@@ -385,6 +386,7 @@ async def test_all_supported_datatypes(connection, admin):
         "col_timestamp_ntz": datetime(2026, 1, 23, 10, 13, 47, 123000),
         "col_timestamp_ltz": datetime(2026, 1, 23, 10, 13, 47, 123000),
         "col_bytes": b"binary data",
+        "col_binary": b"binary_data_0123",
     }
 
     handle = upsert_writer.upsert(row_data)
@@ -411,6 +413,7 @@ async def test_all_supported_datatypes(connection, admin):
         2026, 1, 23, 10, 13, 47, 123000, tzinfo=timezone.utc
     )
     assert result["col_bytes"] == b"binary data"
+    assert result["col_binary"] == b"binary_data_0123"
 
     # Test with null values for all nullable columns
     null_row = {"pk_int": 2}
diff --git a/fluss-rust/website/docs/user-guide/python/data-types.md b/fluss-rust/website/docs/user-guide/python/data-types.md
index 996770388e..8e4371e216 100644
--- a/fluss-rust/website/docs/user-guide/python/data-types.md
+++ b/fluss-rust/website/docs/user-guide/python/data-types.md
@@ -12,6 +12,7 @@ The Python client uses PyArrow types for schema definitions:
 | `pa.float32()` / `float64()`                    | Float / Double                    | `float`             |
 | `pa.string()`                                   | String                            | `str`               |
 | `pa.binary()`                                   | Bytes                             | `bytes`             |
+| `pa.binary(n)`                                  | Binary(n)                         | `bytes`             |
 | `pa.date32()`                                   | Date                              | `datetime.date`     |
 | `pa.time32("ms")`                               | Time                              | `datetime.time`     |
 | `pa.timestamp("us")`                            | Timestamp (NTZ)                   | `datetime.datetime` |

From b0c54862f29403913a479c79d6d0c56b7bd99750 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sun, 10 May 2026 12:08:21 +0100
Subject: [PATCH 262/287] [rust][writer] Add DynamicWriteBatchSizeEstimator
 (#532)

* [rust][writer] Add DynamicWriteBatchSizeEstimator

* [rust][writer] Match Java defaults and key shape

* address feedback
---
 fluss-rust/bindings/cpp/include/fluss.hpp     |   6 +-
 fluss-rust/bindings/cpp/src/ffi_converter.hpp |   2 +
 fluss-rust/bindings/cpp/src/lib.rs            |   4 +
 .../bindings/elixir/lib/fluss/config.ex       |  17 +-
 .../elixir/native/fluss_nif/src/config.rs     |   8 +
 fluss-rust/bindings/python/fluss/__init__.pyi |   8 +
 fluss-rust/bindings/python/src/config.rs      |  43 ++++
 .../fluss/src/client/write/accumulator.rs     | 239 ++++++++++++++++--
 .../src/client/write/dynamic_batch_size.rs    | 147 +++++++++++
 .../crates/fluss/src/client/write/mod.rs      |   1 +
 fluss-rust/crates/fluss/src/config.rs         |  30 +++
 .../docs/user-guide/cpp/api-reference.md      |   4 +-
 .../docs/user-guide/python/api-reference.md   |   4 +-
 .../docs/user-guide/rust/api-reference.md     |   4 +-
 14 files changed, 488 insertions(+), 29 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/write/dynamic_batch_size.rs

diff --git a/fluss-rust/bindings/cpp/include/fluss.hpp b/fluss-rust/bindings/cpp/include/fluss.hpp
index 3d39783fd7..d019b42787 100644
--- a/fluss-rust/bindings/cpp/include/fluss.hpp
+++ b/fluss-rust/bindings/cpp/include/fluss.hpp
@@ -1232,8 +1232,12 @@ struct Configuration {
     std::string writer_acks{"all"};
     // Max number of writer retries
     int32_t writer_retries{std::numeric_limits<int32_t>::max()};
-    // Writer batch size in bytes (2 MB)
+    // Writer batch size in bytes (2 MB), also the upper bound when dynamic sizing is on
     int32_t writer_batch_size{2 * 1024 * 1024};
+    // Tune the per-table writer batch size from observed fill ratios
+    bool writer_dynamic_batch_size_enabled{true};
+    // Lower bound (256 KB) for the dynamic batch size estimator
+    int32_t writer_dynamic_batch_size_min{256 * 1024};
     // Bucket assigner for tables without bucket keys: "sticky" or "round_robin"
     std::string writer_bucket_no_key_assigner{"sticky"};
     // Number of remote log batches to prefetch during scanning
diff --git a/fluss-rust/bindings/cpp/src/ffi_converter.hpp b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
index 430dd1991d..47453d998a 100644
--- a/fluss-rust/bindings/cpp/src/ffi_converter.hpp
+++ b/fluss-rust/bindings/cpp/src/ffi_converter.hpp
@@ -135,6 +135,8 @@ inline ffi::FfiConfig to_ffi_config(const Configuration& config) {
     ffi_config.writer_acks = rust::String(config.writer_acks);
     ffi_config.writer_retries = config.writer_retries;
     ffi_config.writer_batch_size = config.writer_batch_size;
+    ffi_config.writer_dynamic_batch_size_enabled = config.writer_dynamic_batch_size_enabled;
+    ffi_config.writer_dynamic_batch_size_min = config.writer_dynamic_batch_size_min;
     ffi_config.writer_bucket_no_key_assigner = rust::String(config.writer_bucket_no_key_assigner);
     ffi_config.scanner_remote_log_prefetch_num = config.scanner_remote_log_prefetch_num;
     ffi_config.remote_file_download_thread_num = config.remote_file_download_thread_num;
diff --git a/fluss-rust/bindings/cpp/src/lib.rs b/fluss-rust/bindings/cpp/src/lib.rs
index 52df36869d..ed575244f6 100644
--- a/fluss-rust/bindings/cpp/src/lib.rs
+++ b/fluss-rust/bindings/cpp/src/lib.rs
@@ -46,6 +46,8 @@ mod ffi {
         writer_acks: String,
         writer_retries: i32,
         writer_batch_size: i32,
+        writer_dynamic_batch_size_enabled: bool,
+        writer_dynamic_batch_size_min: i32,
         writer_bucket_no_key_assigner: String,
         scanner_remote_log_prefetch_num: usize,
         remote_file_download_thread_num: usize,
@@ -907,6 +909,8 @@ fn new_connection(config: &ffi::FfiConfig) -> ffi::FfiPtrResult {
         writer_acks: config.writer_acks.to_string(),
         writer_retries: config.writer_retries,
         writer_batch_size: config.writer_batch_size,
+        writer_dynamic_batch_size_enabled: config.writer_dynamic_batch_size_enabled,
+        writer_dynamic_batch_size_min: config.writer_dynamic_batch_size_min,
         writer_batch_timeout_ms: config.writer_batch_timeout_ms,
         writer_bucket_no_key_assigner: assigner_type,
         scanner_remote_log_prefetch_num: config.scanner_remote_log_prefetch_num,
diff --git a/fluss-rust/bindings/elixir/lib/fluss/config.ex b/fluss-rust/bindings/elixir/lib/fluss/config.ex
index 1120a5f450..f12f61e426 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/config.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/config.ex
@@ -34,12 +34,16 @@ defmodule Fluss.Config do
   @enforce_keys [:bootstrap_servers]
   defstruct bootstrap_servers: nil,
             writer_batch_size: nil,
-            writer_batch_timeout_ms: nil
+            writer_batch_timeout_ms: nil,
+            writer_dynamic_batch_size_enabled: nil,
+            writer_dynamic_batch_size_min: nil
 
   @type t :: %__MODULE__{
           bootstrap_servers: String.t(),
           writer_batch_size: non_neg_integer() | nil,
-          writer_batch_timeout_ms: non_neg_integer() | nil
+          writer_batch_timeout_ms: non_neg_integer() | nil,
+          writer_dynamic_batch_size_enabled: boolean() | nil,
+          writer_dynamic_batch_size_min: non_neg_integer() | nil
         }
 
   @spec new(String.t()) :: t()
@@ -62,6 +66,15 @@ defmodule Fluss.Config do
   def set_writer_batch_timeout_ms(%__MODULE__{} = config, ms) when is_integer(ms),
     do: %{config | writer_batch_timeout_ms: ms}
 
+  @spec set_writer_dynamic_batch_size_enabled(t(), boolean()) :: t()
+  def set_writer_dynamic_batch_size_enabled(%__MODULE__{} = config, enabled)
+      when is_boolean(enabled),
+      do: %{config | writer_dynamic_batch_size_enabled: enabled}
+
+  @spec set_writer_dynamic_batch_size_min(t(), non_neg_integer()) :: t()
+  def set_writer_dynamic_batch_size_min(%__MODULE__{} = config, size) when is_integer(size),
+    do: %{config | writer_dynamic_batch_size_min: size}
+
   @spec get_bootstrap_servers(t()) :: String.t()
   def get_bootstrap_servers(%__MODULE__{bootstrap_servers: servers}), do: servers
 end
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
index 536ed68f3a..8bbdfad993 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
@@ -25,6 +25,8 @@ pub struct NifConfig {
     pub bootstrap_servers: String,
     pub writer_batch_size: Option<i32>,
     pub writer_batch_timeout_ms: Option<i64>,
+    pub writer_dynamic_batch_size_enabled: Option<bool>,
+    pub writer_dynamic_batch_size_min: Option<i32>,
 }
 
 impl NifConfig {
@@ -39,6 +41,12 @@ impl NifConfig {
         if let Some(ms) = self.writer_batch_timeout_ms {
             config.writer_batch_timeout_ms = ms;
         }
+        if let Some(enabled) = self.writer_dynamic_batch_size_enabled {
+            config.writer_dynamic_batch_size_enabled = enabled;
+        }
+        if let Some(size) = self.writer_dynamic_batch_size_min {
+            config.writer_dynamic_batch_size_min = size;
+        }
         config
     }
 }
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index fc71397386..5a59ea513e 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -164,6 +164,14 @@ class Config:
     @writer_batch_size.setter
     def writer_batch_size(self, size: int) -> None: ...
     @property
+    def writer_dynamic_batch_size_enabled(self) -> bool: ...
+    @writer_dynamic_batch_size_enabled.setter
+    def writer_dynamic_batch_size_enabled(self, enabled: bool) -> None: ...
+    @property
+    def writer_dynamic_batch_size_min(self) -> int: ...
+    @writer_dynamic_batch_size_min.setter
+    def writer_dynamic_batch_size_min(self, size: int) -> None: ...
+    @property
     def writer_bucket_no_key_assigner(self) -> str: ...
     @writer_bucket_no_key_assigner.setter
     def writer_bucket_no_key_assigner(self, value: str) -> None: ...
diff --git a/fluss-rust/bindings/python/src/config.rs b/fluss-rust/bindings/python/src/config.rs
index 65bcc9adfe..11188bf3c6 100644
--- a/fluss-rust/bindings/python/src/config.rs
+++ b/fluss-rust/bindings/python/src/config.rs
@@ -60,6 +60,25 @@ impl Config {
                             FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
                         })?;
                     }
+                    "writer.dynamic-batch-size.enabled" => {
+                        config.writer_dynamic_batch_size_enabled = match value.as_str() {
+                            "true" => true,
+                            "false" => false,
+                            other => {
+                                return Err(FlussError::new_err(format!(
+                                    "Invalid value '{other}' for '{key}', expected 'true' or 'false'"
+                                )));
+                            }
+                        };
+                    }
+                    "writer.dynamic-batch-size-min" => {
+                        config.writer_dynamic_batch_size_min =
+                            value.parse::<i32>().map_err(|e| {
+                                FlussError::new_err(format!(
+                                    "Invalid value '{value}' for '{key}': {e}"
+                                ))
+                            })?;
+                    }
                     "writer.batch-timeout-ms" => {
                         config.writer_batch_timeout_ms = value.parse::<i64>().map_err(|e| {
                             FlussError::new_err(format!("Invalid value '{value}' for '{key}': {e}"))
@@ -250,6 +269,30 @@ impl Config {
         self.inner.writer_batch_size = size;
     }
 
+    /// Get whether the per-table dynamic batch size estimator is enabled (default: true)
+    #[getter]
+    fn writer_dynamic_batch_size_enabled(&self) -> bool {
+        self.inner.writer_dynamic_batch_size_enabled
+    }
+
+    /// Toggle the per-table dynamic batch size estimator; when off, `writer_batch_size` is used as-is
+    #[setter]
+    fn set_writer_dynamic_batch_size_enabled(&mut self, enabled: bool) {
+        self.inner.writer_dynamic_batch_size_enabled = enabled;
+    }
+
+    /// Get the lower bound, in bytes, used by the dynamic batch size estimator (default: 256 KB)
+    #[getter]
+    fn writer_dynamic_batch_size_min(&self) -> i32 {
+        self.inner.writer_dynamic_batch_size_min
+    }
+
+    /// Set the lower bound, in bytes, used by the dynamic batch size estimator (no range check here)
+    #[setter]
+    fn set_writer_dynamic_batch_size_min(&mut self, size: i32) {
+        self.inner.writer_dynamic_batch_size_min = size;
+    }
+
     /// Get the scanner remote log prefetch num
     #[getter]
     fn scanner_remote_log_prefetch_num(&self) -> usize {
diff --git a/fluss-rust/crates/fluss/src/client/write/accumulator.rs b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
index 019d3b05d4..244edf7399 100644
--- a/fluss-rust/crates/fluss/src/client/write/accumulator.rs
+++ b/fluss-rust/crates/fluss/src/client/write/accumulator.rs
@@ -19,6 +19,7 @@ use crate::client::broadcast;
 use crate::client::write::IdempotenceManager;
 use crate::client::write::batch::WriteBatch::{ArrowLog, Kv};
 use crate::client::write::batch::{ArrowLogWriteBatch, KvWriteBatch, WriteBatch};
+use crate::client::write::dynamic_batch_size::DynamicWriteBatchSizeEstimator;
 use crate::client::{LogWriteRecord, Record, ResultHandle, WriteRecord};
 use crate::cluster::{BucketLocation, Cluster, ServerNode};
 use crate::compression::ArrowCompressionRatioEstimator;
@@ -307,28 +308,32 @@ impl RecordAccumulator {
             None
         };
 
-        let (dq, compression_ratio_estimator) = {
-            let mut binding =
-                self.write_batches
-                    .entry(Arc::clone(physical_table_path))
-                    .or_insert_with(|| BucketAndWriteBatches {
-                        table_id: table_info.table_id,
+        let (dq, compression_ratio_estimator, dynamic_target) = {
+            let mut binding = self
+                .write_batches
+                .entry(Arc::clone(physical_table_path))
+                .or_insert_with(|| {
+                    BucketAndWriteBatches::new(
+                        table_info.table_id,
                         is_partitioned_table,
                         partition_id,
-                        batches: Default::default(),
-                        compression_ratio_estimator: Arc::new(
-                            ArrowCompressionRatioEstimator::default(),
-                        ),
-                    });
+                        &self.config,
+                    )
+                });
             let bucket_and_batches = binding.value_mut();
             let dq = bucket_and_batches
                 .batches
                 .entry(bucket_id)
                 .or_insert_with(|| Arc::new(Mutex::new(VecDeque::new())))
                 .clone();
+            let dynamic_target = bucket_and_batches
+                .dynamic_batch_size
+                .as_ref()
+                .map(|est| est.current());
             (
                 dq,
                 Arc::clone(&bucket_and_batches.compression_ratio_estimator),
+                dynamic_target,
             )
         };
 
@@ -347,12 +352,7 @@ impl RecordAccumulator {
         // producer holds dq + blocks on memory, while sender needs dq to drain.
         drop(dq_guard);
 
-        // TODO: Implement DynamicWriteBatchSizeEstimator matching Java's
-        // client.writer.dynamic-batch-size-enabled. Adjusts the batch size target
-        // per table based on observed actual batch sizes (grow 10% when >80% full,
-        // shrink 5% when <50% full, clamped to [2*pageSize, maxBatchSize]).
-        // This would improve memory limiter utilization for tables with small rows.
-        let batch_size = self.config.writer_batch_size as usize;
+        let batch_size = dynamic_target.unwrap_or(self.config.writer_batch_size as usize);
         let record_size = record.estimated_record_size();
         let alloc_size = batch_size.max(record_size);
         let permit = self.memory_limiter.acquire(alloc_size)?;
@@ -664,6 +664,8 @@ impl RecordAccumulator {
                     let current_batch_size = batch.estimated_size_in_bytes();
                     size += current_batch_size;
 
+                    self.record_actual_batch_size(table_path, current_batch_size);
+
                     // mark the batch as drained.
                     batch.drained(current_time_ms());
                     ready.push(ReadyWriteBatch {
@@ -690,6 +692,38 @@ impl RecordAccumulator {
         self.incomplete_batches.write().remove(&batch_id);
     }
 
+    /// Feeds one observed batch size into the dynamic estimator of `table_path`.
+    ///
+    /// Does nothing when the table has no entry in `write_batches` or when the entry
+    /// carries no estimator. A changed target is reported at debug level.
+    fn record_actual_batch_size(&self, table_path: &Arc<PhysicalTablePath>, actual: usize) {
+        let Some(table_entry) = self.write_batches.get(table_path) else {
+            return;
+        };
+        if let Some(estimator) = table_entry.dynamic_batch_size.as_ref() {
+            let before = estimator.current();
+            let after = estimator.update(actual);
+            if before != after {
+                log::debug!(
+                    "Set estimated batch size for {} from {} to {}",
+                    table_path.as_ref(),
+                    before,
+                    after
+                );
+            }
+        }
+    }
+
+    /// Test-only accessor for the current dynamic target of `table_path`.
+    ///
+    /// Returns `None` when the table has no entry or the entry has no estimator.
+    #[cfg(test)]
+    fn estimated_batch_size(&self, table_path: &Arc<PhysicalTablePath>) -> Option<usize> {
+        let table_entry = self.write_batches.get(table_path)?;
+        let estimator = table_entry.dynamic_batch_size.as_ref()?;
+        Some(estimator.current())
+    }
+
     pub fn re_enqueue(&self, mut ready_write_batch: ReadyWriteBatch) {
         ready_write_batch.write_batch.re_enqueued();
 
@@ -785,12 +815,13 @@ impl RecordAccumulator {
         let mut binding = self
             .write_batches
             .entry(Arc::clone(physical_table_path))
-            .or_insert_with(|| BucketAndWriteBatches {
-                table_id,
-                is_partitioned_table,
-                partition_id,
-                batches: Default::default(),
-                compression_ratio_estimator: Arc::new(ArrowCompressionRatioEstimator::default()),
+            .or_insert_with(|| {
+                BucketAndWriteBatches::new(
+                    table_id,
+                    is_partitioned_table,
+                    partition_id,
+                    &self.config,
+                )
             });
         let bucket_and_batches = binding.value_mut();
         bucket_and_batches
@@ -938,6 +969,38 @@ struct BucketAndWriteBatches {
     batches: HashMap<BucketId, Arc<Mutex<VecDeque<WriteBatch>>>>,
     /// Compression ratio estimator shared across Arrow log batches for this table.
     compression_ratio_estimator: Arc<ArrowCompressionRatioEstimator>,
+    /// `None` when `writer_dynamic_batch_size_enabled` is false.
+    dynamic_batch_size: Option<DynamicWriteBatchSizeEstimator>,
+}
+
+impl BucketAndWriteBatches {
+    /// Builds the per-table state with no batches queued yet.
+    ///
+    /// A dynamic batch size estimator constructed from
+    /// `writer_dynamic_batch_size_min` and `writer_batch_size` is attached only when
+    /// `config.writer_dynamic_batch_size_enabled` is set.
+    fn new(
+        table_id: TableId,
+        is_partitioned_table: bool,
+        partition_id: Option<PartitionId>,
+        config: &Config,
+    ) -> Self {
+        let dynamic_batch_size = if config.writer_dynamic_batch_size_enabled {
+            let lower = config.writer_dynamic_batch_size_min as usize;
+            let upper = config.writer_batch_size as usize;
+            Some(DynamicWriteBatchSizeEstimator::new(lower, upper))
+        } else {
+            None
+        };
+        Self {
+            table_id,
+            is_partitioned_table,
+            partition_id,
+            batches: Default::default(),
+            compression_ratio_estimator: Arc::new(ArrowCompressionRatioEstimator::default()),
+            dynamic_batch_size,
+        }
+    }
 }
 
 pub struct RecordAppendResult {
@@ -999,9 +1056,12 @@ impl ReadyCheckResult {
 #[cfg(test)]
 mod tests {
     use super::*;
+    use crate::client::write::write_format::WriteFormat;
+    use crate::client::write::{RowBytes, WriteRecord};
     use crate::metadata::TablePath;
     use crate::row::{Datum, GenericRow};
     use crate::test_utils::{build_cluster, build_table_info};
+    use bytes::Bytes;
     use std::sync::Arc;
 
     fn disabled_idempotence() -> Arc<IdempotenceManager> {
@@ -1563,4 +1623,137 @@ mod tests {
             .await
             .expect("notified should complete after wakeup_sender");
     }
+
+    #[test]
+    fn dynamic_batch_size_shrinks_after_small_drained_batch() {
+        let target = 256 * 1024;
+        let config = Config {
+            writer_dynamic_batch_size_enabled: true,
+            writer_batch_size: target,
+            writer_dynamic_batch_size_min: 4 * 1024,
+            writer_buffer_memory_size: 1024 * 1024,
+            ..Config::default()
+        };
+        let accumulator = RecordAccumulator::new(config, disabled_idempotence());
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let cluster = Arc::new(build_cluster(&table_path, 1, 1));
+        let row = GenericRow {
+            values: vec![Datum::Int32(1)],
+        };
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
+
+        accumulator.append(&record, 0, &cluster, false).unwrap();
+        assert_eq!(*accumulator.memory_limiter.state.lock(), target as usize);
+
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        let mut drained = accumulator
+            .drain(cluster.clone(), &nodes, 1024 * 1024)
+            .unwrap();
+        let mut batches = drained.remove(&1).expect("drained batches");
+        let batch = batches.pop().expect("batch");
+        accumulator.remove_incomplete_batches(batch.write_batch.batch_id());
+        assert_eq!(*accumulator.memory_limiter.state.lock(), 0);
+
+        accumulator.append(&record, 0, &cluster, false).unwrap();
+        let second = *accumulator.memory_limiter.state.lock();
+        assert!(second < target as usize, "{second} >= {target}");
+    }
+
+    #[test]
+    fn dynamic_batch_size_grows_after_full_drained_batch() {
+        let max = 256 * 1024;
+        let config = Config {
+            writer_dynamic_batch_size_enabled: true,
+            writer_batch_size: max,
+            writer_dynamic_batch_size_min: 4 * 1024,
+            writer_buffer_memory_size: 4 * 1024 * 1024,
+            ..Config::default()
+        };
+        let accumulator = RecordAccumulator::new(config, disabled_idempotence());
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let cluster = Arc::new(build_cluster(&table_path, 1, 1));
+        let nodes = HashSet::from([cluster.get_tablet_server(1).unwrap().clone()]);
+
+        let kv = |size: usize| {
+            WriteRecord::for_upsert(
+                Arc::clone(&table_info),
+                Arc::clone(&physical_table_path),
+                1,
+                Bytes::from(vec![0u8; 32]),
+                None,
+                WriteFormat::CompactedKv,
+                None,
+                Some(RowBytes::Owned(Bytes::from(vec![0u8; size]))),
+            )
+        };
+        let drain_one = || {
+            let mut d = accumulator.drain(cluster.clone(), &nodes, max).unwrap();
+            let b = d.remove(&1).unwrap().pop().unwrap();
+            accumulator.remove_incomplete_batches(b.write_batch.batch_id());
+        };
+        let target = || {
+            accumulator
+                .estimated_batch_size(&physical_table_path)
+                .unwrap()
+        };
+
+        accumulator.append(&kv(1), 0, &cluster, false).unwrap();
+        drain_one();
+        let after_shrink = target();
+        assert!(
+            after_shrink < max as usize,
+            "shrink failed: after_shrink={after_shrink} max={max}"
+        );
+
+        // 0.9 sits safely above GROW_THRESHOLD (0.8) to avoid f64 boundary noise.
+        accumulator
+            .append(&kv(after_shrink * 9 / 10), 0, &cluster, false)
+            .unwrap();
+        drain_one();
+        let after_grow = target();
+        assert!(
+            after_grow > after_shrink,
+            "grow failed: after_grow={after_grow} after_shrink={after_shrink}"
+        );
+    }
+
+    #[test]
+    fn dynamic_batch_size_disabled_keeps_static_target() {
+        let target = 256 * 1024;
+        let config = Config {
+            writer_dynamic_batch_size_enabled: false,
+            writer_batch_size: target,
+            writer_dynamic_batch_size_min: 4 * 1024,
+            writer_buffer_memory_size: 1024 * 1024,
+            ..Config::default()
+        };
+        let accumulator = RecordAccumulator::new(config, disabled_idempotence());
+        let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+        let table_info = Arc::new(build_table_info(table_path.clone(), 1, 1));
+        let physical_table_path = Arc::new(PhysicalTablePath::of(Arc::new(table_path.clone())));
+        let cluster = Arc::new(build_cluster(&table_path, 1, 1));
+        let row = GenericRow {
+            values: vec![Datum::Int32(1)],
+        };
+        let record = WriteRecord::for_append(table_info, physical_table_path, 1, &row);
+
+        let server = cluster.get_tablet_server(1).expect("server");
+        let nodes = HashSet::from([server.clone()]);
+        for _ in 0..3 {
+            accumulator.append(&record, 0, &cluster, false).unwrap();
+            assert_eq!(*accumulator.memory_limiter.state.lock(), target as usize);
+
+            let mut drained = accumulator
+                .drain(cluster.clone(), &nodes, 1024 * 1024)
+                .unwrap();
+            let mut batches = drained.remove(&1).expect("drained batches");
+            let batch = batches.pop().expect("batch");
+            accumulator.remove_incomplete_batches(batch.write_batch.batch_id());
+        }
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/client/write/dynamic_batch_size.rs b/fluss-rust/crates/fluss/src/client/write/dynamic_batch_size.rs
new file mode 100644
index 0000000000..408263ee5f
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/write/dynamic_batch_size.rs
@@ -0,0 +1,175 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Per-table batch size estimator. Mirrors Java's `DynamicWriteBatchSizeEstimator`:
+//! grow 10% above 80% fill, shrink 5% below 50%, clamped to `[min, max]`.
+
+use std::sync::atomic::{AtomicUsize, Ordering};
+
+/// Fill ratio (observed / target) above which the target grows.
+const GROW_THRESHOLD: f64 = 0.8;
+/// Fill ratio (observed / target) below which the target shrinks.
+const SHRINK_THRESHOLD: f64 = 0.5;
+/// Multiplier applied to the target on a grow step.
+const GROW_FACTOR: f64 = 1.1;
+/// Multiplier applied to the target on a shrink step.
+const SHRINK_FACTOR: f64 = 0.95;
+
+/// Adaptive batch size target, adjusted from the sizes passed to [`Self::update`].
+#[derive(Debug)]
+pub(crate) struct DynamicWriteBatchSizeEstimator {
+    /// Current target size; starts at `max` and is kept within `[min, max]`.
+    current: AtomicUsize,
+    /// Lower clamp bound; never greater than `max`.
+    min: usize,
+    /// Upper clamp bound and initial target.
+    max: usize,
+}
+
+impl DynamicWriteBatchSizeEstimator {
+    /// Creates an estimator that starts at `max_size`.
+    ///
+    /// A `min_size` above `max_size` is lowered to `max_size` so the clamp range stays valid.
+    pub fn new(min_size: usize, max_size: usize) -> Self {
+        Self {
+            current: AtomicUsize::new(max_size),
+            min: min_size.min(max_size),
+            max: max_size,
+        }
+    }
+
+    /// Returns the current target.
+    pub fn current(&self) -> usize {
+        self.current.load(Ordering::Relaxed)
+    }
+
+    /// Adjusts the target from one observed batch size and returns the new target.
+    ///
+    /// The load and store are separate operations, so concurrent callers race with
+    /// last-write-wins semantics, matching Java's `ConcurrentHashMap.put`.
+    pub fn update(&self, actual: usize) -> usize {
+        let prev = self.current.load(Ordering::Relaxed);
+        let cur = prev as f64;
+        let actual = actual as f64;
+        let next = if actual > cur * GROW_THRESHOLD {
+            // The float-to-int cast truncates, so a 10% step rounds back to `prev` for
+            // targets below 10; force at least +1 so a tiny target can still grow.
+            ((cur * GROW_FACTOR) as usize).max(prev.saturating_add(1))
+        } else if actual < cur * SHRINK_THRESHOLD {
+            (cur * SHRINK_FACTOR) as usize
+        } else {
+            prev
+        };
+        let clamped = next.clamp(self.min, self.max);
+        if clamped != prev {
+            self.current.store(clamped, Ordering::Relaxed);
+        }
+        clamped
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+
+    const MIN: usize = 256 * 1024;
+    const MAX: usize = 2 * 1024 * 1024;
+    /// ~41 shrink steps, ~22 grow steps; 50 covers both with margin.
+    const CONVERGENCE_STEPS: usize = 50;
+
+    #[test]
+    fn starts_at_max() {
+        let est = DynamicWriteBatchSizeEstimator::new(MIN, MAX);
+        assert_eq!(est.current(), MAX);
+    }
+
+    #[test]
+    fn min_clamped_to_max_when_misconfigured() {
+        let est = DynamicWriteBatchSizeEstimator::new(MAX * 2, MAX);
+        assert_eq!(est.current(), MAX);
+        assert_eq!(est.update(0), MAX);
+    }
+
+    #[test]
+    fn grows_when_above_grow_threshold() {
+        let est = DynamicWriteBatchSizeEstimator::new(MIN, MAX);
+        for _ in 0..CONVERGENCE_STEPS {
+            est.update(0);
+        }
+        assert_eq!(est.current(), MIN);
+
+        // 0.9 sits safely past the 0.8 threshold and avoids f64 boundary noise.
+        let next = est.update((MIN as f64 * 0.9) as usize);
+        assert_eq!(next, ((MIN as f64) * GROW_FACTOR) as usize);
+    }
+
+    #[test]
+    fn grow_makes_progress_for_tiny_targets() {
+        // 4 * 1.1 truncates back to 4; the target must still be able to grow.
+        let est = DynamicWriteBatchSizeEstimator::new(4, 16);
+        for _ in 0..CONVERGENCE_STEPS {
+            est.update(0);
+        }
+        assert_eq!(est.current(), 4);
+        assert_eq!(est.update(4), 5);
+    }
+
+    #[test]
+    fn shrinks_when_below_shrink_threshold() {
+        let est = DynamicWriteBatchSizeEstimator::new(MIN, MAX);
+        // 0.4 sits safely below the strict 0.5 threshold.
+        let next = est.update((MAX as f64 * 0.4) as usize);
+        assert_eq!(next, ((MAX as f64) * SHRINK_FACTOR) as usize);
+    }
+
+    #[test]
+    fn shrink_clamps_to_min() {
+        let est = DynamicWriteBatchSizeEstimator::new(MIN, MAX);
+        for _ in 0..CONVERGENCE_STEPS {
+            est.update(0);
+        }
+        assert_eq!(est.current(), MIN);
+    }
+
+    #[test]
+    fn grow_clamps_to_max() {
+        let est = DynamicWriteBatchSizeEstimator::new(MIN, MAX);
+        for _ in 0..CONVERGENCE_STEPS {
+            est.update(0);
+        }
+        for _ in 0..CONVERGENCE_STEPS {
+            est.update(est.current());
+        }
+        assert_eq!(est.current(), MAX);
+    }
+
+    #[test]
+    fn oversized_actual_clamps_at_max() {
+        let est = DynamicWriteBatchSizeEstimator::new(MIN, MAX);
+        assert_eq!(est.update(MAX * 4), MAX);
+    }
+
+    #[test]
+    fn dead_zone_is_a_fixed_point() {
+        let est = DynamicWriteBatchSizeEstimator::new(MIN, MAX);
+        let initial = est.current();
+        for _ in 0..20 {
+            est.update((est.current() as f64 * 0.65) as usize);
+        }
+        assert_eq!(est.current(), initial);
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/write/mod.rs b/fluss-rust/crates/fluss/src/client/write/mod.rs
index bc324e1827..a65b5d5af1 100644
--- a/fluss-rust/crates/fluss/src/client/write/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/write/mod.rs
@@ -17,6 +17,7 @@
 
 mod accumulator;
 mod batch;
+mod dynamic_batch_size;
 mod idempotence;
 
 use crate::client::broadcast::{self as client_broadcast, BatchWriteResult, BroadcastOnceReceiver};
diff --git a/fluss-rust/crates/fluss/src/config.rs b/fluss-rust/crates/fluss/src/config.rs
index 09a17f830d..cad8d9cb55 100644
--- a/fluss-rust/crates/fluss/src/config.rs
+++ b/fluss-rust/crates/fluss/src/config.rs
@@ -22,6 +22,9 @@ use strum_macros::{Display, EnumString};
 const DEFAULT_BOOTSTRAP_SERVER: &str = "127.0.0.1:9123";
 const DEFAULT_REQUEST_MAX_SIZE: i32 = 10 * 1024 * 1024;
 const DEFAULT_WRITER_BATCH_SIZE: i32 = 2 * 1024 * 1024;
+// Mirrors Java's `2 * pageSize` floor with default pageSize = 128 KB.
+const DEFAULT_WRITER_DYNAMIC_BATCH_SIZE_MIN: i32 = 256 * 1024;
+const DEFAULT_WRITER_DYNAMIC_BATCH_SIZE_ENABLED: bool = true;
 const DEFAULT_RETRIES: i32 = i32::MAX;
 const DEFAULT_PREFETCH_NUM: usize = 4;
 const DEFAULT_DOWNLOAD_THREADS: usize = 3;
@@ -76,6 +79,17 @@ pub struct Config {
     #[arg(long, default_value_t = DEFAULT_WRITER_BATCH_SIZE)]
     pub writer_batch_size: i32,
 
+    /// Tune the per-table writer batch size from observed fill ratios.
+    /// Default: true (matching Java `client.writer.dynamic-batch-size.enabled`).
+    #[arg(long, default_value_t = DEFAULT_WRITER_DYNAMIC_BATCH_SIZE_ENABLED)]
+    pub writer_dynamic_batch_size_enabled: bool,
+
+    /// Lower bound for the dynamic batch size estimator.
+    /// Default: 262144 (256 KB), matching Java's `2 * pageSize` floor.
+    /// Ignored when `writer_dynamic_batch_size_enabled` is false.
+    #[arg(long, default_value_t = DEFAULT_WRITER_DYNAMIC_BATCH_SIZE_MIN)]
+    pub writer_dynamic_batch_size_min: i32,
+
     #[arg(long, value_enum, default_value_t = NoKeyAssigner::Sticky)]
     pub writer_bucket_no_key_assigner: NoKeyAssigner,
 
@@ -199,6 +213,14 @@ impl std::fmt::Debug for Config {
             .field("writer_acks", &self.writer_acks)
             .field("writer_retries", &self.writer_retries)
             .field("writer_batch_size", &self.writer_batch_size)
+            .field(
+                "writer_dynamic_batch_size_enabled",
+                &self.writer_dynamic_batch_size_enabled,
+            )
+            .field(
+                "writer_dynamic_batch_size_min",
+                &self.writer_dynamic_batch_size_min,
+            )
             .field(
                 "writer_bucket_no_key_assigner",
                 &self.writer_bucket_no_key_assigner,
@@ -267,6 +289,8 @@ impl Default for Config {
             writer_acks: String::from(DEFAULT_ACKS),
             writer_retries: i32::MAX,
             writer_batch_size: DEFAULT_WRITER_BATCH_SIZE,
+            writer_dynamic_batch_size_enabled: DEFAULT_WRITER_DYNAMIC_BATCH_SIZE_ENABLED,
+            writer_dynamic_batch_size_min: DEFAULT_WRITER_DYNAMIC_BATCH_SIZE_MIN,
             writer_bucket_no_key_assigner: NoKeyAssigner::Sticky,
             scanner_remote_log_prefetch_num: DEFAULT_PREFETCH_NUM,
             remote_file_download_thread_num: DEFAULT_DOWNLOAD_THREADS,
@@ -388,6 +412,15 @@ impl Config {
         if self.writer_batch_size as usize > self.writer_buffer_memory_size {
             return Err("writer_batch_size must be <= writer_buffer_memory_size".to_string());
         }
+        // The bounds are only enforced while the estimator is enabled; the option is
+        // documented as ignored otherwise.
+        let dynamic_min = self.writer_dynamic_batch_size_min;
+        if self.writer_dynamic_batch_size_enabled && dynamic_min <= 0 {
+            return Err("writer_dynamic_batch_size_min must be > 0".to_string());
+        }
+        if self.writer_dynamic_batch_size_enabled && dynamic_min > self.writer_batch_size {
+            return Err("writer_dynamic_batch_size_min must be <= writer_batch_size".to_string());
+        }
         // idempotence checks
         if !self.writer_enable_idempotence {
             return Ok(());
diff --git a/fluss-rust/website/docs/user-guide/cpp/api-reference.md b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
index ae4e9490a5..e9b94c9d9e 100644
--- a/fluss-rust/website/docs/user-guide/cpp/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/cpp/api-reference.md
@@ -21,7 +21,9 @@ Complete API reference for the Fluss C++ client.
 | `writer_request_max_size`             | `int32_t`     | `10485760` (10 MB)   | Maximum request size in bytes                                                            |
 | `writer_acks`                         | `std::string` | `"all"`              | Acknowledgment setting (`"all"`, `"0"`, `"1"`, or `"-1"`)                                |
 | `writer_retries`                      | `int32_t`     | `INT32_MAX`          | Number of retries on failure                                                             |
-| `writer_batch_size`                   | `int32_t`     | `2097152` (2 MB)     | Batch size for writes in bytes                                                           |
+| `writer_batch_size`                   | `int32_t`     | `2097152` (2 MB)     | Batch size for writes in bytes. Upper bound when dynamic sizing is on; fixed batch size when off |
+| `writer_dynamic_batch_size_enabled`   | `bool`        | `true`               | Enable per-table dynamic batch sizing: target grows 10% above 80% fill, shrinks 5% below 50% |
+| `writer_dynamic_batch_size_min`       | `int32_t`     | `262144` (256 KB)    | Lower bound for the dynamic batch size estimator (ignored when disabled)                 |
 | `writer_batch_timeout_ms`             | `int64_t`     | `100`                | Maximum time in ms to wait for a writer batch to fill up before sending                  |
 | `writer_bucket_no_key_assigner`       | `std::string` | `"sticky"`           | Bucket assignment strategy for tables without bucket keys: `"sticky"` or `"round_robin"` |
 | `scanner_remote_log_prefetch_num`     | `size_t`      | `4`                  | Number of remote log segments to prefetch                                                |
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index 32f23a59f7..aec4412dbf 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -14,7 +14,9 @@ Complete API reference for the Fluss Python client.
 | `writer_request_max_size`             | `writer.request-max-size`             | Get/set max request size in bytes                                                       |
 | `writer_acks`                         | `writer.acks`                         | Get/set acknowledgment setting (`"all"` for all replicas)                               |
 | `writer_retries`                      | `writer.retries`                      | Get/set number of retries on failure                                                    |
-| `writer_batch_size`                   | `writer.batch-size`                   | Get/set write batch size in bytes                                                       |
+| `writer_batch_size`                   | `writer.batch-size`                   | Get/set write batch size in bytes. Upper bound when dynamic sizing is on; fixed batch size when off |
+| `writer_dynamic_batch_size_enabled`   | `writer.dynamic-batch-size.enabled`   | Get/set whether the per-table dynamic batch size estimator is enabled (default `true`)  |
+| `writer_dynamic_batch_size_min`       | `writer.dynamic-batch-size-min`       | Get/set the lower bound for the dynamic batch size estimator (default 256 KB; ignored when disabled) |
 | `writer_batch_timeout_ms`             | `writer.batch-timeout-ms`             | Get/set max time in ms to wait for a writer batch to fill up before sending             |
 | `writer_bucket_no_key_assigner`       | `writer.bucket.no-key-assigner`       | Get/set bucket assignment strategy (`"sticky"` or `"round_robin"`)                      |
 | `scanner_remote_log_prefetch_num`     | `scanner.remote-log.prefetch-num`     | Get/set number of remote log segments to prefetch                                       |
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 9f2994ad60..03054f0f31 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -13,7 +13,9 @@ Complete API reference for the Fluss Rust client.
 | `writer_request_max_size`             | `i32`           | `10485760` (10 MB) | Maximum request size in bytes                                                        |
 | `writer_acks`                         | `String`        | `"all"`            | Acknowledgment setting (`"all"` waits for all replicas)                              |
 | `writer_retries`                      | `i32`           | `i32::MAX`         | Number of retries on failure                                                         |
-| `writer_batch_size`                   | `i32`           | `2097152` (2 MB)   | Batch size for writes in bytes                                                       |
+| `writer_batch_size`                   | `i32`           | `2097152` (2 MB)   | Batch size for writes in bytes. Upper bound when dynamic sizing is on; fixed batch size when off. |
+| `writer_dynamic_batch_size_enabled`   | `bool`          | `true`             | Enable per-table dynamic batch sizing: target grows 10% above 80% fill, shrinks 5% below 50%, clamped to `[writer_dynamic_batch_size_min, writer_batch_size]` |
+| `writer_dynamic_batch_size_min`       | `i32`           | `262144` (256 KB)  | Lower bound for the dynamic batch size estimator (ignored when `writer_dynamic_batch_size_enabled` is `false`) |
 | `writer_batch_timeout_ms`             | `i64`           | `100`              | Maximum time in ms to wait for a writer batch to fill up before sending              |
 | `writer_bucket_no_key_assigner`       | `NoKeyAssigner` | `sticky`           | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` |
 | `scanner_remote_log_prefetch_num`     | `usize`         | `4`                | Number of remote log segments to prefetch                                            |

From 55b3e71f2d9cd08300ebe49e78eef2c6bc9fba77 Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sun, 10 May 2026 13:52:32 +0200
Subject: [PATCH 263/287] [tests] Add integration tests for array data type
 (#523)

* Add integration tests for array data type

* Address review comments

* Consolidate tests

* Consolidate tests

* resolve conflicts
---
 .../bindings/python/test/test_kv_table.py     | 181 +++++++-
 .../fluss/tests/integration/kv_table.rs       | 204 +++++++-
 .../fluss/tests/integration/log_table.rs      | 439 +++++++++++++++++-
 .../crates/fluss/tests/integration/utils.rs   |  26 +-
 4 files changed, 837 insertions(+), 13 deletions(-)

diff --git a/fluss-rust/bindings/python/test/test_kv_table.py b/fluss-rust/bindings/python/test/test_kv_table.py
index 394073756e..a17b0ad30c 100644
--- a/fluss-rust/bindings/python/test/test_kv_table.py
+++ b/fluss-rust/bindings/python/test/test_kv_table.py
@@ -30,6 +30,17 @@
 import fluss
 
 
+async def _upsert_and_wait(writer, row):
+    handle = writer.upsert(row)
+    await handle.wait()
+
+
+def _assert_float_specials(values):
+    assert math.isnan(values[0])
+    assert math.isinf(values[1]) and values[1] > 0
+    assert math.isinf(values[2]) and values[2] < 0
+
+
 async def test_upsert_delete_and_lookup(connection, admin):
     """Test upsert, lookup, update, delete, and non-existent key lookup."""
     table_path = fluss.TablePath("fluss", "py_test_upsert_and_lookup")
@@ -335,6 +346,167 @@ async def test_partitioned_table_upsert_and_lookup(connection, admin):
     await admin.drop_table(table_path, ignore_if_not_exists=False)
 
 
+async def test_upsert_and_lookup_with_array(connection, admin):
+    """Test upsert and lookup with flat, nested, and null-pattern arrays in KV tables."""
+    table_path = fluss.TablePath("fluss", "py_test_kv_arrays")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("id", pa.int32()),
+                pa.field("tags", pa.list_(pa.string())),
+                pa.field("scores", pa.list_(pa.int32())),
+                pa.field("matrix", pa.list_(pa.list_(pa.int32()))),
+            ]
+        ),
+        primary_keys=["id"],
+    )
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    upsert_writer = table.new_upsert().create_writer()
+
+    await _upsert_and_wait(
+        upsert_writer,
+        {
+            "id": 1,
+            "tags": ["hello", "world"],
+            "scores": [10, 20, 30],
+            "matrix": [[1, 2], [3, 4]],
+        },
+    )
+    await _upsert_and_wait(
+        upsert_writer,
+        {"id": 2, "tags": [None], "scores": [], "matrix": None},
+    )
+    await _upsert_and_wait(
+        upsert_writer,
+        {"id": 3, "tags": None, "scores": [42], "matrix": [[], [5], [6, 7, 8]]},
+    )
+    await _upsert_and_wait(
+        upsert_writer,
+        {"id": 4, "tags": None, "scores": None, "matrix": [[1, None], None, []]},
+    )
+
+    lookuper = table.new_lookup().create_lookuper()
+
+    result1 = await lookuper.lookup({"id": 1})
+    assert result1 is not None
+    assert result1["tags"] == ["hello", "world"]
+    assert result1["scores"] == [10, 20, 30]
+    assert result1["matrix"] == [[1, 2], [3, 4]]
+
+    result2 = await lookuper.lookup({"id": 2})
+    assert result2 is not None
+    assert result2["tags"] == [None]
+    assert result2["scores"] == []
+    assert result2["matrix"] is None
+
+    result3 = await lookuper.lookup({"id": 3})
+    assert result3 is not None
+    assert result3["tags"] is None
+    assert result3["scores"] == [42]
+    assert result3["matrix"] == [[], [5], [6, 7, 8]]
+
+    result4 = await lookuper.lookup({"id": 4})
+    assert result4 is not None
+    assert result4["tags"] is None
+    assert result4["scores"] is None
+    assert result4["matrix"] == [[1, None], None, []]
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_upsert_and_lookup_with_array_rich_types(connection, admin):
+    """Test upsert/lookup for arrays with rich element types and encoding edge cases."""
+    table_path = fluss.TablePath("fluss", "py_test_kv_arrays_rich_types")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("id", pa.int32()),
+                pa.field("arr_bytes", pa.list_(pa.binary())),
+                pa.field("arr_date", pa.list_(pa.date32())),
+                pa.field("arr_time", pa.list_(pa.time32("ms"))),
+                pa.field("arr_ts_ntz", pa.list_(pa.timestamp("us"))),
+                pa.field("arr_ts_ltz", pa.list_(pa.timestamp("us", tz="UTC"))),
+                pa.field("arr_decimal", pa.list_(pa.decimal128(10, 2))),
+                pa.field("arr_long_str", pa.list_(pa.string())),
+                pa.field("arr_big_decimal", pa.list_(pa.decimal128(22, 5))),
+                pa.field("arr_ts_nano", pa.list_(pa.timestamp("ns"))),
+                pa.field("arr_float", pa.list_(pa.float32())),
+                pa.field("arr_double", pa.list_(pa.float64())),
+                # TODO(fluss-python#524): support PyArrow FixedSizeBinary in schema
+                # conversion. Then switch to pa.binary(4).
+                pa.field("arr_binary", pa.list_(pa.binary())),
+            ]
+        ),
+        primary_keys=["id"],
+    )
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    upsert_writer = table.new_upsert().create_writer()
+
+    await _upsert_and_wait(
+        upsert_writer,
+        {
+            "id": 1,
+            "arr_bytes": [b"\x10\x20\x30", None],
+            "arr_date": [date(2026, 1, 23), None],
+            "arr_time": [dt_time(10, 13, 47, 123000), None],
+            "arr_ts_ntz": [datetime(2026, 1, 23, 10, 13, 47, 123000)],
+            "arr_ts_ltz": [
+                datetime(2026, 1, 23, 10, 13, 47, 123000, tzinfo=timezone.utc)
+            ],
+            "arr_decimal": [Decimal("123.45"), None],
+            "arr_long_str": [
+                "abcdefgh",
+                "this is a much longer string that definitely exceeds inline",
+            ],
+            "arr_big_decimal": [
+                Decimal("12345678901234567.12345"),
+                Decimal("-99999999999999999.99999"),
+            ],
+            "arr_ts_nano": [datetime(2026, 1, 23, 10, 13, 47, 123456)],
+            "arr_float": [float("nan"), float("inf"), float("-inf")],
+            "arr_double": [float("nan"), float("inf"), float("-inf")],
+            "arr_binary": [b"\xde\xad\xbe\xef", b"\x00\x01\x02\x03"],
+        },
+    )
+
+    lookuper = table.new_lookup().create_lookuper()
+    result = await lookuper.lookup({"id": 1})
+    assert result is not None
+
+    assert result["arr_bytes"] == [b"\x10\x20\x30", None]
+    assert result["arr_date"] == [date(2026, 1, 23), None]
+    assert result["arr_time"] == [dt_time(10, 13, 47, 123000), None]
+    assert result["arr_ts_ntz"] == [datetime(2026, 1, 23, 10, 13, 47, 123000)]
+    assert result["arr_ts_ltz"] == [
+        datetime(2026, 1, 23, 10, 13, 47, 123000, tzinfo=timezone.utc)
+    ]
+    assert result["arr_decimal"] == [Decimal("123.45"), None]
+    assert result["arr_long_str"] == [
+        "abcdefgh",
+        "this is a much longer string that definitely exceeds inline",
+    ]
+    assert result["arr_big_decimal"] == [
+        Decimal("12345678901234567.12345"),
+        Decimal("-99999999999999999.99999"),
+    ]
+    assert result["arr_ts_nano"] == [datetime(2026, 1, 23, 10, 13, 47, 123456)]
+    _assert_float_specials(result["arr_float"])
+    _assert_float_specials(result["arr_double"])
+    assert result["arr_binary"] == [b"\xde\xad\xbe\xef", b"\x00\x01\x02\x03"]
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
 async def test_all_supported_datatypes(connection, admin):
     """Test upsert/lookup for all supported data types, including nulls."""
     table_path = fluss.TablePath("fluss", "py_test_kv_all_datatypes")
@@ -358,6 +530,7 @@ async def test_all_supported_datatypes(connection, admin):
                 pa.field("col_timestamp_ntz", pa.timestamp("us")),
                 pa.field("col_timestamp_ltz", pa.timestamp("us", tz="UTC")),
                 pa.field("col_bytes", pa.binary()),
+                pa.field("col_array", pa.list_(pa.string())),
                 pa.field("col_binary", pa.binary(16)),
             ]
         ),
@@ -386,11 +559,11 @@ async def test_all_supported_datatypes(connection, admin):
         "col_timestamp_ntz": datetime(2026, 1, 23, 10, 13, 47, 123000),
         "col_timestamp_ltz": datetime(2026, 1, 23, 10, 13, 47, 123000),
         "col_bytes": b"binary data",
+        "col_array": ["fluss", "python"],
         "col_binary": b"binary_data_0123",
     }
 
-    handle = upsert_writer.upsert(row_data)
-    await handle.wait()
+    await _upsert_and_wait(upsert_writer, row_data)
 
     lookuper = table.new_lookup().create_lookuper()
     result = await lookuper.lookup({"pk_int": 1})
@@ -413,6 +586,7 @@ async def test_all_supported_datatypes(connection, admin):
         2026, 1, 23, 10, 13, 47, 123000, tzinfo=timezone.utc
     )
     assert result["col_bytes"] == b"binary data"
+    assert result["col_array"] == ["fluss", "python"]
     assert result["col_binary"] == b"binary_data_0123"
 
     # Test with null values for all nullable columns
@@ -420,8 +594,7 @@ async def test_all_supported_datatypes(connection, admin):
     for col in row_data:
         if col != "pk_int":
             null_row[col] = None
-    handle = upsert_writer.upsert(null_row)
-    await handle.wait()
+    await _upsert_and_wait(upsert_writer, null_row)
 
     result = await lookuper.lookup({"pk_int": 2})
     assert result is not None, "Row with nulls should exist"
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index 1979b973f2..8787e88180 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -18,12 +18,19 @@
 
 #[cfg(test)]
 mod kv_table_test {
-    use crate::integration::utils::{create_partitions, create_table, get_shared_cluster};
+    use crate::integration::utils::{
+        create_partitions, create_table, get_shared_cluster, make_int_array, make_string_array,
+    };
     use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
-    use fluss::row::{GenericRow, InternalRow};
+    use fluss::row::binary_array::FlussArrayWriter;
+    use fluss::row::{FlussArray, GenericRow, InternalRow};
 
     fn make_key(id: i32) -> GenericRow<'static> {
-        let mut row = GenericRow::new(3);
+        make_key_with_field_count(id, 3)
+    }
+
+    fn make_key_with_field_count(id: i32, field_count: usize) -> GenericRow<'static> {
+        let mut row = GenericRow::new(field_count);
         row.set_field(0, id);
         row
     }
@@ -606,6 +613,7 @@ mod kv_table_test {
                     // Binary types
                     .column("col_bytes", DataTypes::bytes())
                     .column("col_binary", DataTypes::binary(20))
+                    .column("col_array", DataTypes::array(DataTypes::string()))
                     .primary_key(vec!["pk_int"])
                     .build()
                     .expect("Failed to build schema"),
@@ -644,8 +652,10 @@ mod kv_table_test {
         let col_bytes: &[u8] = b"binary data";
         let col_binary: &[u8] = b"fixed binary data!!!";
 
+        let col_array = make_string_array(&[Some("fluss"), Some("rust")]);
+
         // Upsert a row with all datatypes
-        let mut row = GenericRow::new(17);
+        let mut row = GenericRow::new(18);
         row.set_field(0, pk_int);
         row.set_field(1, col_boolean);
         row.set_field(2, col_tinyint);
@@ -663,6 +673,7 @@ mod kv_table_test {
         row.set_field(14, col_timestamp_ltz);
         row.set_field(15, col_bytes);
         row.set_field(16, col_binary);
+        row.set_field(17, col_array);
 
         upsert_writer
             .upsert(&row)
@@ -677,7 +688,7 @@ mod kv_table_test {
             .create_lookuper()
             .expect("Failed to create lookuper");
 
-        let mut key = GenericRow::new(17);
+        let mut key = GenericRow::new(18);
         key.set_field(0, pk_int);
 
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
@@ -772,10 +783,14 @@ mod kv_table_test {
             col_binary,
             "col_binary mismatch"
         );
+        let arr = found_row.get_array(17).unwrap();
+        assert_eq!(arr.size(), 2, "col_array size mismatch");
+        assert_eq!(arr.get_string(0).unwrap(), "fluss", "col_array[0] mismatch");
+        assert_eq!(arr.get_string(1).unwrap(), "rust", "col_array[1] mismatch");
 
         // Test with null values for nullable columns
         let pk_int_2 = 2i32;
-        let mut row_with_nulls = GenericRow::new(17);
+        let mut row_with_nulls = GenericRow::new(18);
         row_with_nulls.set_field(0, pk_int_2);
         row_with_nulls.set_field(1, Datum::Null); // col_boolean
         row_with_nulls.set_field(2, Datum::Null); // col_tinyint
@@ -793,6 +808,7 @@ mod kv_table_test {
         row_with_nulls.set_field(14, Datum::Null); // col_timestamp_ltz
         row_with_nulls.set_field(15, Datum::Null); // col_bytes
         row_with_nulls.set_field(16, Datum::Null); // col_binary
+        row_with_nulls.set_field(17, Datum::Null); // col_array
 
         upsert_writer
             .upsert(&row_with_nulls)
@@ -801,7 +817,7 @@ mod kv_table_test {
             .expect("Failed to wait for upsert acknowledgment");
 
         // Lookup row with nulls
-        let mut key2 = GenericRow::new(17);
+        let mut key2 = GenericRow::new(18);
         key2.set_field(0, pk_int_2);
 
         let result = lookuper.lookup(&key2).await.expect("Failed to lookup");
@@ -880,6 +896,180 @@ mod kv_table_test {
             found_row_nulls.is_null_at(16).unwrap(),
             "col_binary should be null"
         );
+        assert!(
+            found_row_nulls.is_null_at(17).unwrap(),
+            "col_array should be null"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn upsert_and_lookup_with_array() {
+        use fluss::row::Datum;
+
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_kv_arrays");
+        let inner_array_type = DataTypes::array(DataTypes::int());
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("tags", DataTypes::array(DataTypes::string()))
+                    .column("scores", DataTypes::array(DataTypes::int()))
+                    .column("matrix", DataTypes::array(inner_array_type.clone()))
+                    .primary_key(vec!["id"])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let upsert = table.new_upsert().expect("Failed to create upsert");
+        let upsert_writer = upsert.create_writer().expect("Failed to create writer");
+
+        // Row 1: id=1, tags=["hello", "world"], scores=[10, 20, 30], matrix=[[1,2],[3,4]]
+        let mut row1 = GenericRow::new(4);
+        row1.set_field(0, 1_i32);
+        row1.set_field(1, make_string_array(&[Some("hello"), Some("world")]));
+        row1.set_field(2, make_int_array(&[Some(10), Some(20), Some(30)]));
+        let m1 = {
+            let mut w = FlussArrayWriter::new(2, &inner_array_type);
+            w.write_array(0, &make_int_array(&[Some(1), Some(2)]));
+            w.write_array(1, &make_int_array(&[Some(3), Some(4)]));
+            w.complete().expect("matrix1")
+        };
+        row1.set_field(3, m1);
+
+        upsert_writer
+            .upsert(&row1)
+            .expect("upsert row1")
+            .await
+            .expect("ack row1");
+
+        // Row 2: id=2, tags=[null element], scores=[] (empty), matrix=null
+        let mut row2 = GenericRow::new(4);
+        row2.set_field(0, 2_i32);
+        row2.set_field(1, make_string_array(&[None]));
+        row2.set_field(2, make_int_array(&[]));
+        row2.set_field(3, Datum::Null);
+
+        upsert_writer
+            .upsert(&row2)
+            .expect("upsert row2")
+            .await
+            .expect("ack row2");
+
+        // Row 3: id=3, tags=null, scores=[42], matrix=[[5], null, []]
+        let mut row3 = GenericRow::new(4);
+        row3.set_field(0, 3_i32);
+        row3.set_field(1, Datum::Null);
+        row3.set_field(2, make_int_array(&[Some(42)]));
+        let m3 = {
+            let mut w = FlussArrayWriter::new(3, &inner_array_type);
+            w.write_array(0, &make_int_array(&[Some(5)]));
+            w.set_null_at(1);
+            w.write_array(2, &make_int_array(&[]));
+            w.complete().expect("matrix3")
+        };
+        row3.set_field(3, m3);
+
+        upsert_writer
+            .upsert(&row3)
+            .expect("upsert row3")
+            .await
+            .expect("ack row3");
+
+        // Lookup and verify
+        let mut lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .create_lookuper()
+            .expect("Failed to create lookuper");
+
+        // Verify row 1: populated flat arrays + nested array
+        let result1 = lookuper
+            .lookup(&make_key_with_field_count(1, 4))
+            .await
+            .expect("lookup row1");
+        let r1 = result1
+            .get_single_row()
+            .expect("get row1")
+            .expect("row1 should exist");
+        assert_eq!(r1.get_int(0).unwrap(), 1);
+        let tags_r1 = r1.get_array(1).unwrap();
+        assert_eq!(tags_r1.size(), 2);
+        assert_eq!(tags_r1.get_string(0).unwrap(), "hello");
+        assert_eq!(tags_r1.get_string(1).unwrap(), "world");
+        let scores_r1 = r1.get_array(2).unwrap();
+        assert_eq!(scores_r1.size(), 3);
+        assert_eq!(scores_r1.get_int(0).unwrap(), 10);
+        assert_eq!(scores_r1.get_int(1).unwrap(), 20);
+        assert_eq!(scores_r1.get_int(2).unwrap(), 30);
+        let matrix_r1: FlussArray = r1.get_array(3).unwrap();
+        assert_eq!(matrix_r1.size(), 2);
+        let mr1_0 = matrix_r1.get_array(0).unwrap();
+        assert_eq!(mr1_0.size(), 2);
+        assert_eq!(mr1_0.get_int(0).unwrap(), 1);
+        assert_eq!(mr1_0.get_int(1).unwrap(), 2);
+        let mr1_1 = matrix_r1.get_array(1).unwrap();
+        assert_eq!(mr1_1.size(), 2);
+        assert_eq!(mr1_1.get_int(0).unwrap(), 3);
+        assert_eq!(mr1_1.get_int(1).unwrap(), 4);
+
+        // Verify row 2: null element in array, empty array, null nested column
+        let result2 = lookuper
+            .lookup(&make_key_with_field_count(2, 4))
+            .await
+            .expect("lookup row2");
+        let r2 = result2
+            .get_single_row()
+            .expect("get row2")
+            .expect("row2 should exist");
+        assert_eq!(r2.get_int(0).unwrap(), 2);
+        let tags_r2 = r2.get_array(1).unwrap();
+        assert_eq!(tags_r2.size(), 1);
+        assert!(tags_r2.is_null_at(0));
+        let scores_r2 = r2.get_array(2).unwrap();
+        assert_eq!(scores_r2.size(), 0);
+        assert!(r2.is_null_at(3).unwrap());
+
+        // Verify row 3: null flat column, nested array with mixed inner (value, null, empty)
+        let result3 = lookuper
+            .lookup(&make_key_with_field_count(3, 4))
+            .await
+            .expect("lookup row3");
+        let r3 = result3
+            .get_single_row()
+            .expect("get row3")
+            .expect("row3 should exist");
+        assert_eq!(r3.get_int(0).unwrap(), 3);
+        assert!(r3.is_null_at(1).unwrap());
+        let scores_r3 = r3.get_array(2).unwrap();
+        assert_eq!(scores_r3.size(), 1);
+        assert_eq!(scores_r3.get_int(0).unwrap(), 42);
+        let matrix_r3 = r3.get_array(3).unwrap();
+        assert_eq!(matrix_r3.size(), 3);
+        let mr3_0 = matrix_r3.get_array(0).unwrap();
+        assert_eq!(mr3_0.size(), 1);
+        assert_eq!(mr3_0.get_int(0).unwrap(), 5);
+        assert!(matrix_r3.is_null_at(1));
+        let mr3_2 = matrix_r3.get_array(2).unwrap();
+        assert_eq!(mr3_2.size(), 0);
 
         admin
             .drop_table(&table_path, false)
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index d10834e87e..1a6b514b81 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -18,7 +18,9 @@
 
 #[cfg(test)]
 mod table_test {
-    use crate::integration::utils::{create_partitions, create_table, get_shared_cluster};
+    use crate::integration::utils::{
+        create_partitions, create_table, get_shared_cluster, make_int_array, make_string_array,
+    };
     use arrow::array::record_batch;
     use fluss::client::{EARLIEST_OFFSET, FlussTable, TableScan};
     use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
@@ -658,6 +660,7 @@ mod table_test {
                         "col_timestamp_ltz_ns_neg",
                         DataTypes::timestamp_ltz_with_precision(9),
                     )
+                    .column("col_array", DataTypes::array(DataTypes::string()))
                     .build()
                     .expect("Failed to build schema"),
             )
@@ -719,6 +722,8 @@ mod table_test {
         let col_timestamp_ltz_ns_neg =
             TimestampLtz::from_millis_nanos(-301234154877, 999_999).unwrap();
 
+        let col_array = make_string_array(&[Some("fluss"), Some("rust")]);
+
         // Append a row with all datatypes
         let mut row = GenericRow::new(field_count);
         row.set_field(0, col_tinyint);
@@ -750,6 +755,7 @@ mod table_test {
         row.set_field(26, col_timestamp_ns_neg);
         row.set_field(27, col_timestamp_ltz_us_neg);
         row.set_field(28, col_timestamp_ltz_ns_neg);
+        row.set_field(29, col_array);
 
         append_writer
             .append(&row)
@@ -994,6 +1000,11 @@ mod table_test {
             "col_timestamp_ltz_ns_neg nanos mismatch"
         );
 
+        let arr = found_row.get_array(29).unwrap();
+        assert_eq!(arr.size(), 2, "col_array size mismatch");
+        assert_eq!(arr.get_string(0).unwrap(), "fluss", "col_array[0] mismatch");
+        assert_eq!(arr.get_string(1).unwrap(), "rust", "col_array[1] mismatch");
+
         // Verify row with all nulls (record index 1)
         let found_row_nulls = records[1].row();
         for i in 0..field_count {
@@ -1373,4 +1384,430 @@ mod table_test {
             .await
             .expect("Failed to drop table");
     }
+
+    #[tokio::test]
+    async fn append_and_scan_with_array() {
+        use fluss::row::binary_array::FlussArrayWriter;
+        use fluss::row::{Datum, FlussArray, GenericRow};
+
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_log_arrays");
+        let inner_array_type = DataTypes::array(DataTypes::int());
+
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("tags", DataTypes::array(DataTypes::string()))
+            .column("scores", DataTypes::array(DataTypes::int()))
+            .column("matrix", DataTypes::array(inner_array_type.clone()))
+            .build()
+            .expect("Failed to build schema");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(schema)
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        // Row 1: id=1, tags=["hello", "world"], scores=[10, 20, 30], matrix=[[1,2],[3,4]]
+        let mut row1 = GenericRow::new(4);
+        row1.set_field(0, 1_i32);
+        row1.set_field(1, make_string_array(&[Some("hello"), Some("world")]));
+        row1.set_field(2, make_int_array(&[Some(10), Some(20), Some(30)]));
+        let m1 = {
+            let mut w = FlussArrayWriter::new(2, &inner_array_type);
+            w.write_array(0, &make_int_array(&[Some(1), Some(2)]));
+            w.write_array(1, &make_int_array(&[Some(3), Some(4)]));
+            w.complete().expect("matrix1")
+        };
+        row1.set_field(3, m1);
+
+        // Row 2: id=2, tags=[null], scores=[], matrix=[[5], null, []]
+        let mut row2 = GenericRow::new(4);
+        row2.set_field(0, 2_i32);
+        row2.set_field(1, make_string_array(&[None]));
+        row2.set_field(2, make_int_array(&[]));
+        let m2 = {
+            let mut w = FlussArrayWriter::new(3, &inner_array_type);
+            w.write_array(0, &make_int_array(&[Some(5)]));
+            w.set_null_at(1);
+            w.write_array(2, &make_int_array(&[]));
+            w.complete().expect("matrix2")
+        };
+        row2.set_field(3, m2);
+
+        // Row 3: id=3, tags=null, scores=[42], matrix=null
+        let mut row3 = GenericRow::new(4);
+        row3.set_field(0, 3_i32);
+        row3.set_field(1, Datum::Null);
+        row3.set_field(2, make_int_array(&[Some(42)]));
+        row3.set_field(3, Datum::Null);
+
+        append_writer.append(&row1).expect("append row1");
+        append_writer.append(&row2).expect("append row2");
+        append_writer.append(&row3).expect("append row3");
+        append_writer.flush().await.expect("Failed to flush");
+
+        let records = scan_table(&table, |scan| scan).await;
+        assert_eq!(records.len(), 3, "expected three log records");
+
+        // Verify row 1: populated flat arrays + nested array
+        let r0 = records[0].row();
+        assert_eq!(r0.get_int(0).unwrap(), 1);
+        let tags_r0 = r0.get_array(1).unwrap();
+        assert_eq!(tags_r0.size(), 2);
+        assert_eq!(tags_r0.get_string(0).unwrap(), "hello");
+        assert_eq!(tags_r0.get_string(1).unwrap(), "world");
+        let scores_r0 = r0.get_array(2).unwrap();
+        assert_eq!(scores_r0.size(), 3);
+        assert_eq!(scores_r0.get_int(0).unwrap(), 10);
+        assert_eq!(scores_r0.get_int(1).unwrap(), 20);
+        assert_eq!(scores_r0.get_int(2).unwrap(), 30);
+        let matrix_r0: FlussArray = r0.get_array(3).unwrap();
+        assert_eq!(matrix_r0.size(), 2);
+        let mr0_0 = matrix_r0.get_array(0).unwrap();
+        assert_eq!(mr0_0.size(), 2);
+        assert_eq!(mr0_0.get_int(0).unwrap(), 1);
+        assert_eq!(mr0_0.get_int(1).unwrap(), 2);
+        let mr0_1 = matrix_r0.get_array(1).unwrap();
+        assert_eq!(mr0_1.size(), 2);
+        assert_eq!(mr0_1.get_int(0).unwrap(), 3);
+        assert_eq!(mr0_1.get_int(1).unwrap(), 4);
+
+        // Verify row 2: null element, empty array, nested array mixing filled/null/empty inners
+        let r1 = records[1].row();
+        assert_eq!(r1.get_int(0).unwrap(), 2);
+        let tags_r1 = r1.get_array(1).unwrap();
+        assert_eq!(tags_r1.size(), 1);
+        assert!(tags_r1.is_null_at(0));
+        let scores_r1 = r1.get_array(2).unwrap();
+        assert_eq!(scores_r1.size(), 0);
+        let matrix_r1 = r1.get_array(3).unwrap();
+        assert_eq!(matrix_r1.size(), 3);
+        let mr1_0 = matrix_r1.get_array(0).unwrap();
+        assert_eq!(mr1_0.size(), 1);
+        assert_eq!(mr1_0.get_int(0).unwrap(), 5);
+        assert!(matrix_r1.is_null_at(1));
+        let mr1_2 = matrix_r1.get_array(2).unwrap();
+        assert_eq!(mr1_2.size(), 0);
+
+        // Verify row 3: null flat column, null nested column
+        let r2 = records[2].row();
+        assert_eq!(r2.get_int(0).unwrap(), 3);
+        assert!(r2.is_null_at(1).unwrap());
+        let scores_r2 = r2.get_array(2).unwrap();
+        assert_eq!(scores_r2.size(), 1);
+        assert_eq!(scores_r2.get_int(0).unwrap(), 42);
+        assert!(r2.is_null_at(3).unwrap());
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn append_and_scan_with_array_rich_types() {
+        use fluss::row::binary_array::FlussArrayWriter;
+        use fluss::row::{Date, Decimal, FlussArray, GenericRow, Time, TimestampNtz};
+
+        fn assert_f32_special(actual: f32, expected: f32) {
+            if expected.is_nan() {
+                assert!(actual.is_nan(), "expected NaN");
+            } else if expected.is_infinite() {
+                assert!(actual.is_infinite());
+                assert_eq!(actual.signum(), expected.signum());
+            } else {
+                assert!((actual - expected).abs() < f32::EPSILON);
+            }
+        }
+
+        fn assert_f64_special(actual: f64, expected: f64) {
+            if expected.is_nan() {
+                assert!(actual.is_nan(), "expected NaN");
+            } else if expected.is_infinite() {
+                assert!(actual.is_infinite());
+                assert_eq!(actual.signum(), expected.signum());
+            } else {
+                assert!((actual - expected).abs() < f64::EPSILON);
+            }
+        }
+
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_log_arrays_rich_types");
+
+        // DECIMAL(10,2) is compact (precision<=18); TIMESTAMP(6) is micros, above the <=3 cutoff
+        let dec_compact = Decimal::from_unscaled_long(12345, 10, 2).unwrap();
+        let ts_compact = TimestampNtz::from_millis_nanos(1769163227123, 456000).unwrap();
+
+        // Non-compact types: DECIMAL(22,5) precision>18, TIMESTAMP(9) precision>3
+        let dec_big = Decimal::from_unscaled_bytes(&[66, 237, 18, 59, 11, 216, 31, 4, 244], 22, 5)
+            .expect("big decimal");
+        let ts_nano = TimestampNtz::from_millis_nanos(1769163227123, 999_999).unwrap();
+
+        let d = Date::new(20476);
+        let t = Time::new(36827123);
+        let elem_bytes = &[0_u8, 1, 2, 255];
+        let fixed_a: Vec<u8> = vec![0xDE, 0xAD, 0xBE, 0xEF];
+        let fixed_b: Vec<u8> = vec![0x01, 0x02, 0x03, 0x04];
+
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("arr_bytes", DataTypes::array(DataTypes::bytes()))
+            .column("arr_date", DataTypes::array(DataTypes::date()))
+            .column(
+                "arr_time",
+                DataTypes::array(DataTypes::time_with_precision(3)),
+            )
+            .column(
+                "arr_ts_compact",
+                DataTypes::array(DataTypes::timestamp_with_precision(6)),
+            )
+            .column(
+                "arr_ts_nano",
+                DataTypes::array(DataTypes::timestamp_with_precision(9)),
+            )
+            .column(
+                "arr_decimal_compact",
+                DataTypes::array(DataTypes::decimal(10, 2)),
+            )
+            .column(
+                "arr_decimal_big",
+                DataTypes::array(DataTypes::decimal(22, 5)),
+            )
+            .column("arr_long_str", DataTypes::array(DataTypes::string()))
+            .column("arr_float", DataTypes::array(DataTypes::float()))
+            .column("arr_double", DataTypes::array(DataTypes::double()))
+            .column("arr_binary", DataTypes::array(DataTypes::binary(4)))
+            .build()
+            .expect("Failed to build schema");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(schema)
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let mut row = GenericRow::new(12);
+        row.set_field(0, 1_i32);
+
+        // col 1: arr_bytes — binary with null element
+        let arr_bytes = {
+            let mut w = FlussArrayWriter::new(2, &DataTypes::bytes());
+            w.write_binary_bytes(0, elem_bytes);
+            w.set_null_at(1);
+            w.complete().expect("arr_bytes")
+        };
+        row.set_field(1, arr_bytes);
+
+        // col 2: arr_date
+        let arr_date = {
+            let mut w = FlussArrayWriter::new(2, &DataTypes::date());
+            w.write_date(0, d);
+            w.set_null_at(1);
+            w.complete().expect("arr_date")
+        };
+        row.set_field(2, arr_date);
+
+        // col 3: arr_time
+        let arr_time = {
+            let mut w = FlussArrayWriter::new(2, &DataTypes::time_with_precision(3));
+            w.write_time(0, t);
+            w.set_null_at(1);
+            w.complete().expect("arr_time")
+        };
+        row.set_field(3, arr_time);
+
+        // col 4: arr_ts_compact — microsecond timestamp (precision 6, millis+nanos)
+        let arr_ts_compact = {
+            let mut w = FlussArrayWriter::new(2, &DataTypes::timestamp_with_precision(6));
+            w.write_timestamp_ntz(0, &ts_compact, 6);
+            w.set_null_at(1);
+            w.complete().expect("arr_ts_compact")
+        };
+        row.set_field(4, arr_ts_compact);
+
+        // col 5: arr_ts_nano — non-compact timestamp (precision 9)
+        let arr_ts_nano = {
+            let mut w = FlussArrayWriter::new(1, &DataTypes::timestamp_with_precision(9));
+            w.write_timestamp_ntz(0, &ts_nano, 9);
+            w.complete().expect("arr_ts_nano")
+        };
+        row.set_field(5, arr_ts_nano);
+
+        // col 6: arr_decimal_compact — compact decimal (precision 10)
+        let arr_decimal_compact = {
+            let mut w = FlussArrayWriter::new(2, &DataTypes::decimal(10, 2));
+            w.write_decimal(0, &dec_compact, 10);
+            w.set_null_at(1);
+            w.complete().expect("arr_decimal_compact")
+        };
+        row.set_field(6, arr_decimal_compact);
+
+        // col 7: arr_decimal_big — non-compact decimal (precision 22)
+        let arr_decimal_big = {
+            let mut w = FlussArrayWriter::new(1, &DataTypes::decimal(22, 5));
+            w.write_decimal(0, &dec_big, 22);
+            w.complete().expect("arr_decimal_big")
+        };
+        row.set_field(7, arr_decimal_big);
+
+        // col 8: arr_long_str — heap-backed strings (>= 8 bytes)
+        let arr_long_str = {
+            let mut w = FlussArrayWriter::new(2, &DataTypes::string());
+            w.write_string(0, "abcdefghi");
+            w.write_string(1, "longstring_here");
+            w.complete().expect("arr_long_str")
+        };
+        row.set_field(8, arr_long_str);
+
+        // col 9: arr_float — IEEE 754 specials
+        let arr_float = {
+            let mut w = FlussArrayWriter::new(3, &DataTypes::float());
+            w.write_float(0, f32::NAN);
+            w.write_float(1, f32::INFINITY);
+            w.write_float(2, f32::NEG_INFINITY);
+            w.complete().expect("arr_float")
+        };
+        row.set_field(9, arr_float);
+
+        // col 10: arr_double — IEEE 754 specials
+        let arr_double = {
+            let mut w = FlussArrayWriter::new(3, &DataTypes::double());
+            w.write_double(0, f64::NAN);
+            w.write_double(1, f64::INFINITY);
+            w.write_double(2, f64::NEG_INFINITY);
+            w.complete().expect("arr_double")
+        };
+        row.set_field(10, arr_double);
+
+        // col 11: arr_binary — fixed-size binary(4)
+        let arr_binary = {
+            let mut w = FlussArrayWriter::new(2, &DataTypes::binary(4));
+            w.write_binary_bytes(0, &fixed_a);
+            w.write_binary_bytes(1, &fixed_b);
+            w.complete().expect("arr_binary")
+        };
+        row.set_field(11, arr_binary);
+
+        append_writer.append(&row).expect("append");
+        append_writer.flush().await.expect("Failed to flush");
+
+        let records = scan_table(&table, |scan| scan).await;
+        assert_eq!(records.len(), 1);
+        let r = records[0].row();
+
+        // Verify arr_bytes
+        let ab = r.get_array(1).unwrap();
+        assert_eq!(ab.size(), 2);
+        assert_eq!(ab.get_binary(0).unwrap(), elem_bytes);
+        assert!(ab.is_null_at(1));
+
+        // Verify arr_date
+        let ad = r.get_array(2).unwrap();
+        assert_eq!(ad.size(), 2);
+        assert_eq!(ad.get_date(0).unwrap().get_inner(), d.get_inner());
+        assert!(ad.is_null_at(1));
+
+        // Verify arr_time
+        let at = r.get_array(3).unwrap();
+        assert_eq!(at.size(), 2);
+        assert_eq!(at.get_time(0).unwrap().get_inner(), t.get_inner());
+        assert!(at.is_null_at(1));
+
+        // Verify arr_ts_compact
+        let ats = r.get_array(4).unwrap();
+        assert_eq!(ats.size(), 2);
+        let read_ts_compact = ats.get_timestamp_ntz(0, 6).unwrap();
+        assert_eq!(
+            read_ts_compact.get_millisecond(),
+            ts_compact.get_millisecond()
+        );
+        assert_eq!(
+            read_ts_compact.get_nano_of_millisecond(),
+            ts_compact.get_nano_of_millisecond()
+        );
+        assert!(ats.is_null_at(1));
+
+        // Verify arr_ts_nano
+        let ats_nano = r.get_array(5).unwrap();
+        assert_eq!(ats_nano.size(), 1);
+        let read_ts_nano = ats_nano.get_timestamp_ntz(0, 9).unwrap();
+        assert_eq!(read_ts_nano.get_millisecond(), ts_nano.get_millisecond());
+        assert_eq!(
+            read_ts_nano.get_nano_of_millisecond(),
+            ts_nano.get_nano_of_millisecond()
+        );
+
+        // Verify arr_decimal_compact
+        let adc = r.get_array(6).unwrap();
+        assert_eq!(adc.size(), 2);
+        assert_eq!(adc.get_decimal(0, 10, 2).unwrap(), dec_compact);
+        assert!(adc.is_null_at(1));
+
+        // Verify arr_decimal_big
+        let adb = r.get_array(7).unwrap();
+        assert_eq!(adb.size(), 1);
+        assert_eq!(adb.get_decimal(0, 22, 5).unwrap(), dec_big);
+
+        // Verify arr_long_str
+        let als = r.get_array(8).unwrap();
+        assert_eq!(als.size(), 2);
+        assert_eq!(als.get_string(0).unwrap(), "abcdefghi");
+        assert_eq!(als.get_string(1).unwrap(), "longstring_here");
+
+        // Verify arr_float — IEEE 754 specials
+        let af = r.get_array(9).unwrap();
+        assert_eq!(af.size(), 3);
+        assert_f32_special(af.get_float(0).unwrap(), f32::NAN);
+        assert_f32_special(af.get_float(1).unwrap(), f32::INFINITY);
+        assert_f32_special(af.get_float(2).unwrap(), f32::NEG_INFINITY);
+
+        // Verify arr_double — IEEE 754 specials
+        let adbl = r.get_array(10).unwrap();
+        assert_eq!(adbl.size(), 3);
+        assert_f64_special(adbl.get_double(0).unwrap(), f64::NAN);
+        assert_f64_special(adbl.get_double(1).unwrap(), f64::INFINITY);
+        assert_f64_special(adbl.get_double(2).unwrap(), f64::NEG_INFINITY);
+
+        // Verify arr_binary — fixed-size binary(4)
+        let fb: FlussArray = r.get_array(11).unwrap();
+        assert_eq!(fb.size(), 2);
+        assert_eq!(fb.get_binary(0).unwrap(), fixed_a.as_slice());
+        assert_eq!(fb.get_binary(1).unwrap(), fixed_b.as_slice());
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index dc2876f899..81a7c0b107 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -17,7 +17,9 @@
  */
 use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
 use fluss::client::FlussAdmin;
-use fluss::metadata::{PartitionSpec, TableDescriptor, TablePath};
+use fluss::metadata::{DataTypes, PartitionSpec, TableDescriptor, TablePath};
+use fluss::row::FlussArray;
+use fluss::row::binary_array::FlussArrayWriter;
 use std::collections::HashMap;
 use std::sync::Arc;
 use std::sync::LazyLock;
@@ -94,6 +96,28 @@ pub async fn create_table(
         .expect("Failed to create table");
 }
 
+pub fn make_string_array(values: &[Option<&str>]) -> FlussArray {
+    let mut writer = FlussArrayWriter::new(values.len(), &DataTypes::string());
+    for (idx, value) in values.iter().enumerate() {
+        match value {
+            Some(v) => writer.write_string(idx, v),
+            None => writer.set_null_at(idx),
+        }
+    }
+    writer.complete().expect("Failed to build string array")
+}
+
+pub fn make_int_array(values: &[Option<i32>]) -> FlussArray {
+    let mut writer = FlussArrayWriter::new(values.len(), &DataTypes::int());
+    for (idx, value) in values.iter().enumerate() {
+        match value {
+            Some(v) => writer.write_int(idx, *v),
+            None => writer.set_null_at(idx),
+        }
+    }
+    writer.complete().expect("Failed to build int array")
+}
+
 /// Similar to wait_for_cluster_ready but connects with SASL credentials.
 pub async fn wait_for_cluster_ready_with_sasl(cluster: &FlussTestingCluster) {
     let timeout = Duration::from_secs(30);

From 9704b0c549ffaba039f0d0ad28c8e6e7f636e782 Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sun, 10 May 2026 15:11:40 +0200
Subject: [PATCH 264/287] [python] Add prefix lookup support in python (#540)

* add prefix lookup support in python

* add more tests
---
 fluss-rust/bindings/python/fluss/__init__.pyi |  55 ++++++-
 fluss-rust/bindings/python/src/lib.rs         |   2 +
 fluss-rust/bindings/python/src/lookup.rs      |  99 ++++++++++++
 fluss-rust/bindings/python/src/table.rs       |  47 ++++++
 .../bindings/python/test/test_kv_table.py     | 146 ++++++++++++++++--
 .../docs/user-guide/python/api-reference.md   |  23 ++-
 6 files changed, 350 insertions(+), 22 deletions(-)

diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 5a59ea513e..18095c01bc 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -582,15 +582,43 @@ class TableUpsert:
     def __repr__(self) -> str: ...
 
 class TableLookup:
-    """Builder for creating a Lookuper.
+    """Builder for creating a Lookuper or PrefixLookuper.
 
-    Obtain via `FlussTable.new_lookup()`, then call `create_lookuper()`.
+    Obtain via `FlussTable.new_lookup()`, then call `create_lookuper()`
+    for primary key lookup, or `lookup_by(columns).create_lookuper()`
+    for prefix key lookup.
 
     Example:
         lookuper = table.new_lookup().create_lookuper()
+        prefix_lookuper = table.new_lookup().lookup_by(["a", "b"]).create_lookuper()
     """
 
     def create_lookuper(self) -> Lookuper: ...
+    def lookup_by(self, column_names: List[str]) -> "TablePrefixLookup":
+        """Switch to prefix-scan mode for the given lookup columns.
+
+        The columns must be the table's partition keys (if any) plus the
+        bucket keys, in that order.
+
+        Args:
+            column_names: List of column names forming the prefix key.
+
+        Returns:
+            TablePrefixLookup builder. Call `create_lookuper()` to get a PrefixLookuper.
+        """
+        ...
+    def __repr__(self) -> str: ...
+
+class TablePrefixLookup:
+    """Builder for creating a PrefixLookuper.
+
+    Obtain via `TableLookup.lookup_by(columns)`, then call `create_lookuper()`.
+
+    Example:
+        prefix_lookuper = table.new_lookup().lookup_by(["a", "b"]).create_lookuper()
+    """
+
+    def create_lookuper(self) -> "PrefixLookuper": ...
     def __repr__(self) -> str: ...
 
 class AppendWriter:
@@ -729,6 +757,29 @@ class Lookuper:
         ...
     def __repr__(self) -> str: ...
 
+class PrefixLookuper:
+    """Lookuper for performing prefix key lookups on a Fluss table.
+
+    Returns all rows whose primary key starts with the given prefix.
+    Create via `table.new_lookup().lookup_by(columns).create_lookuper()`.
+    """
+
+    async def lookup(self, prefix: dict | list | tuple) -> List[Dict[str, object]]:
+        """Lookup all rows matching a prefix key.
+
+        Args:
+            prefix: A dict, list, or tuple containing only the prefix key values
+                (the columns specified in lookup_by()).
+                For dict: keys are prefix column names.
+                For list/tuple: values in prefix column order.
+
+        Returns:
+            A list of dicts, each containing the full row data.
+            Empty list if no matches.
+        """
+        ...
+    def __repr__(self) -> str: ...
+
 class LogScanner:
     """Scanner for reading log data from a Fluss table.
 
diff --git a/fluss-rust/bindings/python/src/lib.rs b/fluss-rust/bindings/python/src/lib.rs
index 6890e08879..2d71491a7a 100644
--- a/fluss-rust/bindings/python/src/lib.rs
+++ b/fluss-rust/bindings/python/src/lib.rs
@@ -113,9 +113,11 @@ fn _fluss(m: &Bound<'_, PyModule>) -> PyResult<()> {
     m.add_class::<TableAppend>()?;
     m.add_class::<TableUpsert>()?;
     m.add_class::<TableLookup>()?;
+    m.add_class::<TablePrefixLookup>()?;
     m.add_class::<AppendWriter>()?;
     m.add_class::<UpsertWriter>()?;
     m.add_class::<Lookuper>()?;
+    m.add_class::<PrefixLookuper>()?;
     m.add_class::<Schema>()?;
     m.add_class::<LogScanner>()?;
     m.add_class::<LakeSnapshot>()?;
diff --git a/fluss-rust/bindings/python/src/lookup.rs b/fluss-rust/bindings/python/src/lookup.rs
index f7bd09a505..196faa1e81 100644
--- a/fluss-rust/bindings/python/src/lookup.rs
+++ b/fluss-rust/bindings/python/src/lookup.rs
@@ -113,3 +113,102 @@ impl Lookuper {
         })
     }
 }
+
+/// Lookuper for performing prefix key lookups on a Fluss table.
+///
+/// Returns all rows whose primary key starts with the given prefix.
+/// Create once via `table.new_lookup().lookup_by(columns).create_lookuper()`
+/// and reuse for multiple lookups.
+#[pyclass]
+pub struct PrefixLookuper {
+    inner: Arc<Mutex<fcore::client::PrefixKeyLookuper>>,
+    table_info: Arc<fcore::metadata::TableInfo>,
+    lookup_column_indices: Vec<usize>,
+}
+
+#[pymethods]
+impl PrefixLookuper {
+    /// Lookup all rows matching a prefix key.
+    ///
+    /// Args:
+    ///     prefix: A dict, list, or tuple containing only the prefix key values
+    ///         (the columns specified in lookup_by()).
+    ///         For dict: keys are prefix column names.
+    ///         For list/tuple: values in prefix column order.
+    ///
+    /// Returns:
+    ///     A list of dicts, each containing the full row data. Empty list if no matches.
+    pub fn lookup<'py>(
+        &self,
+        py: Python<'py>,
+        prefix: &Bound<'_, PyAny>,
+    ) -> PyResult<Bound<'py, PyAny>> {
+        let generic_row =
+            python_to_dense_generic_row(prefix, &self.table_info, &self.lookup_column_indices)?;
+        let inner = self.inner.clone();
+        let table_info = self.table_info.clone();
+
+        future_into_py(py, async move {
+            let result = {
+                let mut lookuper = inner.lock().await;
+                lookuper
+                    .lookup(&generic_row)
+                    .await
+                    .map_err(|e| FlussError::from_core_error(&e))?
+            };
+
+            let rows = result
+                .get_rows()
+                .map_err(|e| FlussError::from_core_error(&e))?;
+
+            Python::attach(|py| {
+                let py_rows: Vec<Py<PyAny>> = rows
+                    .iter()
+                    .map(|row| internal_row_to_dict(py, row, &table_info))
+                    .collect::<PyResult<_>>()?;
+                Ok(py_rows)
+            })
+        })
+    }
+
+    fn __repr__(&self) -> String {
+        "PrefixLookuper()".to_string()
+    }
+}
+
+impl PrefixLookuper {
+    pub fn new(
+        connection: &Arc<fcore::client::FlussConnection>,
+        metadata: Arc<fcore::client::Metadata>,
+        table_info: fcore::metadata::TableInfo,
+        lookup_column_names: Vec<String>,
+    ) -> PyResult<Self> {
+        let row_type = table_info.row_type();
+        let lookup_column_indices: Vec<usize> = lookup_column_names
+            .iter()
+            .map(|name| {
+                row_type.get_field_index(name).ok_or_else(|| {
+                    FlussError::new_err(format!("Unknown column name '{name}' for prefix lookup"))
+                })
+            })
+            .collect::<PyResult<_>>()?;
+
+        let lookuper = TOKIO_RUNTIME.block_on(async {
+            let fluss_table =
+                fcore::client::FlussTable::new(connection, metadata, table_info.clone());
+            let table_lookup = fluss_table
+                .new_lookup()
+                .map_err(|e| FlussError::from_core_error(&e))?;
+            table_lookup
+                .lookup_by(lookup_column_names)
+                .create_lookuper()
+                .map_err(|e| FlussError::from_core_error(&e))
+        })?;
+
+        Ok(Self {
+            inner: Arc::new(Mutex::new(lookuper)),
+            table_info: Arc::new(table_info),
+            lookup_column_indices,
+        })
+    }
+}
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 98aee5e3c6..4ec7b8d77e 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -888,11 +888,58 @@ impl TableLookup {
         )
     }
 
+    /// Switch to prefix-scan mode for the given lookup columns.
+    ///
+    /// The columns must be the table's partition keys (if any) plus the
+    /// bucket keys, in that order.
+    ///
+    /// Args:
+    ///     column_names: List of column names forming the prefix key.
+    ///
+    /// Returns:
+    ///     TablePrefixLookup builder. Call `create_lookuper()` to get a PrefixLookuper.
+    pub fn lookup_by(&self, column_names: Vec<String>) -> TablePrefixLookup {
+        TablePrefixLookup {
+            connection: self.connection.clone(),
+            metadata: self.metadata.clone(),
+            table_info: self.table_info.clone(),
+            lookup_column_names: column_names,
+        }
+    }
+
     fn __repr__(&self) -> String {
         "TableLookup()".to_string()
     }
 }
 
+/// Builder for creating a PrefixLookuper.
+///
+/// Obtain via `TableLookup.lookup_by(columns)`, then call `create_lookuper()`.
+#[pyclass]
+pub struct TablePrefixLookup {
+    connection: Arc<fcore::client::FlussConnection>,
+    metadata: Arc<fcore::client::Metadata>,
+    table_info: fcore::metadata::TableInfo,
+    lookup_column_names: Vec<String>,
+}
+
+#[pymethods]
+impl TablePrefixLookup {
+    /// Create a PrefixLookuper from this builder.
+    pub fn create_lookuper(&self) -> PyResult<crate::PrefixLookuper> {
+        crate::PrefixLookuper::new(
+            &self.connection,
+            self.metadata.clone(),
+            self.table_info.clone(),
+            self.lookup_column_names.clone(),
+        )
+    }
+
+    fn __repr__(&self) -> String {
+        "TablePrefixLookup()".to_string()
+    }
+}
+
 /// Writer for appending data to a Fluss table
 #[pyclass]
 pub struct AppendWriter {
diff --git a/fluss-rust/bindings/python/test/test_kv_table.py b/fluss-rust/bindings/python/test/test_kv_table.py
index a17b0ad30c..f3cddf8c3d 100644
--- a/fluss-rust/bindings/python/test/test_kv_table.py
+++ b/fluss-rust/bindings/python/test/test_kv_table.py
@@ -26,6 +26,7 @@
 from decimal import Decimal
 
 import pyarrow as pa
+import pytest
 
 import fluss
 
@@ -108,7 +109,7 @@ async def test_upsert_delete_and_lookup(connection, admin):
 
 
 async def test_composite_primary_keys(connection, admin):
-    """Test upsert and lookup with composite (multi-column) primary keys."""
+    """Test upsert/lookup with composite PKs, including prefix lookup."""
     table_path = fluss.TablePath("fluss", "py_test_composite_pk")
     await admin.drop_table(table_path, ignore_if_not_exists=True)
 
@@ -120,47 +121,79 @@ async def test_composite_primary_keys(connection, admin):
                 pa.field("region", pa.string()),
                 pa.field("score", pa.int64()),
                 pa.field("user_id", pa.int32()),
+                pa.field("event_id", pa.int64()),
             ]
         ),
-        primary_keys=["region", "user_id"],
+        primary_keys=["region", "user_id", "event_id"],
+    )
+    table_descriptor = fluss.TableDescriptor(
+        schema, bucket_count=3, bucket_keys=["region", "user_id"]
     )
-    table_descriptor = fluss.TableDescriptor(schema)
     await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
 
     table = await connection.get_table(table_path)
     upsert_writer = table.new_upsert().create_writer()
 
     test_data = [
-        ("US", 1, 100),
-        ("US", 2, 200),
-        ("EU", 1, 150),
-        ("EU", 2, 250),
+        ("US", 1, 1, 100),
+        ("US", 1, 2, 200),
+        ("US", 2, 1, 300),
+        ("EU", 1, 1, 150),
+        ("EU", 2, 1, 250),
     ]
 
-    for region, user_id, score in test_data:
-        upsert_writer.upsert({"region": region, "user_id": user_id, "score": score})
+    for region, user_id, event_id, score in test_data:
+        upsert_writer.upsert(
+            {
+                "region": region,
+                "user_id": user_id,
+                "event_id": event_id,
+                "score": score,
+            }
+        )
     await upsert_writer.flush()
 
     lookuper = table.new_lookup().create_lookuper()
 
-    # Lookup (US, 1) -> score 100
-    result = await lookuper.lookup({"region": "US", "user_id": 1})
+    # Lookup (US, 1, 1) -> score 100
+    result = await lookuper.lookup({"region": "US", "user_id": 1, "event_id": 1})
     assert result is not None
     assert result["score"] == 100
 
-    # Lookup (EU, 2) -> score 250
-    result = await lookuper.lookup({"region": "EU", "user_id": 2})
+    # Lookup (EU, 2, 1) -> score 250
+    result = await lookuper.lookup({"region": "EU", "user_id": 2, "event_id": 1})
     assert result is not None
     assert result["score"] == 250
 
-    # Update (US, 1) score (await acknowledgment)
-    handle = upsert_writer.upsert({"region": "US", "user_id": 1, "score": 500})
+    # Update (US, 1, 1) score (await acknowledgment)
+    handle = upsert_writer.upsert(
+        {"region": "US", "user_id": 1, "event_id": 1, "score": 500}
+    )
     await handle.wait()
 
-    result = await lookuper.lookup({"region": "US", "user_id": 1})
+    result = await lookuper.lookup({"region": "US", "user_id": 1, "event_id": 1})
     assert result is not None
     assert result["score"] == 500
 
+    prefix_lookuper = table.new_lookup().lookup_by(["region", "user_id"]).create_lookuper()
+
+    # Prefix (US, 1) should match 2 rows (event_id 1 and 2)
+    rows = await prefix_lookuper.lookup({"region": "US", "user_id": 1})
+    assert len(rows) == 2
+    event_ids = sorted(row["event_id"] for row in rows)
+    assert event_ids == [1, 2]
+
+    # Also validate list/tuple prefix input
+    rows = await prefix_lookuper.lookup(["US", 1])
+    assert len(rows) == 2
+    rows = await prefix_lookuper.lookup(("EU", 2))
+    assert len(rows) == 1
+    assert rows[0]["event_id"] == 1
+
+    # Validate empty-result case: valid prefix shape but no matching rows.
+    rows = await prefix_lookuper.lookup({"region": "APAC", "user_id": 999})
+    assert rows == []
+
     await admin.drop_table(table_path, ignore_if_not_exists=False)
 
 
@@ -604,3 +637,84 @@ async def test_all_supported_datatypes(connection, admin):
             assert result[col] is None, f"{col} should be null"
 
     await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_prefix_lookup_validation_errors(connection, admin):
+    """Test that prefix lookup raises errors for invalid column configurations."""
+    table_path = fluss.TablePath("fluss", "py_test_prefix_lookup_validation")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("a", pa.int32()),
+                pa.field("b", pa.string()),
+                pa.field("c", pa.int64()),
+            ]
+        ),
+        primary_keys=["a", "b", "c"],
+    )
+    table_descriptor = fluss.TableDescriptor(
+        schema, bucket_count=3, bucket_keys=["a", "b"]
+    )
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+
+    # lookup_by with columns equal to full PK should error
+    with pytest.raises(fluss.FlussError, match="prefix lookup"):
+        table.new_lookup().lookup_by(["a", "b", "c"]).create_lookuper()
+
+    # lookup_by with wrong column names should error
+    with pytest.raises(fluss.FlussError, match="bucket keys"):
+        table.new_lookup().lookup_by(["a", "c"]).create_lookuper()
+
+    # lookup_by with unknown column should error
+    with pytest.raises(fluss.FlussError, match="Unknown column name"):
+        table.new_lookup().lookup_by(["a", "missing_col"]).create_lookuper()
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+    # Partitioned table: lookup columns must include partition keys first,
+    # followed by bucket keys.
+    partitioned_table_path = fluss.TablePath("fluss", "py_test_prefix_lookup_validation_pt")
+    await admin.drop_table(partitioned_table_path, ignore_if_not_exists=True)
+
+    partitioned_schema = fluss.Schema(
+        pa.schema(
+            [
+                pa.field("region", pa.string()),
+                pa.field("user_id", pa.int32()),
+                pa.field("event_id", pa.int64()),
+            ]
+        ),
+        primary_keys=["region", "user_id", "event_id"],
+    )
+    partitioned_table_descriptor = fluss.TableDescriptor(
+        partitioned_schema,
+        partition_keys=["region"],
+        bucket_count=3,
+        bucket_keys=["user_id"],
+    )
+    await admin.create_table(
+        partitioned_table_path, partitioned_table_descriptor, ignore_if_exists=False
+    )
+
+    partitioned_table = await connection.get_table(partitioned_table_path)
+
+    # Missing partition key in lookup columns.
+    with pytest.raises(fluss.FlussError, match="partition fields"):
+        partitioned_table.new_lookup().lookup_by(["user_id"]).create_lookuper()
+
+    # A non-existent partition returns empty list.
+    partitioned_prefix_lookuper = (
+        partitioned_table.new_lookup().lookup_by(["region", "user_id"]).create_lookuper()
+    )
+    rows = await partitioned_prefix_lookuper.lookup({"region": "UNKNOWN_REGION", "user_id": 1})
+    assert rows == []
+
+    # After partition keys, remaining columns must equal bucket keys.
+    with pytest.raises(fluss.FlussError, match="bucket keys"):
+        partitioned_table.new_lookup().lookup_by(["region", "event_id"]).create_lookuper()
+
+    await admin.drop_table(partitioned_table_path, ignore_if_not_exists=False)
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index aec4412dbf..dc252b682c 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -117,11 +117,20 @@ Builder for creating an `UpsertWriter`. Obtain via `FlussTable.new_upsert()`.
 
 ## `TableLookup`
 
-Builder for creating a `Lookuper`. Obtain via `FlussTable.new_lookup()`.
+Builder for creating a `Lookuper` or `PrefixLookuper`. Obtain via `FlussTable.new_lookup()`.
 
-| Method                           |  Description        |
-|----------------------------------|---------------------|
-| `.create_lookuper() -> Lookuper` | Create the lookuper |
+| Method                                              |  Description                              |
+|-----------------------------------------------------|-------------------------------------------|
+| `.create_lookuper() -> Lookuper`                    | Create a primary key lookuper             |
+| `.lookup_by(column_names) -> TablePrefixLookup`     | Switch to prefix-scan mode for the given columns (partition keys + bucket keys) |
+
+## `TablePrefixLookup`
+
+Builder for creating a `PrefixLookuper`. Obtain via `TableLookup.lookup_by(columns)`.
+
+| Method                                     |  Description              |
+|--------------------------------------------|---------------------------|
+| `.create_lookuper() -> PrefixLookuper`     | Create the prefix lookuper |
 
 ## `AppendWriter`
 
@@ -153,6 +162,12 @@ Builder for creating a `Lookuper`. Obtain via `FlussTable.new_lookup()`.
 |-------------------------------------|-----------------------------|
 | `await .lookup(pk) -> dict \| None` | Lookup a row by primary key |
 
+## `PrefixLookuper`
+
+| Method                                        |  Description                                |
+|-----------------------------------------------|---------------------------------------------|
+| `await .lookup(prefix) -> list[dict]`         | Lookup all rows matching a prefix key       |
+
 ## `LogScanner`
 
 | Method                                                        |  Description                                                                     |

From 2a6f0a44c74dc99723dadab62d81fa822feb2096 Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Sun, 10 May 2026 21:13:52 +0200
Subject: [PATCH 265/287] capture cluster container logs as CI artifact (#542)

---
 .../.github/workflows/build_and_test_python.yml | 17 +++++++++++++++++
 fluss-rust/bindings/python/test/conftest.py     |  2 ++
 2 files changed, 19 insertions(+)

diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
index 93f2eedb52..a8d3f05b47 100644
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ b/fluss-rust/.github/workflows/build_and_test_python.yml
@@ -81,3 +81,20 @@ jobs:
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
+          FLUSS_SKIP_CLUSTER_TEARDOWN: "1"
+
+      - name: Dump fluss cluster container logs
+        if: always()
+        run: |
+          mkdir -p cluster-logs
+          for c in $(docker ps -a --filter "name=shared-test" --format '{{.Names}}'); do
+            docker logs "$c" > "cluster-logs/$c.log" 2>&1 || true
+          done
+
+      - uses: actions/upload-artifact@v4
+        if: always()
+        with:
+          name: cluster-logs-${{ matrix.python }}
+          path: cluster-logs/
+          if-no-files-found: ignore
+          retention-days: 3
diff --git a/fluss-rust/bindings/python/test/conftest.py b/fluss-rust/bindings/python/test/conftest.py
index 52773c9e86..8b2bc732b9 100644
--- a/fluss-rust/bindings/python/test/conftest.py
+++ b/fluss-rust/bindings/python/test/conftest.py
@@ -109,6 +109,8 @@ def pytest_unconfigure(config):
         return
     if hasattr(config, "workerinput"):
         return
+    if os.environ.get("FLUSS_SKIP_CLUSTER_TEARDOWN"):
+        return
     _stop_cluster()
 
 

From 4a2fdede6aa3a3e014b6d14251f2b7fdb4ba2d22 Mon Sep 17 00:00:00 2001
From: hemanthsavasere <hemanth.savasere@gmail.com>
Date: Sun, 15 Mar 2026 18:27:30 +0000
Subject: [PATCH 266/287] feat: add end-to-end ROW (nested struct) column
 serialization support

- Add `Datum::Row(Box<GenericRow>)` variant with `as_row()` accessor
- Add `get_row()` to `InternalRow` trait with default error impl
- Implement `GenericRow::get_row()` and `CompactedRow::get_row()` delegation
- Implement `ColumnarRow::get_row()` with Arrow StructArray extraction + OnceLock caching
- Add `InnerValueWriter::Row(RowType)` and write path via nested CompactedRowWriter
- Add `DataType::Row` arm in `CompactedRowDeserializer` for eager nested decode
- Add `InnerFieldGetter::Row` and hook up FieldGetter/ValueWriter pipeline
- Handle `Datum::Row` in `resolve_row_types` (C++ bindings)
- Add round-trip tests: simple nesting, deep nesting, nullable fields, ROW as primary key

Wire format matches Java: varint-length-prefixed blob of a complete CompactedRow.
---
 fluss-rust/bindings/cpp/src/types.rs          |   1 +
 .../fluss/src/row/binary/binary_writer.rs     |  25 +-
 fluss-rust/crates/fluss/src/row/column.rs     | 300 +++++++++++++++++-
 .../fluss/src/row/compacted/compacted_row.rs  |   4 +
 .../src/row/compacted/compacted_row_reader.rs | 151 +++++++++
 fluss-rust/crates/fluss/src/row/datum.rs      |  15 +
 .../src/row/encode/compacted_key_encoder.rs   |  48 ++-
 .../crates/fluss/src/row/field_getter.rs      |  12 +-
 fluss-rust/crates/fluss/src/row/mod.rs        |  19 +-
 9 files changed, 563 insertions(+), 12 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index f61711b502..19aa9a362f 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -529,6 +529,7 @@ pub fn resolve_row_types(
             Datum::TimestampNtz(ts) => Datum::TimestampNtz(*ts),
             Datum::TimestampLtz(ts) => Datum::TimestampLtz(*ts),
             Datum::Array(a) => Datum::Array(a.clone()),
+            Datum::Row(r) => Datum::Row(Box::new(resolve_row_types(r, None)?)),
         };
         out.set_field(idx, resolved);
     }
diff --git a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
index f51a6e80f1..fd7da4c9e5 100644
--- a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
@@ -17,7 +17,7 @@
 
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::DataType;
+use crate::metadata::{DataType, RowType};
 use crate::row::Datum;
 use crate::row::binary::BinaryRowFormat;
 
@@ -136,7 +136,7 @@ pub enum InnerValueWriter {
     TimestampNtz(u32), // precision
     TimestampLtz(u32), // precision
     Array,
-    // TODO Row
+    Row(RowType),
 }
 
 /// Accessor for writing the fields/elements of a binary writer during runtime, the
@@ -176,6 +176,7 @@ impl InnerValueWriter {
                 Ok(InnerValueWriter::TimestampLtz(t.precision()))
             }
             DataType::Array(_) => Ok(InnerValueWriter::Array),
+            DataType::Row(row_type) => Ok(InnerValueWriter::Row(row_type.clone())),
             _ => unimplemented!(
                 "ValueWriter for DataType {:?} is currently not implemented",
                 data_type
@@ -241,6 +242,26 @@ impl InnerValueWriter {
             (InnerValueWriter::Array, Datum::Array(arr)) => {
                 writer.write_array(arr.as_bytes());
             }
+            (InnerValueWriter::Row(row_type), Datum::Row(inner_row)) => {
+                use crate::row::compacted::CompactedRowWriter;
+                let mut nested = CompactedRowWriter::new(row_type.fields().len());
+                for (i, field) in row_type.fields().iter().enumerate() {
+                    let datum = &inner_row.values[i];
+                    if !datum.is_null() {
+                        // Propagate nested failures to the caller instead of panicking.
+                        InnerValueWriter::create_inner_value_writer(&field.data_type, None)?
+                            .write_value(&mut nested, i, datum)?;
+                    } else if field.data_type.is_nullable() {
+                        nested.set_null_at(i);
+                    } else {
+                        // Reject it: the field would be neither written nor marked null.
+                        return Err(IllegalArgument {
+                            message: format!("null value for non-nullable nested row field {i}"),
+                        });
+                    }
+                }
+                writer.write_bytes(nested.buffer());
+            }
             _ => {
                 return Err(IllegalArgument {
                     message: format!("{self:?} used to write value {value:?}"),
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index be5b850d80..95cd3395c2 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -17,8 +17,8 @@
 
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::row::InternalRow;
-use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
+use crate::row::{GenericRow, InternalRow};
+use crate::row::datum::{Date, Datum, Time, TimestampLtz, TimestampNtz};
 use arrow::array::{
     Array, AsArray, BinaryArray, BooleanArray, FixedSizeBinaryArray, ListArray, RecordBatch,
     StringArray,
@@ -35,25 +35,33 @@ use std::sync::Arc;
 pub struct ColumnarRow {
     record_batch: Arc<RecordBatch>,
     row_id: usize,
+    nested_rows: Vec<std::sync::OnceLock<GenericRow<'static>>>,
 }
 
 impl ColumnarRow {
     pub fn new(batch: Arc<RecordBatch>) -> Self {
+        let num_cols = batch.num_columns();
         ColumnarRow {
             record_batch: batch,
             row_id: 0,
+            nested_rows: (0..num_cols).map(|_| std::sync::OnceLock::new()).collect(),
         }
     }
 
     pub fn new_with_row_id(bach: Arc<RecordBatch>, row_id: usize) -> Self {
+        let num_cols = bach.num_columns();
         ColumnarRow {
             record_batch: bach,
             row_id,
+            nested_rows: (0..num_cols).map(|_| std::sync::OnceLock::new()).collect(),
         }
     }
 
     pub fn set_row_id(&mut self, row_id: usize) {
-        self.row_id = row_id
+        self.row_id = row_id;
+        for lock in &mut self.nested_rows {
+            *lock = std::sync::OnceLock::new();
+        }
     }
 
     pub fn get_row_id(&self) -> usize {
@@ -212,6 +220,168 @@ impl ColumnarRow {
             }),
         }
     }
+
+    /// Extract a `GenericRow<'static>` from a column in the RecordBatch at the given row_id.
+    fn extract_struct_at(
+        batch: &RecordBatch,
+        pos: usize,
+        row_id: usize,
+    ) -> Result<GenericRow<'static>> {
+        let col = batch.column(pos);
+        Self::extract_struct_from_array(col.as_ref(), row_id)
+    }
+
+    /// Recursively extract a `GenericRow<'static>` from a `StructArray` at row_id.
+    fn extract_struct_from_array(array: &dyn Array, row_id: usize) -> Result<GenericRow<'static>> {
+        use arrow::array::StructArray;
+        let sa = array
+            .as_any()
+            .downcast_ref::<StructArray>()
+            .ok_or_else(|| IllegalArgument {
+                message: format!("expected StructArray, got {:?}", array.data_type()),
+            })?;
+        let mut values = Vec::with_capacity(sa.num_columns());
+        for i in 0..sa.num_columns() {
+            let child = sa.column(i);
+            values.push(Self::arrow_value_to_datum(child.as_ref(), row_id)?);
+        }
+        Ok(GenericRow { values })
+    }
+
+    /// Convert a single element at `row_id` in an Arrow array to a `Datum<'static>`.
+    fn arrow_value_to_datum(array: &dyn Array, row_id: usize) -> Result<Datum<'static>> {
+        use arrow::array::{
+            BooleanArray, Decimal128Array, Float32Array, Float64Array, Int8Array, Int16Array,
+            Int32Array, Int64Array, Time32MillisecondArray, Time32SecondArray,
+            Time64MicrosecondArray, Time64NanosecondArray, TimestampMicrosecondArray,
+            TimestampMillisecondArray, TimestampNanosecondArray, TimestampSecondArray,
+        };
+        use crate::row::Decimal;
+
+        if array.is_null(row_id) {
+            return Ok(Datum::Null);
+        }
+
+        match array.data_type() {
+            ArrowDataType::Boolean => {
+                let a = array.as_any().downcast_ref::<BooleanArray>().unwrap();
+                Ok(Datum::Bool(a.value(row_id)))
+            }
+            ArrowDataType::Int8 => {
+                let a = array.as_any().downcast_ref::<Int8Array>().unwrap();
+                Ok(Datum::Int8(a.value(row_id)))
+            }
+            ArrowDataType::Int16 => {
+                let a = array.as_any().downcast_ref::<Int16Array>().unwrap();
+                Ok(Datum::Int16(a.value(row_id)))
+            }
+            ArrowDataType::Int32 => {
+                let a = array.as_any().downcast_ref::<Int32Array>().unwrap();
+                Ok(Datum::Int32(a.value(row_id)))
+            }
+            ArrowDataType::Int64 => {
+                let a = array.as_any().downcast_ref::<Int64Array>().unwrap();
+                Ok(Datum::Int64(a.value(row_id)))
+            }
+            ArrowDataType::Float32 => {
+                let a = array.as_any().downcast_ref::<Float32Array>().unwrap();
+                Ok(Datum::Float32(a.value(row_id).into()))
+            }
+            ArrowDataType::Float64 => {
+                let a = array.as_any().downcast_ref::<Float64Array>().unwrap();
+                Ok(Datum::Float64(a.value(row_id).into()))
+            }
+            ArrowDataType::Utf8 => {
+                let a = array.as_any().downcast_ref::<StringArray>().unwrap();
+                Ok(Datum::String(std::borrow::Cow::Owned(a.value(row_id).to_owned())))
+            }
+            ArrowDataType::Binary => {
+                let a = array.as_any().downcast_ref::<BinaryArray>().unwrap();
+                Ok(Datum::Blob(std::borrow::Cow::Owned(a.value(row_id).to_vec())))
+            }
+            ArrowDataType::Decimal128(p, s) => {
+                let (p, s) = (*p, *s);
+                let a = array.as_any().downcast_ref::<Decimal128Array>().unwrap();
+                let i128_val = a.value(row_id);
+                Ok(Datum::Decimal(Decimal::from_arrow_decimal128(
+                    i128_val,
+                    s as i64,
+                    p as u32,
+                    s as u32,
+                )?))
+            }
+            ArrowDataType::Date32 => {
+                let a = array.as_any().downcast_ref::<arrow::array::Date32Array>().unwrap();
+                Ok(Datum::Date(Date::new(a.value(row_id))))
+            }
+            ArrowDataType::Time32(TimeUnit::Second) => {
+                let a = array.as_any().downcast_ref::<Time32SecondArray>().unwrap();
+                Ok(Datum::Time(Time::new(a.value(row_id) * 1000)))
+            }
+            ArrowDataType::Time32(TimeUnit::Millisecond) => {
+                let a = array.as_any().downcast_ref::<Time32MillisecondArray>().unwrap();
+                Ok(Datum::Time(Time::new(a.value(row_id))))
+            }
+            ArrowDataType::Time64(TimeUnit::Microsecond) => {
+                let a = array.as_any().downcast_ref::<Time64MicrosecondArray>().unwrap();
+                Ok(Datum::Time(Time::new((a.value(row_id) / 1000) as i32)))
+            }
+            ArrowDataType::Time64(TimeUnit::Nanosecond) => {
+                let a = array.as_any().downcast_ref::<Time64NanosecondArray>().unwrap();
+                Ok(Datum::Time(Time::new((a.value(row_id) / 1_000_000) as i32)))
+            }
+            ArrowDataType::Timestamp(time_unit, tz) => {
+                let value: i64 = match time_unit {
+                    TimeUnit::Second => {
+                        array.as_any().downcast_ref::<TimestampSecondArray>().unwrap().value(row_id)
+                    }
+                    TimeUnit::Millisecond => {
+                        array.as_any().downcast_ref::<TimestampMillisecondArray>().unwrap().value(row_id)
+                    }
+                    TimeUnit::Microsecond => {
+                        array.as_any().downcast_ref::<TimestampMicrosecondArray>().unwrap().value(row_id)
+                    }
+                    TimeUnit::Nanosecond => {
+                        array.as_any().downcast_ref::<TimestampNanosecondArray>().unwrap().value(row_id)
+                    }
+                };
+                let (millis, nanos) = match time_unit {
+                    TimeUnit::Second => (value * 1000, 0i32),
+                    TimeUnit::Millisecond => (value, 0i32),
+                    TimeUnit::Microsecond => {
+                        let millis = value.div_euclid(1000);
+                        let nanos = (value.rem_euclid(1000) * 1000) as i32;
+                        (millis, nanos)
+                    }
+                    TimeUnit::Nanosecond => {
+                        let millis = value.div_euclid(1_000_000);
+                        let nanos = value.rem_euclid(1_000_000) as i32;
+                        (millis, nanos)
+                    }
+                };
+                if tz.is_some() {
+                    if nanos == 0 {
+                        Ok(Datum::TimestampLtz(TimestampLtz::new(millis)))
+                    } else {
+                        Ok(Datum::TimestampLtz(TimestampLtz::from_millis_nanos(millis, nanos)?))
+                    }
+                } else if nanos == 0 {
+                    Ok(Datum::TimestampNtz(TimestampNtz::new(millis)))
+                } else {
+                    Ok(Datum::TimestampNtz(TimestampNtz::from_millis_nanos(millis, nanos)?))
+                }
+            }
+            ArrowDataType::Struct(_) => {
+                let nested = Self::extract_struct_from_array(array, row_id)?;
+                Ok(Datum::Row(Box::new(nested)))
+            }
+            other => Err(IllegalArgument {
+                message: format!(
+                    "unsupported Arrow data type for nested row extraction: {other:?}"
+                ),
+            }),
+        }
+    }
 }
 
 impl InternalRow for ColumnarRow {
@@ -433,6 +603,18 @@ impl InternalRow for ColumnarRow {
         write_arrow_values_to_fluss_array(&*values, &element_fluss_type, &mut writer)?;
         writer.complete()
     }
+
+    fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
+        let lock = self.nested_rows.get(pos).ok_or_else(|| IllegalArgument {
+            message: format!("column index {pos} out of bounds for get_row"),
+        })?;
+        if let Some(cached) = lock.get() {
+            return Ok(cached);
+        }
+        // Extract before caching so a conversion failure is returned, not panicked.
+        let row = Self::extract_struct_at(&self.record_batch, pos, self.row_id)?;
+        Ok(lock.get_or_init(|| row))
+    }
 }
 
 /// Downcast to a primitive Arrow array type, then loop with null checks calling a writer method.
@@ -794,9 +976,9 @@ mod tests {
     use arrow::array::{
         ArrayRef, BinaryArray, BooleanArray, Decimal128Array, Float32Array, Float64Array,
         Int8Array, Int16Array, Int32Array, Int32Builder, Int64Array, ListBuilder, StringArray,
-        UInt32Builder,
+        StructArray, UInt32Builder,
     };
-    use arrow::datatypes::{DataType, Field, Schema};
+    use arrow::datatypes::{DataType, Field, Fields, Schema};
 
     fn single_column_row(array: ArrayRef) -> ColumnarRow {
         let batch =
@@ -1011,4 +1193,112 @@ mod tests {
             "unexpected error: {err}"
         );
     }
+
+    fn make_struct_batch(
+        field_name: &str,
+        child_fields: Fields,
+        child_arrays: Vec<Arc<dyn Array>>,
+        _num_rows: usize,
+    ) -> Arc<RecordBatch> {
+        let struct_array = StructArray::new(child_fields.clone(), child_arrays, None);
+        let schema = Arc::new(Schema::new(vec![Field::new(
+            field_name,
+            DataType::Struct(child_fields),
+            false,
+        )]));
+        Arc::new(
+            RecordBatch::try_new(schema, vec![Arc::new(struct_array)])
+                .expect("record batch"),
+        )
+    }
+
+    #[test]
+    fn columnar_row_reads_nested_row() {
+        // Build a RecordBatch with a Struct column: {i32, string}
+        let child_fields = Fields::from(vec![
+            Field::new("x", DataType::Int32, false),
+            Field::new("s", DataType::Utf8, false),
+        ]);
+        let child_arrays: Vec<Arc<dyn Array>> = vec![
+            Arc::new(Int32Array::from(vec![42, 99])),
+            Arc::new(StringArray::from(vec!["hello", "world"])),
+        ];
+        let batch = make_struct_batch("nested", child_fields, child_arrays, 2);
+
+        let mut row = ColumnarRow::new(batch);
+
+        // row_id = 0
+        let nested = row.get_row(0).unwrap();
+        assert_eq!(nested.get_field_count(), 2);
+        assert_eq!(nested.get_int(0).unwrap(), 42);
+        assert_eq!(nested.get_string(1).unwrap(), "hello");
+
+        // row_id = 1
+        row.set_row_id(1);
+        let nested = row.get_row(0).unwrap();
+        assert_eq!(nested.get_int(0).unwrap(), 99);
+        assert_eq!(nested.get_string(1).unwrap(), "world");
+    }
+
+    #[test]
+    fn columnar_row_reads_deeply_nested_row() {
+        // Build: outer struct { i32, inner struct { string } }
+        let inner_fields = Fields::from(vec![Field::new("s", DataType::Utf8, false)]);
+        let inner_array = Arc::new(StructArray::new(
+            inner_fields.clone(),
+            vec![Arc::new(StringArray::from(vec!["deep", "deeper"])) as Arc<dyn Array>],
+            None,
+        ));
+
+        let outer_fields = Fields::from(vec![
+            Field::new("n", DataType::Int32, false),
+            Field::new("inner", DataType::Struct(inner_fields), false),
+        ]);
+        let outer_array = Arc::new(StructArray::new(
+            outer_fields.clone(),
+            vec![
+                Arc::new(Int32Array::from(vec![1, 2])) as Arc<dyn Array>,
+                inner_array as Arc<dyn Array>,
+            ],
+            None,
+        ));
+
+        let schema = Arc::new(Schema::new(vec![Field::new(
+            "outer",
+            DataType::Struct(outer_fields),
+            false,
+        )]));
+        let batch = Arc::new(
+            RecordBatch::try_new(schema, vec![outer_array]).expect("record batch"),
+        );
+
+        let row = ColumnarRow::new(batch);
+
+        // Access outer struct at column 0, row 0
+        let outer = row.get_row(0).unwrap();
+        assert_eq!(outer.get_int(0).unwrap(), 1);
+
+        // Access inner struct (column 1 of outer)
+        let inner = outer.get_row(1).unwrap();
+        assert_eq!(inner.get_string(0).unwrap(), "deep");
+    }
+
+    #[test]
+    fn columnar_row_get_row_cache_invalidated_on_set_row_id() {
+        let child_fields = Fields::from(vec![Field::new("x", DataType::Int32, false)]);
+        let child_arrays: Vec<Arc<dyn Array>> =
+            vec![Arc::new(Int32Array::from(vec![10, 20]))];
+        let batch = make_struct_batch("s", child_fields, child_arrays, 2);
+
+        let mut row = ColumnarRow::new(batch);
+
+        // row_id = 0: nested x = 10
+        let nested_0 = row.get_row(0).unwrap();
+        assert_eq!(nested_0.get_int(0).unwrap(), 10);
+
+        // After set_row_id(1), cache is cleared → nested x = 20
+        row.set_row_id(1);
+        let nested_1 = row.get_row(0).unwrap();
+        assert_eq!(nested_1.get_int(0).unwrap(), 20);
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index 267ae13cd1..24e4bd79d7 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -171,6 +171,10 @@ impl<'a> InternalRow for CompactedRow<'a> {
         self.decoded_row()?.get_array(pos)
     }
 
+    fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
+        self.decoded_row()?.get_row(pos)
+    }
+
     fn as_encoded_bytes(&self, write_format: WriteFormat) -> Option<&[u8]> {
         match write_format {
             WriteFormat::CompactedKv => Some(self.as_bytes()),
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index 4ae442fc0e..9d7fb6cb8f 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -187,6 +187,18 @@ impl<'a> CompactedRowDeserializer<'a> {
                     let array = crate::row::binary_array::FlussArray::from_bytes(bytes)?;
                     (Datum::Array(array), next)
                 }
+                DataType::Row(row_type) => {
+                    let (nested_bytes, next) = reader.read_bytes(cursor)?;
+                    let nested_reader = CompactedRowReader::new(
+                        row_type.fields().len(),
+                        nested_bytes,
+                        0,
+                        nested_bytes.len(),
+                    );
+                    let nested_deser = CompactedRowDeserializer::new_from_owned(row_type.clone());
+                    let nested_row = nested_deser.deserialize(&nested_reader)?;
+                    (Datum::Row(Box::new(nested_row)), next)
+                }
                 _ => {
                     return Err(IllegalArgument {
                         message: format!(
@@ -326,3 +338,142 @@ impl<'a> CompactedRowReader<'a> {
         Ok((s, next_pos))
     }
 }
+
+#[cfg(test)]
+mod row_type_tests {
+    use crate::metadata::{DataType, DataTypes, RowType};
+    use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
+    use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
+    use crate::row::binary::ValueWriter;
+    use crate::row::field_getter::FieldGetter;
+    use crate::row::{Datum, GenericRow, InternalRow};
+
+    fn round_trip<F>(outer_row_type: &RowType, outer_row: &GenericRow, verify: F)
+    where
+        F: FnOnce(&GenericRow),
+    {
+        // Write
+        let field_getters = FieldGetter::create_field_getters(outer_row_type);
+        let value_writers: Vec<ValueWriter> = outer_row_type
+            .fields()
+            .iter()
+            .map(|f| ValueWriter::create_value_writer(f.data_type(), None).unwrap())
+            .collect();
+        let mut writer = CompactedRowWriter::new(outer_row_type.fields().len());
+        for (i, (getter, vw)) in field_getters.iter().zip(value_writers.iter()).enumerate() {
+            let datum = getter.get_field(outer_row as &dyn InternalRow).unwrap();
+            vw.write_value(&mut writer, i, &datum).unwrap();
+        }
+        let bytes = writer.to_bytes();
+
+        // Read
+        let deser = CompactedRowDeserializer::new(outer_row_type);
+        let reader = CompactedRowReader::new(
+            outer_row_type.fields().len(),
+            bytes.as_ref(),
+            0,
+            bytes.len(),
+        );
+        let result = deser.deserialize(&reader);
+        verify(&result);
+    }
+
+    #[test]
+    fn test_row_simple_nesting() {
+        // ROW<INT, STRING> nested inside an outer row
+        let inner_row_type = RowType::with_data_types_and_field_names(
+            vec![DataTypes::int(), DataTypes::string()],
+            vec!["x", "label"],
+        );
+        let outer_row_type = RowType::with_data_types_and_field_names(
+            vec![DataTypes::int(), DataType::Row(inner_row_type.clone())],
+            vec!["id", "nested"],
+        );
+
+        let mut inner = GenericRow::new(2);
+        inner.set_field(0, 42_i32);
+        inner.set_field(1, "hello");
+
+        let mut outer = GenericRow::new(2);
+        outer.set_field(0, 1_i32);
+        outer.set_field(1, Datum::Row(Box::new(inner)));
+
+        round_trip(&outer_row_type, &outer, |result| {
+            assert_eq!(result.get_int(0).unwrap(), 1);
+            let nested = result.get_row(1).unwrap();
+            assert_eq!(nested.get_int(0).unwrap(), 42);
+            assert_eq!(nested.get_string(1).unwrap(), "hello");
+        });
+    }
+
+    #[test]
+    fn test_row_deep_nesting() {
+        // ROW<ROW<INT>> — two levels of nesting
+        let inner_inner_row_type = RowType::with_data_types_and_field_names(
+            vec![DataTypes::int()],
+            vec!["n"],
+        );
+        let inner_row_type = RowType::with_data_types_and_field_names(
+            vec![DataType::Row(inner_inner_row_type.clone())],
+            vec!["inner"],
+        );
+        let outer_row_type = RowType::with_data_types_and_field_names(
+            vec![DataType::Row(inner_row_type.clone())],
+            vec!["outer"],
+        );
+
+        let mut innermost = GenericRow::new(1);
+        innermost.set_field(0, 99_i32);
+
+        let mut middle = GenericRow::new(1);
+        middle.set_field(0, Datum::Row(Box::new(innermost)));
+
+        let mut outer = GenericRow::new(1);
+        outer.set_field(0, Datum::Row(Box::new(middle)));
+
+        round_trip(&outer_row_type, &outer, |result| {
+            let mid = result.get_row(0).unwrap();
+            let inner = mid.get_row(0).unwrap();
+            assert_eq!(inner.get_int(0).unwrap(), 99);
+        });
+    }
+
+    #[test]
+    fn test_row_with_nullable_fields() {
+        // Outer nullable ROW column; nested row with a nullable STRING field set to null
+        let inner_row_type = RowType::with_data_types_and_field_names(
+            vec![DataTypes::int(), DataTypes::string()],
+            vec!["id", "optional_name"],
+        );
+        let outer_row_type = RowType::with_data_types_and_field_names(
+            vec![DataTypes::int(), DataType::Row(inner_row_type.clone())],
+            vec!["k", "nested"],
+        );
+
+        // Case 1: non-null nested row with a null field inside
+        let mut inner = GenericRow::new(2);
+        inner.set_field(0, 7_i32);
+        inner.set_field(1, Datum::Null);
+
+        let mut outer = GenericRow::new(2);
+        outer.set_field(0, 10_i32);
+        outer.set_field(1, Datum::Row(Box::new(inner)));
+
+        round_trip(&outer_row_type, &outer, |result| {
+            assert_eq!(result.get_int(0).unwrap(), 10);
+            let nested = result.get_row(1).unwrap();
+            assert_eq!(nested.get_int(0).unwrap(), 7);
+            assert!(nested.is_null_at(1).unwrap());
+        });
+
+        // Case 2: outer ROW column is null
+        let mut outer_null = GenericRow::new(2);
+        outer_null.set_field(0, 20_i32);
+        outer_null.set_field(1, Datum::Null);
+
+        round_trip(&outer_row_type, &outer_null, |result2| {
+            assert_eq!(result2.get_int(0).unwrap(), 20);
+            assert!(result2.is_null_at(1).unwrap());
+        });
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 78dc54982c..865d4b4f8e 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -18,6 +18,7 @@
 use crate::error::Error::RowConvertError;
 use crate::error::Result;
 use crate::row::Decimal;
+use crate::row::GenericRow;
 use crate::row::binary_array::FlussArray;
 use arrow::array::{
     ArrayBuilder, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
@@ -72,6 +73,8 @@ pub enum Datum<'a> {
     TimestampLtz(TimestampLtz),
     #[display("{0}")]
     Array(FlussArray),
+    #[display("{0:?}")]
+    Row(Box<GenericRow<'a>>),
 }
 
 impl Datum<'_> {
@@ -134,6 +137,13 @@ impl Datum<'_> {
             _ => panic!("not an array: {self:?}"),
         }
     }
+
+    pub fn as_row(&self) -> &GenericRow<'_> {
+        match self {
+            Self::Row(r) => r.as_ref(),
+            _ => panic!("not a row: {self:?}"),
+        }
+    }
 }
 
 // ----------- implement from
@@ -878,6 +888,11 @@ impl Datum<'_> {
             Datum::Array(arr) => {
                 return append_fluss_array_to_list_builder(arr, builder, data_type);
             }
+            Datum::Row(_) => {
+                return Err(RowConvertError {
+                    message: "append_to is not supported for Row type".to_string(),
+                });
+            }
         }
 
         Err(RowConvertError {
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
index 877b3ecdb1..a6ba580f2a 100644
--- a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
@@ -109,7 +109,7 @@ impl KeyEncoder for CompactedKeyEncoder {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::DataTypes;
+    use crate::metadata::{DataType, DataTypes};
     use crate::row::binary_array::FlussArrayWriter;
     use crate::row::{Datum, GenericRow};
 
@@ -493,4 +493,50 @@ mod tests {
             encoded.iter().as_slice()
         );
     }
+
+    #[test]
+    fn test_row_as_primary_key() {
+        // ROW<INT, STRING> as a primary key column
+        let inner_row_type = RowType::with_data_types_and_field_names(
+            vec![DataTypes::int(), DataTypes::string()],
+            vec!["x", "label"],
+        );
+        let row_type = RowType::with_data_types_and_field_names(
+            vec![
+                DataTypes::int(),
+                DataType::Row(inner_row_type.clone()),
+            ],
+            vec!["id", "nested"],
+        );
+
+        let mut inner = GenericRow::new(2);
+        inner.set_field(0, 42_i32);
+        inner.set_field(1, "hello");
+
+        let mut row = GenericRow::new(2);
+        row.set_field(0, 1_i32);
+        row.set_field(1, Datum::Row(Box::new(inner)));
+
+        let mut encoder = for_test_row_type(&row_type);
+        let encoded = encoder.encode_key(&row).unwrap();
+
+        // Verify it encodes without error and produces non-empty bytes
+        assert!(!encoded.is_empty());
+
+        // Encode the same row again to verify determinism
+        let encoded2 = encoder.encode_key(&row).unwrap();
+        assert_eq!(encoded, encoded2);
+
+        // Encode a different nested row and verify different output
+        let mut inner2 = GenericRow::new(2);
+        inner2.set_field(0, 99_i32);
+        inner2.set_field(1, "world");
+
+        let mut row2 = GenericRow::new(2);
+        row2.set_field(0, 1_i32);
+        row2.set_field(1, Datum::Row(Box::new(inner2)));
+
+        let encoded3 = encoder.encode_key(&row2).unwrap();
+        assert_ne!(encoded, encoded3);
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/field_getter.rs b/fluss-rust/crates/fluss/src/row/field_getter.rs
index 69e08602c3..a1ea378fc9 100644
--- a/fluss-rust/crates/fluss/src/row/field_getter.rs
+++ b/fluss-rust/crates/fluss/src/row/field_getter.rs
@@ -82,8 +82,9 @@ impl FieldGetter {
                 pos,
                 precision: t.precision(),
             },
-            // TODO: add Map and Row variants when get_map/get_row are available in InternalRow.
+            // TODO: add Map variant when get_map is available in InternalRow.
             DataType::Array(_) => InnerFieldGetter::Array { pos },
+            DataType::Row(_) => InnerFieldGetter::Row { pos },
             _ => unimplemented!("DataType {:?} is currently unimplemented", data_type),
         };
 
@@ -154,6 +155,9 @@ pub enum InnerFieldGetter {
     Array {
         pos: usize,
     },
+    Row {
+        pos: usize,
+    },
 }
 
 impl InnerFieldGetter {
@@ -183,8 +187,9 @@ impl InnerFieldGetter {
             InnerFieldGetter::TimestampLtz { pos, precision } => {
                 Datum::TimestampLtz(row.get_timestamp_ltz(*pos, *precision)?)
             }
-            // TODO: add Map and Row field getter support once their binary forms are implemented.
+            // TODO: add Map field getter support once its binary form is implemented.
             InnerFieldGetter::Array { pos } => Datum::Array(row.get_array(*pos)?),
+            InnerFieldGetter::Row { pos } => Datum::Row(Box::new(row.get_row(*pos)?.clone())),
         })
     }
 
@@ -206,7 +211,8 @@ impl InnerFieldGetter {
             | Self::Time { pos }
             | Self::Timestamp { pos, .. }
             | Self::TimestampLtz { pos, .. }
-            | Self::Array { pos } => *pos,
+            | Self::Array { pos }
+            | Self::Row { pos } => *pos,
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index c6bdd7c540..fb599fc9af 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -34,6 +34,7 @@ mod row_decoder;
 use crate::client::WriteFormat;
 pub use binary_array::FlussArray;
 use bytes::Bytes;
+use serde::Serialize;
 pub use column::*;
 pub use compacted::CompactedRow;
 pub use datum::*;
@@ -130,13 +131,20 @@ pub trait InternalRow: Send + Sync {
     /// Returns the array value at the given position
     fn get_array(&self, pos: usize) -> Result<FlussArray>;
 
+    /// Returns the nested row value at the given position
+    fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
+        Err(crate::error::Error::IllegalArgument {
+            message: format!("get_row not supported at position {pos}"),
+        })
+    }
+
     /// Returns encoded bytes if already encoded
     fn as_encoded_bytes(&self, _write_format: WriteFormat) -> Option<&[u8]> {
         None
     }
 }
 
-#[derive(Debug)]
+#[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Hash, Serialize)]
 pub struct GenericRow<'a> {
     pub values: Vec<Datum<'a>>,
 }
@@ -294,6 +302,15 @@ impl<'a> InternalRow for GenericRow<'a> {
             }),
         }
     }
+
+    fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
+        match self.get_value(pos)? {
+            Datum::Row(r) => Ok(r.as_ref()),
+            other => Err(IllegalArgument {
+                message: format!("type mismatch at position {pos}: expected Row, got {other:?}"),
+            }),
+        }
+    }
 }
 
 impl<'a> GenericRow<'a> {

From 2c18097949cd68545edec69b251a4fe06ab3b0f3 Mon Sep 17 00:00:00 2001
From: Anton Borisov <anton.borisov@fresha.com>
Date: Sun, 10 May 2026 19:14:32 +0100
Subject: [PATCH 267/287] fixes and improvements

---
 fluss-rust/bindings/cpp/src/types.rs          |   2 +-
 fluss-rust/bindings/python/src/table.rs       |   5 +
 .../crates/fluss/src/client/table/append.rs   |   2 +-
 .../crates/fluss/src/client/table/scanner.rs  |  58 +-
 .../crates/fluss/src/metadata/datatype.rs     |  72 ++-
 .../crates/fluss/src/metadata/json_serde.rs   | 342 ++++++++--
 fluss-rust/crates/fluss/src/metadata/table.rs | 148 ++++-
 fluss-rust/crates/fluss/src/record/arrow.rs   |  72 ++-
 fluss-rust/crates/fluss/src/record/mod.rs     |   2 +-
 .../fluss/src/row/binary/binary_writer.rs     |  74 ++-
 .../crates/fluss/src/row/binary_array.rs      | 315 ++++++++-
 fluss-rust/crates/fluss/src/row/column.rs     | 544 +++++++++-------
 .../crates/fluss/src/row/column_writer.rs     | 139 +++-
 .../src/row/compacted/compacted_key_writer.rs |  14 +-
 .../fluss/src/row/compacted/compacted_row.rs  |  44 +-
 .../src/row/compacted/compacted_row_reader.rs | 192 ++++--
 .../crates/fluss/src/row/compacted/mod.rs     |   2 +-
 fluss-rust/crates/fluss/src/row/datum.rs      | 233 +++++--
 .../src/row/encode/compacted_key_encoder.rs   |  54 +-
 fluss-rust/crates/fluss/src/row/lookup_row.rs |   5 +-
 fluss-rust/crates/fluss/src/row/mod.rs        |  15 +-
 .../crates/fluss/src/row/projected_row.rs     |   6 +-
 .../fluss/tests/integration/kv_table.rs       | 606 ++++++++++++++++--
 .../fluss/tests/integration/log_table.rs      | 489 +++++++++++++-
 24 files changed, 2847 insertions(+), 588 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 19aa9a362f..84aec25b8f 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -529,7 +529,7 @@ pub fn resolve_row_types(
             Datum::TimestampNtz(ts) => Datum::TimestampNtz(*ts),
             Datum::TimestampLtz(ts) => Datum::TimestampLtz(*ts),
             Datum::Array(a) => Datum::Array(a.clone()),
-            Datum::Row(r) => Datum::Row(Box::new(resolve_row_types(r, None)?)),
+            Datum::Row(_) => return Err(anyhow!("Row datum is not yet supported in C++ bindings")),
         };
         out.set_field(idx, resolved);
     }
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 4ec7b8d77e..9ee84d76ed 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -1369,6 +1369,11 @@ fn python_value_to_datum(
                             }
                         }
                         Datum::Array(v) => writer.write_array(i, &v),
+                        Datum::Row(_) => {
+                            return Err(FlussError::new_err(
+                                "Row datum is not supported as an array element",
+                            ));
+                        }
                     }
                 }
             }
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
index a58433f386..535520085e 100644
--- a/fluss-rust/crates/fluss/src/client/table/append.rs
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -126,7 +126,7 @@ impl AppendWriter {
     /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
     pub fn append_arrow_batch(&self, batch: RecordBatch) -> Result<WriteResultFuture> {
         let physical_table_path = if self.partition_getter.is_some() && batch.num_rows() > 0 {
-            let first_row = ColumnarRow::new(Arc::new(batch.clone()));
+            let first_row = ColumnarRow::new(Arc::new(batch.clone()), 0, None);
             Arc::new(get_physical_path(
                 &self.table_path,
                 self.partition_getter.as_ref(),
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 00c5b23859..c6228e59f9 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -23,10 +23,13 @@ use crate::client::table::log_fetch_buffer::{
     LogFetchBuffer, RemotePendingFetch,
 };
 use crate::client::table::remote_log::{RemoteLogDownloader, RemoteLogFetchInfo};
+use crate::config::Config;
 use crate::error::Error::UnsupportedOperation;
 use crate::error::{ApiError, Error, FlussError, Result};
-use crate::metadata::{LogFormat, PhysicalTablePath, TableBucket, TableInfo, TablePath};
-use crate::proto::{ErrorResponse, FetchLogRequest, PbFetchLogReqForBucket, PbFetchLogReqForTable};
+use crate::metadata::{LogFormat, PhysicalTablePath, RowType, TableBucket, TableInfo, TablePath};
+use crate::proto::{
+    ErrorResponse, FetchLogRequest, FetchLogResponse, PbFetchLogReqForBucket, PbFetchLogReqForTable,
+};
 use crate::record::{
     LogRecordsBatches, ReadContext, ScanBatch, ScanRecord, ScanRecords, to_arrow_schema,
 };
@@ -273,7 +276,7 @@ impl LogScannerInner {
         table_info: &TableInfo,
         metadata: Arc<Metadata>,
         connections: Arc<RpcClient>,
-        config: &crate::config::Config,
+        config: &Config,
         projected_fields: Option<Vec<usize>>,
     ) -> Result<Self> {
         let log_scanner_status = Arc::new(LogScannerStatus::new());
@@ -651,14 +654,26 @@ impl LogFetcher {
         conns: Arc<RpcClient>,
         metadata: Arc<Metadata>,
         log_scanner_status: Arc<LogScannerStatus>,
-        config: &crate::config::Config,
+        config: &Config,
         projected_fields: Option<Vec<usize>>,
     ) -> Result<Self> {
-        let full_arrow_schema = to_arrow_schema(table_info.get_row_type())?;
+        let full_row_type = table_info.get_row_type();
+        let full_arrow_schema = to_arrow_schema(full_row_type)?;
+        let projected_row_type = match &projected_fields {
+            None => Arc::new(full_row_type.clone()),
+            Some(fields) => Arc::new(RowType::new(
+                fields
+                    .iter()
+                    .map(|&i| full_row_type.fields()[i].clone())
+                    .collect(),
+            )),
+        };
         let read_context =
-            Self::create_read_context(full_arrow_schema.clone(), projected_fields.clone(), false)?;
+            Self::create_read_context(full_arrow_schema.clone(), projected_fields.clone(), false)?
+                .with_fluss_row_type(projected_row_type.clone());
         let remote_read_context =
-            Self::create_read_context(full_arrow_schema, projected_fields.clone(), true)?;
+            Self::create_read_context(full_arrow_schema, projected_fields.clone(), true)?
+                .with_fluss_row_type(projected_row_type);
 
         let tmp_dir = TempDir::with_prefix("fluss-remote-logs")?;
         let log_fetch_buffer = Arc::new(LogFetchBuffer::new(read_context.clone()));
@@ -928,7 +943,7 @@ impl LogFetcher {
 
     /// Handle fetch response and add completed fetches to buffer
     async fn handle_fetch_response(
-        fetch_response: crate::proto::FetchLogResponse,
+        fetch_response: FetchLogResponse,
         context: FetchResponseContext,
     ) {
         let FetchResponseContext {
@@ -1704,6 +1719,7 @@ mod tests {
         DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
     };
     use crate::metadata::{DataTypes, PhysicalTablePath, Schema, TableInfo, TablePath};
+    use crate::proto::{PbFetchLogRespForBucket, PbFetchLogRespForTable};
     use crate::record::MemoryLogRecordsArrowBuilder;
     use crate::row::{Datum, GenericRow};
     use crate::rpc::FlussError;
@@ -1743,7 +1759,7 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata,
             status.clone(),
-            &crate::config::Config::default(),
+            &Config::default(),
             None,
         )?;
 
@@ -1775,7 +1791,7 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata,
             status,
-            &crate::config::Config::default(),
+            &Config::default(),
             None,
         )?;
 
@@ -1811,7 +1827,7 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata,
             status,
-            &crate::config::Config::default(),
+            &Config::default(),
             None,
         )?;
 
@@ -1835,14 +1851,14 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata.clone(),
             status.clone(),
-            &crate::config::Config::default(),
+            &Config::default(),
             None,
         )?;
 
-        let response = crate::proto::FetchLogResponse {
-            tables_resp: vec![crate::proto::PbFetchLogRespForTable {
+        let response = FetchLogResponse {
+            tables_resp: vec![PbFetchLogRespForTable {
                 table_id: 1,
-                buckets_resp: vec![crate::proto::PbFetchLogRespForBucket {
+                buckets_resp: vec![PbFetchLogRespForBucket {
                     partition_id: None,
                     bucket_id: 0,
                     error_code: Some(FlussError::AuthorizationException.code()),
@@ -1885,17 +1901,17 @@ mod tests {
             Arc::new(RpcClient::new()),
             metadata.clone(),
             status.clone(),
-            &crate::config::Config::default(),
+            &Config::default(),
             None,
         )?;
 
         let bucket = TableBucket::new(1, 0);
         assert!(metadata.leader_for(&table_path, &bucket).await?.is_some());
 
-        let response = crate::proto::FetchLogResponse {
-            tables_resp: vec![crate::proto::PbFetchLogRespForTable {
+        let response = FetchLogResponse {
+            tables_resp: vec![PbFetchLogRespForTable {
                 table_id: 1,
-                buckets_resp: vec![crate::proto::PbFetchLogRespForBucket {
+                buckets_resp: vec![PbFetchLogRespForBucket {
                     partition_id: None,
                     bucket_id: 0,
                     error_code: Some(FlussError::NotLeaderOrFollower.code()),
@@ -2002,12 +2018,12 @@ mod tests {
         let status = Arc::new(LogScannerStatus::new());
         status.assign_scan_bucket(TableBucket::new(1, 0), 0);
 
-        let config = crate::config::Config {
+        let config = Config {
             scanner_log_fetch_max_bytes: 1234,
             scanner_log_fetch_min_bytes: 7,
             scanner_log_fetch_wait_max_time_ms: 89,
             scanner_log_fetch_max_bytes_for_bucket: 512,
-            ..crate::config::Config::default()
+            ..Config::default()
         };
 
         let fetcher = LogFetcher::new(
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 4103aa3df0..ffc48a8b69 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -531,7 +531,6 @@ impl DecimalType {
             });
         }
         // Validate scale
-        // Note: MIN_SCALE is 0, and scale is u32, so scale >= MIN_SCALE is always true
         if scale > precision {
             return Err(IllegalArgument {
                 message: format!(
@@ -1220,11 +1219,61 @@ impl DataTypes {
     }
 }
 
-#[derive(Debug, Clone, PartialEq, Eq, Hash, Serialize, Deserialize)]
+pub const UNASSIGNED_FIELD_ID: i32 = -1;
+
+pub fn reassign_field_ids(data_type: &DataType, counter: &mut i32) -> DataType {
+    match data_type {
+        DataType::Array(at) => DataType::Array(ArrayType::with_nullable(
+            at.nullable,
+            reassign_field_ids(at.get_element_type(), counter),
+        )),
+        DataType::Map(mt) => DataType::Map(MapType::with_nullable(
+            mt.nullable,
+            reassign_field_ids(mt.key_type(), counter),
+            reassign_field_ids(mt.value_type(), counter),
+        )),
+        DataType::Row(rt) => {
+            let new_fields: Vec<DataField> = rt
+                .fields()
+                .iter()
+                .map(|f| {
+                    *counter += 1;
+                    let id = *counter;
+                    let new_inner = reassign_field_ids(&f.data_type, counter);
+                    DataField::with_field_id(f.name.clone(), new_inner, f.description.clone(), id)
+                })
+                .collect();
+            DataType::Row(RowType::with_nullable(rt.nullable, new_fields))
+        }
+        _ => data_type.clone(),
+    }
+}
+
+#[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct DataField {
     pub name: String,
     pub data_type: DataType,
     pub description: Option<String>,
+    pub field_id: i32,
+}
+
+// field_id is excluded from PartialEq/Eq/Hash to match Java's DataField.equals/hashCode.
+impl PartialEq for DataField {
+    fn eq(&self, other: &Self) -> bool {
+        self.name == other.name
+            && self.data_type == other.data_type
+            && self.description == other.description
+    }
+}
+
+impl Eq for DataField {}
+
+impl std::hash::Hash for DataField {
+    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
+        self.name.hash(state);
+        self.data_type.hash(state);
+        self.description.hash(state);
+    }
 }
 
 impl DataField {
@@ -1237,6 +1286,21 @@ impl DataField {
             name: name.into(),
             data_type,
             description,
+            field_id: UNASSIGNED_FIELD_ID,
+        }
+    }
+
+    pub fn with_field_id<N: Into<String>>(
+        name: N,
+        data_type: DataType,
+        description: Option<String>,
+        field_id: i32,
+    ) -> DataField {
+        DataField {
+            name: name.into(),
+            data_type,
+            description,
+            field_id,
         }
     }
 
@@ -1247,6 +1311,10 @@ impl DataField {
     pub fn data_type(&self) -> &DataType {
         &self.data_type
     }
+
+    pub fn field_id(&self) -> i32 {
+        self.field_id
+    }
 }
 
 impl Display for DataField {
diff --git a/fluss-rust/crates/fluss/src/metadata/json_serde.rs b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
index efbce84d65..b08159ae66 100644
--- a/fluss-rust/crates/fluss/src/metadata/json_serde.rs
+++ b/fluss-rust/crates/fluss/src/metadata/json_serde.rs
@@ -17,7 +17,10 @@
 
 use crate::error::Error::JsonSerdeError;
 use crate::error::{Error, Result};
-use crate::metadata::datatype::{DataField, DataType, DataTypes};
+use crate::metadata::datatype::{
+    DataField, DataType, DataTypes, DecimalType, TimeType, TimestampLTzType, TimestampType,
+    UNASSIGNED_FIELD_ID,
+};
 use crate::metadata::table::{Column, Schema, TableDescriptor};
 use serde_json::{Value, json};
 use std::collections::HashMap;
@@ -202,12 +205,11 @@ impl JsonSerde for DataType {
                     .get(Self::FIELD_NAME_SCALE)
                     .and_then(|v| v.as_u64())
                     .unwrap_or(0) as u32;
-                DataType::Decimal(
-                    crate::metadata::datatype::DecimalType::with_nullable(true, precision, scale)
-                        .map_err(|e| Error::JsonSerdeError {
+                DataType::Decimal(DecimalType::with_nullable(true, precision, scale).map_err(
+                    |e| Error::JsonSerdeError {
                         message: format!("Invalid DECIMAL parameters: {e}"),
-                    })?,
-                )
+                    },
+                )?)
             }
             "DATE" => DataTypes::date(),
             "TIME_WITHOUT_TIME_ZONE" => {
@@ -215,39 +217,33 @@ impl JsonSerde for DataType {
                     .get(Self::FIELD_NAME_PRECISION)
                     .and_then(|v| v.as_u64())
                     .unwrap_or(0) as u32;
-                DataType::Time(
-                    crate::metadata::datatype::TimeType::with_nullable(true, precision).map_err(
-                        |e| Error::JsonSerdeError {
-                            message: format!("Invalid TIME_WITHOUT_TIME_ZONE precision: {e}"),
-                        },
-                    )?,
-                )
+                DataType::Time(TimeType::with_nullable(true, precision).map_err(|e| {
+                    Error::JsonSerdeError {
+                        message: format!("Invalid TIME_WITHOUT_TIME_ZONE precision: {e}"),
+                    }
+                })?)
             }
             "TIMESTAMP_WITHOUT_TIME_ZONE" => {
                 let precision = node
                     .get(Self::FIELD_NAME_PRECISION)
                     .and_then(|v| v.as_u64())
                     .unwrap_or(6) as u32;
-                DataType::Timestamp(
-                    crate::metadata::datatype::TimestampType::with_nullable(true, precision)
-                        .map_err(|e| Error::JsonSerdeError {
-                            message: format!("Invalid TIMESTAMP_WITHOUT_TIME_ZONE precision: {e}"),
-                        })?,
-                )
+                DataType::Timestamp(TimestampType::with_nullable(true, precision).map_err(|e| {
+                    Error::JsonSerdeError {
+                        message: format!("Invalid TIMESTAMP_WITHOUT_TIME_ZONE precision: {e}"),
+                    }
+                })?)
             }
             "TIMESTAMP_WITH_LOCAL_TIME_ZONE" => {
                 let precision = node
                     .get(Self::FIELD_NAME_PRECISION)
                     .and_then(|v| v.as_u64())
                     .unwrap_or(6) as u32;
-                DataType::TimestampLTz(
-                    crate::metadata::datatype::TimestampLTzType::with_nullable(true, precision)
-                        .map_err(|e| Error::JsonSerdeError {
-                            message: format!(
-                                "Invalid TIMESTAMP_WITH_LOCAL_TIME_ZONE precision: {e}"
-                            ),
-                        })?,
-                )
+                DataType::TimestampLTz(TimestampLTzType::with_nullable(true, precision).map_err(
+                    |e| Error::JsonSerdeError {
+                        message: format!("Invalid TIMESTAMP_WITH_LOCAL_TIME_ZONE precision: {e}"),
+                    },
+                )?)
             }
             "BYTES" => DataTypes::bytes(),
             "BINARY" => {
@@ -328,6 +324,7 @@ impl DataField {
     const NAME: &'static str = "name";
     const FIELD_TYPE: &'static str = "field_type";
     const DESCRIPTION: &'static str = "description";
+    const FIELD_ID: &'static str = "field_id";
 }
 
 impl JsonSerde for DataField {
@@ -344,6 +341,8 @@ impl JsonSerde for DataField {
             obj.insert(Self::DESCRIPTION.to_string(), json!(description));
         }
 
+        obj.insert(Self::FIELD_ID.to_string(), json!(self.field_id()));
+
         Ok(Value::Object(obj))
     }
 
@@ -369,7 +368,18 @@ impl JsonSerde for DataField {
             .and_then(|v| v.as_str())
             .map(|s| s.to_string());
 
-        Ok(DataField::new(name, data_type, description))
+        let field_id = node
+            .get(Self::FIELD_ID)
+            .and_then(|v| v.as_i64())
+            .map(|v| v as i32)
+            .unwrap_or(UNASSIGNED_FIELD_ID);
+
+        Ok(DataField::with_field_id(
+            name,
+            data_type,
+            description,
+            field_id,
+        ))
     }
 }
 
@@ -439,6 +449,7 @@ impl JsonSerde for Column {
 impl Schema {
     const COLUMNS_NAME: &'static str = "columns";
     const PRIMARY_KEY_NAME: &'static str = "primary_key";
+    const HIGHEST_FIELD_ID: &'static str = "highest_field_id";
     const VERSION_KEY: &'static str = "version";
     const VERSION: u32 = 1;
 }
@@ -467,6 +478,12 @@ impl JsonSerde for Schema {
                 .collect();
             obj.insert(Self::PRIMARY_KEY_NAME.to_string(), json!(pk_values));
         }
+
+        obj.insert(
+            Self::HIGHEST_FIELD_ID.to_string(),
+            json!(self.highest_field_id()),
+        );
+
         Ok(Value::Object(obj))
     }
 
@@ -682,12 +699,13 @@ impl JsonSerde for TableDescriptor {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::DataTypes;
+    use crate::metadata::reassign_field_ids;
+    use crate::metadata::{
+        Column, DataField, DataType, DataTypes as DT, DataTypes, MapType, Schema,
+    };
 
     #[test]
     fn column_id_round_trip_through_json() {
-        use crate::metadata::Column;
-
         let col = Column::new("a", DataTypes::int())
             .with_id(7)
             .with_comment("desc");
@@ -699,8 +717,6 @@ mod tests {
 
     #[test]
     fn schema_assigns_ids_when_absent_and_preserves_when_present() {
-        use crate::metadata::{Column, Schema};
-
         let auto = Schema::builder()
             .column("a", DataTypes::int())
             .column("b", DataTypes::string())
@@ -722,7 +738,6 @@ mod tests {
 
     #[test]
     fn schema_rejects_duplicate_ids() {
-        use crate::metadata::Column;
         let err = Schema::builder()
             .with_columns(vec![
                 Column::new("a", DataTypes::int()).with_id(7),
@@ -730,12 +745,11 @@ mod tests {
             ])
             .build()
             .unwrap_err();
-        assert!(err.to_string().contains("Duplicate column id 7"), "{err}");
+        assert!(err.to_string().contains("Duplicate field id 7"), "{err}");
     }
 
     #[test]
     fn schema_rejects_negative_non_sentinel_ids() {
-        use crate::metadata::Column;
         let err = Schema::builder()
             .with_columns(vec![Column::new("a", DataTypes::int()).with_id(-7)])
             .build()
@@ -745,7 +759,6 @@ mod tests {
 
     #[test]
     fn column_json_id_overflow_errors() {
-        use crate::metadata::Column;
         let json = serde_json::json!({
             "name": "a",
             "data_type": Column::new("a", DataTypes::int()).serialize_json().unwrap()
@@ -758,8 +771,6 @@ mod tests {
 
     #[test]
     fn schema_rejects_partially_assigned_ids() {
-        use crate::metadata::Column;
-
         let err = Schema::builder()
             .with_columns(vec![
                 Column::new("a", DataTypes::int()).with_id(0),
@@ -773,6 +784,259 @@ mod tests {
         );
     }
 
+    #[test]
+    fn schema_assigns_nested_field_ids_in_java_dfs_order() {
+        let inner_row = DataTypes::row(vec![DataField::new("n", DataTypes::int(), None)]);
+        let nested_row = DataTypes::row(vec![
+            DataField::new("x", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+        let deep_row = DataTypes::row(vec![DataField::new("inner", inner_row, None)]);
+
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("nested", nested_row)
+            .column("deep", deep_row)
+            .build()
+            .unwrap();
+
+        let top_ids: Vec<i32> = schema.columns().iter().map(|c| c.id()).collect();
+        assert_eq!(top_ids, vec![0, 1, 4]);
+
+        fn nested_field(dt: &DataType, idx: usize) -> &DataField {
+            match dt {
+                DataType::Row(rt) => &rt.fields()[idx],
+                _ => panic!("not a Row"),
+            }
+        }
+        let nested_dt = schema.columns()[1].data_type();
+        assert_eq!(nested_field(nested_dt, 0).field_id(), 2); // x
+        assert_eq!(nested_field(nested_dt, 1).field_id(), 3); // label
+
+        let deep_dt = schema.columns()[2].data_type();
+        let inner_field = nested_field(deep_dt, 0); // inner
+        assert_eq!(inner_field.field_id(), 5);
+        let n_field = nested_field(inner_field.data_type(), 0); // n
+        assert_eq!(n_field.field_id(), 6);
+
+        assert_eq!(schema.highest_field_id(), 6);
+
+        for c in schema.columns() {
+            assert_ne!(c.id(), UNASSIGNED_FIELD_ID);
+        }
+    }
+
+    #[test]
+    fn schema_array_of_row_assigns_nested_ids() {
+        let elem = DataTypes::row(vec![
+            DataField::new("seq", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("events", DataTypes::array(elem))
+            .build()
+            .unwrap();
+        assert_eq!(schema.highest_field_id(), 3);
+        let array_dt = schema.columns()[1].data_type();
+        let elem_dt = match array_dt {
+            DataType::Array(at) => at.get_element_type(),
+            _ => unreachable!(),
+        };
+        let fields = match elem_dt {
+            DataType::Row(rt) => rt.fields(),
+            _ => unreachable!(),
+        };
+        assert_eq!(fields[0].field_id(), 2);
+        assert_eq!(fields[1].field_id(), 3);
+    }
+
+    #[test]
+    fn schema_nested_row_round_trips_through_json() {
+        let nested = DataTypes::row(vec![
+            DataField::new("x", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+        let original = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("nested", nested)
+            .build()
+            .unwrap();
+
+        let json = original.serialize_json().unwrap();
+
+        assert_eq!(
+            json.get("highest_field_id").and_then(|v| v.as_i64()),
+            Some(3)
+        );
+
+        let round_tripped = Schema::deserialize_json(&json).unwrap();
+        assert_eq!(round_tripped.highest_field_id(), 3);
+        assert_eq!(
+            round_tripped
+                .columns()
+                .iter()
+                .map(|c| c.id())
+                .collect::<Vec<_>>(),
+            vec![0, 1],
+        );
+        assert_eq!(round_tripped, original);
+    }
+
+    #[test]
+    fn schema_rejects_duplicate_nested_field_ids() {
+        let nested = DataTypes::row(vec![
+            DataField::with_field_id("x", DT::int(), None, 0),
+            DataField::with_field_id("y", DT::int(), None, 2),
+        ]);
+        let err = Schema::builder()
+            .with_columns(vec![
+                Column::new("a", DT::int()).with_id(0),
+                Column::new("b", nested).with_id(1),
+            ])
+            .build()
+            .unwrap_err();
+        assert!(err.to_string().contains("Duplicate field id 0"), "{err}");
+    }
+
+    #[test]
+    fn schema_rejects_partially_assigned_nested_field_ids() {
+        let nested = DataTypes::row(vec![DataField::new("x", DT::int(), None)]);
+        let err = Schema::builder()
+            .with_columns(vec![
+                Column::new("a", DT::int()).with_id(0),
+                Column::new("b", nested).with_id(1),
+            ])
+            .build()
+            .unwrap_err();
+        assert!(
+            err.to_string()
+                .contains("nested DataField ids are unassigned"),
+            "{err}"
+        );
+    }
+
+    #[test]
+    fn schema_preserves_nested_ids_with_gaps() {
+        // Gapped ids: f0=0, f1=1 (nested n0=6, n1=7, n2=8, n2.m1=11), f2=2 (nested n0=9, n1=10).
+        let inner_for_n2 = DataTypes::row(vec![DataField::with_field_id(
+            "m1",
+            DataTypes::tinyint(),
+            None,
+            11,
+        )]);
+        let f1_row = DataTypes::row(vec![
+            DataField::with_field_id("n0", DataTypes::tinyint(), None, 6),
+            DataField::with_field_id("n1", DataTypes::string(), None, 7),
+            DataField::with_field_id("n2", inner_for_n2, None, 8),
+        ]);
+        let f2_row = DataTypes::row(vec![
+            DataField::with_field_id("n0", DataTypes::tinyint(), None, 9),
+            DataField::with_field_id("n1", DataTypes::string(), None, 10),
+        ]);
+
+        let schema = Schema::builder()
+            .with_columns(vec![
+                Column::new("f0", DataTypes::string().as_non_nullable()).with_id(0),
+                Column::new("f1", f1_row).with_id(1),
+                Column::new("f2", f2_row).with_id(2),
+            ])
+            .build()
+            .unwrap();
+
+        let top_ids: Vec<i32> = schema.columns().iter().map(|c| c.id()).collect();
+        assert_eq!(top_ids, vec![0, 1, 2]);
+
+        fn row_fields(dt: &DataType) -> &[DataField] {
+            match dt {
+                DataType::Row(rt) => rt.fields(),
+                _ => panic!("not a Row"),
+            }
+        }
+        let f1_fields = row_fields(schema.columns()[1].data_type());
+        assert_eq!(f1_fields[0].field_id(), 6); // n0
+        assert_eq!(f1_fields[1].field_id(), 7); // n1
+        assert_eq!(f1_fields[2].field_id(), 8); // n2
+        let n2_fields = row_fields(f1_fields[2].data_type());
+        assert_eq!(n2_fields[0].field_id(), 11); // m1 — the "gap"
+
+        let f2_fields = row_fields(schema.columns()[2].data_type());
+        assert_eq!(f2_fields[0].field_id(), 9);
+        assert_eq!(f2_fields[1].field_id(), 10);
+
+        assert_eq!(schema.highest_field_id(), 11);
+    }
+
+    #[test]
+    fn schema_deserializes_legacy_json_without_column_ids() {
+        let legacy_json: Value = serde_json::from_str(
+            r#"{
+                "version": 1,
+                "columns": [
+                    {"name": "a", "data_type": {"type": "INTEGER", "nullable": false}, "comment": "first"},
+                    {"name": "b", "data_type": {"type": "STRING"}, "comment": "second"},
+                    {"name": "c", "data_type": {"type": "CHAR", "nullable": false, "length": 10}, "comment": "third"}
+                ],
+                "primary_key": ["a", "c"]
+            }"#,
+        )
+        .unwrap();
+
+        let schema = Schema::deserialize_json(&legacy_json).expect("legacy JSON must deserialize");
+        let ids: Vec<i32> = schema.columns().iter().map(|c| c.id()).collect();
+        assert_eq!(ids, vec![0, 1, 2], "missing IDs auto-assigned 0..N-1");
+        assert_eq!(schema.highest_field_id(), 2);
+        assert!(schema.primary_key().is_some());
+    }
+
+    #[test]
+    fn empty_schema_has_minus_one_highest_field_id() {
+        let s = Schema::builder().build().unwrap();
+        assert_eq!(s.highest_field_id(), -1);
+        let json = s.serialize_json().unwrap();
+        assert_eq!(
+            json.get("highest_field_id").and_then(|v| v.as_i64()),
+            Some(-1)
+        );
+    }
+
+    #[test]
+    fn reassign_field_ids_walks_array_map_row() {
+        let dt = DataTypes::array(DataTypes::row(vec![
+            DataField::new("a", DataTypes::int(), None),
+            DataField::new("b", DataTypes::string(), None),
+        ]));
+        let mut counter = -1_i32;
+        let assigned = reassign_field_ids(&dt, &mut counter);
+        match assigned {
+            DataType::Array(at) => match at.get_element_type() {
+                DataType::Row(rt) => {
+                    assert_eq!(rt.fields()[0].field_id(), 0);
+                    assert_eq!(rt.fields()[1].field_id(), 1);
+                }
+                _ => panic!("expected Row"),
+            },
+            _ => panic!("expected Array"),
+        }
+        assert_eq!(counter, 1);
+
+        let dt = DataType::Map(MapType::new(
+            DataTypes::int(),
+            DataTypes::row(vec![DataField::new("x", DataTypes::int(), None)]),
+        ));
+        let mut counter = -1_i32;
+        let assigned = reassign_field_ids(&dt, &mut counter);
+        let value_type = match &assigned {
+            DataType::Map(mt) => mt.value_type(),
+            _ => panic!("expected Map"),
+        };
+        match value_type {
+            DataType::Row(rt) => assert_eq!(rt.fields()[0].field_id(), 0),
+            _ => panic!("expected Row"),
+        }
+        assert_eq!(counter, 0);
+    }
+
     #[test]
     fn test_datatype_json_serde() {
         let data_types = vec![
diff --git a/fluss-rust/crates/fluss/src/metadata/table.rs b/fluss-rust/crates/fluss/src/metadata/table.rs
index ebaf085e21..390bdbfcc9 100644
--- a/fluss-rust/crates/fluss/src/metadata/table.rs
+++ b/fluss-rust/crates/fluss/src/metadata/table.rs
@@ -19,7 +19,9 @@ use crate::compression::ArrowCompressionInfo;
 use crate::error::Error::IllegalArgument;
 use crate::error::{Error, Result};
 use crate::metadata::DataLakeFormat;
-use crate::metadata::datatype::{DataField, DataType, RowType};
+use crate::metadata::datatype::{
+    DataField, DataType, RowType, UNASSIGNED_FIELD_ID, reassign_field_ids,
+};
 use crate::{BucketId, PartitionId, TableId};
 use core::fmt;
 use serde::{Deserialize, Serialize};
@@ -112,12 +114,55 @@ impl PrimaryKey {
     }
 }
 
+fn collect_field_id_state(data_type: &DataType, max_id: &mut i32, has_unassigned: &mut bool) {
+    match data_type {
+        DataType::Row(rt) => {
+            for f in rt.fields() {
+                if f.field_id == UNASSIGNED_FIELD_ID {
+                    *has_unassigned = true;
+                } else {
+                    *max_id = (*max_id).max(f.field_id);
+                }
+                collect_field_id_state(&f.data_type, max_id, has_unassigned);
+            }
+        }
+        DataType::Array(at) => {
+            collect_field_id_state(at.get_element_type(), max_id, has_unassigned);
+        }
+        DataType::Map(mt) => {
+            collect_field_id_state(mt.key_type(), max_id, has_unassigned);
+            collect_field_id_state(mt.value_type(), max_id, has_unassigned);
+        }
+        _ => {}
+    }
+}
+
+fn collect_nested_field_ids(data_type: &DataType, ids: &mut Vec<i32>) {
+    match data_type {
+        DataType::Row(rt) => {
+            for f in rt.fields() {
+                if f.field_id != UNASSIGNED_FIELD_ID {
+                    ids.push(f.field_id);
+                }
+                collect_nested_field_ids(&f.data_type, ids);
+            }
+        }
+        DataType::Array(at) => collect_nested_field_ids(at.get_element_type(), ids),
+        DataType::Map(mt) => {
+            collect_nested_field_ids(mt.key_type(), ids);
+            collect_nested_field_ids(mt.value_type(), ids);
+        }
+        _ => {}
+    }
+}
+
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
 pub struct Schema {
     columns: Vec<Column>,
     primary_key: Option<PrimaryKey>,
     row_type: RowType,
     auto_increment_col_names: Vec<String>,
+    highest_field_id: i32,
 }
 
 impl Schema {
@@ -167,6 +212,10 @@ impl Schema {
     pub fn auto_increment_col_names(&self) -> &Vec<String> {
         &self.auto_increment_col_names
     }
+
+    pub fn highest_field_id(&self) -> i32 {
+        self.highest_field_id
+    }
 }
 
 /// A schema together with its server-assigned version id.
@@ -278,9 +327,9 @@ impl SchemaBuilder {
 
     pub fn build(&self) -> Result<Schema> {
         let columns = Self::normalize_columns(&self.columns, self.primary_key.as_ref())?;
-        let columns = Self::assign_column_ids(columns)?;
+        let (columns_with_ids, highest_field_id) = Self::assign_all_field_ids(columns)?;
 
-        let column_names: HashSet<_> = columns.iter().map(|c| &c.name).collect();
+        let column_names: HashSet<_> = columns_with_ids.iter().map(|c| &c.name).collect();
         for auto_inc_col in &self.auto_increment_col_names {
             if !column_names.contains(auto_inc_col) {
                 return Err(IllegalArgument {
@@ -291,26 +340,115 @@ impl SchemaBuilder {
             }
         }
 
-        let data_fields = columns
+        let data_fields = columns_with_ids
             .iter()
             .map(|c| DataField {
                 name: c.name.clone(),
                 data_type: c.data_type.clone(),
                 description: c.comment.clone(),
+                field_id: c.id,
             })
             .collect();
 
         Ok(Schema {
-            columns,
+            columns: columns_with_ids,
             primary_key: self.primary_key.clone(),
             row_type: RowType::new(data_fields),
             auto_increment_col_names: self.auto_increment_col_names.clone(),
+            highest_field_id,
         })
     }
 
+    fn assign_all_field_ids(columns: Vec<Column>) -> Result<(Vec<Column>, i32)> {
+        let with_top_id = columns.iter().filter(|c| c.id != UNKNOWN_COLUMN_ID).count();
+        let none_set = with_top_id == 0;
+        let all_top_set = with_top_id == columns.len();
+
+        if !none_set && !all_top_set {
+            return Err(IllegalArgument {
+                message: "All columns must have an id assigned, or none of them must.".to_string(),
+            });
+        }
+
+        let mut max_nested_id = -1_i32;
+        let mut has_unassigned_nested = false;
+        for c in &columns {
+            collect_field_id_state(&c.data_type, &mut max_nested_id, &mut has_unassigned_nested);
+        }
+
+        if all_top_set && !has_unassigned_nested {
+            let mut seen: HashSet<i32> = HashSet::new();
+            let mut max_id = -1_i32;
+            for col in &columns {
+                if col.id < 0 {
+                    return Err(IllegalArgument {
+                        message: format!(
+                            "Column '{}' has invalid id {}; ids must be non-negative",
+                            col.name, col.id
+                        ),
+                    });
+                }
+                if !seen.insert(col.id) {
+                    return Err(IllegalArgument {
+                        message: format!("Duplicate field id {} in schema", col.id),
+                    });
+                }
+                max_id = max_id.max(col.id);
+
+                let mut nested_ids = Vec::new();
+                collect_nested_field_ids(&col.data_type, &mut nested_ids);
+                for id in nested_ids {
+                    if id < 0 {
+                        return Err(IllegalArgument {
+                            message: format!(
+                                "Nested DataField in column '{}' has invalid id {}; ids must be non-negative",
+                                col.name, id
+                            ),
+                        });
+                    }
+                    if !seen.insert(id) {
+                        return Err(IllegalArgument {
+                            message: format!(
+                                "Duplicate field id {} in schema (column '{}')",
+                                id, col.name
+                            ),
+                        });
+                    }
+                }
+            }
+            max_id = max_id.max(max_nested_id);
+            return Ok((columns, max_id));
+        }
+
+        if all_top_set && has_unassigned_nested {
+            return Err(IllegalArgument {
+                message: "Top-level column ids are set but some nested DataField ids are unassigned; reassign all or none."
+                    .to_string(),
+            });
+        }
+
+        let mut counter: i32 = -1;
+        let new_columns: Vec<Column> = columns
+            .into_iter()
+            .map(|c| {
+                counter += 1;
+                let id = counter;
+                let new_data_type = reassign_field_ids(&c.data_type, &mut counter);
+                Column {
+                    name: c.name,
+                    data_type: new_data_type,
+                    comment: c.comment,
+                    id,
+                }
+            })
+            .collect();
+        Ok((new_columns, counter))
+    }
+
     /// All-or-none: preserve ids if every column has one, auto-assign
     /// 0..N-1 if none do, error on mixed input. When preserving ids,
     /// also reject duplicates and negative-but-not-sentinel values.
+    #[allow(dead_code)]
     fn assign_column_ids(columns: Vec<Column>) -> Result<Vec<Column>> {
         let with_id = columns.iter().filter(|c| c.id != UNKNOWN_COLUMN_ID).count();
         if with_id == 0 {
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index d03f1454d2..9f1a97840d 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -20,10 +20,10 @@ use crate::compression::{
     ArrowCompressionInfo, ArrowCompressionRatioEstimator, ArrowCompressionType,
 };
 use crate::error::{Error, Result};
-use crate::metadata::{DataType, RowType};
+use crate::metadata::{DataField, DataType, RowType};
 use crate::record::{ChangeType, ScanRecord};
 use crate::row::column_writer::{ColumnWriter, round_up_to_8};
-use crate::row::{ColumnarRow, InternalRow};
+use crate::row::{ColumnarRow, InternalRow, arrow_row_column_indices, fluss_row_column_indices};
 use arrow::array::{ArrayBuilder, ArrayRef};
 use arrow::{
     array::RecordBatch,
@@ -992,7 +992,10 @@ impl LogRecordBatch {
         let data = &self.data[RECORDS_OFFSET..];
 
         let record_batch = read_context.record_batch(data)?;
-        let arrow_reader = ArrowReader::new(Arc::new(record_batch));
+        let arrow_reader = ArrowReader::new_with_fluss_row_type(
+            Arc::new(record_batch),
+            read_context.fluss_row_type().cloned(),
+        );
         let log_record_iterator = LogRecordIterator::Arrow(ArrowLogRecordIterator {
             reader: arrow_reader,
             base_offset: self.base_log_offset(),
@@ -1015,7 +1018,10 @@ impl LogRecordBatch {
         let log_record_iterator = match record_batch {
             None => LogRecordIterator::empty(),
             Some(record_batch) => {
-                let arrow_reader = ArrowReader::new(Arc::new(record_batch));
+                let arrow_reader = ArrowReader::new_with_fluss_row_type(
+                    Arc::new(record_batch),
+                    read_context.fluss_row_type().cloned(),
+                );
                 LogRecordIterator::Arrow(ArrowLogRecordIterator {
                     reader: arrow_reader,
                     base_offset: self.base_log_offset(),
@@ -1216,7 +1222,7 @@ pub fn to_arrow_type(fluss_type: &DataType) -> Result<ArrowDataType> {
         DataType::Array(array_type) => ArrowDataType::List(
             Field::new_list_field(
                 to_arrow_type(array_type.get_element_type())?,
-                fluss_type.is_nullable(),
+                array_type.get_element_type().is_nullable(),
             )
             .into(),
         ),
@@ -1310,6 +1316,19 @@ pub(crate) fn from_arrow_type(arrow_type: &ArrowDataType) -> Result<DataType> {
             }
         }
         ArrowDataType::List(field) => DataTypes::array(from_arrow_type(field.data_type())?),
+        ArrowDataType::Struct(fields) => {
+            let row_fields: Result<Vec<DataField>> = fields
+                .iter()
+                .map(|f| {
+                    let mut dt = from_arrow_type(f.data_type())?;
+                    if !f.is_nullable() {
+                        dt = dt.as_non_nullable();
+                    }
+                    Ok(DataField::new(f.name(), dt, None))
+                })
+                .collect();
+            DataTypes::row(row_fields?)
+        }
         other => {
             return Err(Error::IllegalArgument {
                 message: format!("Cannot convert Arrow type to Fluss type: {other:?}"),
@@ -1324,6 +1343,7 @@ pub struct ReadContext {
     full_schema: SchemaRef,
     projection: Option<Projection>,
     is_from_remote: bool,
+    fluss_row_type: Option<Arc<RowType>>,
 }
 
 #[derive(Clone)]
@@ -1343,9 +1363,19 @@ impl ReadContext {
             full_schema: arrow_schema,
             projection: None,
             is_from_remote,
+            fluss_row_type: None,
         }
     }
 
+    pub fn with_fluss_row_type(mut self, fluss_row_type: Arc<RowType>) -> ReadContext {
+        self.fluss_row_type = Some(fluss_row_type);
+        self
+    }
+
+    pub fn fluss_row_type(&self) -> Option<&Arc<RowType>> {
+        self.fluss_row_type.as_ref()
+    }
+
     pub fn with_projection_pushdown(
         arrow_schema: SchemaRef,
         projected_fields: Vec<usize>,
@@ -1414,6 +1444,7 @@ impl ReadContext {
             full_schema: arrow_schema,
             projection: Some(project),
             is_from_remote,
+            fluss_row_type: None,
         })
     }
 
@@ -1604,11 +1635,33 @@ impl Iterator for ArrowLogRecordIterator {
 
 pub struct ArrowReader {
     record_batch: Arc<RecordBatch>,
+    fluss_row_type: Option<Arc<RowType>>,
+    row_column_indices: Arc<[usize]>,
 }
 
 impl ArrowReader {
     pub fn new(record_batch: Arc<RecordBatch>) -> Self {
-        ArrowReader { record_batch }
+        let row_column_indices = arrow_row_column_indices(&record_batch);
+        ArrowReader {
+            record_batch,
+            fluss_row_type: None,
+            row_column_indices,
+        }
+    }
+
+    pub fn new_with_fluss_row_type(
+        record_batch: Arc<RecordBatch>,
+        fluss_row_type: Option<Arc<RowType>>,
+    ) -> Self {
+        let row_column_indices = match &fluss_row_type {
+            Some(rt) => fluss_row_column_indices(rt),
+            None => arrow_row_column_indices(&record_batch),
+        };
+        ArrowReader {
+            record_batch,
+            fluss_row_type,
+            row_column_indices,
+        }
     }
 
     pub fn row_count(&self) -> usize {
@@ -1616,7 +1669,12 @@ impl ArrowReader {
     }
 
     pub fn read(&self, row_id: usize) -> ColumnarRow {
-        ColumnarRow::new_with_row_id(self.record_batch.clone(), row_id)
+        ColumnarRow::with_indices(
+            self.record_batch.clone(),
+            row_id,
+            self.fluss_row_type.clone(),
+            self.row_column_indices.clone(),
+        )
     }
 }
 pub struct MyVec<T>(pub StreamReader<T>);
diff --git a/fluss-rust/crates/fluss/src/record/mod.rs b/fluss-rust/crates/fluss/src/record/mod.rs
index 8438b16d54..522fb03bbe 100644
--- a/fluss-rust/crates/fluss/src/record/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/mod.rs
@@ -249,7 +249,7 @@ mod tests {
         let schema = Arc::new(Schema::new(vec![Field::new("v", DataType::Int32, false)]));
         let batch = RecordBatch::try_new(schema, vec![Arc::new(Int32Array::from(values))])
             .expect("record batch");
-        ColumnarRow::new_with_row_id(Arc::new(batch), row_id)
+        ColumnarRow::new(Arc::new(batch), row_id, None)
     }
 
     #[test]
diff --git a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
index fd7da4c9e5..7192ee57ab 100644
--- a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
@@ -19,7 +19,9 @@ use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::metadata::{DataType, RowType};
 use crate::row::Datum;
+use crate::row::Decimal;
 use crate::row::binary::BinaryRowFormat;
+use crate::row::datum::{TimestampLtz, TimestampNtz};
 
 /// Writer to write a composite data format, like row, array,
 #[allow(dead_code)]
@@ -52,7 +54,7 @@ pub trait BinaryWriter {
 
     fn write_binary(&mut self, bytes: &[u8], length: usize);
 
-    fn write_decimal(&mut self, value: &crate::row::Decimal, precision: u32);
+    fn write_decimal(&mut self, value: &Decimal, precision: u32);
 
     /// Writes a TIME value.
     ///
@@ -63,9 +65,9 @@ pub trait BinaryWriter {
     /// currently vary by precision.
     fn write_time(&mut self, value: i32, precision: u32);
 
-    fn write_timestamp_ntz(&mut self, value: &crate::row::datum::TimestampNtz, precision: u32);
+    fn write_timestamp_ntz(&mut self, value: &TimestampNtz, precision: u32);
 
-    fn write_timestamp_ltz(&mut self, value: &crate::row::datum::TimestampLtz, precision: u32);
+    fn write_timestamp_ltz(&mut self, value: &TimestampLtz, precision: u32);
 
     fn write_array(&mut self, value: &[u8]);
 
@@ -136,7 +138,36 @@ pub enum InnerValueWriter {
     TimestampNtz(u32), // precision
     TimestampLtz(u32), // precision
     Array,
-    Row(RowType),
+    Row(NestedRowWriter),
+}
+
+#[derive(Debug)]
+pub struct NestedRowWriter {
+    field_writers: Vec<InnerValueWriter>,
+    field_nullable: Vec<bool>,
+}
+
+impl NestedRowWriter {
+    fn from_row_type(row_type: &RowType) -> Result<Self> {
+        let fields = row_type.fields();
+        let mut field_writers = Vec::with_capacity(fields.len());
+        let mut field_nullable = Vec::with_capacity(fields.len());
+        for field in fields {
+            field_writers.push(InnerValueWriter::create_inner_value_writer(
+                field.data_type(),
+                None,
+            )?);
+            field_nullable.push(field.data_type().is_nullable());
+        }
+        Ok(Self {
+            field_writers,
+            field_nullable,
+        })
+    }
+
+    fn field_count(&self) -> usize {
+        self.field_writers.len()
+    }
 }
 
 /// Accessor for writing the fields/elements of a binary writer during runtime, the
@@ -176,7 +207,9 @@ impl InnerValueWriter {
                 Ok(InnerValueWriter::TimestampLtz(t.precision()))
             }
             DataType::Array(_) => Ok(InnerValueWriter::Array),
-            DataType::Row(row_type) => Ok(InnerValueWriter::Row(row_type.clone())),
+            DataType::Row(row_type) => Ok(InnerValueWriter::Row(NestedRowWriter::from_row_type(
+                row_type,
+            )?)),
             _ => unimplemented!(
                 "ValueWriter for DataType {:?} is currently not implemented",
                 data_type
@@ -242,22 +275,31 @@ impl InnerValueWriter {
             (InnerValueWriter::Array, Datum::Array(arr)) => {
                 writer.write_array(arr.as_bytes());
             }
-            (InnerValueWriter::Row(row_type), Datum::Row(inner_row)) => {
+            (InnerValueWriter::Row(nested_writer), Datum::Row(inner_row)) => {
                 use crate::row::compacted::CompactedRowWriter;
-                let field_count = row_type.fields().len();
+                let field_count = nested_writer.field_count();
+                if inner_row.values.len() != field_count {
+                    return Err(IllegalArgument {
+                        message: format!(
+                            "nested row arity mismatch: schema has {} fields, got {}",
+                            field_count,
+                            inner_row.values.len(),
+                        ),
+                    });
+                }
                 let mut nested = CompactedRowWriter::new(field_count);
-                for (i, field) in row_type.fields().iter().enumerate() {
-                    let datum = &inner_row.values[i];
+                for (i, datum) in inner_row.values.iter().enumerate() {
                     if datum.is_null() {
-                        if field.data_type.is_nullable() {
-                            nested.set_null_at(i);
+                        if !nested_writer.field_nullable[i] {
+                            return Err(IllegalArgument {
+                                message: format!(
+                                    "nested row field {i} is non-nullable but received null",
+                                ),
+                            });
                         }
+                        nested.set_null_at(i);
                     } else {
-                        let vw =
-                            InnerValueWriter::create_inner_value_writer(&field.data_type, None)
-                                .expect("create_inner_value_writer failed for nested row field");
-                        vw.write_value(&mut nested, i, datum)
-                            .expect("write_value failed for nested row field");
+                        nested_writer.field_writers[i].write_value(&mut nested, i, datum)?;
                     }
                 }
                 writer.write_bytes(nested.buffer());
diff --git a/fluss-rust/crates/fluss/src/row/binary_array.rs b/fluss-rust/crates/fluss/src/row/binary_array.rs
index 3383a366df..d0e8c9a528 100644
--- a/fluss-rust/crates/fluss/src/row/binary_array.rs
+++ b/fluss-rust/crates/fluss/src/row/binary_array.rs
@@ -26,9 +26,13 @@
 
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::DataType;
+use crate::metadata::{DataType, RowType};
 use crate::row::Decimal;
+use crate::row::InternalRow;
+use crate::row::binary::{BinaryRowFormat, ValueWriter};
+use crate::row::compacted::{CompactedRow, CompactedRowWriter, calculate_bit_set_width_in_bytes};
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
+use crate::row::field_getter::FieldGetter;
 use bytes::Bytes;
 use serde::Serialize;
 use std::fmt;
@@ -418,6 +422,48 @@ impl FlussArray {
         let (start, len) = self.read_var_len_span(pos)?;
         FlussArray::from_owned_bytes(self.data.slice(start..start + len))
     }
+
+    /// Returns the element at `pos` viewed as a `CompactedRow` laid out per `row_type`, or an
+    /// `IllegalArgument` error when the stored bytes are shorter than the row's header.
+    pub fn get_row<'a>(&'a self, pos: usize, row_type: &'a RowType) -> Result<CompactedRow<'a>> {
+        let row_bytes = self.read_var_len_bytes(pos)?;
+        let field_count = row_type.fields().len();
+        let min_len = calculate_bit_set_width_in_bytes(field_count);
+        if row_bytes.len() < min_len {
+            return Err(IllegalArgument {
+                message: format!(
+                    "FlussArray row bytes at position {} are too short for row type with {} fields: \
+                     need at least {} header bytes, got {}",
+                    pos, field_count, min_len, row_bytes.len()
+                ),
+            });
+        }
+        Ok(CompactedRow::from_bytes(row_type, row_bytes))
+    }
+}
+
+struct RowFieldAccessor {
+    getter: FieldGetter, // reads this field's value out of a source `InternalRow`
+    writer: ValueWriter, // value writer created for the compacted row format
+    nullable: bool, // `is_nullable()` of the field's data type
+}
+
+/// Builds one accessor per field of `row_type`: a getter for reading the field plus a
+/// compacted-format value writer. Fails if no writer can be created for a field type.
+fn build_row_accessors(row_type: &RowType) -> Result<Vec<RowFieldAccessor>> {
+    let fields = row_type.fields();
+    let mut accessors = Vec::with_capacity(fields.len());
+    for (index, field) in fields.iter().enumerate() {
+        let getter = FieldGetter::create(field.data_type(), index);
+        let writer = ValueWriter::create_value_writer(
+            field.data_type(),
+            Some(&BinaryRowFormat::Compacted),
+        )?;
+        // `write_row` consults this flag to reject nulls in non-nullable fields.
+        let nullable = field.data_type().is_nullable();
+        accessors.push(RowFieldAccessor { getter, writer, nullable });
+    }
+    Ok(accessors)
 }
 
 /// Writer for building a `FlussArray` element by element.
@@ -429,17 +475,34 @@ pub struct FlussArrayWriter {
     element_size: usize,
     cursor: usize,
     num_elements: usize,
+    // Some(_) only when constructed with a DataType::Row(_) element type.
+    row_accessors: Option<Vec<RowFieldAccessor>>,
 }
 
 impl FlussArrayWriter {
     /// Creates a new writer for an array with `num_elements` elements of the given element type.
     pub fn new(num_elements: usize, element_type: &DataType) -> Self {
         let element_size = calculate_fix_length_part_size(element_type);
-        Self::with_element_size(num_elements, element_size)
+        let row_accessors = match element_type {
+            DataType::Row(rt) => Some(
+                build_row_accessors(rt)
+                    .expect("ROW element type contains a field with no ValueWriter"),
+            ),
+            _ => None,
+        };
+        Self::with_state(num_elements, element_size, row_accessors)
     }
 
-    /// Creates a new writer with an explicit element size (in bytes).
+    /// Creates a new writer with an explicit element size (in bytes). Does not support `write_row`.
     pub fn with_element_size(num_elements: usize, element_size: usize) -> Self {
+        Self::with_state(num_elements, element_size, None)
+    }
+
+    fn with_state(
+        num_elements: usize,
+        element_size: usize,
+        row_accessors: Option<Vec<RowFieldAccessor>>,
+    ) -> Self {
         let header_in_bytes = calculate_header_in_bytes(num_elements);
         let fixed_size = round_to_nearest_word(header_in_bytes + element_size * num_elements);
         let mut data = vec![0u8; fixed_size];
@@ -454,6 +517,7 @@ impl FlussArrayWriter {
             element_size,
             cursor: fixed_size,
             num_elements,
+            row_accessors,
         }
     }
 
@@ -608,6 +672,26 @@ impl FlussArrayWriter {
         self.write_bytes_to_var_len_part(pos, value.as_bytes());
     }
 
+    /// Writes a nested row at `pos`; the writer must come from [`new`](Self::new) with a ROW type.
+    pub fn write_row(&mut self, pos: usize, row: &dyn InternalRow) -> Result<()> {
+        let Some(accessors) = self.row_accessors.as_ref() else {
+            return Err(IllegalArgument {
+                message: "write_row requires a DataType::Row element type".to_string(),
+            });
+        };
+        let mut row_writer = CompactedRowWriter::new(accessors.len());
+        for (i, field) in accessors.iter().enumerate() {
+            if !field.nullable && row.is_null_at(i)? {
+                return Err(IllegalArgument {
+                    message: format!("nested row field {i} is non-nullable but received null"),
+                });
+            }
+            field.writer.write_value(&mut row_writer, i, &field.getter.get_field(row)?)?;
+        }
+        self.write_bytes_to_var_len_part(pos, row_writer.buffer());
+        Ok(())
+    }
+
     /// Finalizes the writer and returns the completed FlussArray.
     pub fn complete(self) -> Result<FlussArray> {
         let mut data = self.data;
@@ -621,7 +705,7 @@ impl FlussArrayWriter {
     }
 }
 
-impl crate::row::InternalRow for FlussArray {
+impl InternalRow for FlussArray {
     fn get_field_count(&self) -> usize {
         self.size()
     }
@@ -693,7 +777,10 @@ impl crate::row::InternalRow for FlussArray {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::DataTypes;
+    use crate::metadata::{DataField, DataTypes};
+    use crate::row::binary::BinaryWriter as BinaryWriterTrait;
+    use crate::row::compacted::CompactedRowWriter;
+    use crate::row::{Datum, GenericRow};
 
     #[test]
     fn test_header_calculation() {
@@ -843,18 +930,224 @@ mod tests {
         assert_eq!(array.get_double(1).unwrap(), -4.56);
     }
 
+    #[test]
+    fn test_round_trip_array_of_row() {
+        let row_type_owned = DataTypes::row(vec![
+            DataField::new("x", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+        let element_type = row_type_owned.clone();
+        let row_type = match &row_type_owned {
+            DataType::Row(rt) => rt,
+            _ => unreachable!(),
+        };
+
+        // Build array<row<int, string>> with two rows: (42, "hello"), (-1, null)
+        let mut writer = FlussArrayWriter::new(2, &element_type);
+
+        let mut r0 = GenericRow::new(2);
+        r0.set_field(0, 42_i32);
+        r0.set_field(1, "hello");
+        writer.write_row(0, &r0).expect("write row 0");
+
+        let mut r1 = GenericRow::new(2);
+        r1.set_field(0, -1_i32);
+        r1.set_field(1, Datum::Null);
+        writer.write_row(1, &r1).expect("write row 1");
+
+        let array = writer.complete().unwrap();
+        assert_eq!(array.size(), 2);
+
+        let row0 = array.get_row(0, row_type).expect("get row 0");
+        assert_eq!(row0.get_int(0).unwrap(), 42);
+        assert_eq!(row0.get_string(1).unwrap(), "hello");
+
+        let row1 = array.get_row(1, row_type).expect("get row 1");
+        assert_eq!(row1.get_int(0).unwrap(), -1);
+        assert!(row1.is_null_at(1).unwrap());
+    }
+
+    #[test]
+    fn test_get_row_rejects_oversized_row_type() {
+        let small_row_type_owned =
+            DataTypes::row(vec![DataField::new("n", DataTypes::int(), None)]);
+        let small_row_type = match &small_row_type_owned {
+            DataType::Row(rt) => rt,
+            _ => unreachable!(),
+        };
+        let mut writer = FlussArrayWriter::new(1, &small_row_type_owned);
+        let mut row = GenericRow::new(1);
+        row.set_field(0, 7_i32);
+        writer.write_row(0, &row).unwrap();
+        let array = writer.complete().unwrap();
+
+        // Decoding the single-field element with a 100-field row type must fail the
+        // header-size check in `get_row` instead of producing a bogus row view.
+        let huge_owned = DataTypes::row(
+            (0..100)
+                .map(|i| DataField::new(format!("f{i}"), DataTypes::int(), None))
+                .collect(),
+        );
+        let huge_row_type = match &huge_owned {
+            DataType::Row(rt) => rt,
+            _ => unreachable!(),
+        };
+        match array.get_row(0, huge_row_type) {
+            Err(e) => assert!(
+                e.to_string().contains("too short for row type"),
+                "unexpected error: {e}"
+            ),
+            Ok(_) => panic!("expected oversized row_type to be rejected"),
+        }
+
+        // The row type the element was written with still decodes it.
+        let recovered = array.get_row(0, small_row_type).unwrap();
+        assert_eq!(recovered.get_int(0).unwrap(), 7);
+    }
+
+    #[test]
+    fn test_round_trip_array_of_row_with_nullable_element() {
+        let row_type_owned = DataTypes::row(vec![DataField::new("n", DataTypes::int(), None)]);
+        let element_type = row_type_owned.clone();
+        let row_type = match &row_type_owned {
+            DataType::Row(rt) => rt,
+            _ => unreachable!(),
+        };
+
+        let mut writer = FlussArrayWriter::new(3, &element_type);
+
+        let mut r0 = GenericRow::new(1);
+        r0.set_field(0, 7_i32);
+        writer.write_row(0, &r0).expect("write row 0");
+
+        writer.set_null_at(1);
+
+        let mut r2 = GenericRow::new(1);
+        r2.set_field(0, 8_i32);
+        writer.write_row(2, &r2).expect("write row 2");
+
+        let array = writer.complete().unwrap();
+
+        let row0 = array.get_row(0, row_type).unwrap();
+        assert_eq!(row0.get_int(0).unwrap(), 7);
+        assert!(array.is_null_at(1));
+        let row2 = array.get_row(2, row_type).unwrap();
+        assert_eq!(row2.get_int(0).unwrap(), 8);
+
+        let strict_row_type_owned = DataTypes::row(vec![DataField::new(
+            "n",
+            DataTypes::int().as_non_nullable(),
+            None,
+        )]);
+        let mut bad_writer = FlussArrayWriter::new(1, &strict_row_type_owned);
+        let mut bad = GenericRow::new(1);
+        bad.set_field(0, Datum::Null);
+        let err = bad_writer.write_row(0, &bad).unwrap_err();
+        assert!(
+            err.to_string().contains("non-nullable"),
+            "unexpected error: {err}"
+        );
+    }
+
+    #[test]
+    fn test_round_trip_array_of_row_of_array_of_string() {
+        let inner_array_type = DataTypes::array(DataTypes::string());
+        let inner_row_type_owned =
+            DataTypes::row(vec![DataField::new("tags", inner_array_type.clone(), None)]);
+        let inner_row_type = match &inner_row_type_owned {
+            DataType::Row(rt) => rt,
+            _ => unreachable!(),
+        };
+
+        let mut tags1 = FlussArrayWriter::new(2, &DataTypes::string());
+        tags1.write_string(0, "alpha");
+        tags1.write_string(1, "beta");
+        let tags1 = tags1.complete().unwrap();
+        let mut row1 = GenericRow::new(1);
+        row1.set_field(0, tags1);
+
+        let mut tags2 = FlussArrayWriter::new(3, &DataTypes::string());
+        tags2.write_string(0, "x");
+        tags2.set_null_at(1);
+        tags2.write_string(2, "z");
+        let tags2 = tags2.complete().unwrap();
+        let mut row2 = GenericRow::new(1);
+        row2.set_field(0, tags2);
+
+        let mut outer_writer = FlussArrayWriter::new(2, &inner_row_type_owned);
+        outer_writer.write_row(0, &row1).unwrap();
+        outer_writer.write_row(1, &row2).unwrap();
+        let outer = outer_writer.complete().unwrap();
+
+        assert_eq!(outer.size(), 2);
+
+        let r0 = outer.get_row(0, inner_row_type).unwrap();
+        let r0_tags = r0.get_array(0).unwrap();
+        assert_eq!(r0_tags.size(), 2);
+        assert_eq!(r0_tags.get_string(0).unwrap(), "alpha");
+        assert_eq!(r0_tags.get_string(1).unwrap(), "beta");
+
+        let r1 = outer.get_row(1, inner_row_type).unwrap();
+        let r1_tags = r1.get_array(0).unwrap();
+        assert_eq!(r1_tags.size(), 3);
+        assert_eq!(r1_tags.get_string(0).unwrap(), "x");
+        assert!(r1_tags.is_null_at(1));
+        assert_eq!(r1_tags.get_string(2).unwrap(), "z");
+    }
+
+    #[test]
+    fn test_round_trip_row_of_array_of_row() {
+        let inner_row_type_owned =
+            DataTypes::row(vec![DataField::new("n", DataTypes::int(), None)]);
+        let inner_array_type = DataTypes::array(inner_row_type_owned.clone());
+        let outer_row_type_owned =
+            DataTypes::row(vec![DataField::new("arr", inner_array_type.clone(), None)]);
+
+        let outer_row_type = match &outer_row_type_owned {
+            DataType::Row(rt) => rt,
+            _ => unreachable!(),
+        };
+        let inner_row_type = match &inner_row_type_owned {
+            DataType::Row(rt) => rt,
+            _ => unreachable!(),
+        };
+
+        let mut arr_writer = FlussArrayWriter::new(2, &inner_row_type_owned);
+        let mut r0 = GenericRow::new(1);
+        r0.set_field(0, 1_i32);
+        arr_writer.write_row(0, &r0).unwrap();
+        let mut r1 = GenericRow::new(1);
+        r1.set_field(0, 2_i32);
+        arr_writer.write_row(1, &r1).unwrap();
+        let inner_arr = arr_writer.complete().unwrap();
+
+        let mut outer = GenericRow::new(1);
+        outer.set_field(0, inner_arr.clone());
+
+        let mut writer = CompactedRowWriter::new(1);
+        writer.write_array(inner_arr.as_bytes());
+        let bytes = writer.to_bytes();
+
+        let outer_compacted = CompactedRow::from_bytes(outer_row_type, &bytes);
+        let recovered_arr = outer_compacted.get_array(0).unwrap();
+        assert_eq!(recovered_arr.size(), 2);
+
+        let recovered_r0 = recovered_arr.get_row(0, inner_row_type).unwrap();
+        assert_eq!(recovered_r0.get_int(0).unwrap(), 1);
+        let recovered_r1 = recovered_arr.get_row(1, inner_row_type).unwrap();
+        assert_eq!(recovered_r1.get_int(0).unwrap(), 2);
+    }
+
     #[test]
     fn test_round_trip_nested_array() {
         let inner_type = DataTypes::int();
         let outer_type = DataTypes::array(DataTypes::int());
 
-        // Build inner array [1, 2]
         let mut inner_writer = FlussArrayWriter::new(2, &inner_type);
         inner_writer.write_int(0, 1);
         inner_writer.write_int(1, 2);
         let inner_array = inner_writer.complete().unwrap();
 
-        // Build outer array containing the inner array
         let mut outer_writer = FlussArrayWriter::new(1, &outer_type);
         outer_writer.write_array(0, &inner_array);
         let outer_array = outer_writer.complete().unwrap();
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 95cd3395c2..5db1cd5073 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -17,11 +17,17 @@
 
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::row::{GenericRow, InternalRow};
+use crate::metadata::{DataType, RowType};
+use crate::record::from_arrow_type;
+use crate::row::binary_array::FlussArrayWriter;
 use crate::row::datum::{Date, Datum, Time, TimestampLtz, TimestampNtz};
+use crate::row::{Decimal, FlussArray, GenericRow, InternalRow};
 use arrow::array::{
-    Array, AsArray, BinaryArray, BooleanArray, FixedSizeBinaryArray, ListArray, RecordBatch,
-    StringArray,
+    Array, AsArray, BinaryArray, BooleanArray, Date32Array, Decimal128Array, FixedSizeBinaryArray,
+    Float32Array, Float64Array, Int8Array, Int16Array, Int32Array, Int64Array, ListArray,
+    RecordBatch, StringArray, StructArray, Time32MillisecondArray, Time32SecondArray,
+    Time64MicrosecondArray, Time64NanosecondArray, TimestampMicrosecondArray,
+    TimestampMillisecondArray, TimestampNanosecondArray, TimestampSecondArray,
 };
 use arrow::datatypes::{
     DataType as ArrowDataType, Date32Type, Decimal128Type, Float32Type, Float64Type, Int8Type,
@@ -35,31 +41,69 @@ use std::sync::Arc;
 pub struct ColumnarRow {
     record_batch: Arc<RecordBatch>,
     row_id: usize,
-    nested_rows: Vec<std::sync::OnceLock<GenericRow<'static>>>,
+    fluss_row_type: Option<Arc<RowType>>,
+    row_column_indices: Arc<[usize]>,
+    row_caches: Box<[std::sync::OnceLock<GenericRow<'static>>]>,
+}
+
+/// Collects the positions of the fields in `row_type` whose Fluss data type is
+/// `DataType::Row`, in ascending order.
+pub(crate) fn fluss_row_column_indices(row_type: &RowType) -> Arc<[usize]> {
+    let fields = row_type.fields();
+    (0..fields.len())
+        .filter(|&idx| matches!(fields[idx].data_type, DataType::Row(_)))
+        .collect()
+}
+
+/// Collects the positions of the columns in `batch` whose Arrow data type is
+/// `Struct`, in ascending order.
+pub(crate) fn arrow_row_column_indices(batch: &RecordBatch) -> Arc<[usize]> {
+    let columns = batch.columns();
+    (0..columns.len())
+        .filter(|&idx| matches!(columns[idx].data_type(), ArrowDataType::Struct(_)))
+        .collect()
+}
+
+fn make_row_caches(indices: &[usize]) -> Box<[std::sync::OnceLock<GenericRow<'static>>]> {
+    std::iter::repeat_with(std::sync::OnceLock::new).take(indices.len()).collect()
+}
 
 impl ColumnarRow {
-    pub fn new(batch: Arc<RecordBatch>) -> Self {
-        let num_cols = batch.num_columns();
-        ColumnarRow {
-            record_batch: batch,
-            row_id: 0,
-            nested_rows: (0..num_cols).map(|_| std::sync::OnceLock::new()).collect(),
-        }
+    pub fn new(
+        batch: Arc<RecordBatch>,
+        row_id: usize,
+        fluss_row_type: Option<Arc<RowType>>,
+    ) -> Self {
+        let row_column_indices = match &fluss_row_type {
+            Some(rt) => fluss_row_column_indices(rt),
+            None => arrow_row_column_indices(&batch),
+        };
+        Self::with_indices(batch, row_id, fluss_row_type, row_column_indices)
     }
 
-    pub fn new_with_row_id(bach: Arc<RecordBatch>, row_id: usize) -> Self {
-        let num_cols = bach.num_columns();
+    pub(crate) fn with_indices(
+        batch: Arc<RecordBatch>,
+        row_id: usize,
+        fluss_row_type: Option<Arc<RowType>>,
+        row_column_indices: Arc<[usize]>,
+    ) -> Self {
+        let row_caches = make_row_caches(&row_column_indices);
         ColumnarRow {
-            record_batch: bach,
+            record_batch: batch,
             row_id,
-            nested_rows: (0..num_cols).map(|_| std::sync::OnceLock::new()).collect(),
+            fluss_row_type,
+            row_column_indices,
+            row_caches,
         }
     }
 
+    pub fn fluss_row_type(&self) -> Option<&Arc<RowType>> {
+        self.fluss_row_type.as_ref()
+    }
+
     pub fn set_row_id(&mut self, row_id: usize) {
         self.row_id = row_id;
-        for lock in &mut self.nested_rows {
+        for lock in self.row_caches.iter_mut() {
             *lock = std::sync::OnceLock::new();
         }
     }
@@ -220,167 +264,161 @@ impl ColumnarRow {
             }),
         }
     }
+}
 
-    /// Extract a `GenericRow<'static>` from a column in the RecordBatch at the given row_id.
-    fn extract_struct_at(
-        batch: &RecordBatch,
-        pos: usize,
-        row_id: usize,
-    ) -> Result<GenericRow<'static>> {
-        let col = batch.column(pos);
-        Self::extract_struct_from_array(col.as_ref(), row_id)
+fn extract_struct_from_array(
+    array: &dyn Array,
+    row_id: usize,
+    row_type: Option<&RowType>,
+) -> Result<GenericRow<'static>> {
+    let sa = array
+        .as_any()
+        .downcast_ref::<StructArray>()
+        .ok_or_else(|| IllegalArgument {
+            message: format!("expected StructArray, got {:?}", array.data_type()),
+        })?;
+    if let Some(rt) = row_type
+        && rt.fields().len() != sa.num_columns()
+    {
+        return Err(IllegalArgument {
+            message: format!(
+                "Fluss RowType has {} fields but Arrow StructArray has {}",
+                rt.fields().len(),
+                sa.num_columns(),
+            ),
+        });
     }
+    let mut values = Vec::with_capacity(sa.num_columns());
+    for i in 0..sa.num_columns() {
+        let child = sa.column(i);
+        let fluss_type = row_type.map(|rt| &rt.fields()[i].data_type);
+        values.push(arrow_value_to_datum(child.as_ref(), row_id, fluss_type)?);
+    }
+    Ok(GenericRow { values })
+}
 
-    /// Recursively extract a `GenericRow<'static>` from a `StructArray` at row_id.
-    fn extract_struct_from_array(array: &dyn Array, row_id: usize) -> Result<GenericRow<'static>> {
-        use arrow::array::StructArray;
-        let sa = array
-            .as_any()
-            .downcast_ref::<StructArray>()
-            .ok_or_else(|| IllegalArgument {
-                message: format!("expected StructArray, got {:?}", array.data_type()),
-            })?;
-        let mut values = Vec::with_capacity(sa.num_columns());
-        for i in 0..sa.num_columns() {
-            let child = sa.column(i);
-            values.push(Self::arrow_value_to_datum(child.as_ref(), row_id)?);
-        }
-        Ok(GenericRow { values })
+fn arrow_value_to_datum(
+    array: &dyn Array,
+    row_id: usize,
+    fluss_type: Option<&DataType>,
+) -> Result<Datum<'static>> {
+    if array.is_null(row_id) {
+        return Ok(Datum::Null);
     }
 
-    /// Convert a single element at `row_id` in an Arrow array to a `Datum<'static>`.
-    fn arrow_value_to_datum(array: &dyn Array, row_id: usize) -> Result<Datum<'static>> {
-        use arrow::array::{
-            BooleanArray, Decimal128Array, Float32Array, Float64Array, Int8Array, Int16Array,
-            Int32Array, Int64Array, Time32MillisecondArray, Time32SecondArray,
-            Time64MicrosecondArray, Time64NanosecondArray, TimestampMicrosecondArray,
-            TimestampMillisecondArray, TimestampNanosecondArray, TimestampSecondArray,
+    macro_rules! downcast {
+        ($ty:ty) => {
+            array
+                .as_any()
+                .downcast_ref::<$ty>()
+                .ok_or_else(|| IllegalArgument {
+                    message: format!(
+                        "expected {} for arrow type {:?}",
+                        stringify!($ty),
+                        array.data_type()
+                    ),
+                })?
         };
-        use crate::row::Decimal;
+    }
 
-        if array.is_null(row_id) {
-            return Ok(Datum::Null);
+    match array.data_type() {
+        ArrowDataType::Boolean => Ok(Datum::Bool(downcast!(BooleanArray).value(row_id))),
+        ArrowDataType::Int8 => Ok(Datum::Int8(downcast!(Int8Array).value(row_id))),
+        ArrowDataType::Int16 => Ok(Datum::Int16(downcast!(Int16Array).value(row_id))),
+        ArrowDataType::Int32 => Ok(Datum::Int32(downcast!(Int32Array).value(row_id))),
+        ArrowDataType::Int64 => Ok(Datum::Int64(downcast!(Int64Array).value(row_id))),
+        ArrowDataType::Float32 => Ok(Datum::Float32(downcast!(Float32Array).value(row_id).into())),
+        ArrowDataType::Float64 => Ok(Datum::Float64(downcast!(Float64Array).value(row_id).into())),
+        ArrowDataType::Utf8 => Ok(Datum::String(std::borrow::Cow::Owned(
+            downcast!(StringArray).value(row_id).to_owned(),
+        ))),
+        ArrowDataType::Binary => Ok(Datum::Blob(std::borrow::Cow::Owned(
+            downcast!(BinaryArray).value(row_id).to_vec(),
+        ))),
+        ArrowDataType::FixedSizeBinary(_) => Ok(Datum::Blob(std::borrow::Cow::Owned(
+            downcast!(FixedSizeBinaryArray).value(row_id).to_vec(),
+        ))),
+        ArrowDataType::Decimal128(p, s) => {
+            let (p, s) = (*p, *s);
+            let i128_val = downcast!(Decimal128Array).value(row_id);
+            Ok(Datum::Decimal(Decimal::from_arrow_decimal128(
+                i128_val, s as i64, p as u32, s as u32,
+            )?))
         }
-
-        match array.data_type() {
-            ArrowDataType::Boolean => {
-                let a = array.as_any().downcast_ref::<BooleanArray>().unwrap();
-                Ok(Datum::Bool(a.value(row_id)))
-            }
-            ArrowDataType::Int8 => {
-                let a = array.as_any().downcast_ref::<Int8Array>().unwrap();
-                Ok(Datum::Int8(a.value(row_id)))
-            }
-            ArrowDataType::Int16 => {
-                let a = array.as_any().downcast_ref::<Int16Array>().unwrap();
-                Ok(Datum::Int16(a.value(row_id)))
-            }
-            ArrowDataType::Int32 => {
-                let a = array.as_any().downcast_ref::<Int32Array>().unwrap();
-                Ok(Datum::Int32(a.value(row_id)))
-            }
-            ArrowDataType::Int64 => {
-                let a = array.as_any().downcast_ref::<Int64Array>().unwrap();
-                Ok(Datum::Int64(a.value(row_id)))
-            }
-            ArrowDataType::Float32 => {
-                let a = array.as_any().downcast_ref::<Float32Array>().unwrap();
-                Ok(Datum::Float32(a.value(row_id).into()))
-            }
-            ArrowDataType::Float64 => {
-                let a = array.as_any().downcast_ref::<Float64Array>().unwrap();
-                Ok(Datum::Float64(a.value(row_id).into()))
-            }
-            ArrowDataType::Utf8 => {
-                let a = array.as_any().downcast_ref::<StringArray>().unwrap();
-                Ok(Datum::String(std::borrow::Cow::Owned(a.value(row_id).to_owned())))
-            }
-            ArrowDataType::Binary => {
-                let a = array.as_any().downcast_ref::<BinaryArray>().unwrap();
-                Ok(Datum::Blob(std::borrow::Cow::Owned(a.value(row_id).to_vec())))
-            }
-            ArrowDataType::Decimal128(p, s) => {
-                let (p, s) = (*p, *s);
-                let a = array.as_any().downcast_ref::<Decimal128Array>().unwrap();
-                let i128_val = a.value(row_id);
-                Ok(Datum::Decimal(Decimal::from_arrow_decimal128(
-                    i128_val,
-                    s as i64,
-                    p as u32,
-                    s as u32,
-                )?))
-            }
-            ArrowDataType::Date32 => {
-                let a = array.as_any().downcast_ref::<arrow::array::Date32Array>().unwrap();
-                Ok(Datum::Date(Date::new(a.value(row_id))))
-            }
-            ArrowDataType::Time32(TimeUnit::Second) => {
-                let a = array.as_any().downcast_ref::<Time32SecondArray>().unwrap();
-                Ok(Datum::Time(Time::new(a.value(row_id) * 1000)))
-            }
-            ArrowDataType::Time32(TimeUnit::Millisecond) => {
-                let a = array.as_any().downcast_ref::<Time32MillisecondArray>().unwrap();
-                Ok(Datum::Time(Time::new(a.value(row_id))))
-            }
-            ArrowDataType::Time64(TimeUnit::Microsecond) => {
-                let a = array.as_any().downcast_ref::<Time64MicrosecondArray>().unwrap();
-                Ok(Datum::Time(Time::new((a.value(row_id) / 1000) as i32)))
-            }
-            ArrowDataType::Time64(TimeUnit::Nanosecond) => {
-                let a = array.as_any().downcast_ref::<Time64NanosecondArray>().unwrap();
-                Ok(Datum::Time(Time::new((a.value(row_id) / 1_000_000) as i32)))
-            }
-            ArrowDataType::Timestamp(time_unit, tz) => {
-                let value: i64 = match time_unit {
-                    TimeUnit::Second => {
-                        array.as_any().downcast_ref::<TimestampSecondArray>().unwrap().value(row_id)
-                    }
-                    TimeUnit::Millisecond => {
-                        array.as_any().downcast_ref::<TimestampMillisecondArray>().unwrap().value(row_id)
-                    }
-                    TimeUnit::Microsecond => {
-                        array.as_any().downcast_ref::<TimestampMicrosecondArray>().unwrap().value(row_id)
-                    }
-                    TimeUnit::Nanosecond => {
-                        array.as_any().downcast_ref::<TimestampNanosecondArray>().unwrap().value(row_id)
-                    }
-                };
-                let (millis, nanos) = match time_unit {
-                    TimeUnit::Second => (value * 1000, 0i32),
-                    TimeUnit::Millisecond => (value, 0i32),
-                    TimeUnit::Microsecond => {
-                        let millis = value.div_euclid(1000);
-                        let nanos = (value.rem_euclid(1000) * 1000) as i32;
-                        (millis, nanos)
-                    }
-                    TimeUnit::Nanosecond => {
-                        let millis = value.div_euclid(1_000_000);
-                        let nanos = value.rem_euclid(1_000_000) as i32;
-                        (millis, nanos)
-                    }
-                };
-                if tz.is_some() {
-                    if nanos == 0 {
-                        Ok(Datum::TimestampLtz(TimestampLtz::new(millis)))
-                    } else {
-                        Ok(Datum::TimestampLtz(TimestampLtz::from_millis_nanos(millis, nanos)?))
-                    }
-                } else if nanos == 0 {
-                    Ok(Datum::TimestampNtz(TimestampNtz::new(millis)))
+        ArrowDataType::Date32 => Ok(Datum::Date(Date::new(downcast!(Date32Array).value(row_id)))),
+        ArrowDataType::Time32(TimeUnit::Second) => Ok(Datum::Time(Time::new(
+            downcast!(Time32SecondArray).value(row_id) * 1000,
+        ))),
+        ArrowDataType::Time32(TimeUnit::Millisecond) => Ok(Datum::Time(Time::new(
+            downcast!(Time32MillisecondArray).value(row_id),
+        ))),
+        ArrowDataType::Time64(TimeUnit::Microsecond) => Ok(Datum::Time(Time::new(
+            (downcast!(Time64MicrosecondArray).value(row_id) / 1000) as i32,
+        ))),
+        ArrowDataType::Time64(TimeUnit::Nanosecond) => Ok(Datum::Time(Time::new(
+            (downcast!(Time64NanosecondArray).value(row_id) / 1_000_000) as i32,
+        ))),
+        ArrowDataType::Timestamp(time_unit, _tz) => {
+            let value: i64 = match time_unit {
+                TimeUnit::Second => downcast!(TimestampSecondArray).value(row_id),
+                TimeUnit::Millisecond => downcast!(TimestampMillisecondArray).value(row_id),
+                TimeUnit::Microsecond => downcast!(TimestampMicrosecondArray).value(row_id),
+                TimeUnit::Nanosecond => downcast!(TimestampNanosecondArray).value(row_id),
+            };
+            let (millis, nanos) = match time_unit {
+                TimeUnit::Second => (value * 1000, 0i32),
+                TimeUnit::Millisecond => (value, 0i32),
+                TimeUnit::Microsecond => {
+                    let millis = value.div_euclid(1000);
+                    let nanos = (value.rem_euclid(1000) * 1000) as i32;
+                    (millis, nanos)
+                }
+                TimeUnit::Nanosecond => {
+                    let millis = value.div_euclid(1_000_000);
+                    let nanos = value.rem_euclid(1_000_000) as i32;
+                    (millis, nanos)
+                }
+            };
+            // TIMESTAMP and TIMESTAMP_LTZ both map to `Timestamp(unit, None)` in Arrow.
+            let is_ltz = matches!(fluss_type, Some(DataType::TimestampLTz(_)));
+            if is_ltz {
+                if nanos == 0 {
+                    Ok(Datum::TimestampLtz(TimestampLtz::new(millis)))
                 } else {
-                    Ok(Datum::TimestampNtz(TimestampNtz::from_millis_nanos(millis, nanos)?))
+                    Ok(Datum::TimestampLtz(TimestampLtz::from_millis_nanos(
+                        millis, nanos,
+                    )?))
                 }
+            } else if nanos == 0 {
+                Ok(Datum::TimestampNtz(TimestampNtz::new(millis)))
+            } else {
+                Ok(Datum::TimestampNtz(TimestampNtz::from_millis_nanos(
+                    millis, nanos,
+                )?))
             }
-            ArrowDataType::Struct(_) => {
-                let nested = Self::extract_struct_from_array(array, row_id)?;
-                Ok(Datum::Row(Box::new(nested)))
-            }
-            other => Err(IllegalArgument {
-                message: format!(
-                    "unsupported Arrow data type for nested row extraction: {other:?}"
-                ),
-            }),
         }
+        ArrowDataType::Struct(_) => {
+            let nested_row_type = fluss_type.and_then(|t| match t {
+                DataType::Row(rt) => Some(rt),
+                _ => None,
+            });
+            let nested = extract_struct_from_array(array, row_id, nested_row_type)?;
+            Ok(Datum::Row(Box::new(nested)))
+        }
+        ArrowDataType::List(field) => {
+            let list_arr = downcast!(ListArray);
+            let values = list_arr.value(row_id);
+            let element_fluss_type = match fluss_type {
+                Some(DataType::Array(at)) => at.get_element_type().clone(),
+                _ => from_arrow_type(field.data_type())?,
+            };
+            let mut writer = FlussArrayWriter::new(values.len(), &element_fluss_type);
+            write_arrow_values_to_fluss_array(&*values, &element_fluss_type, &mut writer)?;
+            Ok(Datum::Array(writer.complete()?))
+        }
+        other => Err(IllegalArgument {
+            message: format!("unsupported Arrow data type for nested row extraction: {other:?}"),
+        }),
     }
 }
 
@@ -485,14 +523,7 @@ impl InternalRow for ColumnarRow {
             .value(self.row_id))
     }
 
-    fn get_decimal(
-        &self,
-        pos: usize,
-        precision: usize,
-        scale: usize,
-    ) -> Result<crate::row::Decimal> {
-        use arrow::datatypes::DataType;
-
+    fn get_decimal(&self, pos: usize, precision: usize, scale: usize) -> Result<Decimal> {
         let column = self.column(pos)?;
         let array = column
             .as_primitive_opt::<Decimal128Type>()
@@ -511,9 +542,8 @@ impl InternalRow for ColumnarRow {
             self.row_id
         );
 
-        // Read scale from Arrow column data type
         let arrow_scale = match column.data_type() {
-            DataType::Decimal128(_p, s) => *s as i64,
+            ArrowDataType::Decimal128(_p, s) => *s as i64,
             dt => {
                 return Err(IllegalArgument {
                     message: format!(
@@ -523,11 +553,8 @@ impl InternalRow for ColumnarRow {
             }
         };
 
-        let i128_val = array.value(self.row_id);
-
-        // Convert Arrow Decimal128 to Fluss Decimal (handles rescaling and validation)
-        crate::row::Decimal::from_arrow_decimal128(
-            i128_val,
+        Decimal::from_arrow_decimal128(
+            array.value(self.row_id),
             arrow_scale,
             precision as u32,
             scale as u32,
@@ -581,10 +608,7 @@ impl InternalRow for ColumnarRow {
             .value(self.row_id))
     }
 
-    fn get_array(&self, pos: usize) -> Result<crate::row::FlussArray> {
-        use crate::record::from_arrow_type;
-        use crate::row::binary_array::FlussArrayWriter;
-
+    fn get_array(&self, pos: usize) -> Result<FlussArray> {
         let column = self.column(pos)?;
         let values = if let Some(list_arr) = column.as_any().downcast_ref::<ListArray>() {
             list_arr.value(self.row_id)
@@ -605,15 +629,37 @@ impl InternalRow for ColumnarRow {
     }
 
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
-        let lock = self.nested_rows.get(pos).ok_or_else(|| IllegalArgument {
-            message: format!("column index {pos} out of bounds for get_row"),
-        })?;
-        let batch = Arc::clone(&self.record_batch);
-        let row_id = self.row_id;
-        Ok(lock.get_or_init(|| {
-            Self::extract_struct_at(&batch, pos, row_id)
-                .expect("failed to extract nested row from StructArray")
-        }))
+        let cache_idx = self
+            .row_column_indices
+            .iter()
+            .position(|&i| i == pos)
+            .ok_or_else(|| IllegalArgument {
+                message: format!("get_row called on non-ROW column at position {pos}"),
+            })?;
+        let column = self.record_batch.column(pos);
+        // Children of a null parent may carry stale bytes; caller must
+        // check is_null_at first rather than rely on what we'd read.
+        if column.is_null(self.row_id) {
+            return Err(IllegalArgument {
+                message: format!(
+                    "get_row called on null ROW cell at position {pos}, row {}; \
+                     check is_null_at({pos}) first",
+                    self.row_id
+                ),
+            });
+        }
+        let lock = &self.row_caches[cache_idx];
+        if let Some(row) = lock.get() {
+            return Ok(row);
+        }
+        let nested_row_type = self.fluss_row_type.as_ref().and_then(|rt| {
+            rt.fields().get(pos).and_then(|f| match &f.data_type {
+                DataType::Row(inner) => Some(inner),
+                _ => None,
+            })
+        });
+        let extracted = extract_struct_from_array(column.as_ref(), self.row_id, nested_row_type)?;
+        Ok(lock.get_or_init(|| extracted))
     }
 }
 
@@ -624,7 +670,7 @@ macro_rules! write_primitive_elements {
             .as_primitive_opt::<$arrow_type>()
             .ok_or_else(|| IllegalArgument {
                 message: format!(
-                    "Expected {} for {:?} element",
+                    "expected {} for {:?} element",
                     stringify!($arrow_type),
                     $element_type
                 ),
@@ -647,7 +693,7 @@ macro_rules! write_downcast_elements {
             .downcast_ref::<$array_type>()
             .ok_or_else(|| IllegalArgument {
                 message: format!(
-                    "Expected {} for {:?} element",
+                    "expected {} for {:?} element",
                     stringify!($array_type),
                     $element_type
                 ),
@@ -670,7 +716,7 @@ macro_rules! write_list_elements {
             .downcast_ref::<$list_array_type>()
             .ok_or_else(|| IllegalArgument {
                 message: format!(
-                    "Expected {} for {:?} element",
+                    "expected {} for {:?} element",
                     stringify!($list_array_type),
                     $element_type
                 ),
@@ -699,13 +745,9 @@ macro_rules! write_list_elements {
 /// the Arrow array once per call rather than per element.
 fn write_arrow_values_to_fluss_array(
     values: &dyn Array,
-    element_type: &crate::metadata::DataType,
-    writer: &mut crate::row::binary_array::FlussArrayWriter,
+    element_type: &DataType,
+    writer: &mut FlussArrayWriter,
 ) -> Result<()> {
-    use crate::metadata::DataType;
-    use crate::record::from_arrow_type;
-    use crate::row::binary_array::FlussArrayWriter;
-
     let len = values.len();
 
     match element_type {
@@ -756,14 +798,14 @@ fn write_arrow_values_to_fluss_array(
                 values
                     .as_primitive_opt::<Decimal128Type>()
                     .ok_or_else(|| IllegalArgument {
-                        message: format!("Expected Decimal128Array for {element_type:?} element"),
+                        message: format!("expected Decimal128Array for {element_type:?} element"),
                     })?;
             let arrow_scale = match values.data_type() {
                 ArrowDataType::Decimal128(_p, s) => *s as i64,
                 other => {
                     return Err(IllegalArgument {
                         message: format!(
-                            "Expected Decimal128 data type for {element_type:?} element, got {other:?}"
+                            "expected Decimal128 data type for {element_type:?} element, got {other:?}"
                         ),
                     });
                 }
@@ -774,7 +816,7 @@ fn write_arrow_values_to_fluss_array(
                 if arr.is_null(i) {
                     writer.set_null_at(i);
                 } else {
-                    let d = crate::row::Decimal::from_arrow_decimal128(
+                    let d = Decimal::from_arrow_decimal128(
                         arr.value(i),
                         arrow_scale,
                         precision,
@@ -788,7 +830,7 @@ fn write_arrow_values_to_fluss_array(
             let arr = values
                 .as_primitive_opt::<Date32Type>()
                 .ok_or_else(|| IllegalArgument {
-                    message: format!("Expected Date32Array for {element_type:?} element"),
+                    message: format!("expected Date32Array for {element_type:?} element"),
                 })?;
             for i in 0..len {
                 if arr.is_null(i) {
@@ -829,16 +871,35 @@ fn write_arrow_values_to_fluss_array(
             } else {
                 return Err(IllegalArgument {
                     message: format!(
-                        "Expected ListArray for {element_type:?} element, got {:?}",
+                        "expected ListArray for {element_type:?} element, got {:?}",
                         values.data_type()
                     ),
                 });
             }
         }
+        DataType::Row(row_type) => {
+            let struct_arr = values
+                .as_any()
+                .downcast_ref::<StructArray>()
+                .ok_or_else(|| IllegalArgument {
+                    message: format!(
+                        "expected StructArray for {element_type:?} element, got {:?}",
+                        values.data_type()
+                    ),
+                })?;
+            for i in 0..len {
+                if struct_arr.is_null(i) {
+                    writer.set_null_at(i);
+                } else {
+                    let nested = extract_struct_from_array(struct_arr, i, Some(row_type))?;
+                    writer.write_row(i, &nested)?;
+                }
+            }
+        }
         _ => {
             return Err(IllegalArgument {
                 message: format!(
-                    "Unsupported element type for Arrow → FlussArray conversion: {element_type:?}"
+                    "unsupported element type for Arrow → FlussArray conversion: {element_type:?}"
                 ),
             });
         }
@@ -848,8 +909,8 @@ fn write_arrow_values_to_fluss_array(
 
 fn write_time_elements(
     values: &dyn Array,
-    element_type: &crate::metadata::DataType,
-    writer: &mut crate::row::binary_array::FlussArrayWriter,
+    element_type: &DataType,
+    writer: &mut FlussArrayWriter,
 ) -> Result<()> {
     macro_rules! process_time {
         ($arrow_type:ty, $to_millis:expr) => {{
@@ -857,7 +918,7 @@ fn write_time_elements(
                 .as_primitive_opt::<$arrow_type>()
                 .ok_or_else(|| IllegalArgument {
                     message: format!(
-                        "Expected {} for {:?} element",
+                        "expected {} for {:?} element",
                         stringify!($arrow_type),
                         element_type
                     ),
@@ -889,7 +950,7 @@ fn write_time_elements(
         other => {
             return Err(IllegalArgument {
                 message: format!(
-                    "Expected Time column for {element_type:?} element, got {other:?}"
+                    "expected Time column for {element_type:?} element, got {other:?}"
                 ),
             });
         }
@@ -916,19 +977,19 @@ fn convert_timestamp_raw(raw: i64, unit: &TimeUnit) -> (i64, i32) {
 
 fn write_timestamp_elements<T>(
     values: &dyn Array,
-    element_type: &crate::metadata::DataType,
-    writer: &mut crate::row::binary_array::FlussArrayWriter,
+    element_type: &DataType,
+    writer: &mut FlussArrayWriter,
     precision: u32,
     construct_compact: impl Fn(i64) -> T,
     construct_with_nanos: impl Fn(i64, i32) -> Result<T>,
-    write_fn: impl Fn(&mut crate::row::binary_array::FlussArrayWriter, usize, T, u32),
+    write_fn: impl Fn(&mut FlussArrayWriter, usize, T, u32),
 ) -> Result<()> {
     let unit = match values.data_type() {
         ArrowDataType::Timestamp(unit, _) => unit,
         other => {
             return Err(IllegalArgument {
                 message: format!(
-                    "Expected Timestamp column for {element_type:?} element, got {other:?}"
+                    "expected Timestamp column for {element_type:?} element, got {other:?}"
                 ),
             });
         }
@@ -940,7 +1001,7 @@ fn write_timestamp_elements<T>(
                 .as_primitive_opt::<$arrow_type>()
                 .ok_or_else(|| IllegalArgument {
                     message: format!(
-                        "Expected {} for {:?} element",
+                        "expected {} for {:?} element",
                         stringify!($arrow_type),
                         element_type
                     ),
@@ -983,7 +1044,7 @@ mod tests {
     fn single_column_row(array: ArrayRef) -> ColumnarRow {
         let batch =
             RecordBatch::try_from_iter(vec![("arr", array)]).expect("record batch with one column");
-        ColumnarRow::new(Arc::new(batch))
+        ColumnarRow::new(Arc::new(batch), 0, None)
     }
 
     #[test]
@@ -1018,7 +1079,7 @@ mod tests {
         )
         .expect("record batch");
 
-        let mut row = ColumnarRow::new(Arc::new(batch));
+        let mut row = ColumnarRow::new(Arc::new(batch), 0, None);
         assert_eq!(row.get_field_count(), 10);
         assert!(row.get_boolean(0).unwrap());
         assert_eq!(row.get_byte(1).unwrap(), 1);
@@ -1073,27 +1134,21 @@ mod tests {
         )
         .expect("record batch");
 
-        let row = ColumnarRow::new(Arc::new(batch));
+        let row = ColumnarRow::new(Arc::new(batch), 0, None);
         assert_eq!(row.get_field_count(), 3);
 
         // Verify decimal values
         assert_eq!(
             row.get_decimal(0, 10, 2).unwrap(),
-            crate::row::Decimal::from_big_decimal(BigDecimal::new(BigInt::from(12345), 2), 10, 2)
-                .unwrap()
+            Decimal::from_big_decimal(BigDecimal::new(BigInt::from(12345), 2), 10, 2).unwrap()
         );
         assert_eq!(
             row.get_decimal(1, 20, 5).unwrap(),
-            crate::row::Decimal::from_big_decimal(
-                BigDecimal::new(BigInt::from(1234567890), 5),
-                20,
-                5
-            )
-            .unwrap()
+            Decimal::from_big_decimal(BigDecimal::new(BigInt::from(1234567890), 5), 20, 5).unwrap()
         );
         assert_eq!(
             row.get_decimal(2, 38, 10).unwrap(),
-            crate::row::Decimal::from_big_decimal(
+            Decimal::from_big_decimal(
                 BigDecimal::new(BigInt::from(999999999999999999i128), 10),
                 38,
                 10
@@ -1206,15 +1261,11 @@ mod tests {
             DataType::Struct(child_fields),
             false,
         )]));
-        Arc::new(
-            RecordBatch::try_new(schema, vec![Arc::new(struct_array)])
-                .expect("record batch"),
-        )
+        Arc::new(RecordBatch::try_new(schema, vec![Arc::new(struct_array)]).expect("record batch"))
     }
 
     #[test]
     fn columnar_row_reads_nested_row() {
-        // Build a RecordBatch with a Struct column: {i32, string}
         let child_fields = Fields::from(vec![
             Field::new("x", DataType::Int32, false),
             Field::new("s", DataType::Utf8, false),
@@ -1225,7 +1276,7 @@ mod tests {
         ];
         let batch = make_struct_batch("nested", child_fields, child_arrays, 2);
 
-        let mut row = ColumnarRow::new(batch);
+        let mut row = ColumnarRow::new(batch, 0, None);
 
         // row_id = 0
         let nested = row.get_row(0).unwrap();
@@ -1268,29 +1319,32 @@ mod tests {
             DataType::Struct(outer_fields),
             false,
         )]));
-        let batch = Arc::new(
-            RecordBatch::try_new(schema, vec![outer_array]).expect("record batch"),
-        );
+        let batch =
+            Arc::new(RecordBatch::try_new(schema, vec![outer_array]).expect("record batch"));
 
-        let row = ColumnarRow::new(batch);
+        let mut row = ColumnarRow::new(batch, 0, None);
 
-        // Access outer struct at column 0, row 0
+        // row_id = 0
         let outer = row.get_row(0).unwrap();
         assert_eq!(outer.get_int(0).unwrap(), 1);
-
-        // Access inner struct (column 1 of outer)
         let inner = outer.get_row(1).unwrap();
         assert_eq!(inner.get_string(0).unwrap(), "deep");
+
+        // row_id = 1
+        row.set_row_id(1);
+        let outer = row.get_row(0).unwrap();
+        assert_eq!(outer.get_int(0).unwrap(), 2);
+        let inner = outer.get_row(1).unwrap();
+        assert_eq!(inner.get_string(0).unwrap(), "deeper");
     }
 
     #[test]
     fn columnar_row_get_row_cache_invalidated_on_set_row_id() {
         let child_fields = Fields::from(vec![Field::new("x", DataType::Int32, false)]);
-        let child_arrays: Vec<Arc<dyn Array>> =
-            vec![Arc::new(Int32Array::from(vec![10, 20]))];
+        let child_arrays: Vec<Arc<dyn Array>> = vec![Arc::new(Int32Array::from(vec![10, 20]))];
         let batch = make_struct_batch("s", child_fields, child_arrays, 2);
 
-        let mut row = ColumnarRow::new(batch);
+        let mut row = ColumnarRow::new(batch, 0, None);
 
         // row_id = 0: nested x = 10
         let nested_0 = row.get_row(0).unwrap();
diff --git a/fluss-rust/crates/fluss/src/row/column_writer.rs b/fluss-rust/crates/fluss/src/row/column_writer.rs
index be94cf062b..d595df9191 100644
--- a/fluss-rust/crates/fluss/src/row/column_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/column_writer.rs
@@ -21,7 +21,7 @@
 
 use crate::error::Error::RowConvertError;
 use crate::error::{Error, Result};
-use crate::metadata::DataType;
+use crate::metadata::{DataType, RowType};
 use crate::row::InternalRow;
 use crate::row::datum::{
     MICROS_PER_MILLI, MILLIS_PER_SECOND, NANOS_PER_MILLI, append_decimal_to_builder,
@@ -123,6 +123,12 @@ enum TypedWriter {
         offsets: Vec<i32>,
         validity: Vec<bool>,
     },
+    Struct {
+        field_writers: Vec<ColumnWriter>,
+        validity: Vec<bool>,
+        fields: arrow_schema::Fields,
+        row_type: RowType,
+    },
 }
 
 /// Dispatch to the inner builder across all `TypedWriter` variants.
@@ -156,6 +162,7 @@ macro_rules! with_builder {
             TypedWriter::TimestampLtzMicrosecond { builder: $b, .. } => $body,
             TypedWriter::TimestampLtzNanosecond { builder: $b, .. } => $body,
             TypedWriter::List { .. } => panic!("List variant not supported in with_builder!"),
+            TypedWriter::Struct { .. } => panic!("Struct variant not supported in with_builder!"),
         }
     };
 }
@@ -354,6 +361,39 @@ impl ColumnWriter {
                     validity: Vec::with_capacity(capacity),
                 }
             }
+            DataType::Row(row_type) => {
+                let arrow_fields = match arrow_type {
+                    ArrowDataType::Struct(fields) => fields.clone(),
+                    _ => {
+                        return Err(Error::IllegalArgument {
+                            message: format!(
+                                "Expected Struct Arrow type for Row, got: {arrow_type:?}"
+                            ),
+                        });
+                    }
+                };
+                if arrow_fields.len() != row_type.fields().len() {
+                    return Err(Error::IllegalArgument {
+                        message: format!(
+                            "Row arity mismatch: Fluss type has {} fields, Arrow type has {}",
+                            row_type.fields().len(),
+                            arrow_fields.len(),
+                        ),
+                    });
+                }
+                let field_writers: Result<Vec<_>> = row_type
+                    .fields()
+                    .iter()
+                    .zip(arrow_fields.iter())
+                    .map(|(f, af)| ColumnWriter::create(&f.data_type, af.data_type(), 0, capacity))
+                    .collect();
+                TypedWriter::Struct {
+                    field_writers: field_writers?,
+                    validity: Vec::with_capacity(capacity),
+                    fields: arrow_fields,
+                    row_type: row_type.clone(),
+                }
+            }
             _ => {
                 return Err(Error::IllegalArgument {
                     message: format!("Unsupported Fluss DataType: {fluss_type:?}"),
@@ -400,6 +440,17 @@ impl ColumnWriter {
                 let taken_validity = std::mem::take(validity);
                 finish_list_array(values, item_nullable, &taken_offsets, &taken_validity)
             }
+            TypedWriter::Struct {
+                field_writers,
+                validity,
+                fields,
+                ..
+            } => {
+                let taken_validity = std::mem::take(validity);
+                let child_arrays: Vec<ArrayRef> =
+                    field_writers.iter_mut().map(|w| w.finish()).collect();
+                finish_struct_array(fields.clone(), child_arrays, &taken_validity)
+            }
             _ => with_builder!(&mut self.inner, b => (b as &mut dyn ArrayBuilder).finish()),
         }
     }
@@ -476,6 +527,15 @@ impl ColumnWriter {
                 let offsets_bytes = round_up_to_8(offsets.len() * std::mem::size_of::<i32>());
                 validity_bytes + offsets_bytes + element_writer.buffer_size()
             }
+            TypedWriter::Struct {
+                field_writers,
+                validity,
+                ..
+            } => {
+                let validity_bytes = round_up_to_8(validity.len().div_ceil(8));
+                let children_bytes: usize = field_writers.iter().map(|w| w.buffer_size()).sum();
+                validity_bytes + children_bytes
+            }
         }
     }
 
@@ -488,6 +548,17 @@ impl ColumnWriter {
                 offsets.push(last);
                 validity.push(false);
             }
+            TypedWriter::Struct {
+                field_writers,
+                validity,
+                ..
+            } => {
+                // Arrow StructArray children must match parent length.
+                for child in field_writers.iter_mut() {
+                    child.append_null();
+                }
+                validity.push(false);
+            }
             _ => with_builder!(&mut self.inner, b => b.append_null()),
         }
     }
@@ -676,22 +747,75 @@ impl ColumnWriter {
                 validity,
             } => {
                 let array = row.get_array(pos)?;
-                for i in 0..array.size() {
-                    element_writer.write_field_at(&array, i)?;
+                let size = array.size();
+                if let TypedWriter::Struct {
+                    field_writers,
+                    validity: child_validity,
+                    row_type,
+                    ..
+                } = &mut element_writer.inner
+                {
+                    for i in 0..size {
+                        if array.is_null_at(i) {
+                            for child in field_writers.iter_mut() {
+                                child.append_null();
+                            }
+                            child_validity.push(false);
+                        } else {
+                            let nested = array.get_row(i, row_type)?;
+                            for (j, child) in field_writers.iter_mut().enumerate() {
+                                child.write_field_at(&nested, j)?;
+                            }
+                            child_validity.push(true);
+                        }
+                    }
+                } else {
+                    for i in 0..size {
+                        element_writer.write_field_at(&array, i)?;
+                    }
                 }
                 let last = *offsets.last().unwrap();
                 offsets.push(
-                    last + i32::try_from(array.size()).map_err(|_| RowConvertError {
-                        message: format!("Array size {} exceeds i32 range", array.size()),
+                    last + i32::try_from(size).map_err(|_| RowConvertError {
+                        message: format!("Array size {size} exceeds i32 range"),
                     })?,
                 );
                 validity.push(true);
                 Ok(())
             }
+            TypedWriter::Struct {
+                field_writers,
+                validity,
+                ..
+            } => {
+                let nested = row.get_row(pos)?;
+                for (i, child) in field_writers.iter_mut().enumerate() {
+                    child.write_field_at(nested, i)?;
+                }
+                validity.push(true);
+                Ok(())
+            }
         }
     }
 }
 
+fn finish_struct_array(
+    fields: arrow_schema::Fields,
+    child_arrays: Vec<ArrayRef>,
+    validity: &[bool],
+) -> ArrayRef {
+    use arrow::array::StructArray;
+    use arrow::buffer::NullBuffer;
+    use std::sync::Arc;
+
+    let null_buffer = if validity.iter().any(|v| !v) {
+        Some(NullBuffer::from(validity.to_vec()))
+    } else {
+        None
+    };
+    Arc::new(StructArray::new(fields, child_arrays, null_buffer))
+}
+
 fn finish_list_array(
     values: ArrayRef,
     item_nullable: bool,
@@ -726,7 +850,7 @@ mod tests {
     use crate::metadata::DataTypes;
     use crate::record::to_arrow_type;
     use crate::row::binary_array::FlussArrayWriter;
-    use crate::row::{Date, Datum, GenericRow, Time, TimestampLtz, TimestampNtz};
+    use crate::row::{Date, Datum, Decimal, GenericRow, Time, TimestampLtz, TimestampNtz};
     use arrow::array::*;
     use bigdecimal::BigDecimal;
     use std::str::FromStr;
@@ -857,8 +981,7 @@ mod tests {
 
         // Decimal
         let decimal =
-            crate::row::Decimal::from_big_decimal(BigDecimal::from_str("123.45").unwrap(), 10, 2)
-                .unwrap();
+            Decimal::from_big_decimal(BigDecimal::from_str("123.45").unwrap(), 10, 2).unwrap();
         let arr = write_one(&DataTypes::decimal(10, 2), Datum::Decimal(decimal));
         assert_eq!(
             arr.as_any()
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
index c6940652f5..9e0ffa5391 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
@@ -18,10 +18,12 @@
 use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
 use bytes::Bytes;
 
+use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::metadata::DataType;
 use crate::row::Decimal;
 use crate::row::binary::{BinaryRowFormat, BinaryWriter, ValueWriter};
+use crate::row::datum::{TimestampLtz, TimestampNtz};
 use delegate::delegate;
 
 /// A wrapping of [`CompactedRowWriter`] used to encode key columns.
@@ -47,12 +49,8 @@ impl CompactedKeyWriter {
     }
 
     pub fn create_value_writer(field_type: &DataType) -> Result<ValueWriter> {
-        // Java's CompactedKeyEncoder allows encoding Array types (Map/Row
-        // are not yet supported by ValueWriter). The server rejects
-        // unsupported key types at table-creation time, so encoding is
-        // allowed here to match Java parity.
-        if matches!(field_type, DataType::Map(_) | DataType::Row(_)) {
-            return Err(crate::error::Error::IllegalArgument {
+        if matches!(field_type, DataType::Map(_)) {
+            return Err(IllegalArgument {
                 message: format!("Cannot use {field_type:?} as a key column type"),
             });
         }
@@ -107,9 +105,9 @@ impl BinaryWriter for CompactedKeyWriter {
 
             fn write_time(&mut self, value: i32, precision: u32);
 
-            fn write_timestamp_ntz(&mut self, value: &crate::row::datum::TimestampNtz, precision: u32);
+            fn write_timestamp_ntz(&mut self, value: &TimestampNtz, precision: u32);
 
-            fn write_timestamp_ltz(&mut self, value: &crate::row::datum::TimestampLtz, precision: u32);
+            fn write_timestamp_ltz(&mut self, value: &TimestampLtz, precision: u32);
 
             fn write_array(&mut self, value: &[u8]);
         }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index 24e4bd79d7..fbf47c58b7 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -16,13 +16,18 @@
 // under the License.
 
 use crate::client::WriteFormat;
+use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::metadata::RowType;
 use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
-use crate::row::{Decimal, GenericRow, InternalRow};
+use crate::row::{Decimal, FlussArray, GenericRow, InternalRow};
 use std::sync::{Arc, OnceLock};
 
+pub fn calculate_bit_set_width_in_bytes(arity: usize) -> usize {
+    arity.div_ceil(8)
+}
+
 // Reference implementation:
 // https://github.com/apache/fluss/blob/main/fluss-common/src/main/java/org/apache/fluss/row/compacted/CompactedRow.java
 #[allow(dead_code)]
@@ -35,10 +40,6 @@ pub struct CompactedRow<'a> {
     data: &'a [u8],
 }
 
-pub fn calculate_bit_set_width_in_bytes(arity: usize) -> usize {
-    arity.div_ceil(8)
-}
-
 #[allow(dead_code)]
 impl<'a> CompactedRow<'a> {
     pub fn from_bytes(row_type: &'a RowType, data: &'a [u8]) -> Self {
@@ -93,7 +94,7 @@ impl<'a> InternalRow for CompactedRow<'a> {
     fn is_null_at(&self, pos: usize) -> Result<bool> {
         let fields = self.deserializer.get_row_type().fields();
         if pos >= fields.len() {
-            return Err(crate::error::Error::IllegalArgument {
+            return Err(IllegalArgument {
                 message: format!(
                     "position {pos} out of bounds (row has {} fields)",
                     fields.len()
@@ -167,12 +168,12 @@ impl<'a> InternalRow for CompactedRow<'a> {
         self.decoded_row()?.get_bytes(pos)
     }
 
-    fn get_array(&self, pos: usize) -> Result<crate::row::FlussArray> {
+    fn get_array(&self, pos: usize) -> Result<FlussArray> {
         self.decoded_row()?.get_array(pos)
     }
 
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
-        self.decoded_row().get_row(pos)
+        self.decoded_row()?.get_row(pos)
     }
 
     fn as_encoded_bytes(&self, write_format: WriteFormat) -> Option<&[u8]> {
@@ -187,13 +188,14 @@ impl<'a> InternalRow for CompactedRow<'a> {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::row::binary::BinaryWriter;
-
     use crate::metadata::{
-        BigIntType, BooleanType, BytesType, DataType, DoubleType, FloatType, IntType, SmallIntType,
-        StringType, TinyIntType,
+        BigIntType, BooleanType, BytesType, DataType, DataTypes, DecimalType, DoubleType,
+        FloatType, IntType, SmallIntType, StringType, TimestampLTzType, TimestampType, TinyIntType,
     };
+    use crate::row::binary::BinaryWriter;
+    use crate::row::binary_array::FlussArrayWriter;
     use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
+    use crate::row::datum::{TimestampLtz, TimestampNtz};
 
     #[test]
     fn test_compacted_row() {
@@ -263,9 +265,6 @@ mod tests {
     #[test]
     fn test_compacted_row_temporal_and_decimal_types() {
         // Comprehensive test covering DATE, TIME, TIMESTAMP (compact/non-compact), and DECIMAL (compact/non-compact)
-        use crate::metadata::{DataTypes, DecimalType, TimestampLTzType, TimestampType};
-        use crate::row::Decimal;
-        use crate::row::datum::{TimestampLtz, TimestampNtz};
         use bigdecimal::{BigDecimal, num_bigint::BigInt};
 
         let row_type = RowType::with_data_types(vec![
@@ -345,9 +344,6 @@ mod tests {
 
     #[test]
     fn test_compacted_row_int_array() {
-        use crate::metadata::DataTypes;
-        use crate::row::binary_array::FlussArrayWriter;
-
         let row_type =
             RowType::with_data_types(vec![DataTypes::int(), DataTypes::array(DataTypes::int())]);
 
@@ -375,9 +371,6 @@ mod tests {
 
     #[test]
     fn test_compacted_row_string_array() {
-        use crate::metadata::DataTypes;
-        use crate::row::binary_array::FlussArrayWriter;
-
         let row_type = RowType::with_data_types(vec![DataTypes::array(DataTypes::string())]);
 
         let mut writer = CompactedRowWriter::new(row_type.fields().len());
@@ -402,9 +395,6 @@ mod tests {
 
     #[test]
     fn test_compacted_row_array_with_nulls() {
-        use crate::metadata::DataTypes;
-        use crate::row::binary_array::FlussArrayWriter;
-
         let row_type = RowType::with_data_types(vec![DataTypes::array(DataTypes::int())]);
 
         let mut writer = CompactedRowWriter::new(row_type.fields().len());
@@ -431,9 +421,6 @@ mod tests {
 
     #[test]
     fn test_compacted_row_empty_array() {
-        use crate::metadata::DataTypes;
-        use crate::row::binary_array::FlussArrayWriter;
-
         let row_type = RowType::with_data_types(vec![DataTypes::array(DataTypes::int())]);
 
         let mut writer = CompactedRowWriter::new(row_type.fields().len());
@@ -452,9 +439,6 @@ mod tests {
 
     #[test]
     fn test_compacted_row_nested_array() {
-        use crate::metadata::DataTypes;
-        use crate::row::binary_array::FlussArrayWriter;
-
         let row_type =
             RowType::with_data_types(vec![DataTypes::array(DataTypes::array(DataTypes::int()))]);
 
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index 9d7fb6cb8f..efcb39f2ed 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -15,34 +15,59 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::metadata::RowType;
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::{DataType, RowType};
 use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
-use crate::{
-    error::{Error::IllegalArgument, Result},
-    metadata::DataType,
-    row::{Datum, Decimal, GenericRow, compacted::compacted_row_writer::CompactedRowWriter},
-    util::varint::{read_unsigned_varint_at, read_unsigned_varint_u64_at},
-};
+use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
+use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
+use crate::row::{Datum, Decimal, FlussArray, GenericRow};
+use crate::util::varint::{read_unsigned_varint_at, read_unsigned_varint_u64_at};
 use std::borrow::Cow;
 use std::str::from_utf8;
+use std::sync::Arc;
 
 #[allow(dead_code)]
 #[derive(Clone)]
 pub struct CompactedRowDeserializer<'a> {
     row_type: Cow<'a, RowType>,
+    // Index-parallel to row_type.fields(); Some(_) only for ROW-typed fields.
+    nested: Vec<Option<Arc<CompactedRowDeserializer<'a>>>>,
+}
+
+fn build_nested_deserializers<'a>(
+    row_type: &RowType,
+) -> Vec<Option<Arc<CompactedRowDeserializer<'a>>>> {
+    row_type
+        .fields()
+        .iter()
+        .map(|f| {
+            if let DataType::Row(inner) = &f.data_type {
+                Some(Arc::new(CompactedRowDeserializer::new_from_owned(
+                    inner.clone(),
+                )))
+            } else {
+                None
+            }
+        })
+        .collect()
 }
 
 #[allow(dead_code)]
 impl<'a> CompactedRowDeserializer<'a> {
     pub fn new(row_type: &'a RowType) -> Self {
+        let nested = build_nested_deserializers(row_type);
         Self {
             row_type: Cow::Borrowed(row_type),
+            nested,
         }
     }
 
     pub fn new_from_owned(row_type: RowType) -> Self {
+        let nested = build_nested_deserializers(&row_type);
         Self {
             row_type: Cow::Owned(row_type),
+            nested,
         }
     }
 
@@ -127,65 +152,52 @@ impl<'a> CompactedRowDeserializer<'a> {
                 }
                 DataType::Date(_) => {
                     let (val, next) = reader.read_int(cursor)?;
-                    (Datum::Date(crate::row::datum::Date::new(val)), next)
+                    (Datum::Date(Date::new(val)), next)
                 }
                 DataType::Time(_) => {
                     let (val, next) = reader.read_int(cursor)?;
-                    (Datum::Time(crate::row::datum::Time::new(val)), next)
+                    (Datum::Time(Time::new(val)), next)
                 }
                 DataType::Timestamp(timestamp_type) => {
                     let precision = timestamp_type.precision();
-                    if crate::row::datum::TimestampNtz::is_compact(precision) {
-                        // Compact: only milliseconds
+                    if TimestampNtz::is_compact(precision) {
                         let (millis, next) = reader.read_long(cursor)?;
-                        (
-                            Datum::TimestampNtz(crate::row::datum::TimestampNtz::new(millis)),
-                            next,
-                        )
+                        (Datum::TimestampNtz(TimestampNtz::new(millis)), next)
                     } else {
-                        // Non-compact: milliseconds + nanos
                         let (millis, mid) = reader.read_long(cursor)?;
                         let (nanos, next) = reader.read_int(mid)?;
-                        let timestamp = crate::row::datum::TimestampNtz::from_millis_nanos(
-                            millis, nanos,
-                        )
-                        .map_err(|e| IllegalArgument {
-                            message: format!(
-                                "Invalid nano_of_millisecond value in compacted row timestamp: {e}"
-                            ),
-                        })?;
+                        let timestamp = TimestampNtz::from_millis_nanos(millis, nanos).map_err(
+                            |e| IllegalArgument {
+                                message: format!(
+                                    "Invalid nano_of_millisecond value in compacted row timestamp: {e}"
+                                ),
+                            },
+                        )?;
                         (Datum::TimestampNtz(timestamp), next)
                     }
                 }
                 DataType::TimestampLTz(timestamp_ltz_type) => {
                     let precision = timestamp_ltz_type.precision();
-                    if crate::row::datum::TimestampLtz::is_compact(precision) {
-                        // Compact: only epoch milliseconds
+                    if TimestampLtz::is_compact(precision) {
                         let (epoch_millis, next) = reader.read_long(cursor)?;
-                        (
-                            Datum::TimestampLtz(crate::row::datum::TimestampLtz::new(epoch_millis)),
-                            next,
-                        )
+                        (Datum::TimestampLtz(TimestampLtz::new(epoch_millis)), next)
                     } else {
-                        // Non-compact: epoch milliseconds + nanos
                         let (epoch_millis, mid) = reader.read_long(cursor)?;
                         let (nanos, next) = reader.read_int(mid)?;
-                        let timestamp_ltz = crate::row::datum::TimestampLtz::from_millis_nanos(
-                            epoch_millis,
-                            nanos,
-                        )
-                        .map_err(|e| IllegalArgument {
-                            message: format!(
-                                "Invalid nano_of_millisecond value in compacted row timestamp_ltz: {e}"
-                            ),
-                        })?;
+                        let timestamp_ltz =
+                            TimestampLtz::from_millis_nanos(epoch_millis, nanos).map_err(|e| {
+                                IllegalArgument {
+                                    message: format!(
+                                        "Invalid nano_of_millisecond value in compacted row timestamp_ltz: {e}"
+                                    ),
+                                }
+                            })?;
                         (Datum::TimestampLtz(timestamp_ltz), next)
                     }
                 }
                 DataType::Array(_) => {
                     let (bytes, next) = reader.read_bytes(cursor)?;
-                    let array = crate::row::binary_array::FlussArray::from_bytes(bytes)?;
-                    (Datum::Array(array), next)
+                    (Datum::Array(FlussArray::from_bytes(bytes)?), next)
                 }
                 DataType::Row(row_type) => {
                     let (nested_bytes, next) = reader.read_bytes(cursor)?;
@@ -195,7 +207,9 @@ impl<'a> CompactedRowDeserializer<'a> {
                         0,
                         nested_bytes.len(),
                     );
-                    let nested_deser = CompactedRowDeserializer::new_from_owned(row_type.clone());
+                    let nested_deser = self.nested[col_pos]
+                        .as_ref()
+                        .expect("ROW field must have nested deserializer");
                     let nested_row = nested_deser.deserialize(&nested_reader)?;
                     (Datum::Row(Box::new(nested_row)), next)
                 }
@@ -342,9 +356,12 @@ impl<'a> CompactedRowReader<'a> {
 #[cfg(test)]
 mod row_type_tests {
     use crate::metadata::{DataType, DataTypes, RowType};
-    use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
-    use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
     use crate::row::binary::ValueWriter;
+    use crate::row::compacted::compacted_row_reader::{
+        CompactedRowDeserializer, CompactedRowReader,
+    };
+    use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
+    use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
     use crate::row::field_getter::FieldGetter;
     use crate::row::{Datum, GenericRow, InternalRow};
 
@@ -374,13 +391,12 @@ mod row_type_tests {
             0,
             bytes.len(),
         );
-        let result = deser.deserialize(&reader);
+        let result = deser.deserialize(&reader).expect("deserialize");
         verify(&result);
     }
 
     #[test]
     fn test_row_simple_nesting() {
-        // ROW<INT, STRING> nested inside an outer row
         let inner_row_type = RowType::with_data_types_and_field_names(
             vec![DataTypes::int(), DataTypes::string()],
             vec!["x", "label"],
@@ -408,11 +424,8 @@ mod row_type_tests {
 
     #[test]
     fn test_row_deep_nesting() {
-        // ROW<ROW<INT>> — two levels of nesting
-        let inner_inner_row_type = RowType::with_data_types_and_field_names(
-            vec![DataTypes::int()],
-            vec!["n"],
-        );
+        let inner_inner_row_type =
+            RowType::with_data_types_and_field_names(vec![DataTypes::int()], vec!["n"]);
         let inner_row_type = RowType::with_data_types_and_field_names(
             vec![DataType::Row(inner_inner_row_type.clone())],
             vec!["inner"],
@@ -476,4 +489,79 @@ mod row_type_tests {
             assert!(result2.is_null_at(1).unwrap());
         });
     }
+
+    #[test]
+    fn test_row_all_primitives_round_trip() {
+        let inner_row_type = RowType::with_data_types_and_field_names(
+            vec![
+                DataTypes::boolean(),
+                DataTypes::tinyint(),
+                DataTypes::smallint(),
+                DataTypes::int(),
+                DataTypes::bigint(),
+                DataTypes::float(),
+                DataTypes::double(),
+                DataTypes::string(),
+                DataTypes::bytes(),
+                DataTypes::date(),
+                DataTypes::time(),
+                DataTypes::timestamp(),
+                DataTypes::timestamp_ltz(),
+            ],
+            vec![
+                "b", "tin", "sm", "i", "lo", "fl", "db", "str", "by", "dt", "ti", "tsn", "tsl",
+            ],
+        );
+        let outer_row_type = RowType::with_data_types_and_field_names(
+            vec![DataType::Row(inner_row_type.clone())],
+            vec!["nested"],
+        );
+
+        let mut inner = GenericRow::new(13);
+        inner.set_field(0, true);
+        inner.set_field(1, 7_i8);
+        inner.set_field(2, -42_i16);
+        inner.set_field(3, 100_000_i32);
+        inner.set_field(4, 9_876_543_210_i64);
+        inner.set_field(5, std::f32::consts::PI);
+        inner.set_field(6, std::f64::consts::E);
+        inner.set_field(7, "hello world");
+        inner.set_field(8, b"binary".as_slice());
+        inner.set_field(9, Datum::Date(Date::new(20476)));
+        inner.set_field(10, Datum::Time(Time::new(36_827_123)));
+        inner.set_field(
+            11,
+            Datum::TimestampNtz(TimestampNtz::new(1_769_163_227_123)),
+        );
+        inner.set_field(
+            12,
+            Datum::TimestampLtz(TimestampLtz::new(1_769_163_227_123)),
+        );
+
+        let mut outer = GenericRow::new(1);
+        outer.set_field(0, Datum::Row(Box::new(inner)));
+
+        round_trip(&outer_row_type, &outer, |result| {
+            let n = result.get_row(0).unwrap();
+            assert!(n.get_boolean(0).unwrap());
+            assert_eq!(n.get_byte(1).unwrap(), 7);
+            assert_eq!(n.get_short(2).unwrap(), -42);
+            assert_eq!(n.get_int(3).unwrap(), 100_000);
+            assert_eq!(n.get_long(4).unwrap(), 9_876_543_210);
+            assert!((n.get_float(5).unwrap() - std::f32::consts::PI).abs() < f32::EPSILON);
+            assert!((n.get_double(6).unwrap() - std::f64::consts::E).abs() < f64::EPSILON);
+            assert_eq!(n.get_string(7).unwrap(), "hello world");
+            assert_eq!(n.get_bytes(8).unwrap(), b"binary");
+            assert_eq!(n.get_date(9).unwrap().get_inner(), 20476);
+            assert_eq!(n.get_time(10).unwrap().get_inner(), 36_827_123);
+            assert_eq!(
+                n.get_timestamp_ntz(11, 6).unwrap().get_millisecond(),
+                1_769_163_227_123,
+            );
+            assert_eq!(
+                n.get_timestamp_ltz(12, 6).unwrap().get_epoch_millisecond(),
+                1_769_163_227_123,
+            );
+        });
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/mod.rs b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
index 3361078321..fa603d23b2 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/mod.rs
@@ -23,7 +23,7 @@ mod compacted_row_writer;
 
 pub use compacted_key_writer::CompactedKeyWriter;
 #[allow(unused_imports)]
-pub use compacted_row::CompactedRow;
+pub use compacted_row::{CompactedRow, calculate_bit_set_width_in_bytes};
 #[allow(unused_imports)]
 pub use compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
 #[allow(unused_imports)]
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index 865d4b4f8e..d3f19a1e60 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -15,18 +15,21 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use crate::error::Error::RowConvertError;
+use crate::error::Error::{IllegalArgument, RowConvertError};
 use crate::error::Result;
+use crate::metadata::{DataType, RowType};
 use crate::row::Decimal;
 use crate::row::GenericRow;
+use crate::row::InternalRow;
 use crate::row::binary_array::FlussArray;
+use crate::row::field_getter::FieldGetter;
 use arrow::array::{
     ArrayBuilder, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
     FixedSizeBinaryBuilder, Float32Builder, Float64Builder, Int8Builder, Int16Builder,
-    Int32Builder, Int64Builder, ListBuilder, StringBuilder, Time32MillisecondBuilder,
-    Time32SecondBuilder, Time64MicrosecondBuilder, Time64NanosecondBuilder,
-    TimestampMicrosecondBuilder, TimestampMillisecondBuilder, TimestampNanosecondBuilder,
-    TimestampSecondBuilder,
+    Int32Builder, Int64Builder, ListBuilder, StringBuilder, StructBuilder,
+    Time32MillisecondBuilder, Time32SecondBuilder, Time64MicrosecondBuilder,
+    Time64NanosecondBuilder, TimestampMicrosecondBuilder, TimestampMillisecondBuilder,
+    TimestampNanosecondBuilder, TimestampSecondBuilder,
 };
 use arrow::datatypes as arrow_schema;
 use arrow::error::ArrowError;
@@ -146,6 +149,30 @@ impl Datum<'_> {
     }
 }
 
+impl<'a> Datum<'a> {
+    pub fn into_owned(self) -> Datum<'static> {
+        match self {
+            Datum::Null => Datum::Null,
+            Datum::Bool(v) => Datum::Bool(v),
+            Datum::Int8(v) => Datum::Int8(v),
+            Datum::Int16(v) => Datum::Int16(v),
+            Datum::Int32(v) => Datum::Int32(v),
+            Datum::Int64(v) => Datum::Int64(v),
+            Datum::Float32(v) => Datum::Float32(v),
+            Datum::Float64(v) => Datum::Float64(v),
+            Datum::String(s) => Datum::String(Cow::Owned(s.into_owned())),
+            Datum::Blob(b) => Datum::Blob(Cow::Owned(b.into_owned())),
+            Datum::Decimal(d) => Datum::Decimal(d),
+            Datum::Date(d) => Datum::Date(d),
+            Datum::Time(t) => Datum::Time(t),
+            Datum::TimestampNtz(t) => Datum::TimestampNtz(t),
+            Datum::TimestampLtz(t) => Datum::TimestampLtz(t),
+            Datum::Array(a) => Datum::Array(a),
+            Datum::Row(boxed) => Datum::Row(Box::new(boxed.into_owned())),
+        }
+    }
+}
+
 // ----------- implement from
 impl<'a> From<i32> for Datum<'a> {
     #[inline]
@@ -563,42 +590,29 @@ fn append_fluss_array_to_list_builder(
 fn read_datum_from_fluss_array<'a>(
     arr: &FlussArray,
     pos: usize,
-    element_type: &crate::metadata::DataType,
+    element_type: &DataType,
 ) -> Result<Datum<'a>> {
-    use crate::metadata::DataType;
-
-    Ok(match element_type {
-        DataType::Boolean(_) => Datum::Bool(arr.get_boolean(pos)?),
-        DataType::TinyInt(_) => Datum::Int8(arr.get_byte(pos)?),
-        DataType::SmallInt(_) => Datum::Int16(arr.get_short(pos)?),
-        DataType::Int(_) => Datum::Int32(arr.get_int(pos)?),
-        DataType::BigInt(_) => Datum::Int64(arr.get_long(pos)?),
-        DataType::Float(_) => Datum::Float32(arr.get_float(pos)?.into()),
-        DataType::Double(_) => Datum::Float64(arr.get_double(pos)?.into()),
-        DataType::Char(_) | DataType::String(_) => {
-            Datum::String(Cow::Owned(arr.get_string(pos)?.to_string()))
-        }
-        DataType::Binary(_) | DataType::Bytes(_) => {
-            Datum::Blob(Cow::Owned(arr.get_binary(pos)?.to_vec()))
-        }
-        DataType::Decimal(dt) => {
-            Datum::Decimal(arr.get_decimal(pos, dt.precision(), dt.scale())?)
-        }
-        DataType::Date(_) => Datum::Date(arr.get_date(pos)?),
-        DataType::Time(_) => Datum::Time(arr.get_time(pos)?),
-        DataType::Timestamp(t) => Datum::TimestampNtz(arr.get_timestamp_ntz(pos, t.precision())?),
-        DataType::TimestampLTz(t) => {
-            Datum::TimestampLtz(arr.get_timestamp_ltz(pos, t.precision())?)
-        }
-        DataType::Array(_) => Datum::Array(arr.get_array(pos)?),
-        _ => {
-            return Err(RowConvertError {
-                message: format!(
-                    "Unsupported element type for FlussArray → Arrow conversion: {element_type:?}"
-                ),
-            });
-        }
-    })
+    if let DataType::Row(row_type) = element_type {
+        let compacted = arr.get_row(pos, row_type)?;
+        return Ok(Datum::Row(Box::new(internal_row_to_owned_generic(
+            &compacted, row_type,
+        )?)));
+    }
+
+    let getter = FieldGetter::create(element_type, pos);
+    Ok(getter.get_field(arr)?.into_owned())
+}
+
+fn internal_row_to_owned_generic(
+    row: &dyn InternalRow,
+    row_type: &RowType,
+) -> Result<GenericRow<'static>> {
+    let mut owned = GenericRow::new(row_type.fields().len());
+    for (i, field) in row_type.fields().iter().enumerate() {
+        let getter = FieldGetter::create(field.data_type(), i);
+        owned.set_field(i, getter.get_field(row)?.into_owned());
+    }
+    Ok(owned)
 }
 
 fn append_null_for_type(
@@ -661,12 +675,74 @@ fn append_null_for_type(
         arrow_schema::DataType::List(_) => {
             downcast_null!(ListBuilder<Box<dyn ArrayBuilder>>)
         }
+        arrow_schema::DataType::Struct(fields) => {
+            // StructBuilder::append_null only flips parent validity; children must each get a null too.
+            let struct_builder = builder
+                .as_any_mut()
+                .downcast_mut::<StructBuilder>()
+                .ok_or_else(|| RowConvertError {
+                    message: format!(
+                        "Builder type mismatch: expected StructBuilder for {data_type:?}",
+                    ),
+                })?;
+            let cloned_fields = fields.clone();
+            {
+                let field_builders = struct_builder.field_builders_mut();
+                for (i, field) in cloned_fields.iter().enumerate() {
+                    append_null_for_type(field_builders[i].as_mut(), field.data_type())?;
+                }
+            }
+            struct_builder.append(false);
+            Ok(())
+        }
         _ => Err(RowConvertError {
             message: format!("Unsupported Arrow data type for null append: {data_type:?}"),
         }),
     }
 }
 
+fn append_generic_row_to_struct_builder(
+    row: &GenericRow<'_>,
+    builder: &mut dyn ArrayBuilder,
+    data_type: &arrow_schema::DataType,
+) -> Result<()> {
+    let struct_builder = builder
+        .as_any_mut()
+        .downcast_mut::<StructBuilder>()
+        .ok_or_else(|| RowConvertError {
+            message: "Builder type mismatch for Row: expected StructBuilder".to_string(),
+        })?;
+
+    let fields = match data_type {
+        arrow_schema::DataType::Struct(fields) => fields.clone(),
+        _ => {
+            return Err(RowConvertError {
+                message: format!("Expected Struct Arrow type for Row datum, got: {data_type:?}"),
+            });
+        }
+    };
+
+    if row.values.len() != fields.len() {
+        return Err(RowConvertError {
+            message: format!(
+                "Row arity mismatch: schema has {} fields, got {}",
+                fields.len(),
+                row.values.len(),
+            ),
+        });
+    }
+
+    {
+        let field_builders = struct_builder.field_builders_mut();
+        for (i, datum) in row.values.iter().enumerate() {
+            let child = field_builders[i].as_mut();
+            datum.append_to(child, fields[i].data_type())?;
+        }
+    }
+    struct_builder.append(true);
+    Ok(())
+}
+
 impl Datum<'_> {
     pub fn append_to(
         &self,
@@ -888,10 +964,8 @@ impl Datum<'_> {
             Datum::Array(arr) => {
                 return append_fluss_array_to_list_builder(arr, builder, data_type);
             }
-            Datum::Row(_) => {
-                return Err(RowConvertError {
-                    message: "append_to is not supported for Row type".to_string(),
-                });
+            Datum::Row(row) => {
+                return append_generic_row_to_struct_builder(row, builder, data_type);
             }
         }
 
@@ -981,7 +1055,7 @@ impl TimestampNtz {
 
     pub fn from_millis_nanos(millisecond: i64, nano_of_millisecond: i32) -> Result<Self> {
         if !(0..=MAX_NANO_OF_MILLISECOND).contains(&nano_of_millisecond) {
-            return Err(crate::error::Error::IllegalArgument {
+            return Err(IllegalArgument {
                 message: format!(
                     "nanoOfMillisecond must be in range [0, {MAX_NANO_OF_MILLISECOND}], got: {nano_of_millisecond}"
                 ),
@@ -1025,7 +1099,7 @@ impl TimestampLtz {
 
     pub fn from_millis_nanos(epoch_millisecond: i64, nano_of_millisecond: i32) -> Result<Self> {
         if !(0..=MAX_NANO_OF_MILLISECOND).contains(&nano_of_millisecond) {
-            return Err(crate::error::Error::IllegalArgument {
+            return Err(IllegalArgument {
                 message: format!(
                     "nanoOfMillisecond must be in range [0, {MAX_NANO_OF_MILLISECOND}], got: {nano_of_millisecond}"
                 ),
@@ -1149,7 +1223,7 @@ mod tests {
         let err = Datum::Int32(1)
             .append_to(&mut builder, &arrow_schema::DataType::Utf8)
             .unwrap_err();
-        assert!(matches!(err, crate::error::Error::RowConvertError { .. }));
+        assert!(matches!(err, RowConvertError { .. }));
     }
 
     #[test]
@@ -1177,6 +1251,13 @@ mod tests {
 #[cfg(test)]
 mod timestamp_tests {
     use super::*;
+    use crate::metadata::{DataField, DataTypes};
+    use crate::record::to_arrow_type;
+    use crate::row::InternalRow;
+    use crate::row::column::ColumnarRow;
+    use arrow::array::{RecordBatch, StructArray, StructBuilder};
+    use arrow::datatypes::{Field, Fields, Schema};
+    use std::sync::Arc;
 
     #[test]
     fn test_timestamp_valid_nanos() {
@@ -1221,4 +1302,62 @@ mod timestamp_tests {
         assert!(result_ltz.is_err());
         assert!(result_ltz.unwrap_err().to_string().contains(&expected_msg));
     }
+
+    #[test]
+    fn test_row_arrow_struct_round_trip() {
+        let row_type_owned = DataTypes::row(vec![
+            DataField::new("x", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+        let arrow_struct_dt = to_arrow_type(&row_type_owned).unwrap();
+        let struct_fields: Fields = match &arrow_struct_dt {
+            arrow_schema::DataType::Struct(f) => f.clone(),
+            _ => unreachable!(),
+        };
+
+        let mut struct_builder = StructBuilder::from_fields(struct_fields.clone(), 3);
+
+        let mut r0 = GenericRow::new(2);
+        r0.set_field(0, 42_i32);
+        r0.set_field(1, "hello");
+        Datum::Row(Box::new(r0))
+            .append_to(&mut struct_builder, &arrow_struct_dt)
+            .expect("append row 0");
+
+        Datum::Null
+            .append_to(&mut struct_builder, &arrow_struct_dt)
+            .expect("append null row");
+
+        let mut r2 = GenericRow::new(2);
+        r2.set_field(0, -7_i32);
+        r2.set_field(1, Datum::Null);
+        Datum::Row(Box::new(r2))
+            .append_to(&mut struct_builder, &arrow_struct_dt)
+            .expect("append row 2");
+
+        let struct_array: StructArray = struct_builder.finish();
+
+        let schema = Arc::new(Schema::new(vec![Field::new(
+            "nested",
+            arrow_struct_dt.clone(),
+            true,
+        )]));
+        let batch = Arc::new(
+            RecordBatch::try_new(schema, vec![Arc::new(struct_array)]).expect("record batch"),
+        );
+
+        let mut columnar = ColumnarRow::new(batch, 0, None);
+
+        let nested = columnar.get_row(0).expect("get_row 0");
+        assert_eq!(nested.get_int(0).unwrap(), 42);
+        assert_eq!(nested.get_string(1).unwrap(), "hello");
+
+        columnar.set_row_id(1);
+        assert!(columnar.is_null_at(0).unwrap(), "row 1 should be null");
+
+        columnar.set_row_id(2);
+        let nested = columnar.get_row(0).expect("get_row 2");
+        assert_eq!(nested.get_int(0).unwrap(), -7);
+        assert!(nested.is_null_at(1).unwrap(), "label should be null");
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
index a6ba580f2a..c7f16d6ca5 100644
--- a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
@@ -111,9 +111,10 @@ mod tests {
     use super::*;
     use crate::metadata::{DataType, DataTypes};
     use crate::row::binary_array::FlussArrayWriter;
-    use crate::row::{Datum, GenericRow};
+    use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
+    use crate::row::{Datum, Decimal, FlussArray, GenericRow};
 
-    fn build_int_array(values: &[i32]) -> crate::row::FlussArray {
+    fn build_int_array(values: &[i32]) -> FlussArray {
         let mut w = FlussArrayWriter::new(values.len(), &DataTypes::int());
         for (i, v) in values.iter().enumerate() {
             w.write_int(i, *v);
@@ -121,7 +122,7 @@ mod tests {
         w.complete().unwrap()
     }
 
-    fn build_nullable_int_array(values: &[Option<i32>]) -> crate::row::FlussArray {
+    fn build_nullable_int_array(values: &[Option<i32>]) -> FlussArray {
         let mut w = FlussArrayWriter::new(values.len(), &DataTypes::int());
         for (i, v) in values.iter().enumerate() {
             match v {
@@ -132,7 +133,7 @@ mod tests {
         w.complete().unwrap()
     }
 
-    fn build_float_array(values: &[f32]) -> crate::row::FlussArray {
+    fn build_float_array(values: &[f32]) -> FlussArray {
         let mut w = FlussArrayWriter::new(values.len(), &DataTypes::float().as_non_nullable());
         for (i, v) in values.iter().enumerate() {
             w.write_float(i, *v);
@@ -140,7 +141,7 @@ mod tests {
         w.complete().unwrap()
     }
 
-    fn build_nested_string_array() -> crate::row::FlussArray {
+    fn build_nested_string_array() -> FlussArray {
         let mut inner_1 = FlussArrayWriter::new(3, &DataTypes::string());
         inner_1.write_string(0, "a");
         inner_1.set_null_at(1);
@@ -369,32 +370,32 @@ mod tests {
 
         // Exact values from Java's IndexedRowTest.genRecordForAllTypes()
         let row = GenericRow::from_data(vec![
-            Datum::from(true),                                   // BOOLEAN: true
-            Datum::from(2i8),                                    // TINYINT: 2
-            Datum::from(10i16),                                  // SMALLINT: 10
-            Datum::from(100i32),                                 // INT: 100
-            Datum::from(-6101065172474983726i64),                // BIGINT
-            Datum::from(13.2f32),                                // FLOAT: 13.2
-            Datum::from(15.21f64),                               // DOUBLE: 15.21
-            Datum::Date(crate::row::datum::Date::new(19655)), // DATE: 2023-10-25 (19655 days since epoch)
-            Datum::Time(crate::row::datum::Time::new(34200000)), // TIME: 09:30:00.0
-            Datum::from("1234567890".as_bytes()),             // BINARY(20)
-            Datum::from("20".as_bytes()),                     // BYTES
-            Datum::from("1"),                                 // CHAR(2): "1"
-            Datum::from("hello"),                             // STRING: "hello"
-            Datum::Decimal(crate::row::Decimal::from_unscaled_long(9, 5, 2).unwrap()), // DECIMAL(5,2)
+            Datum::from(true),                                             // BOOLEAN: true
+            Datum::from(2i8),                                              // TINYINT: 2
+            Datum::from(10i16),                                            // SMALLINT: 10
+            Datum::from(100i32),                                           // INT: 100
+            Datum::from(-6101065172474983726i64),                          // BIGINT
+            Datum::from(13.2f32),                                          // FLOAT: 13.2
+            Datum::from(15.21f64),                                         // DOUBLE: 15.21
+            Datum::Date(Date::new(19655)), // DATE: 2023-10-25 (19655 days since epoch)
+            Datum::Time(Time::new(34200000)), // TIME: 09:30:00.0
+            Datum::from("1234567890".as_bytes()), // BINARY(20)
+            Datum::from("20".as_bytes()),  // BYTES
+            Datum::from("1"),              // CHAR(2): "1"
+            Datum::from("hello"),          // STRING: "hello"
+            Datum::Decimal(Decimal::from_unscaled_long(9, 5, 2).unwrap()), // DECIMAL(5,2)
             Datum::Decimal(
-                crate::row::Decimal::from_big_decimal(
+                Decimal::from_big_decimal(
                     bigdecimal::BigDecimal::new(bigdecimal::num_bigint::BigInt::from(10), 0),
                     20,
                     0,
                 )
                 .unwrap(),
             ), // DECIMAL(20,0)
-            Datum::TimestampNtz(crate::row::datum::TimestampNtz::new(1698235273182)), // TIMESTAMP(1)
-            Datum::TimestampNtz(crate::row::datum::TimestampNtz::new(1698235273182)), // TIMESTAMP(5)
-            Datum::TimestampLtz(crate::row::datum::TimestampLtz::new(1698235273182)), // TIMESTAMP_LTZ(1)
-            Datum::TimestampLtz(crate::row::datum::TimestampLtz::new(1698235273182)), // TIMESTAMP_LTZ(5)
+            Datum::TimestampNtz(TimestampNtz::new(1698235273182)), // TIMESTAMP(1)
+            Datum::TimestampNtz(TimestampNtz::new(1698235273182)), // TIMESTAMP(5)
+            Datum::TimestampLtz(TimestampLtz::new(1698235273182)), // TIMESTAMP_LTZ(1)
+            Datum::TimestampLtz(TimestampLtz::new(1698235273182)), // TIMESTAMP_LTZ(5)
             Datum::Array(build_nullable_int_array(&[
                 Some(1),
                 Some(2),
@@ -502,10 +503,7 @@ mod tests {
             vec!["x", "label"],
         );
         let row_type = RowType::with_data_types_and_field_names(
-            vec![
-                DataTypes::int(),
-                DataType::Row(inner_row_type.clone()),
-            ],
+            vec![DataTypes::int(), DataType::Row(inner_row_type.clone())],
             vec!["id", "nested"],
         );
 
diff --git a/fluss-rust/crates/fluss/src/row/lookup_row.rs b/fluss-rust/crates/fluss/src/row/lookup_row.rs
index c002369d13..76505abf63 100644
--- a/fluss-rust/crates/fluss/src/row/lookup_row.rs
+++ b/fluss-rust/crates/fluss/src/row/lookup_row.rs
@@ -24,7 +24,7 @@ use crate::error::Result;
 use crate::row::compacted::CompactedRow;
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
 use crate::row::projected_row::ProjectedRow;
-use crate::row::{Decimal, FlussArray, InternalRow};
+use crate::row::{Decimal, FlussArray, GenericRow, InternalRow};
 
 pub struct LookupRow<'a> {
     inner: Inner<'a>,
@@ -116,6 +116,9 @@ impl<'a> InternalRow for LookupRow<'a> {
     fn get_array(&self, pos: usize) -> Result<FlussArray> {
         delegate!(self, get_array, pos)
     }
+    fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
+        delegate!(self, get_row, pos)
+    }
     fn as_encoded_bytes(&self, write_format: WriteFormat) -> Option<&[u8]> {
         delegate!(self, as_encoded_bytes, write_format)
     }
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index fb599fc9af..36f9a1c250 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -34,7 +34,6 @@ mod row_decoder;
 use crate::client::WriteFormat;
 pub use binary_array::FlussArray;
 use bytes::Bytes;
-use serde::Serialize;
 pub use column::*;
 pub use compacted::CompactedRow;
 pub use datum::*;
@@ -44,6 +43,7 @@ pub(crate) use fixed_schema_decoder::FixedSchemaDecoder;
 pub use lookup_row::LookupRow;
 pub(crate) use projected_row::ProjectedRow;
 pub use row_decoder::{CompactedRowDecoder, RowDecoder, RowDecoderFactory};
+use serde::Serialize;
 
 pub struct BinaryRow<'a> {
     data: BinaryDataWrapper<'a>,
@@ -133,7 +133,7 @@ pub trait InternalRow: Send + Sync {
 
     /// Returns the nested row value at the given position
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
-        Err(crate::error::Error::IllegalArgument {
+        Err(IllegalArgument {
             message: format!("get_row not supported at position {pos}"),
         })
     }
@@ -313,6 +313,17 @@ impl<'a> InternalRow for GenericRow<'a> {
     }
 }
 
+impl<'a> GenericRow<'a> {
+    /// Consumes this row and rebuilds it as a `GenericRow<'static>` by passing
+    /// every value through `Datum::into_owned` (borrowed `Cow`s are promoted to
+    /// owned, nested rows recurse), so it can outlive the bytes it was decoded from.
+    pub fn into_owned(self) -> GenericRow<'static> {
+        // Convert datum by datum, preserving field order.
+        let values = self.values.into_iter().map(Datum::into_owned).collect();
+        GenericRow { values }
+    }
+}
+
 impl<'a> GenericRow<'a> {
     pub fn from_data(data: Vec<impl Into<Datum<'a>>>) -> GenericRow<'a> {
         GenericRow {
diff --git a/fluss-rust/crates/fluss/src/row/projected_row.rs b/fluss-rust/crates/fluss/src/row/projected_row.rs
index cdd946a5fc..fc4a521ee0 100644
--- a/fluss-rust/crates/fluss/src/row/projected_row.rs
+++ b/fluss-rust/crates/fluss/src/row/projected_row.rs
@@ -23,7 +23,7 @@ use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::metadata::UNEXIST_MAPPING;
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
-use crate::row::{Decimal, FlussArray, InternalRow};
+use crate::row::{Decimal, FlussArray, GenericRow, InternalRow};
 use std::sync::Arc;
 
 pub(crate) struct ProjectedRow<R> {
@@ -142,6 +142,10 @@ impl<R: InternalRow> InternalRow for ProjectedRow<R> {
         project!(self, get_array, pos)
     }
 
+    fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
+        project!(self, get_row, pos)
+    }
+
     fn as_encoded_bytes(&self, _write_format: WriteFormat) -> Option<&[u8]> {
         // Projection changes the field layout, so the inner row's
         // encoded form no longer matches.
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index 8787e88180..ee496a5a5f 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -21,9 +21,11 @@ mod kv_table_test {
     use crate::integration::utils::{
         create_partitions, create_table, get_shared_cluster, make_int_array, make_string_array,
     };
-    use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+    use fluss::metadata::{DataField, DataTypes, Schema, TableDescriptor, TablePath};
     use fluss::row::binary_array::FlussArrayWriter;
-    use fluss::row::{FlussArray, GenericRow, InternalRow};
+    use fluss::row::{
+        Date, Datum, Decimal, FlussArray, GenericRow, InternalRow, Time, TimestampLtz, TimestampNtz,
+    };
 
     fn make_key(id: i32) -> GenericRow<'static> {
         make_key_with_field_count(id, 3)
@@ -284,8 +286,6 @@ mod kv_table_test {
 
     #[tokio::test]
     async fn partial_update() {
-        use fluss::row::Datum;
-
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
@@ -293,6 +293,11 @@ mod kv_table_test {
 
         let table_path = TablePath::new("fluss", "test_partial_update");
 
+        let nested_type = DataTypes::row(vec![
+            DataField::new("seq", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+
         let table_descriptor = TableDescriptor::builder()
             .schema(
                 Schema::builder()
@@ -300,6 +305,7 @@ mod kv_table_test {
                     .column("name", DataTypes::string())
                     .column("age", DataTypes::bigint())
                     .column("score", DataTypes::bigint())
+                    .column("nested", nested_type)
                     .primary_key(vec!["id"])
                     .build()
                     .expect("Failed to build schema"),
@@ -314,24 +320,26 @@ mod kv_table_test {
             .await
             .expect("Failed to get table");
 
-        // Insert initial record with all columns
         let table_upsert = table.new_upsert().expect("Failed to create upsert");
         let upsert_writer = table_upsert
             .create_writer()
             .expect("Failed to create writer");
 
-        let mut row = GenericRow::new(4);
+        let mut nested0 = GenericRow::new(2);
+        nested0.set_field(0, 10_i32);
+        nested0.set_field(1, "alpha");
+        let mut row = GenericRow::new(5);
         row.set_field(0, 1);
         row.set_field(1, "Verso");
         row.set_field(2, 32i64);
         row.set_field(3, 6942i64);
+        row.set_field(4, Datum::Row(Box::new(nested0)));
         upsert_writer
             .upsert(&row)
             .expect("Failed to upsert initial row")
             .await
             .expect("Failed to wait for upsert acknowledgment");
 
-        // Verify initial record
         let mut lookuper = table
             .new_lookup()
             .expect("Failed to create lookup")
@@ -351,8 +359,10 @@ mod kv_table_test {
         assert_eq!(found_row.get_string(1).unwrap(), "Verso");
         assert_eq!(found_row.get_long(2).unwrap(), 32i64);
         assert_eq!(found_row.get_long(3).unwrap(), 6942i64);
+        let nested = found_row.get_row(4).unwrap();
+        assert_eq!(nested.get_int(0).unwrap(), 10);
+        assert_eq!(nested.get_string(1).unwrap(), "alpha");
 
-        // Create partial update writer to update only score column
         let partial_upsert = table_upsert
             .partial_update_with_column_names(&["id", "score"])
             .expect("Failed to create TableUpsert with partial update");
@@ -360,19 +370,18 @@ mod kv_table_test {
             .create_writer()
             .expect("Failed to create UpsertWriter with partial write");
 
-        // Update only the score column (await acknowledgment)
-        let mut partial_row = GenericRow::new(4);
+        let mut partial_row = GenericRow::new(5);
         partial_row.set_field(0, 1);
-        partial_row.set_field(1, Datum::Null); // not in partial update column
-        partial_row.set_field(2, Datum::Null); // not in partial update column
+        partial_row.set_field(1, Datum::Null);
+        partial_row.set_field(2, Datum::Null);
         partial_row.set_field(3, 420i64);
+        partial_row.set_field(4, Datum::Null);
         partial_writer
             .upsert(&partial_row)
             .expect("Failed to upsert")
             .await
             .expect("Failed to wait for upsert acknowledgment");
 
-        // Verify partial update - name and age should remain unchanged
         let result = lookuper
             .lookup(&make_key(1))
             .await
@@ -398,6 +407,56 @@ mod kv_table_test {
             420,
             "score should be updated to 420"
         );
+        let nested = found_row.get_row(4).unwrap();
+        assert_eq!(
+            nested.get_int(0).unwrap(),
+            10,
+            "ROW preserved across non-ROW partial update"
+        );
+        assert_eq!(nested.get_string(1).unwrap(), "alpha");
+
+        let partial_nested_upsert = table_upsert
+            .partial_update_with_column_names(&["id", "nested"])
+            .expect("partial_update_with_column_names");
+        let partial_nested_writer = partial_nested_upsert
+            .create_writer()
+            .expect("partial writer");
+        let mut new_nested = GenericRow::new(2);
+        new_nested.set_field(0, 99_i32);
+        new_nested.set_field(1, "omega");
+        let mut partial_nested = GenericRow::new(5);
+        partial_nested.set_field(0, 1);
+        partial_nested.set_field(1, Datum::Null);
+        partial_nested.set_field(2, Datum::Null);
+        partial_nested.set_field(3, Datum::Null);
+        partial_nested.set_field(4, Datum::Row(Box::new(new_nested)));
+        partial_nested_writer
+            .upsert(&partial_nested)
+            .expect("partial upsert")
+            .await
+            .expect("partial ack");
+
+        let result = lookuper
+            .lookup(&make_key(1))
+            .await
+            .expect("Failed to lookup after nested partial");
+        let found_row = result
+            .get_single_row()
+            .expect("Failed to get row")
+            .expect("Row should exist");
+        assert_eq!(
+            found_row.get_string(1).unwrap(),
+            "Verso",
+            "name preserved when ROW updated"
+        );
+        assert_eq!(
+            found_row.get_long(3).unwrap(),
+            420,
+            "score preserved when ROW updated"
+        );
+        let nested = found_row.get_row(4).unwrap();
+        assert_eq!(nested.get_int(0).unwrap(), 99);
+        assert_eq!(nested.get_string(1).unwrap(), "omega");
 
         admin
             .drop_table(&table_path, false)
@@ -414,7 +473,11 @@ mod kv_table_test {
 
         let table_path = TablePath::new("fluss", "test_partitioned_kv_table");
 
-        // Create a partitioned KV table with region as partition key
+        let nested_type = DataTypes::row(vec![
+            DataField::new("seq", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+
         let table_descriptor = TableDescriptor::builder()
             .schema(
                 Schema::builder()
@@ -422,6 +485,7 @@ mod kv_table_test {
                     .column("user_id", DataTypes::int())
                     .column("name", DataTypes::string())
                     .column("score", DataTypes::bigint())
+                    .column("nested", nested_type)
                     .primary_key(vec!["region", "user_id"])
                     .build()
                     .expect("Failed to build schema"),
@@ -432,7 +496,6 @@ mod kv_table_test {
 
         create_table(&admin, &table_path, &table_descriptor).await;
 
-        // Create partitions for each region before inserting data
         create_partitions(&admin, &table_path, "region", &["US", "EU", "APAC"]).await;
 
         let connection = cluster.get_fluss_connection().await;
@@ -448,35 +511,38 @@ mod kv_table_test {
             .create_writer()
             .expect("Failed to create writer");
 
-        // Insert records with different partitions
         let test_data = [
-            ("US", 1, "Gustave", 100i64),
-            ("US", 2, "Lune", 200i64),
-            ("EU", 1, "Sciel", 150i64),
-            ("EU", 2, "Maelle", 250i64),
-            ("APAC", 1, "Noco", 300i64),
+            ("US", 1, "Gustave", 100i64, 11_i32, "a"),
+            ("US", 2, "Lune", 200i64, 22, "b"),
+            ("EU", 1, "Sciel", 150i64, 33, "c"),
+            ("EU", 2, "Maelle", 250i64, 44, "d"),
+            ("APAC", 1, "Noco", 300i64, 55, "e"),
         ];
 
-        for (region, user_id, name, score) in &test_data {
-            let mut row = GenericRow::new(4);
+        for (region, user_id, name, score, seq, label) in &test_data {
+            let mut nested = GenericRow::new(2);
+            nested.set_field(0, *seq);
+            nested.set_field(1, *label);
+            let mut row = GenericRow::new(5);
             row.set_field(0, *region);
             row.set_field(1, *user_id);
             row.set_field(2, *name);
             row.set_field(3, *score);
+            row.set_field(4, Datum::Row(Box::new(nested)));
             upsert_writer.upsert(&row).expect("Failed to upsert");
         }
         upsert_writer.flush().await.expect("Failed to flush");
 
-        // Create lookuper
         let mut lookuper = table
             .new_lookup()
             .expect("Failed to create lookup")
             .create_lookuper()
             .expect("Failed to create lookuper");
 
-        // Lookup records - the lookup key includes partition key columns
-        for (region, user_id, expected_name, expected_score) in &test_data {
-            let mut key = GenericRow::new(4);
+        for (region, user_id, expected_name, expected_score, expected_seq, expected_label) in
+            &test_data
+        {
+            let mut key = GenericRow::new(5);
             key.set_field(0, *region);
             key.set_field(1, *user_id);
 
@@ -490,14 +556,28 @@ mod kv_table_test {
             assert_eq!(row.get_int(1).unwrap(), *user_id, "user_id mismatch");
             assert_eq!(row.get_string(2).unwrap(), *expected_name, "name mismatch");
             assert_eq!(row.get_long(3).unwrap(), *expected_score, "score mismatch");
+            let nested = row.get_row(4).unwrap();
+            assert_eq!(
+                nested.get_int(0).unwrap(),
+                *expected_seq,
+                "ROW seq mismatch"
+            );
+            assert_eq!(
+                nested.get_string(1).unwrap(),
+                *expected_label,
+                "ROW label mismatch"
+            );
         }
 
-        // Test update within a partition (await acknowledgment)
-        let mut updated_row = GenericRow::new(4);
+        let mut updated_nested = GenericRow::new(2);
+        updated_nested.set_field(0, 999_i32);
+        updated_nested.set_field(1, "updated");
+        let mut updated_row = GenericRow::new(5);
         updated_row.set_field(0, "US");
         updated_row.set_field(1, 1);
         updated_row.set_field(2, "Gustave Updated");
         updated_row.set_field(3, 999i64);
+        updated_row.set_field(4, Datum::Row(Box::new(updated_nested)));
         upsert_writer
             .upsert(&updated_row)
             .expect("Failed to upsert updated row")
@@ -505,7 +585,7 @@ mod kv_table_test {
             .expect("Failed to wait for upsert acknowledgment");
 
         // Verify the update
-        let mut key = GenericRow::new(4);
+        let mut key = GenericRow::new(5);
         key.set_field(0, "US");
         key.set_field(1, 1);
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
@@ -515,9 +595,12 @@ mod kv_table_test {
             .expect("Row should exist");
         assert_eq!(row.get_string(2).unwrap(), "Gustave Updated");
         assert_eq!(row.get_long(3).unwrap(), 999);
+        let nested = row.get_row(4).unwrap();
+        assert_eq!(nested.get_int(0).unwrap(), 999);
+        assert_eq!(nested.get_string(1).unwrap(), "updated");
 
         // Lookup in non-existent partition should return empty result
-        let mut non_existent_key = GenericRow::new(4);
+        let mut non_existent_key = GenericRow::new(5);
         non_existent_key.set_field(0, "UNKNOWN_REGION");
         non_existent_key.set_field(1, 1);
         let result = lookuper
@@ -533,7 +616,7 @@ mod kv_table_test {
         );
 
         // Delete a record within a partition (await acknowledgment)
-        let mut delete_key = GenericRow::new(4);
+        let mut delete_key = GenericRow::new(5);
         delete_key.set_field(0, "EU");
         delete_key.set_field(1, 1);
         upsert_writer
@@ -543,7 +626,7 @@ mod kv_table_test {
             .expect("Failed to wait for delete acknowledgment");
 
         // Verify deletion
-        let mut key = GenericRow::new(4);
+        let mut key = GenericRow::new(5);
         key.set_field(0, "EU");
         key.set_field(1, 1);
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
@@ -556,7 +639,7 @@ mod kv_table_test {
         );
 
         // Verify other records in the same partition still exist
-        let mut key = GenericRow::new(4);
+        let mut key = GenericRow::new(5);
         key.set_field(0, "EU");
         key.set_field(1, 2);
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
@@ -572,11 +655,122 @@ mod kv_table_test {
             .expect("Failed to drop table");
     }
 
+    #[tokio::test]
+    async fn upsert_and_lookup_with_row_rich_types() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_kv_row_rich_types");
+
+        let row_type_owned = DataTypes::row(vec![ // nested ROW schema, one field per tested type
+            DataField::new("f_bool", DataTypes::boolean(), None),
+            DataField::new("f_long", DataTypes::bigint(), None),
+            DataField::new("f_float", DataTypes::float(), None),
+            DataField::new("f_double", DataTypes::double(), None),
+            DataField::new("f_str", DataTypes::string(), None),
+            DataField::new("f_bytes", DataTypes::bytes(), None),
+            DataField::new("f_decimal", DataTypes::decimal(10, 2), None),
+            DataField::new("f_date", DataTypes::date(), None),
+            DataField::new("f_time", DataTypes::time_with_precision(3), None),
+            DataField::new("f_ts_ntz", DataTypes::timestamp_with_precision(6), None),
+            DataField::new("f_ts_ltz", DataTypes::timestamp_ltz_with_precision(6), None),
+        ]);
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("nested", row_type_owned)
+                    .primary_key(vec!["id"])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let upsert = table.new_upsert().expect("Failed to create upsert");
+        let upsert_writer = upsert.create_writer().expect("Failed to create writer");
+
+        let mut nested = GenericRow::new(11);
+        nested.set_field(0, true);
+        nested.set_field(1, 9_876_543_210_i64);
+        nested.set_field(2, f32::NEG_INFINITY); // non-finite values must round-trip too
+        nested.set_field(3, f64::NAN); // verified with is_nan() below
+        nested.set_field(4, "rich types here");
+        nested.set_field(5, b"opaque".as_slice());
+        nested.set_field(6, Decimal::from_unscaled_long(54321, 10, 2).unwrap()); // 543.21
+        nested.set_field(7, Datum::Date(Date::new(20476))); // 2026-01-23 (days since epoch)
+        nested.set_field(8, Datum::Time(Time::new(36_827_123))); // 10:13:47.123 (ms of day)
+        nested.set_field(9, Datum::TimestampNtz(TimestampNtz::new(1_769_163_227_123)));
+        nested.set_field(
+            10,
+            Datum::TimestampLtz(TimestampLtz::new(1_769_163_227_123)), // 2026-01-23T10:13:47.123Z
+        );
+
+        let mut row = GenericRow::new(2);
+        row.set_field(0, 1_i32);
+        row.set_field(1, Datum::Row(Box::new(nested)));
+
+        upsert_writer
+            .upsert(&row)
+            .expect("upsert")
+            .await
+            .expect("ack");
+
+        let mut lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .create_lookuper()
+            .expect("Failed to create lookuper");
+
+        let result = lookuper
+            .lookup(&make_key_with_field_count(1, 2))
+            .await
+            .expect("lookup");
+        let r = result
+            .get_single_row()
+            .expect("get row")
+            .expect("row should exist");
+
+        let n = r.get_row(1).unwrap();
+        assert!(n.get_boolean(0).unwrap());
+        assert_eq!(n.get_long(1).unwrap(), 9_876_543_210);
+        assert!(n.get_float(2).unwrap().is_infinite());
+        assert!(n.get_float(2).unwrap().is_sign_negative());
+        assert!(n.get_double(3).unwrap().is_nan()); // NaN != NaN, so assert_eq! cannot be used
+        assert_eq!(n.get_string(4).unwrap(), "rich types here");
+        assert_eq!(n.get_bytes(5).unwrap(), b"opaque");
+        assert_eq!(
+            n.get_decimal(6, 10, 2).unwrap(),
+            Decimal::from_unscaled_long(54321, 10, 2).unwrap(),
+        );
+        assert_eq!(n.get_date(7).unwrap().get_inner(), 20476);
+        assert_eq!(n.get_time(8).unwrap().get_inner(), 36_827_123);
+        assert_eq!(
+            n.get_timestamp_ntz(9, 6).unwrap().get_millisecond(),
+            1_769_163_227_123,
+        );
+        assert_eq!(
+            n.get_timestamp_ltz(10, 6).unwrap().get_epoch_millisecond(),
+            1_769_163_227_123,
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
     /// Integration test covering put and get operations for all supported datatypes.
     #[tokio::test]
     async fn all_supported_datatypes() {
-        use fluss::row::{Date, Datum, Decimal, Time, TimestampLtz, TimestampNtz};
-
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
@@ -614,6 +808,13 @@ mod kv_table_test {
                     .column("col_bytes", DataTypes::bytes())
                     .column("col_binary", DataTypes::binary(20))
                     .column("col_array", DataTypes::array(DataTypes::string()))
+                    .column(
+                        "col_row",
+                        DataTypes::row(vec![
+                            DataField::new("seq", DataTypes::int(), None),
+                            DataField::new("label", DataTypes::string(), None),
+                        ]),
+                    )
                     .primary_key(vec!["pk_int"])
                     .build()
                     .expect("Failed to build schema"),
@@ -654,8 +855,12 @@ mod kv_table_test {
 
         let col_array = make_string_array(&[Some("fluss"), Some("rust")]);
 
+        let mut col_row_inner = GenericRow::new(2);
+        col_row_inner.set_field(0, 7_i32);
+        col_row_inner.set_field(1, "lumiere");
+
         // Upsert a row with all datatypes
-        let mut row = GenericRow::new(18);
+        let mut row = GenericRow::new(19);
         row.set_field(0, pk_int);
         row.set_field(1, col_boolean);
         row.set_field(2, col_tinyint);
@@ -674,6 +879,7 @@ mod kv_table_test {
         row.set_field(15, col_bytes);
         row.set_field(16, col_binary);
         row.set_field(17, col_array);
+        row.set_field(18, Datum::Row(Box::new(col_row_inner)));
 
         upsert_writer
             .upsert(&row)
@@ -688,7 +894,7 @@ mod kv_table_test {
             .create_lookuper()
             .expect("Failed to create lookuper");
 
-        let mut key = GenericRow::new(18);
+        let mut key = GenericRow::new(19);
         key.set_field(0, pk_int);
 
         let result = lookuper.lookup(&key).await.expect("Failed to lookup");
@@ -787,10 +993,17 @@ mod kv_table_test {
         assert_eq!(arr.size(), 2, "col_array size mismatch");
         assert_eq!(arr.get_string(0).unwrap(), "fluss", "col_array[0] mismatch");
         assert_eq!(arr.get_string(1).unwrap(), "rust", "col_array[1] mismatch");
+        let nested = found_row.get_row(18).unwrap();
+        assert_eq!(nested.get_int(0).unwrap(), 7, "col_row.seq mismatch");
+        assert_eq!(
+            nested.get_string(1).unwrap(),
+            "lumiere",
+            "col_row.label mismatch"
+        );
 
         // Test with null values for nullable columns
         let pk_int_2 = 2i32;
-        let mut row_with_nulls = GenericRow::new(18);
+        let mut row_with_nulls = GenericRow::new(19);
         row_with_nulls.set_field(0, pk_int_2);
         row_with_nulls.set_field(1, Datum::Null); // col_boolean
         row_with_nulls.set_field(2, Datum::Null); // col_tinyint
@@ -809,6 +1022,7 @@ mod kv_table_test {
         row_with_nulls.set_field(15, Datum::Null); // col_bytes
         row_with_nulls.set_field(16, Datum::Null); // col_binary
         row_with_nulls.set_field(17, Datum::Null); // col_array
+        row_with_nulls.set_field(18, Datum::Null); // col_row
 
         upsert_writer
             .upsert(&row_with_nulls)
@@ -817,7 +1031,7 @@ mod kv_table_test {
             .expect("Failed to wait for upsert acknowledgment");
 
         // Lookup row with nulls
-        let mut key2 = GenericRow::new(18);
+        let mut key2 = GenericRow::new(19);
         key2.set_field(0, pk_int_2);
 
         let result = lookuper.lookup(&key2).await.expect("Failed to lookup");
@@ -900,6 +1114,10 @@ mod kv_table_test {
             found_row_nulls.is_null_at(17).unwrap(),
             "col_array should be null"
         );
+        assert!(
+            found_row_nulls.is_null_at(18).unwrap(),
+            "col_row should be null"
+        );
 
         admin
             .drop_table(&table_path, false)
@@ -908,9 +1126,307 @@ mod kv_table_test {
     }
 
     #[tokio::test]
-    async fn upsert_and_lookup_with_array() {
-        use fluss::row::Datum;
+    async fn upsert_and_lookup_with_row() { // KV round-trip: flat, nested and null ROW columns
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_kv_rows");
+        let nested_row_type = DataTypes::row(vec![
+            DataField::new("x", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+        let deep_inner_row_type = DataTypes::row(vec![DataField::new("n", DataTypes::int(), None)]);
+        let deep_row_type =
+            DataTypes::row(vec![DataField::new("inner", deep_inner_row_type, None)]);
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("nested", nested_row_type) // ROW<x INT, label STRING>
+                    .column("deep", deep_row_type) // ROW<inner ROW<n INT>>
+                    .primary_key(vec!["id"])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let upsert = table.new_upsert().expect("Failed to create upsert");
+        let upsert_writer = upsert.create_writer().expect("Failed to create writer");
+
+        let mut nested1 = GenericRow::new(2);
+        nested1.set_field(0, 42_i32);
+        nested1.set_field(1, "hello");
+
+        let mut deep_inner1 = GenericRow::new(1);
+        deep_inner1.set_field(0, 99_i32);
+        let mut deep1 = GenericRow::new(1);
+        deep1.set_field(0, Datum::Row(Box::new(deep_inner1)));
+
+        let mut row1 = GenericRow::new(3); // row1 (id=1): both ROW columns populated
+        row1.set_field(0, 1_i32);
+        row1.set_field(1, Datum::Row(Box::new(nested1)));
+        row1.set_field(2, Datum::Row(Box::new(deep1)));
+
+        upsert_writer
+            .upsert(&row1)
+            .expect("upsert row1")
+            .await
+            .expect("ack row1");
+
+        let mut nested2 = GenericRow::new(2);
+        nested2.set_field(0, 7_i32);
+        nested2.set_field(1, Datum::Null); // null field inside a non-null ROW
+
+        let mut row2 = GenericRow::new(3);
+        row2.set_field(0, 2_i32);
+        row2.set_field(1, Datum::Row(Box::new(nested2)));
+        row2.set_field(2, Datum::Null); // the whole "deep" column is null
+
+        upsert_writer
+            .upsert(&row2)
+            .expect("upsert row2")
+            .await
+            .expect("ack row2");
+
+        let mut deep_inner3 = GenericRow::new(1);
+        deep_inner3.set_field(0, -1_i32);
+        let mut deep3 = GenericRow::new(1);
+        deep3.set_field(0, Datum::Row(Box::new(deep_inner3)));
+
+        let mut row3 = GenericRow::new(3);
+        row3.set_field(0, 3_i32);
+        row3.set_field(1, Datum::Null); // the whole "nested" column is null
+        row3.set_field(2, Datum::Row(Box::new(deep3)));
+
+        upsert_writer
+            .upsert(&row3)
+            .expect("upsert row3")
+            .await
+            .expect("ack row3");
+
+        let mut lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .create_lookuper()
+            .expect("Failed to create lookuper");
+
+        let result1 = lookuper
+            .lookup(&make_key_with_field_count(1, 3)) // presumably (pk value, field count)
+            .await
+            .expect("lookup row1");
+        let r1 = result1
+            .get_single_row()
+            .expect("get row1")
+            .expect("row1 should exist");
+        assert_eq!(r1.get_int(0).unwrap(), 1);
+        let nested_r1 = r1.get_row(1).unwrap();
+        assert_eq!(nested_r1.get_int(0).unwrap(), 42);
+        assert_eq!(nested_r1.get_string(1).unwrap(), "hello");
+        let deep_r1 = r1.get_row(2).unwrap();
+        let deep_inner_r1 = deep_r1.get_row(0).unwrap(); // second nesting level
+        assert_eq!(deep_inner_r1.get_int(0).unwrap(), 99);
+
+        let result2 = lookuper
+            .lookup(&make_key_with_field_count(2, 3))
+            .await
+            .expect("lookup row2");
+        let r2 = result2
+            .get_single_row()
+            .expect("get row2")
+            .expect("row2 should exist");
+        assert_eq!(r2.get_int(0).unwrap(), 2);
+        let nested_r2 = r2.get_row(1).unwrap();
+        assert_eq!(nested_r2.get_int(0).unwrap(), 7);
+        assert!(nested_r2.is_null_at(1).unwrap()); // inner null field survives
+        assert!(r2.is_null_at(2).unwrap()); // null ROW column survives
 
+        let result3 = lookuper
+            .lookup(&make_key_with_field_count(3, 3))
+            .await
+            .expect("lookup row3");
+        let r3 = result3
+            .get_single_row()
+            .expect("get row3")
+            .expect("row3 should exist");
+        assert_eq!(r3.get_int(0).unwrap(), 3);
+        assert!(r3.is_null_at(1).unwrap());
+        let deep_r3 = r3.get_row(2).unwrap();
+        let deep_inner_r3 = deep_r3.get_row(0).unwrap();
+        assert_eq!(deep_inner_r3.get_int(0).unwrap(), -1);
+
+        admin
+            .drop_table(&table_path, false) // only reached when every assertion above passed
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn upsert_and_lookup_with_array_of_row() { // KV round-trip of an ARRAY<ROW> column
+        use fluss::metadata::{DataField, DataType};
+
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_kv_array_of_row");
+
+        let event_row_type_owned = DataTypes::row(vec![
+            DataField::new("seq", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+        let array_of_row_type = DataTypes::array(event_row_type_owned.clone());
+
+        let event_row_type = match &event_row_type_owned { // Row payload, passed to get_row() below
+            DataType::Row(rt) => rt.clone(),
+            _ => unreachable!(), // built via DataTypes::row() just above
+        };
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("events", array_of_row_type.clone()) // ARRAY<ROW<seq INT, label STRING>>
+                    .primary_key(vec!["id"])
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let upsert = table.new_upsert().expect("Failed to create upsert");
+        let upsert_writer = upsert.create_writer().expect("Failed to create writer");
+
+        let mut events1 = FlussArrayWriter::new(2, &event_row_type_owned); // two ROW elements
+        let mut e0 = GenericRow::new(2);
+        e0.set_field(0, 1_i32);
+        e0.set_field(1, "open");
+        events1.write_row(0, &e0).expect("write e0");
+        let mut e1 = GenericRow::new(2);
+        e1.set_field(0, 2_i32);
+        e1.set_field(1, "close");
+        events1.write_row(1, &e1).expect("write e1");
+        let events1 = events1.complete().expect("events1");
+
+        let mut row1 = GenericRow::new(2);
+        row1.set_field(0, 1_i32);
+        row1.set_field(1, events1);
+
+        upsert_writer
+            .upsert(&row1)
+            .expect("upsert row1")
+            .await
+            .expect("ack row1");
+
+        let mut events2 = FlussArrayWriter::new(3, &event_row_type_owned);
+        let mut e2 = GenericRow::new(2);
+        e2.set_field(0, 7_i32);
+        e2.set_field(1, "x");
+        events2.write_row(0, &e2).expect("write e2");
+        events2.set_null_at(1); // middle element is null; indices 0 and 2 hold rows
+        let mut e3 = GenericRow::new(2);
+        e3.set_field(0, 8_i32);
+        e3.set_field(1, "y");
+        events2.write_row(2, &e3).expect("write e3");
+        let events2 = events2.complete().expect("events2");
+
+        let mut row2 = GenericRow::new(2);
+        row2.set_field(0, 2_i32);
+        row2.set_field(1, events2);
+
+        upsert_writer
+            .upsert(&row2)
+            .expect("upsert row2")
+            .await
+            .expect("ack row2");
+
+        let mut row3 = GenericRow::new(2);
+        row3.set_field(0, 3_i32);
+        row3.set_field(1, Datum::Null); // the whole array column is null
+
+        upsert_writer
+            .upsert(&row3)
+            .expect("upsert row3")
+            .await
+            .expect("ack row3");
+
+        let mut lookuper = table
+            .new_lookup()
+            .expect("Failed to create lookup")
+            .create_lookuper()
+            .expect("Failed to create lookuper");
+
+        let result1 = lookuper
+            .lookup(&make_key_with_field_count(1, 2)) // presumably (pk value, field count)
+            .await
+            .expect("lookup row1");
+        let r1 = result1
+            .get_single_row()
+            .expect("get row1")
+            .expect("row1 should exist");
+        assert_eq!(r1.get_int(0).unwrap(), 1);
+        let events_r1 = r1.get_array(1).unwrap();
+        assert_eq!(events_r1.size(), 2);
+        let e0_r1 = events_r1.get_row(0, &event_row_type).unwrap();
+        assert_eq!(e0_r1.get_int(0).unwrap(), 1);
+        assert_eq!(e0_r1.get_string(1).unwrap(), "open");
+        let e1_r1 = events_r1.get_row(1, &event_row_type).unwrap();
+        assert_eq!(e1_r1.get_int(0).unwrap(), 2);
+        assert_eq!(e1_r1.get_string(1).unwrap(), "close");
+
+        let result2 = lookuper
+            .lookup(&make_key_with_field_count(2, 2))
+            .await
+            .expect("lookup row2");
+        let r2 = result2
+            .get_single_row()
+            .expect("get row2")
+            .expect("row2 should exist");
+        let events_r2 = r2.get_array(1).unwrap(); // note: the id column is not re-checked for row2
+        assert_eq!(events_r2.size(), 3);
+        let e0_r2 = events_r2.get_row(0, &event_row_type).unwrap();
+        assert_eq!(e0_r2.get_int(0).unwrap(), 7);
+        assert_eq!(e0_r2.get_string(1).unwrap(), "x");
+        assert!(events_r2.is_null_at(1)); // null element keeps its slot
+        let e2_r2 = events_r2.get_row(2, &event_row_type).unwrap();
+        assert_eq!(e2_r2.get_int(0).unwrap(), 8);
+        assert_eq!(e2_r2.get_string(1).unwrap(), "y");
+
+        let result3 = lookuper
+            .lookup(&make_key_with_field_count(3, 2))
+            .await
+            .expect("lookup row3");
+        let r3 = result3
+            .get_single_row()
+            .expect("get row3")
+            .expect("row3 should exist");
+        assert_eq!(r3.get_int(0).unwrap(), 3);
+        assert!(r3.is_null_at(1).unwrap());
+
+        admin
+            .drop_table(&table_path, false) // only reached when every assertion above passed
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn upsert_and_lookup_with_array() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().expect("Failed to get admin");
@@ -942,7 +1458,6 @@ mod kv_table_test {
         let upsert = table.new_upsert().expect("Failed to create upsert");
         let upsert_writer = upsert.create_writer().expect("Failed to create writer");
 
-        // Row 1: id=1, tags=["hello", "world"], scores=[10, 20, 30], matrix=[[1,2],[3,4]]
         let mut row1 = GenericRow::new(4);
         row1.set_field(0, 1_i32);
         row1.set_field(1, make_string_array(&[Some("hello"), Some("world")]));
@@ -961,7 +1476,6 @@ mod kv_table_test {
             .await
             .expect("ack row1");
 
-        // Row 2: id=2, tags=[null element], scores=[] (empty), matrix=null
         let mut row2 = GenericRow::new(4);
         row2.set_field(0, 2_i32);
         row2.set_field(1, make_string_array(&[None]));
@@ -974,7 +1488,6 @@ mod kv_table_test {
             .await
             .expect("ack row2");
 
-        // Row 3: id=3, tags=null, scores=[42], matrix=[[5], null, []]
         let mut row3 = GenericRow::new(4);
         row3.set_field(0, 3_i32);
         row3.set_field(1, Datum::Null);
@@ -1001,7 +1514,6 @@ mod kv_table_test {
             .create_lookuper()
             .expect("Failed to create lookuper");
 
-        // Verify row 1: populated flat arrays + nested array
         let result1 = lookuper
             .lookup(&make_key_with_field_count(1, 4))
             .await
@@ -1031,7 +1543,6 @@ mod kv_table_test {
         assert_eq!(mr1_1.get_int(0).unwrap(), 3);
         assert_eq!(mr1_1.get_int(1).unwrap(), 4);
 
-        // Verify row 2: null element in array, empty array, null nested column
         let result2 = lookuper
             .lookup(&make_key_with_field_count(2, 4))
             .await
@@ -1048,7 +1559,6 @@ mod kv_table_test {
         assert_eq!(scores_r2.size(), 0);
         assert!(r2.is_null_at(3).unwrap());
 
-        // Verify row 3: null flat column, nested array with mixed inner (value, null, empty)
         let result3 = lookuper
             .lookup(&make_key_with_field_count(3, 4))
             .await
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 1a6b514b81..fadb49622c 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -23,9 +23,12 @@ mod table_test {
     };
     use arrow::array::record_batch;
     use fluss::client::{EARLIEST_OFFSET, FlussTable, TableScan};
-    use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+    use fluss::metadata::{DataField, DataTypes, Schema, TableDescriptor, TablePath};
     use fluss::record::ScanRecord;
-    use fluss::row::InternalRow;
+    use fluss::row::binary_array::FlussArrayWriter;
+    use fluss::row::{
+        Date, Datum, Decimal, FlussArray, GenericRow, InternalRow, Time, TimestampLtz, TimestampNtz,
+    };
     use fluss::rpc::message::OffsetSpec;
     use std::collections::HashMap;
     use std::time::Duration;
@@ -581,8 +584,6 @@ mod table_test {
     /// in log tables.
     #[tokio::test]
     async fn all_supported_datatypes() {
-        use fluss::row::{Date, Datum, Decimal, GenericRow, Time, TimestampLtz, TimestampNtz};
-
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
@@ -661,6 +662,13 @@ mod table_test {
                         DataTypes::timestamp_ltz_with_precision(9),
                     )
                     .column("col_array", DataTypes::array(DataTypes::string()))
+                    .column(
+                        "col_row",
+                        DataTypes::row(vec![
+                            DataField::new("seq", DataTypes::int(), None),
+                            DataField::new("label", DataTypes::string(), None),
+                        ]),
+                    )
                     .build()
                     .expect("Failed to build schema"),
             )
@@ -724,7 +732,10 @@ mod table_test {
 
         let col_array = make_string_array(&[Some("fluss"), Some("rust")]);
 
-        // Append a row with all datatypes
+        let mut col_row_inner = GenericRow::new(2);
+        col_row_inner.set_field(0, 7_i32);
+        col_row_inner.set_field(1, "lumiere");
+
         let mut row = GenericRow::new(field_count);
         row.set_field(0, col_tinyint);
         row.set_field(1, col_smallint);
@@ -756,6 +767,7 @@ mod table_test {
         row.set_field(27, col_timestamp_ltz_us_neg);
         row.set_field(28, col_timestamp_ltz_ns_neg);
         row.set_field(29, col_array);
+        row.set_field(30, Datum::Row(Box::new(col_row_inner)));
 
         append_writer
             .append(&row)
@@ -1005,6 +1017,14 @@ mod table_test {
         assert_eq!(arr.get_string(0).unwrap(), "fluss", "col_array[0] mismatch");
         assert_eq!(arr.get_string(1).unwrap(), "rust", "col_array[1] mismatch");
 
+        let nested = found_row.get_row(30).unwrap();
+        assert_eq!(nested.get_int(0).unwrap(), 7, "col_row.seq mismatch");
+        assert_eq!(
+            nested.get_string(1).unwrap(),
+            "lumiere",
+            "col_row.label mismatch"
+        );
+
         // Verify row with all nulls (record index 1)
         let found_row_nulls = records[1].row();
         for i in 0..field_count {
@@ -1387,9 +1407,6 @@ mod table_test {
 
     #[tokio::test]
     async fn append_and_scan_with_array() {
-        use fluss::row::binary_array::FlussArrayWriter;
-        use fluss::row::{Datum, FlussArray, GenericRow};
-
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().expect("Failed to get admin");
@@ -1423,7 +1440,6 @@ mod table_test {
             .create_writer()
             .expect("Failed to create writer");
 
-        // Row 1: id=1, tags=["hello", "world"], scores=[10, 20, 30], matrix=[[1,2],[3,4]]
         let mut row1 = GenericRow::new(4);
         row1.set_field(0, 1_i32);
         row1.set_field(1, make_string_array(&[Some("hello"), Some("world")]));
@@ -1436,7 +1452,6 @@ mod table_test {
         };
         row1.set_field(3, m1);
 
-        // Row 2: id=2, tags=[null], scores=[], matrix=[[5], null, []]
         let mut row2 = GenericRow::new(4);
         row2.set_field(0, 2_i32);
         row2.set_field(1, make_string_array(&[None]));
@@ -1450,7 +1465,6 @@ mod table_test {
         };
         row2.set_field(3, m2);
 
-        // Row 3: id=3, tags=null, scores=[42], matrix=null
         let mut row3 = GenericRow::new(4);
         row3.set_field(0, 3_i32);
         row3.set_field(1, Datum::Null);
@@ -1465,7 +1479,6 @@ mod table_test {
         let records = scan_table(&table, |scan| scan).await;
         assert_eq!(records.len(), 3, "expected three log records");
 
-        // Verify row 1: populated flat arrays + nested array
         let r0 = records[0].row();
         assert_eq!(r0.get_int(0).unwrap(), 1);
         let tags_r0 = r0.get_array(1).unwrap();
@@ -1488,7 +1501,6 @@ mod table_test {
         assert_eq!(mr0_1.get_int(0).unwrap(), 3);
         assert_eq!(mr0_1.get_int(1).unwrap(), 4);
 
-        // Verify row 2: null element in array, empty array, nested with mixed inner
         let r1 = records[1].row();
         assert_eq!(r1.get_int(0).unwrap(), 2);
         let tags_r1 = r1.get_array(1).unwrap();
@@ -1505,7 +1517,6 @@ mod table_test {
         let mr1_2 = matrix_r1.get_array(2).unwrap();
         assert_eq!(mr1_2.size(), 0);
 
-        // Verify row 3: null flat column, null nested column
         let r2 = records[2].row();
         assert_eq!(r2.get_int(0).unwrap(), 3);
         assert!(r2.is_null_at(1).unwrap());
@@ -1521,10 +1532,454 @@ mod table_test {
     }
 
     #[tokio::test]
-    async fn append_and_scan_with_array_rich_types() {
-        use fluss::row::binary_array::FlussArrayWriter;
-        use fluss::row::{Date, Decimal, FlussArray, GenericRow, Time, TimestampNtz};
+    async fn append_and_scan_with_array_of_row() { // log round-trip of an ARRAY<ROW> column
+        use fluss::metadata::{DataField, DataType}; // review: DataField already in module scope
+
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_log_array_of_row");
+
+        let event_row_type_owned = DataTypes::row(vec![
+            DataField::new("seq", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+        let array_of_row_type = DataTypes::array(event_row_type_owned.clone());
+
+        let event_row_type = match &event_row_type_owned { // Row payload, passed to get_row() below
+            DataType::Row(rt) => rt.clone(),
+            _ => unreachable!(), // built via DataTypes::row() just above
+        };
+
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("events", array_of_row_type) // ARRAY<ROW<seq INT, label STRING>>
+            .build()
+            .expect("Failed to build schema");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(schema)
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let mut events1 = FlussArrayWriter::new(2, &event_row_type_owned); // two ROW elements
+        let mut e0 = GenericRow::new(2);
+        e0.set_field(0, 1_i32);
+        e0.set_field(1, "open");
+        events1.write_row(0, &e0).expect("write e0");
+        let mut e1 = GenericRow::new(2);
+        e1.set_field(0, 2_i32);
+        e1.set_field(1, "close");
+        events1.write_row(1, &e1).expect("write e1");
+        let events1 = events1.complete().expect("events1");
+
+        let mut row1 = GenericRow::new(2);
+        row1.set_field(0, 1_i32);
+        row1.set_field(1, events1);
+
+        let mut events2 = FlussArrayWriter::new(3, &event_row_type_owned);
+        let mut e2 = GenericRow::new(2);
+        e2.set_field(0, 7_i32);
+        e2.set_field(1, "x");
+        events2.write_row(0, &e2).expect("write e2");
+        events2.set_null_at(1); // middle element is null; indices 0 and 2 hold rows
+        let mut e3 = GenericRow::new(2);
+        e3.set_field(0, 8_i32);
+        e3.set_field(1, "y");
+        events2.write_row(2, &e3).expect("write e3");
+        let events2 = events2.complete().expect("events2");
+
+        let mut row2 = GenericRow::new(2);
+        row2.set_field(0, 2_i32);
+        row2.set_field(1, events2);
+
+        let mut row3 = GenericRow::new(2);
+        row3.set_field(0, 3_i32);
+        row3.set_field(1, Datum::Null); // the whole array column is null
+
+        append_writer.append(&row1).expect("append row1");
+        append_writer.append(&row2).expect("append row2");
+        append_writer.append(&row3).expect("append row3");
+        append_writer.flush().await.expect("Failed to flush"); // flush once after the three appends
+
+        let records = scan_table(&table, |scan| scan).await; // identity closure: scan left unmodified
+        assert_eq!(records.len(), 3, "expected three log records");
+
+        let r0 = records[0].row(); // records are checked in append order
+        assert_eq!(r0.get_int(0).unwrap(), 1);
+        let events_r0 = r0.get_array(1).unwrap();
+        assert_eq!(events_r0.size(), 2);
+        let e0_r0 = events_r0.get_row(0, &event_row_type).unwrap();
+        assert_eq!(e0_r0.get_int(0).unwrap(), 1);
+        assert_eq!(e0_r0.get_string(1).unwrap(), "open");
+        let e1_r0 = events_r0.get_row(1, &event_row_type).unwrap();
+        assert_eq!(e1_r0.get_int(0).unwrap(), 2);
+        assert_eq!(e1_r0.get_string(1).unwrap(), "close");
+
+        let r1 = records[1].row(); // note: the id column is not re-checked for this record
+        let events_r1 = r1.get_array(1).unwrap();
+        assert_eq!(events_r1.size(), 3);
+        let e0_r1 = events_r1.get_row(0, &event_row_type).unwrap();
+        assert_eq!(e0_r1.get_int(0).unwrap(), 7);
+        assert_eq!(e0_r1.get_string(1).unwrap(), "x");
+        assert!(events_r1.is_null_at(1)); // null element keeps its slot
+        let e2_r1 = events_r1.get_row(2, &event_row_type).unwrap();
+        assert_eq!(e2_r1.get_int(0).unwrap(), 8);
+        assert_eq!(e2_r1.get_string(1).unwrap(), "y");
+
+        let r2 = records[2].row();
+        assert_eq!(r2.get_int(0).unwrap(), 3);
+        assert!(r2.is_null_at(1).unwrap());
+
+        admin
+            .drop_table(&table_path, false) // only reached when every assertion above passed
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn append_and_scan_with_row() { // log round-trip: flat, nested and null ROW columns
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_log_rows");
+        let nested_row_type = DataTypes::row(vec![
+            DataField::new("x", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+        let deep_inner_row_type = DataTypes::row(vec![DataField::new("n", DataTypes::int(), None)]);
+        let deep_row_type =
+            DataTypes::row(vec![DataField::new("inner", deep_inner_row_type, None)]);
+
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("nested", nested_row_type) // ROW<x INT, label STRING>
+            .column("deep", deep_row_type) // ROW<inner ROW<n INT>>
+            .build()
+            .expect("Failed to build schema");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(schema)
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let mut nested1 = GenericRow::new(2);
+        nested1.set_field(0, 42_i32);
+        nested1.set_field(1, "hello");
+        let mut deep_inner1 = GenericRow::new(1);
+        deep_inner1.set_field(0, 99_i32);
+        let mut deep1 = GenericRow::new(1);
+        deep1.set_field(0, Datum::Row(Box::new(deep_inner1)));
+
+        let mut row1 = GenericRow::new(3); // row1 (id=1): both ROW columns populated
+        row1.set_field(0, 1_i32);
+        row1.set_field(1, Datum::Row(Box::new(nested1)));
+        row1.set_field(2, Datum::Row(Box::new(deep1)));
+
+        let mut nested2 = GenericRow::new(2);
+        nested2.set_field(0, 7_i32);
+        nested2.set_field(1, Datum::Null); // null field inside a non-null ROW
+
+        let mut row2 = GenericRow::new(3);
+        row2.set_field(0, 2_i32);
+        row2.set_field(1, Datum::Row(Box::new(nested2)));
+        row2.set_field(2, Datum::Null); // the whole "deep" column is null
+
+        let mut deep_inner3 = GenericRow::new(1);
+        deep_inner3.set_field(0, -1_i32);
+        let mut deep3 = GenericRow::new(1);
+        deep3.set_field(0, Datum::Row(Box::new(deep_inner3)));
+
+        let mut row3 = GenericRow::new(3);
+        row3.set_field(0, 3_i32);
+        row3.set_field(1, Datum::Null); // the whole "nested" column is null
+        row3.set_field(2, Datum::Row(Box::new(deep3)));
+
+        append_writer.append(&row1).expect("append row1");
+        append_writer.append(&row2).expect("append row2");
+        append_writer.append(&row3).expect("append row3");
+        append_writer.flush().await.expect("Failed to flush"); // flush once after the three appends
+
+        let records = scan_table(&table, |scan| scan).await; // identity closure: scan left unmodified
+        assert_eq!(records.len(), 3, "expected three log records");
+
+        let r0 = records[0].row(); // records are checked in append order
+        assert_eq!(r0.get_int(0).unwrap(), 1);
+        let nested_r0 = r0.get_row(1).unwrap();
+        assert_eq!(nested_r0.get_int(0).unwrap(), 42);
+        assert_eq!(nested_r0.get_string(1).unwrap(), "hello");
+        let deep_r0 = r0.get_row(2).unwrap();
+        let deep_inner_r0 = deep_r0.get_row(0).unwrap(); // second nesting level
+        assert_eq!(deep_inner_r0.get_int(0).unwrap(), 99);
+
+        let r1 = records[1].row();
+        assert_eq!(r1.get_int(0).unwrap(), 2);
+        let nested_r1 = r1.get_row(1).unwrap();
+        assert_eq!(nested_r1.get_int(0).unwrap(), 7);
+        assert!(nested_r1.is_null_at(1).unwrap()); // inner null field survives
+        assert!(r1.is_null_at(2).unwrap()); // null ROW column survives
+
+        let r2 = records[2].row();
+        assert_eq!(r2.get_int(0).unwrap(), 3);
+        assert!(r2.is_null_at(1).unwrap());
+        let deep_r2 = r2.get_row(2).unwrap();
+        let deep_inner_r2 = deep_r2.get_row(0).unwrap();
+        assert_eq!(deep_inner_r2.get_int(0).unwrap(), -1);
 
+        admin
+            .drop_table(&table_path, false) // only reached when every assertion above passed
+            .await
+            .expect("Failed to drop table");
+    }
+
+    /// Log table with a ROW column whose fields cover the rich element types
+    /// (decimal, date, time, timestamps, bytes, fixed-length binary, float
+    /// infinity / double NaN, strings, and a nested int array) round-tripped
+    /// through the log path. Confirms the wire-level encoding of
+    /// `ROW<rich types>` matches what the server expects — the unit-level
+    /// `test_row_all_primitives_round_trip` proves Rust↔Rust round-trip; this
+    /// test proves Rust→server→Rust.
+    #[tokio::test]
+    async fn append_and_scan_with_row_rich_types() {
+        fn assert_f32_special(actual: f32, expected: f32) {
+            if expected.is_nan() {
+                assert!(actual.is_nan(), "expected NaN");
+            } else if expected.is_infinite() {
+                assert!(actual.is_infinite());
+                assert_eq!(actual.signum(), expected.signum());
+            } else {
+                assert!((actual - expected).abs() < f32::EPSILON);
+            }
+        }
+
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_log_row_rich_types");
+
+        let row_type_owned = DataTypes::row(vec![
+            DataField::new("f_bool", DataTypes::boolean(), None),
+            DataField::new("f_int", DataTypes::int(), None),
+            DataField::new("f_long", DataTypes::bigint(), None),
+            DataField::new("f_float", DataTypes::float(), None),
+            DataField::new("f_double", DataTypes::double(), None),
+            DataField::new("f_str", DataTypes::string(), None),
+            DataField::new("f_bytes", DataTypes::bytes(), None),
+            DataField::new("f_decimal", DataTypes::decimal(10, 2), None),
+            DataField::new("f_date", DataTypes::date(), None),
+            DataField::new("f_time", DataTypes::time_with_precision(3), None),
+            DataField::new("f_ts_ntz", DataTypes::timestamp_with_precision(6), None),
+            DataField::new("f_ts_ltz", DataTypes::timestamp_ltz_with_precision(6), None),
+            DataField::new("f_binary_fixed", DataTypes::binary(4), None),
+            DataField::new("f_array_int", DataTypes::array(DataTypes::int()), None),
+        ]);
+
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("nested", row_type_owned)
+            .build()
+            .expect("Failed to build schema");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(schema)
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let mut nested1 = GenericRow::new(14);
+        nested1.set_field(0, true);
+        nested1.set_field(1, 100_000_i32);
+        nested1.set_field(2, 9_876_543_210_i64);
+        nested1.set_field(3, f32::INFINITY);
+        nested1.set_field(4, f64::NAN);
+        nested1.set_field(5, "hello world");
+        nested1.set_field(6, b"binary".as_slice());
+        nested1.set_field(7, Decimal::from_unscaled_long(12345, 10, 2).unwrap());
+        nested1.set_field(8, Datum::Date(Date::new(20476)));
+        nested1.set_field(9, Datum::Time(Time::new(36_827_123)));
+        nested1.set_field(
+            10,
+            Datum::TimestampNtz(TimestampNtz::new(1_769_163_227_123)),
+        );
+        nested1.set_field(
+            11,
+            Datum::TimestampLtz(TimestampLtz::new(1_769_163_227_456)),
+        );
+        nested1.set_field(12, b"\x01\x02\x03\x04".as_slice());
+        nested1.set_field(13, make_int_array(&[Some(7), None, Some(11)]));
+
+        let mut row1 = GenericRow::new(2);
+        row1.set_field(0, 1_i32);
+        row1.set_field(1, Datum::Row(Box::new(nested1)));
+
+        let mut row2 = GenericRow::new(2);
+        row2.set_field(0, 2_i32);
+        row2.set_field(1, Datum::Null);
+
+        append_writer.append(&row1).expect("append row1");
+        append_writer.append(&row2).expect("append row2");
+        append_writer.flush().await.expect("Failed to flush");
+
+        let records = scan_table(&table, |scan| scan).await;
+        assert_eq!(records.len(), 2);
+
+        let r0 = records[0].row();
+        assert_eq!(r0.get_int(0).unwrap(), 1);
+        let nested = r0.get_row(1).unwrap();
+        assert!(nested.get_boolean(0).unwrap());
+        assert_eq!(nested.get_int(1).unwrap(), 100_000);
+        assert_eq!(nested.get_long(2).unwrap(), 9_876_543_210);
+        assert_f32_special(nested.get_float(3).unwrap(), f32::INFINITY);
+        assert!(nested.get_double(4).unwrap().is_nan());
+        assert_eq!(nested.get_string(5).unwrap(), "hello world");
+        assert_eq!(nested.get_bytes(6).unwrap(), b"binary");
+        assert_eq!(
+            nested.get_decimal(7, 10, 2).unwrap(),
+            Decimal::from_unscaled_long(12345, 10, 2).unwrap(),
+        );
+        assert_eq!(nested.get_date(8).unwrap().get_inner(), 20476);
+        assert_eq!(nested.get_time(9).unwrap().get_inner(), 36_827_123);
+        assert_eq!(
+            nested.get_timestamp_ntz(10, 6).unwrap().get_millisecond(),
+            1_769_163_227_123,
+        );
+        assert_eq!(
+            nested
+                .get_timestamp_ltz(11, 6)
+                .unwrap()
+                .get_epoch_millisecond(),
+            1_769_163_227_456,
+        );
+        assert_eq!(nested.get_binary(12, 4).unwrap(), b"\x01\x02\x03\x04");
+        let arr = nested.get_array(13).unwrap();
+        assert_eq!(arr.size(), 3);
+        assert_eq!(arr.get_int(0).unwrap(), 7);
+        assert!(arr.is_null_at(1));
+        assert_eq!(arr.get_int(2).unwrap(), 11);
+
+        let r1 = records[1].row();
+        assert_eq!(r1.get_int(0).unwrap(), 2);
+        assert!(r1.is_null_at(1).unwrap());
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    /// Projection over a log table with ROW columns. Specifically tests that
+    /// `ProjectedRow::get_row` works end-to-end against the server; without
+    /// this test, the projection code path for ROW would have zero
+    /// integration coverage.
+    #[tokio::test]
+    async fn append_and_scan_with_row_projection() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_log_row_projection");
+
+        let row_type = DataTypes::row(vec![
+            DataField::new("seq", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("nested", row_type)
+            .column("extra", DataTypes::string())
+            .build()
+            .expect("Failed to build schema");
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(schema)
+            .build()
+            .expect("Failed to build table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let mut nested = GenericRow::new(2);
+        nested.set_field(0, 42_i32);
+        nested.set_field(1, "hello");
+
+        let mut row = GenericRow::new(3);
+        row.set_field(0, 7_i32);
+        row.set_field(1, Datum::Row(Box::new(nested)));
+        row.set_field(2, "ignore-me");
+        append_writer.append(&row).expect("append");
+        append_writer.flush().await.expect("Failed to flush");
+
+        let records = scan_table(&table, |scan| {
+            scan.project_by_name(&["nested", "id"])
+                .expect("project failed")
+        })
+        .await;
+        assert_eq!(records.len(), 1);
+
+        let r0 = records[0].row();
+        let projected_nested = r0.get_row(0).expect("get_row over projection");
+        assert_eq!(projected_nested.get_int(0).unwrap(), 42);
+        assert_eq!(projected_nested.get_string(1).unwrap(), "hello");
+        assert_eq!(r0.get_int(1).unwrap(), 7);
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn append_and_scan_with_array_rich_types() {
         fn assert_f32_special(actual: f32, expected: f32) {
             if expected.is_nan() {
                 assert!(actual.is_nan(), "expected NaN");

From 338b6b8ed0dba20cb9c1578535329e09be3b6e16 Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Thu, 14 May 2026 11:11:14 +0200
Subject: [PATCH 268/287] feat: Add RecordBatchLogReader for bounded log
 reading (#446)

* Add RecordBatchLogReader for bounded log reading

* address comments

* update doc

* update doc and inline comments

* rebase and follow up after rebase of new changes, and fix a corner issue

* feedback

* run tests in thread to avoid asyncio event loop starvation

* address feedback
---
 fluss-rust/bindings/python/example/example.py |  10 +-
 fluss-rust/bindings/python/fluss/__init__.pyi |  24 +
 fluss-rust/bindings/python/src/table.rs       | 293 ++++----
 .../bindings/python/test/test_log_table.py    | 124 ++++
 .../crates/fluss/src/client/table/mod.rs      |   2 +
 .../crates/fluss/src/client/table/reader.rs   | 701 ++++++++++++++++++
 .../crates/fluss/src/client/table/scanner.rs  | 138 +++-
 .../docs/user-guide/python/api-reference.md   |   3 +
 .../docs/user-guide/rust/api-reference.md     |  44 ++
 9 files changed, 1169 insertions(+), 170 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/client/table/reader.rs

diff --git a/fluss-rust/bindings/python/example/example.py b/fluss-rust/bindings/python/example/example.py
index 0149996cd5..23ccc6d1c1 100644
--- a/fluss-rust/bindings/python/example/example.py
+++ b/fluss-rust/bindings/python/example/example.py
@@ -294,8 +294,14 @@ async def main():
         except Exception as e:
             print(f"Could not convert to Pandas: {e}")
 
-        # TODO: support to_arrow_batch_reader()
-        # which is reserved for streaming use cases
+        # to_arrow_batch_reader() — lazy PyArrow RecordBatchReader (blocks the event loop)
+        batch_scanner_reader = await table.new_scan().create_record_batch_log_scanner()
+        batch_scanner_reader.subscribe_buckets(
+            {i: fluss.EARLIEST_OFFSET for i in range(num_buckets)}
+        )
+        arrow_reader = batch_scanner_reader.to_arrow_batch_reader()
+        reader_table = pa.Table.from_batches(list(arrow_reader), schema=arrow_reader.schema)
+        print(f"\nVia to_arrow_batch_reader(): {reader_table.num_rows} rows")
 
         # TODO: support to_duckdb()
 
diff --git a/fluss-rust/bindings/python/fluss/__init__.pyi b/fluss-rust/bindings/python/fluss/__init__.pyi
index 18095c01bc..b5bfdfab28 100644
--- a/fluss-rust/bindings/python/fluss/__init__.pyi
+++ b/fluss-rust/bindings/python/fluss/__init__.pyi
@@ -898,6 +898,26 @@ class LogScanner:
             or timeout expires.
         """
         ...
+    def to_arrow_batch_reader(self) -> pa.RecordBatchReader:
+        """Create a lazy Arrow RecordBatchReader that reads until latest offsets.
+
+        Returns a ``pyarrow.RecordBatchReader`` that lazily polls batches one at
+        a time (streaming). Prefer this when you want to process batches without
+        holding the full result in memory at once.
+
+        This call blocks; from ``asyncio`` code run it via ``asyncio.to_thread``. Do not
+        call ``poll_arrow`` / ``poll_record_batch`` on this scanner while iterating the
+        reader: they share scanner state, so use one consumption path at a time.
+        ``subscribe*`` / ``unsubscribe*`` calls are rejected while the reader is alive.
+
+        Requires a batch-based scanner (created with ``new_scan().create_record_batch_log_scanner()``).
+        You must call ``subscribe()``, ``subscribe_buckets()``, ``subscribe_partition()``,
+        or ``subscribe_partition_buckets()`` first.
+
+        Returns:
+            ``pyarrow.RecordBatchReader`` yielding ``RecordBatch`` objects.
+        """
+        ...
     async def to_pandas(self) -> pd.DataFrame:
         """Convert all data to Pandas DataFrame.
 
@@ -910,6 +930,10 @@ class LogScanner:
     async def to_arrow(self) -> pa.Table:
         """Convert all data to Arrow Table.
 
+        Batches are collected in Rust then combined into one table (no per-batch
+        Python iteration). Do not interleave with ``poll_arrow`` / ``poll_record_batch``
+        for the same subscription session; overlapping use is not supported.
+
         Requires a batch-based scanner (created with new_scan().create_record_batch_log_scanner()).
         Reads from currently subscribed buckets until reaching their latest offsets.
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 9ee84d76ed..4133bed47e 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -18,10 +18,10 @@
 use crate::TOKIO_RUNTIME;
 use crate::*;
 use arrow::array::RecordBatch as ArrowRecordBatch;
+use arrow::record_batch::RecordBatchReader as _;
 use arrow_pyarrow::{FromPyArrow, ToPyArrow};
 use arrow_schema::SchemaRef;
 use fluss::record::to_arrow_schema;
-use fluss::rpc::message::OffsetSpec;
 use indexmap::IndexMap;
 use pyo3::IntoPyObjectExt;
 use pyo3::exceptions::{PyIndexError, PyRuntimeError, PyTypeError};
@@ -2014,6 +2014,38 @@ fn get_type_name(value: &Bound<PyAny>) -> String {
         .unwrap_or_else(|_| "unknown".to_string())
 }
 
+/// Thin Python iterator over [`fcore::client::SyncRecordBatchLogReader`].
+/// Used internally as the backing iterator for
+/// ``pa.RecordBatchReader.from_batches()``; not registered on the module.
+#[pyclass]
+struct PyRecordBatchLogReader {
+    sync_reader: fcore::client::SyncRecordBatchLogReader,
+}
+
+#[pymethods]
+impl PyRecordBatchLogReader {
+    fn __iter__(slf: PyRef<'_, Self>) -> PyRef<'_, Self> {
+        slf
+    }
+
+    fn __next__(&mut self, py: Python) -> PyResult<Option<Py<PyAny>>> {
+        let result = py.detach(|| self.sync_reader.next().transpose());
+
+        match result {
+            Ok(Some(batch)) => {
+                let py_batch = batch
+                    .to_pyarrow(py)
+                    .map_err(|e| FlussError::new_err(format!("Failed to convert batch: {e}")))?;
+                Ok(Some(py_batch.unbind()))
+            }
+            Ok(None) => Ok(None),
+            Err(arrow_err) => Err(FlussError::new_err(format!(
+                "Error reading batch: {arrow_err}"
+            ))),
+        }
+    }
+}
+
 /// Wraps the two scanner variants so we never have an impossible state
 /// (both None or both Some).
 enum ScannerKind {
@@ -2066,8 +2098,6 @@ pub struct LogScanner {
     projected_schema: SchemaRef,
     /// The projected row type to use for record-based scanning
     projected_row_type: Arc<fcore::metadata::RowType>,
-    /// Cache for partition_id -> partition_name mapping (avoids repeated list_partition_infos calls)
-    partition_name_cache: Arc<std::sync::RwLock<Option<HashMap<i64, String>>>>,
 }
 
 #[pymethods]
@@ -2307,11 +2337,75 @@ impl LogScanner {
         })
     }
 
+    /// Create a lazy Arrow RecordBatchReader that reads until latest offsets.
+    ///
+    /// This is a **blocking / synchronous** API: construction queries the
+    /// server for latest offsets (via ``block_on``), and each
+    /// ``RecordBatchReader.__next__()`` call blocks the calling thread until
+    /// the next batch is available. It is suitable for Arrow interop
+    /// (feeding into DuckDB, Polars, etc.) but should not be used
+    /// from ``asyncio`` coroutines -- see issue #545 for a planned
+    /// asyncio-native streaming alternative.
+    /// TODO(#545): Add asyncio-native streaming counterpart.
+    ///
+    /// Returns a PyArrow RecordBatchReader that lazily polls batches one at a
+    /// time. This is more memory-efficient than ``to_arrow()`` which loads all
+    /// data into a single table.
+    ///
+    /// **Concurrency:** While this reader is alive, ``subscribe*`` and
+    /// ``unsubscribe*`` calls on the scanner are rejected with an error.
+    /// You should also avoid calling ``poll_arrow`` / ``poll_record_batch``
+    /// on the same scanner — these are not blocked by the guard, but they
+    /// share the underlying fetch buffer with the reader and would
+    /// interleave batches between both consumers. Drop the reader before
+    /// resuming any of these operations.
+    ///
+    /// You must call subscribe(), subscribe_buckets(), subscribe_partition(),
+    /// or subscribe_partition_buckets() first.
+    ///
+    /// Returns:
+    ///     ``pyarrow.RecordBatchReader`` yielding ``RecordBatch`` objects
+    fn to_arrow_batch_reader(&self, py: Python) -> PyResult<Py<PyAny>> {
+        let scanner = self.kind.as_batch()?;
+
+        let sync_reader = py
+            .detach(|| {
+                TOKIO_RUNTIME.block_on(async {
+                    let reader = fcore::client::RecordBatchLogReader::new_until_latest(
+                        scanner.new_shared_handle(),
+                        &self.admin,
+                    )
+                    .await?;
+                    Ok::<_, fcore::error::Error>(
+                        reader.to_record_batch_reader(TOKIO_RUNTIME.handle().clone()),
+                    )
+                })
+            })
+            .map_err(|e| FlussError::from_core_error(&e))?;
+
+        let py_schema = sync_reader
+            .schema()
+            .to_pyarrow(py)
+            .map_err(|e| FlussError::new_err(format!("Failed to convert schema: {e}")))?;
+
+        let py_iter = Py::new(py, PyRecordBatchLogReader { sync_reader })?;
+
+        let pyarrow = py.import("pyarrow")?;
+        let batch_reader = pyarrow
+            .getattr("RecordBatchReader")?
+            .call_method1("from_batches", (py_schema, py_iter))?;
+
+        Ok(batch_reader.into())
+    }
+
     /// Convert all data to Arrow Table.
     ///
     /// Reads from currently subscribed buckets until reaching their latest offsets.
     /// Works for both partitioned and non-partitioned tables.
     ///
+    /// Materializes batches in Rust (``RecordBatchLogReader::collect_all_batches``)
+    /// then builds one PyArrow table, avoiding per-batch Python iteration.
+    ///
     /// You must call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.
     ///
     /// Returns:
@@ -2319,29 +2413,29 @@ impl LogScanner {
     fn to_arrow<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
         let kind = Arc::clone(&self.kind);
         let admin = Arc::clone(&self.admin);
-        let table_info = self.table_info.clone();
         let projected_schema = self.projected_schema.clone();
-        let partition_name_cache = Arc::clone(&self.partition_name_cache);
 
         future_into_py(py, async move {
             let scanner = kind.as_batch()?;
-            let subscribed = scanner.get_subscribed_buckets();
-            if subscribed.is_empty() {
-                return Err(FlussError::new_err(
-                    "No buckets subscribed. Call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.",
-                ));
-            }
 
-            let all_batches = Self::collect_all_batches(
-                scanner,
+            let mut reader = fcore::client::RecordBatchLogReader::new_until_latest(
+                scanner.new_shared_handle(),
                 &admin,
-                &table_info,
-                &subscribed,
-                &partition_name_cache,
             )
-            .await?;
+            .await
+            .map_err(|e| FlussError::from_core_error(&e))?;
+
+            let scan_batches = reader
+                .collect_all_batches()
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))?;
 
-            Python::attach(|py| Self::batches_to_arrow_table(py, all_batches, &projected_schema))
+            let batches: Vec<Arc<ArrowRecordBatch>> = scan_batches
+                .into_iter()
+                .map(|sb| Arc::new(sb.into_batch()))
+                .collect();
+
+            Python::attach(|py| Self::batches_to_arrow_table(py, batches, &projected_schema))
         })
     }
 
@@ -2357,30 +2451,30 @@ impl LogScanner {
     fn to_pandas<'py>(&self, py: Python<'py>) -> PyResult<Bound<'py, PyAny>> {
         let kind = Arc::clone(&self.kind);
         let admin = Arc::clone(&self.admin);
-        let table_info = self.table_info.clone();
         let projected_schema = self.projected_schema.clone();
-        let partition_name_cache = Arc::clone(&self.partition_name_cache);
 
         future_into_py(py, async move {
             let scanner = kind.as_batch()?;
-            let subscribed = scanner.get_subscribed_buckets();
-            if subscribed.is_empty() {
-                return Err(FlussError::new_err(
-                    "No buckets subscribed. Call subscribe(), subscribe_buckets(), subscribe_partition(), or subscribe_partition_buckets() first.",
-                ));
-            }
 
-            let all_batches = Self::collect_all_batches(
-                scanner,
+            let mut reader = fcore::client::RecordBatchLogReader::new_until_latest(
+                scanner.new_shared_handle(),
                 &admin,
-                &table_info,
-                &subscribed,
-                &partition_name_cache,
             )
-            .await?;
+            .await
+            .map_err(|e| FlussError::from_core_error(&e))?;
+
+            let scan_batches = reader
+                .collect_all_batches()
+                .await
+                .map_err(|e| FlussError::from_core_error(&e))?;
+
+            let batches: Vec<Arc<ArrowRecordBatch>> = scan_batches
+                .into_iter()
+                .map(|sb| Arc::new(sb.into_batch()))
+                .collect();
 
             Python::attach(|py| {
-                let arrow_table = Self::batches_to_arrow_table(py, all_batches, &projected_schema)?;
+                let arrow_table = Self::batches_to_arrow_table(py, batches, &projected_schema)?;
                 arrow_table.call_method0(py, "to_pandas")
             })
         })
@@ -2442,7 +2536,6 @@ impl LogScanner {
             table_info,
             projected_schema,
             projected_row_type,
-            partition_name_cache: Arc::new(std::sync::RwLock::new(None)),
         }
     }
 
@@ -2466,138 +2559,6 @@ impl LogScanner {
             Utils::combine_batches_to_table(py, batches)
         }
     }
-
-    /// Query stopping offsets and poll until all subscribed buckets are fully read.
-    /// Returns collected Arrow record batches.
-    async fn collect_all_batches(
-        scanner: &fcore::client::RecordBatchLogScanner,
-        admin: &fcore::client::FlussAdmin,
-        table_info: &fcore::metadata::TableInfo,
-        subscribed: &[(fcore::metadata::TableBucket, i64)],
-        partition_name_cache: &std::sync::RwLock<Option<HashMap<i64, String>>>,
-    ) -> PyResult<Vec<Arc<ArrowRecordBatch>>> {
-        let is_partitioned = scanner.is_partitioned();
-        let table_path = &table_info.table_path;
-        let table_id = table_info.table_id;
-
-        // 1. Query latest offsets
-        let mut stopping_offsets: HashMap<fcore::metadata::TableBucket, i64> = if !is_partitioned {
-            let bucket_ids: Vec<i32> = subscribed.iter().map(|(tb, _)| tb.bucket_id()).collect();
-            let offsets = admin
-                .list_offsets(table_path, &bucket_ids, OffsetSpec::Latest)
-                .await
-                .map_err(|e| FlussError::from_core_error(&e))?;
-            offsets
-                .into_iter()
-                .filter(|(_, offset)| *offset > 0)
-                .map(|(bucket_id, offset)| {
-                    (
-                        fcore::metadata::TableBucket::new(table_id, bucket_id),
-                        offset,
-                    )
-                })
-                .collect()
-        } else {
-            let cached = partition_name_cache.read().unwrap().clone();
-            let partition_id_to_name = match cached {
-                Some(map) => map,
-                None => {
-                    let infos = admin
-                        .list_partition_infos(table_path)
-                        .await
-                        .map_err(|e| FlussError::from_core_error(&e))?;
-                    let map: HashMap<i64, String> = infos
-                        .into_iter()
-                        .map(|info| (info.get_partition_id(), info.get_partition_name()))
-                        .collect();
-                    *partition_name_cache.write().unwrap() = Some(map.clone());
-                    map
-                }
-            };
-
-            let mut by_partition: HashMap<i64, Vec<i32>> = HashMap::new();
-            for (tb, _) in subscribed {
-                if let Some(partition_id) = tb.partition_id() {
-                    by_partition
-                        .entry(partition_id)
-                        .or_default()
-                        .push(tb.bucket_id());
-                }
-            }
-
-            let mut result = HashMap::new();
-            for (partition_id, bucket_ids) in by_partition {
-                let partition_name = partition_id_to_name.get(&partition_id).ok_or_else(|| {
-                    FlussError::new_err(format!("Unknown partition_id: {partition_id}"))
-                })?;
-                let offsets = admin
-                    .list_partition_offsets(
-                        table_path,
-                        partition_name,
-                        &bucket_ids,
-                        OffsetSpec::Latest,
-                    )
-                    .await
-                    .map_err(|e| FlussError::from_core_error(&e))?;
-                for (bucket_id, offset) in offsets {
-                    if offset > 0 {
-                        let tb = fcore::metadata::TableBucket::new_with_partition(
-                            table_id,
-                            Some(partition_id),
-                            bucket_id,
-                        );
-                        result.insert(tb, offset);
-                    }
-                }
-            }
-            result
-        };
-
-        // 2. Poll until all buckets reach their stopping offsets
-        let mut all_batches = Vec::new();
-        while !stopping_offsets.is_empty() {
-            let scan_batches = scanner
-                .poll(Duration::from_millis(500))
-                .await
-                .map_err(|e| FlussError::from_core_error(&e))?;
-
-            if scan_batches.is_empty() {
-                continue;
-            }
-
-            for scan_batch in scan_batches {
-                let table_bucket = scan_batch.bucket().clone();
-                let Some(&stop_at) = stopping_offsets.get(&table_bucket) else {
-                    continue;
-                };
-
-                let base_offset = scan_batch.base_offset();
-                let last_offset = scan_batch.last_offset();
-
-                if base_offset >= stop_at {
-                    stopping_offsets.remove(&table_bucket);
-                    continue;
-                }
-
-                let batch = if last_offset >= stop_at {
-                    let num_to_keep = (stop_at - base_offset) as usize;
-                    let b = scan_batch.into_batch();
-                    let limit = num_to_keep.min(b.num_rows());
-                    b.slice(0, limit)
-                } else {
-                    scan_batch.into_batch()
-                };
-
-                all_batches.push(Arc::new(batch));
-
-                if last_offset >= stop_at - 1 {
-                    stopping_offsets.remove(&table_bucket);
-                }
-            }
-        }
-
-        Ok(all_batches)
-    }
 }
 
 #[cfg(test)]
diff --git a/fluss-rust/bindings/python/test/test_log_table.py b/fluss-rust/bindings/python/test/test_log_table.py
index 2f560bcf2c..50b9078bcb 100644
--- a/fluss-rust/bindings/python/test/test_log_table.py
+++ b/fluss-rust/bindings/python/test/test_log_table.py
@@ -388,6 +388,130 @@ async def test_to_arrow_and_to_pandas(connection, admin):
     await admin.drop_table(table_path, ignore_if_not_exists=False)
 
 
+async def test_to_arrow_batch_reader(connection, admin):
+    """Test to_arrow_batch_reader() returns a lazy PyArrow RecordBatchReader."""
+    table_path = fluss.TablePath("fluss", "py_test_to_arrow_batch_reader")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    )
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+
+    pa_schema = pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    writer.write_arrow_batch(
+        pa.RecordBatch.from_arrays(
+            [pa.array([10, 20, 30], type=pa.int32()), pa.array(["x", "y", "z"])],
+            schema=pa_schema,
+        )
+    )
+    await writer.flush()
+
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+
+    scanner = await table.new_scan().create_record_batch_log_scanner()
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+    # to_arrow_batch_reader() is a blocking/sync API; run in a thread to
+    # avoid starving the asyncio event loop (see docstring warning).
+    def _read_all():
+        reader = scanner.to_arrow_batch_reader()
+        assert isinstance(reader, pa.RecordBatchReader)
+        assert reader.schema == pa_schema
+
+        batches = list(reader)
+        total_rows = sum(b.num_rows for b in batches)
+        assert total_rows == 3
+
+        result_table = pa.Table.from_batches(batches, schema=pa_schema)
+        assert result_table.column("id").to_pylist() == [10, 20, 30]
+        assert result_table.column("name").to_pylist() == ["x", "y", "z"]
+
+    await asyncio.to_thread(_read_all)
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
+async def test_to_arrow_batch_reader_drop_and_guard(connection, admin):
+    """Test reader-active guard and Drop cleanup on mid-iteration drop."""
+    table_path = fluss.TablePath("fluss", "py_test_batch_reader_drop_guard")
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+
+    schema = fluss.Schema(
+        pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    )
+    table_descriptor = fluss.TableDescriptor(schema)
+    await admin.create_table(table_path, table_descriptor, ignore_if_exists=False)
+
+    table = await connection.get_table(table_path)
+    writer = table.new_append().create_writer()
+
+    pa_schema = pa.schema([pa.field("id", pa.int32()), pa.field("name", pa.string())])
+    # Write multiple separate flushes so the server stores multiple log
+    # batches per bucket. This makes it likely that the reader's first poll
+    # only drains a subset, leaving real work for the Drop cleanup loop.
+    num_flushes = 10
+    rows_per_flush = 200
+    total_rows = num_flushes * rows_per_flush
+    for f in range(num_flushes):
+        start = f * rows_per_flush
+        writer.write_arrow_batch(
+            pa.RecordBatch.from_arrays(
+                [
+                    pa.array(
+                        list(range(start, start + rows_per_flush)), type=pa.int32()
+                    ),
+                    pa.array(
+                        [f"row_{i}" for i in range(start, start + rows_per_flush)]
+                    ),
+                ],
+                schema=pa_schema,
+            )
+        )
+        await writer.flush()
+
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+
+    scanner = await table.new_scan().create_record_batch_log_scanner()
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+    # to_arrow_batch_reader() is a blocking/sync API; run all blocking
+    # interactions in a thread to avoid starving the asyncio event loop.
+    def _test_guard_and_drop():
+        # --- Guard blocks subscribe / unsubscribe while reader is active ---
+        reader = scanner.to_arrow_batch_reader()
+        with pytest.raises(fluss.FlussError, match="RecordBatchLogReader is active"):
+            scanner.subscribe_buckets({0: fluss.EARLIEST_OFFSET})
+        with pytest.raises(fluss.FlussError, match="RecordBatchLogReader is active"):
+            scanner.unsubscribe(0)
+
+        # --- Drop mid-iteration: read one batch, then discard ---
+        first_batch = next(reader)
+        assert first_batch.num_rows > 0
+        del reader
+
+        # --- Dropping the reader unsubscribes leftover buckets: creating a reader
+        #     without re-subscribing must fail with "No buckets subscribed" ---
+        with pytest.raises(fluss.FlussError, match="No buckets subscribed"):
+            scanner.to_arrow_batch_reader()
+
+        # --- Guard cleared after drop: scanner is reusable from a fresh subscribe ---
+        scanner.subscribe_buckets(
+            {i: fluss.EARLIEST_OFFSET for i in range(num_buckets)}
+        )
+        reader2 = scanner.to_arrow_batch_reader()
+        batches = list(reader2)
+        assert sum(b.num_rows for b in batches) == total_rows
+
+    await asyncio.to_thread(_test_guard_and_drop)
+
+    await admin.drop_table(table_path, ignore_if_not_exists=False)
+
+
 async def test_partitioned_table_append_scan(connection, admin, wait_for_table_ready):
     """Test append and scan on a partitioned log table."""
     table_path = fluss.TablePath("fluss", "py_test_partitioned_log_append")
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index ba1edd2fb0..e116bbb42d 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -29,12 +29,14 @@ mod lookup;
 
 mod log_fetch_buffer;
 mod partition_getter;
+mod reader;
 mod remote_log;
 mod scanner;
 mod upsert;
 
 pub use append::{AppendWriter, TableAppend};
 pub use lookup::{LookupResult, Lookuper, PrefixKeyLookuper, TableLookup, TablePrefixLookup};
+pub use reader::{RecordBatchLogReader, SyncRecordBatchLogReader};
 pub use remote_log::{
     DEFAULT_REMOTE_FILE_DOWNLOAD_THREAD_NUM, DEFAULT_SCANNER_REMOTE_LOG_PREFETCH_NUM,
 };
diff --git a/fluss-rust/crates/fluss/src/client/table/reader.rs b/fluss-rust/crates/fluss/src/client/table/reader.rs
new file mode 100644
index 0000000000..0a08803d9e
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/reader.rs
@@ -0,0 +1,701 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Bounded log reader that polls until stopping offsets, then terminates.
+//!
+//! Unlike [`RecordBatchLogScanner`], which is unbounded (continuous streaming),
+//! [`RecordBatchLogReader`] reads log data up to a finite set of stopping
+//! offsets and then signals completion. This enables "snapshot-style" reads
+//! from a streaming log: capture the latest offsets, then consume all data
+//! up to those offsets.
+//!
+//! The reader **takes ownership** of the scanner (move, not clone). Once the
+//! scanner is moved into a reader, the compiler prevents concurrent polls.
+//!
+//! The reader also provides a synchronous [`arrow::record_batch::RecordBatchReader`]
+//! adapter via [`RecordBatchLogReader::to_record_batch_reader`] for Arrow
+//! ecosystem interop and FFI consumers (Python, C++).
+
+use crate::client::admin::FlussAdmin;
+use crate::client::table::RecordBatchLogScanner;
+use crate::error::{Error, Result};
+use crate::metadata::TableBucket;
+use crate::record::ScanBatch;
+use crate::rpc::message::OffsetSpec;
+use arrow::record_batch::RecordBatch;
+use arrow_schema::SchemaRef;
+use log::warn;
+use std::collections::{HashMap, VecDeque};
+use std::time::Duration;
+
+const DEFAULT_POLL_TIMEOUT: Duration = Duration::from_millis(500); // per-poll wait in `next_batch`
+
+/// Bounded log reader that consumes log data up to specified stopping offsets.
+///
+/// Wraps a [`RecordBatchLogScanner`] and adds stopping semantics: polled batches are filtered or
+/// sliced against per-bucket stopping offsets; completion is signalled once all buckets catch up.
+///
+/// The reader takes **ownership** of the scanner. Once moved in, no other code
+/// can poll the same scanner concurrently.
+///
+/// # Construction
+///
+/// Use [`RecordBatchLogReader::new_until_latest`] to read all currently-available data, or
+/// [`RecordBatchLogReader::new_until_offsets`] for custom stopping offsets.
+///
+/// # Async iteration
+///
+/// Call [`next_batch`](RecordBatchLogReader::next_batch) repeatedly to get [`ScanBatch`]es lazily,
+/// one at a time. It returns `None` once all buckets have reached their stopping offsets.
+///
+/// # Sync adapter
+///
+/// Call [`to_record_batch_reader`](RecordBatchLogReader::to_record_batch_reader) to get a
+/// synchronous [`arrow::record_batch::RecordBatchReader`] suitable for Arrow FFI consumers.
+pub struct RecordBatchLogReader {
+    /// Scanner owned by this reader; `next_batch` polls it for new batches.
+    scanner: RecordBatchLogScanner,
+    /// Exclusive stopping offset of every bucket still being read; entries leave as buckets finish.
+    stopping_offsets: HashMap<TableBucket, i64>,
+    /// Filtered batches waiting to be handed out by `next_batch`.
+    buffer: VecDeque<ScanBatch>,
+    /// Arrow schema captured from the scanner at construction.
+    schema: SchemaRef,
+}
+
+impl RecordBatchLogReader {
+    /// Create a reader that reads until the latest offsets at the time of creation.
+    ///
+    /// Queries the server for the current latest offset of each subscribed bucket, then reads
+    /// until those offsets are reached. Buckets whose subscribed offset already meets or exceeds
+    /// the latest offset are excluded (nothing to read).
+    ///
+    /// Partition metadata is fetched once during construction; no caching is needed since each
+    /// reader is typically short-lived.
+    pub async fn new_until_latest(
+        scanner: RecordBatchLogScanner,
+        admin: &FlussAdmin,
+    ) -> Result<Self> {
+        // Take the guard first so subscriptions cannot change between reading and using them.
+        scanner.try_set_reader_active()?;
+
+        let subscribed = scanner.get_subscribed_buckets();
+        if subscribed.is_empty() {
+            scanner.clear_reader_active();
+            return Err(Error::IllegalArgument {
+                message: "No buckets subscribed. Call subscribe() before creating a reader."
+                    .to_string(),
+            });
+        }
+
+        let stopping_offsets = match query_latest_offsets(admin, &scanner, &subscribed).await {
+            Ok(o) => o,
+            Err(e) => {
+                scanner.clear_reader_active();
+                return Err(e);
+            }
+        };
+        let schema = scanner.schema();
+
+        Ok(Self {
+            scanner,
+            stopping_offsets,
+            buffer: VecDeque::new(),
+            schema,
+        })
+    }
+
+    /// Create a reader with explicit stopping offsets per bucket.
+    ///
+    /// Every key in `stopping_offsets` **must** be a bucket that is currently subscribed on the
+    /// `scanner`; otherwise [`Error::IllegalArgument`] is returned, because a bucket that never
+    /// appears in polled batches would make the reader loop indefinitely.
+    ///
+    /// Use [`new_until_latest`](Self::new_until_latest) for the common case; it queries the
+    /// server and builds a validated stopping-offset map automatically.
+    pub fn new_until_offsets(
+        scanner: RecordBatchLogScanner,
+        stopping_offsets: HashMap<TableBucket, i64>,
+    ) -> Result<Self> {
+        scanner.try_set_reader_active()?;
+        // Reject unsubscribed buckets up front; `next_batch` would wait on them forever.
+        let subscribed = scanner.get_subscribed_buckets();
+        let is_subscribed = |tb: &TableBucket| subscribed.iter().any(|(sub, _)| sub == tb);
+        if let Some(missing) = stopping_offsets.keys().find(|&tb| !is_subscribed(tb)) {
+            scanner.clear_reader_active();
+            return Err(Error::IllegalArgument {
+                message: format!("Stopping offset refers to unsubscribed bucket: {missing:?}"),
+            });
+        }
+        let schema = scanner.schema();
+        Ok(Self {
+            scanner,
+            stopping_offsets,
+            buffer: VecDeque::new(),
+            schema,
+        })
+    }
+
+    /// Returns the Arrow schema for batches produced by this reader.
+    pub fn schema(&self) -> SchemaRef {
+        self.schema.clone()
+    }
+
+    /// Drain all remaining batches until stopping offsets are satisfied.
+    ///
+    /// This is a convenience for callers (e.g. bindings building a single Arrow table) that
+    /// want to materialize the full result in Rust without per-batch iteration.
+    pub async fn collect_all_batches(&mut self) -> Result<Vec<ScanBatch>> {
+        let mut out = Vec::new();
+        while let Some(b) = self.next_batch().await? {
+            out.push(b);
+        }
+        Ok(out)
+    }
+
+    /// Fetch the next [`ScanBatch`], or `None` if all buckets are caught up.
+    ///
+    /// Each call may internally poll multiple batches from the scanner,
+    /// buffer them, and return one at a time. Batches that cross a stopping
+    /// offset boundary are sliced to exclude records at or beyond the stop point.
+    ///
+    /// Completed buckets are unsubscribed from the scanner to avoid wasting
+    /// network traffic on data the reader will discard.
+    pub async fn next_batch(&mut self) -> Result<Option<ScanBatch>> {
+        loop {
+            if let Some(batch) = self.buffer.pop_front() {
+                return Ok(Some(batch));
+            }
+
+            if self.stopping_offsets.is_empty() {
+                return Ok(None);
+            }
+
+            let scan_batches = self.scanner.poll(DEFAULT_POLL_TIMEOUT).await?;
+
+            if scan_batches.is_empty() {
+                continue;
+            }
+
+            let completed =
+                filter_batches(scan_batches, &mut self.stopping_offsets, &mut self.buffer);
+
+            // The active-reader guard rejects the async `unsubscribe*` methods, so the reader
+            // cleans up its own completed buckets via the `_sync` variants: same map removal, no
+            // guard check. The partitioned/non-partitioned mismatch they silently ignore is
+            // unreachable because the reader inherits the scanner's partition mode.
+            for tb in completed {
+                if let Some(partition_id) = tb.partition_id() {
+                    self.scanner
+                        .unsubscribe_partition_sync(partition_id, tb.bucket_id());
+                } else {
+                    self.scanner.unsubscribe_sync(tb.bucket_id());
+                }
+            }
+        }
+    }
+
+    /// Convert this async reader into a synchronous [`arrow::record_batch::RecordBatchReader`].
+    ///
+    /// The returned adapter calls [`tokio::runtime::Handle::block_on`] on each iterator step.
+    /// **Do not** call this from inside a Tokio worker thread while the same runtime is driving
+    /// async work (nested `block_on` can panic or deadlock). Prefer
+    /// [`next_batch`](RecordBatchLogReader::next_batch) in async Rust code. This is intended for
+    /// sync/FFI boundaries (C++, some Python call paths).
+    pub fn to_record_batch_reader(
+        self,
+        handle: tokio::runtime::Handle,
+    ) -> SyncRecordBatchLogReader {
+        SyncRecordBatchLogReader {
+            reader: self,
+            handle,
+        }
+    }
+}
+
+/// Best-effort cleanup for a reader that is dropped before every bucket has reached
+/// its stopping offset (early `break`, an exception in the consumer, etc.).
+///
+/// Why this matters even though we own the scanner:
+///
+/// In pure Rust, dropping the reader also drops the owned `RecordBatchLogScanner`,
+/// which takes the `Arc<LogScannerInner>` count to zero and frees the inner state.
+/// The subscriptions go away with it, so this `Drop` has no visible effect there.
+///
+/// In the binding layer (Python today, C++/Elixir later), the binding keeps its own
+/// `Arc<LogScannerInner>` and calls
+/// [`RecordBatchLogScanner::new_shared_handle`] to obtain a second handle for
+/// the reader. If the reader is dropped mid-iteration, the inner state stays
+/// alive, and every bucket the reader had not yet completed is still present in
+/// `LogScannerStatus.bucket_status_map`. Later operations on the original
+/// `LogScanner` would then observe "ghost" subscriptions (extra buckets
+/// being polled, stale offsets, etc.).
+///
+/// `next_batch` already unsubscribes each completed bucket through the `_sync`
+/// variants, so `stopping_offsets` holds exactly the still-active set when `Drop`
+/// runs. Each remaining bucket is unsubscribed synchronously via the same
+/// `_sync` escape hatches (the underlying `LogScannerStatus` ops don't await),
+/// so this is safe to call from any context — sync, async, a Tokio worker, or
+/// a Python thread holding the GIL.
+///
+/// After cleanup, the `reader_active` guard is cleared so that the original
+/// scanner (held by the binding layer) can accept new subscriptions again.
+///
+/// Caveats:
+/// - Batches already buffered in `LogFetcher.log_fetch_buffer` for an
+///   unsubscribed bucket are not drained here. They'll either be filtered out
+///   by the next `RecordBatchLogReader` (via the "bucket not in
+///   stopping_offsets" branch) or surface to a direct `poll_arrow` caller, who
+///   was sharing scanner state in the first place.
+/// - `Drop` cannot return errors. The `_sync` variants no-op on
+///   partitioned/non-partitioned mismatch, but that mismatch is unreachable
+///   here because the reader was constructed from this scanner and inherited
+///   its partition mode.
+impl Drop for RecordBatchLogReader {
+    fn drop(&mut self) {
+        // Whatever is still tracked here was never completed by `next_batch`.
+        for bucket in std::mem::take(&mut self.stopping_offsets).into_keys() {
+            let bucket_id = bucket.bucket_id();
+            match bucket.partition_id() {
+                Some(pid) => self.scanner.unsubscribe_partition_sync(pid, bucket_id),
+                None => self.scanner.unsubscribe_sync(bucket_id),
+            };
+        }
+        self.scanner.clear_reader_active();
+    }
+}
+
+/// Synchronous adapter that implements [`arrow::record_batch::RecordBatchReader`].
+///
+/// Created via [`RecordBatchLogReader::to_record_batch_reader`]. Each `next()` call blocks the
+/// current thread on the provided Tokio runtime handle. The iterator yields plain
+/// [`RecordBatch`]es (bucket/offset metadata from [`ScanBatch`] is stripped to satisfy the
+/// Arrow trait contract).
+pub struct SyncRecordBatchLogReader {
+    /// Bounded async reader driven by each iterator step.
+    reader: RecordBatchLogReader,
+    /// Runtime handle used to `block_on` the reader's `next_batch` future.
+    handle: tokio::runtime::Handle,
+}
+
+impl Iterator for SyncRecordBatchLogReader {
+    type Item = std::result::Result<RecordBatch, arrow::error::ArrowError>;
+
+    /// Blocks for the next batch; `None` ends iteration, failures become `ExternalError`.
+    fn next(&mut self) -> Option<Self::Item> {
+        let polled = self.handle.block_on(self.reader.next_batch());
+        let stripped = polled.map(|found| found.map(ScanBatch::into_batch));
+        let converted = stripped.map_err(|e| arrow::error::ArrowError::ExternalError(Box::new(e)));
+        converted.transpose()
+    }
+}
+
+impl arrow::record_batch::RecordBatchReader for SyncRecordBatchLogReader {
+    fn schema(&self) -> SchemaRef {
+        SchemaRef::clone(&self.reader.schema) // same schema the wrapped reader reports
+    }
+}
+
+/// Resolve the latest offsets that serve as stopping offsets for the subscribed
+/// buckets, covering both partitioned and non-partitioned tables.
+///
+/// A bucket is left out of the result when there is nothing to read from it:
+/// its subscribed offset already meets or exceeds the latest offset, or its
+/// `latest_offset` is `0` (empty bucket, skipped silently). A negative latest
+/// offset is unexpected from the server; it is logged as a warning and the
+/// bucket is skipped.
+async fn query_latest_offsets(
+    admin: &FlussAdmin,
+    scanner: &RecordBatchLogScanner,
+    subscribed: &[(TableBucket, i64)],
+) -> Result<HashMap<TableBucket, i64>> {
+    // Partitioned tables are resolved partition by partition.
+    if scanner.is_partitioned() {
+        return query_partitioned_offsets(admin, scanner, subscribed).await;
+    }
+
+    // Index the subscribed start offsets by bucket id and collect the ids to query.
+    let mut subscribed_offset_by_bucket: HashMap<i32, i64> = HashMap::new();
+    let mut bucket_ids: Vec<i32> = Vec::with_capacity(subscribed.len());
+    for (tb, off) in subscribed {
+        bucket_ids.push(tb.bucket_id());
+        subscribed_offset_by_bucket.insert(tb.bucket_id(), *off);
+    }
+
+    let latest_by_bucket = admin
+        .list_offsets(scanner.table_path(), &bucket_ids, OffsetSpec::Latest)
+        .await?;
+
+    let table_id = scanner.table_id();
+    let mut stopping_offsets = HashMap::new();
+    for (bucket_id, latest_offset) in latest_by_bucket {
+        if latest_offset < 0 {
+            warn!(
+                "Server returned negative latest offset {latest_offset} for bucket {bucket_id} of table {table_id}; skipping bucket."
+            );
+            continue;
+        }
+
+        // `0` means an empty bucket; otherwise the subscription must still be behind.
+        let behind = match subscribed_offset_by_bucket.get(&bucket_id) {
+            Some(&subscribed_offset) => latest_offset > 0 && subscribed_offset < latest_offset,
+            None => false,
+        };
+        if behind {
+            stopping_offsets.insert(TableBucket::new(table_id, bucket_id), latest_offset);
+        }
+    }
+
+    Ok(stopping_offsets)
+}
+
+/// Resolve latest offsets for the subscriptions of a partitioned table.
+///
+/// Partition metadata is looked up once per reader construction and not cached,
+/// because a [`RecordBatchLogReader`] is typically short-lived and consumed.
+async fn query_partitioned_offsets(
+    admin: &FlussAdmin,
+    scanner: &RecordBatchLogScanner,
+    subscribed: &[(TableBucket, i64)],
+) -> Result<HashMap<TableBucket, i64>> {
+    let table_id = scanner.table_id();
+    let table_path = scanner.table_path();
+
+    // partition id -> partition name, needed to address the per-partition offset query.
+    let mut partition_id_to_name: HashMap<i64, String> = HashMap::new();
+    for info in admin.list_partition_infos(table_path).await? {
+        partition_id_to_name.insert(info.get_partition_id(), info.get_partition_name());
+    }
+
+    // Subscribed start offsets keyed by bucket, plus the bucket ids grouped per partition.
+    let mut subscribed_offset_map: HashMap<TableBucket, i64> = HashMap::new();
+    let mut by_partition: HashMap<i64, Vec<i32>> = HashMap::new();
+    for (tb, off) in subscribed {
+        subscribed_offset_map.insert(tb.clone(), *off);
+        let Some(partition_id) = tb.partition_id() else {
+            continue;
+        };
+        by_partition
+            .entry(partition_id)
+            .or_default()
+            .push(tb.bucket_id());
+    }
+
+    let mut result: HashMap<TableBucket, i64> = HashMap::new();
+    for (partition_id, bucket_ids) in by_partition {
+        let Some(partition_name) = partition_id_to_name.get(&partition_id) else {
+            return Err(Error::UnexpectedError {
+                message: format!("Unknown partition_id: {partition_id}"),
+                source: None,
+            });
+        };
+
+        let offsets = admin
+            .list_partition_offsets(table_path, partition_name, &bucket_ids, OffsetSpec::Latest)
+            .await?;
+
+        for (bucket_id, latest_offset) in offsets {
+            if latest_offset <= 0 {
+                // Zero is an empty bucket (silent); negative is unexpected and worth a warning.
+                if latest_offset < 0 {
+                    warn!(
+                        "Server returned negative latest offset {latest_offset} for bucket {bucket_id} of partition {partition_id} (table {table_id}); skipping bucket."
+                    );
+                }
+                continue;
+            }
+            let tb = TableBucket::new_with_partition(table_id, Some(partition_id), bucket_id);
+            let is_behind = subscribed_offset_map
+                .get(&tb)
+                .map_or(false, |&subscribed_offset| subscribed_offset < latest_offset);
+            if is_behind {
+                result.insert(tb, latest_offset);
+            }
+        }
+    }
+
+    Ok(result)
+}
+
+/// Apply the per-bucket stopping offsets to freshly polled batches.
+///
+/// Each batch is handled according to where it sits relative to its bucket's stop offset:
+/// - bucket not present in `stopping_offsets`: the batch is skipped;
+/// - `base_offset >= stop_at`: the bucket is exhausted and removed from the map;
+/// - `last_offset >= stop_at`: the batch is sliced to the records before `stop_at`;
+/// - otherwise the full batch is kept.
+///
+/// Kept batches with at least one row are appended to `buffer`. Empty ones (a
+/// server-emitted batch without rows, or a slice that shrinks to zero rows) are
+/// dropped, so consumers never observe an empty `ScanBatch`. The return value
+/// lists the buckets that completed, i.e. were removed from `stopping_offsets`,
+/// during this call.
+fn filter_batches(
+    scan_batches: Vec<ScanBatch>,
+    stopping_offsets: &mut HashMap<TableBucket, i64>,
+    buffer: &mut VecDeque<ScanBatch>,
+) -> Vec<TableBucket> {
+    let mut completed = Vec::new();
+
+    for scan_batch in scan_batches {
+        let bucket = scan_batch.bucket().clone();
+        // Buckets that are not (or no longer) tracked contribute nothing.
+        let stop_at = match stopping_offsets.get(&bucket) {
+            Some(&offset) => offset,
+            None => continue,
+        };
+        let base_offset = scan_batch.base_offset();
+        let last_offset = scan_batch.last_offset();
+
+        // Done once the batch starts at/after the stop or reaches the last wanted record.
+        let bucket_done = base_offset >= stop_at || last_offset >= stop_at - 1;
+
+        if base_offset < stop_at {
+            let kept_batch = if last_offset < stop_at {
+                scan_batch
+            } else {
+                // Crosses the boundary: keep only the rows located before `stop_at`.
+                let rows_before_stop = (stop_at - base_offset) as usize;
+                let whole = scan_batch.into_batch();
+                let limit = rows_before_stop.min(whole.num_rows());
+                ScanBatch::new(bucket.clone(), whole.slice(0, limit), base_offset)
+            };
+            if kept_batch.batch().num_rows() != 0 {
+                buffer.push_back(kept_batch);
+            }
+        }
+
+        if bucket_done {
+            stopping_offsets.remove(&bucket);
+            completed.push(bucket);
+        }
+    }
+
+    completed
+}
+
+// TODO: Add Rust-level end-to-end tests with `FlussTestingCluster` (feature
+// `integration_tests`) covering `new_until_latest`, partitioned tables,
+// and `new_until_offsets` stopping semantics. Drop cleanup and the
+// reader-active guard are covered by the Python integration test
+// `test_to_arrow_batch_reader_drop_and_guard`.
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use arrow::array::Int32Array;
+    use arrow_schema::{DataType, Field, Schema};
+    use std::sync::Arc;
+
+    fn test_schema() -> SchemaRef {
+        Arc::new(Schema::new(vec![Field::new("v", DataType::Int32, false)]))
+    }
+
+    fn make_batch(values: &[i32]) -> RecordBatch {
+        RecordBatch::try_new(
+            test_schema(),
+            vec![Arc::new(Int32Array::from(values.to_vec()))],
+        )
+        .unwrap()
+    }
+
+    fn make_scan_batch(bucket: TableBucket, base_offset: i64, values: &[i32]) -> ScanBatch {
+        ScanBatch::new(bucket, make_batch(values), base_offset)
+    }
+
+    fn bucket(id: i32) -> TableBucket {
+        TableBucket::new(1, id)
+    }
+
+    #[test]
+    fn filter_batch_entirely_before_stop() {
+        let mut offsets = HashMap::from([(bucket(0), 100)]);
+        let mut buffer = VecDeque::new();
+        // base_offset=10, 3 rows -> offsets 10,11,12; all below stop_at=100 -> keep all, not done
+        let batches = vec![make_scan_batch(bucket(0), 10, &[1, 2, 3])];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert_eq!(buffer.len(), 1);
+        assert_eq!(buffer[0].batch().num_rows(), 3);
+        assert!(offsets.contains_key(&bucket(0)));
+        assert!(completed.is_empty());
+    }
+
+    #[test]
+    fn filter_batch_crossing_stop_offset_is_sliced() {
+        let mut offsets = HashMap::from([(bucket(0), 12)]);
+        let mut buffer = VecDeque::new();
+
+        // base_offset=10, 5 rows -> offsets 10..=14; stop_at=12 -> keep 2 (offsets 10 and 11)
+        let batches = vec![make_scan_batch(bucket(0), 10, &[1, 2, 3, 4, 5])];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert_eq!(buffer.len(), 1);
+        assert_eq!(buffer[0].batch().num_rows(), 2);
+        assert!(!offsets.contains_key(&bucket(0)));
+        assert_eq!(completed, vec![bucket(0)]);
+    }
+
+    #[test]
+    fn filter_batch_at_or_after_stop_offset_is_skipped() {
+        let mut offsets = HashMap::from([(bucket(0), 10)]);
+        let mut buffer = VecDeque::new();
+
+        // base_offset=10, stop_at=10 -> base >= stop: nothing is kept, bucket completes
+        let batches = vec![make_scan_batch(bucket(0), 10, &[1, 2, 3])];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert!(buffer.is_empty());
+        assert!(!offsets.contains_key(&bucket(0)));
+        assert_eq!(completed, vec![bucket(0)]);
+    }
+
+    #[test]
+    fn filter_batch_ending_exactly_at_stop_minus_one() {
+        let mut offsets = HashMap::from([(bucket(0), 13)]);
+        let mut buffer = VecDeque::new();
+
+        // base_offset=10, 3 rows -> offsets 10,11,12; last_offset=12, stop_at=13
+        // last_offset (12) >= stop_at - 1 (12) => full batch kept and bucket done
+        let batches = vec![make_scan_batch(bucket(0), 10, &[1, 2, 3])];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert_eq!(buffer.len(), 1);
+        assert_eq!(buffer[0].batch().num_rows(), 3);
+        assert!(!offsets.contains_key(&bucket(0)));
+        assert_eq!(completed, vec![bucket(0)]);
+    }
+
+    #[test]
+    fn filter_unknown_bucket_is_ignored() {
+        let mut offsets = HashMap::from([(bucket(0), 100)]);
+        let mut buffer = VecDeque::new();
+        // bucket 99 has no entry in the stopping-offset map -> its batch is skipped
+        let batches = vec![make_scan_batch(bucket(99), 0, &[1, 2])];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert!(buffer.is_empty());
+        assert!(offsets.contains_key(&bucket(0)));
+        assert!(completed.is_empty());
+    }
+
+    #[test]
+    fn filter_multiple_buckets_independent_tracking() {
+        let mut offsets = HashMap::from([(bucket(0), 12), (bucket(1), 5)]);
+        let mut buffer = VecDeque::new();
+
+        let batches = vec![
+            make_scan_batch(bucket(0), 10, &[1, 2, 3]), // last=12, stop=12 -> keep 2, done
+            make_scan_batch(bucket(1), 0, &[10, 20, 30]), // last=2, stop=5 -> keep all, not done
+        ];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert_eq!(buffer.len(), 2);
+        assert_eq!(buffer[0].batch().num_rows(), 2); // bucket 0: sliced
+        assert_eq!(buffer[1].batch().num_rows(), 3); // bucket 1: full
+        assert!(!offsets.contains_key(&bucket(0))); // bucket 0: done
+        assert!(offsets.contains_key(&bucket(1))); // bucket 1: still tracking
+        assert_eq!(completed, vec![bucket(0)]);
+    }
+
+    #[test]
+    fn filter_empty_batch_at_stop() {
+        let mut offsets = HashMap::from([(bucket(0), 5)]);
+        let mut buffer = VecDeque::new();
+
+        // empty batch: base_offset=5, 0 rows -> last_offset = base-1 = 4
+        // base_offset (5) >= stop_at (5) -> skipped, bucket removed as completed
+        let batches = vec![make_scan_batch(bucket(0), 5, &[])];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert!(buffer.is_empty());
+        assert!(!offsets.contains_key(&bucket(0)));
+        assert_eq!(completed, vec![bucket(0)]);
+    }
+
+    #[test]
+    fn filter_drops_empty_batch_before_stop() {
+        // Empty batch well below the stop offset: base=5, 0 rows -> last=4, stop=100.
+        // base_offset (5) < stop_at (100) and last_offset (4) < stop_at (100),
+        // so it falls into the "keep full batch" branch but must not surface to
+        // the consumer because it has zero rows.
+        let mut offsets = HashMap::from([(bucket(0), 100)]);
+        let mut buffer = VecDeque::new();
+
+        let batches = vec![make_scan_batch(bucket(0), 5, &[])];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert!(buffer.is_empty());
+        assert!(offsets.contains_key(&bucket(0)));
+        assert!(completed.is_empty());
+    }
+
+    #[test]
+    fn filter_single_row_batch_before_stop() {
+        let mut offsets = HashMap::from([(bucket(0), 10)]);
+        let mut buffer = VecDeque::new();
+        // base_offset=5, 1 row -> last_offset=5; stop=10 -> keep it, bucket not done
+        let batches = vec![make_scan_batch(bucket(0), 5, &[42])];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert_eq!(buffer.len(), 1);
+        assert_eq!(buffer[0].batch().num_rows(), 1);
+        assert!(offsets.contains_key(&bucket(0)));
+        assert!(completed.is_empty());
+    }
+
+    #[test]
+    fn filter_single_row_batch_at_stop_boundary() {
+        let mut offsets = HashMap::from([(bucket(0), 5)]);
+        let mut buffer = VecDeque::new();
+
+        // base_offset=4, 1 row -> last_offset=4, stop=5
+        // last < stop -> keep all; last (4) >= stop-1 (4) -> done
+        let batches = vec![make_scan_batch(bucket(0), 4, &[42])];
+        let completed = filter_batches(batches, &mut offsets, &mut buffer);
+
+        assert_eq!(buffer.len(), 1);
+        assert_eq!(buffer[0].batch().num_rows(), 1);
+        assert!(!offsets.contains_key(&bucket(0)));
+        assert_eq!(completed, vec![bucket(0)]);
+    }
+
+    #[test]
+    fn filter_preserves_scan_batch_metadata() {
+        let mut offsets = HashMap::from([(bucket(3), 100)]);
+        let mut buffer = VecDeque::new();
+        // a batch kept in full must still carry its original bucket and base offset
+        let batches = vec![make_scan_batch(bucket(3), 42, &[1, 2])];
+        filter_batches(batches, &mut offsets, &mut buffer);
+
+        let sb = &buffer[0];
+        assert_eq!(*sb.bucket(), bucket(3));
+        assert_eq!(sb.base_offset(), 42);
+    }
+
+    #[test]
+    fn filter_sliced_batch_preserves_base_offset() {
+        let mut offsets = HashMap::from([(bucket(0), 12)]);
+        let mut buffer = VecDeque::new();
+        // slicing keeps the leading rows, so the base offset must stay at 10
+        let batches = vec![make_scan_batch(bucket(0), 10, &[1, 2, 3, 4, 5])];
+        filter_batches(batches, &mut offsets, &mut buffer);
+
+        let sb = &buffer[0];
+        assert_eq!(sb.base_offset(), 10);
+        assert_eq!(*sb.bucket(), bucket(0));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index c6228e59f9..868709919f 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -257,6 +257,10 @@ pub struct LogScanner {
 ///
 /// More efficient than [`LogScanner`] for batch-level analytics where per-record
 /// metadata (offsets, timestamps) is not needed.
+///
+/// This type is intentionally **not** `Clone`. To perform a bounded read, move
+/// the scanner into a [`crate::client::RecordBatchLogReader`] — the compiler
+/// then prevents concurrent polls by construction.
 pub struct RecordBatchLogScanner {
     inner: Arc<LogScannerInner>,
 }
@@ -269,6 +273,10 @@ struct LogScannerInner {
     log_scanner_status: Arc<LogScannerStatus>,
     log_fetcher: LogFetcher,
     is_partitioned_table: bool,
+    arrow_schema: SchemaRef,
+    /// Guards against subscription changes while a
+    /// [`crate::client::RecordBatchLogReader`] is iterating.
+    reader_active: std::sync::atomic::AtomicBool,
 }
 
 impl LogScannerInner {
@@ -280,6 +288,20 @@ impl LogScannerInner {
         projected_fields: Option<Vec<usize>>,
     ) -> Result<Self> {
         let log_scanner_status = Arc::new(LogScannerStatus::new());
+
+        let full_row_type = table_info.get_row_type();
+        let arrow_schema = match &projected_fields {
+            Some(indices) => {
+                let projected_fields_vec: Vec<_> = indices
+                    .iter()
+                    .map(|&i| full_row_type.fields()[i].clone())
+                    .collect();
+                let projected_row_type = crate::metadata::RowType::new(projected_fields_vec);
+                to_arrow_schema(&projected_row_type)?
+            }
+            None => to_arrow_schema(full_row_type)?,
+        };
+
         Ok(Self {
             table_path: table_info.table_path.clone(),
             table_id: table_info.table_id,
@@ -288,15 +310,31 @@ impl LogScannerInner {
             log_scanner_status: log_scanner_status.clone(),
             log_fetcher: LogFetcher::new(
                 table_info.clone(),
-                connections.clone(),
-                metadata.clone(),
+                connections,
+                metadata,
                 log_scanner_status.clone(),
                 config,
                 projected_fields,
             )?,
+            arrow_schema,
+            reader_active: std::sync::atomic::AtomicBool::new(false),
         })
     }
 
+    /// Rejects subscription changes while a `RecordBatchLogReader` holds the reader-active flag.
+    fn check_no_active_reader(&self) -> Result<()> {
+        let reader_is_active = self.reader_active.load(std::sync::atomic::Ordering::Acquire);
+        if !reader_is_active {
+            return Ok(());
+        }
+
+        Err(Error::IllegalArgument {
+            message: "Cannot modify subscriptions while a RecordBatchLogReader is active. \
+                      Drop the reader first."
+                .to_string(),
+        })
+    }
+
     async fn poll_records(&self, timeout: Duration) -> Result<ScanRecords> {
         let start = Instant::now();
         let deadline = start + timeout;
@@ -337,6 +375,7 @@ impl LogScannerInner {
     }
 
     async fn subscribe(&self, bucket: i32, offset: i64) -> Result<()> {
+        self.check_no_active_reader()?;
         if self.is_partitioned_table {
             return Err(Error::UnsupportedOperation {
                 message: "The table is a partitioned table, please use \"subscribe_partition\" to \
@@ -354,6 +393,7 @@ impl LogScannerInner {
     }
 
     async fn subscribe_buckets(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()> {
+        self.check_no_active_reader()?;
         if self.is_partitioned_table {
             return Err(Error::UnsupportedOperation {
                 message:
@@ -376,6 +416,7 @@ impl LogScannerInner {
         bucket: i32,
         offset: i64,
     ) -> Result<()> {
+        self.check_no_active_reader()?;
         if !self.is_partitioned_table {
             return Err(Error::UnsupportedOperation {
                 message: "The table is not a partitioned table, please use \"subscribe\" to \
@@ -397,6 +438,7 @@ impl LogScannerInner {
         &self,
         partition_bucket_offsets: &HashMap<(PartitionId, i32), i64>,
     ) -> Result<()> {
+        self.check_no_active_reader()?;
         if !self.is_partitioned_table {
             return Err(UnsupportedOperation {
                 message: "The table is not a partitioned table, please use \"subscribe_buckets\" \
@@ -431,6 +473,7 @@ impl LogScannerInner {
     }
 
     async fn unsubscribe(&self, bucket: i32) -> Result<()> {
+        self.check_no_active_reader()?;
         if self.is_partitioned_table {
             return Err(Error::UnsupportedOperation {
                 message:
@@ -446,6 +489,7 @@ impl LogScannerInner {
     }
 
     async fn unsubscribe_partition(&self, partition_id: PartitionId, bucket: i32) -> Result<()> {
+        self.check_no_active_reader()?;
         if !self.is_partitioned_table {
             return Err(Error::UnsupportedOperation {
                 message: "Can't unsubscribe a partition for a non-partitioned table.".to_string(),
@@ -615,6 +659,95 @@ impl RecordBatchLogScanner {
     ) -> Result<()> {
         self.inner.unsubscribe_partition(partition_id, bucket).await
     }
+
+    /// Returns the Arrow schema for batches produced by this scanner.
+    pub fn schema(&self) -> SchemaRef {
+        self.inner.arrow_schema.clone()
+    }
+
+    pub fn table_path(&self) -> &TablePath {
+        &self.inner.table_path
+    }
+
+    pub fn table_id(&self) -> TableId {
+        self.inner.table_id
+    }
+
+    /// Creates a new handle to the same underlying scanner state.
+    ///
+    /// Binding layers (Python, C++) that hold the scanner behind shared
+    /// ownership (`Arc`) cannot move it into a [`crate::client::RecordBatchLogReader`].
+    /// This method produces a second handle so the reader can take ownership
+    /// while the binding retains its reference for subscription management.
+    ///
+    /// **Not intended for general use** — prefer moving the scanner directly.
+    #[doc(hidden)]
+    pub fn new_shared_handle(&self) -> Self {
+        RecordBatchLogScanner {
+            inner: Arc::clone(&self.inner),
+        }
+    }
+
+    /// Atomically marks the scanner as having an active reader.
+    ///
+    /// Returns `Err(IllegalArgument)` if another reader is already active on
+    /// this scanner — only one [`crate::client::RecordBatchLogReader`] may
+    /// iterate per scanner at a time. This mirrors Java's
+    /// `LogScannerImpl.acquire()` single-consumer guard.
+    pub(crate) fn try_set_reader_active(&self) -> Result<()> {
+        use std::sync::atomic::Ordering;
+        self.inner
+            .reader_active
+            .compare_exchange(false, true, Ordering::AcqRel, Ordering::Acquire)
+            .map(|_| ())
+            .map_err(|_| Error::IllegalArgument {
+                message: "Another RecordBatchLogReader is already active on this scanner. \
+                          Drop the existing reader first."
+                    .to_string(),
+            })
+    }
+
+    /// Clears the active-reader guard, re-enabling subscription changes.
+    pub(crate) fn clear_reader_active(&self) {
+        self.inner
+            .reader_active
+            .store(false, std::sync::atomic::Ordering::Release);
+    }
+
+    /// Synchronous, infallible counterpart to [`unsubscribe`](Self::unsubscribe).
+    ///
+    /// Exists so [`crate::client::RecordBatchLogReader`]'s `Drop` impl can
+    /// release lingering subscriptions without `.await`. The async version is
+    /// also synchronous under the hood (it only acquires a lock and removes
+    /// from a map — no IO), so this exposes the same work without the
+    /// async wrapper. Silently no-ops on partitioned/non-partitioned mismatch
+    /// because `Drop` cannot return errors; callers must pick the correct
+    /// variant.
+    ///
+    /// **Not intended for general use** — prefer the async [`unsubscribe`](Self::unsubscribe).
+    pub(crate) fn unsubscribe_sync(&self, bucket: i32) {
+        if self.inner.is_partitioned_table {
+            return;
+        }
+        let table_bucket = TableBucket::new(self.inner.table_id, bucket);
+        self.inner
+            .log_scanner_status
+            .unassign_scan_buckets(from_ref(&table_bucket));
+    }
+
+    /// Synchronous, infallible counterpart to
+    /// [`unsubscribe_partition`](Self::unsubscribe_partition). See
+    /// [`unsubscribe_sync`](Self::unsubscribe_sync) for rationale.
+    pub(crate) fn unsubscribe_partition_sync(&self, partition_id: PartitionId, bucket: i32) {
+        if !self.inner.is_partitioned_table {
+            return;
+        }
+        let table_bucket =
+            TableBucket::new_with_partition(self.inner.table_id, Some(partition_id), bucket);
+        self.inner
+            .log_scanner_status
+            .unassign_scan_buckets(from_ref(&table_bucket));
+    }
 }
 
 struct LogFetcher {
@@ -2009,6 +2142,7 @@ mod tests {
         let result = validate_scan_support(&table_path, &table_info);
         assert!(result.is_ok());
     }
+
     #[tokio::test]
     async fn prepare_fetch_log_requests_uses_configured_fetch_params() -> Result<()> {
         let table_path = TablePath::new("db".to_string(), "tbl".to_string());
diff --git a/fluss-rust/website/docs/user-guide/python/api-reference.md b/fluss-rust/website/docs/user-guide/python/api-reference.md
index dc252b682c..9bf0b6902f 100644
--- a/fluss-rust/website/docs/user-guide/python/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/python/api-reference.md
@@ -181,9 +181,12 @@ Builder for creating a `PrefixLookuper`. Obtain via `TableLookup.lookup_by(colum
 | `await .poll(timeout_ms) -> ScanRecords`                      | Poll individual records (record scanner only)                                    |
 | `await .poll_arrow(timeout_ms) -> pa.Table`                   | Poll as Arrow Table (batch scanner only)                                         |
 | `await .poll_record_batch(timeout_ms) -> list[RecordBatch]`   | Poll batches with metadata (batch scanner only)                                  |
+| `.to_arrow_batch_reader() -> pa.RecordBatchReader`            | Lazy Arrow RecordBatchReader reading until latest offsets (batch scanner only)    |
 | `await .to_arrow() -> pa.Table`                               | Read all subscribed data as Arrow Table (batch scanner only)                     |
 | `await .to_pandas() -> pd.DataFrame`                          | Read all subscribed data as DataFrame (batch scanner only)                       |
 
+> **Note:** Overlapping `poll_*` / `to_arrow*` / `to_arrow_batch_reader` calls on the same underlying scanner are not supported. Use only one active polling/consumption path at a time.
+
 ## `ScanRecords`
 
 Returned by `LogScanner.poll()`. Records are grouped by bucket.
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 03054f0f31..5d3068b5a2 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -151,6 +151,8 @@ Complete API reference for the Fluss Rust client.
 
 ## `RecordBatchLogScanner`
 
+Overlapping `poll` calls on clones that share state, or `poll` concurrent with `RecordBatchLogReader::next_batch`, are not supported. Use one active polling/consumption call at a time per underlying scanner state.
+
 | Method                                                                                                    | Description                                              |
 |-----------------------------------------------------------------------------------------------------------|----------------------------------------------------------|
 | `async fn subscribe(&self, bucket_id: i32, start_offset: i64) -> Result<()>`                              | Subscribe to a bucket                                    |
@@ -162,6 +164,48 @@ Complete API reference for the Fluss Rust client.
 | `async fn poll(&self, timeout: Duration) -> Result<Vec<ScanBatch>>`                                       | Poll for Arrow record batches                            |
 | `fn is_partitioned(&self) -> bool`                                                                        | Check if the table is partitioned                        |
 | `fn get_subscribed_buckets(&self) -> Vec<(TableBucket, i64)>`                                             | Get all current subscriptions as (bucket, offset) pairs  |
+| `fn schema(&self) -> SchemaRef`                                                                           | Get the Arrow schema for batches produced by this scanner|
+| `fn table_path(&self) -> &TablePath`                                                                      | Get the table path                                       |
+| `fn table_id(&self) -> TableId`                                                                           | Get the table ID                                         |
+
+## `RecordBatchLogReader`
+
+Bounded log reader that consumes data up to specified stopping offsets, then terminates.
+Unlike `RecordBatchLogScanner`, which polls indefinitely, this reader stops automatically.
+
+| Method                                                                                                      | Description                                              |
+|-------------------------------------------------------------------------------------------------------------|----------------------------------------------------------|
+| `async fn new_until_latest(scanner: RecordBatchLogScanner, admin: &FlussAdmin) -> Result<Self>`              | Read until the latest offsets at time of creation         |
+| `fn new_until_offsets(scanner: RecordBatchLogScanner, stopping_offsets: HashMap<TableBucket, i64>) -> Result<Self>` | Read until custom stopping offsets per bucket             |
+| `async fn next_batch(&mut self) -> Result<Option<ScanBatch>>`                                                | Get the next batch with bucket/offset metadata, or `None` when all buckets caught up |
+| `async fn collect_all_batches(&mut self) -> Result<Vec<ScanBatch>>`                                          | Drain all batches (with metadata) until stopping offsets are satisfied |
+| `fn schema(&self) -> SchemaRef`                                                                              | Arrow schema for produced batches                        |
+| `fn to_record_batch_reader(self, handle: tokio::runtime::Handle) -> SyncRecordBatchLogReader`                | Sync adapter implementing `arrow::RecordBatchReader` (see below) |
+
+## `SyncRecordBatchLogReader`
+
+Synchronous adapter for `RecordBatchLogReader`. Created via
+`RecordBatchLogReader::to_record_batch_reader(handle)`.
+
+Implements both [`Iterator`] and [`arrow::record_batch::RecordBatchReader`], so it
+plugs into the wider Arrow ecosystem — FFI, PyArrow's
+`pa.RecordBatchReader.from_batches`, the C++ Arrow `RecordBatchReader` interface,
+DataFusion sources, etc.
+
+Each `next()` call drives the underlying async reader via
+`tokio::runtime::Handle::block_on`. **Do not call it from inside an asynchronous
+context (any Tokio runtime, not just this one)** — `block_on` panics there. Prefer
+`RecordBatchLogReader::next_batch` in async Rust code; use this adapter only at
+sync/FFI boundaries.
+
+Bucket and offset metadata carried by `ScanBatch` is **dropped** here, because
+the Arrow trait contract yields plain `RecordBatch`. If you need offsets or
+bucket identity per batch, use `next_batch` instead.
+
+| Method                                                          | Description                                      |
+|-----------------------------------------------------------------|--------------------------------------------------|
+| `fn next(&mut self) -> Option<Result<RecordBatch, ArrowError>>` | Iterator: next batch, or `None` when caught up   |
+| `fn schema(&self) -> SchemaRef`                                 | Arrow schema for produced batches                |
 
 ## `ScanRecord`
 

From e17e0873fadb46b6b7e518d570dbf1e21bf9b4e2 Mon Sep 17 00:00:00 2001
From: Jared Yu <qzyu999@gmail.com>
Date: Fri, 15 May 2026 12:56:38 +0100
Subject: [PATCH 269/287] feat: implement MAP data type support

---
 fluss-rust/bindings/cpp/src/types.rs          |   4 +
 fluss-rust/bindings/python/src/table.rs       |   1 +
 .../crates/fluss/src/client/table/append.rs   |   7 +-
 .../src/client/table/log_fetch_buffer.rs      |   8 +-
 .../crates/fluss/src/client/table/scanner.rs  |  42 +-
 .../crates/fluss/src/metadata/datatype.rs     |  23 +-
 fluss-rust/crates/fluss/src/record/arrow.rs   |  43 +-
 fluss-rust/crates/fluss/src/record/mod.rs     |   6 +-
 .../fluss/src/row/binary/binary_writer.rs     |  17 +-
 .../row/binary/iceberg_binary_row_writer.rs   |  10 +-
 .../crates/fluss/src/row/binary_array.rs      |  65 +-
 fluss-rust/crates/fluss/src/row/binary_map.rs | 555 ++++++++++++++++++
 fluss-rust/crates/fluss/src/row/column.rs     | 237 ++++++--
 .../crates/fluss/src/row/column_writer.rs     | 211 ++++++-
 .../src/row/compacted/compacted_key_writer.rs |   6 +-
 .../fluss/src/row/compacted/compacted_row.rs  | 172 +++++-
 .../src/row/compacted/compacted_row_reader.rs |  14 +-
 .../src/row/compacted/compacted_row_writer.rs |  10 +-
 fluss-rust/crates/fluss/src/row/datum.rs      | 284 +++++++--
 .../src/row/encode/compacted_key_encoder.rs   |  18 +-
 .../crates/fluss/src/row/field_getter.rs      |  54 +-
 fluss-rust/crates/fluss/src/row/lookup_row.rs |   6 +-
 fluss-rust/crates/fluss/src/row/mod.rs        |  24 +-
 .../crates/fluss/src/row/projected_row.rs     |   7 +-
 .../fluss/tests/integration/log_table.rs      |  84 +++
 25 files changed, 1765 insertions(+), 143 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/row/binary_map.rs

diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 84aec25b8f..9ef8fe72c4 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -529,6 +529,7 @@ pub fn resolve_row_types(
             Datum::TimestampNtz(ts) => Datum::TimestampNtz(*ts),
             Datum::TimestampLtz(ts) => Datum::TimestampLtz(*ts),
             Datum::Array(a) => Datum::Array(a.clone()),
+            Datum::Map(m) => Datum::Map(m.clone()),
             Datum::Row(_) => return Err(anyhow!("Row datum is not yet supported in C++ bindings")),
         };
         out.set_field(idx, resolved);
@@ -588,6 +589,9 @@ pub fn compacted_row_to_owned(
                 Datum::Blob(Cow::Owned(row.get_binary(i, dt.length())?.to_vec()))
             }
             fcore::metadata::DataType::Array(_) => Datum::Array(row.get_array(i)?),
+            fcore::metadata::DataType::Map(mt) => {
+                Datum::Map(row.get_map(i, mt.key_type(), mt.value_type())?)
+            }
             other => return Err(anyhow!("Unsupported data type for column {i}: {other:?}")),
         };
 
diff --git a/fluss-rust/bindings/python/src/table.rs b/fluss-rust/bindings/python/src/table.rs
index 4133bed47e..b30baeb5ca 100644
--- a/fluss-rust/bindings/python/src/table.rs
+++ b/fluss-rust/bindings/python/src/table.rs
@@ -1369,6 +1369,7 @@ fn python_value_to_datum(
                             }
                         }
                         Datum::Array(v) => writer.write_array(i, &v),
+                        Datum::Map(v) => writer.write_map(i, &v),
                         Datum::Row(_) => {
                             return Err(FlussError::new_err(
                                 "Row datum is not supported as an array element",
diff --git a/fluss-rust/crates/fluss/src/client/table/append.rs b/fluss-rust/crates/fluss/src/client/table/append.rs
index 535520085e..562e8ea7e7 100644
--- a/fluss-rust/crates/fluss/src/client/table/append.rs
+++ b/fluss-rust/crates/fluss/src/client/table/append.rs
@@ -126,7 +126,12 @@ impl AppendWriter {
     /// or dropped for fire-and-forget behavior (use `flush()` to ensure delivery).
     pub fn append_arrow_batch(&self, batch: RecordBatch) -> Result<WriteResultFuture> {
         let physical_table_path = if self.partition_getter.is_some() && batch.num_rows() > 0 {
-            let first_row = ColumnarRow::new(Arc::new(batch.clone()), 0, None);
+            let first_row = ColumnarRow::new(
+                Arc::new(batch.clone()),
+                Arc::new(self.table_info.row_type.clone()),
+                0,
+                None,
+            );
             Arc::new(get_physical_path(
                 &self.table_path,
                 self.partition_getter.as_ref(),
diff --git a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
index 0dff4e8749..9d45abad29 100644
--- a/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
+++ b/fluss-rust/crates/fluss/src/client/table/log_fetch_buffer.rs
@@ -842,7 +842,11 @@ mod tests {
 
     fn test_read_context() -> Result<ReadContext> {
         let row_type = RowType::new(vec![DataField::new("id", DataTypes::int(), None)]);
-        Ok(ReadContext::new(to_arrow_schema(&row_type)?, false))
+        Ok(ReadContext::new(
+            to_arrow_schema(&row_type)?,
+            Arc::new(row_type),
+            false,
+        ))
     }
 
     struct ErrorPendingFetch {
@@ -921,7 +925,7 @@ mod tests {
 
         let data = builder.build()?;
         let log_records = LogRecordsBatches::new(data.clone());
-        let read_context = ReadContext::new(to_arrow_schema(&row_type)?, false);
+        let read_context = ReadContext::new(to_arrow_schema(&row_type)?, Arc::new(row_type), false);
         let mut fetch = DefaultCompletedFetch::new(
             TableBucket::new(1, 0),
             log_records,
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 868709919f..a4164b9976 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -801,12 +801,20 @@ impl LogFetcher {
                     .collect(),
             )),
         };
-        let read_context =
-            Self::create_read_context(full_arrow_schema.clone(), projected_fields.clone(), false)?
-                .with_fluss_row_type(projected_row_type.clone());
-        let remote_read_context =
-            Self::create_read_context(full_arrow_schema, projected_fields.clone(), true)?
-                .with_fluss_row_type(projected_row_type);
+        let read_context = Self::create_read_context(
+            full_arrow_schema.clone(),
+            projected_row_type.clone(),
+            projected_fields.clone(),
+            false,
+        )?
+        .with_fluss_row_type(projected_row_type.clone());
+        let remote_read_context = Self::create_read_context(
+            full_arrow_schema,
+            projected_row_type.clone(),
+            projected_fields.clone(),
+            true,
+        )?
+        .with_fluss_row_type(projected_row_type);
 
         let tmp_dir = TempDir::with_prefix("fluss-remote-logs")?;
         let log_fetch_buffer = Arc::new(LogFetchBuffer::new(read_context.clone()));
@@ -851,14 +859,22 @@ impl LogFetcher {
 
     fn create_read_context(
         full_arrow_schema: SchemaRef,
+        row_type: Arc<RowType>,
         projected_fields: Option<Vec<usize>>,
         is_from_remote: bool,
     ) -> Result<ReadContext> {
         match projected_fields {
-            None => Ok(ReadContext::new(full_arrow_schema, is_from_remote)),
-            Some(fields) => {
-                ReadContext::with_projection_pushdown(full_arrow_schema, fields, is_from_remote)
-            }
+            None => Ok(ReadContext::new(
+                full_arrow_schema,
+                row_type,
+                is_from_remote,
+            )),
+            Some(fields) => ReadContext::with_projection_pushdown(
+                full_arrow_schema,
+                row_type,
+                fields,
+                is_from_remote,
+            ),
         }
     }
 
@@ -1901,7 +1917,8 @@ mod tests {
 
         let data = build_records(&table_info, Arc::new(table_path))?;
         let log_records = LogRecordsBatches::new(data.clone());
-        let read_context = ReadContext::new(to_arrow_schema(table_info.get_row_type())?, false);
+        let row_type = Arc::new(table_info.get_row_type().clone());
+        let read_context = ReadContext::new(to_arrow_schema(&row_type)?, row_type, false);
         let completed =
             DefaultCompletedFetch::new(bucket.clone(), log_records, data.len(), read_context, 0, 0);
         fetcher.log_fetch_buffer.add(Box::new(completed));
@@ -1931,7 +1948,8 @@ mod tests {
         let bucket = TableBucket::new(1, 0);
         let data = build_records(&table_info, Arc::new(table_path))?;
         let log_records = LogRecordsBatches::new(data.clone());
-        let read_context = ReadContext::new(to_arrow_schema(table_info.get_row_type())?, false);
+        let row_type = Arc::new(table_info.get_row_type().clone());
+        let read_context = ReadContext::new(to_arrow_schema(&row_type)?, row_type, false);
         let mut completed: Box<dyn CompletedFetch> = Box::new(DefaultCompletedFetch::new(
             bucket,
             log_records,
diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index ffc48a8b69..98823f075c 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -935,7 +935,7 @@ impl MapType {
     pub fn with_nullable(nullable: bool, key_type: DataType, value_type: DataType) -> Self {
         Self {
             nullable,
-            key_type: Box::new(key_type),
+            key_type: Box::new(key_type.as_non_nullable()),
             value_type: Box::new(value_type),
         }
     }
@@ -1452,16 +1452,22 @@ fn test_array_display() {
 #[test]
 fn test_map_display() {
     let map_type = MapType::new(DataTypes::string(), DataTypes::int());
-    assert_eq!(map_type.to_string(), "MAP<STRING, INT>");
+    assert_eq!(map_type.to_string(), "MAP<STRING NOT NULL, INT>");
 
     let map_type_non_null = MapType::with_nullable(false, DataTypes::int(), DataTypes::string());
-    assert_eq!(map_type_non_null.to_string(), "MAP<INT, STRING> NOT NULL");
+    assert_eq!(
+        map_type_non_null.to_string(),
+        "MAP<INT NOT NULL, STRING> NOT NULL"
+    );
 
     let nested_map = MapType::new(
         DataTypes::string(),
         DataTypes::map(DataTypes::int(), DataTypes::boolean()),
     );
-    assert_eq!(nested_map.to_string(), "MAP<STRING, MAP<INT, BOOLEAN>>");
+    assert_eq!(
+        nested_map.to_string(),
+        "MAP<STRING NOT NULL, MAP<INT NOT NULL, BOOLEAN>>"
+    );
 }
 
 #[test]
@@ -1497,7 +1503,7 @@ fn test_datatype_display() {
     assert_eq!(DataTypes::array(DataTypes::int()).to_string(), "ARRAY<INT>");
     assert_eq!(
         DataTypes::map(DataTypes::string(), DataTypes::int()).to_string(),
-        "MAP<STRING, INT>"
+        "MAP<STRING NOT NULL, INT>"
     );
 }
 
@@ -1525,7 +1531,7 @@ fn test_complex_nested_display() {
     ]);
     assert_eq!(
         row_type.to_string(),
-        "ROW<id INT, tags ARRAY<STRING>, metadata MAP<STRING, STRING>>"
+        "ROW<id INT, tags ARRAY<STRING>, metadata MAP<STRING NOT NULL, STRING>>"
     );
 }
 
@@ -1547,7 +1553,10 @@ fn test_deeply_nested_types() {
             DataTypes::field("y", DataTypes::int()),
         ]),
     ));
-    assert_eq!(nested.to_string(), "ARRAY<MAP<STRING, ROW<x INT, y INT>>>");
+    assert_eq!(
+        nested.to_string(),
+        "ARRAY<MAP<STRING NOT NULL, ROW<x INT, y INT>>>"
+    );
 }
 
 // ============================================================================
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 9f1a97840d..179062e90d 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -994,6 +994,7 @@ impl LogRecordBatch {
         let record_batch = read_context.record_batch(data)?;
         let arrow_reader = ArrowReader::new_with_fluss_row_type(
             Arc::new(record_batch),
+            read_context.row_type.clone(),
             read_context.fluss_row_type().cloned(),
         );
         let log_record_iterator = LogRecordIterator::Arrow(ArrowLogRecordIterator {
@@ -1020,6 +1021,7 @@ impl LogRecordBatch {
             Some(record_batch) => {
                 let arrow_reader = ArrowReader::new_with_fluss_row_type(
                     Arc::new(record_batch),
+                    read_context.row_type.clone(),
                     read_context.fluss_row_type().cloned(),
                 );
                 LogRecordIterator::Arrow(ArrowLogRecordIterator {
@@ -1237,7 +1239,7 @@ pub fn to_arrow_type(fluss_type: &DataType) -> Result<ArrowDataType> {
                 Arc::new(Field::new(
                     "entries",
                     ArrowDataType::Struct(arrow_schema::Fields::from(entry_fields)),
-                    fluss_type.is_nullable(),
+                    false,
                 )),
                 false,
             )
@@ -1341,6 +1343,7 @@ pub(crate) fn from_arrow_type(arrow_type: &ArrowDataType) -> Result<DataType> {
 pub struct ReadContext {
     target_schema: SchemaRef,
     full_schema: SchemaRef,
+    row_type: Arc<RowType>,
     projection: Option<Projection>,
     is_from_remote: bool,
     fluss_row_type: Option<Arc<RowType>>,
@@ -1357,10 +1360,15 @@ struct Projection {
 }
 
 impl ReadContext {
-    pub fn new(arrow_schema: SchemaRef, is_from_remote: bool) -> ReadContext {
+    pub fn new(
+        arrow_schema: SchemaRef,
+        row_type: Arc<RowType>,
+        is_from_remote: bool,
+    ) -> ReadContext {
         ReadContext {
             target_schema: arrow_schema.clone(),
             full_schema: arrow_schema,
+            row_type,
             projection: None,
             is_from_remote,
             fluss_row_type: None,
@@ -1378,6 +1386,7 @@ impl ReadContext {
 
     pub fn with_projection_pushdown(
         arrow_schema: SchemaRef,
+        row_type: Arc<RowType>,
         projected_fields: Vec<usize>,
         is_from_remote: bool,
     ) -> Result<ReadContext> {
@@ -1442,6 +1451,7 @@ impl ReadContext {
         Ok(ReadContext {
             target_schema,
             full_schema: arrow_schema,
+            row_type,
             projection: Some(project),
             is_from_remote,
             fluss_row_type: None,
@@ -1635,15 +1645,17 @@ impl Iterator for ArrowLogRecordIterator {
 
 pub struct ArrowReader {
     record_batch: Arc<RecordBatch>,
+    row_type: Arc<RowType>,
     fluss_row_type: Option<Arc<RowType>>,
     row_column_indices: Arc<[usize]>,
 }
 
 impl ArrowReader {
-    pub fn new(record_batch: Arc<RecordBatch>) -> Self {
+    pub fn new(record_batch: Arc<RecordBatch>, row_type: Arc<RowType>) -> Self {
         let row_column_indices = arrow_row_column_indices(&record_batch);
         ArrowReader {
             record_batch,
+            row_type,
             fluss_row_type: None,
             row_column_indices,
         }
@@ -1651,6 +1663,7 @@ impl ArrowReader {
 
     pub fn new_with_fluss_row_type(
         record_batch: Arc<RecordBatch>,
+        row_type: Arc<RowType>,
         fluss_row_type: Option<Arc<RowType>>,
     ) -> Self {
         let row_column_indices = match &fluss_row_type {
@@ -1659,6 +1672,7 @@ impl ArrowReader {
         };
         ArrowReader {
             record_batch,
+            row_type,
             fluss_row_type,
             row_column_indices,
         }
@@ -1671,6 +1685,7 @@ impl ArrowReader {
     pub fn read(&self, row_id: usize) -> ColumnarRow {
         ColumnarRow::with_indices(
             self.record_batch.clone(),
+            self.row_type.clone(),
             row_id,
             self.fluss_row_type.clone(),
             self.row_column_indices.clone(),
@@ -1799,10 +1814,10 @@ mod tests {
                 Arc::new(Field::new(
                     "entries",
                     ArrowDataType::Struct(arrow_schema::Fields::from(vec![
-                        Field::new("key", ArrowDataType::Utf8, true),
+                        Field::new("key", ArrowDataType::Utf8, false),
                         Field::new("value", ArrowDataType::Int32, true),
                     ])),
-                    true,
+                    false,
                 )),
                 false,
             )
@@ -1821,6 +1836,21 @@ mod tests {
         );
     }
 
+    #[test]
+    fn test_arrow_map_schema_strictness() {
+        let map_type = DataTypes::map(DataTypes::string(), DataTypes::int());
+        let arrow_type = to_arrow_type(&map_type).unwrap();
+
+        if let ArrowDataType::Map(entries_field, _) = arrow_type {
+            assert!(
+                !entries_field.is_nullable(),
+                "Arrow Map 'entries' field must be strictly non-nullable"
+            );
+        } else {
+            panic!("Expected ArrowDataType::Map, got {:?}", arrow_type);
+        }
+    }
+
     #[test]
     fn test_parse_ipc_message() {
         let empty_body: &[u8] = &le_bytes(&[0xFFFFFFFF, 0x00000000]);
@@ -1878,7 +1908,8 @@ mod tests {
             DataField::new("name", DataTypes::string(), None),
         ]);
         let schema = to_arrow_schema(&row_type).unwrap();
-        let result = ReadContext::with_projection_pushdown(schema, vec![0, 2], false);
+        let result =
+            ReadContext::with_projection_pushdown(schema, Arc::new(row_type), vec![0, 2], false);
 
         assert!(matches!(result, Err(IllegalArgument { .. })));
     }
diff --git a/fluss-rust/crates/fluss/src/record/mod.rs b/fluss-rust/crates/fluss/src/record/mod.rs
index 522fb03bbe..462bdebbc1 100644
--- a/fluss-rust/crates/fluss/src/record/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/mod.rs
@@ -246,10 +246,14 @@ mod tests {
     use std::sync::Arc;
 
     fn make_row(values: Vec<i32>, row_id: usize) -> ColumnarRow {
+        use crate::metadata::RowType;
         let schema = Arc::new(Schema::new(vec![Field::new("v", DataType::Int32, false)]));
         let batch = RecordBatch::try_new(schema, vec![Arc::new(Int32Array::from(values))])
             .expect("record batch");
-        ColumnarRow::new(Arc::new(batch), row_id, None)
+        let row_type = Arc::new(RowType::with_data_types(vec![
+            crate::metadata::DataType::Int(crate::metadata::IntType::new()),
+        ]));
+        ColumnarRow::new(Arc::new(batch), row_type, row_id, None)
     }
 
     #[test]
diff --git a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
index 7192ee57ab..3380629599 100644
--- a/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/binary_writer.rs
@@ -18,10 +18,10 @@
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::metadata::{DataType, RowType};
-use crate::row::Datum;
 use crate::row::Decimal;
 use crate::row::binary::BinaryRowFormat;
 use crate::row::datum::{TimestampLtz, TimestampNtz};
+use crate::row::{Datum, FlussArray, FlussMap};
 
 /// Writer to write a composite data format, like row, array,
 #[allow(dead_code)]
@@ -69,7 +69,9 @@ pub trait BinaryWriter {
 
     fn write_timestamp_ltz(&mut self, value: &TimestampLtz, precision: u32);
 
-    fn write_array(&mut self, value: &[u8]);
+    fn write_array(&mut self, value: &FlussArray);
+
+    fn write_map(&mut self, value: &FlussMap);
 
     // TODO Row serializer
     // fn write_row(&mut self, pos: i32, value: &InternalRow);
@@ -138,6 +140,7 @@ pub enum InnerValueWriter {
     TimestampNtz(u32), // precision
     TimestampLtz(u32), // precision
     Array,
+    Map,
     Row(NestedRowWriter),
 }
 
@@ -207,13 +210,10 @@ impl InnerValueWriter {
                 Ok(InnerValueWriter::TimestampLtz(t.precision()))
             }
             DataType::Array(_) => Ok(InnerValueWriter::Array),
+            DataType::Map(_) => Ok(InnerValueWriter::Map),
             DataType::Row(row_type) => Ok(InnerValueWriter::Row(NestedRowWriter::from_row_type(
                 row_type,
             )?)),
-            _ => unimplemented!(
-                "ValueWriter for DataType {:?} is currently not implemented",
-                data_type
-            ),
         }
     }
     pub fn write_value<W: BinaryWriter>(
@@ -273,7 +273,10 @@ impl InnerValueWriter {
                 writer.write_timestamp_ltz(ts, *p);
             }
             (InnerValueWriter::Array, Datum::Array(arr)) => {
-                writer.write_array(arr.as_bytes());
+                writer.write_array(arr);
+            }
+            (InnerValueWriter::Map, Datum::Map(map)) => {
+                writer.write_map(map);
             }
             (InnerValueWriter::Row(nested_writer), Datum::Row(inner_row)) => {
                 use crate::row::compacted::CompactedRowWriter;
diff --git a/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs b/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
index b0e8434d1d..4320a62285 100644
--- a/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
@@ -21,6 +21,8 @@ use crate::error::{Error, Result};
 use crate::metadata::DataType;
 use crate::row::Decimal;
 use crate::row::binary::{BinaryWriter, ValueWriter};
+use crate::row::binary_array::FlussArray;
+use crate::row::binary_map::FlussMap;
 
 const MICROS_PER_MILLI: i64 = 1_000;
 
@@ -225,8 +227,12 @@ impl BinaryWriter for IcebergBinaryRowWriter {
         self.write_raw(&micros.to_le_bytes());
     }
 
-    fn write_array(&mut self, _value: &[u8]) {
-        panic!("Iceberg key columns do not support array values");
+    fn write_array(&mut self, _value: &FlussArray) {
+        unreachable!("Array/Map types are rejected during value writer creation");
+    }
+
+    fn write_map(&mut self, _value: &FlussMap) {
+        unreachable!("Array/Map types are rejected during value writer creation");
     }
 
     fn complete(&mut self) {
diff --git a/fluss-rust/crates/fluss/src/row/binary_array.rs b/fluss-rust/crates/fluss/src/row/binary_array.rs
index d0e8c9a528..d4fab7620b 100644
--- a/fluss-rust/crates/fluss/src/row/binary_array.rs
+++ b/fluss-rust/crates/fluss/src/row/binary_array.rs
@@ -30,6 +30,7 @@ use crate::metadata::{DataType, RowType};
 use crate::row::Decimal;
 use crate::row::InternalRow;
 use crate::row::binary::{BinaryRowFormat, ValueWriter};
+use crate::row::binary_map::FlussMap;
 use crate::row::compacted::{CompactedRow, CompactedRowWriter, calculate_bit_set_width_in_bytes};
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
 use crate::row::field_getter::FieldGetter;
@@ -76,6 +77,22 @@ fn round_to_nearest_word(num_bytes: usize) -> usize {
     (num_bytes + 7) & !7
 }
 
+/// Classifies `dt` as fixed- or variable-length; `FlussArray::extent` uses the answer.
+fn is_variable_length_type(dt: &DataType) -> bool {
+    match dt {
+        // For these three the answer depends on whether the precision is compact.
+        DataType::Decimal(dec) => !Decimal::is_compact_precision(dec.precision()),
+        DataType::Timestamp(ts) => !TimestampNtz::is_compact(ts.precision()),
+        DataType::TimestampLTz(ts) => !TimestampLtz::is_compact(ts.precision()),
+        other => matches!(
+            other,
+            DataType::Char(_) | DataType::String(_) | DataType::Binary(_)
+                | DataType::Bytes(_) | DataType::Array(_) | DataType::Map(_)
+                | DataType::Row(_)
+        ),
+    }
+}
+
 /// A Fluss binary array, wire-compatible with Java's `BinaryArray`.
 ///
 /// Stores elements in a flat byte buffer with a header (element count + null bitmap)
@@ -219,6 +236,33 @@ impl FlussArray {
         (self.data[4 + byte_index] & (1u8 << bit)) != 0
     }
 
+    /// Computes the word-aligned number of bytes this array logically occupies: the end of
+    /// the fixed part or of the furthest variable-length payload, whichever is larger.
+    /// NOTE(review): treats the low 32 bits of every slot with a clear mark bit as a byte
+    /// length; confirm the writer also does so for non-compact timestamps — TODO verify.
+    pub fn extent(&self, element_type: &DataType) -> Result<usize> {
+        let header_bytes = calculate_header_in_bytes(self.size);
+        let slot_bytes = calculate_fix_length_part_size(element_type);
+        let fixed_end = round_to_nearest_word(header_bytes + self.size * slot_bytes);
+        if !is_variable_length_type(element_type) {
+            return Ok(fixed_end);
+        }
+
+        let mut furthest = fixed_end;
+        for idx in 0..self.size {
+            if self.is_null_at(idx) {
+                continue;
+            }
+            let slot = self.read_i64(idx, "extent calculation")? as u64;
+            if (slot & HIGHEST_FIRST_BIT) == 0 {
+                let start = (slot >> 32) as usize;
+                let span = (slot & 0xFFFF_FFFF) as usize;
+                furthest = furthest.max(start + span);
+            }
+        }
+        Ok(round_to_nearest_word(furthest))
+    }
+
     fn checked_slice(&self, start: usize, len: usize, context: &str) -> Result<&[u8]> {
         let end = start.checked_add(len).ok_or_else(|| IllegalArgument {
             message: format!("Overflow while reading {context}: start={start}, len={len}"),
@@ -423,6 +467,16 @@ impl FlussArray {
         FlussArray::from_owned_bytes(self.data.slice(start..start + len))
     }
 
+    pub fn get_map(
+        &self,
+        pos: usize,
+        key_type: &DataType,
+        value_type: &DataType,
+    ) -> Result<FlussMap> {
+        let (start, len) = self.read_var_len_span(pos)?;
+        FlussMap::from_owned_bytes(self.data.slice(start..start + len), key_type, value_type)
+    }
+
     pub fn get_row<'a>(&'a self, pos: usize, row_type: &'a RowType) -> Result<CompactedRow<'a>> {
         let bytes = self.read_var_len_bytes(pos)?;
         let header_size = calculate_bit_set_width_in_bytes(row_type.fields().len());
@@ -672,6 +726,11 @@ impl FlussArrayWriter {
         self.write_bytes_to_var_len_part(pos, value.as_bytes());
     }
 
+    /// Writes a nested FlussMap into this array at position `pos`.
+    pub fn write_map(&mut self, pos: usize, value: &FlussMap) {
+        self.write_bytes_to_var_len_part(pos, value.as_bytes());
+    }
+
     /// Writes a nested row at `pos`. Requires the writer to have been
     /// constructed via [`new`](Self::new) with a `DataType::Row(_)` element type.
     pub fn write_row(&mut self, pos: usize, row: &dyn InternalRow) -> Result<()> {
@@ -772,6 +831,10 @@ impl InternalRow for FlussArray {
     fn get_array(&self, pos: usize) -> Result<FlussArray> {
         self.get_array(pos)
     }
+
+    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
+        self.get_map(pos, key_type, value_type)
+    }
 }
 
 #[cfg(test)]
@@ -1133,7 +1196,7 @@ mod tests {
         outer.set_field(0, inner_arr.clone());
 
         let mut writer = CompactedRowWriter::new(1);
-        writer.write_array(inner_arr.as_bytes());
+        writer.write_array(&inner_arr);
         let bytes = writer.to_bytes();
 
         let outer_compacted = CompactedRow::from_bytes(outer_row_type, &bytes);
diff --git a/fluss-rust/crates/fluss/src/row/binary_map.rs b/fluss-rust/crates/fluss/src/row/binary_map.rs
new file mode 100644
index 0000000000..b710b69c7d
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/row/binary_map.rs
@@ -0,0 +1,555 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Binary map format matching Java's `BinaryMap.java` layout.
+//!
+//! Binary layout:
+//! ```text
+//! [4 bytes: keyArraySizeInBytes] + [Key BinaryArray bytes] + [Value BinaryArray bytes]
+//! ```
+
+use crate::error::Error::IllegalArgument;
+use crate::error::Result;
+use crate::metadata::DataType;
+use crate::row::binary_array::{FlussArray, FlussArrayWriter};
+use crate::row::datum::Datum;
+use bytes::Bytes;
+use serde::Serialize;
+use std::fmt;
+use std::hash::{Hash, Hasher};
+
+/// A Fluss binary map, wire-compatible with Java's `BinaryMap`.
+///
+/// `data` holds the full encoding (4-byte LE key-array length, key array, value array);
+/// `key_array`/`value_array` are the parallel arrays: entry `i` pairs key `i` with value `i`.
+#[derive(Clone)]
+pub struct FlussMap {
+    data: Bytes,
+    key_array: FlussArray,
+    value_array: FlussArray,
+}
+
+impl fmt::Debug for FlussMap {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        let mut summary = f.debug_struct("FlussMap");
+        summary.field("size", &self.size());
+        summary.field("data_len", &self.data.len());
+        summary.finish()
+    }
+}
+
+impl fmt::Display for FlussMap {
+    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
+        write!(f, "FlussMap[size={}]", self.size())
+    }
+}
+
+impl PartialEq for FlussMap {
+    fn eq(&self, other: &Self) -> bool {
+        self.data == other.data
+    }
+}
+
+impl Eq for FlussMap {}
+
+impl PartialOrd for FlussMap {
+    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
+        Some(self.cmp(other))
+    }
+}
+
+impl Ord for FlussMap {
+    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
+        self.data.cmp(&other.data)
+    }
+}
+
+impl Hash for FlussMap {
+    fn hash<H: Hasher>(&self, state: &mut H) {
+        self.data.hash(state);
+    }
+}
+
+impl Serialize for FlussMap {
+    fn serialize<S>(&self, serializer: S) -> std::result::Result<S::Ok, S::Error>
+    where
+        S: serde::Serializer,
+    {
+        serializer.serialize_bytes(&self.data)
+    }
+}
+
+impl FlussMap {
+    /// Parses `data` into (key array, value array), rejecting any malformed encoding.
+    fn validate(
+        data: &[u8],
+        key_type: &DataType,
+        value_type: &DataType,
+    ) -> Result<(FlussArray, FlussArray)> {
+        if data.len() < 4 {
+            return Err(IllegalArgument {
+                message: format!(
+                    "FlussMap data too short: need at least 4 bytes, got {}",
+                    data.len()
+                ),
+            });
+        }
+        let raw_key_size = i32::from_le_bytes(data[0..4].try_into().unwrap());
+        if raw_key_size < 0 {
+            return Err(IllegalArgument {
+                message: format!(
+                    "FlussMap key array size must be non-negative, got {}",
+                    raw_key_size
+                ),
+            });
+        }
+        let key_size = raw_key_size as usize;
+        if 4 + key_size > data.len() {
+            return Err(IllegalArgument {
+                message: format!(
+                    "FlussMap key array size {} exceeds remaining payload {}",
+                    key_size,
+                    data.len() - 4
+                ),
+            });
+        }
+
+        let key_bytes = &data[4..4 + key_size];
+        let value_bytes = &data[4 + key_size..];
+
+        let key_array = FlussArray::from_bytes(key_bytes).map_err(|e| IllegalArgument {
+            message: format!("Invalid key array in FlussMap: {}", e),
+        })?;
+
+        let value_array = FlussArray::from_bytes(value_bytes).map_err(|e| IllegalArgument {
+            message: format!("Invalid value array in FlussMap: {}", e),
+        })?;
+
+        if key_array.size() != value_array.size() {
+            return Err(IllegalArgument {
+                message: format!(
+                    "FlussMap key array size ({}) does not match value array size ({})",
+                    key_array.size(),
+                    value_array.size()
+                ),
+            });
+        }
+
+        // Strict extent check: each sub-array must occupy exactly its own region. Comparing only
+        // the sum would let a key array overrunning its region be offset by trailing garbage.
+        let key_extent = key_array.extent(key_type)?;
+        let value_extent = value_array.extent(value_type)?;
+        let expected_len = 4 + key_extent + value_extent;
+        if key_extent != key_size || value_extent != value_bytes.len() {
+            return Err(IllegalArgument {
+                message: format!(
+                    "FlussMap binary validation failed: expected {expected_len} bytes, got {} (key array: expected {key_extent}, declared {key_size})",
+                    data.len()
+                ),
+            });
+        }
+
+        // Centralized null-key check: FlussMap keys are never allowed to be null.
+        for i in 0..key_array.size() {
+            if key_array.is_null_at(i) {
+                return Err(IllegalArgument {
+                    message: "FlussMap keys cannot be null".to_string(),
+                });
+            }
+        }
+
+        Ok((key_array, value_array))
+    }
+
+    /// Creates a FlussMap from a byte slice (copies data).
+    pub(crate) fn from_bytes(
+        data: &[u8],
+        key_type: &DataType,
+        value_type: &DataType,
+    ) -> Result<Self> {
+        let (key_array, value_array) = Self::validate(data, key_type, value_type)?;
+        Ok(FlussMap {
+            data: Bytes::copy_from_slice(data),
+            key_array,
+            value_array,
+        })
+    }
+
+    /// Creates a FlussMap that keeps `data` as-is; `validate` still copies the two sub-arrays.
+    pub(crate) fn from_owned_bytes(
+        data: Bytes,
+        key_type: &DataType,
+        value_type: &DataType,
+    ) -> Result<Self> {
+        let (key_array, value_array) = Self::validate(&data, key_type, value_type)?;
+        Ok(FlussMap {
+            data,
+            key_array,
+            value_array,
+        })
+    }
+
+    /// Builds a FlussMap from parallel key/value arrays, copying both into one new buffer.
+    /// Only the entry counts are compared here: unlike `validate`, null keys are NOT rejected
+    /// and element types are not checked.
+    pub fn from_arrays(key_array: &FlussArray, value_array: &FlussArray) -> Result<Self> {
+        if key_array.size() != value_array.size() {
+            return Err(IllegalArgument {
+                message: format!(
+                    "FlussMap key array size ({}) does not match value array size ({})",
+                    key_array.size(),
+                    value_array.size()
+                ),
+            });
+        }
+
+        let key_bytes = key_array.as_bytes();
+        let value_bytes = value_array.as_bytes();
+
+        let mut data = Vec::with_capacity(4 + key_bytes.len() + value_bytes.len());
+        // Write the key array size (4 bytes)
+        // Java's BinaryMap uses memory segment methods which write in LE
+        data.extend_from_slice(&(key_bytes.len() as i32).to_le_bytes());
+        // Write key array bytes
+        data.extend_from_slice(key_bytes);
+        // Write value array bytes
+        data.extend_from_slice(value_bytes);
+
+        let data = Bytes::from(data);
+        Ok(FlussMap {
+            data,
+            key_array: key_array.clone(),
+            value_array: value_array.clone(),
+        })
+    }
+
+    /// Returns the number of entries in the map.
+    pub fn size(&self) -> usize {
+        self.key_array.size()
+    }
+
+    /// Returns the raw bytes of this map (the complete binary representation).
+    pub fn as_bytes(&self) -> &[u8] {
+        &self.data
+    }
+
+    /// Returns the key array.
+    pub fn key_array(&self) -> &FlussArray {
+        &self.key_array
+    }
+
+    /// Returns the value array.
+    pub fn value_array(&self) -> &FlussArray {
+        &self.value_array
+    }
+}
+
+/// Builds a `FlussMap` one entry at a time; `current_index` is the slot the next entry uses.
+pub struct FlussMapWriter {
+    key_writer: FlussArrayWriter,
+    value_writer: FlussArrayWriter,
+    key_type: DataType,
+    value_type: DataType,
+    current_index: usize,
+}
+
+impl FlussMapWriter {
+    /// Creates a writer whose key and value array writers are both sized for `capacity` entries.
+    pub fn new(capacity: usize, key_type: &DataType, value_type: &DataType) -> Self {
+        Self {
+            key_writer: FlussArrayWriter::new(capacity, key_type),
+            value_writer: FlussArrayWriter::new(capacity, value_type),
+            key_type: key_type.clone(),
+            value_type: value_type.clone(),
+            current_index: 0,
+        }
+    }
+
+    /// Writes `key` and `value` at the next index; a null `value` is stored as a null slot.
+    /// If the value write fails, the key is already written but the index is not advanced.
+    /// # Errors
+    /// Fails on a null key or a type mismatch; non-null `Row` data always mismatches (no arm).
+    pub fn write_entry(&mut self, key: Datum, value: Datum) -> Result<()> {
+        if key.is_null() {
+            return Err(IllegalArgument {
+                message: "FlussMap keys cannot be null".to_string(),
+            });
+        }
+
+        Self::write_datum(
+            &mut self.key_writer,
+            self.current_index,
+            key,
+            &self.key_type,
+        )?;
+        Self::write_datum(
+            &mut self.value_writer,
+            self.current_index,
+            value,
+            &self.value_type,
+        )?;
+        self.current_index += 1;
+        Ok(())
+    }
+
+    /// Completes both array writers and joins the results via `FlussMap::from_arrays`.
+    pub fn complete(self) -> Result<FlussMap> {
+        let key_array = self.key_writer.complete()?;
+        let value_array = self.value_writer.complete()?;
+        FlussMap::from_arrays(&key_array, &value_array)
+    }
+
+    fn write_datum(
+        writer: &mut FlussArrayWriter,
+        pos: usize,
+        datum: Datum,
+        dt: &DataType,
+    ) -> Result<()> {
+        if datum.is_null() {
+            writer.set_null_at(pos);
+            return Ok(());
+        }
+
+        match (dt, &datum) {
+            (DataType::Boolean(_), Datum::Bool(v)) => writer.write_boolean(pos, *v),
+            (DataType::TinyInt(_), Datum::Int8(v)) => writer.write_byte(pos, *v),
+            (DataType::SmallInt(_), Datum::Int16(v)) => writer.write_short(pos, *v),
+            (DataType::Int(_), Datum::Int32(v)) => writer.write_int(pos, *v),
+            (DataType::BigInt(_), Datum::Int64(v)) => writer.write_long(pos, *v),
+            (DataType::Float(_), Datum::Float32(v)) => writer.write_float(pos, v.into_inner()),
+            (DataType::Double(_), Datum::Float64(v)) => writer.write_double(pos, v.into_inner()),
+            (DataType::Char(_), Datum::String(v)) => writer.write_string(pos, v),
+            (DataType::String(_), Datum::String(v)) => writer.write_string(pos, v),
+            (DataType::Binary(_), Datum::Blob(v)) => writer.write_binary_bytes(pos, v),
+            (DataType::Bytes(_), Datum::Blob(v)) => writer.write_binary_bytes(pos, v),
+            (DataType::Decimal(d), Datum::Decimal(v)) => {
+                writer.write_decimal(pos, v, d.precision())
+            }
+            (DataType::Date(_), Datum::Date(v)) => writer.write_date(pos, *v),
+            (DataType::Time(_), Datum::Time(v)) => writer.write_time(pos, *v),
+            (DataType::Timestamp(t), Datum::TimestampNtz(v)) => {
+                writer.write_timestamp_ntz(pos, v, t.precision())
+            }
+            (DataType::TimestampLTz(t), Datum::TimestampLtz(v)) => {
+                writer.write_timestamp_ltz(pos, v, t.precision())
+            }
+            (DataType::Array(_), Datum::Array(v)) => writer.write_array(pos, v),
+            (DataType::Map(_), Datum::Map(v)) => writer.write_map(pos, v),
+            _ => {
+                return Err(IllegalArgument {
+                    message: format!("Type mismatch: expected {:?}, got {:?}", dt, datum),
+                });
+            }
+        }
+        Ok(())
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::metadata::DataTypes;
+    use crate::row::binary_array::FlussArrayWriter;
+
+    #[test]
+    fn test_round_trip_int_to_string_map() {
+        let mut writer = FlussMapWriter::new(2, &DataTypes::int(), &DataTypes::string());
+        writer.write_entry(1.into(), "a".into()).unwrap();
+        writer.write_entry(2.into(), "b".into()).unwrap();
+        let map = writer.complete().unwrap();
+        assert_eq!(map.size(), 2);
+
+        assert_eq!(
+            map.as_bytes(),
+            &[
+                16, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 2, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0,
+                0, 97, 0, 0, 0, 0, 0, 0, 129, 98, 0, 0, 0, 0, 0, 0, 129
+            ]
+        );
+
+        let bytes = map.as_bytes();
+        let decoded = FlussMap::from_bytes(bytes, &DataTypes::int(), &DataTypes::string()).unwrap();
+
+        assert_eq!(decoded.size(), 2);
+        let decoded_keys = decoded.key_array();
+        let decoded_values = decoded.value_array();
+
+        assert_eq!(decoded_keys.get_int(0).unwrap(), 1);
+        assert_eq!(decoded_keys.get_int(1).unwrap(), 2);
+        assert_eq!(decoded_values.get_string(0).unwrap(), "a");
+        assert_eq!(decoded_values.get_string(1).unwrap(), "b");
+    }
+
+    #[test]
+    fn test_empty_map() {
+        let writer = FlussMapWriter::new(0, &DataTypes::int(), &DataTypes::string());
+        let map = writer.complete().unwrap();
+        assert_eq!(map.size(), 0);
+
+        let decoded =
+            FlussMap::from_bytes(map.as_bytes(), &DataTypes::int(), &DataTypes::string()).unwrap();
+        assert_eq!(decoded.size(), 0);
+    }
+
+    #[test]
+    fn test_map_with_null_values() {
+        let key_type = DataTypes::string();
+        let value_type = DataTypes::int();
+        let mut writer = FlussMapWriter::new(3, &key_type, &value_type);
+        writer.write_entry("k1".into(), 10.into()).unwrap();
+        writer.write_entry("k2".into(), Datum::Null).unwrap();
+        writer.write_entry("k3".into(), 30.into()).unwrap();
+        let map = writer.complete().unwrap();
+
+        assert_eq!(
+            map.as_bytes(),
+            &[
+                32, 0, 0, 0, 3, 0, 0, 0, 0, 0, 0, 0, 107, 49, 0, 0, 0, 0, 0, 130, 107, 50, 0, 0, 0,
+                0, 0, 130, 107, 51, 0, 0, 0, 0, 0, 130, 3, 0, 0, 0, 2, 0, 0, 0, 10, 0, 0, 0, 0, 0,
+                0, 0, 30, 0, 0, 0, 0, 0, 0, 0
+            ]
+        );
+
+        let decoded = FlussMap::from_bytes(map.as_bytes(), &key_type, &value_type).unwrap();
+
+        let values = decoded.value_array();
+        assert_eq!(values.size(), 3);
+        assert!(!values.is_null_at(0));
+        assert!(values.is_null_at(1));
+        assert!(!values.is_null_at(2));
+        assert_eq!(values.get_int(0).unwrap(), 10);
+        assert_eq!(values.get_int(2).unwrap(), 30);
+    }
+
+    #[test]
+    fn test_invalid_data() {
+        // Too short
+        let err =
+            FlussMap::from_bytes(&[1, 2, 3], &DataTypes::int(), &DataTypes::int()).unwrap_err();
+        assert!(err.to_string().contains("FlussMap data too short"));
+
+        // Negative size
+        let neg_size = (-1i32).to_le_bytes();
+        let mut bad_data = vec![];
+        bad_data.extend_from_slice(&neg_size);
+        bad_data.extend_from_slice(&[0, 0, 0, 0]);
+        let err2 =
+            FlussMap::from_bytes(&bad_data, &DataTypes::int(), &DataTypes::int()).unwrap_err();
+        assert!(
+            err2.to_string()
+                .contains("FlussMap key array size must be non-negative")
+        );
+
+        // Key array length exceeds payload
+        let large_size = 100i32.to_le_bytes();
+        let mut bad_data2 = vec![];
+        bad_data2.extend_from_slice(&large_size);
+        bad_data2.extend_from_slice(&[0, 0, 0, 0]);
+        let err3 =
+            FlussMap::from_bytes(&bad_data2, &DataTypes::int(), &DataTypes::int()).unwrap_err();
+        assert!(
+            err3.to_string()
+                .contains("FlussMap key array size 100 exceeds remaining payload 4")
+        );
+    }
+
+    #[test]
+    fn test_mismatched_array_sizes() {
+        let key_writer = FlussArrayWriter::new(1, &DataTypes::int());
+        let key_array = key_writer.complete().unwrap();
+
+        let value_writer = FlussArrayWriter::new(2, &DataTypes::string());
+        let value_array = value_writer.complete().unwrap();
+
+        let err = FlussMap::from_arrays(&key_array, &value_array).unwrap_err();
+        assert!(err.to_string().contains("does not match value array size"));
+    }
+
+    #[test]
+    fn test_nested_map() {
+        let map_type = DataTypes::map(DataTypes::int(), DataTypes::string());
+        let mut inner_writer = FlussMapWriter::new(1, &DataTypes::int(), &DataTypes::string());
+        inner_writer.write_entry(1.into(), "b".into()).unwrap();
+        let inner_map = inner_writer.complete().unwrap();
+
+        let mut writer = FlussMapWriter::new(1, &DataTypes::string(), &map_type);
+        writer
+            .write_entry("a".into(), Datum::Map(inner_map))
+            .unwrap();
+        let map = writer.complete().unwrap();
+
+        let decoded =
+            FlussMap::from_bytes(map.as_bytes(), &DataTypes::string(), &map_type).unwrap();
+        let decoded_keys = decoded.key_array();
+        let decoded_values = decoded.value_array();
+
+        assert_eq!(decoded_keys.get_string(0).unwrap(), "a");
+        let decoded_inner_map = decoded_values
+            .get_map(0, &DataTypes::int(), &DataTypes::string())
+            .unwrap();
+        assert_eq!(decoded_inner_map.key_array().get_int(0).unwrap(), 1);
+        assert_eq!(decoded_inner_map.value_array().get_string(0).unwrap(), "b");
+    }
+
+    #[test]
+    fn test_trailing_garbage() {
+        let mut key_writer = FlussArrayWriter::new(1, &DataTypes::int());
+        key_writer.write_int(0, 1);
+        let key_array = key_writer.complete().unwrap();
+
+        let mut value_writer = FlussArrayWriter::new(1, &DataTypes::int());
+        value_writer.write_int(0, 100);
+        let value_array = value_writer.complete().unwrap();
+
+        let map = FlussMap::from_arrays(&key_array, &value_array).unwrap();
+        let bytes = map.as_bytes();
+
+        // Valid bytes should pass
+        assert!(FlussMap::from_bytes(bytes, &DataTypes::int(), &DataTypes::int()).is_ok());
+
+        // Append trailing garbage
+        let mut bad_bytes = bytes.to_vec();
+        bad_bytes.push(0);
+        let err =
+            FlussMap::from_bytes(&bad_bytes, &DataTypes::int(), &DataTypes::int()).unwrap_err();
+        assert!(err.to_string().contains("binary validation failed"));
+        assert!(err.to_string().contains("expected"));
+    }
+
+    #[test]
+    fn test_null_keys_fail_validation() {
+        let mut key_writer = FlussArrayWriter::new(1, &DataTypes::int());
+        key_writer.set_null_at(0); // null key!
+        let key_array = key_writer.complete().unwrap();
+
+        let mut value_writer = FlussArrayWriter::new(1, &DataTypes::int());
+        value_writer.write_int(0, 100);
+        let value_array = value_writer.complete().unwrap();
+
+        // Constructing bytes manually since from_arrays no longer catches it,
+        // and we want to verify validate catches it.
+        let key_bytes = key_array.as_bytes();
+        let value_bytes = value_array.as_bytes();
+        let mut data = vec![];
+        data.extend_from_slice(&(key_bytes.len() as i32).to_le_bytes());
+        data.extend_from_slice(key_bytes);
+        data.extend_from_slice(value_bytes);
+
+        let err = FlussMap::from_bytes(&data, &DataTypes::int(), &DataTypes::int()).unwrap_err();
+        assert!(err.to_string().contains("keys cannot be null"));
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 5db1cd5073..b088f124b6 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -20,11 +20,12 @@ use crate::error::Result;
 use crate::metadata::{DataType, RowType};
 use crate::record::from_arrow_type;
 use crate::row::binary_array::FlussArrayWriter;
+use crate::row::binary_map::FlussMap;
 use crate::row::datum::{Date, Datum, Time, TimestampLtz, TimestampNtz};
 use crate::row::{Decimal, FlussArray, GenericRow, InternalRow};
 use arrow::array::{
     Array, AsArray, BinaryArray, BooleanArray, Date32Array, Decimal128Array, FixedSizeBinaryArray,
-    Float32Array, Float64Array, Int8Array, Int16Array, Int32Array, Int64Array, ListArray,
+    Float32Array, Float64Array, Int8Array, Int16Array, Int32Array, Int64Array, ListArray, MapArray,
     RecordBatch, StringArray, StructArray, Time32MillisecondArray, Time32SecondArray,
     Time64MicrosecondArray, Time64NanosecondArray, TimestampMicrosecondArray,
     TimestampMillisecondArray, TimestampNanosecondArray, TimestampSecondArray,
@@ -40,6 +41,7 @@ use std::sync::Arc;
 #[derive(Clone)]
 pub struct ColumnarRow {
     record_batch: Arc<RecordBatch>,
+    row_type: Arc<RowType>,
     row_id: usize,
     fluss_row_type: Option<Arc<RowType>>,
     row_column_indices: Arc<[usize]>,
@@ -71,6 +73,7 @@ fn make_row_caches(indices: &[usize]) -> Box<[std::sync::OnceLock<GenericRow<'st
 impl ColumnarRow {
     pub fn new(
         batch: Arc<RecordBatch>,
+        row_type: Arc<RowType>,
         row_id: usize,
         fluss_row_type: Option<Arc<RowType>>,
     ) -> Self {
@@ -78,11 +81,12 @@ impl ColumnarRow {
             Some(rt) => fluss_row_column_indices(rt),
             None => arrow_row_column_indices(&batch),
         };
-        Self::with_indices(batch, row_id, fluss_row_type, row_column_indices)
+        Self::with_indices(batch, row_type, row_id, fluss_row_type, row_column_indices)
     }
 
     pub(crate) fn with_indices(
         batch: Arc<RecordBatch>,
+        row_type: Arc<RowType>,
         row_id: usize,
         fluss_row_type: Option<Arc<RowType>>,
         row_column_indices: Arc<[usize]>,
@@ -90,6 +94,7 @@ impl ColumnarRow {
         let row_caches = make_row_caches(&row_column_indices);
         ColumnarRow {
             record_batch: batch,
+            row_type,
             row_id,
             fluss_row_type,
             row_column_indices,
@@ -609,6 +614,18 @@ impl InternalRow for ColumnarRow {
     }
 
     fn get_array(&self, pos: usize) -> Result<FlussArray> {
+        let expected_type = self.row_type.fields()[pos].data_type();
+        let element_fluss_type = match expected_type {
+            DataType::Array(a) => a.get_element_type(),
+            _ => {
+                return Err(IllegalArgument {
+                    message: format!(
+                        "expected Array type at position {pos}, got {expected_type:?}"
+                    ),
+                });
+            }
+        };
+
         let column = self.column(pos)?;
         let values = if let Some(list_arr) = column.as_any().downcast_ref::<ListArray>() {
             list_arr.value(self.row_id)
@@ -621,13 +638,60 @@ impl InternalRow for ColumnarRow {
             });
         };
 
-        let element_fluss_type = from_arrow_type(values.data_type())?;
-        let mut writer = FlussArrayWriter::new(values.len(), &element_fluss_type);
+        // Validate that the Arrow element type matches the expected Fluss element type
+        let actual_element_type = from_arrow_type(values.data_type())?;
+        if actual_element_type != *element_fluss_type {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Arrow list element type {:?} does not match expected Fluss type {:?}",
+                    actual_element_type, element_fluss_type
+                ),
+            });
+        }
+
+        let mut writer = FlussArrayWriter::new(values.len(), element_fluss_type);
 
-        write_arrow_values_to_fluss_array(&*values, &element_fluss_type, &mut writer)?;
+        write_arrow_values_to_fluss_array(&*values, element_fluss_type, &mut writer)?;
         writer.complete()
     }
 
+    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
+        let column = self.column(pos)?;
+        let map_arr =
+            column
+                .as_any()
+                .downcast_ref::<MapArray>()
+                .ok_or_else(|| IllegalArgument {
+                    message: format!(
+                        "expected Map array at position {pos}, got {:?}",
+                        column.data_type()
+                    ),
+                })?;
+
+        // Validate that the Arrow map key/value types match the expected Fluss types
+        let actual_key_type = from_arrow_type(map_arr.key_type())?;
+        if actual_key_type != *key_type {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Arrow map key type {:?} does not match expected Fluss type {:?}",
+                    actual_key_type, key_type
+                ),
+            });
+        }
+        let actual_value_type = from_arrow_type(map_arr.value_type())?;
+        if actual_value_type != *value_type {
+            return Err(IllegalArgument {
+                message: format!(
+                    "Arrow map value type {:?} does not match expected Fluss type {:?}",
+                    actual_value_type, value_type
+                ),
+            });
+        }
+
+        // Get the entries for this specific row
+        arrow_map_entry_to_fluss_map(&map_arr.value(self.row_id), key_type, value_type)
+    }
+
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
         let cache_idx = self
             .row_column_indices
@@ -663,6 +727,60 @@ impl InternalRow for ColumnarRow {
     }
 }
 
+#[inline]
+fn arrow_map_entry_to_fluss_map(
+    struct_arr: &arrow::array::StructArray,
+    key_type: &DataType,
+    value_type: &DataType,
+) -> Result<FlussMap> {
+    if struct_arr.num_columns() != 2 {
+        return Err(IllegalArgument {
+            message: format!(
+                "Expected 2 columns in Map entries struct, got {}",
+                struct_arr.num_columns()
+            ),
+        });
+    }
+
+    let keys_arrow = struct_arr.column(0);
+    let values_arrow = struct_arr.column(1);
+
+    // Validate that the Arrow key/value types match the expected Fluss types
+    let actual_key_type = from_arrow_type(keys_arrow.data_type())?;
+    if actual_key_type != *key_type {
+        return Err(IllegalArgument {
+            message: format!(
+                "Arrow map key type {:?} does not match expected Fluss type {:?}",
+                actual_key_type, key_type
+            ),
+        });
+    }
+
+    let actual_value_type = from_arrow_type(values_arrow.data_type())?;
+    if actual_value_type != *value_type {
+        return Err(IllegalArgument {
+            message: format!(
+                "Arrow map value type {:?} does not match expected Fluss type {:?}",
+                actual_value_type, value_type
+            ),
+        });
+    }
+
+    let len = keys_arrow.len();
+
+    // Convert Arrow keys → FlussArray
+    let mut key_writer = FlussArrayWriter::new(len, key_type);
+    write_arrow_values_to_fluss_array(&**keys_arrow, key_type, &mut key_writer)?;
+    let key_array = key_writer.complete()?;
+
+    // Convert Arrow values → FlussArray
+    let mut value_writer = FlussArrayWriter::new(len, value_type);
+    write_arrow_values_to_fluss_array(&**values_arrow, value_type, &mut value_writer)?;
+    let value_array = value_writer.complete()?;
+
+    FlussMap::from_arrays(&key_array, &value_array)
+}
+
 /// Downcast to a primitive Arrow array type, then loop with null checks calling a writer method.
 macro_rules! write_primitive_elements {
     ($values:expr, $arrow_type:ty, $element_type:expr, $writer:expr, $write_method:ident) => {{
@@ -721,7 +839,10 @@ macro_rules! write_list_elements {
                     $element_type
                 ),
             })?;
-        let nested_element_type = from_arrow_type(&arr.value_type())?;
+        let nested_element_type = match $element_type {
+            DataType::Array(a) => a.get_element_type(),
+            _ => unreachable!("Expected Array type for write_list_elements"),
+        };
         for i in 0..$len {
             if arr.is_null(i) {
                 $writer.set_null_at(i);
@@ -877,6 +998,34 @@ fn write_arrow_values_to_fluss_array(
                 });
             }
         }
+        DataType::Map(_) => {
+            let map_arr =
+                values
+                    .as_any()
+                    .downcast_ref::<MapArray>()
+                    .ok_or_else(|| IllegalArgument {
+                        message: format!(
+                            "Expected MapArray for {element_type:?} element, got {:?}",
+                            values.data_type()
+                        ),
+                    })?;
+            for i in 0..len {
+                if map_arr.is_null(i) {
+                    writer.set_null_at(i);
+                } else {
+                    let expected_map_type = match element_type {
+                        DataType::Map(m) => m,
+                        _ => unreachable!("Expected Map type for Map variant"),
+                    };
+                    let fluss_map = arrow_map_entry_to_fluss_map(
+                        &map_arr.value(i),
+                        expected_map_type.key_type(),
+                        expected_map_type.value_type(),
+                    )?;
+                    writer.write_map(i, &fluss_map);
+                }
+            }
+        }
         DataType::Row(row_type) => {
             let struct_arr = values
                 .as_any()
@@ -896,13 +1045,6 @@ fn write_arrow_values_to_fluss_array(
                 }
             }
         }
-        _ => {
-            return Err(IllegalArgument {
-                message: format!(
-                    "unsupported element type for Arrow → FlussArray conversion: {element_type:?}"
-                ),
-            });
-        }
     }
     Ok(())
 }
@@ -1034,6 +1176,7 @@ fn write_timestamp_elements<T>(
 #[cfg(test)]
 mod tests {
     use super::*;
+    use crate::metadata::{DataField, RowType};
     use arrow::array::{
         ArrayRef, BinaryArray, BooleanArray, Decimal128Array, Float32Array, Float64Array,
         Int8Array, Int16Array, Int32Array, Int32Builder, Int64Array, ListBuilder, StringArray,
@@ -1041,29 +1184,43 @@ mod tests {
     };
     use arrow::datatypes::{DataType, Field, Fields, Schema};
 
+    fn infer_fluss_type(arrow_dt: &arrow_schema::DataType) -> crate::metadata::DataType {
+        match arrow_dt {
+            arrow_schema::DataType::Int32 => {
+                crate::metadata::DataType::Int(crate::metadata::IntType::new())
+            }
+            arrow_schema::DataType::List(f) => crate::metadata::DataType::Array(
+                crate::metadata::ArrayType::new(infer_fluss_type(f.data_type())),
+            ),
+            _ => crate::metadata::DataType::Int(crate::metadata::IntType::new()),
+        }
+    }
+
     fn single_column_row(array: ArrayRef) -> ColumnarRow {
+        let dt = infer_fluss_type(array.data_type());
         let batch =
             RecordBatch::try_from_iter(vec![("arr", array)]).expect("record batch with one column");
-        ColumnarRow::new(Arc::new(batch), 0, None)
+        let row_type = Arc::new(RowType::with_data_types(vec![dt]));
+        ColumnarRow::new(Arc::new(batch), row_type, 0, None)
     }
 
     #[test]
     fn columnar_row_reads_values() {
         let schema = Arc::new(Schema::new(vec![
-            Field::new("b", DataType::Boolean, false),
-            Field::new("i8", DataType::Int8, false),
-            Field::new("i16", DataType::Int16, false),
-            Field::new("i32", DataType::Int32, false),
-            Field::new("i64", DataType::Int64, false),
-            Field::new("f32", DataType::Float32, false),
-            Field::new("f64", DataType::Float64, false),
-            Field::new("s", DataType::Utf8, false),
-            Field::new("bin", DataType::Binary, false),
-            Field::new("char", DataType::Utf8, false),
+            Field::new("b", ArrowDataType::Boolean, false),
+            Field::new("i8", ArrowDataType::Int8, false),
+            Field::new("i16", ArrowDataType::Int16, false),
+            Field::new("i32", ArrowDataType::Int32, false),
+            Field::new("i64", ArrowDataType::Int64, false),
+            Field::new("f32", ArrowDataType::Float32, false),
+            Field::new("f64", ArrowDataType::Float64, false),
+            Field::new("s", ArrowDataType::Utf8, false),
+            Field::new("bin", ArrowDataType::Binary, false),
+            Field::new("char", ArrowDataType::Utf8, false),
         ]));
 
         let batch = RecordBatch::try_new(
-            schema,
+            schema.clone(),
             vec![
                 Arc::new(BooleanArray::from(vec![true])),
                 Arc::new(Int8Array::from(vec![1])),
@@ -1079,7 +1236,7 @@ mod tests {
         )
         .expect("record batch");
 
-        let mut row = ColumnarRow::new(Arc::new(batch), 0, None);
+        let mut row = ColumnarRow::new(Arc::new(batch), Arc::new(RowType::new(vec![])), 0, None);
         assert_eq!(row.get_field_count(), 10);
         assert!(row.get_boolean(0).unwrap());
         assert_eq!(row.get_byte(1).unwrap(), 1);
@@ -1097,14 +1254,13 @@ mod tests {
 
     #[test]
     fn columnar_row_reads_decimal() {
-        use arrow::datatypes::DataType;
         use bigdecimal::{BigDecimal, num_bigint::BigInt};
 
         // Test with Decimal128
         let schema = Arc::new(Schema::new(vec![
-            Field::new("dec1", DataType::Decimal128(10, 2), false),
-            Field::new("dec2", DataType::Decimal128(20, 5), false),
-            Field::new("dec3", DataType::Decimal128(38, 10), false),
+            Field::new("dec1", ArrowDataType::Decimal128(10, 2), false),
+            Field::new("dec2", ArrowDataType::Decimal128(20, 5), false),
+            Field::new("dec3", ArrowDataType::Decimal128(38, 10), false),
         ]));
 
         // Create decimal values: 123.45, 12345.67890, large decimal
@@ -1134,7 +1290,7 @@ mod tests {
         )
         .expect("record batch");
 
-        let row = ColumnarRow::new(Arc::new(batch), 0, None);
+        let row = ColumnarRow::new(Arc::new(batch), Arc::new(RowType::new(vec![])), 0, None);
         assert_eq!(row.get_field_count(), 3);
 
         // Verify decimal values
@@ -1228,7 +1384,7 @@ mod tests {
         let row = single_column_row(array);
         let err = row.get_array(0).unwrap_err();
         assert!(
-            err.to_string().contains("expected List array"),
+            err.to_string().contains("expected Array type"),
             "unexpected error: {err}"
         );
     }
@@ -1240,7 +1396,16 @@ mod tests {
         builder.append(true);
         let array = Arc::new(builder.finish()) as ArrayRef;
 
-        let row = single_column_row(array);
+        let batch = RecordBatch::try_from_iter(vec![("arr", array)]).expect("record batch");
+        // Manually build a row type declaring Array(Int) while the Arrow column is List(UInt32),
+        // so that the element-type validation in get_array is exercised.
+        let row_type = Arc::new(RowType::new(vec![DataField::new(
+            "arr",
+            crate::metadata::DataTypes::array(crate::metadata::DataTypes::int()),
+            None,
+        )]));
+        let row = ColumnarRow::new(Arc::new(batch), row_type, 0, None);
+
         let err = row.get_array(0).unwrap_err();
         assert!(
             err.to_string()
@@ -1276,7 +1441,7 @@ mod tests {
         ];
         let batch = make_struct_batch("nested", child_fields, child_arrays, 2);
 
-        let mut row = ColumnarRow::new(batch, 0, None);
+        let mut row = ColumnarRow::new(batch, Arc::new(RowType::new(vec![])), 0, None);
 
         // row_id = 0
         let nested = row.get_row(0).unwrap();
@@ -1322,7 +1487,7 @@ mod tests {
         let batch =
             Arc::new(RecordBatch::try_new(schema, vec![outer_array]).expect("record batch"));
 
-        let mut row = ColumnarRow::new(batch, 0, None);
+        let mut row = ColumnarRow::new(batch, Arc::new(RowType::new(vec![])), 0, None);
 
         // row_id = 0
         let outer = row.get_row(0).unwrap();
@@ -1344,7 +1509,7 @@ mod tests {
         let child_arrays: Vec<Arc<dyn Array>> = vec![Arc::new(Int32Array::from(vec![10, 20]))];
         let batch = make_struct_batch("s", child_fields, child_arrays, 2);
 
-        let mut row = ColumnarRow::new(batch, 0, None);
+        let mut row = ColumnarRow::new(batch, Arc::new(RowType::new(vec![])), 0, None);
 
         // row_id = 0: nested x = 10
         let nested_0 = row.get_row(0).unwrap();
diff --git a/fluss-rust/crates/fluss/src/row/column_writer.rs b/fluss-rust/crates/fluss/src/row/column_writer.rs
index d595df9191..bbd2876733 100644
--- a/fluss-rust/crates/fluss/src/row/column_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/column_writer.rs
@@ -123,6 +123,14 @@ enum TypedWriter {
         offsets: Vec<i32>,
         validity: Vec<bool>,
     },
+    Map {
+        key_writer: Box<ColumnWriter>,
+        value_writer: Box<ColumnWriter>,
+        key_type: DataType,
+        value_type: DataType,
+        offsets: Vec<i32>,
+        validity: Vec<bool>,
+    },
     Struct {
         field_writers: Vec<ColumnWriter>,
         validity: Vec<bool>,
@@ -162,6 +170,7 @@ macro_rules! with_builder {
             TypedWriter::TimestampLtzMicrosecond { builder: $b, .. } => $body,
             TypedWriter::TimestampLtzNanosecond { builder: $b, .. } => $body,
             TypedWriter::List { .. } => panic!("List variant not supported in with_builder!"),
+            TypedWriter::Map { .. } => panic!("Map variant not supported in with_builder!"),
             TypedWriter::Struct { .. } => panic!("Struct variant not supported in with_builder!"),
         }
     };
@@ -361,6 +370,50 @@ impl ColumnWriter {
                     validity: Vec::with_capacity(capacity),
                 }
             }
+            DataType::Map(m) => {
+                let (key_arrow_type, value_arrow_type) = match arrow_type {
+                    ArrowDataType::Map(field, _) => match field.data_type() {
+                        ArrowDataType::Struct(fields) => {
+                            if fields.len() != 2 {
+                                return Err(Error::IllegalArgument {
+                                    message: format!(
+                                        "Expected Struct with 2 fields for Map, got {}",
+                                        fields.len()
+                                    ),
+                                });
+                            }
+                            (fields[0].data_type().clone(), fields[1].data_type().clone())
+                        }
+                        struct_type => {
+                            return Err(Error::IllegalArgument {
+                                message: format!(
+                                    "Expected Struct within Map Arrow type, got {:?}",
+                                    struct_type
+                                ),
+                            });
+                        }
+                    },
+                    _ => {
+                        return Err(Error::IllegalArgument {
+                            message: format!(
+                                "Expected Map Arrow type for Map, got: {arrow_type:?}"
+                            ),
+                        });
+                    }
+                };
+
+                let key_writer = ColumnWriter::create(m.key_type(), &key_arrow_type, 0, capacity)?;
+                let value_writer =
+                    ColumnWriter::create(m.value_type(), &value_arrow_type, 1, capacity)?;
+                TypedWriter::Map {
+                    key_writer: Box::new(key_writer),
+                    value_writer: Box::new(value_writer),
+                    key_type: m.key_type().clone(),
+                    value_type: m.value_type().clone(),
+                    offsets: vec![0],
+                    validity: Vec::with_capacity(capacity),
+                }
+            }
             DataType::Row(row_type) => {
                 let arrow_fields = match arrow_type {
                     ArrowDataType::Struct(fields) => fields.clone(),
@@ -394,11 +447,6 @@ impl ColumnWriter {
                     row_type: row_type.clone(),
                 }
             }
-            _ => {
-                return Err(Error::IllegalArgument {
-                    message: format!("Unsupported Fluss DataType: {fluss_type:?}"),
-                });
-            }
         };
 
         Ok(Self {
@@ -440,6 +488,26 @@ impl ColumnWriter {
                 let taken_validity = std::mem::take(validity);
                 finish_list_array(values, item_nullable, &taken_offsets, &taken_validity)
             }
+            TypedWriter::Map {
+                key_writer,
+                value_writer,
+                offsets,
+                validity,
+                ..
+            } => {
+                let value_nullable = value_writer.nullable;
+                let keys = key_writer.finish();
+                let values = value_writer.finish();
+                let taken_offsets = std::mem::replace(offsets, vec![0]);
+                let taken_validity = std::mem::take(validity);
+                finish_map_array(
+                    keys,
+                    values,
+                    value_nullable,
+                    &taken_offsets,
+                    &taken_validity,
+                )
+            }
             TypedWriter::Struct {
                 field_writers,
                 validity,
@@ -527,6 +595,20 @@ impl ColumnWriter {
                 let offsets_bytes = round_up_to_8(offsets.len() * std::mem::size_of::<i32>());
                 validity_bytes + offsets_bytes + element_writer.buffer_size()
             }
+            TypedWriter::Map {
+                key_writer,
+                value_writer,
+                offsets,
+                validity,
+                ..
+            } => {
+                let validity_bytes = round_up_to_8(validity.len().div_ceil(8));
+                let offsets_bytes = round_up_to_8(offsets.len() * std::mem::size_of::<i32>());
+                validity_bytes
+                    + offsets_bytes
+                    + key_writer.buffer_size()
+                    + value_writer.buffer_size()
+            }
             TypedWriter::Struct {
                 field_writers,
                 validity,
@@ -543,6 +625,9 @@ impl ColumnWriter {
         match &mut self.inner {
             TypedWriter::List {
                 offsets, validity, ..
+            }
+            | TypedWriter::Map {
+                offsets, validity, ..
             } => {
                 let last = *offsets.last().unwrap_or(&0);
                 offsets.push(last);
@@ -783,6 +868,30 @@ impl ColumnWriter {
                 validity.push(true);
                 Ok(())
             }
+            TypedWriter::Map {
+                key_writer,
+                value_writer,
+                key_type,
+                value_type,
+                offsets,
+                validity,
+            } => {
+                let map = row.get_map(pos, key_type, value_type)?;
+                let key_array = map.key_array();
+                let value_array = map.value_array();
+                for i in 0..map.size() {
+                    key_writer.write_field_at(key_array, i)?;
+                    value_writer.write_field_at(value_array, i)?;
+                }
+                let last = *offsets.last().unwrap();
+                offsets.push(
+                    last + i32::try_from(map.size()).map_err(|_| RowConvertError {
+                        message: format!("Map size {} exceeds i32 range", map.size()),
+                    })?,
+                );
+                validity.push(true);
+                Ok(())
+            }
             TypedWriter::Struct {
                 field_writers,
                 validity,
@@ -844,12 +953,52 @@ fn finish_list_array(
     ))
 }
 
+fn finish_map_array(
+    keys: ArrayRef,
+    values: ArrayRef,
+    value_nullable: bool,
+    offsets: &[i32],
+    validity: &[bool],
+) -> ArrayRef {
+    use arrow::array::{Array, MapArray, StructArray};
+    use arrow::buffer::{NullBuffer, OffsetBuffer, ScalarBuffer};
+    use arrow::datatypes::Field;
+    use std::sync::Arc;
+
+    let offsets_buffer = OffsetBuffer::new(ScalarBuffer::from(offsets.to_vec()));
+    let null_buffer = NullBuffer::from(validity.to_vec());
+
+    let key_field = Arc::new(Field::new("key", keys.data_type().clone(), false));
+    let value_field = Arc::new(Field::new(
+        "value",
+        values.data_type().clone(),
+        value_nullable,
+    ));
+
+    let struct_array = StructArray::from(vec![(key_field, keys), (value_field, values)]);
+
+    let entries_field = Arc::new(Field::new(
+        "entries",
+        struct_array.data_type().clone(),
+        false,
+    ));
+
+    Arc::new(MapArray::new(
+        entries_field,
+        offsets_buffer,
+        struct_array,
+        Some(null_buffer),
+        false,
+    ))
+}
+
 #[cfg(test)]
 mod tests {
     use super::*;
     use crate::metadata::DataTypes;
     use crate::record::to_arrow_type;
     use crate::row::binary_array::FlussArrayWriter;
+    use crate::row::binary_map::FlussMapWriter;
     use crate::row::{Date, Datum, Decimal, GenericRow, Time, TimestampLtz, TimestampNtz};
     use arrow::array::*;
     use bigdecimal::BigDecimal;
@@ -1116,4 +1265,56 @@ mod tests {
             "Arrow field inside the list should be non-nullable"
         );
     }
+
+    #[test]
+    fn test_write_map_type() {
+        use crate::metadata::DataTypes;
+        let key_type = DataTypes::int();
+        let value_type = DataTypes::string();
+        let fluss_type = DataTypes::map(key_type.clone(), value_type.clone());
+
+        let mut map_writer = FlussMapWriter::new(2, &key_type, &value_type);
+        map_writer.write_entry(1.into(), "a".into()).unwrap();
+        map_writer.write_entry(2.into(), "b".into()).unwrap();
+        let map = map_writer.complete().unwrap();
+
+        let arr = write_one(&fluss_type, Datum::Map(map));
+        let map_arr = arr.as_any().downcast_ref::<MapArray>().unwrap();
+        assert_eq!(map_arr.len(), 1);
+
+        let entries = map_arr.value(0);
+        let struct_arr = entries.as_any().downcast_ref::<StructArray>().unwrap();
+        assert_eq!(struct_arr.num_columns(), 2);
+
+        let keys = struct_arr
+            .column(0)
+            .as_any()
+            .downcast_ref::<Int32Array>()
+            .unwrap();
+        let values = struct_arr
+            .column(1)
+            .as_any()
+            .downcast_ref::<StringArray>()
+            .unwrap();
+
+        assert_eq!(keys.len(), 2);
+        assert_eq!(keys.value(0), 1);
+        assert_eq!(keys.value(1), 2);
+
+        assert_eq!(values.len(), 2);
+        assert_eq!(values.value(0), "a");
+        assert_eq!(values.value(1), "b");
+    }
+
+    #[test]
+    fn test_write_null_map_type() {
+        use crate::metadata::DataTypes;
+
+        let fluss_type = DataTypes::map(DataTypes::int(), DataTypes::string());
+        let arr = write_one(&fluss_type, Datum::Null);
+        let map_arr = arr.as_any().downcast_ref::<MapArray>().unwrap();
+
+        assert_eq!(map_arr.len(), 1);
+        assert!(map_arr.is_null(0));
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
index 9e0ffa5391..d5f7c2f1d8 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_key_writer.rs
@@ -23,6 +23,8 @@ use crate::error::Result;
 use crate::metadata::DataType;
 use crate::row::Decimal;
 use crate::row::binary::{BinaryRowFormat, BinaryWriter, ValueWriter};
+use crate::row::binary_array::FlussArray;
+use crate::row::binary_map::FlussMap;
 use crate::row::datum::{TimestampLtz, TimestampNtz};
 use delegate::delegate;
 
@@ -109,7 +111,9 @@ impl BinaryWriter for CompactedKeyWriter {
 
             fn write_timestamp_ltz(&mut self, value: &TimestampLtz, precision: u32);
 
-            fn write_array(&mut self, value: &[u8]);
+            fn write_array(&mut self, value: &FlussArray);
+
+            fn write_map(&mut self, value: &FlussMap);
         }
     }
 
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index fbf47c58b7..2463e47951 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -18,10 +18,12 @@
 use crate::client::WriteFormat;
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::RowType;
+use crate::metadata::{DataType, RowType};
+use crate::row::binary_array::FlussArray;
+use crate::row::binary_map::FlussMap;
 use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
-use crate::row::{Decimal, FlussArray, GenericRow, InternalRow};
+use crate::row::{Decimal, GenericRow, InternalRow};
 use std::sync::{Arc, OnceLock};
 
 pub fn calculate_bit_set_width_in_bytes(arity: usize) -> usize {
@@ -172,6 +174,10 @@ impl<'a> InternalRow for CompactedRow<'a> {
         self.decoded_row()?.get_array(pos)
     }
 
+    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
+        self.decoded_row()?.get_map(pos, key_type, value_type)
+    }
+
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
         self.decoded_row()?.get_row(pos)
     }
@@ -188,14 +194,17 @@ impl<'a> InternalRow for CompactedRow<'a> {
 #[cfg(test)]
 mod tests {
     use super::*;
-    use crate::metadata::{
-        BigIntType, BooleanType, BytesType, DataType, DataTypes, DecimalType, DoubleType,
-        FloatType, IntType, SmallIntType, StringType, TimestampLTzType, TimestampType, TinyIntType,
-    };
+    use crate::metadata::DataTypes;
     use crate::row::binary::BinaryWriter;
     use crate::row::binary_array::FlussArrayWriter;
+    use crate::row::binary_map::FlussMapWriter;
+
+    use crate::metadata::{
+        BigIntType, BooleanType, BytesType, DataType, DoubleType, FloatType, IntType, SmallIntType,
+        StringType, TinyIntType,
+    };
+    use crate::row::Datum;
     use crate::row::compacted::compacted_row_writer::CompactedRowWriter;
-    use crate::row::datum::{TimestampLtz, TimestampNtz};
 
     #[test]
     fn test_compacted_row() {
@@ -265,6 +274,9 @@ mod tests {
     #[test]
     fn test_compacted_row_temporal_and_decimal_types() {
         // Comprehensive test covering DATE, TIME, TIMESTAMP (compact/non-compact), and DECIMAL (compact/non-compact)
+        use crate::metadata::{DecimalType, TimestampLTzType, TimestampType};
+        use crate::row::Decimal;
+        use crate::row::datum::{TimestampLtz, TimestampNtz};
         use bigdecimal::{BigDecimal, num_bigint::BigInt};
 
         let row_type = RowType::with_data_types(vec![
@@ -356,7 +368,7 @@ mod tests {
         arr_writer.write_int(1, 2);
         arr_writer.write_int(2, 3);
         let arr = arr_writer.complete().unwrap();
-        writer.write_array(arr.as_bytes());
+        writer.write_array(&arr);
 
         let bytes = writer.to_bytes();
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
@@ -381,7 +393,7 @@ mod tests {
         arr_writer.write_string(1, "fluss");
         arr_writer.write_string(2, "rust");
         let arr = arr_writer.complete().unwrap();
-        writer.write_array(arr.as_bytes());
+        writer.write_array(&arr);
 
         let bytes = writer.to_bytes();
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
@@ -405,7 +417,7 @@ mod tests {
         arr_writer.set_null_at(1);
         arr_writer.write_int(2, 30);
         let arr = arr_writer.complete().unwrap();
-        writer.write_array(arr.as_bytes());
+        writer.write_array(&arr);
 
         let bytes = writer.to_bytes();
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
@@ -428,7 +440,7 @@ mod tests {
         let elem_type = DataTypes::int();
         let arr_writer = FlussArrayWriter::new(0, &elem_type);
         let arr = arr_writer.complete().unwrap();
-        writer.write_array(arr.as_bytes());
+        writer.write_array(&arr);
 
         let bytes = writer.to_bytes();
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
@@ -462,7 +474,7 @@ mod tests {
         outer_writer.write_array(1, &inner2_arr);
         let outer_arr = outer_writer.complete().unwrap();
 
-        writer.write_array(outer_arr.as_bytes());
+        writer.write_array(&outer_arr);
 
         let bytes = writer.to_bytes();
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
@@ -479,4 +491,140 @@ mod tests {
         assert_eq!(nested2.size(), 1);
         assert_eq!(nested2.get_int(0).unwrap(), 99);
     }
+
+    #[test]
+    fn test_compacted_row_map() {
+        let row_type =
+            RowType::with_data_types(vec![DataTypes::map(DataTypes::int(), DataTypes::string())]);
+
+        let mut writer = CompactedRowWriter::new(row_type.fields().len());
+        // Build the MAP<INT, STRING> value {1: "a", 2: "b"} and write it as the row's only column.
+        let mut map_writer = FlussMapWriter::new(2, &DataTypes::int(), &DataTypes::string());
+        map_writer.write_entry(1.into(), "a".into()).unwrap();
+        map_writer.write_entry(2.into(), "b".into()).unwrap();
+        let map = map_writer.complete().unwrap();
+        writer.write_map(&map);
+
+        let bytes = writer.to_bytes();
+        let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
+        // Read the map back from column 0; only the first entry's key and value are asserted.
+        let read_map = row
+            .get_map(0, &DataTypes::int(), &DataTypes::string())
+            .unwrap();
+        assert_eq!(read_map.size(), 2);
+        assert_eq!(read_map.key_array().get_int(0).unwrap(), 1);
+        assert_eq!(read_map.value_array().get_string(0).unwrap(), "a");
+    }
+
+    #[test]
+    fn test_compacted_row_map_with_nulls() {
+        // Schema: column 0 is an INT, column 1 is a nullable MAP<INT, STRING>.
+        let row_type = RowType::with_data_types(vec![
+            DataTypes::int(),
+            DataTypes::map(DataTypes::int(), DataTypes::string()),
+        ]);
+
+        // Case 1: column 1 is marked null, so only the INT value is written.
+        let mut writer = CompactedRowWriter::new(row_type.fields().len());
+        writer.write_int(42);
+        writer.set_null_at(1);
+        writer.complete();
+
+        let bytes = writer.to_bytes();
+        let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
+
+        assert_eq!(row.get_int(0).unwrap(), 42);
+        assert!(row.is_null_at(1).unwrap());
+
+        // Case 2: reset and reuse the same writer for a row whose map is {7: "hello"}.
+        writer.reset();
+        writer.write_int(99);
+        let mut map_writer = FlussMapWriter::new(1, &DataTypes::int(), &DataTypes::string());
+        map_writer.write_entry(7.into(), "hello".into()).unwrap();
+        let map = map_writer.complete().unwrap();
+        writer.write_map(&map);
+        writer.complete();
+
+        let bytes2 = writer.to_bytes();
+        let row2 = CompactedRow::from_bytes(&row_type, bytes2.as_ref());
+        assert_eq!(row2.get_int(0).unwrap(), 99);
+        assert!(!row2.is_null_at(1).unwrap());
+        let read_map = row2
+            .get_map(1, &DataTypes::int(), &DataTypes::string())
+            .unwrap();
+        assert_eq!(read_map.size(), 1);
+        assert_eq!(read_map.key_array().get_int(0).unwrap(), 7);
+        assert_eq!(read_map.value_array().get_string(0).unwrap(), "hello");
+    }
+
+    #[test]
+    fn test_compacted_row_nested_map() {
+        // Single column of type MAP<STRING, ARRAY<INT>>: the map values are themselves arrays.
+        let row_type = RowType::with_data_types(vec![DataTypes::map(
+            DataTypes::string(),
+            DataTypes::array(DataTypes::int()),
+        )]);
+
+        let mut writer = CompactedRowWriter::new(row_type.fields().len());
+
+        // Build the two ARRAY<INT> map values up front: [1, 2] and [3].
+        let inner_type = DataTypes::int();
+        let mut inner1 = FlussArrayWriter::new(2, &inner_type);
+        inner1.write_int(0, 1);
+        inner1.write_int(1, 2);
+        let inner1_arr = inner1.complete().unwrap();
+
+        let mut inner2 = FlussArrayWriter::new(1, &inner_type);
+        inner2.write_int(0, 3);
+        let inner2_arr = inner2.complete().unwrap();
+
+        let array_type = DataTypes::array(DataTypes::int());
+
+        let mut map_writer = FlussMapWriter::new(2, &DataTypes::string(), &array_type);
+        map_writer
+            .write_entry("a".into(), Datum::Array(inner1_arr))
+            .unwrap();
+        map_writer
+            .write_entry("b".into(), Datum::Array(inner2_arr))
+            .unwrap();
+        let map = map_writer.complete().unwrap();
+        writer.write_map(&map);
+
+        let bytes = writer.to_bytes();
+        let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
+        // Read the map back and check both keys and every element of both nested arrays.
+        let read_map = row.get_map(0, &DataTypes::string(), &array_type).unwrap();
+        assert_eq!(read_map.size(), 2);
+        assert_eq!(read_map.key_array().get_string(0).unwrap(), "a");
+        assert_eq!(read_map.key_array().get_string(1).unwrap(), "b");
+
+        let nested1 = read_map.value_array().get_array(0).unwrap();
+        assert_eq!(nested1.size(), 2);
+        assert_eq!(nested1.get_int(0).unwrap(), 1);
+        assert_eq!(nested1.get_int(1).unwrap(), 2);
+
+        let nested2 = read_map.value_array().get_array(1).unwrap();
+        assert_eq!(nested2.size(), 1);
+        assert_eq!(nested2.get_int(0).unwrap(), 3);
+    }
+
+    #[test]
+    fn test_compacted_row_empty_map() {
+        let row_type =
+            RowType::with_data_types(vec![DataTypes::map(DataTypes::int(), DataTypes::string())]);
+
+        let mut writer = CompactedRowWriter::new(row_type.fields().len());
+        // Complete the map writer without writing any entry, so the stored map is empty.
+        let map_writer = FlussMapWriter::new(0, &DataTypes::int(), &DataTypes::string());
+        let map = map_writer.complete().unwrap();
+        writer.write_map(&map);
+
+        let bytes = writer.to_bytes();
+        let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
+        // An empty map must still be readable from the row (it is not null) and report size 0.
+        let read_map = row
+            .get_map(0, &DataTypes::int(), &DataTypes::string())
+            .unwrap();
+        assert_eq!(read_map.size(), 0);
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
index efcb39f2ed..3f2eb65352 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_reader.rs
@@ -213,12 +213,14 @@ impl<'a> CompactedRowDeserializer<'a> {
                     let nested_row = nested_deser.deserialize(&nested_reader)?;
                     (Datum::Row(Box::new(nested_row)), next)
                 }
-                _ => {
-                    return Err(IllegalArgument {
-                        message: format!(
-                            "Unsupported DataType in CompactedRowDeserializer: {dtype:?}"
-                        ),
-                    });
+                DataType::Map(map_type) => {
+                    let (bytes, next) = reader.read_bytes(cursor)?;
+                    let map = crate::row::binary_map::FlussMap::from_bytes(
+                        bytes,
+                        map_type.key_type(),
+                        map_type.value_type(),
+                    )?;
+                    (Datum::Map(map), next)
                 }
             };
             cursor = next_cursor;
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
index 3627174315..2af8767f0c 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row_writer.rs
@@ -17,6 +17,8 @@
 
 use crate::row::Decimal;
 use crate::row::binary::BinaryWriter;
+use crate::row::binary_array::FlussArray;
+use crate::row::binary_map::FlussMap;
 use crate::row::compacted::compacted_row::calculate_bit_set_width_in_bytes;
 use crate::util::varint::{write_unsigned_varint_to_slice, write_unsigned_varint_u64_to_slice};
 use bytes::{Bytes, BytesMut};
@@ -165,8 +167,12 @@ impl BinaryWriter for CompactedRowWriter {
         self.write_bytes(&bytes[..length.min(bytes.len())])
     }
 
-    fn write_array(&mut self, value: &[u8]) {
-        self.write_bytes(value)
+    fn write_array(&mut self, value: &FlussArray) {
+        self.write_bytes(value.as_bytes())
+    }
+
+    fn write_map(&mut self, value: &FlussMap) {
+        self.write_bytes(value.as_bytes())
     }
 
     fn complete(&mut self) {
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index d3f19a1e60..b1595b311e 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -22,11 +22,12 @@ use crate::row::Decimal;
 use crate::row::GenericRow;
 use crate::row::InternalRow;
 use crate::row::binary_array::FlussArray;
+use crate::row::binary_map::FlussMap;
 use crate::row::field_getter::FieldGetter;
 use arrow::array::{
     ArrayBuilder, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
     FixedSizeBinaryBuilder, Float32Builder, Float64Builder, Int8Builder, Int16Builder,
-    Int32Builder, Int64Builder, ListBuilder, StringBuilder, StructBuilder,
+    Int32Builder, Int64Builder, ListBuilder, MapBuilder, StringBuilder, StructBuilder,
     Time32MillisecondBuilder, Time32SecondBuilder, Time64MicrosecondBuilder,
     Time64NanosecondBuilder, TimestampMicrosecondBuilder, TimestampMillisecondBuilder,
     TimestampNanosecondBuilder, TimestampSecondBuilder,
@@ -76,6 +77,8 @@ pub enum Datum<'a> {
     TimestampLtz(TimestampLtz),
     #[display("{0}")]
     Array(FlussArray),
+    #[display("{0}")]
+    Map(FlussMap),
     #[display("{0:?}")]
     Row(Box<GenericRow<'a>>),
 }
@@ -141,6 +144,17 @@ impl Datum<'_> {
         }
     }
 
+    pub fn is_map(&self) -> bool {
+        matches!(self, Datum::Map(_))
+    }
+
+    pub fn as_map(&self) -> &FlussMap {
+        match self {
+            Self::Map(m) => m,
+            _ => panic!("not a map: {self:?}"), // every non-Map variant panics; guard with is_map()
+        }
+    }
+
     pub fn as_row(&self) -> &GenericRow<'_> {
         match self {
             Self::Row(r) => r.as_ref(),
@@ -168,6 +182,7 @@ impl<'a> Datum<'a> {
             Datum::TimestampNtz(t) => Datum::TimestampNtz(t),
             Datum::TimestampLtz(t) => Datum::TimestampLtz(t),
             Datum::Array(a) => Datum::Array(a),
+            Datum::Map(m) => Datum::Map(m),
             Datum::Row(boxed) => Datum::Row(Box::new(boxed.into_owned())),
         }
     }
@@ -443,11 +458,19 @@ impl<'a> From<FlussArray> for Datum<'a> {
     }
 }
 
+impl<'a> From<FlussMap> for Datum<'a> {
+    #[inline]
+    fn from(map: FlussMap) -> Datum<'a> {
+        Datum::Map(map)
+    }
+}
+
 pub trait ToArrow {
     fn append_to(
         &self,
         builder: &mut dyn ArrayBuilder,
-        data_type: &arrow_schema::DataType,
+        fluss_type: &crate::metadata::DataType,
+        arrow_type: &arrow_schema::DataType,
     ) -> Result<()>;
 }
 
@@ -552,10 +575,9 @@ impl AppendResult for std::result::Result<(), ArrowError> {
 fn append_fluss_array_to_list_builder(
     arr: &FlussArray,
     builder: &mut dyn ArrayBuilder,
-    data_type: &arrow_schema::DataType,
+    fluss_type: &crate::metadata::DataType,
+    arrow_type: &arrow_schema::DataType,
 ) -> Result<()> {
-    use crate::record::from_arrow_type;
-
     let list_builder = builder
         .as_any_mut()
         .downcast_mut::<ListBuilder<Box<dyn ArrayBuilder>>>()
@@ -563,34 +585,106 @@ fn append_fluss_array_to_list_builder(
             message: "Builder type mismatch for Array: expected ListBuilder".to_string(),
         })?;
 
-    let element_arrow_type = match data_type {
+    let element_fluss_type = match fluss_type {
+        crate::metadata::DataType::Array(a) => a.get_element_type(),
+        _ => {
+            return Err(RowConvertError {
+                message: format!("Expected Array Fluss type for Array datum, got: {fluss_type:?}"),
+            });
+        }
+    };
+
+    let element_arrow_type = match arrow_type {
         arrow_schema::DataType::List(field) => field.data_type().clone(),
         _ => {
             return Err(RowConvertError {
-                message: format!("Expected List Arrow type for Array datum, got: {data_type:?}"),
+                message: format!("Expected List Arrow type for Array datum, got: {arrow_type:?}"),
             });
         }
     };
 
-    let element_fluss_type = from_arrow_type(&element_arrow_type)?;
     let values_builder = list_builder.values();
 
     for i in 0..arr.size() {
         if arr.is_null_at(i) {
             append_null_for_type(values_builder, &element_arrow_type)?;
         } else {
-            let datum = read_datum_from_fluss_array(arr, i, &element_fluss_type)?;
-            datum.append_to(values_builder, &element_arrow_type)?;
+            let datum = read_datum_from_fluss_array(arr, i, element_fluss_type)?;
+            datum.append_to(values_builder, element_fluss_type, &element_arrow_type)?;
         }
     }
     list_builder.append(true);
     Ok(())
 }
 
+fn append_fluss_map_to_map_builder(
+    map: &crate::row::FlussMap,
+    builder: &mut dyn ArrayBuilder,
+    fluss_type: &crate::metadata::DataType,
+    arrow_type: &arrow_schema::DataType,
+) -> Result<()> {
+    let map_builder = builder
+        .as_any_mut()
+        .downcast_mut::<MapBuilder<Box<dyn ArrayBuilder>, Box<dyn ArrayBuilder>>>()
+        .ok_or_else(|| RowConvertError {
+            message: "Builder type mismatch for Map: expected MapBuilder".to_string(),
+        })?;
+    // The Fluss type must itself be a Map: the key/value Fluss types are taken from it below.
+    let expected_map_type = match fluss_type {
+        crate::metadata::DataType::Map(m) => m,
+        _ => {
+            return Err(RowConvertError {
+                message: format!("Expected Map Fluss type for Map datum, got: {fluss_type:?}"),
+            });
+        }
+    };
+    // The Arrow Map type wraps a 2-field Struct: field 0 gives the key type, field 1 the value type.
+    let (key_arrow_type, value_arrow_type) = match arrow_type {
+        arrow_schema::DataType::Map(entries_field, _) => match entries_field.data_type() {
+            arrow_schema::DataType::Struct(fields) if fields.len() == 2 => {
+                (fields[0].data_type().clone(), fields[1].data_type().clone())
+            }
+            other => {
+                return Err(RowConvertError {
+                    message: format!(
+                        "Expected Struct with 2 fields for Map entries, got: {other:?}"
+                    ),
+                });
+            }
+        },
+        _ => {
+            return Err(RowConvertError {
+                message: format!("Expected Map Arrow type for Map datum, got: {arrow_type:?}"),
+            });
+        }
+    };
+
+    let key_fluss_type = expected_map_type.key_type();
+    let value_fluss_type = expected_map_type.value_type();
+    let key_array = map.key_array();
+    let value_array = map.value_array();
+    // Append entry by entry: keys are read without a null check, only the values are null-checked.
+    for i in 0..map.size() {
+        let key_datum = read_datum_from_fluss_array(key_array, i, key_fluss_type)?;
+        key_datum.append_to(map_builder.keys(), key_fluss_type, &key_arrow_type)?;
+
+        if value_array.is_null_at(i) {
+            append_null_for_type(map_builder.values(), &value_arrow_type)?;
+        } else {
+            let val_datum = read_datum_from_fluss_array(value_array, i, value_fluss_type)?;
+            val_datum.append_to(map_builder.values(), value_fluss_type, &value_arrow_type)?;
+        }
+    }
+    map_builder.append(true).map_err(|e| RowConvertError {
+        message: format!("Failed to append Map entries: {e}"),
+    })?;
+    Ok(())
+}
+
 fn read_datum_from_fluss_array<'a>(
     arr: &FlussArray,
     pos: usize,
-    element_type: &DataType,
+    element_type: &crate::metadata::DataType,
 ) -> Result<Datum<'a>> {
     if let DataType::Row(row_type) = element_type {
         let compacted = arr.get_row(pos, row_type)?;
@@ -675,6 +769,20 @@ fn append_null_for_type(
         arrow_schema::DataType::List(_) => {
             downcast_null!(ListBuilder<Box<dyn ArrayBuilder>>)
         }
+        arrow_schema::DataType::Map(_, _) => {
+            let b = builder
+                .as_any_mut()
+                .downcast_mut::<MapBuilder<Box<dyn ArrayBuilder>, Box<dyn ArrayBuilder>>>()
+                .ok_or_else(|| RowConvertError {
+                    message: format!(
+                        "Builder type mismatch: expected MapBuilder for {data_type:?}",
+                    ),
+                })?;
+            b.append(false).map_err(|e| RowConvertError {
+                message: format!("Failed to append null Map entries: {e}"),
+            })?;
+            Ok(())
+        }
         arrow_schema::DataType::Struct(fields) => {
             // StructBuilder::append_null only flips parent validity; children must each get a null too.
             let struct_builder = builder
@@ -704,7 +812,8 @@ fn append_null_for_type(
 fn append_generic_row_to_struct_builder(
     row: &GenericRow<'_>,
     builder: &mut dyn ArrayBuilder,
-    data_type: &arrow_schema::DataType,
+    fluss_type: &crate::metadata::DataType,
+    arrow_type: &arrow_schema::DataType,
 ) -> Result<()> {
     let struct_builder = builder
         .as_any_mut()
@@ -713,11 +822,20 @@ fn append_generic_row_to_struct_builder(
             message: "Builder type mismatch for Row: expected StructBuilder".to_string(),
         })?;
 
-    let fields = match data_type {
+    let row_type = match fluss_type {
+        crate::metadata::DataType::Row(rt) => rt,
+        _ => {
+            return Err(RowConvertError {
+                message: format!("Expected Row Fluss type for Row datum, got: {fluss_type:?}"),
+            });
+        }
+    };
+
+    let fields = match arrow_type {
         arrow_schema::DataType::Struct(fields) => fields.clone(),
         _ => {
             return Err(RowConvertError {
-                message: format!("Expected Struct Arrow type for Row datum, got: {data_type:?}"),
+                message: format!("Expected Struct Arrow type for Row datum, got: {arrow_type:?}"),
             });
         }
     };
@@ -736,7 +854,8 @@ fn append_generic_row_to_struct_builder(
         let field_builders = struct_builder.field_builders_mut();
         for (i, datum) in row.values.iter().enumerate() {
             let child = field_builders[i].as_mut();
-            datum.append_to(child, fields[i].data_type())?;
+            let child_fluss_type = row_type.fields()[i].data_type();
+            datum.append_to(child, child_fluss_type, fields[i].data_type())?;
         }
     }
     struct_builder.append(true);
@@ -747,7 +866,8 @@ impl Datum<'_> {
     pub fn append_to(
         &self,
         builder: &mut dyn ArrayBuilder,
-        data_type: &arrow_schema::DataType,
+        fluss_type: &crate::metadata::DataType,
+        arrow_type: &arrow_schema::DataType,
     ) -> Result<()> {
         macro_rules! append_value_to_arrow {
             ($builder_type:ty, $value:expr) => {
@@ -759,7 +879,7 @@ impl Datum<'_> {
         }
 
         match self {
-            Datum::Null => return append_null_for_type(builder, data_type),
+            Datum::Null => return append_null_for_type(builder, arrow_type),
             Datum::Bool(v) => append_value_to_arrow!(BooleanBuilder, *v),
             Datum::Int8(v) => append_value_to_arrow!(Int8Builder, *v),
             Datum::Int16(v) => append_value_to_arrow!(Int16Builder, *v),
@@ -768,7 +888,7 @@ impl Datum<'_> {
             Datum::Float32(v) => append_value_to_arrow!(Float32Builder, v.into_inner()),
             Datum::Float64(v) => append_value_to_arrow!(Float64Builder, v.into_inner()),
             Datum::String(v) => append_value_to_arrow!(StringBuilder, v.as_ref()),
-            Datum::Blob(v) => match data_type {
+            Datum::Blob(v) => match arrow_type {
                 arrow_schema::DataType::Binary => {
                     append_value_to_arrow!(BinaryBuilder, v.as_ref());
                 }
@@ -778,18 +898,18 @@ impl Datum<'_> {
                 _ => {
                     return Err(RowConvertError {
                         message: format!(
-                            "Expected Binary or FixedSizeBinary Arrow type, got: {data_type:?}"
+                            "Expected Binary or FixedSizeBinary Arrow type, got: {arrow_type:?}"
                         ),
                     });
                 }
             },
             Datum::Decimal(decimal) => {
                 // Extract target precision and scale from Arrow schema
-                let (p, s) = match data_type {
+                let (p, s) = match arrow_type {
                     arrow_schema::DataType::Decimal128(p, s) => (*p, *s),
                     _ => {
                         return Err(RowConvertError {
-                            message: format!("Expected Decimal128 Arrow type, got: {data_type:?}"),
+                            message: format!("Expected Decimal128 Arrow type, got: {arrow_type:?}"),
                         });
                     }
                 };
@@ -817,7 +937,7 @@ impl Datum<'_> {
                 // Convert to Arrow's time unit based on schema
                 let millis = time.get_inner();
 
-                match data_type {
+                match arrow_type {
                     arrow_schema::DataType::Time32(arrow_schema::TimeUnit::Second) => {
                         if let Some(b) = builder.as_any_mut().downcast_mut::<Time32SecondBuilder>()
                         {
@@ -877,7 +997,7 @@ impl Datum<'_> {
                     _ => {
                         return Err(RowConvertError {
                             message: format!(
-                                "Expected Time32/Time64 Arrow type, got: {data_type:?}"
+                                "Expected Time32/Time64 Arrow type, got: {arrow_type:?}"
                             ),
                         });
                     }
@@ -962,10 +1082,13 @@ impl Datum<'_> {
                 });
             }
             Datum::Array(arr) => {
-                return append_fluss_array_to_list_builder(arr, builder, data_type);
+                return append_fluss_array_to_list_builder(arr, builder, fluss_type, arrow_type);
+            }
+            Datum::Map(map) => {
+                return append_fluss_map_to_map_builder(map, builder, fluss_type, arrow_type);
             }
             Datum::Row(row) => {
-                return append_generic_row_to_struct_builder(row, builder, data_type);
+                return append_generic_row_to_struct_builder(row, builder, fluss_type, arrow_type);
             }
         }
 
@@ -985,7 +1108,8 @@ macro_rules! impl_to_arrow {
             fn append_to(
                 &self,
                 builder: &mut dyn ArrayBuilder,
-                _data_type: &arrow_schema::DataType,
+                _fluss_type: &crate::metadata::DataType,
+                _arrow_type: &arrow_schema::DataType,
             ) -> Result<()> {
                 if let Some(b) = builder.as_any_mut().downcast_mut::<$variant>() {
                     b.append_value(*self);
@@ -1208,20 +1332,23 @@ mod tests {
 
     #[test]
     fn datum_append_to_builder() {
+        use crate::metadata::DataTypes;
         let mut builder = Int32Builder::new();
+        let int_type = DataTypes::int();
         Datum::Null
-            .append_to(&mut builder, &arrow_schema::DataType::Int32)
+            .append_to(&mut builder, &int_type, &arrow_schema::DataType::Int32)
             .unwrap();
         Datum::Int32(5)
-            .append_to(&mut builder, &arrow_schema::DataType::Int32)
+            .append_to(&mut builder, &int_type, &arrow_schema::DataType::Int32)
             .unwrap();
         let array = builder.finish();
         assert!(array.is_null(0));
         assert_eq!(array.value(1), 5);
 
         let mut builder = StringBuilder::new();
+        let string_type = DataTypes::string();
         let err = Datum::Int32(1)
-            .append_to(&mut builder, &arrow_schema::DataType::Utf8)
+            .append_to(&mut builder, &string_type, &arrow_schema::DataType::Utf8)
             .unwrap_err();
         assert!(matches!(err, RowConvertError { .. }));
     }
@@ -1246,6 +1373,94 @@ mod tests {
         assert_eq!(date.month(), 1);
         assert_eq!(date.day(), 1);
     }
+    #[test]
+    fn test_datum_map_appends_to_arrow() {
+        use crate::metadata::DataTypes;
+        use crate::row::binary_map::FlussMapWriter;
+        use arrow::array::MapBuilder;
+        use std::sync::Arc;
+        // Fluss map {99: "arrow_test"} with INT keys and STRING values.
+        let mut writer = FlussMapWriter::new(1, &DataTypes::int(), &DataTypes::string());
+        writer.write_entry(99.into(), "arrow_test".into()).unwrap();
+        let map = writer.complete().unwrap();
+        // Arrow type: Map over an "entries" Struct of (key: Int32, non-null; value: Utf8, nullable).
+        let arrow_type = arrow_schema::DataType::Map(
+            Arc::new(arrow_schema::Field::new(
+                "entries",
+                arrow_schema::DataType::Struct(arrow_schema::Fields::from(vec![
+                    arrow_schema::Field::new("key", arrow_schema::DataType::Int32, false),
+                    arrow_schema::Field::new("value", arrow_schema::DataType::Utf8, true),
+                ])),
+                false,
+            )),
+            false,
+        );
+
+        let mut map_builder: MapBuilder<
+            Box<dyn arrow::array::ArrayBuilder>,
+            Box<dyn arrow::array::ArrayBuilder>,
+        > = MapBuilder::new(
+            None,
+            Box::new(Int32Builder::new()),
+            Box::new(StringBuilder::new()),
+        );
+
+        let map_type = DataTypes::map(DataTypes::int(), DataTypes::string());
+        Datum::Map(map)
+            .append_to(&mut map_builder, &map_type, &arrow_type)
+            .unwrap();
+        // Only the outer array is inspected: one map slot, and it is not null.
+        let array = map_builder.finish();
+        assert_eq!(array.len(), 1);
+        assert!(!array.is_null(0));
+    }
+
+    #[test]
+    fn test_datum_map_append_type_mismatch() {
+        use crate::metadata::DataTypes;
+        use crate::row::binary_map::FlussMapWriter;
+        use arrow::array::{Float64Builder, MapBuilder, StringBuilder};
+        use std::sync::Arc;
+
+        // 1. Construct a Map with Keys: String, Values: Float64
+        let mut writer = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::double());
+        writer.write_entry("key1".into(), 1.23.into()).unwrap();
+        let map = writer.complete().unwrap();
+
+        // 2. Define an Arrow Map builder for (String, Float64) using Boxed builders
+        let mut map_builder: MapBuilder<
+            Box<dyn arrow::array::ArrayBuilder>,
+            Box<dyn arrow::array::ArrayBuilder>,
+        > = MapBuilder::new(
+            None,
+            Box::new(StringBuilder::new()),
+            Box::new(Float64Builder::new()),
+        );
+
+        // 3. Define an INCOMPATIBLE expected Fluss type (Int32 instead of Map)
+        let mismatched_type = DataTypes::int();
+
+        // 4. Define the Arrow type (must match the builder structure)
+        let arrow_type = arrow_schema::DataType::Map(
+            Arc::new(arrow_schema::Field::new(
+                "entries",
+                arrow_schema::DataType::Struct(arrow_schema::Fields::from(vec![
+                    arrow_schema::Field::new("key", arrow_schema::DataType::Utf8, false),
+                    arrow_schema::Field::new("value", arrow_schema::DataType::Float64, true),
+                ])),
+                false,
+            )),
+            false,
+        );
+
+        // 5. append_to must fail on the Fluss type check, even though builder and Arrow type agree
+        let result = Datum::Map(map).append_to(&mut map_builder, &mismatched_type, &arrow_type);
+        // NOTE: the checks below match the exact error text and the Debug output of the Int type.
+        assert!(result.is_err());
+        let err = result.unwrap_err().to_string();
+        assert!(err.contains("row convert error Expected Map Fluss type for Map datum"));
+        assert!(err.contains("Int(IntType { nullable: true })"));
+    }
 }
 
 #[cfg(test)]
@@ -1305,10 +1520,11 @@ mod timestamp_tests {
 
     #[test]
     fn test_row_arrow_struct_round_trip() {
-        let row_type_owned = DataTypes::row(vec![
+        let row_type = crate::metadata::RowType::new(vec![
             DataField::new("x", DataTypes::int(), None),
             DataField::new("label", DataTypes::string(), None),
         ]);
+        let row_type_owned = DataType::Row(row_type.clone());
         let arrow_struct_dt = to_arrow_type(&row_type_owned).unwrap();
         let struct_fields: Fields = match &arrow_struct_dt {
             arrow_schema::DataType::Struct(f) => f.clone(),
@@ -1321,18 +1537,18 @@ mod timestamp_tests {
         r0.set_field(0, 42_i32);
         r0.set_field(1, "hello");
         Datum::Row(Box::new(r0))
-            .append_to(&mut struct_builder, &arrow_struct_dt)
+            .append_to(&mut struct_builder, &row_type_owned, &arrow_struct_dt)
             .expect("append row 0");
 
         Datum::Null
-            .append_to(&mut struct_builder, &arrow_struct_dt)
+            .append_to(&mut struct_builder, &row_type_owned, &arrow_struct_dt)
             .expect("append null row");
 
         let mut r2 = GenericRow::new(2);
         r2.set_field(0, -7_i32);
         r2.set_field(1, Datum::Null);
         Datum::Row(Box::new(r2))
-            .append_to(&mut struct_builder, &arrow_struct_dt)
+            .append_to(&mut struct_builder, &row_type_owned, &arrow_struct_dt)
             .expect("append row 2");
 
         let struct_array: StructArray = struct_builder.finish();
@@ -1346,7 +1562,7 @@ mod timestamp_tests {
             RecordBatch::try_new(schema, vec![Arc::new(struct_array)]).expect("record batch"),
         );
 
-        let mut columnar = ColumnarRow::new(batch, 0, None);
+        let mut columnar = ColumnarRow::new(batch, Arc::new(row_type), 0, None);
 
         let nested = columnar.get_row(0).expect("get_row 0");
         assert_eq!(nested.get_int(0).unwrap(), 42);
diff --git a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
index c7f16d6ca5..81cd96fa42 100644
--- a/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
+++ b/fluss-rust/crates/fluss/src/row/encode/compacted_key_encoder.rs
@@ -165,6 +165,22 @@ mod tests {
             .expect("CompactedKeyEncoder initialization failed")
     }
 
+    #[test]
+    fn test_encode_map_rejected() {
+        let row_type =
+            RowType::with_data_types(vec![DataTypes::map(DataTypes::string(), DataTypes::int())]);
+        // vec![0] points the encoder at column 0, the MAP column; construction is expected to fail.
+        let res = CompactedKeyEncoder::new(&row_type, vec![0]);
+        assert!(res.is_err());
+        if let Err(e) = res {
+            assert!(
+                e.to_string().contains("Cannot use Map"),
+                "Expected error to contain 'Cannot use Map', got '{}'",
+                e
+            );
+        }
+    }
+
     #[test]
     fn test_encode_key() {
         let row_type = RowType::with_data_types(vec![
@@ -364,7 +380,7 @@ mod tests {
             DataTypes::array(DataTypes::int()), // ARRAY<INT>
             DataTypes::array(DataTypes::float().as_non_nullable()), // ARRAY<FLOAT NOT NULL>
             DataTypes::array(DataTypes::array(DataTypes::string())), // ARRAY<ARRAY<STRING>>
-                                                // TODO: Add support for MAP type
+                                                // Note: MAP is rejected as a key type (see test_encode_map_rejected)
                                                 // TODO: Add support for ROW type
         ]);
 
diff --git a/fluss-rust/crates/fluss/src/row/field_getter.rs b/fluss-rust/crates/fluss/src/row/field_getter.rs
index a1ea378fc9..41322f542b 100644
--- a/fluss-rust/crates/fluss/src/row/field_getter.rs
+++ b/fluss-rust/crates/fluss/src/row/field_getter.rs
@@ -82,10 +82,13 @@ impl FieldGetter {
                 pos,
                 precision: t.precision(),
             },
-            // TODO: add Map variant when get_map is available in InternalRow.
             DataType::Array(_) => InnerFieldGetter::Array { pos },
+            DataType::Map(m) => InnerFieldGetter::Map {
+                pos,
+                key_type: m.key_type().clone(),
+                value_type: m.value_type().clone(),
+            },
             DataType::Row(_) => InnerFieldGetter::Row { pos },
-            _ => unimplemented!("DataType {:?} is currently unimplemented", data_type),
         };
 
         if data_type.is_nullable() {
@@ -155,6 +158,11 @@ pub enum InnerFieldGetter {
     Array {
         pos: usize,
     },
+    Map {
+        pos: usize,
+        key_type: DataType,
+        value_type: DataType,
+    },
     Row {
         pos: usize,
     },
@@ -187,8 +195,12 @@ impl InnerFieldGetter {
             InnerFieldGetter::TimestampLtz { pos, precision } => {
                 Datum::TimestampLtz(row.get_timestamp_ltz(*pos, *precision)?)
             }
-            // TODO: add Map field getter support once its binary form is implemented.
             InnerFieldGetter::Array { pos } => Datum::Array(row.get_array(*pos)?),
+            InnerFieldGetter::Map {
+                pos,
+                key_type,
+                value_type,
+            } => Datum::Map(row.get_map(*pos, key_type, value_type)?),
             InnerFieldGetter::Row { pos } => Datum::Row(Box::new(row.get_row(*pos)?.clone())),
         })
     }
@@ -212,6 +224,7 @@ impl InnerFieldGetter {
             | Self::Timestamp { pos, .. }
             | Self::TimestampLtz { pos, .. }
             | Self::Array { pos }
+            | Self::Map { pos, .. }
             | Self::Row { pos } => *pos,
         }
     }
@@ -223,6 +236,7 @@ mod tests {
     use crate::metadata::DataTypes;
     use crate::row::GenericRow;
     use crate::row::binary_array::FlussArrayWriter;
+    use crate::row::binary_map::FlussMapWriter;
 
     #[test]
     fn test_field_getter_array() {
@@ -258,4 +272,38 @@ mod tests {
         let datum = getter.get_field(&row).unwrap();
         assert!(datum.is_null());
     }
+
+    #[test]
+    fn test_field_getter_map() {
+        let mut map_writer = FlussMapWriter::new(1, &DataTypes::int(), &DataTypes::string());
+        map_writer.write_entry(42.into(), "value".into()).unwrap();
+        let map = map_writer.complete().unwrap();
+
+        let mut row = GenericRow::new(2);
+        row.set_field(0, Datum::Int32(1));
+        row.set_field(1, Datum::Map(map));
+
+        let data_type = DataTypes::map(DataTypes::int(), DataTypes::string());
+        let getter = FieldGetter::create(&data_type, 1);
+        let datum = getter.get_field(&row).unwrap();
+
+        match datum {
+            Datum::Map(m) => {
+                assert_eq!(m.size(), 1);
+                assert_eq!(m.key_array().get_int(0).unwrap(), 42);
+                assert_eq!(m.value_array().get_string(0).unwrap(), "value");
+            }
+            _ => panic!("Expected Map datum"),
+        }
+    }
+
+    #[test]
+    fn test_field_getter_nullable_map() {
+        let row = GenericRow::from_data(vec![Datum::Null]);
+
+        let data_type = DataTypes::map(DataTypes::int(), DataTypes::string());
+        let getter = FieldGetter::create(&data_type, 0);
+        let datum = getter.get_field(&row).unwrap();
+        assert!(datum.is_null());
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/lookup_row.rs b/fluss-rust/crates/fluss/src/row/lookup_row.rs
index 76505abf63..fd3db4fcfb 100644
--- a/fluss-rust/crates/fluss/src/row/lookup_row.rs
+++ b/fluss-rust/crates/fluss/src/row/lookup_row.rs
@@ -21,10 +21,11 @@
 
 use crate::client::WriteFormat;
 use crate::error::Result;
+use crate::metadata::DataType;
 use crate::row::compacted::CompactedRow;
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
 use crate::row::projected_row::ProjectedRow;
-use crate::row::{Decimal, FlussArray, GenericRow, InternalRow};
+use crate::row::{Decimal, FlussArray, FlussMap, GenericRow, InternalRow};
 
 pub struct LookupRow<'a> {
     inner: Inner<'a>,
@@ -116,6 +117,9 @@ impl<'a> InternalRow for LookupRow<'a> {
     fn get_array(&self, pos: usize) -> Result<FlussArray> {
         delegate!(self, get_array, pos)
     }
+    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
+        delegate!(self, get_map, pos, key_type, value_type)
+    }
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
         delegate!(self, get_row, pos)
     }
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 36f9a1c250..2456ee4d39 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 pub mod binary_array;
+pub mod binary_map;
 mod column;
 
 pub(crate) mod datum;
@@ -32,7 +33,9 @@ mod projected_row;
 mod row_decoder;
 
 use crate::client::WriteFormat;
-pub use binary_array::FlussArray;
+use crate::metadata::DataType;
+pub use binary_array::{FlussArray, FlussArrayWriter};
+pub use binary_map::{FlussMap, FlussMapWriter};
 use bytes::Bytes;
 pub use column::*;
 pub use compacted::CompactedRow;
@@ -131,7 +134,10 @@ pub trait InternalRow: Send + Sync {
     /// Returns the array value at the given position
     fn get_array(&self, pos: usize) -> Result<FlussArray>;
 
-    /// Returns the nested row value at the given position
+    /// Returns the map value at the given position
+    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap>;
+
+    /// Returns the nested row value at the given position
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
         Err(IllegalArgument {
             message: format!("get_row not supported at position {pos}"),
@@ -303,6 +309,20 @@ impl<'a> InternalRow for GenericRow<'a> {
         }
     }
 
+    fn get_map(
+        &self,
+        pos: usize,
+        _key_type: &DataType,
+        _value_type: &DataType,
+    ) -> Result<FlussMap> {
+        match self.get_value(pos)? {
+            Datum::Map(m) => Ok(m.clone()),
+            other => Err(IllegalArgument {
+                message: format!("type mismatch at position {pos}: expected Map, got {other:?}"),
+            }),
+        }
+    }
+
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
         match self.get_value(pos)? {
             Datum::Row(r) => Ok(r.as_ref()),
diff --git a/fluss-rust/crates/fluss/src/row/projected_row.rs b/fluss-rust/crates/fluss/src/row/projected_row.rs
index fc4a521ee0..0075f0b8e2 100644
--- a/fluss-rust/crates/fluss/src/row/projected_row.rs
+++ b/fluss-rust/crates/fluss/src/row/projected_row.rs
@@ -21,9 +21,10 @@
 use crate::client::WriteFormat;
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
+use crate::metadata::DataType;
 use crate::metadata::UNEXIST_MAPPING;
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
-use crate::row::{Decimal, FlussArray, GenericRow, InternalRow};
+use crate::row::{Decimal, FlussArray, FlussMap, GenericRow, InternalRow};
 use std::sync::Arc;
 
 pub(crate) struct ProjectedRow<R> {
@@ -142,6 +143,10 @@ impl<R: InternalRow> InternalRow for ProjectedRow<R> {
         project!(self, get_array, pos)
     }
 
+    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
+        project!(self, get_map, pos, key_type, value_type)
+    }
+
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
         project!(self, get_row, pos)
     }
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index fadb49622c..8be0d1daae 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -1041,6 +1041,90 @@ mod table_test {
             .expect("Failed to drop table");
     }
 
+    #[tokio::test]
+    async fn test_map_datatype_roundtrip() {
+        use fluss::row::binary_map::FlussMapWriter;
+        use fluss::row::{Datum, GenericRow};
+
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_map_datatype_roundtrip");
+
+        let key_type = DataTypes::string();
+        let value_type = DataTypes::int();
+        let map_type = DataTypes::map(key_type.clone(), value_type.clone());
+
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("map_col", map_type.clone())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+
+        // 1. Construct FlussMap
+        let mut map_writer = FlussMapWriter::new(3, &key_type, &value_type);
+        map_writer.write_entry("k1".into(), 10.into()).unwrap();
+        map_writer.write_entry("k2".into(), 20.into()).unwrap();
+        map_writer.write_entry("k3".into(), 30.into()).unwrap();
+        let fluss_map = map_writer.complete().unwrap();
+
+        // 2. Insert Row
+        let mut row = GenericRow::new(2);
+        row.set_field(0, 1i32);
+        row.set_field(1, Datum::Map(fluss_map));
+
+        let append_writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        append_writer.append(&row).expect("Failed to append row");
+        append_writer.flush().await.expect("Failed to flush");
+
+        // 3. Fetch Row
+        let records = scan_table(&table, |scan| scan).await;
+        assert_eq!(records.len(), 1, "Expected 1 record");
+
+        let found_row = records[0].row();
+        assert_eq!(found_row.get_int(0).unwrap(), 1);
+
+        // 4. Assert Map
+        let decoded_map = found_row
+            .get_map(1, &key_type, &value_type)
+            .expect("Failed to get map");
+        assert_eq!(decoded_map.size(), 3);
+
+        let decoded_keys = decoded_map.key_array();
+        let decoded_values = decoded_map.value_array();
+
+        assert_eq!(decoded_keys.get_string(0).unwrap(), "k1");
+        assert_eq!(decoded_keys.get_string(1).unwrap(), "k2");
+        assert_eq!(decoded_keys.get_string(2).unwrap(), "k3");
+
+        assert_eq!(decoded_values.get_int(0).unwrap(), 10);
+        assert_eq!(decoded_values.get_int(1).unwrap(), 20);
+        assert_eq!(decoded_values.get_int(2).unwrap(), 30);
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
     #[tokio::test]
     async fn partitioned_table_append_scan() {
         let cluster = get_shared_cluster();

From 5425b93665d67d22ae852fdeae5fa9c5c1fd4c28 Mon Sep 17 00:00:00 2001
From: Anton Borisov <anton.borisov@fresha.com>
Date: Fri, 15 May 2026 12:56:38 +0100
Subject: [PATCH 270/287] fix: close Arrow read-path gaps for MAP

---
 .../crates/fluss/src/metadata/datatype.rs     |  63 +++-
 fluss-rust/crates/fluss/src/record/arrow.rs   |  66 +++-
 fluss-rust/crates/fluss/src/row/binary_map.rs |  28 +-
 fluss-rust/crates/fluss/src/row/column.rs     | 301 +++++++++++++++---
 .../fluss/tests/integration/log_table.rs      |  12 +-
 5 files changed, 405 insertions(+), 65 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/metadata/datatype.rs b/fluss-rust/crates/fluss/src/metadata/datatype.rs
index 98823f075c..60a44ba718 100644
--- a/fluss-rust/crates/fluss/src/metadata/datatype.rs
+++ b/fluss-rust/crates/fluss/src/metadata/datatype.rs
@@ -920,13 +920,36 @@ impl Display for ArrayType {
     }
 }
 
-#[derive(Debug, Clone, PartialEq, Eq, Deserialize, Serialize, Hash)]
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Hash)]
 pub struct MapType {
     nullable: bool,
     key_type: Box<DataType>,
     value_type: Box<DataType>,
 }
 
+// Route Deserialize through `with_nullable` so a Serde-built MapType
+// collapses to the same canonical form as the constructor (otherwise
+// equivalent maps disagree under `PartialEq`).
+impl<'de> Deserialize<'de> for MapType {
+    fn deserialize<D>(deserializer: D) -> std::result::Result<Self, D::Error>
+    where
+        D: serde::Deserializer<'de>,
+    {
+        #[derive(Deserialize)]
+        struct Raw {
+            nullable: bool,
+            key_type: Box<DataType>,
+            value_type: Box<DataType>,
+        }
+        let raw = Raw::deserialize(deserializer)?;
+        Ok(MapType::with_nullable(
+            raw.nullable,
+            *raw.key_type,
+            *raw.value_type,
+        ))
+    }
+}
+
 impl MapType {
     pub fn new(key_type: DataType, value_type: DataType) -> Self {
         Self::with_nullable(true, key_type, value_type)
@@ -1470,6 +1493,44 @@ fn test_map_display() {
     );
 }
 
+#[test]
+fn test_map_deserialize_normalises_key_nullability() {
+    let json = r#"{
+        "nullable": true,
+        "key_type": {"Int": {"nullable": true}},
+        "value_type": {"String": {"nullable": true}}
+    }"#;
+    let from_json: MapType = serde_json::from_str(json).expect("deserialize");
+    let from_ctor = MapType::new(DataTypes::int(), DataTypes::string());
+    assert_eq!(from_json, from_ctor);
+    assert!(!from_json.key_type().is_nullable());
+}
+
+#[test]
+fn test_map_deserialize_normalises_nested_map_keys() {
+    let json = r#"{
+        "nullable": true,
+        "key_type": {"String": {"nullable": true}},
+        "value_type": {"Map": {
+            "nullable": true,
+            "key_type": {"Int": {"nullable": true}},
+            "value_type": {"Boolean": {"nullable": true}}
+        }}
+    }"#;
+    let from_json: MapType = serde_json::from_str(json).expect("deserialize");
+    let from_ctor = MapType::new(
+        DataTypes::string(),
+        DataTypes::map(DataTypes::int(), DataTypes::boolean()),
+    );
+    assert_eq!(from_json, from_ctor);
+    assert!(!from_json.key_type().is_nullable());
+    let inner = match from_json.value_type() {
+        DataType::Map(m) => m,
+        other => panic!("expected nested Map, got {other:?}"),
+    };
+    assert!(!inner.key_type().is_nullable());
+}
+
 #[test]
 fn test_row_display() {
     let fields = vec![
diff --git a/fluss-rust/crates/fluss/src/record/arrow.rs b/fluss-rust/crates/fluss/src/record/arrow.rs
index 179062e90d..b97fc120de 100644
--- a/fluss-rust/crates/fluss/src/record/arrow.rs
+++ b/fluss-rust/crates/fluss/src/record/arrow.rs
@@ -1261,6 +1261,16 @@ pub fn to_arrow_type(fluss_type: &DataType) -> Result<ArrowDataType> {
     })
 }
 
+/// Like `from_arrow_type`, but also reads the Field's nullability —
+/// Arrow stores it on the Field wrapper, not the leaf data type.
+pub(crate) fn from_arrow_field(field: &arrow_schema::Field) -> Result<DataType> {
+    let mut dt = from_arrow_type(field.data_type())?;
+    if !field.is_nullable() {
+        dt = dt.as_non_nullable();
+    }
+    Ok(dt)
+}
+
 /// Converts an Arrow data type back to a Fluss `DataType`.
 /// Used for reading array elements from Arrow ListArray back into Fluss types.
 pub(crate) fn from_arrow_type(arrow_type: &ArrowDataType) -> Result<DataType> {
@@ -1317,17 +1327,30 @@ pub(crate) fn from_arrow_type(arrow_type: &ArrowDataType) -> Result<DataType> {
                 DataTypes::timestamp_with_precision(precision)
             }
         }
-        ArrowDataType::List(field) => DataTypes::array(from_arrow_type(field.data_type())?),
+        ArrowDataType::List(field) => DataTypes::array(from_arrow_field(field)?),
+        ArrowDataType::Map(entries_field, _sorted) => {
+            let fields = match entries_field.data_type() {
+                ArrowDataType::Struct(f) => f,
+                other => {
+                    return Err(Error::IllegalArgument {
+                        message: format!("Map entries must be Struct, got {other:?}"),
+                    });
+                }
+            };
+            if fields.len() != 2 {
+                return Err(Error::IllegalArgument {
+                    message: format!(
+                        "Map entries Struct must have 2 fields (key, value), got {}",
+                        fields.len()
+                    ),
+                });
+            }
+            DataTypes::map(from_arrow_field(&fields[0])?, from_arrow_field(&fields[1])?)
+        }
         ArrowDataType::Struct(fields) => {
             let row_fields: Result<Vec<DataField>> = fields
                 .iter()
-                .map(|f| {
-                    let mut dt = from_arrow_type(f.data_type())?;
-                    if !f.is_nullable() {
-                        dt = dt.as_non_nullable();
-                    }
-                    Ok(DataField::new(f.name(), dt, None))
-                })
+                .map(|f| Ok(DataField::new(f.name(), from_arrow_field(f)?, None)))
                 .collect();
             DataTypes::row(row_fields?)
         }
@@ -1851,6 +1874,33 @@ mod tests {
         }
     }
 
+    #[test]
+    fn test_from_arrow_type_preserves_container_field_nullability() {
+        let arrow_list = ArrowDataType::List(Arc::new(arrow_schema::Field::new(
+            "item",
+            ArrowDataType::Int32,
+            false,
+        )));
+        match from_arrow_type(&arrow_list).unwrap() {
+            DataType::Array(at) => assert!(!at.get_element_type().is_nullable()),
+            other => panic!("expected Array, got {other:?}"),
+        }
+
+        let entries_struct = ArrowDataType::Struct(arrow_schema::Fields::from(vec![
+            arrow_schema::Field::new("key", ArrowDataType::Utf8, false),
+            arrow_schema::Field::new("value", ArrowDataType::Int32, false),
+        ]));
+        let entries_field = arrow_schema::Field::new("entries", entries_struct, false);
+        let arrow_map = ArrowDataType::Map(Arc::new(entries_field), false);
+        match from_arrow_type(&arrow_map).unwrap() {
+            DataType::Map(m) => {
+                assert!(!m.key_type().is_nullable());
+                assert!(!m.value_type().is_nullable());
+            }
+            other => panic!("expected Map, got {other:?}"),
+        }
+    }
+
     #[test]
     fn test_parse_ipc_message() {
         let empty_body: &[u8] = &le_bytes(&[0xFFFFFFFF, 0x00000000]);
diff --git a/fluss-rust/crates/fluss/src/row/binary_map.rs b/fluss-rust/crates/fluss/src/row/binary_map.rs
index b710b69c7d..46e82899ab 100644
--- a/fluss-rust/crates/fluss/src/row/binary_map.rs
+++ b/fluss-rust/crates/fluss/src/row/binary_map.rs
@@ -93,6 +93,17 @@ impl Serialize for FlussMap {
     }
 }
 
+fn check_no_null_keys(key_array: &FlussArray) -> Result<()> {
+    for i in 0..key_array.size() {
+        if key_array.is_null_at(i) {
+            return Err(IllegalArgument {
+                message: "FlussMap keys cannot be null".to_string(),
+            });
+        }
+    }
+    Ok(())
+}
+
 impl FlussMap {
     /// Validates the raw bytes and extracts the sub-arrays.
     fn validate(
@@ -163,14 +174,7 @@ impl FlussMap {
             });
         }
 
-        // Centralized null-key check: FlussMap keys are never allowed to be null.
-        for i in 0..key_array.size() {
-            if key_array.is_null_at(i) {
-                return Err(IllegalArgument {
-                    message: "FlussMap keys cannot be null".to_string(),
-                });
-            }
-        }
+        check_no_null_keys(&key_array)?;
 
         Ok((key_array, value_array))
     }
@@ -216,6 +220,7 @@ impl FlussMap {
                 ),
             });
         }
+        check_no_null_keys(key_array)?;
 
         let key_bytes = key_array.as_bytes();
         let value_bytes = value_array.as_bytes();
@@ -533,15 +538,16 @@ mod tests {
     #[test]
     fn test_null_keys_fail_validation() {
         let mut key_writer = FlussArrayWriter::new(1, &DataTypes::int());
-        key_writer.set_null_at(0); // null key!
+        key_writer.set_null_at(0);
         let key_array = key_writer.complete().unwrap();
 
         let mut value_writer = FlussArrayWriter::new(1, &DataTypes::int());
         value_writer.write_int(0, 100);
         let value_array = value_writer.complete().unwrap();
 
-        // Constructing bytes manually since from_arrays no longer catches it,
-        // and we want to verify validate catches it.
+        let err = FlussMap::from_arrays(&key_array, &value_array).unwrap_err();
+        assert!(err.to_string().contains("keys cannot be null"));
+
         let key_bytes = key_array.as_bytes();
         let value_bytes = value_array.as_bytes();
         let mut data = vec![];
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index b088f124b6..8b23423bbf 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -18,7 +18,7 @@
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::metadata::{DataType, RowType};
-use crate::record::from_arrow_type;
+use crate::record::from_arrow_field;
 use crate::row::binary_array::FlussArrayWriter;
 use crate::row::binary_map::FlussMap;
 use crate::row::datum::{Date, Datum, Time, TimestampLtz, TimestampNtz};
@@ -413,14 +413,48 @@ fn arrow_value_to_datum(
         ArrowDataType::List(field) => {
             let list_arr = downcast!(ListArray);
             let values = list_arr.value(row_id);
+            // Infer via from_arrow_field so the inferred element type
+            // matches what `arrow_map_entry_to_fluss_map` / strict `==`
+            // expect when there's no upstream Fluss schema.
             let element_fluss_type = match fluss_type {
                 Some(DataType::Array(at)) => at.get_element_type().clone(),
-                _ => from_arrow_type(field.data_type())?,
+                _ => from_arrow_field(field)?,
             };
             let mut writer = FlussArrayWriter::new(values.len(), &element_fluss_type);
             write_arrow_values_to_fluss_array(&*values, &element_fluss_type, &mut writer)?;
             Ok(Datum::Array(writer.complete()?))
         }
+        ArrowDataType::Map(entries_field, _) => {
+            let map_arr = downcast!(MapArray);
+            let entries = map_arr.value(row_id);
+            let (key_type, value_type) = match fluss_type {
+                Some(DataType::Map(m)) => (m.key_type().clone(), m.value_type().clone()),
+                _ => {
+                    let fields = match entries_field.data_type() {
+                        ArrowDataType::Struct(f) => f,
+                        other => {
+                            return Err(IllegalArgument {
+                                message: format!("expected Struct for Map entries, got {other:?}"),
+                            });
+                        }
+                    };
+                    if fields.len() != 2 {
+                        return Err(IllegalArgument {
+                            message: format!(
+                                "Map entries Struct must have 2 fields, got {}",
+                                fields.len()
+                            ),
+                        });
+                    }
+                    (from_arrow_field(&fields[0])?, from_arrow_field(&fields[1])?)
+                }
+            };
+            Ok(Datum::Map(arrow_map_entry_to_fluss_map(
+                &entries,
+                &key_type,
+                &value_type,
+            )?))
+        }
         other => Err(IllegalArgument {
             message: format!("unsupported Arrow data type for nested row extraction: {other:?}"),
         }),
@@ -627,19 +661,16 @@ impl InternalRow for ColumnarRow {
         };
 
         let column = self.column(pos)?;
-        let values = if let Some(list_arr) = column.as_any().downcast_ref::<ListArray>() {
-            list_arr.value(self.row_id)
-        } else {
-            return Err(IllegalArgument {
-                message: format!(
-                    "expected List array at position {pos}, got {:?}",
-                    column.data_type()
-                ),
-            });
+        let element_field = match column.data_type() {
+            ArrowDataType::List(field) => field,
+            other => {
+                return Err(IllegalArgument {
+                    message: format!("expected List array at position {pos}, got {other:?}"),
+                });
+            }
         };
 
-        // Validate that the Arrow element type matches the expected Fluss element type
-        let actual_element_type = from_arrow_type(values.data_type())?;
+        let actual_element_type = from_arrow_field(element_field)?;
         if actual_element_type != *element_fluss_type {
             return Err(IllegalArgument {
                 message: format!(
@@ -649,8 +680,12 @@ impl InternalRow for ColumnarRow {
             });
         }
 
+        let list_arr = column
+            .as_any()
+            .downcast_ref::<ListArray>()
+            .expect("data_type matched List but downcast failed; arrow-rs invariant violated");
+        let values = list_arr.value(self.row_id);
         let mut writer = FlussArrayWriter::new(values.len(), element_fluss_type);
-
         write_arrow_values_to_fluss_array(&*values, element_fluss_type, &mut writer)?;
         writer.complete()
     }
@@ -668,27 +703,6 @@ impl InternalRow for ColumnarRow {
                     ),
                 })?;
 
-        // Validate the Arrow element type matches the expected Fluss types
-        let actual_key_type = from_arrow_type(map_arr.key_type())?;
-        if actual_key_type != *key_type {
-            return Err(IllegalArgument {
-                message: format!(
-                    "Arrow map key type {:?} does not match expected Fluss type {:?}",
-                    actual_key_type, key_type
-                ),
-            });
-        }
-        let actual_value_type = from_arrow_type(map_arr.value_type())?;
-        if actual_value_type != *value_type {
-            return Err(IllegalArgument {
-                message: format!(
-                    "Arrow map value type {:?} does not match expected Fluss type {:?}",
-                    actual_value_type, value_type
-                ),
-            });
-        }
-
-        // Get the entries for this specific row
         arrow_map_entry_to_fluss_map(&map_arr.value(self.row_id), key_type, value_type)
     }
 
@@ -733,20 +747,24 @@ fn arrow_map_entry_to_fluss_map(
     key_type: &DataType,
     value_type: &DataType,
 ) -> Result<FlussMap> {
-    if struct_arr.num_columns() != 2 {
+    let fields = match struct_arr.data_type() {
+        ArrowDataType::Struct(f) => f,
+        other => {
+            return Err(IllegalArgument {
+                message: format!("expected Struct for Map entries, got {other:?}"),
+            });
+        }
+    };
+    if fields.len() != 2 {
         return Err(IllegalArgument {
             message: format!(
                 "Expected 2 columns in Map entries struct, got {}",
-                struct_arr.num_columns()
+                fields.len()
             ),
         });
     }
 
-    let keys_arrow = struct_arr.column(0);
-    let values_arrow = struct_arr.column(1);
-
-    // Validate that the Arrow key/value types match the expected Fluss types
-    let actual_key_type = from_arrow_type(keys_arrow.data_type())?;
+    let actual_key_type = from_arrow_field(&fields[0])?;
     if actual_key_type != *key_type {
         return Err(IllegalArgument {
             message: format!(
@@ -756,7 +774,7 @@ fn arrow_map_entry_to_fluss_map(
         });
     }
 
-    let actual_value_type = from_arrow_type(values_arrow.data_type())?;
+    let actual_value_type = from_arrow_field(&fields[1])?;
     if actual_value_type != *value_type {
         return Err(IllegalArgument {
             message: format!(
@@ -766,6 +784,9 @@ fn arrow_map_entry_to_fluss_map(
         });
     }
 
+    let keys_arrow = struct_arr.column(0);
+    let values_arrow = struct_arr.column(1);
+
     let len = keys_arrow.len();
 
     // Convert Arrow keys → FlussArray
@@ -1520,4 +1541,198 @@ mod tests {
         let nested_1 = row.get_row(0).unwrap();
         assert_eq!(nested_1.get_int(0).unwrap(), 20);
     }
+
+    #[test]
+    fn columnar_row_get_map_accepts_non_nullable_key_from_map_type() {
+        use crate::metadata::DataTypes;
+        use arrow::array::{MapBuilder, StringBuilder};
+
+        // Arrow map column with INT keys, STRING values.
+        let mut builder = MapBuilder::new(None, Int32Builder::new(), StringBuilder::new());
+        builder.keys().append_value(1);
+        builder.values().append_value("a");
+        builder.append(true).unwrap();
+        let map_arr = builder.finish();
+
+        let map_arrow_type = map_arr.data_type().clone();
+        let schema = Arc::new(Schema::new(vec![Field::new("m", map_arrow_type, true)]));
+        let batch =
+            Arc::new(RecordBatch::try_new(schema, vec![Arc::new(map_arr)]).expect("record batch"));
+
+        let map_type = DataTypes::map(DataTypes::int(), DataTypes::string());
+        let row_type = Arc::new(RowType::with_data_types(vec![map_type.clone()]));
+        let row = ColumnarRow::new(batch, row_type, 0, None);
+
+        let (k, v) = match &map_type {
+            crate::metadata::DataType::Map(m) => (m.key_type(), m.value_type()),
+            _ => unreachable!(),
+        };
+        let fluss_map = row
+            .get_map(0, k, v)
+            .expect("get_map should accept non-nullable key from MapType");
+        assert_eq!(fluss_map.size(), 1);
+        assert_eq!(fluss_map.key_array().get_int(0).unwrap(), 1);
+        assert_eq!(fluss_map.value_array().get_string(0).unwrap(), "a");
+    }
+
+    #[test]
+    fn columnar_row_reads_row_containing_map() {
+        use crate::metadata::DataTypes;
+        use arrow::array::{MapBuilder, StringBuilder};
+
+        // Inner Map<String, Int> Arrow column with one entry per row, 2 rows.
+        let mut mb = MapBuilder::new(None, StringBuilder::new(), Int32Builder::new());
+        mb.keys().append_value("k1");
+        mb.values().append_value(42);
+        mb.append(true).unwrap();
+        mb.keys().append_value("k2");
+        mb.values().append_value(7);
+        mb.append(true).unwrap();
+        let map_arr = mb.finish();
+
+        // Struct { id: Int32, m: Map<String, Int> }
+        let id_arr = Int32Array::from(vec![10, 20]);
+        let struct_fields = Fields::from(vec![
+            Field::new("id", DataType::Int32, false),
+            Field::new("m", map_arr.data_type().clone(), false),
+        ]);
+        let struct_arr = Arc::new(StructArray::new(
+            struct_fields.clone(),
+            vec![Arc::new(id_arr), Arc::new(map_arr)],
+            None,
+        ));
+        let schema = Arc::new(Schema::new(vec![Field::new(
+            "outer",
+            DataType::Struct(struct_fields),
+            false,
+        )]));
+        let batch = Arc::new(RecordBatch::try_new(schema, vec![struct_arr]).expect("record batch"));
+
+        // Fluss outer ROW<id INT, m MAP<STRING, INT>>
+        let inner_row_type = RowType::with_data_types(vec![
+            DataTypes::int(),
+            DataTypes::map(DataTypes::string(), DataTypes::int()),
+        ]);
+        let outer_row_type = Arc::new(RowType::with_data_types(vec![
+            crate::metadata::DataType::Row(inner_row_type),
+        ]));
+
+        let mut row = ColumnarRow::new(
+            batch,
+            outer_row_type.clone(),
+            0,
+            Some(outer_row_type.clone()),
+        );
+
+        let nested = row
+            .get_row(0)
+            .expect("reading row with Map field must succeed");
+        assert_eq!(nested.get_int(0).unwrap(), 10);
+        let inner_map = nested
+            .get_map(1, &DataTypes::string(), &DataTypes::int())
+            .expect("nested map should be accessible");
+        assert_eq!(inner_map.size(), 1);
+        assert_eq!(inner_map.key_array().get_string(0).unwrap(), "k1");
+        assert_eq!(inner_map.value_array().get_int(0).unwrap(), 42);
+
+        // Verify cache invalidation across rows works for Row-with-Map too.
+        row.set_row_id(1);
+        let nested = row.get_row(0).expect("row 1 must read");
+        assert_eq!(nested.get_int(0).unwrap(), 20);
+        let inner_map = nested
+            .get_map(1, &DataTypes::string(), &DataTypes::int())
+            .unwrap();
+        assert_eq!(inner_map.key_array().get_string(0).unwrap(), "k2");
+        assert_eq!(inner_map.value_array().get_int(0).unwrap(), 7);
+    }
+
+    #[test]
+    fn columnar_row_reads_array_of_maps() {
+        use crate::metadata::DataTypes;
+        use arrow::array::{ListBuilder, MapBuilder, StringBuilder};
+
+        // One row whose ARRAY<MAP<STRING, INT>> contains two maps:
+        // [{"k1" -> 1}, {"k2" -> 2, "k3" -> 3}].
+        let mut outer = ListBuilder::new(MapBuilder::new(
+            None,
+            StringBuilder::new(),
+            Int32Builder::new(),
+        ));
+        {
+            let mb = outer.values();
+            // Map 0: {"k1" -> 1}
+            mb.keys().append_value("k1");
+            mb.values().append_value(1);
+            mb.append(true).unwrap();
+            // Map 1: {"k2" -> 2, "k3" -> 3}
+            mb.keys().append_value("k2");
+            mb.values().append_value(2);
+            mb.keys().append_value("k3");
+            mb.values().append_value(3);
+            mb.append(true).unwrap();
+        }
+        outer.append(true);
+        let list_arr = outer.finish();
+        let arrow_dt = list_arr.data_type().clone();
+
+        let schema = Arc::new(Schema::new(vec![Field::new("a", arrow_dt, false)]));
+        let batch =
+            Arc::new(RecordBatch::try_new(schema, vec![Arc::new(list_arr)]).expect("record batch"));
+
+        let array_type = DataTypes::array(DataTypes::map(DataTypes::string(), DataTypes::int()));
+        let row_type = Arc::new(RowType::with_data_types(vec![array_type]));
+        let row = ColumnarRow::new(batch, row_type, 0, None);
+
+        let arr = row.get_array(0).expect("get_array on ARRAY<MAP> must work");
+        assert_eq!(arr.size(), 2);
+
+        let m0 = arr
+            .get_map(0, &DataTypes::string(), &DataTypes::int())
+            .unwrap();
+        assert_eq!(m0.size(), 1);
+        assert_eq!(m0.key_array().get_string(0).unwrap(), "k1");
+        assert_eq!(m0.value_array().get_int(0).unwrap(), 1);
+
+        let m1 = arr
+            .get_map(1, &DataTypes::string(), &DataTypes::int())
+            .unwrap();
+        assert_eq!(m1.size(), 2);
+        assert_eq!(m1.key_array().get_string(0).unwrap(), "k2");
+        assert_eq!(m1.value_array().get_int(0).unwrap(), 2);
+        assert_eq!(m1.key_array().get_string(1).unwrap(), "k3");
+        assert_eq!(m1.value_array().get_int(1).unwrap(), 3);
+    }
+
+    #[test]
+    fn columnar_row_get_map_rejects_real_type_mismatch() {
+        use crate::metadata::DataTypes;
+        use arrow::array::{MapBuilder, StringBuilder};
+
+        let mut mb = MapBuilder::new(None, StringBuilder::new(), Int32Builder::new());
+        mb.keys().append_value("k");
+        mb.values().append_value(1);
+        mb.append(true).unwrap();
+        let map_arr = mb.finish();
+        let map_arrow_type = map_arr.data_type().clone();
+
+        let schema = Arc::new(Schema::new(vec![Field::new("m", map_arrow_type, true)]));
+        let batch =
+            Arc::new(RecordBatch::try_new(schema, vec![Arc::new(map_arr)]).expect("record batch"));
+
+        // Caller mis-declares the value type as STRING.
+        let row_type = Arc::new(RowType::with_data_types(vec![DataTypes::map(
+            DataTypes::string(),
+            DataTypes::string(),
+        )]));
+        let row = ColumnarRow::new(batch, row_type, 0, None);
+
+        let err = row
+            .get_map(0, &DataTypes::string(), &DataTypes::string())
+            .expect_err("type mismatch must error");
+        let msg = err.to_string();
+        assert!(
+            msg.contains("does not match expected Fluss type"),
+            "unexpected error: {msg}"
+        );
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 8be0d1daae..11c5b3e95d 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -1102,9 +1102,17 @@ mod table_test {
         let found_row = records[0].row();
         assert_eq!(found_row.get_int(0).unwrap(), 1);
 
-        // 4. Assert Map
+        // 4. Assert Map. Look the types up from `map_type` rather than reusing
+        // the locally-stashed `key_type`/`value_type`: `MapType::with_nullable`
+        // forces the stored key non-nullable, which exercises the same
+        // (non-nullable schema) vs (Arrow-derived nullable) comparison realistic
+        // callers hit.
+        let (mt_key, mt_value) = match &map_type {
+            fluss::metadata::DataType::Map(m) => (m.key_type(), m.value_type()),
+            _ => unreachable!("map_type is a MAP"),
+        };
         let decoded_map = found_row
-            .get_map(1, &key_type, &value_type)
+            .get_map(1, mt_key, mt_value)
             .expect("Failed to get map");
         assert_eq!(decoded_map.size(), 3);
 

From dbf5f80ee16c8e66db8ff6b7bcb4e7c598db2440 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Fri, 15 May 2026 14:23:57 +0100
Subject: [PATCH 271/287] chore: fix main broken due to new clippy
 useless_conversion (#548)

---
 fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs b/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
index 1e337f8395..06014bfbb7 100644
--- a/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
+++ b/fluss-rust/crates/fluss/src/client/lookup/lookup_sender.rs
@@ -197,7 +197,7 @@ impl<T> LookupBatch<T> {
             return;
         }
 
-        for (lookup, value) in self.lookups.iter_mut().zip(values.into_iter()) {
+        for (lookup, value) in self.lookups.iter_mut().zip(values) {
             lookup.complete(Ok(value));
         }
     }

From 5f452c879f0cfee79180a376f89afc4d4986c50e Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Tue, 19 May 2026 02:46:33 +0200
Subject: [PATCH 272/287] [metrics] Add scanner fetch and remote download
 metrics (#553)

* add scanner fetch and remote download metrics

* add scanner fetch and remote download metrics
---
 .../fluss/src/client/table/remote_log.rs      |  13 ++
 .../crates/fluss/src/client/table/scanner.rs  | 149 +++++++++++++++++-
 fluss-rust/crates/fluss/src/metrics.rs        |  93 +++++++++++
 3 files changed, 247 insertions(+), 8 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index 4d96ce96b2..8957aced14 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -18,6 +18,10 @@ use crate::client::credentials::CredentialsReceiver;
 use crate::error::{Error, Result};
 use crate::io::{FileIO, Storage};
 use crate::metadata::TableBucket;
+use crate::metrics::{
+    SCANNER_REMOTE_FETCH_BYTES_TOTAL, SCANNER_REMOTE_FETCH_ERRORS_TOTAL,
+    SCANNER_REMOTE_FETCH_REQUESTS_TOTAL,
+};
 use crate::proto::{PbRemoteLogFetchInfo, PbRemoteLogSegment};
 use futures::TryStreamExt;
 use parking_lot::Mutex;
@@ -494,12 +498,19 @@ async fn spawn_download_task(
         return DownloadResult::Cancelled;
     }
 
+    // Java reference: RemoteLogDownloader.java increments `remoteFetchRequestCount`
+    // immediately before initiating the download. Each retry of the same segment
+    // counts as a separate request (matches Java behavior).
+    metrics::counter!(SCANNER_REMOTE_FETCH_REQUESTS_TOTAL).increment(1);
+
     // Try download ONCE
     let download_result = fetcher.fetch(&request).await;
 
     match download_result {
         Ok(fetch_result) => {
             // Success - permit will be released on drop (FileSource handles file deletion)
+            metrics::counter!(SCANNER_REMOTE_FETCH_BYTES_TOTAL)
+                .increment(fetch_result.file_size as u64);
             DownloadResult::Success {
                 result: RemoteLogFile {
                     file_path: fetch_result.file_path,
@@ -516,6 +527,8 @@ async fn spawn_download_task(
         }
         Err(e) => {
             // Download failed - check if we should retry or give up
+            // Counted per attempt, so retries each contribute one error.
+            metrics::counter!(SCANNER_REMOTE_FETCH_ERRORS_TOTAL).increment(1);
             let retry_count = request.retry_count + 1;
 
             if retry_count > MAX_RETRY_COUNT {
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index a4164b9976..0167af02e2 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -27,6 +27,9 @@ use crate::config::Config;
 use crate::error::Error::UnsupportedOperation;
 use crate::error::{ApiError, Error, FlussError, Result};
 use crate::metadata::{LogFormat, PhysicalTablePath, RowType, TableBucket, TableInfo, TablePath};
+use crate::metrics::{
+    SCANNER_BYTES_PER_REQUEST, SCANNER_FETCH_LATENCY_MS, SCANNER_FETCH_REQUESTS_TOTAL,
+};
 use crate::proto::{
     ErrorResponse, FetchLogRequest, FetchLogResponse, PbFetchLogReqForBucket, PbFetchLogReqForTable,
 };
@@ -39,6 +42,7 @@ use crate::{PartitionId, TableId};
 use arrow_schema::SchemaRef;
 use log::{debug, warn};
 use parking_lot::{Mutex, RwLock};
+use prost::Message;
 use std::{
     collections::{HashMap, HashSet},
     slice::from_ref,
@@ -779,6 +783,9 @@ struct FetchResponseContext {
     read_context: ReadContext,
     remote_read_context: ReadContext,
     remote_log_downloader: Arc<RemoteLogDownloader>,
+    /// `Instant` captured immediately before the FetchLog RPC; used to compute
+    /// `scanner.fetch_latency_ms` on a successful response.
+    request_start_time: Instant,
 }
 
 impl LogFetcher {
@@ -1021,14 +1028,6 @@ impl LogFetcher {
             let remote_log_downloader = Arc::clone(&self.remote_log_downloader);
             let nodes_with_pending = self.nodes_with_pending_fetch_requests.clone();
             let metadata = self.metadata.clone();
-            let response_context = FetchResponseContext {
-                metadata: metadata.clone(),
-                log_fetch_buffer,
-                log_scanner_status,
-                read_context,
-                remote_read_context,
-                remote_log_downloader,
-            };
             // Spawn async task to handle the fetch request
             // Note: These tasks are not explicitly tracked or cancelled when LogFetcher is dropped.
             // This is acceptable because:
@@ -1060,6 +1059,11 @@ impl LogFetcher {
                     }
                 };
 
+                // Java increments the fetch counter and captures `requestStartTime` immediately
+                // before the RPC. Failed connection acquisition above is not counted.
+                let request_start_time = Instant::now();
+                metrics::counter!(SCANNER_FETCH_REQUESTS_TOTAL).increment(1);
+
                 let fetch_response = match con
                     .request(message::FetchLogRequest::new(fetch_request.clone()))
                     .await
@@ -1074,6 +1078,18 @@ impl LogFetcher {
                     }
                 };
 
+                // Build the context after the RPC so `request_start_time` measures only RPC wall-clock
+                // time, not tablet-server lookup or connection acquisition, matching Java's behaviour.
+                // Building it here also skips the allocation on the early-return error paths above.
+                let response_context = FetchResponseContext {
+                    metadata: metadata.clone(),
+                    log_fetch_buffer,
+                    log_scanner_status,
+                    read_context,
+                    remote_read_context,
+                    remote_log_downloader,
+                    request_start_time,
+                };
                 Self::handle_fetch_response(fetch_response, response_context).await;
             });
         }
@@ -1102,8 +1118,17 @@ impl LogFetcher {
             read_context,
             remote_read_context,
             remote_log_downloader,
+            request_start_time,
         } = context;
 
+        // `encoded_len()` mirrors Java's `fetchLogResponse.totalSize()`:
+        // both report the serialized API message body size, excluding protocol
+        // headers and framing. Recorded unconditionally (including zero-record
+        // responses) to match Java's histogram semantics.
+        metrics::histogram!(SCANNER_FETCH_LATENCY_MS)
+            .record(request_start_time.elapsed().as_secs_f64() * 1000.0);
+        metrics::histogram!(SCANNER_BYTES_PER_REQUEST).record(fetch_response.encoded_len() as f64);
+
         for pb_fetch_log_resp in fetch_response.tables_resp {
             let table_id = pb_fetch_log_resp.table_id;
             let fetch_log_for_buckets = pb_fetch_log_resp.buckets_resp;
@@ -2029,6 +2054,7 @@ mod tests {
             read_context: fetcher.read_context.clone(),
             remote_read_context: fetcher.remote_read_context.clone(),
             remote_log_downloader: fetcher.remote_log_downloader.clone(),
+            request_start_time: Instant::now(),
         };
 
         LogFetcher::handle_fetch_response(response, response_context).await;
@@ -2082,6 +2108,7 @@ mod tests {
             read_context: fetcher.read_context.clone(),
             remote_read_context: fetcher.remote_read_context.clone(),
             remote_log_downloader: fetcher.remote_log_downloader.clone(),
+            request_start_time: Instant::now(),
         };
 
         LogFetcher::handle_fetch_response(response, response_context).await;
@@ -2204,4 +2231,110 @@ mod tests {
         }
         Ok(())
     }
+
+    /// Drives `handle_fetch_response` against a local metrics recorder and
+    /// asserts that latency + bytes-per-request histograms are emitted with
+    /// values that mirror what Java would record. This complements the unit
+    /// tests in `metrics.rs` (which only verify the facade) by exercising
+    /// the actual instrumented call path.
+    ///
+    /// Note: uses a `current_thread` runtime inside `with_local_recorder`
+    /// (rather than `#[tokio::test]`) because the metrics facade installs a
+    /// thread-local recorder; running the async work on the same thread is
+    /// the only way to observe the emitted metrics in the snapshot. Both
+    /// the fetcher construction and the `handle_fetch_response` call run
+    /// inside the runtime (the security-token manager and remote-log
+    /// downloader require a Tokio reactor).
+    #[test]
+    fn handle_fetch_response_emits_latency_and_bytes_metrics() {
+        use crate::metrics::{SCANNER_BYTES_PER_REQUEST, SCANNER_FETCH_LATENCY_MS};
+        use metrics_util::debugging::{DebugValue, DebuggingRecorder};
+
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        let expected_bytes = metrics::with_local_recorder(&recorder, || {
+            let rt = tokio::runtime::Builder::new_current_thread()
+                .enable_all()
+                .build()
+                .expect("build current_thread runtime");
+
+            rt.block_on(async {
+                let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+                let table_info = build_table_info(table_path.clone(), 1, 1);
+                let cluster = build_cluster_arc(&table_path, 1, 1);
+                let metadata = Arc::new(Metadata::new_for_test(cluster));
+                let status = Arc::new(LogScannerStatus::new());
+                status.assign_scan_bucket(TableBucket::new(1, 0), 5);
+                let fetcher = LogFetcher::new(
+                    table_info,
+                    Arc::new(RpcClient::new()),
+                    metadata.clone(),
+                    status,
+                    &Config::default(),
+                    None,
+                )
+                .expect("build LogFetcher");
+
+                let response = FetchLogResponse {
+                    tables_resp: vec![PbFetchLogRespForTable {
+                        table_id: 1,
+                        buckets_resp: vec![PbFetchLogRespForBucket {
+                            partition_id: None,
+                            bucket_id: 0,
+                            error_code: Some(FlussError::None.code()),
+                            error_message: None,
+                            high_watermark: Some(7),
+                            log_start_offset: Some(0),
+                            remote_log_fetch_info: None,
+                            records: None,
+                        }],
+                    }],
+                };
+                let expected_bytes = response.encoded_len() as f64;
+                let response_context = FetchResponseContext {
+                    metadata: metadata.clone(),
+                    log_fetch_buffer: fetcher.log_fetch_buffer.clone(),
+                    log_scanner_status: fetcher.log_scanner_status.clone(),
+                    read_context: fetcher.read_context.clone(),
+                    remote_read_context: fetcher.remote_read_context.clone(),
+                    remote_log_downloader: fetcher.remote_log_downloader.clone(),
+                    request_start_time: Instant::now(),
+                };
+
+                LogFetcher::handle_fetch_response(response, response_context).await;
+                expected_bytes
+            })
+        });
+
+        let entries: Vec<_> = snapshotter.snapshot().into_vec();
+        let find_histogram = |name: &str| -> Vec<f64> {
+            entries
+                .iter()
+                .find_map(|(key, _, _, val)| {
+                    if key.key().name() == name {
+                        if let DebugValue::Histogram(v) = val {
+                            return Some(v.iter().map(|f| f.into_inner()).collect());
+                        }
+                    }
+                    None
+                })
+                .unwrap_or_default()
+        };
+
+        let latency_samples = find_histogram(SCANNER_FETCH_LATENCY_MS);
+        assert_eq!(latency_samples.len(), 1, "expected one latency sample");
+        assert!(
+            latency_samples[0] >= 0.0,
+            "latency must be non-negative, got {}",
+            latency_samples[0]
+        );
+
+        let bytes_samples = find_histogram(SCANNER_BYTES_PER_REQUEST);
+        assert_eq!(
+            bytes_samples,
+            vec![expected_bytes],
+            "bytes histogram must record encoded_len() for parity with Java fetchLogResponse.totalSize()",
+        );
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/metrics.rs b/fluss-rust/crates/fluss/src/metrics.rs
index 756e2db561..a533abd535 100644
--- a/fluss-rust/crates/fluss/src/metrics.rs
+++ b/fluss-rust/crates/fluss/src/metrics.rs
@@ -49,6 +49,43 @@ pub const CLIENT_BYTES_RECEIVED_TOTAL: &str = "fluss.client.bytes_received.total
 pub const CLIENT_REQUEST_LATENCY_MS: &str = "fluss.client.request_latency_ms";
 pub const CLIENT_REQUESTS_IN_FLIGHT: &str = "fluss.client.requests_in_flight";
 
+// ---------------------------------------------------------------------------
+// Scanner fetch + remote download metrics
+//
+// The fetch request counter is incremented just before the FetchLog RPC; the
+// latency and bytes histograms are recorded when the response is handled.
+// Remote metrics are recorded inside RemoteLogDownloader's download task.
+//
+// Java uses a volatile-long gauge for fetch latency and Counter+MeterView
+// for rates. Rust uses a histogram for latency (richer percentile data)
+// and counters for throughput; the recorder/exporter handles rate
+// computation (e.g. Prometheus `rate()`).
+//
+// Java emits one `ScannerMetricGroup` per (database, table). Rust currently
+// emits without per-table labels — adding `database`/`table` labels is
+// tracked separately and intentionally deferred to keep this PR minimal.
+// ---------------------------------------------------------------------------
+
+/// Histogram: elapsed ms for each successful FetchLog RPC.
+pub const SCANNER_FETCH_LATENCY_MS: &str = "fluss.client.scanner.fetch_latency_ms";
+
+/// Counter: total FetchLog RPC requests attempted after connection acquisition.
+pub const SCANNER_FETCH_REQUESTS_TOTAL: &str = "fluss.client.scanner.fetch_requests.total";
+
+/// Histogram: serialized bytes per successful FetchLog response.
+pub const SCANNER_BYTES_PER_REQUEST: &str = "fluss.client.scanner.bytes_per_request";
+
+/// Counter: total remote log download attempts (includes per-segment retries).
+pub const SCANNER_REMOTE_FETCH_REQUESTS_TOTAL: &str =
+    "fluss.client.scanner.remote_fetch_requests.total";
+
+/// Counter: total bytes downloaded from remote log storage.
+pub const SCANNER_REMOTE_FETCH_BYTES_TOTAL: &str = "fluss.client.scanner.remote_fetch_bytes.total";
+
+/// Counter: total remote log download failures (each retry attempt counts).
+pub const SCANNER_REMOTE_FETCH_ERRORS_TOTAL: &str =
+    "fluss.client.scanner.remote_fetch_errors.total";
+
 /// Returns a label value for reportable API keys, matching Java's
 /// `ConnectionMetrics.REPORT_API_KEYS` filter (`ProduceLog`, `FetchLog`,
 /// `PutKv`, `Lookup`). Returns `None` for admin/metadata/auth calls to
@@ -267,4 +304,60 @@ mod tests {
         assert_eq!(counter_by_api_key.get("produce_log"), Some(&5));
         assert_eq!(counter_by_api_key.get("fetch_log"), Some(&3));
     }
+
+    #[test]
+    fn scanner_fetch_metrics_emit_correctly() {
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            metrics::counter!(SCANNER_FETCH_REQUESTS_TOTAL).increment(1);
+            metrics::histogram!(SCANNER_FETCH_LATENCY_MS).record(15.5);
+            metrics::histogram!(SCANNER_BYTES_PER_REQUEST).record(4096.0);
+        });
+
+        let snapshot = snapshotter.snapshot();
+        let entries: Vec<_> = snapshot.into_vec();
+
+        assert_eq!(
+            find_counter!(entries, SCANNER_FETCH_REQUESTS_TOTAL),
+            Some(1)
+        );
+        assert_eq!(
+            find_histogram!(entries, SCANNER_FETCH_LATENCY_MS),
+            Some(vec![15.5])
+        );
+        assert_eq!(
+            find_histogram!(entries, SCANNER_BYTES_PER_REQUEST),
+            Some(vec![4096.0])
+        );
+    }
+
+    #[test]
+    fn scanner_remote_fetch_metrics_emit_correctly() {
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            metrics::counter!(SCANNER_REMOTE_FETCH_REQUESTS_TOTAL).increment(3);
+            metrics::counter!(SCANNER_REMOTE_FETCH_BYTES_TOTAL).increment(1024);
+            metrics::counter!(SCANNER_REMOTE_FETCH_ERRORS_TOTAL).increment(1);
+        });
+
+        let snapshot = snapshotter.snapshot();
+        let entries: Vec<_> = snapshot.into_vec();
+
+        assert_eq!(
+            find_counter!(entries, SCANNER_REMOTE_FETCH_REQUESTS_TOTAL),
+            Some(3)
+        );
+        assert_eq!(
+            find_counter!(entries, SCANNER_REMOTE_FETCH_BYTES_TOTAL),
+            Some(1024)
+        );
+        assert_eq!(
+            find_counter!(entries, SCANNER_REMOTE_FETCH_ERRORS_TOTAL),
+            Some(1)
+        );
+    }
 }

From 29ea5cedbfac43c8b9baa64cb134d11a7bd4516c Mon Sep 17 00:00:00 2001
From: Jared Yu <qzyu999@gmail.com>
Date: Mon, 18 May 2026 20:02:55 -0700
Subject: [PATCH 273/287] docs: add documentation for MAP dtype (#556)

---
 .../docs/user-guide/rust/api-reference.md     | 14 +++++++++++
 .../docs/user-guide/rust/data-types.md        | 23 +++++++++++++++++++
 2 files changed, 37 insertions(+)

diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 5d3068b5a2..7ef34ef3ac 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -466,6 +466,7 @@ Implements the `InternalRow` trait (see below).
 | `fn get_binary(&self, idx: usize, length: usize) -> Result<&[u8]>`                     | Get fixed-length binary value           |
 | `fn get_char(&self, idx: usize, length: usize) -> Result<&str>`                        | Get fixed-length char value             |
 | `fn get_array(&self, idx: usize) -> Result<FlussArray>`                                | Get array value                         |
+| `fn get_map(&self, idx: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap>` | Get map value                           |
 
 ## `FlussArray`
 
@@ -479,6 +480,19 @@ Implements the `InternalRow` trait (see below).
 
 Element getters mirror `InternalRow` typed getters and return `Result<T>`. For example, use `get_int()`, `get_long()`, and `get_double()` for primitive elements, and `get_string()`, `get_binary()`, `get_decimal()`, `get_timestamp_ntz()`, `get_timestamp_ltz()`, and `get_array()` for variable-length or nested elements.
 
+## `FlussMap`
+
+`FlussMap` is the Rust row representation for `MAP` values. You usually obtain it from `InternalRow::get_map()`.
+
+| Method | Description |
+|--------|-------------|
+| `fn size(&self) -> usize` | Number of entries in the map |
+| `fn as_bytes(&self) -> &[u8]` | Get encoded bytes of the map |
+| `fn key_array(&self) -> &FlussArray` | Get the key array |
+| `fn value_array(&self) -> &FlussArray` | Get the value array |
+
+Key and value arrays are returned as `&FlussArray`, allowing you to read entries by retrieving keys and values at the same index positions.
+
 ## `ChangeType`
 
 | Value                      | Short String  | Description                      |
diff --git a/fluss-rust/website/docs/user-guide/rust/data-types.md b/fluss-rust/website/docs/user-guide/rust/data-types.md
index 63b7fa6239..ad14028bd7 100644
--- a/fluss-rust/website/docs/user-guide/rust/data-types.md
+++ b/fluss-rust/website/docs/user-guide/rust/data-types.md
@@ -22,6 +22,7 @@ sidebar_position: 3
 | `BYTES`         | `&[u8]`        | `get_bytes()`                        | `set_field(idx, &[u8])`        |
 | `BINARY(n)`     | `&[u8]`        | `get_binary(idx, length)`            | `set_field(idx, &[u8])`        |
 | `ARRAY<T>`      | `FlussArray`   | `get_array()`                        | `set_field(idx, FlussArray)`   |
+| `MAP<K, V>`     | `FlussMap`     | `get_map(idx, key_type, value_type)` | `set_field(idx, FlussMap)`     |
 
 ## Constructing Special Types
 
@@ -83,6 +84,28 @@ row.set_field(0, Datum::Array(arr));
 
 `ARRAY` is supported for row values and nested row fields. For key encoding, Rust follows Java parity: `ARRAY` can be encoded by the compacted key encoder, while table-level key constraints are validated by the server (which may reject unsupported key types).
 
+## Maps
+
+Use `DataTypes::map(key_type, value_type)` in schema definitions. At runtime, read maps with `row.get_map(idx, &key_type, &value_type)?`.
+
+To construct map values for writes, build a `FlussMap` using `FlussMapWriter` and wrap it with `Datum::Map`:
+
+```rust
+use fluss::metadata::DataTypes;
+use fluss::row::binary_map::FlussMapWriter;
+use fluss::row::{Datum, GenericRow};
+
+let mut writer = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::int());
+writer.write_entry("key1".into(), 100.into())?;
+writer.write_entry("key2".into(), Datum::Null)?;
+let map = writer.complete()?;
+
+let mut row = GenericRow::new(1);
+row.set_field(0, Datum::Map(map));
+```
+
+`MAP` keys cannot be null. `MAP` is supported for row values and nested row fields. Like arrays, `MAP` follows Java parity for key encoding and can be encoded by the compacted key encoder, while table-level key constraints are validated by the server.
+
 ## Reading Row Data
 
 ```rust

From 32ae530ce2db721a72c79ce9cec3c55b356c7dcc Mon Sep 17 00:00:00 2001
From: Anton Borisov <anton.borisov@fresha.com>
Date: Sat, 23 May 2026 20:27:09 +0100
Subject: [PATCH 274/287] [chore] improve ergonomics for MAP dt, docs additions

---
 fluss-rust/bindings/cpp/src/types.rs          |   4 +-
 .../crates/fluss/src/row/binary_array.rs      |  11 +-
 fluss-rust/crates/fluss/src/row/binary_map.rs | 153 +++++++++++++++++-
 fluss-rust/crates/fluss/src/row/column.rs     |  42 ++---
 .../crates/fluss/src/row/column_writer.rs     | 102 ++++++++----
 .../fluss/src/row/compacted/compacted_row.rs  |  20 +--
 fluss-rust/crates/fluss/src/row/datum.rs      |  11 +-
 .../crates/fluss/src/row/field_getter.rs      |   6 +-
 fluss-rust/crates/fluss/src/row/lookup_row.rs |   5 +-
 fluss-rust/crates/fluss/src/row/mod.rs        |  12 +-
 .../crates/fluss/src/row/projected_row.rs     |   5 +-
 .../fluss/tests/integration/log_table.rs      |  14 +-
 .../docs/user-guide/rust/api-reference.md     |  23 ++-
 .../docs/user-guide/rust/data-types.md        |  60 ++++++-
 14 files changed, 349 insertions(+), 119 deletions(-)

diff --git a/fluss-rust/bindings/cpp/src/types.rs b/fluss-rust/bindings/cpp/src/types.rs
index 9ef8fe72c4..23ac636d4c 100644
--- a/fluss-rust/bindings/cpp/src/types.rs
+++ b/fluss-rust/bindings/cpp/src/types.rs
@@ -589,9 +589,7 @@ pub fn compacted_row_to_owned(
                 Datum::Blob(Cow::Owned(row.get_binary(i, dt.length())?.to_vec()))
             }
             fcore::metadata::DataType::Array(_) => Datum::Array(row.get_array(i)?),
-            fcore::metadata::DataType::Map(mt) => {
-                Datum::Map(row.get_map(i, mt.key_type(), mt.value_type())?)
-            }
+            fcore::metadata::DataType::Map(_) => Datum::Map(row.get_map(i)?),
             other => return Err(anyhow!("Unsupported data type for column {i}: {other:?}")),
         };
 
diff --git a/fluss-rust/crates/fluss/src/row/binary_array.rs b/fluss-rust/crates/fluss/src/row/binary_array.rs
index d4fab7620b..b987cec8b7 100644
--- a/fluss-rust/crates/fluss/src/row/binary_array.rs
+++ b/fluss-rust/crates/fluss/src/row/binary_array.rs
@@ -832,8 +832,15 @@ impl InternalRow for FlussArray {
         self.get_array(pos)
     }
 
-    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
-        self.get_map(pos, key_type, value_type)
+    fn get_map(&self, pos: usize) -> Result<FlussMap> {
+        // FlussArray carries no schema; nested map reads must go through the
+        // inherent FlussArray::get_map(pos, key_type, value_type).
+        Err(IllegalArgument {
+            message: format!(
+                "InternalRow::get_map is not supported on FlussArray (pos {pos}); \
+                 use FlussArray::get_map(pos, key_type, value_type) directly"
+            ),
+        })
     }
 }
 
diff --git a/fluss-rust/crates/fluss/src/row/binary_map.rs b/fluss-rust/crates/fluss/src/row/binary_map.rs
index 46e82899ab..57201b84b5 100644
--- a/fluss-rust/crates/fluss/src/row/binary_map.rs
+++ b/fluss-rust/crates/fluss/src/row/binary_map.rs
@@ -26,7 +26,7 @@ use crate::error::Error::IllegalArgument;
 use crate::error::Result;
 use crate::metadata::DataType;
 use crate::row::binary_array::{FlussArray, FlussArrayWriter};
-use crate::row::datum::Datum;
+use crate::row::datum::{Datum, read_datum_from_fluss_array};
 use bytes::Bytes;
 use serde::Serialize;
 use std::fmt;
@@ -41,6 +41,8 @@ pub struct FlussMap {
     data: Bytes,
     key_array: FlussArray,
     value_array: FlussArray,
+    key_type: DataType,
+    value_type: DataType,
 }
 
 impl fmt::Debug for FlussMap {
@@ -190,6 +192,8 @@ impl FlussMap {
             data: Bytes::copy_from_slice(data),
             key_array,
             value_array,
+            key_type: key_type.clone(),
+            value_type: value_type.clone(),
         })
     }
 
@@ -204,13 +208,20 @@ impl FlussMap {
             data,
             key_array,
             value_array,
+            key_type: key_type.clone(),
+            value_type: value_type.clone(),
         })
     }
 
     /// Creates a FlussMap by combining a key array and a value array.
     ///
     /// Copies both arrays into a new contiguous buffer.
-    pub fn from_arrays(key_array: &FlussArray, value_array: &FlussArray) -> Result<Self> {
+    pub fn from_arrays(
+        key_array: &FlussArray,
+        value_array: &FlussArray,
+        key_type: &DataType,
+        value_type: &DataType,
+    ) -> Result<Self> {
         if key_array.size() != value_array.size() {
             return Err(IllegalArgument {
                 message: format!(
@@ -239,6 +250,8 @@ impl FlussMap {
             data,
             key_array: key_array.clone(),
             value_array: value_array.clone(),
+            key_type: key_type.clone(),
+            value_type: value_type.clone(),
         })
     }
 
@@ -261,8 +274,61 @@ impl FlussMap {
     pub fn value_array(&self) -> &FlussArray {
         &self.value_array
     }
+
+    pub fn key_type(&self) -> &DataType {
+        &self.key_type
+    }
+
+    pub fn value_type(&self) -> &DataType {
+        &self.value_type
+    }
+
+    pub fn entries(&self) -> Entries<'_> {
+        Entries {
+            map: self,
+            index: 0,
+        }
+    }
+
+    /// Looks up `key` by scanning the entries in order: O(n), because the binary
+    /// format carries no key index. Returns the first matching value, or the
+    /// first decode error met before a match.
+    pub fn get<'a>(&'a self, key: &Datum<'_>) -> Result<Option<Datum<'a>>> {
+        self.entries()
+            // Stop at the first entry that either fails to decode or has an equal key.
+            .find(|pair| pair.as_ref().map_or(true, |(candidate, _)| candidate == key))
+            .map(|pair| pair.map(|(_, value)| value))
+            .transpose()
+    }
+}
+
+pub struct Entries<'a> {
+    map: &'a FlussMap,
+    index: usize,
 }
 
+impl<'a> Iterator for Entries<'a> {
+    type Item = Result<(Datum<'a>, Datum<'a>)>;
+
+    fn next(&mut self) -> Option<Self::Item> {
+        let (map, pos) = (self.map, self.index);
+        if pos >= map.size() {
+            return None;
+        }
+        self.index = pos + 1;
+        let key = read_datum_from_fluss_array(&map.key_array, pos, &map.key_type);
+        let value = read_datum_from_fluss_array(&map.value_array, pos, &map.value_type);
+        Some(key.and_then(|k| Ok((k, value?))))
+    }
+
+    fn size_hint(&self) -> (usize, Option<usize>) {
+        let left = self.map.size() - self.index;
+        (left, Some(left))
+    }
+}
+
+impl ExactSizeIterator for Entries<'_> {}
+
 /// Writer for building a `FlussMap` entry by entry.
 pub struct FlussMapWriter {
     key_writer: FlussArrayWriter,
@@ -284,6 +350,18 @@ impl FlussMapWriter {
         }
     }
 
+    pub fn extend<'a, I, K, V>(&mut self, entries: I) -> Result<()>
+    where
+        I: IntoIterator<Item = (K, V)>,
+        K: Into<Datum<'a>>,
+        V: Into<Datum<'a>>,
+    {
+        for (k, v) in entries {
+            self.write_entry(k.into(), v.into())?;
+        }
+        Ok(())
+    }
+
     /// Writes a key-value entry into the map.
     ///
     /// # Errors
@@ -315,7 +393,7 @@ impl FlussMapWriter {
     pub fn complete(self) -> Result<FlussMap> {
         let key_array = self.key_writer.complete()?;
         let value_array = self.value_writer.complete()?;
-        FlussMap::from_arrays(&key_array, &value_array)
+        FlussMap::from_arrays(&key_array, &value_array, &self.key_type, &self.value_type)
     }
 
     fn write_datum(
@@ -480,7 +558,13 @@ mod tests {
         let value_writer = FlussArrayWriter::new(2, &DataTypes::string());
         let value_array = value_writer.complete().unwrap();
 
-        let err = FlussMap::from_arrays(&key_array, &value_array).unwrap_err();
+        let err = FlussMap::from_arrays(
+            &key_array,
+            &value_array,
+            &DataTypes::int(),
+            &DataTypes::string(),
+        )
+        .unwrap_err();
         assert!(err.to_string().contains("does not match value array size"));
     }
 
@@ -520,7 +604,13 @@ mod tests {
         value_writer.write_int(0, 100);
         let value_array = value_writer.complete().unwrap();
 
-        let map = FlussMap::from_arrays(&key_array, &value_array).unwrap();
+        let map = FlussMap::from_arrays(
+            &key_array,
+            &value_array,
+            &DataTypes::int(),
+            &DataTypes::int(),
+        )
+        .unwrap();
         let bytes = map.as_bytes();
 
         // Valid bytes should pass
@@ -545,7 +635,13 @@ mod tests {
         value_writer.write_int(0, 100);
         let value_array = value_writer.complete().unwrap();
 
-        let err = FlussMap::from_arrays(&key_array, &value_array).unwrap_err();
+        let err = FlussMap::from_arrays(
+            &key_array,
+            &value_array,
+            &DataTypes::int(),
+            &DataTypes::int(),
+        )
+        .unwrap_err();
         assert!(err.to_string().contains("keys cannot be null"));
 
         let key_bytes = key_array.as_bytes();
@@ -558,4 +654,49 @@ mod tests {
         let err = FlussMap::from_bytes(&data, &DataTypes::int(), &DataTypes::int()).unwrap_err();
         assert!(err.to_string().contains("keys cannot be null"));
     }
+
+    #[test]
+    fn entries_yields_typed_pairs_including_nulls() {
+        let mut writer = FlussMapWriter::new(3, &DataTypes::string(), &DataTypes::int());
+        writer.write_entry("a".into(), 1.into()).unwrap();
+        writer.write_entry("b".into(), Datum::Null).unwrap();
+        writer.write_entry("c".into(), 3.into()).unwrap();
+        let map = writer.complete().unwrap();
+
+        let collected: Vec<(Datum, Datum)> = map
+            .entries()
+            .collect::<Result<Vec<_>>>()
+            .expect("entries should decode cleanly");
+
+        assert_eq!(collected.len(), 3);
+        assert_eq!(collected[0], (Datum::from("a"), Datum::from(1i32)));
+        assert_eq!(collected[1].0, Datum::from("b"));
+        assert_eq!(collected[1].1, Datum::Null);
+        assert_eq!(collected[2], (Datum::from("c"), Datum::from(3i32)));
+    }
+
+    #[test]
+    fn get_finds_present_key_and_returns_none_for_absent() {
+        let mut writer = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::int());
+        writer.write_entry("a".into(), 10.into()).unwrap();
+        writer.write_entry("b".into(), 20.into()).unwrap();
+        let map = writer.complete().unwrap();
+
+        let v = map.get(&Datum::from("b")).unwrap();
+        assert_eq!(v, Some(Datum::from(20i32)));
+
+        let missing = map.get(&Datum::from("z")).unwrap();
+        assert!(missing.is_none());
+    }
+
+    #[test]
+    fn writer_extend_from_iterator_round_trips() {
+        let src: Vec<(&str, i32)> = vec![("a", 1), ("b", 2), ("c", 3)];
+        let mut writer = FlussMapWriter::new(src.len(), &DataTypes::string(), &DataTypes::int());
+        writer.extend(src).unwrap();
+        let map = writer.complete().unwrap();
+
+        assert_eq!(map.size(), 3);
+        assert_eq!(map.get(&Datum::from("b")).unwrap(), Some(Datum::from(2i32)));
+    }
 }
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index 8b23423bbf..f4da6b3fe4 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -690,7 +690,17 @@ impl InternalRow for ColumnarRow {
         writer.complete()
     }
 
-    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
+    fn get_map(&self, pos: usize) -> Result<FlussMap> {
+        // `get` instead of indexing: an out-of-range `pos` becomes an `Err` (got None), not a panic.
+        let map_type = match self.row_type.fields().get(pos).map(|f| f.data_type()) {
+            Some(DataType::Map(m)) => m,
+            other => {
+                return Err(IllegalArgument {
+                    message: format!("expected Map type at position {pos}, got {other:?}"),
+                });
+            }
+        };
+
         let column = self.column(pos)?;
         let map_arr =
             column
@@ -703,7 +713,11 @@ impl InternalRow for ColumnarRow {
                     ),
                 })?;
 
-        arrow_map_entry_to_fluss_map(&map_arr.value(self.row_id), key_type, value_type)
+        arrow_map_entry_to_fluss_map(
+            &map_arr.value(self.row_id),
+            map_type.key_type(),
+            map_type.value_type(),
+        )
     }
 
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
@@ -799,7 +813,7 @@ fn arrow_map_entry_to_fluss_map(
     write_arrow_values_to_fluss_array(&**values_arrow, value_type, &mut value_writer)?;
     let value_array = value_writer.complete()?;
 
-    FlussMap::from_arrays(&key_array, &value_array)
+    FlussMap::from_arrays(&key_array, &value_array, key_type, value_type)
 }
 
 /// Downcast to a primitive Arrow array type, then loop with null checks calling a writer method.
@@ -1560,16 +1574,12 @@ mod tests {
             Arc::new(RecordBatch::try_new(schema, vec![Arc::new(map_arr)]).expect("record batch"));
 
         let map_type = DataTypes::map(DataTypes::int(), DataTypes::string());
-        let row_type = Arc::new(RowType::with_data_types(vec![map_type.clone()]));
+        let row_type = Arc::new(RowType::with_data_types(vec![map_type]));
         let row = ColumnarRow::new(batch, row_type, 0, None);
 
-        let (k, v) = match &map_type {
-            crate::metadata::DataType::Map(m) => (m.key_type(), m.value_type()),
-            _ => unreachable!(),
-        };
         let fluss_map = row
-            .get_map(0, k, v)
-            .expect("get_map should accept non-nullable key from MapType");
+            .get_map(0)
+            .expect("get_map should succeed on ColumnarRow");
         assert_eq!(fluss_map.size(), 1);
         assert_eq!(fluss_map.key_array().get_int(0).unwrap(), 1);
         assert_eq!(fluss_map.value_array().get_string(0).unwrap(), "a");
@@ -1628,9 +1638,7 @@ mod tests {
             .get_row(0)
             .expect("reading row with Map field must succeed");
         assert_eq!(nested.get_int(0).unwrap(), 10);
-        let inner_map = nested
-            .get_map(1, &DataTypes::string(), &DataTypes::int())
-            .expect("nested map should be accessible");
+        let inner_map = nested.get_map(1).expect("nested map should be accessible");
         assert_eq!(inner_map.size(), 1);
         assert_eq!(inner_map.key_array().get_string(0).unwrap(), "k1");
         assert_eq!(inner_map.value_array().get_int(0).unwrap(), 42);
@@ -1639,9 +1647,7 @@ mod tests {
         row.set_row_id(1);
         let nested = row.get_row(0).expect("row 1 must read");
         assert_eq!(nested.get_int(0).unwrap(), 20);
-        let inner_map = nested
-            .get_map(1, &DataTypes::string(), &DataTypes::int())
-            .unwrap();
+        let inner_map = nested.get_map(1).unwrap();
         assert_eq!(inner_map.key_array().get_string(0).unwrap(), "k2");
         assert_eq!(inner_map.value_array().get_int(0).unwrap(), 7);
     }
@@ -1726,9 +1732,7 @@ mod tests {
         )]));
         let row = ColumnarRow::new(batch, row_type, 0, None);
 
-        let err = row
-            .get_map(0, &DataTypes::string(), &DataTypes::string())
-            .expect_err("type mismatch must error");
+        let err = row.get_map(0).expect_err("type mismatch must error");
         let msg = err.to_string();
         assert!(
             msg.contains("does not match expected Fluss type"),
diff --git a/fluss-rust/crates/fluss/src/row/column_writer.rs b/fluss-rust/crates/fluss/src/row/column_writer.rs
index bbd2876733..94777faf3c 100644
--- a/fluss-rust/crates/fluss/src/row/column_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/column_writer.rs
@@ -22,6 +22,7 @@
 use crate::error::Error::RowConvertError;
 use crate::error::{Error, Result};
 use crate::metadata::{DataType, RowType};
+use crate::row::FlussMap;
 use crate::row::InternalRow;
 use crate::row::datum::{
     MICROS_PER_MILLI, MILLIS_PER_SECOND, NANOS_PER_MILLI, append_decimal_to_builder,
@@ -833,30 +834,52 @@ impl ColumnWriter {
             } => {
                 let array = row.get_array(pos)?;
                 let size = array.size();
-                if let TypedWriter::Struct {
-                    field_writers,
-                    validity: child_validity,
-                    row_type,
-                    ..
-                } = &mut element_writer.inner
-                {
-                    for i in 0..size {
-                        if array.is_null_at(i) {
-                            for child in field_writers.iter_mut() {
-                                child.append_null();
+                match &mut element_writer.inner {
+                    TypedWriter::Struct {
+                        field_writers,
+                        validity: child_validity,
+                        row_type,
+                        ..
+                    } => {
+                        for i in 0..size {
+                            if array.is_null_at(i) {
+                                for child in field_writers.iter_mut() {
+                                    child.append_null();
+                                }
+                                child_validity.push(false);
+                            } else {
+                                let nested = array.get_row(i, row_type)?;
+                                for (j, child) in field_writers.iter_mut().enumerate() {
+                                    child.write_field_at(&nested, j)?;
+                                }
+                                child_validity.push(true);
                             }
-                            child_validity.push(false);
-                        } else {
-                            let nested = array.get_row(i, row_type)?;
-                            for (j, child) in field_writers.iter_mut().enumerate() {
-                                child.write_field_at(&nested, j)?;
+                        }
+                    }
+                    TypedWriter::Map {
+                        key_writer,
+                        value_writer,
+                        key_type,
+                        value_type,
+                        offsets: child_offsets,
+                        validity: child_validity,
+                    } => {
+                        for i in 0..size {
+                            if array.is_null_at(i) {
+                                child_validity.push(false);
+                                let last = *child_offsets.last().unwrap();
+                                child_offsets.push(last);
+                            } else {
+                                let map = array.get_map(i, key_type, value_type)?;
+                                write_map_into(map, key_writer, value_writer, child_offsets)?;
+                                child_validity.push(true);
                             }
-                            child_validity.push(true);
                         }
                     }
-                } else {
-                    for i in 0..size {
-                        element_writer.write_field_at(&array, i)?;
+                    _ => {
+                        for i in 0..size {
+                            element_writer.write_field_at(&array, i)?;
+                        }
                     }
                 }
                 let last = *offsets.last().unwrap();
@@ -871,24 +894,12 @@ impl ColumnWriter {
             TypedWriter::Map {
                 key_writer,
                 value_writer,
-                key_type,
-                value_type,
                 offsets,
                 validity,
+                ..
             } => {
-                let map = row.get_map(pos, key_type, value_type)?;
-                let key_array = map.key_array();
-                let value_array = map.value_array();
-                for i in 0..map.size() {
-                    key_writer.write_field_at(key_array, i)?;
-                    value_writer.write_field_at(value_array, i)?;
-                }
-                let last = *offsets.last().unwrap();
-                offsets.push(
-                    last + i32::try_from(map.size()).map_err(|_| RowConvertError {
-                        message: format!("Map size {} exceeds i32 range", map.size()),
-                    })?,
-                );
+                let map = row.get_map(pos)?;
+                write_map_into(map, key_writer, value_writer, offsets)?;
                 validity.push(true);
                 Ok(())
             }
@@ -908,6 +919,27 @@ impl ColumnWriter {
     }
 }
 
+/// Copies each entry of `map` into the child writers, then pushes the map's end offset.
+/// NOTE(review): a MAP-typed value appears to hit `FlussArray`'s erroring trait `get_map`; verify.
+fn write_map_into(
+    map: FlussMap,
+    key_writer: &mut ColumnWriter,
+    value_writer: &mut ColumnWriter,
+    offsets: &mut Vec<i32>,
+) -> Result<()> {
+    let (keys, values) = (map.key_array(), map.value_array());
+    for idx in 0..map.size() {
+        key_writer.write_field_at(keys, idx)?;
+        value_writer.write_field_at(values, idx)?;
+    }
+    let previous_end = *offsets.last().unwrap();
+    let added = i32::try_from(map.size()).map_err(|_| RowConvertError {
+        message: format!("Map size {} exceeds i32 range", map.size()),
+    })?;
+    offsets.push(previous_end + added);
+    Ok(())
+}
+
 fn finish_struct_array(
     fields: arrow_schema::Fields,
     child_arrays: Vec<ArrayRef>,
diff --git a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
index 2463e47951..7f2b5c0429 100644
--- a/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
+++ b/fluss-rust/crates/fluss/src/row/compacted/compacted_row.rs
@@ -18,7 +18,7 @@
 use crate::client::WriteFormat;
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::{DataType, RowType};
+use crate::metadata::RowType;
 use crate::row::binary_array::FlussArray;
 use crate::row::binary_map::FlussMap;
 use crate::row::compacted::compacted_row_reader::{CompactedRowDeserializer, CompactedRowReader};
@@ -174,8 +174,8 @@ impl<'a> InternalRow for CompactedRow<'a> {
         self.decoded_row()?.get_array(pos)
     }
 
-    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
-        self.decoded_row()?.get_map(pos, key_type, value_type)
+    fn get_map(&self, pos: usize) -> Result<FlussMap> {
+        self.decoded_row()?.get_map(pos)
     }
 
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
@@ -508,9 +508,7 @@ mod tests {
         let bytes = writer.to_bytes();
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
-        let read_map = row
-            .get_map(0, &DataTypes::int(), &DataTypes::string())
-            .unwrap();
+        let read_map = row.get_map(0).unwrap();
         assert_eq!(read_map.size(), 2);
         assert_eq!(read_map.key_array().get_int(0).unwrap(), 1);
         assert_eq!(read_map.value_array().get_string(0).unwrap(), "a");
@@ -549,9 +547,7 @@ mod tests {
         let row2 = CompactedRow::from_bytes(&row_type, bytes2.as_ref());
         assert_eq!(row2.get_int(0).unwrap(), 99);
         assert!(!row2.is_null_at(1).unwrap());
-        let read_map = row2
-            .get_map(1, &DataTypes::int(), &DataTypes::string())
-            .unwrap();
+        let read_map = row2.get_map(1).unwrap();
         assert_eq!(read_map.size(), 1);
         assert_eq!(read_map.key_array().get_int(0).unwrap(), 7);
         assert_eq!(read_map.value_array().get_string(0).unwrap(), "hello");
@@ -593,7 +589,7 @@ mod tests {
         let bytes = writer.to_bytes();
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
-        let read_map = row.get_map(0, &DataTypes::string(), &array_type).unwrap();
+        let read_map = row.get_map(0).unwrap();
         assert_eq!(read_map.size(), 2);
         assert_eq!(read_map.key_array().get_string(0).unwrap(), "a");
         assert_eq!(read_map.key_array().get_string(1).unwrap(), "b");
@@ -622,9 +618,7 @@ mod tests {
         let bytes = writer.to_bytes();
         let row = CompactedRow::from_bytes(&row_type, bytes.as_ref());
 
-        let read_map = row
-            .get_map(0, &DataTypes::int(), &DataTypes::string())
-            .unwrap();
+        let read_map = row.get_map(0).unwrap();
         assert_eq!(read_map.size(), 0);
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/datum.rs b/fluss-rust/crates/fluss/src/row/datum.rs
index b1595b311e..e6a67394b1 100644
--- a/fluss-rust/crates/fluss/src/row/datum.rs
+++ b/fluss-rust/crates/fluss/src/row/datum.rs
@@ -681,7 +681,7 @@ fn append_fluss_map_to_map_builder(
     Ok(())
 }
 
-fn read_datum_from_fluss_array<'a>(
+pub(crate) fn read_datum_from_fluss_array<'a>(
     arr: &FlussArray,
     pos: usize,
     element_type: &crate::metadata::DataType,
@@ -693,6 +693,15 @@ fn read_datum_from_fluss_array<'a>(
         )?)));
     }
 
+    // FlussArray has no attached schema; use the typed inherent accessor.
+    if let DataType::Map(map_type) = element_type {
+        return Ok(Datum::Map(arr.get_map(
+            pos,
+            map_type.key_type(),
+            map_type.value_type(),
+        )?));
+    }
+
     let getter = FieldGetter::create(element_type, pos);
     Ok(getter.get_field(arr)?.into_owned())
 }
diff --git a/fluss-rust/crates/fluss/src/row/field_getter.rs b/fluss-rust/crates/fluss/src/row/field_getter.rs
index 41322f542b..3c2c7ce1ca 100644
--- a/fluss-rust/crates/fluss/src/row/field_getter.rs
+++ b/fluss-rust/crates/fluss/src/row/field_getter.rs
@@ -196,11 +196,7 @@ impl InnerFieldGetter {
                 Datum::TimestampLtz(row.get_timestamp_ltz(*pos, *precision)?)
             }
             InnerFieldGetter::Array { pos } => Datum::Array(row.get_array(*pos)?),
-            InnerFieldGetter::Map {
-                pos,
-                key_type,
-                value_type,
-            } => Datum::Map(row.get_map(*pos, key_type, value_type)?),
+            InnerFieldGetter::Map { pos, .. } => Datum::Map(row.get_map(*pos)?),
             InnerFieldGetter::Row { pos } => Datum::Row(Box::new(row.get_row(*pos)?.clone())),
         })
     }
diff --git a/fluss-rust/crates/fluss/src/row/lookup_row.rs b/fluss-rust/crates/fluss/src/row/lookup_row.rs
index fd3db4fcfb..6271a7ebff 100644
--- a/fluss-rust/crates/fluss/src/row/lookup_row.rs
+++ b/fluss-rust/crates/fluss/src/row/lookup_row.rs
@@ -21,7 +21,6 @@
 
 use crate::client::WriteFormat;
 use crate::error::Result;
-use crate::metadata::DataType;
 use crate::row::compacted::CompactedRow;
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
 use crate::row::projected_row::ProjectedRow;
@@ -117,8 +116,8 @@ impl<'a> InternalRow for LookupRow<'a> {
     fn get_array(&self, pos: usize) -> Result<FlussArray> {
         delegate!(self, get_array, pos)
     }
-    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
-        delegate!(self, get_map, pos, key_type, value_type)
+    fn get_map(&self, pos: usize) -> Result<FlussMap> {
+        delegate!(self, get_map, pos)
     }
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
         delegate!(self, get_row, pos)
diff --git a/fluss-rust/crates/fluss/src/row/mod.rs b/fluss-rust/crates/fluss/src/row/mod.rs
index 2456ee4d39..1e045b2d14 100644
--- a/fluss-rust/crates/fluss/src/row/mod.rs
+++ b/fluss-rust/crates/fluss/src/row/mod.rs
@@ -33,7 +33,6 @@ mod projected_row;
 mod row_decoder;
 
 use crate::client::WriteFormat;
-use crate::metadata::DataType;
 pub use binary_array::{FlussArray, FlussArrayWriter};
 pub use binary_map::{FlussMap, FlussMapWriter};
 use bytes::Bytes;
@@ -135,9 +134,9 @@ pub trait InternalRow: Send + Sync {
     fn get_array(&self, pos: usize) -> Result<FlussArray>;
 
     /// Returns the map value at the given position
-    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap>;
+    fn get_map(&self, pos: usize) -> Result<FlussMap>;
 
-    /// Returns     the nested row value at the given position
+    /// Returns the nested row value at the given position
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
         Err(IllegalArgument {
             message: format!("get_row not supported at position {pos}"),
@@ -309,12 +308,7 @@ impl<'a> InternalRow for GenericRow<'a> {
         }
     }
 
-    fn get_map(
-        &self,
-        pos: usize,
-        _key_type: &DataType,
-        _value_type: &DataType,
-    ) -> Result<FlussMap> {
+    fn get_map(&self, pos: usize) -> Result<FlussMap> {
         match self.get_value(pos)? {
             Datum::Map(m) => Ok(m.clone()),
             other => Err(IllegalArgument {
diff --git a/fluss-rust/crates/fluss/src/row/projected_row.rs b/fluss-rust/crates/fluss/src/row/projected_row.rs
index 0075f0b8e2..f08778ccda 100644
--- a/fluss-rust/crates/fluss/src/row/projected_row.rs
+++ b/fluss-rust/crates/fluss/src/row/projected_row.rs
@@ -21,7 +21,6 @@
 use crate::client::WriteFormat;
 use crate::error::Error::IllegalArgument;
 use crate::error::Result;
-use crate::metadata::DataType;
 use crate::metadata::UNEXIST_MAPPING;
 use crate::row::datum::{Date, Time, TimestampLtz, TimestampNtz};
 use crate::row::{Decimal, FlussArray, FlussMap, GenericRow, InternalRow};
@@ -143,8 +142,8 @@ impl<R: InternalRow> InternalRow for ProjectedRow<R> {
         project!(self, get_array, pos)
     }
 
-    fn get_map(&self, pos: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap> {
-        project!(self, get_map, pos, key_type, value_type)
+    fn get_map(&self, pos: usize) -> Result<FlussMap> {
+        project!(self, get_map, pos)
     }
 
     fn get_row(&self, pos: usize) -> Result<&GenericRow<'_>> {
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 11c5b3e95d..fc8f837649 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -1102,18 +1102,8 @@ mod table_test {
         let found_row = records[0].row();
         assert_eq!(found_row.get_int(0).unwrap(), 1);
 
-        // 4. Assert Map. Look the types up from `map_type` rather than reusing
-        // the locally-stashed `key_type`/`value_type`: `MapType::with_nullable`
-        // forces the stored key non-nullable, which exercises the same
-        // (non-nullable schema) vs (Arrow-derived nullable) comparison realistic
-        // callers hit.
-        let (mt_key, mt_value) = match &map_type {
-            fluss::metadata::DataType::Map(m) => (m.key_type(), m.value_type()),
-            _ => unreachable!("map_type is a MAP"),
-        };
-        let decoded_map = found_row
-            .get_map(1, mt_key, mt_value)
-            .expect("Failed to get map");
+        // 4. Assert Map
+        let decoded_map = found_row.get_map(1).expect("Failed to get map");
         assert_eq!(decoded_map.size(), 3);
 
         let decoded_keys = decoded_map.key_array();
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 7ef34ef3ac..52999e8cda 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -466,7 +466,7 @@ Implements the `InternalRow` trait (see below).
 | `fn get_binary(&self, idx: usize, length: usize) -> Result<&[u8]>`                     | Get fixed-length binary value           |
 | `fn get_char(&self, idx: usize, length: usize) -> Result<&str>`                        | Get fixed-length char value             |
 | `fn get_array(&self, idx: usize) -> Result<FlussArray>`                                | Get array value                         |
-| `fn get_map(&self, idx: usize, key_type: &DataType, value_type: &DataType) -> Result<FlussMap>` | Get map value                           |
+| `fn get_map(&self, idx: usize) -> Result<FlussMap>`                                    | Get map value                           |
 
 ## `FlussArray`
 
@@ -488,10 +488,25 @@ Element getters mirror `InternalRow` typed getters and return `Result<T>`. For e
 |--------|-------------|
 | `fn size(&self) -> usize` | Number of entries in the map |
 | `fn as_bytes(&self) -> &[u8]` | Get encoded bytes of the map |
-| `fn key_array(&self) -> &FlussArray` | Get the key array |
-| `fn value_array(&self) -> &FlussArray` | Get the value array |
+| `fn key_type(&self) -> &DataType` | Schema-declared type of keys |
+| `fn value_type(&self) -> &DataType` | Schema-declared type of values |
+| `fn entries(&self) -> Entries<'_>` | Iterator yielding `Result<(Datum, Datum)>` pairs |
+| `fn get(&self, key: &Datum) -> Result<Option<Datum>>` | Linear-scan lookup by key (`O(n)`) |
+| `fn key_array(&self) -> &FlussArray` | Parallel keys array (zero-copy view) |
+| `fn value_array(&self) -> &FlussArray` | Parallel values array (zero-copy view) |
 
-Key and value arrays are returned as `&FlussArray`, allowing you to read entries by retrieving keys and values at the same index positions.
+Most user code should prefer `entries()` (iteration) and `get()` (lookup). The `key_array()` / `value_array()` views are for serdes and Arrow-adapter code that needs zero-copy access to the underlying parallel-array layout.
+
+## `FlussMapWriter`
+
+`FlussMapWriter` builds a `FlussMap` for write paths.
+
+| Method | Description |
+|--------|-------------|
+| `fn new(capacity: usize, key_type: &DataType, value_type: &DataType) -> Self` | Create a writer sized for `capacity` entries |
+| `fn write_entry(&mut self, key: Datum, value: Datum) -> Result<()>` | Append a single entry; rejects null keys and type mismatches |
+| `fn extend<I, K, V>(&mut self, entries: I) -> Result<()>` | Append every pair from `entries: IntoIterator<Item = (K, V)>` |
+| `fn complete(self) -> Result<FlussMap>` | Finalize the writer and produce the `FlussMap` |
 
 ## `ChangeType`
 
diff --git a/fluss-rust/website/docs/user-guide/rust/data-types.md b/fluss-rust/website/docs/user-guide/rust/data-types.md
index ad14028bd7..5418839184 100644
--- a/fluss-rust/website/docs/user-guide/rust/data-types.md
+++ b/fluss-rust/website/docs/user-guide/rust/data-types.md
@@ -22,7 +22,7 @@ sidebar_position: 3
 | `BYTES`         | `&[u8]`        | `get_bytes()`                        | `set_field(idx, &[u8])`        |
 | `BINARY(n)`     | `&[u8]`        | `get_binary(idx, length)`            | `set_field(idx, &[u8])`        |
 | `ARRAY<T>`      | `FlussArray`   | `get_array()`                        | `set_field(idx, FlussArray)`   |
-| `MAP<K, V>`     | `FlussMap`     | `get_map(idx, key_type, value_type)` | `set_field(idx, FlussMap)`     |
+| `MAP<K, V>`     | `FlussMap`     | `get_map(idx)`                       | `set_field(idx, FlussMap)`     |
 
 ## Constructing Special Types
 
@@ -86,9 +86,11 @@ row.set_field(0, Datum::Array(arr));
 
 ## Maps
 
-Use `DataTypes::map(key_type, value_type)` in schema definitions. At runtime, read maps with `row.get_map(idx, &key_type, &value_type)?`.
+Use `DataTypes::map(key_type, value_type)` in schema definitions. At runtime, read maps with `row.get_map(idx)?` — the row knows its schema, so no extra type arguments are needed.
 
-To construct map values for writes, build a `FlussMap` using `FlussMapWriter` and wrap it with `Datum::Map`:
+### Writing
+
+Build a `FlussMap` entry-by-entry with `FlussMapWriter`, then wrap it with `Datum::Map`:
 
 ```rust
 use fluss::metadata::DataTypes;
@@ -104,7 +106,57 @@ let mut row = GenericRow::new(1);
 row.set_field(0, Datum::Map(map));
 ```
 
-`MAP` keys cannot be null. `MAP` is supported for row values and nested row fields. Like arrays, `MAP` follows Java parity for key encoding and can be encoded by the compacted key encoder, while table-level key constraints are validated by the server.
+For bulk writes from any iterator of `(key, value)` pairs (including a `HashMap`), use `extend`:
+
+```rust
+use std::collections::HashMap;
+
+let entries: HashMap<&str, i32> = HashMap::from([("a", 1), ("b", 2)]);
+let mut writer = FlussMapWriter::new(entries.len(), &DataTypes::string(), &DataTypes::int());
+writer.extend(entries)?;
+let map = writer.complete()?;
+```
+
+### Reading
+
+The `entries()` iterator yields `Result<(Datum, Datum)>` items — `(key, value)` pairs as schema-typed `Datum`s. Null values surface as a null `Datum`, so no separate null check is needed:
+
+```rust
+use fluss::row::InternalRow;
+
+let m = row.get_map(0)?;
+for entry in m.entries() {
+    let (k, v) = entry?;
+    println!("{k:?} => {v:?}");          // Datum's Debug handles null
+}
+```
+
+For point lookups, `get(&key)` does a linear scan and returns `Result<Option<Datum>>`:
+
+```rust
+use fluss::row::Datum;
+
+if let Some(v) = m.get(&Datum::from("attr_size"))? {
+    println!("size = {v:?}");
+}
+```
+
+Lookup is `O(n)` — the binary MAP layout has no key index. If you need repeated lookups against the same map, collect the entries once:
+
+```rust
+use std::collections::HashMap;
+
+let snapshot: HashMap<String, Datum<'_>> = m
+    .entries()
+    .map(|e| e.map(|(k, v)| (format!("{k:?}"), v)))
+    .collect::<Result<_, _>>()?;
+```
+
+For raw access to the underlying parallel-array representation (zero-copy, used by serdes / Arrow adapters), `m.key_array()` and `m.value_array()` are still available.
+
+### Constraints
+
+`MAP` keys cannot be null. `MAP` is supported for row values and nested row fields. `MAP` cannot be used as a primary key or bucket key column — the Rust client rejects it at the compacted key encoder, and the Fluss server bans `MAP` (along with `ARRAY` and `ROW`) from key columns.
 
 ## Reading Row Data
 

From 50171d484e82d22efd08947ee13f357af8f5e43a Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Sat, 23 May 2026 23:46:42 +0100
Subject: [PATCH 275/287] [ci] scope rust integration job to test_fluss target
 only (#561)

---
 fluss-rust/.github/workflows/build_and_test_rust.yml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/fluss-rust/.github/workflows/build_and_test_rust.yml
index af108699cd..9e60bd0c52 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/fluss-rust/.github/workflows/build_and_test_rust.yml
@@ -84,7 +84,7 @@ jobs:
         uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
 
       - name: Integration Test
-        run: cargo test --features integration_tests --all-targets --workspace --exclude fluss_python --exclude fluss-cpp --exclude fluss_nif
+        run: cargo test --features integration_tests --test test_fluss -p fluss-rs
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full

From e0ecf8ba9cdd0cea2ebad7e43d8edfeddeceec19 Mon Sep 17 00:00:00 2001
From: Anton Borisov <148864665+fresh-borzoni@users.noreply.github.com>
Date: Mon, 25 May 2026 09:39:45 +0100
Subject: [PATCH 276/287] [rust] integration tests for MAP dt + restructure ITs
 for complex dts (#560)

* [rust] integration tests for MAP dt + restructure tests around complex types (#549)

* address comments
---
 fluss-rust/crates/fluss/src/row/binary_map.rs |    1 +
 fluss-rust/crates/fluss/src/row/column.rs     |   45 +-
 .../crates/fluss/src/row/column_writer.rs     |   58 +-
 .../fluss/tests/integration/kv_table.rs       | 2042 ++++++---------
 .../fluss/tests/integration/log_table.rs      | 2327 +++++++----------
 .../crates/fluss/tests/integration/utils.rs   |  201 +-
 6 files changed, 2056 insertions(+), 2618 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/row/binary_map.rs b/fluss-rust/crates/fluss/src/row/binary_map.rs
index 57201b84b5..02425129d3 100644
--- a/fluss-rust/crates/fluss/src/row/binary_map.rs
+++ b/fluss-rust/crates/fluss/src/row/binary_map.rs
@@ -432,6 +432,7 @@ impl FlussMapWriter {
             }
             (DataType::Array(_), Datum::Array(v)) => writer.write_array(pos, v),
             (DataType::Map(_), Datum::Map(v)) => writer.write_map(pos, v),
+            (DataType::Row(_), Datum::Row(v)) => writer.write_row(pos, v.as_ref())?,
             _ => {
                 return Err(IllegalArgument {
                     message: format!("Type mismatch: expected {:?}, got {:?}", dt, datum),
diff --git a/fluss-rust/crates/fluss/src/row/column.rs b/fluss-rust/crates/fluss/src/row/column.rs
index f4da6b3fe4..9dbdd947dd 100644
--- a/fluss-rust/crates/fluss/src/row/column.rs
+++ b/fluss-rust/crates/fluss/src/row/column.rs
@@ -661,25 +661,19 @@ impl InternalRow for ColumnarRow {
         };
 
         let column = self.column(pos)?;
-        let element_field = match column.data_type() {
-            ArrowDataType::List(field) => field,
+        match column.data_type() {
+            ArrowDataType::List(_) => {}
             other => {
                 return Err(IllegalArgument {
                     message: format!("expected List array at position {pos}, got {other:?}"),
                 });
             }
-        };
-
-        let actual_element_type = from_arrow_field(element_field)?;
-        if actual_element_type != *element_fluss_type {
-            return Err(IllegalArgument {
-                message: format!(
-                    "Arrow list element type {:?} does not match expected Fluss type {:?}",
-                    actual_element_type, element_fluss_type
-                ),
-            });
         }
 
+        // `to_arrow_type` is lossy (e.g. TIMESTAMP_LTZ → plain Arrow Timestamp);
+        // trust the Fluss schema and let the per-element conversion below catch
+        // real shape mismatches.
+
         let list_arr = column
             .as_any()
             .downcast_ref::<ListArray>()
@@ -778,25 +772,9 @@ fn arrow_map_entry_to_fluss_map(
         });
     }
 
-    let actual_key_type = from_arrow_field(&fields[0])?;
-    if actual_key_type != *key_type {
-        return Err(IllegalArgument {
-            message: format!(
-                "Arrow map key type {:?} does not match expected Fluss type {:?}",
-                actual_key_type, key_type
-            ),
-        });
-    }
-
-    let actual_value_type = from_arrow_field(&fields[1])?;
-    if actual_value_type != *value_type {
-        return Err(IllegalArgument {
-            message: format!(
-                "Arrow map value type {:?} does not match expected Fluss type {:?}",
-                actual_value_type, value_type
-            ),
-        });
-    }
+    // `to_arrow_type` is lossy (e.g. TIMESTAMP_LTZ → plain Arrow Timestamp);
+    // trust the Fluss schema and let the per-element conversion below catch
+    // real shape mismatches.
 
     let keys_arrow = struct_arr.column(0);
     let values_arrow = struct_arr.column(1);
@@ -1443,8 +1421,7 @@ mod tests {
 
         let err = row.get_array(0).unwrap_err();
         assert!(
-            err.to_string()
-                .contains("Cannot convert Arrow type to Fluss type"),
+            err.to_string().contains("expected Int32Type"),
             "unexpected error: {err}"
         );
     }
@@ -1735,7 +1712,7 @@ mod tests {
         let err = row.get_map(0).expect_err("type mismatch must error");
         let msg = err.to_string();
         assert!(
-            msg.contains("does not match expected Fluss type"),
+            msg.contains("expected StringArray"),
             "unexpected error: {msg}"
         );
     }
diff --git a/fluss-rust/crates/fluss/src/row/column_writer.rs b/fluss-rust/crates/fluss/src/row/column_writer.rs
index 94777faf3c..85776bc53e 100644
--- a/fluss-rust/crates/fluss/src/row/column_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/column_writer.rs
@@ -22,12 +22,11 @@
 use crate::error::Error::RowConvertError;
 use crate::error::{Error, Result};
 use crate::metadata::{DataType, RowType};
-use crate::row::FlussMap;
-use crate::row::InternalRow;
 use crate::row::datum::{
     MICROS_PER_MILLI, MILLIS_PER_SECOND, NANOS_PER_MILLI, append_decimal_to_builder,
     millis_nanos_to_micros, millis_nanos_to_nanos,
 };
+use crate::row::{FlussArray, FlussMap, InternalRow};
 use arrow::array::{
     ArrayBuilder, ArrayRef, BinaryBuilder, BooleanBuilder, Date32Builder, Decimal128Builder,
     FixedSizeBinaryBuilder, Float32Builder, Float64Builder, Int8Builder, Int16Builder,
@@ -928,8 +927,8 @@ fn write_map_into(
     let key_array = map.key_array();
     let value_array = map.value_array();
     for i in 0..map.size() {
-        key_writer.write_field_at(key_array, i)?;
-        value_writer.write_field_at(value_array, i)?;
+        write_array_element_into_column(key_writer, key_array, i)?;
+        write_array_element_into_column(value_writer, value_array, i)?;
     }
     let last = *offsets.last().unwrap();
     offsets.push(
@@ -940,6 +939,57 @@ fn write_map_into(
     Ok(())
 }
 
+// FlussArray carries no schema; nested row/map elements need the typed
+// inherent accessors (get_row/get_map with explicit types).
+fn write_array_element_into_column(
+    writer: &mut ColumnWriter,
+    array: &FlussArray,
+    index: usize,
+) -> Result<()> {
+    match &mut writer.inner {
+        TypedWriter::Struct {
+            field_writers,
+            validity,
+            row_type,
+            ..
+        } => {
+            if array.is_null_at(index) {
+                for child in field_writers.iter_mut() {
+                    child.append_null();
+                }
+                validity.push(false);
+            } else {
+                let nested = array.get_row(index, row_type)?;
+                for (j, child) in field_writers.iter_mut().enumerate() {
+                    child.write_field_at(&nested, j)?;
+                }
+                validity.push(true);
+            }
+            Ok(())
+        }
+        TypedWriter::Map {
+            key_writer,
+            value_writer,
+            key_type,
+            value_type,
+            offsets,
+            validity,
+        } => {
+            if array.is_null_at(index) {
+                validity.push(false);
+                let last = *offsets.last().unwrap();
+                offsets.push(last);
+            } else {
+                let nested = array.get_map(index, key_type, value_type)?;
+                write_map_into(nested, key_writer, value_writer, offsets)?;
+                validity.push(true);
+            }
+            Ok(())
+        }
+        _ => writer.write_field_at(array, index),
+    }
+}
+
 fn finish_struct_array(
     fields: arrow_schema::Fields,
     child_arrays: Vec<ArrayRef>,
diff --git a/fluss-rust/crates/fluss/tests/integration/kv_table.rs b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
index ee496a5a5f..4da7c75d5b 100644
--- a/fluss-rust/crates/fluss/tests/integration/kv_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/kv_table.rs
@@ -19,13 +19,18 @@
 #[cfg(test)]
 mod kv_table_test {
     use crate::integration::utils::{
-        create_partitions, create_table, get_shared_cluster, make_int_array, make_string_array,
+        ColumnPlan, array_dt_basics_columns, as_row_type, create_partitions, create_table,
+        dt_array_int, dt_map_string_int, dt_row_seq_label, get_shared_cluster, make_int_array,
+        make_string_array, map_dt_basics_columns, row_dt_basics_columns, scalar_dt_columns,
     };
+    use fluss::client::TableUpsert;
     use fluss::metadata::{DataField, DataTypes, Schema, TableDescriptor, TablePath};
     use fluss::row::binary_array::FlussArrayWriter;
+    use fluss::row::binary_map::FlussMapWriter;
     use fluss::row::{
-        Date, Datum, Decimal, FlussArray, GenericRow, InternalRow, Time, TimestampLtz, TimestampNtz,
+        Date, Datum, Decimal, GenericRow, InternalRow, Time, TimestampLtz, TimestampNtz,
     };
+    use futures::stream::{FuturesUnordered, StreamExt};
 
     fn make_key(id: i32) -> GenericRow<'static> {
         make_key_with_field_count(id, 3)
@@ -284,11 +289,11 @@ mod kv_table_test {
             .expect("Failed to drop table");
     }
 
+    /// Partial-update preserves columns absent from the partial-write set.
     #[tokio::test]
     async fn partial_update() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
-
         let admin = connection.get_admin().expect("Failed to get admin");
 
         let table_path = TablePath::new("fluss", "test_partial_update");
@@ -303,1295 +308,368 @@ mod kv_table_test {
                 Schema::builder()
                     .column("id", DataTypes::int())
                     .column("name", DataTypes::string())
-                    .column("age", DataTypes::bigint())
                     .column("score", DataTypes::bigint())
                     .column("nested", nested_type)
+                    .column(
+                        "attrs",
+                        DataTypes::map(DataTypes::string(), DataTypes::int()),
+                    )
+                    .column("tags", DataTypes::array(DataTypes::string()))
                     .primary_key(vec!["id"])
                     .build()
-                    .expect("Failed to build schema"),
+                    .expect("schema"),
             )
             .build()
-            .expect("Failed to build table");
+            .expect("table descriptor");
 
         create_table(&admin, &table_path, &table_descriptor).await;
 
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let table_upsert = table.new_upsert().expect("Failed to create upsert");
-        let upsert_writer = table_upsert
-            .create_writer()
-            .expect("Failed to create writer");
+        let table = connection.get_table(&table_path).await.expect("table");
+        let table_upsert = table.new_upsert().expect("upsert");
+        let upsert_writer = table_upsert.create_writer().expect("writer");
 
         let mut nested0 = GenericRow::new(2);
         nested0.set_field(0, 10_i32);
         nested0.set_field(1, "alpha");
-        let mut row = GenericRow::new(5);
+        let attrs0 = {
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::int());
+            w.write_entry("a".into(), 1.into()).unwrap();
+            w.write_entry("b".into(), 2.into()).unwrap();
+            w.complete().expect("attrs0")
+        };
+        let tags0 = make_string_array(&[Some("alpha-tag"), Some("beta-tag")]);
+
+        let mut row = GenericRow::new(6);
         row.set_field(0, 1);
         row.set_field(1, "Verso");
-        row.set_field(2, 32i64);
-        row.set_field(3, 6942i64);
-        row.set_field(4, Datum::Row(Box::new(nested0)));
+        row.set_field(2, 100i64);
+        row.set_field(3, Datum::Row(Box::new(nested0)));
+        row.set_field(4, Datum::Map(attrs0));
+        row.set_field(5, tags0);
         upsert_writer
             .upsert(&row)
-            .expect("Failed to upsert initial row")
+            .expect("upsert initial")
             .await
-            .expect("Failed to wait for upsert acknowledgment");
+            .expect("ack initial");
 
         let mut lookuper = table
             .new_lookup()
-            .expect("Failed to create lookup")
+            .expect("lookup")
             .create_lookuper()
-            .expect("Failed to create lookuper");
-
-        let result = lookuper
-            .lookup(&make_key(1))
-            .await
-            .expect("Failed to lookup");
-        let found_row = result
-            .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
-
-        assert_eq!(found_row.get_int(0).unwrap(), 1);
-        assert_eq!(found_row.get_string(1).unwrap(), "Verso");
-        assert_eq!(found_row.get_long(2).unwrap(), 32i64);
-        assert_eq!(found_row.get_long(3).unwrap(), 6942i64);
-        let nested = found_row.get_row(4).unwrap();
-        assert_eq!(nested.get_int(0).unwrap(), 10);
-        assert_eq!(nested.get_string(1).unwrap(), "alpha");
-
-        let partial_upsert = table_upsert
-            .partial_update_with_column_names(&["id", "score"])
-            .expect("Failed to create TableUpsert with partial update");
-        let partial_writer = partial_upsert
-            .create_writer()
-            .expect("Failed to create UpsertWriter with partial write");
-
-        let mut partial_row = GenericRow::new(5);
-        partial_row.set_field(0, 1);
-        partial_row.set_field(1, Datum::Null);
-        partial_row.set_field(2, Datum::Null);
-        partial_row.set_field(3, 420i64);
-        partial_row.set_field(4, Datum::Null);
-        partial_writer
-            .upsert(&partial_row)
-            .expect("Failed to upsert")
-            .await
-            .expect("Failed to wait for upsert acknowledgment");
+            .expect("lookuper");
+
+        // Helper to issue a partial upsert against a specific column set.
+        async fn partial_upsert(table_upsert: &TableUpsert, cols: &[&str], row: GenericRow<'_>) {
+            let pu = table_upsert
+                .partial_update_with_column_names(cols)
+                .expect("partial upsert");
+            let pw = pu.create_writer().expect("partial writer");
+            pw.upsert(&row)
+                .expect("partial upsert")
+                .await
+                .expect("partial ack");
+        }
 
-        let result = lookuper
-            .lookup(&make_key(1))
-            .await
-            .expect("Failed to lookup after partial update");
-        let found_row = result
+        // === Partial update on a scalar column — compound columns preserved ===
+        let mut p1 = GenericRow::new(6);
+        p1.set_field(0, 1);
+        p1.set_field(1, Datum::Null);
+        p1.set_field(2, 420i64);
+        p1.set_field(3, Datum::Null);
+        p1.set_field(4, Datum::Null);
+        p1.set_field(5, Datum::Null);
+        partial_upsert(&table_upsert, &["id", "score"], p1).await;
+
+        let result = lookuper.lookup(&make_key(1)).await.expect("lookup");
+        let r = result
             .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
-
-        assert_eq!(found_row.get_int(0).unwrap(), 1, "id should remain 1");
-        assert_eq!(
-            found_row.get_string(1).unwrap(),
-            "Verso",
-            "name should remain unchanged"
-        );
-        assert_eq!(
-            found_row.get_long(2).unwrap(),
-            32,
-            "age should remain unchanged"
-        );
-        assert_eq!(
-            found_row.get_long(3).unwrap(),
-            420,
-            "score should be updated to 420"
-        );
-        let nested = found_row.get_row(4).unwrap();
-        assert_eq!(
-            nested.get_int(0).unwrap(),
-            10,
-            "ROW preserved across non-ROW partial update"
-        );
-        assert_eq!(nested.get_string(1).unwrap(), "alpha");
-
-        let partial_nested_upsert = table_upsert
-            .partial_update_with_column_names(&["id", "nested"])
-            .expect("partial_update_with_column_names");
-        let partial_nested_writer = partial_nested_upsert
-            .create_writer()
-            .expect("partial writer");
+            .expect("get row")
+            .expect("row exists");
+        assert_eq!(r.get_string(1).unwrap(), "Verso", "name preserved");
+        assert_eq!(r.get_long(2).unwrap(), 420, "score updated");
+        let n = r.get_row(3).unwrap();
+        assert_eq!(n.get_int(0).unwrap(), 10, "ROW preserved");
+        assert_eq!(r.get_map(4).unwrap().size(), 2, "MAP preserved");
+        assert_eq!(r.get_array(5).unwrap().size(), 2, "ARRAY preserved");
+
+        // === Partial update on the ROW column ===
         let mut new_nested = GenericRow::new(2);
         new_nested.set_field(0, 99_i32);
         new_nested.set_field(1, "omega");
-        let mut partial_nested = GenericRow::new(5);
-        partial_nested.set_field(0, 1);
-        partial_nested.set_field(1, Datum::Null);
-        partial_nested.set_field(2, Datum::Null);
-        partial_nested.set_field(3, Datum::Null);
-        partial_nested.set_field(4, Datum::Row(Box::new(new_nested)));
-        partial_nested_writer
-            .upsert(&partial_nested)
-            .expect("partial upsert")
-            .await
-            .expect("partial ack");
-
-        let result = lookuper
-            .lookup(&make_key(1))
-            .await
-            .expect("Failed to lookup after nested partial");
-        let found_row = result
-            .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
-        assert_eq!(
-            found_row.get_string(1).unwrap(),
-            "Verso",
-            "name preserved when ROW updated"
-        );
-        assert_eq!(
-            found_row.get_long(3).unwrap(),
-            420,
-            "score preserved when ROW updated"
-        );
-        let nested = found_row.get_row(4).unwrap();
-        assert_eq!(nested.get_int(0).unwrap(), 99);
-        assert_eq!(nested.get_string(1).unwrap(), "omega");
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    #[tokio::test]
-    async fn partitioned_table_upsert_and_lookup() {
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_partitioned_kv_table");
-
-        let nested_type = DataTypes::row(vec![
-            DataField::new("seq", DataTypes::int(), None),
-            DataField::new("label", DataTypes::string(), None),
-        ]);
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(
-                Schema::builder()
-                    .column("region", DataTypes::string())
-                    .column("user_id", DataTypes::int())
-                    .column("name", DataTypes::string())
-                    .column("score", DataTypes::bigint())
-                    .column("nested", nested_type)
-                    .primary_key(vec!["region", "user_id"])
-                    .build()
-                    .expect("Failed to build schema"),
-            )
-            .partitioned_by(vec!["region"])
-            .build()
-            .expect("Failed to build table");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        create_partitions(&admin, &table_path, "region", &["US", "EU", "APAC"]).await;
-
-        let connection = cluster.get_fluss_connection().await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let table_upsert = table.new_upsert().expect("Failed to create upsert");
-
-        let upsert_writer = table_upsert
-            .create_writer()
-            .expect("Failed to create writer");
-
-        let test_data = [
-            ("US", 1, "Gustave", 100i64, 11_i32, "a"),
-            ("US", 2, "Lune", 200i64, 22, "b"),
-            ("EU", 1, "Sciel", 150i64, 33, "c"),
-            ("EU", 2, "Maelle", 250i64, 44, "d"),
-            ("APAC", 1, "Noco", 300i64, 55, "e"),
-        ];
-
-        for (region, user_id, name, score, seq, label) in &test_data {
-            let mut nested = GenericRow::new(2);
-            nested.set_field(0, *seq);
-            nested.set_field(1, *label);
-            let mut row = GenericRow::new(5);
-            row.set_field(0, *region);
-            row.set_field(1, *user_id);
-            row.set_field(2, *name);
-            row.set_field(3, *score);
-            row.set_field(4, Datum::Row(Box::new(nested)));
-            upsert_writer.upsert(&row).expect("Failed to upsert");
-        }
-        upsert_writer.flush().await.expect("Failed to flush");
-
-        let mut lookuper = table
-            .new_lookup()
-            .expect("Failed to create lookup")
-            .create_lookuper()
-            .expect("Failed to create lookuper");
-
-        for (region, user_id, expected_name, expected_score, expected_seq, expected_label) in
-            &test_data
-        {
-            let mut key = GenericRow::new(5);
-            key.set_field(0, *region);
-            key.set_field(1, *user_id);
-
-            let result = lookuper.lookup(&key).await.expect("Failed to lookup");
-            let row = result
-                .get_single_row()
-                .expect("Failed to get row")
-                .expect("Row should exist");
-
-            assert_eq!(row.get_string(0).unwrap(), *region, "region mismatch");
-            assert_eq!(row.get_int(1).unwrap(), *user_id, "user_id mismatch");
-            assert_eq!(row.get_string(2).unwrap(), *expected_name, "name mismatch");
-            assert_eq!(row.get_long(3).unwrap(), *expected_score, "score mismatch");
-            let nested = row.get_row(4).unwrap();
-            assert_eq!(
-                nested.get_int(0).unwrap(),
-                *expected_seq,
-                "ROW seq mismatch"
-            );
-            assert_eq!(
-                nested.get_string(1).unwrap(),
-                *expected_label,
-                "ROW label mismatch"
-            );
-        }
-
-        let mut updated_nested = GenericRow::new(2);
-        updated_nested.set_field(0, 999_i32);
-        updated_nested.set_field(1, "updated");
-        let mut updated_row = GenericRow::new(5);
-        updated_row.set_field(0, "US");
-        updated_row.set_field(1, 1);
-        updated_row.set_field(2, "Gustave Updated");
-        updated_row.set_field(3, 999i64);
-        updated_row.set_field(4, Datum::Row(Box::new(updated_nested)));
-        upsert_writer
-            .upsert(&updated_row)
-            .expect("Failed to upsert updated row")
-            .await
-            .expect("Failed to wait for upsert acknowledgment");
-
-        // Verify the update
-        let mut key = GenericRow::new(5);
-        key.set_field(0, "US");
-        key.set_field(1, 1);
-        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
-        let row = result
+        let mut p2 = GenericRow::new(6);
+        p2.set_field(0, 1);
+        p2.set_field(1, Datum::Null);
+        p2.set_field(2, Datum::Null);
+        p2.set_field(3, Datum::Row(Box::new(new_nested)));
+        p2.set_field(4, Datum::Null);
+        p2.set_field(5, Datum::Null);
+        partial_upsert(&table_upsert, &["id", "nested"], p2).await;
+
+        let result = lookuper.lookup(&make_key(1)).await.expect("lookup");
+        let r = result
             .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
-        assert_eq!(row.get_string(2).unwrap(), "Gustave Updated");
-        assert_eq!(row.get_long(3).unwrap(), 999);
-        let nested = row.get_row(4).unwrap();
-        assert_eq!(nested.get_int(0).unwrap(), 999);
-        assert_eq!(nested.get_string(1).unwrap(), "updated");
-
-        // Lookup in non-existent partition should return empty result
-        let mut non_existent_key = GenericRow::new(5);
-        non_existent_key.set_field(0, "UNKNOWN_REGION");
-        non_existent_key.set_field(1, 1);
-        let result = lookuper
-            .lookup(&non_existent_key)
-            .await
-            .expect("Failed to lookup non-existent partition");
-        assert!(
-            result
-                .get_single_row()
-                .expect("Failed to get row")
-                .is_none(),
-            "Lookup in non-existent partition should return None"
-        );
-
-        // Delete a record within a partition (await acknowledgment)
-        let mut delete_key = GenericRow::new(5);
-        delete_key.set_field(0, "EU");
-        delete_key.set_field(1, 1);
-        upsert_writer
-            .delete(&delete_key)
-            .expect("Failed to delete")
-            .await
-            .expect("Failed to wait for delete acknowledgment");
-
-        // Verify deletion
-        let mut key = GenericRow::new(5);
-        key.set_field(0, "EU");
-        key.set_field(1, 1);
-        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
-        assert!(
-            result
-                .get_single_row()
-                .expect("Failed to get row")
-                .is_none(),
-            "Deleted record should not exist"
-        );
-
-        // Verify other records in the same partition still exist
-        let mut key = GenericRow::new(5);
-        key.set_field(0, "EU");
-        key.set_field(1, 2);
-        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
-        let row = result
+            .expect("get row")
+            .expect("row exists");
+        assert_eq!(r.get_string(1).unwrap(), "Verso", "name preserved");
+        assert_eq!(r.get_long(2).unwrap(), 420, "score preserved");
+        let n = r.get_row(3).unwrap();
+        assert_eq!(n.get_int(0).unwrap(), 99);
+        assert_eq!(n.get_string(1).unwrap(), "omega");
+        assert_eq!(r.get_map(4).unwrap().size(), 2, "MAP preserved");
+        assert_eq!(r.get_array(5).unwrap().size(), 2, "ARRAY preserved");
+
+        // === Partial update on the MAP column ===
+        let new_attrs = {
+            let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::int());
+            w.write_entry("z".into(), 99.into()).unwrap();
+            w.complete().expect("new_attrs")
+        };
+        let mut p3 = GenericRow::new(6);
+        p3.set_field(0, 1);
+        p3.set_field(1, Datum::Null);
+        p3.set_field(2, Datum::Null);
+        p3.set_field(3, Datum::Null);
+        p3.set_field(4, Datum::Map(new_attrs));
+        p3.set_field(5, Datum::Null);
+        partial_upsert(&table_upsert, &["id", "attrs"], p3).await;
+
+        let result = lookuper.lookup(&make_key(1)).await.expect("lookup");
+        let r = result
             .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
-        assert_eq!(row.get_string(2).unwrap(), "Maelle");
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    #[tokio::test]
-    async fn upsert_and_lookup_with_row_rich_types() {
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_kv_row_rich_types");
-
-        let row_type_owned = DataTypes::row(vec![
-            DataField::new("f_bool", DataTypes::boolean(), None),
-            DataField::new("f_long", DataTypes::bigint(), None),
-            DataField::new("f_float", DataTypes::float(), None),
-            DataField::new("f_double", DataTypes::double(), None),
-            DataField::new("f_str", DataTypes::string(), None),
-            DataField::new("f_bytes", DataTypes::bytes(), None),
-            DataField::new("f_decimal", DataTypes::decimal(10, 2), None),
-            DataField::new("f_date", DataTypes::date(), None),
-            DataField::new("f_time", DataTypes::time_with_precision(3), None),
-            DataField::new("f_ts_ntz", DataTypes::timestamp_with_precision(6), None),
-            DataField::new("f_ts_ltz", DataTypes::timestamp_ltz_with_precision(6), None),
-        ]);
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(
-                Schema::builder()
-                    .column("id", DataTypes::int())
-                    .column("nested", row_type_owned)
-                    .primary_key(vec!["id"])
-                    .build()
-                    .expect("Failed to build schema"),
-            )
-            .build()
-            .expect("Failed to build table descriptor");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-        let upsert = table.new_upsert().expect("Failed to create upsert");
-        let upsert_writer = upsert.create_writer().expect("Failed to create writer");
-
-        let mut nested = GenericRow::new(11);
-        nested.set_field(0, true);
-        nested.set_field(1, 9_876_543_210_i64);
-        nested.set_field(2, f32::NEG_INFINITY);
-        nested.set_field(3, f64::NAN);
-        nested.set_field(4, "rich types here");
-        nested.set_field(5, b"opaque".as_slice());
-        nested.set_field(6, Decimal::from_unscaled_long(54321, 10, 2).unwrap());
-        nested.set_field(7, Datum::Date(Date::new(20476)));
-        nested.set_field(8, Datum::Time(Time::new(36_827_123)));
-        nested.set_field(9, Datum::TimestampNtz(TimestampNtz::new(1_769_163_227_123)));
-        nested.set_field(
-            10,
-            Datum::TimestampLtz(TimestampLtz::new(1_769_163_227_123)),
-        );
-
-        let mut row = GenericRow::new(2);
-        row.set_field(0, 1_i32);
-        row.set_field(1, Datum::Row(Box::new(nested)));
-
-        upsert_writer
-            .upsert(&row)
-            .expect("upsert")
-            .await
-            .expect("ack");
-
-        let mut lookuper = table
-            .new_lookup()
-            .expect("Failed to create lookup")
-            .create_lookuper()
-            .expect("Failed to create lookuper");
-
-        let result = lookuper
-            .lookup(&make_key_with_field_count(1, 2))
-            .await
-            .expect("lookup");
+            .expect("get row")
+            .expect("row exists");
+        assert_eq!(r.get_string(1).unwrap(), "Verso", "name preserved");
+        let n = r.get_row(3).unwrap();
+        assert_eq!(n.get_int(0).unwrap(), 99, "ROW preserved");
+        let m = r.get_map(4).unwrap();
+        assert_eq!(m.size(), 1);
+        assert_eq!(m.get(&Datum::from("z")).unwrap(), Some(Datum::from(99_i32)));
+        assert_eq!(r.get_array(5).unwrap().size(), 2, "ARRAY preserved");
+
+        // === Partial update on the ARRAY column ===
+        let new_tags = make_string_array(&[Some("gamma-tag")]);
+        let mut p4 = GenericRow::new(6);
+        p4.set_field(0, 1);
+        p4.set_field(1, Datum::Null);
+        p4.set_field(2, Datum::Null);
+        p4.set_field(3, Datum::Null);
+        p4.set_field(4, Datum::Null);
+        p4.set_field(5, new_tags);
+        partial_upsert(&table_upsert, &["id", "tags"], p4).await;
+
+        let result = lookuper.lookup(&make_key(1)).await.expect("lookup");
         let r = result
             .get_single_row()
             .expect("get row")
-            .expect("row should exist");
-
-        let n = r.get_row(1).unwrap();
-        assert!(n.get_boolean(0).unwrap());
-        assert_eq!(n.get_long(1).unwrap(), 9_876_543_210);
-        assert!(n.get_float(2).unwrap().is_infinite());
-        assert!(n.get_float(2).unwrap().is_sign_negative());
-        assert!(n.get_double(3).unwrap().is_nan());
-        assert_eq!(n.get_string(4).unwrap(), "rich types here");
-        assert_eq!(n.get_bytes(5).unwrap(), b"opaque");
-        assert_eq!(
-            n.get_decimal(6, 10, 2).unwrap(),
-            Decimal::from_unscaled_long(54321, 10, 2).unwrap(),
-        );
-        assert_eq!(n.get_date(7).unwrap().get_inner(), 20476);
-        assert_eq!(n.get_time(8).unwrap().get_inner(), 36_827_123);
-        assert_eq!(
-            n.get_timestamp_ntz(9, 6).unwrap().get_millisecond(),
-            1_769_163_227_123,
-        );
-        assert_eq!(
-            n.get_timestamp_ltz(10, 6).unwrap().get_epoch_millisecond(),
-            1_769_163_227_123,
-        );
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    /// Integration test covering put and get operations for all supported datatypes.
-    #[tokio::test]
-    async fn all_supported_datatypes() {
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_all_datatypes");
-
-        // Create a table with all supported primitive datatypes
-        let table_descriptor = TableDescriptor::builder()
-            .schema(
-                Schema::builder()
-                    // Primary key column
-                    .column("pk_int", DataTypes::int())
-                    // Boolean type
-                    .column("col_boolean", DataTypes::boolean())
-                    // Integer types
-                    .column("col_tinyint", DataTypes::tinyint())
-                    .column("col_smallint", DataTypes::smallint())
-                    .column("col_int", DataTypes::int())
-                    .column("col_bigint", DataTypes::bigint())
-                    // Floating point types
-                    .column("col_float", DataTypes::float())
-                    .column("col_double", DataTypes::double())
-                    // String types
-                    .column("col_char", DataTypes::char(10))
-                    .column("col_string", DataTypes::string())
-                    // Decimal type
-                    .column("col_decimal", DataTypes::decimal(10, 2))
-                    // Date and time types
-                    .column("col_date", DataTypes::date())
-                    .column("col_time", DataTypes::time())
-                    .column("col_timestamp", DataTypes::timestamp())
-                    .column("col_timestamp_ltz", DataTypes::timestamp_ltz())
-                    // Binary types
-                    .column("col_bytes", DataTypes::bytes())
-                    .column("col_binary", DataTypes::binary(20))
-                    .column("col_array", DataTypes::array(DataTypes::string()))
-                    .column(
-                        "col_row",
-                        DataTypes::row(vec![
-                            DataField::new("seq", DataTypes::int(), None),
-                            DataField::new("label", DataTypes::string(), None),
-                        ]),
-                    )
-                    .primary_key(vec!["pk_int"])
-                    .build()
-                    .expect("Failed to build schema"),
-            )
-            .build()
-            .expect("Failed to build table");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let table_upsert = table.new_upsert().expect("Failed to create upsert");
-        let upsert_writer = table_upsert
-            .create_writer()
-            .expect("Failed to create writer");
-
-        // Test data for all datatypes
-        let pk_int = 1i32;
-        let col_boolean = true;
-        let col_tinyint = 127i8;
-        let col_smallint = 32767i16;
-        let col_int = 2147483647i32;
-        let col_bigint = 9223372036854775807i64;
-        let col_float = std::f32::consts::PI;
-        let col_double = std::f64::consts::E;
-        let col_char = "hello";
-        let col_string = "world of fluss rust client";
-        let col_decimal = Decimal::from_unscaled_long(12345, 10, 2).unwrap(); // 123.45
-        let col_date = Date::new(20476); // 2026-01-23
-        let col_time = Time::new(36827123); // 10:13:47.123
-        let col_timestamp = TimestampNtz::new(1769163227123); // 2026-01-23 10:13:47.123 UTC
-        let col_timestamp_ltz = TimestampLtz::new(1769163227123); // 2026-01-23 10:13:47.123 UTC
-        let col_bytes: &[u8] = b"binary data";
-        let col_binary: &[u8] = b"fixed binary data!!!";
-
-        let col_array = make_string_array(&[Some("fluss"), Some("rust")]);
-
-        let mut col_row_inner = GenericRow::new(2);
-        col_row_inner.set_field(0, 7_i32);
-        col_row_inner.set_field(1, "lumiere");
-
-        // Upsert a row with all datatypes
-        let mut row = GenericRow::new(19);
-        row.set_field(0, pk_int);
-        row.set_field(1, col_boolean);
-        row.set_field(2, col_tinyint);
-        row.set_field(3, col_smallint);
-        row.set_field(4, col_int);
-        row.set_field(5, col_bigint);
-        row.set_field(6, col_float);
-        row.set_field(7, col_double);
-        row.set_field(8, col_char);
-        row.set_field(9, col_string);
-        row.set_field(10, col_decimal.clone());
-        row.set_field(11, col_date);
-        row.set_field(12, col_time);
-        row.set_field(13, col_timestamp);
-        row.set_field(14, col_timestamp_ltz);
-        row.set_field(15, col_bytes);
-        row.set_field(16, col_binary);
-        row.set_field(17, col_array);
-        row.set_field(18, Datum::Row(Box::new(col_row_inner)));
-
-        upsert_writer
-            .upsert(&row)
-            .expect("Failed to upsert row with all datatypes")
-            .await
-            .expect("Failed to wait for upsert acknowledgment");
-
-        // Lookup the record
-        let mut lookuper = table
-            .new_lookup()
-            .expect("Failed to create lookup")
-            .create_lookuper()
-            .expect("Failed to create lookuper");
-
-        let mut key = GenericRow::new(19);
-        key.set_field(0, pk_int);
-
-        let result = lookuper.lookup(&key).await.expect("Failed to lookup");
-        let found_row = result
-            .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
-
-        // Verify all datatypes
-        assert_eq!(found_row.get_int(0).unwrap(), pk_int, "pk_int mismatch");
-        assert_eq!(
-            found_row.get_boolean(1).unwrap(),
-            col_boolean,
-            "col_boolean mismatch"
-        );
-        assert_eq!(
-            found_row.get_byte(2).unwrap(),
-            col_tinyint,
-            "col_tinyint mismatch"
-        );
-        assert_eq!(
-            found_row.get_short(3).unwrap(),
-            col_smallint,
-            "col_smallint mismatch"
-        );
-        assert_eq!(found_row.get_int(4).unwrap(), col_int, "col_int mismatch");
-        assert_eq!(
-            found_row.get_long(5).unwrap(),
-            col_bigint,
-            "col_bigint mismatch"
-        );
-        assert!(
-            (found_row.get_float(6).unwrap() - col_float).abs() < f32::EPSILON,
-            "col_float mismatch: expected {}, got {}",
-            col_float,
-            found_row.get_float(6).unwrap()
-        );
-        assert!(
-            (found_row.get_double(7).unwrap() - col_double).abs() < f64::EPSILON,
-            "col_double mismatch: expected {}, got {}",
-            col_double,
-            found_row.get_double(7).unwrap()
-        );
-        assert_eq!(
-            found_row.get_char(8, 10).unwrap(),
-            col_char,
-            "col_char mismatch"
-        );
-        assert_eq!(
-            found_row.get_string(9).unwrap(),
-            col_string,
-            "col_string mismatch"
-        );
-        assert_eq!(
-            found_row.get_decimal(10, 10, 2).unwrap(),
-            col_decimal,
-            "col_decimal mismatch"
-        );
-        assert_eq!(
-            found_row.get_date(11).unwrap().get_inner(),
-            col_date.get_inner(),
-            "col_date mismatch"
-        );
-        assert_eq!(
-            found_row.get_time(12).unwrap().get_inner(),
-            col_time.get_inner(),
-            "col_time mismatch"
-        );
-        assert_eq!(
-            found_row
-                .get_timestamp_ntz(13, 6)
-                .unwrap()
-                .get_millisecond(),
-            col_timestamp.get_millisecond(),
-            "col_timestamp mismatch"
-        );
-        assert_eq!(
-            found_row
-                .get_timestamp_ltz(14, 6)
-                .unwrap()
-                .get_epoch_millisecond(),
-            col_timestamp_ltz.get_epoch_millisecond(),
-            "col_timestamp_ltz mismatch"
-        );
-        assert_eq!(
-            found_row.get_bytes(15).unwrap(),
-            col_bytes,
-            "col_bytes mismatch"
-        );
-        assert_eq!(
-            found_row.get_binary(16, 20).unwrap(),
-            col_binary,
-            "col_binary mismatch"
-        );
-        let arr = found_row.get_array(17).unwrap();
-        assert_eq!(arr.size(), 2, "col_array size mismatch");
-        assert_eq!(arr.get_string(0).unwrap(), "fluss", "col_array[0] mismatch");
-        assert_eq!(arr.get_string(1).unwrap(), "rust", "col_array[1] mismatch");
-        let nested = found_row.get_row(18).unwrap();
-        assert_eq!(nested.get_int(0).unwrap(), 7, "col_row.seq mismatch");
-        assert_eq!(
-            nested.get_string(1).unwrap(),
-            "lumiere",
-            "col_row.label mismatch"
-        );
-
-        // Test with null values for nullable columns
-        let pk_int_2 = 2i32;
-        let mut row_with_nulls = GenericRow::new(19);
-        row_with_nulls.set_field(0, pk_int_2);
-        row_with_nulls.set_field(1, Datum::Null); // col_boolean
-        row_with_nulls.set_field(2, Datum::Null); // col_tinyint
-        row_with_nulls.set_field(3, Datum::Null); // col_smallint
-        row_with_nulls.set_field(4, Datum::Null); // col_int
-        row_with_nulls.set_field(5, Datum::Null); // col_bigint
-        row_with_nulls.set_field(6, Datum::Null); // col_float
-        row_with_nulls.set_field(7, Datum::Null); // col_double
-        row_with_nulls.set_field(8, Datum::Null); // col_char
-        row_with_nulls.set_field(9, Datum::Null); // col_string
-        row_with_nulls.set_field(10, Datum::Null); // col_decimal
-        row_with_nulls.set_field(11, Datum::Null); // col_date
-        row_with_nulls.set_field(12, Datum::Null); // col_time
-        row_with_nulls.set_field(13, Datum::Null); // col_timestamp
-        row_with_nulls.set_field(14, Datum::Null); // col_timestamp_ltz
-        row_with_nulls.set_field(15, Datum::Null); // col_bytes
-        row_with_nulls.set_field(16, Datum::Null); // col_binary
-        row_with_nulls.set_field(17, Datum::Null); // col_array
-        row_with_nulls.set_field(18, Datum::Null); // col_row
-
-        upsert_writer
-            .upsert(&row_with_nulls)
-            .expect("Failed to upsert row with nulls")
-            .await
-            .expect("Failed to wait for upsert acknowledgment");
-
-        // Lookup row with nulls
-        let mut key2 = GenericRow::new(19);
-        key2.set_field(0, pk_int_2);
-
-        let result = lookuper.lookup(&key2).await.expect("Failed to lookup");
-        let found_row_nulls = result
-            .get_single_row()
-            .expect("Failed to get row")
-            .expect("Row should exist");
-
-        // Verify all nullable columns are null
-        assert_eq!(
-            found_row_nulls.get_int(0).unwrap(),
-            pk_int_2,
-            "pk_int mismatch"
-        );
-        assert!(
-            found_row_nulls.is_null_at(1).unwrap(),
-            "col_boolean should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(2).unwrap(),
-            "col_tinyint should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(3).unwrap(),
-            "col_smallint should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(4).unwrap(),
-            "col_int should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(5).unwrap(),
-            "col_bigint should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(6).unwrap(),
-            "col_float should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(7).unwrap(),
-            "col_double should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(8).unwrap(),
-            "col_char should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(9).unwrap(),
-            "col_string should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(10).unwrap(),
-            "col_decimal should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(11).unwrap(),
-            "col_date should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(12).unwrap(),
-            "col_time should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(13).unwrap(),
-            "col_timestamp should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(14).unwrap(),
-            "col_timestamp_ltz should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(15).unwrap(),
-            "col_bytes should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(16).unwrap(),
-            "col_binary should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(17).unwrap(),
-            "col_array should be null"
-        );
-        assert!(
-            found_row_nulls.is_null_at(18).unwrap(),
-            "col_row should be null"
-        );
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    #[tokio::test]
-    async fn upsert_and_lookup_with_row() {
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_kv_rows");
-        let nested_row_type = DataTypes::row(vec![
-            DataField::new("x", DataTypes::int(), None),
-            DataField::new("label", DataTypes::string(), None),
-        ]);
-        let deep_inner_row_type = DataTypes::row(vec![DataField::new("n", DataTypes::int(), None)]);
-        let deep_row_type =
-            DataTypes::row(vec![DataField::new("inner", deep_inner_row_type, None)]);
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(
-                Schema::builder()
-                    .column("id", DataTypes::int())
-                    .column("nested", nested_row_type)
-                    .column("deep", deep_row_type)
-                    .primary_key(vec!["id"])
-                    .build()
-                    .expect("Failed to build schema"),
-            )
-            .build()
-            .expect("Failed to build table descriptor");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let upsert = table.new_upsert().expect("Failed to create upsert");
-        let upsert_writer = upsert.create_writer().expect("Failed to create writer");
-
-        let mut nested1 = GenericRow::new(2);
-        nested1.set_field(0, 42_i32);
-        nested1.set_field(1, "hello");
-
-        let mut deep_inner1 = GenericRow::new(1);
-        deep_inner1.set_field(0, 99_i32);
-        let mut deep1 = GenericRow::new(1);
-        deep1.set_field(0, Datum::Row(Box::new(deep_inner1)));
-
-        let mut row1 = GenericRow::new(3);
-        row1.set_field(0, 1_i32);
-        row1.set_field(1, Datum::Row(Box::new(nested1)));
-        row1.set_field(2, Datum::Row(Box::new(deep1)));
-
-        upsert_writer
-            .upsert(&row1)
-            .expect("upsert row1")
-            .await
-            .expect("ack row1");
-
-        let mut nested2 = GenericRow::new(2);
-        nested2.set_field(0, 7_i32);
-        nested2.set_field(1, Datum::Null);
-
-        let mut row2 = GenericRow::new(3);
-        row2.set_field(0, 2_i32);
-        row2.set_field(1, Datum::Row(Box::new(nested2)));
-        row2.set_field(2, Datum::Null);
-
-        upsert_writer
-            .upsert(&row2)
-            .expect("upsert row2")
-            .await
-            .expect("ack row2");
-
-        let mut deep_inner3 = GenericRow::new(1);
-        deep_inner3.set_field(0, -1_i32);
-        let mut deep3 = GenericRow::new(1);
-        deep3.set_field(0, Datum::Row(Box::new(deep_inner3)));
-
-        let mut row3 = GenericRow::new(3);
-        row3.set_field(0, 3_i32);
-        row3.set_field(1, Datum::Null);
-        row3.set_field(2, Datum::Row(Box::new(deep3)));
-
-        upsert_writer
-            .upsert(&row3)
-            .expect("upsert row3")
-            .await
-            .expect("ack row3");
-
-        let mut lookuper = table
-            .new_lookup()
-            .expect("Failed to create lookup")
-            .create_lookuper()
-            .expect("Failed to create lookuper");
-
-        let result1 = lookuper
-            .lookup(&make_key_with_field_count(1, 3))
-            .await
-            .expect("lookup row1");
-        let r1 = result1
-            .get_single_row()
-            .expect("get row1")
-            .expect("row1 should exist");
-        assert_eq!(r1.get_int(0).unwrap(), 1);
-        let nested_r1 = r1.get_row(1).unwrap();
-        assert_eq!(nested_r1.get_int(0).unwrap(), 42);
-        assert_eq!(nested_r1.get_string(1).unwrap(), "hello");
-        let deep_r1 = r1.get_row(2).unwrap();
-        let deep_inner_r1 = deep_r1.get_row(0).unwrap();
-        assert_eq!(deep_inner_r1.get_int(0).unwrap(), 99);
-
-        let result2 = lookuper
-            .lookup(&make_key_with_field_count(2, 3))
-            .await
-            .expect("lookup row2");
-        let r2 = result2
-            .get_single_row()
-            .expect("get row2")
-            .expect("row2 should exist");
-        assert_eq!(r2.get_int(0).unwrap(), 2);
-        let nested_r2 = r2.get_row(1).unwrap();
-        assert_eq!(nested_r2.get_int(0).unwrap(), 7);
-        assert!(nested_r2.is_null_at(1).unwrap());
-        assert!(r2.is_null_at(2).unwrap());
-
-        let result3 = lookuper
-            .lookup(&make_key_with_field_count(3, 3))
-            .await
-            .expect("lookup row3");
-        let r3 = result3
-            .get_single_row()
-            .expect("get row3")
-            .expect("row3 should exist");
-        assert_eq!(r3.get_int(0).unwrap(), 3);
-        assert!(r3.is_null_at(1).unwrap());
-        let deep_r3 = r3.get_row(2).unwrap();
-        let deep_inner_r3 = deep_r3.get_row(0).unwrap();
-        assert_eq!(deep_inner_r3.get_int(0).unwrap(), -1);
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    #[tokio::test]
-    async fn upsert_and_lookup_with_array_of_row() {
-        use fluss::metadata::{DataField, DataType};
-
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_kv_array_of_row");
-
-        let event_row_type_owned = DataTypes::row(vec![
-            DataField::new("seq", DataTypes::int(), None),
-            DataField::new("label", DataTypes::string(), None),
-        ]);
-        let array_of_row_type = DataTypes::array(event_row_type_owned.clone());
-
-        let event_row_type = match &event_row_type_owned {
-            DataType::Row(rt) => rt.clone(),
-            _ => unreachable!(),
-        };
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(
-                Schema::builder()
-                    .column("id", DataTypes::int())
-                    .column("events", array_of_row_type.clone())
-                    .primary_key(vec!["id"])
-                    .build()
-                    .expect("Failed to build schema"),
-            )
-            .build()
-            .expect("Failed to build table descriptor");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let upsert = table.new_upsert().expect("Failed to create upsert");
-        let upsert_writer = upsert.create_writer().expect("Failed to create writer");
-
-        let mut events1 = FlussArrayWriter::new(2, &event_row_type_owned);
-        let mut e0 = GenericRow::new(2);
-        e0.set_field(0, 1_i32);
-        e0.set_field(1, "open");
-        events1.write_row(0, &e0).expect("write e0");
-        let mut e1 = GenericRow::new(2);
-        e1.set_field(0, 2_i32);
-        e1.set_field(1, "close");
-        events1.write_row(1, &e1).expect("write e1");
-        let events1 = events1.complete().expect("events1");
-
-        let mut row1 = GenericRow::new(2);
-        row1.set_field(0, 1_i32);
-        row1.set_field(1, events1);
-
-        upsert_writer
-            .upsert(&row1)
-            .expect("upsert row1")
-            .await
-            .expect("ack row1");
-
-        let mut events2 = FlussArrayWriter::new(3, &event_row_type_owned);
-        let mut e2 = GenericRow::new(2);
-        e2.set_field(0, 7_i32);
-        e2.set_field(1, "x");
-        events2.write_row(0, &e2).expect("write e2");
-        events2.set_null_at(1);
-        let mut e3 = GenericRow::new(2);
-        e3.set_field(0, 8_i32);
-        e3.set_field(1, "y");
-        events2.write_row(2, &e3).expect("write e3");
-        let events2 = events2.complete().expect("events2");
-
-        let mut row2 = GenericRow::new(2);
-        row2.set_field(0, 2_i32);
-        row2.set_field(1, events2);
-
-        upsert_writer
-            .upsert(&row2)
-            .expect("upsert row2")
-            .await
-            .expect("ack row2");
-
-        let mut row3 = GenericRow::new(2);
-        row3.set_field(0, 3_i32);
-        row3.set_field(1, Datum::Null);
-
-        upsert_writer
-            .upsert(&row3)
-            .expect("upsert row3")
-            .await
-            .expect("ack row3");
-
-        let mut lookuper = table
-            .new_lookup()
-            .expect("Failed to create lookup")
-            .create_lookuper()
-            .expect("Failed to create lookuper");
-
-        let result1 = lookuper
-            .lookup(&make_key_with_field_count(1, 2))
-            .await
-            .expect("lookup row1");
-        let r1 = result1
-            .get_single_row()
-            .expect("get row1")
-            .expect("row1 should exist");
-        assert_eq!(r1.get_int(0).unwrap(), 1);
-        let events_r1 = r1.get_array(1).unwrap();
-        assert_eq!(events_r1.size(), 2);
-        let e0_r1 = events_r1.get_row(0, &event_row_type).unwrap();
-        assert_eq!(e0_r1.get_int(0).unwrap(), 1);
-        assert_eq!(e0_r1.get_string(1).unwrap(), "open");
-        let e1_r1 = events_r1.get_row(1, &event_row_type).unwrap();
-        assert_eq!(e1_r1.get_int(0).unwrap(), 2);
-        assert_eq!(e1_r1.get_string(1).unwrap(), "close");
-
-        let result2 = lookuper
-            .lookup(&make_key_with_field_count(2, 2))
-            .await
-            .expect("lookup row2");
-        let r2 = result2
-            .get_single_row()
-            .expect("get row2")
-            .expect("row2 should exist");
-        let events_r2 = r2.get_array(1).unwrap();
-        assert_eq!(events_r2.size(), 3);
-        let e0_r2 = events_r2.get_row(0, &event_row_type).unwrap();
-        assert_eq!(e0_r2.get_int(0).unwrap(), 7);
-        assert_eq!(e0_r2.get_string(1).unwrap(), "x");
-        assert!(events_r2.is_null_at(1));
-        let e2_r2 = events_r2.get_row(2, &event_row_type).unwrap();
-        assert_eq!(e2_r2.get_int(0).unwrap(), 8);
-        assert_eq!(e2_r2.get_string(1).unwrap(), "y");
-
-        let result3 = lookuper
-            .lookup(&make_key_with_field_count(3, 2))
-            .await
-            .expect("lookup row3");
-        let r3 = result3
-            .get_single_row()
-            .expect("get row3")
-            .expect("row3 should exist");
-        assert_eq!(r3.get_int(0).unwrap(), 3);
-        assert!(r3.is_null_at(1).unwrap());
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
+            .expect("row exists");
+        assert_eq!(r.get_string(1).unwrap(), "Verso", "name preserved");
+        let n = r.get_row(3).unwrap();
+        assert_eq!(n.get_int(0).unwrap(), 99, "ROW preserved");
+        assert_eq!(r.get_map(4).unwrap().size(), 1, "MAP preserved");
+        let a = r.get_array(5).unwrap();
+        assert_eq!(a.size(), 1);
+        assert_eq!(a.get_string(0).unwrap(), "gamma-tag");
+
+        admin.drop_table(&table_path, false).await.expect("drop");
     }
 
+    /// Partitioned KV upsert, lookup, update, and delete with ROW, MAP, and ARRAY columns.
     #[tokio::test]
-    async fn upsert_and_lookup_with_array() {
+    async fn partitioned_table_upsert_and_lookup() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss", "test_kv_arrays");
-        let inner_array_type = DataTypes::array(DataTypes::int());
+        let table_path = TablePath::new("fluss", "test_partitioned_kv_table");
+
+        let nested_type = DataTypes::row(vec![
+            DataField::new("seq", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
 
         let table_descriptor = TableDescriptor::builder()
             .schema(
                 Schema::builder()
-                    .column("id", DataTypes::int())
+                    .column("region", DataTypes::string())
+                    .column("user_id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .column("score", DataTypes::bigint())
+                    .column("nested", nested_type)
+                    .column(
+                        "attrs",
+                        DataTypes::map(DataTypes::string(), DataTypes::int()),
+                    )
                     .column("tags", DataTypes::array(DataTypes::string()))
-                    .column("scores", DataTypes::array(DataTypes::int()))
-                    .column("matrix", DataTypes::array(inner_array_type.clone()))
-                    .primary_key(vec!["id"])
+                    .primary_key(vec!["region", "user_id"])
                     .build()
-                    .expect("Failed to build schema"),
+                    .expect("schema"),
             )
+            .partitioned_by(vec!["region"])
             .build()
-            .expect("Failed to build table descriptor");
+            .expect("table descriptor");
 
         create_table(&admin, &table_path, &table_descriptor).await;
+        create_partitions(&admin, &table_path, "region", &["US", "EU", "APAC"]).await;
 
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
+        let table = connection.get_table(&table_path).await.expect("table");
+        let table_upsert = table.new_upsert().expect("upsert");
+        let upsert_writer = table_upsert.create_writer().expect("writer");
 
-        let upsert = table.new_upsert().expect("Failed to create upsert");
-        let upsert_writer = upsert.create_writer().expect("Failed to create writer");
+        let test_data = [
+            ("US", 1_i32, "Gustave", 100_i64, 11_i32, "a", 1_i32, "alpha"),
+            ("US", 2, "Lune", 200, 22, "b", 2, "beta"),
+            ("EU", 1, "Sciel", 150, 33, "c", 3, "gamma"),
+            ("EU", 2, "Maelle", 250, 44, "d", 4, "delta"),
+            ("APAC", 1, "Noco", 300, 55, "e", 5, "epsilon"),
+        ];
 
-        let mut row1 = GenericRow::new(4);
-        row1.set_field(0, 1_i32);
-        row1.set_field(1, make_string_array(&[Some("hello"), Some("world")]));
-        row1.set_field(2, make_int_array(&[Some(10), Some(20), Some(30)]));
-        let m1 = {
-            let mut w = FlussArrayWriter::new(2, &inner_array_type);
-            w.write_array(0, &make_int_array(&[Some(1), Some(2)]));
-            w.write_array(1, &make_int_array(&[Some(3), Some(4)]));
-            w.complete().expect("matrix1")
-        };
-        row1.set_field(3, m1);
+        for (region, user_id, name, score, seq, label, attr_v, tag) in &test_data {
+            let mut nested = GenericRow::new(2);
+            nested.set_field(0, *seq);
+            nested.set_field(1, *label);
+            let attrs = {
+                let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::int());
+                w.write_entry((*label).into(), (*attr_v).into()).unwrap();
+                w.complete().expect("attrs")
+            };
+            let tags = make_string_array(&[Some(*tag)]);
+
+            let mut row = GenericRow::new(7);
+            row.set_field(0, *region);
+            row.set_field(1, *user_id);
+            row.set_field(2, *name);
+            row.set_field(3, *score);
+            row.set_field(4, Datum::Row(Box::new(nested)));
+            row.set_field(5, Datum::Map(attrs));
+            row.set_field(6, tags);
+            upsert_writer.upsert(&row).expect("upsert");
+        }
+        upsert_writer.flush().await.expect("flush");
 
-        upsert_writer
-            .upsert(&row1)
-            .expect("upsert row1")
-            .await
-            .expect("ack row1");
+        let mut lookuper = table
+            .new_lookup()
+            .expect("lookup")
+            .create_lookuper()
+            .expect("lookuper");
 
-        let mut row2 = GenericRow::new(4);
-        row2.set_field(0, 2_i32);
-        row2.set_field(1, make_string_array(&[None]));
-        row2.set_field(2, make_int_array(&[]));
-        row2.set_field(3, Datum::Null);
+        // === Per-partition lookup verifies all compound columns ===
+        for (region, user_id, name, score, seq, label, attr_v, tag) in &test_data {
+            let mut key = GenericRow::new(7);
+            key.set_field(0, *region);
+            key.set_field(1, *user_id);
 
-        upsert_writer
-            .upsert(&row2)
-            .expect("upsert row2")
-            .await
-            .expect("ack row2");
+            let result = lookuper.lookup(&key).await.expect("lookup");
+            let row = result
+                .get_single_row()
+                .expect("get row")
+                .expect("row exists");
 
-        let mut row3 = GenericRow::new(4);
-        row3.set_field(0, 3_i32);
-        row3.set_field(1, Datum::Null);
-        row3.set_field(2, make_int_array(&[Some(42)]));
-        let m3 = {
-            let mut w = FlussArrayWriter::new(3, &inner_array_type);
-            w.write_array(0, &make_int_array(&[Some(5)]));
-            w.set_null_at(1);
-            w.write_array(2, &make_int_array(&[]));
-            w.complete().expect("matrix3")
-        };
-        row3.set_field(3, m3);
+            assert_eq!(row.get_string(0).unwrap(), *region);
+            assert_eq!(row.get_int(1).unwrap(), *user_id);
+            assert_eq!(row.get_string(2).unwrap(), *name);
+            assert_eq!(row.get_long(3).unwrap(), *score);
+            let nested = row.get_row(4).unwrap();
+            assert_eq!(nested.get_int(0).unwrap(), *seq);
+            assert_eq!(nested.get_string(1).unwrap(), *label);
+            let attrs = row.get_map(5).unwrap();
+            assert_eq!(attrs.size(), 1);
+            assert_eq!(
+                attrs.get(&Datum::from(*label)).unwrap(),
+                Some(Datum::from(*attr_v))
+            );
+            let tags = row.get_array(6).unwrap();
+            assert_eq!(tags.size(), 1);
+            assert_eq!(tags.get_string(0).unwrap(), *tag);
+        }
 
+        // === Update a row in US partition ===
+        let mut updated_nested = GenericRow::new(2);
+        updated_nested.set_field(0, 999_i32);
+        updated_nested.set_field(1, "updated");
+        let updated_attrs = {
+            let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::int());
+            w.write_entry("u".into(), 999.into()).unwrap();
+            w.complete().expect("updated_attrs")
+        };
+        let updated_tags = make_string_array(&[Some("renamed")]);
+        let mut updated_row = GenericRow::new(7);
+        updated_row.set_field(0, "US");
+        updated_row.set_field(1, 1);
+        updated_row.set_field(2, "Gustave Updated");
+        updated_row.set_field(3, 999_i64);
+        updated_row.set_field(4, Datum::Row(Box::new(updated_nested)));
+        updated_row.set_field(5, Datum::Map(updated_attrs));
+        updated_row.set_field(6, updated_tags);
         upsert_writer
-            .upsert(&row3)
-            .expect("upsert row3")
+            .upsert(&updated_row)
+            .expect("upsert updated")
             .await
-            .expect("ack row3");
-
-        // Lookup and verify
-        let mut lookuper = table
-            .new_lookup()
-            .expect("Failed to create lookup")
-            .create_lookuper()
-            .expect("Failed to create lookuper");
+            .expect("ack updated");
 
-        let result1 = lookuper
-            .lookup(&make_key_with_field_count(1, 4))
-            .await
-            .expect("lookup row1");
-        let r1 = result1
+        let mut key = GenericRow::new(7);
+        key.set_field(0, "US");
+        key.set_field(1, 1);
+        let result = lookuper.lookup(&key).await.expect("lookup");
+        let row = result
             .get_single_row()
-            .expect("get row1")
-            .expect("row1 should exist");
-        assert_eq!(r1.get_int(0).unwrap(), 1);
-        let tags_r1 = r1.get_array(1).unwrap();
-        assert_eq!(tags_r1.size(), 2);
-        assert_eq!(tags_r1.get_string(0).unwrap(), "hello");
-        assert_eq!(tags_r1.get_string(1).unwrap(), "world");
-        let scores_r1 = r1.get_array(2).unwrap();
-        assert_eq!(scores_r1.size(), 3);
-        assert_eq!(scores_r1.get_int(0).unwrap(), 10);
-        assert_eq!(scores_r1.get_int(1).unwrap(), 20);
-        assert_eq!(scores_r1.get_int(2).unwrap(), 30);
-        let matrix_r1: FlussArray = r1.get_array(3).unwrap();
-        assert_eq!(matrix_r1.size(), 2);
-        let mr1_0 = matrix_r1.get_array(0).unwrap();
-        assert_eq!(mr1_0.size(), 2);
-        assert_eq!(mr1_0.get_int(0).unwrap(), 1);
-        assert_eq!(mr1_0.get_int(1).unwrap(), 2);
-        let mr1_1 = matrix_r1.get_array(1).unwrap();
-        assert_eq!(mr1_1.size(), 2);
-        assert_eq!(mr1_1.get_int(0).unwrap(), 3);
-        assert_eq!(mr1_1.get_int(1).unwrap(), 4);
-
-        let result2 = lookuper
-            .lookup(&make_key_with_field_count(2, 4))
+            .expect("get row")
+            .expect("row exists");
+        assert_eq!(row.get_string(2).unwrap(), "Gustave Updated");
+        assert_eq!(row.get_long(3).unwrap(), 999);
+        let nested = row.get_row(4).unwrap();
+        assert_eq!(nested.get_int(0).unwrap(), 999);
+        let attrs = row.get_map(5).unwrap();
+        assert_eq!(
+            attrs.get(&Datum::from("u")).unwrap(),
+            Some(Datum::from(999_i32))
+        );
+        let tags = row.get_array(6).unwrap();
+        assert_eq!(tags.get_string(0).unwrap(), "renamed");
+
+        // === Lookup in non-existent partition returns None ===
+        let mut missing = GenericRow::new(7);
+        missing.set_field(0, "UNKNOWN_REGION");
+        missing.set_field(1, 1);
+        let result = lookuper
+            .lookup(&missing)
             .await
-            .expect("lookup row2");
-        let r2 = result2
-            .get_single_row()
-            .expect("get row2")
-            .expect("row2 should exist");
-        assert_eq!(r2.get_int(0).unwrap(), 2);
-        let tags_r2 = r2.get_array(1).unwrap();
-        assert_eq!(tags_r2.size(), 1);
-        assert!(tags_r2.is_null_at(0));
-        let scores_r2 = r2.get_array(2).unwrap();
-        assert_eq!(scores_r2.size(), 0);
-        assert!(r2.is_null_at(3).unwrap());
-
-        let result3 = lookuper
-            .lookup(&make_key_with_field_count(3, 4))
+            .expect("lookup unknown partition");
+        assert!(result.get_single_row().expect("get").is_none());
+
+        // === Delete a row within a partition ===
+        let mut delete_key = GenericRow::new(7);
+        delete_key.set_field(0, "EU");
+        delete_key.set_field(1, 1);
+        upsert_writer
+            .delete(&delete_key)
+            .expect("delete")
             .await
-            .expect("lookup row3");
-        let r3 = result3
+            .expect("ack delete");
+        let mut key = GenericRow::new(7);
+        key.set_field(0, "EU");
+        key.set_field(1, 1);
+        let result = lookuper.lookup(&key).await.expect("lookup");
+        assert!(result.get_single_row().expect("get").is_none());
+
+        // === Sibling row in same partition still exists ===
+        let mut key = GenericRow::new(7);
+        key.set_field(0, "EU");
+        key.set_field(1, 2);
+        let result = lookuper.lookup(&key).await.expect("lookup");
+        let row = result
             .get_single_row()
-            .expect("get row3")
-            .expect("row3 should exist");
-        assert_eq!(r3.get_int(0).unwrap(), 3);
-        assert!(r3.is_null_at(1).unwrap());
-        let scores_r3 = r3.get_array(2).unwrap();
-        assert_eq!(scores_r3.size(), 1);
-        assert_eq!(scores_r3.get_int(0).unwrap(), 42);
-        let matrix_r3 = r3.get_array(3).unwrap();
-        assert_eq!(matrix_r3.size(), 3);
-        let mr3_0 = matrix_r3.get_array(0).unwrap();
-        assert_eq!(mr3_0.size(), 1);
-        assert_eq!(mr3_0.get_int(0).unwrap(), 5);
-        assert!(matrix_r3.is_null_at(1));
-        let mr3_2 = matrix_r3.get_array(2).unwrap();
-        assert_eq!(mr3_2.size(), 0);
+            .expect("get row")
+            .expect("row exists");
+        assert_eq!(row.get_string(2).unwrap(), "Maelle");
+        assert_eq!(row.get_array(6).unwrap().get_string(0).unwrap(), "delta");
 
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
+        admin.drop_table(&table_path, false).await.expect("drop");
     }
 
+    // Put/get coverage for all supported datatypes lives in `all_supported_datatypes`.
     /// Integration test for concurrent batched lookups across partitions.
     #[tokio::test]
     async fn batched_concurrent_lookups_partitioned() {
-        use futures::stream::{FuturesUnordered, StreamExt};
-
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
@@ -1977,8 +1055,6 @@ mod kv_table_test {
     /// Integration test for concurrent batched lookups.
     #[tokio::test]
     async fn batched_concurrent_lookups() {
-        use futures::stream::{FuturesUnordered, StreamExt};
-
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
 
@@ -2175,4 +1251,522 @@ mod kv_table_test {
             .await
             .expect("Failed to drop table");
     }
+
+    /// KV upsert + lookup against a schema covering every supported data type.
+    #[tokio::test]
+    async fn all_supported_datatypes() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+
+        let table_path = TablePath::new("fluss", "test_kv_complex_types");
+
+        let row_seq_label_owned = dt_row_seq_label();
+        let row_seq_label = as_row_type(&row_seq_label_owned);
+        let inner_array_int = dt_array_int();
+        let inner_map_string_int = dt_map_string_int();
+
+        let plan = ColumnPlan::new()
+            .add("id", DataTypes::int())
+            .start_section("array_basics")
+            .extend(array_dt_basics_columns())
+            .start_section("row_basics")
+            .extend(row_dt_basics_columns())
+            .start_section("map_basics")
+            .extend(map_dt_basics_columns())
+            .start_section("scalars")
+            .extend(scalar_dt_columns());
+        let table_descriptor = TableDescriptor::builder()
+            .schema(plan.build_schema(Some(&["id"])))
+            .build()
+            .expect("table descriptor");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+
+        let table = connection.get_table(&table_path).await.expect("table");
+        let upsert_writer = table
+            .new_upsert()
+            .expect("upsert")
+            .create_writer()
+            .expect("writer");
+
+        // Row 1 (id=1) — comprehensive: every column populated.
+        let column_count = plan.len();
+        let mut row1 = GenericRow::new(column_count);
+        row1.set_field(0, 1_i32);
+        row1.set_field(1, make_int_array(&[Some(10), Some(20), Some(30)]));
+        row1.set_field(2, make_string_array(&[Some("hello"), Some("world")]));
+        let arr_of_arr_1 = {
+            let mut w = FlussArrayWriter::new(2, &inner_array_int);
+            w.write_array(0, &make_int_array(&[Some(1), Some(2)]));
+            w.write_array(1, &make_int_array(&[Some(3), Some(4)]));
+            w.complete().expect("arr_of_arr_1")
+        };
+        row1.set_field(3, arr_of_arr_1);
+        let arr_of_row_1 = {
+            let mut w = FlussArrayWriter::new(2, &row_seq_label_owned);
+            let mut e0 = GenericRow::new(2);
+            e0.set_field(0, 1_i32);
+            e0.set_field(1, "open");
+            w.write_row(0, &e0).expect("e0");
+            let mut e1 = GenericRow::new(2);
+            e1.set_field(0, 2_i32);
+            e1.set_field(1, "close");
+            w.write_row(1, &e1).expect("e1");
+            w.complete().expect("arr_of_row_1")
+        };
+        row1.set_field(4, arr_of_row_1);
+        let mut row_basic_1 = GenericRow::new(2);
+        row_basic_1.set_field(0, 42_i32);
+        row_basic_1.set_field(1, "hello");
+        row1.set_field(5, Datum::Row(Box::new(row_basic_1)));
+        let mut deep_inner_1 = GenericRow::new(1);
+        deep_inner_1.set_field(0, 99_i32);
+        let mut row_deep_1 = GenericRow::new(1);
+        row_deep_1.set_field(0, Datum::Row(Box::new(deep_inner_1)));
+        row1.set_field(6, Datum::Row(Box::new(row_deep_1)));
+        let mut row_rich_1 = GenericRow::new(14);
+        row_rich_1.set_field(0, true);
+        row_rich_1.set_field(1, 100_000_i32);
+        row_rich_1.set_field(2, 9_876_543_210_i64);
+        row_rich_1.set_field(3, f32::INFINITY);
+        row_rich_1.set_field(4, std::f64::consts::PI);
+        row_rich_1.set_field(5, "hello world");
+        row_rich_1.set_field(6, b"binary".as_slice());
+        row_rich_1.set_field(7, Decimal::from_unscaled_long(12345, 10, 2).unwrap());
+        row_rich_1.set_field(8, Datum::Date(Date::new(20476)));
+        row_rich_1.set_field(9, Datum::Time(Time::new(36_827_123)));
+        row_rich_1.set_field(
+            10,
+            Datum::TimestampNtz(TimestampNtz::new(1_769_163_227_123)),
+        );
+        row_rich_1.set_field(
+            11,
+            Datum::TimestampLtz(TimestampLtz::new(1_769_163_227_456)),
+        );
+        row_rich_1.set_field(12, b"\x01\x02\x03\x04".as_slice());
+        row_rich_1.set_field(13, make_int_array(&[Some(7), None, Some(11)]));
+        row1.set_field(7, Datum::Row(Box::new(row_rich_1)));
+        let map_string_int_1 = {
+            let mut w = FlussMapWriter::new(3, &DataTypes::string(), &DataTypes::int());
+            w.write_entry("a".into(), 1.into()).unwrap();
+            w.write_entry("b".into(), Datum::Null).unwrap();
+            w.write_entry("c".into(), 3.into()).unwrap();
+            w.complete().expect("map_string_int_1")
+        };
+        row1.set_field(8, Datum::Map(map_string_int_1));
+        let map_of_row_1 = {
+            let mut e0 = GenericRow::new(2);
+            e0.set_field(0, 1_i32);
+            e0.set_field(1, "open");
+            let mut e1 = GenericRow::new(2);
+            e1.set_field(0, 2_i32);
+            e1.set_field(1, "close");
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &row_seq_label_owned);
+            w.write_entry("e0".into(), Datum::Row(Box::new(e0)))
+                .unwrap();
+            w.write_entry("e1".into(), Datum::Row(Box::new(e1)))
+                .unwrap();
+            w.complete().expect("map_of_row_1")
+        };
+        row1.set_field(9, Datum::Map(map_of_row_1));
+        let map_of_map_1 = {
+            let g1 = {
+                let mut w = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::int());
+                w.write_entry("a".into(), 1.into()).unwrap();
+                w.write_entry("b".into(), 2.into()).unwrap();
+                w.complete().expect("g1")
+            };
+            let g2 = {
+                let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::int());
+                w.write_entry("c".into(), 3.into()).unwrap();
+                w.complete().expect("g2")
+            };
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &inner_map_string_int);
+            w.write_entry("g1".into(), Datum::Map(g1)).unwrap();
+            w.write_entry("g2".into(), Datum::Map(g2)).unwrap();
+            w.complete().expect("map_of_map_1")
+        };
+        row1.set_field(10, Datum::Map(map_of_map_1));
+        let map_of_array_1 = {
+            let primes = make_int_array(&[Some(2), Some(3), Some(5)]);
+            let squares = make_int_array(&[Some(1), Some(4)]);
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &inner_array_int);
+            w.write_entry("primes".into(), Datum::Array(primes))
+                .unwrap();
+            w.write_entry("squares".into(), Datum::Array(squares))
+                .unwrap();
+            w.complete().expect("map_of_array_1")
+        };
+        row1.set_field(11, Datum::Map(map_of_array_1));
+        let array_of_map_1 = {
+            let m0 = {
+                let mut w = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::int());
+                w.write_entry("x".into(), 1.into()).unwrap();
+                w.write_entry("y".into(), 2.into()).unwrap();
+                w.complete().expect("m0")
+            };
+            let m1 = {
+                let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::int());
+                w.write_entry("z".into(), 9.into()).unwrap();
+                w.complete().expect("m1")
+            };
+            let mut w = FlussArrayWriter::new(2, &inner_map_string_int);
+            w.write_map(0, &m0);
+            w.write_map(1, &m1);
+            w.complete().expect("array_of_map_1")
+        };
+        row1.set_field(12, array_of_map_1);
+
+        // Scalar values for row 1.
+        let s_tinyint = 127_i8;
+        let s_smallint = 32_767_i16;
+        let s_bigint = 9_223_372_036_854_775_807_i64;
+        let s_float = std::f32::consts::PI;
+        let s_double = std::f64::consts::E;
+        let s_char = "hello";
+        let s_string = "world of fluss rust client";
+        let s_decimal = Decimal::from_unscaled_long(12345, 10, 2).unwrap();
+        let s_date = Date::new(20476);
+        let s_time_s = Time::new(36_827_000);
+        let s_time_ms = Time::new(36_827_123);
+        let s_time_us = Time::new(86_399_999);
+        let s_time_ns = Time::new(1);
+        let s_ts_s = TimestampNtz::new(1_769_163_227_000);
+        let s_ts_ms = TimestampNtz::new(1_769_163_227_123);
+        let s_ts_us = TimestampNtz::from_millis_nanos(1_769_163_227_123, 456_000).unwrap();
+        let s_ts_ns = TimestampNtz::from_millis_nanos(1_769_163_227_123, 999_999).unwrap();
+        let s_ts_ltz_s = TimestampLtz::new(1_769_163_227_000);
+        let s_ts_ltz_ms = TimestampLtz::new(1_769_163_227_123);
+        let s_ts_ltz_us = TimestampLtz::from_millis_nanos(1_769_163_227_123, 456_000).unwrap();
+        let s_ts_ltz_ns = TimestampLtz::from_millis_nanos(1_769_163_227_123, 999_999).unwrap();
+        let s_bytes_top: Vec<u8> = b"binary data".to_vec();
+        let s_binary_top: Vec<u8> = vec![0xDE, 0xAD, 0xBE, 0xEF];
+        let s_ts_us_neg = TimestampNtz::from_millis_nanos(-301_234_154_877, 456_000).unwrap();
+        let s_ts_ns_neg = TimestampNtz::from_millis_nanos(-301_234_154_877, 999_999).unwrap();
+        let s_ts_ltz_us_neg = TimestampLtz::from_millis_nanos(-301_234_154_877, 456_000).unwrap();
+        let s_ts_ltz_ns_neg = TimestampLtz::from_millis_nanos(-301_234_154_877, 999_999).unwrap();
+
+        row1.set_field(plan.idx("col_tinyint"), s_tinyint);
+        row1.set_field(plan.idx("col_smallint"), s_smallint);
+        row1.set_field(plan.idx("col_bigint"), s_bigint);
+        row1.set_field(plan.idx("col_float"), s_float);
+        row1.set_field(plan.idx("col_double"), s_double);
+        row1.set_field(plan.idx("col_boolean"), true);
+        row1.set_field(plan.idx("col_char"), s_char);
+        row1.set_field(plan.idx("col_string"), s_string);
+        row1.set_field(plan.idx("col_decimal"), s_decimal.clone());
+        row1.set_field(plan.idx("col_date"), Datum::Date(s_date));
+        row1.set_field(plan.idx("col_time_s"), s_time_s);
+        row1.set_field(plan.idx("col_time_ms"), s_time_ms);
+        row1.set_field(plan.idx("col_time_us"), s_time_us);
+        row1.set_field(plan.idx("col_time_ns"), s_time_ns);
+        row1.set_field(plan.idx("col_ts_s"), s_ts_s);
+        row1.set_field(plan.idx("col_ts_ms"), s_ts_ms);
+        row1.set_field(plan.idx("col_ts_us"), s_ts_us);
+        row1.set_field(plan.idx("col_ts_ns"), s_ts_ns);
+        row1.set_field(plan.idx("col_ts_ltz_s"), s_ts_ltz_s);
+        row1.set_field(plan.idx("col_ts_ltz_ms"), s_ts_ltz_ms);
+        row1.set_field(plan.idx("col_ts_ltz_us"), s_ts_ltz_us);
+        row1.set_field(plan.idx("col_ts_ltz_ns"), s_ts_ltz_ns);
+        row1.set_field(plan.idx("col_bytes_top"), s_bytes_top.as_slice());
+        row1.set_field(plan.idx("col_binary_top"), s_binary_top.as_slice());
+        row1.set_field(plan.idx("col_ts_us_neg"), s_ts_us_neg);
+        row1.set_field(plan.idx("col_ts_ns_neg"), s_ts_ns_neg);
+        row1.set_field(plan.idx("col_ts_ltz_us_neg"), s_ts_ltz_us_neg);
+        row1.set_field(plan.idx("col_ts_ltz_ns_neg"), s_ts_ltz_ns_neg);
+
+        upsert_writer
+            .upsert(&row1)
+            .expect("upsert row1")
+            .await
+            .expect("ack row1");
+
+        // Row 2 (id=2) — empty MAP, all other compound + scalar columns NULL.
+        let mut row2 = GenericRow::new(column_count);
+        row2.set_field(0, 2_i32);
+        for i in 1..column_count {
+            row2.set_field(i, Datum::Null);
+        }
+        let empty_map = FlussMapWriter::new(0, &DataTypes::string(), &DataTypes::int())
+            .complete()
+            .expect("empty_map");
+        row2.set_field(plan.idx("map_string_int"), Datum::Map(empty_map));
+        upsert_writer
+            .upsert(&row2)
+            .expect("upsert row2")
+            .await
+            .expect("ack row2");
+
+        // Row 3 (id=3) — every compound + scalar column NULL.
+        let mut row3 = GenericRow::new(column_count);
+        row3.set_field(0, 3_i32);
+        for i in 1..column_count {
+            row3.set_field(i, Datum::Null);
+        }
+        upsert_writer
+            .upsert(&row3)
+            .expect("upsert row3")
+            .await
+            .expect("ack row3");
+
+        let mut lookuper = table
+            .new_lookup()
+            .expect("lookup")
+            .create_lookuper()
+            .expect("lookuper");
+
+        let result1 = lookuper.lookup(&make_key(1)).await.expect("lookup row1");
+        let r1 = result1
+            .get_single_row()
+            .expect("row1")
+            .expect("row1 exists");
+        assert_eq!(r1.get_int(0).unwrap(), 1);
+
+        // === ARRAY: basic shapes ===
+        let arr_int = r1.get_array(1).unwrap();
+        assert_eq!(arr_int.size(), 3);
+        assert_eq!(arr_int.get_int(2).unwrap(), 30);
+        let arr_string = r1.get_array(2).unwrap();
+        assert_eq!(arr_string.size(), 2);
+        assert_eq!(arr_string.get_string(0).unwrap(), "hello");
+        let arr_of_arr = r1.get_array(3).unwrap();
+        assert_eq!(arr_of_arr.size(), 2);
+        assert_eq!(arr_of_arr.get_array(1).unwrap().get_int(1).unwrap(), 4);
+
+        // === ARRAY<ROW> ===
+        let aor = r1.get_array(4).unwrap();
+        assert_eq!(aor.size(), 2);
+        let e0 = aor.get_row(0, &row_seq_label).unwrap();
+        assert_eq!(e0.get_int(0).unwrap(), 1);
+        assert_eq!(e0.get_string(1).unwrap(), "open");
+
+        // === ROW: basic + deep + rich ===
+        let rb = r1.get_row(5).unwrap();
+        assert_eq!(rb.get_int(0).unwrap(), 42);
+        assert_eq!(rb.get_string(1).unwrap(), "hello");
+        let rd = r1.get_row(6).unwrap();
+        let rd_inner = rd.get_row(0).unwrap();
+        assert_eq!(rd_inner.get_int(0).unwrap(), 99);
+        let rr = r1.get_row(7).unwrap();
+        assert!(rr.get_boolean(0).unwrap());
+        assert_eq!(rr.get_int(1).unwrap(), 100_000);
+        assert_eq!(rr.get_long(2).unwrap(), 9_876_543_210);
+        assert!(rr.get_float(3).unwrap().is_infinite());
+        assert!((rr.get_double(4).unwrap() - std::f64::consts::PI).abs() < f64::EPSILON);
+        assert_eq!(rr.get_string(5).unwrap(), "hello world");
+        assert_eq!(rr.get_bytes(6).unwrap(), b"binary");
+        assert_eq!(
+            rr.get_decimal(7, 10, 2).unwrap(),
+            Decimal::from_unscaled_long(12345, 10, 2).unwrap()
+        );
+        assert_eq!(rr.get_date(8).unwrap().get_inner(), 20476);
+        assert_eq!(rr.get_time(9).unwrap().get_inner(), 36_827_123);
+        assert_eq!(
+            rr.get_timestamp_ntz(10, 6).unwrap().get_millisecond(),
+            1_769_163_227_123
+        );
+        assert_eq!(
+            rr.get_timestamp_ltz(11, 6).unwrap().get_epoch_millisecond(),
+            1_769_163_227_456
+        );
+        assert_eq!(rr.get_binary(12, 4).unwrap(), b"\x01\x02\x03\x04");
+        let f_arr = rr.get_array(13).unwrap();
+        assert_eq!(f_arr.size(), 3);
+        assert!(f_arr.is_null_at(1));
+
+        // === MAP: basic ===
+        let m = r1.get_map(8).unwrap();
+        assert_eq!(m.size(), 3);
+        assert_eq!(m.get(&Datum::from("a")).unwrap(), Some(Datum::from(1_i32)));
+        assert_eq!(m.get(&Datum::from("b")).unwrap(), Some(Datum::Null));
+        assert_eq!(m.get(&Datum::from("c")).unwrap(), Some(Datum::from(3_i32)));
+
+        // === MAP<K, ROW> ===
+        let m = r1.get_map(9).unwrap();
+        let v0 = m.value_array().get_row(0, &row_seq_label).unwrap();
+        assert_eq!(v0.get_int(0).unwrap(), 1);
+        assert_eq!(v0.get_string(1).unwrap(), "open");
+
+        // === MAP<K, MAP> ===
+        let m = r1.get_map(10).unwrap();
+        let g1 = m
+            .value_array()
+            .get_map(0, &DataTypes::string(), &DataTypes::int())
+            .unwrap();
+        assert_eq!(g1.size(), 2);
+
+        // === MAP<K, ARRAY> + ARRAY<MAP> ===
+        let m = r1.get_map(11).unwrap();
+        assert_eq!(m.value_array().get_array(0).unwrap().size(), 3);
+        let am = r1.get_array(12).unwrap();
+        assert_eq!(am.size(), 2);
+        let am0 = am
+            .get_map(0, &DataTypes::string(), &DataTypes::int())
+            .unwrap();
+        assert_eq!(am0.size(), 2);
+
+        // === Scalars: integers + floating point ===
+        assert_eq!(r1.get_byte(plan.idx("col_tinyint")).unwrap(), s_tinyint);
+        assert_eq!(r1.get_short(plan.idx("col_smallint")).unwrap(), s_smallint);
+        assert_eq!(r1.get_long(plan.idx("col_bigint")).unwrap(), s_bigint);
+        assert!((r1.get_float(plan.idx("col_float")).unwrap() - s_float).abs() < f32::EPSILON);
+        assert!((r1.get_double(plan.idx("col_double")).unwrap() - s_double).abs() < f64::EPSILON);
+
+        // === Scalars: boolean / char / string / decimal / date ===
+        assert!(r1.get_boolean(plan.idx("col_boolean")).unwrap());
+        assert_eq!(r1.get_char(plan.idx("col_char"), 10).unwrap(), s_char);
+        assert_eq!(r1.get_string(plan.idx("col_string")).unwrap(), s_string);
+        assert_eq!(
+            r1.get_decimal(plan.idx("col_decimal"), 10, 2).unwrap(),
+            s_decimal
+        );
+        assert_eq!(
+            r1.get_date(plan.idx("col_date")).unwrap().get_inner(),
+            s_date.get_inner()
+        );
+
+        // === Scalars: time across all four precisions ===
+        assert_eq!(
+            r1.get_time(plan.idx("col_time_s")).unwrap().get_inner(),
+            s_time_s.get_inner()
+        );
+        assert_eq!(
+            r1.get_time(plan.idx("col_time_ms")).unwrap().get_inner(),
+            s_time_ms.get_inner()
+        );
+        assert_eq!(
+            r1.get_time(plan.idx("col_time_us")).unwrap().get_inner(),
+            s_time_us.get_inner()
+        );
+        assert_eq!(
+            r1.get_time(plan.idx("col_time_ns")).unwrap().get_inner(),
+            s_time_ns.get_inner()
+        );
+
+        // === Scalars: timestamp across all four precisions ===
+        assert_eq!(
+            r1.get_timestamp_ntz(plan.idx("col_ts_s"), 0)
+                .unwrap()
+                .get_millisecond(),
+            s_ts_s.get_millisecond()
+        );
+        assert_eq!(
+            r1.get_timestamp_ntz(plan.idx("col_ts_ms"), 3)
+                .unwrap()
+                .get_millisecond(),
+            s_ts_ms.get_millisecond()
+        );
+        let read_ts_us = r1.get_timestamp_ntz(plan.idx("col_ts_us"), 6).unwrap();
+        assert_eq!(read_ts_us.get_millisecond(), s_ts_us.get_millisecond());
+        assert_eq!(
+            read_ts_us.get_nano_of_millisecond(),
+            s_ts_us.get_nano_of_millisecond()
+        );
+        let read_ts_ns = r1.get_timestamp_ntz(plan.idx("col_ts_ns"), 9).unwrap();
+        assert_eq!(read_ts_ns.get_millisecond(), s_ts_ns.get_millisecond());
+        assert_eq!(
+            read_ts_ns.get_nano_of_millisecond(),
+            s_ts_ns.get_nano_of_millisecond()
+        );
+
+        // === Scalars: timestamp_ltz across all four precisions ===
+        assert_eq!(
+            r1.get_timestamp_ltz(plan.idx("col_ts_ltz_s"), 0)
+                .unwrap()
+                .get_epoch_millisecond(),
+            s_ts_ltz_s.get_epoch_millisecond()
+        );
+        assert_eq!(
+            r1.get_timestamp_ltz(plan.idx("col_ts_ltz_ms"), 3)
+                .unwrap()
+                .get_epoch_millisecond(),
+            s_ts_ltz_ms.get_epoch_millisecond()
+        );
+        let read_ltz_us = r1.get_timestamp_ltz(plan.idx("col_ts_ltz_us"), 6).unwrap();
+        assert_eq!(
+            read_ltz_us.get_epoch_millisecond(),
+            s_ts_ltz_us.get_epoch_millisecond()
+        );
+        assert_eq!(
+            read_ltz_us.get_nano_of_millisecond(),
+            s_ts_ltz_us.get_nano_of_millisecond()
+        );
+        let read_ltz_ns = r1.get_timestamp_ltz(plan.idx("col_ts_ltz_ns"), 9).unwrap();
+        assert_eq!(
+            read_ltz_ns.get_epoch_millisecond(),
+            s_ts_ltz_ns.get_epoch_millisecond()
+        );
+        assert_eq!(
+            read_ltz_ns.get_nano_of_millisecond(),
+            s_ts_ltz_ns.get_nano_of_millisecond()
+        );
+
+        // === Scalars: bytes + fixed binary ===
+        assert_eq!(
+            r1.get_bytes(plan.idx("col_bytes_top")).unwrap(),
+            s_bytes_top.as_slice()
+        );
+        assert_eq!(
+            r1.get_binary(plan.idx("col_binary_top"), 4).unwrap(),
+            s_binary_top.as_slice()
+        );
+
+        // === Scalars: negative-epoch timestamps (pre-1970) ===
+        let read_neg_us = r1.get_timestamp_ntz(plan.idx("col_ts_us_neg"), 6).unwrap();
+        assert_eq!(read_neg_us.get_millisecond(), s_ts_us_neg.get_millisecond());
+        assert_eq!(
+            read_neg_us.get_nano_of_millisecond(),
+            s_ts_us_neg.get_nano_of_millisecond()
+        );
+        let read_neg_ns = r1.get_timestamp_ntz(plan.idx("col_ts_ns_neg"), 9).unwrap();
+        assert_eq!(read_neg_ns.get_millisecond(), s_ts_ns_neg.get_millisecond());
+        assert_eq!(
+            read_neg_ns.get_nano_of_millisecond(),
+            s_ts_ns_neg.get_nano_of_millisecond()
+        );
+        let read_neg_ltz_us = r1
+            .get_timestamp_ltz(plan.idx("col_ts_ltz_us_neg"), 6)
+            .unwrap();
+        assert_eq!(
+            read_neg_ltz_us.get_epoch_millisecond(),
+            s_ts_ltz_us_neg.get_epoch_millisecond()
+        );
+        let read_neg_ltz_ns = r1
+            .get_timestamp_ltz(plan.idx("col_ts_ltz_ns_neg"), 9)
+            .unwrap();
+        assert_eq!(
+            read_neg_ltz_ns.get_epoch_millisecond(),
+            s_ts_ltz_ns_neg.get_epoch_millisecond()
+        );
+
+        // === Row 2 lookup — empty map, all other columns NULL ===
+        let result2 = lookuper.lookup(&make_key(2)).await.expect("lookup row2");
+        let r2 = result2
+            .get_single_row()
+            .expect("row2")
+            .expect("row2 exists");
+        assert_eq!(r2.get_int(0).unwrap(), 2);
+        let map_idx = plan.idx("map_string_int");
+        for i in 1..column_count {
+            if i == map_idx {
+                assert_eq!(r2.get_map(map_idx).unwrap().size(), 0);
+            } else {
+                assert!(r2.is_null_at(i).unwrap(), "field {i} should be null");
+            }
+        }
+
+        // === Row 3 lookup — every compound + scalar field NULL ===
+        let result3 = lookuper.lookup(&make_key(3)).await.expect("lookup row3");
+        let r3 = result3
+            .get_single_row()
+            .expect("row3")
+            .expect("row3 exists");
+        assert_eq!(r3.get_int(0).unwrap(), 3);
+        for i in 1..column_count {
+            assert!(r3.is_null_at(i).unwrap(), "field {i} should be null");
+        }
+
+        admin.drop_table(&table_path, false).await.expect("drop");
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index fc8f837649..5e61ab0724 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -19,13 +19,16 @@
 #[cfg(test)]
 mod table_test {
     use crate::integration::utils::{
-        create_partitions, create_table, get_shared_cluster, make_int_array, make_string_array,
+        ColumnPlan, array_dt_basics_columns, as_row_type, create_partitions, create_table,
+        dt_array_int, dt_map_string_int, dt_row_seq_label, get_shared_cluster, make_int_array,
+        make_string_array, map_dt_basics_columns, row_dt_basics_columns, scalar_dt_columns,
     };
-    use arrow::array::record_batch;
+    use arrow::array::{Int32Array, record_batch};
     use fluss::client::{EARLIEST_OFFSET, FlussTable, TableScan};
     use fluss::metadata::{DataField, DataTypes, Schema, TableDescriptor, TablePath};
-    use fluss::record::ScanRecord;
+    use fluss::record::{ScanBatch, ScanRecord};
     use fluss::row::binary_array::FlussArrayWriter;
+    use fluss::row::binary_map::FlussMapWriter;
     use fluss::row::{
         Date, Datum, Decimal, FlussArray, GenericRow, InternalRow, Time, TimestampLtz, TimestampNtz,
     };
@@ -504,9 +507,7 @@ mod table_test {
             .unwrap();
         writer.flush().await.unwrap();
 
-        use arrow::array::Int32Array;
-
-        fn extract_ids(batches: &[fluss::record::ScanBatch]) -> Vec<i32> {
+        fn extract_ids(batches: &[ScanBatch]) -> Vec<i32> {
             batches
                 .iter()
                 .flat_map(|b| {
@@ -582,547 +583,6 @@ mod table_test {
 
     /// Integration test covering produce and scan operations for all supported datatypes
     /// in log tables.
-    #[tokio::test]
-    async fn all_supported_datatypes() {
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_log_all_datatypes");
-
-        // Create a log table with all supported datatypes for append/scan
-        let table_descriptor = TableDescriptor::builder()
-            .schema(
-                Schema::builder()
-                    // Integer types
-                    .column("col_tinyint", DataTypes::tinyint())
-                    .column("col_smallint", DataTypes::smallint())
-                    .column("col_int", DataTypes::int())
-                    .column("col_bigint", DataTypes::bigint())
-                    // Floating point types
-                    .column("col_float", DataTypes::float())
-                    .column("col_double", DataTypes::double())
-                    // Boolean type
-                    .column("col_boolean", DataTypes::boolean())
-                    // Char type
-                    .column("col_char", DataTypes::char(10))
-                    // String type
-                    .column("col_string", DataTypes::string())
-                    // Decimal type
-                    .column("col_decimal", DataTypes::decimal(10, 2))
-                    // Date type
-                    .column("col_date", DataTypes::date())
-                    // Time types
-                    .column("col_time_s", DataTypes::time_with_precision(0))
-                    .column("col_time_ms", DataTypes::time_with_precision(3))
-                    .column("col_time_us", DataTypes::time_with_precision(6))
-                    .column("col_time_ns", DataTypes::time_with_precision(9))
-                    // Timestamp types
-                    .column("col_timestamp_s", DataTypes::timestamp_with_precision(0))
-                    .column("col_timestamp_ms", DataTypes::timestamp_with_precision(3))
-                    .column("col_timestamp_us", DataTypes::timestamp_with_precision(6))
-                    .column("col_timestamp_ns", DataTypes::timestamp_with_precision(9))
-                    // Timestamp_ltz types
-                    .column(
-                        "col_timestamp_ltz_s",
-                        DataTypes::timestamp_ltz_with_precision(0),
-                    )
-                    .column(
-                        "col_timestamp_ltz_ms",
-                        DataTypes::timestamp_ltz_with_precision(3),
-                    )
-                    .column(
-                        "col_timestamp_ltz_us",
-                        DataTypes::timestamp_ltz_with_precision(6),
-                    )
-                    .column(
-                        "col_timestamp_ltz_ns",
-                        DataTypes::timestamp_ltz_with_precision(9),
-                    )
-                    // Bytes type
-                    .column("col_bytes", DataTypes::bytes())
-                    // Fixed-size binary type
-                    .column("col_binary", DataTypes::binary(4))
-                    // Timestamp types with negative values (before Unix epoch)
-                    .column(
-                        "col_timestamp_us_neg",
-                        DataTypes::timestamp_with_precision(6),
-                    )
-                    .column(
-                        "col_timestamp_ns_neg",
-                        DataTypes::timestamp_with_precision(9),
-                    )
-                    .column(
-                        "col_timestamp_ltz_us_neg",
-                        DataTypes::timestamp_ltz_with_precision(6),
-                    )
-                    .column(
-                        "col_timestamp_ltz_ns_neg",
-                        DataTypes::timestamp_ltz_with_precision(9),
-                    )
-                    .column("col_array", DataTypes::array(DataTypes::string()))
-                    .column(
-                        "col_row",
-                        DataTypes::row(vec![
-                            DataField::new("seq", DataTypes::int(), None),
-                            DataField::new("label", DataTypes::string(), None),
-                        ]),
-                    )
-                    .build()
-                    .expect("Failed to build schema"),
-            )
-            .build()
-            .expect("Failed to build table");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let field_count = table.get_table_info().schema.columns().len();
-
-        let append_writer = table
-            .new_append()
-            .expect("Failed to create append")
-            .create_writer()
-            .expect("Failed to create writer");
-
-        // Test data for all datatypes
-        let col_tinyint = 127i8;
-        let col_smallint = 32767i16;
-        let col_int = 2147483647i32;
-        let col_bigint = 9223372036854775807i64;
-        let col_float = std::f32::consts::PI;
-        let col_double = std::f64::consts::E;
-        let col_boolean = true;
-        let col_char = "hello";
-        let col_string = "world of fluss rust client";
-        let col_decimal = Decimal::from_unscaled_long(12345, 10, 2).unwrap(); // 123.45
-        let col_date = Date::new(20476); // 2026-01-23
-        let col_time_s = Time::new(36827000); // 10:13:47
-        let col_time_ms = Time::new(36827123); // 10:13:47.123
-        let col_time_us = Time::new(86399999); // 23:59:59.999
-        let col_time_ns = Time::new(1); // 00:00:00.001
-        // 2026-01-23 10:13:47 UTC
-        let col_timestamp_s = TimestampNtz::new(1769163227000);
-        // 2026-01-23 10:13:47.123 UTC
-        let col_timestamp_ms = TimestampNtz::new(1769163227123);
-        // 2026-01-23 10:13:47.123456 UTC
-        let col_timestamp_us = TimestampNtz::from_millis_nanos(1769163227123, 456000).unwrap();
-        // 2026-01-23 10:13:47.123999999 UTC
-        let col_timestamp_ns = TimestampNtz::from_millis_nanos(1769163227123, 999_999).unwrap();
-        let col_timestamp_ltz_s = TimestampLtz::new(1769163227000);
-        let col_timestamp_ltz_ms = TimestampLtz::new(1769163227123);
-        let col_timestamp_ltz_us = TimestampLtz::from_millis_nanos(1769163227123, 456000).unwrap();
-        let col_timestamp_ltz_ns = TimestampLtz::from_millis_nanos(1769163227123, 999_999).unwrap();
-        let col_bytes: Vec<u8> = b"binary data".to_vec();
-        let col_binary: Vec<u8> = vec![0xDE, 0xAD, 0xBE, 0xEF];
-
-        // 1960-06-15 08:30:45.123456 UTC (before 1970)
-        let col_timestamp_us_neg = TimestampNtz::from_millis_nanos(-301234154877, 456000).unwrap();
-        // 1960-06-15 08:30:45.123999999 UTC (before 1970)
-        let col_timestamp_ns_neg = TimestampNtz::from_millis_nanos(-301234154877, 999_999).unwrap();
-        let col_timestamp_ltz_us_neg =
-            TimestampLtz::from_millis_nanos(-301234154877, 456000).unwrap();
-        let col_timestamp_ltz_ns_neg =
-            TimestampLtz::from_millis_nanos(-301234154877, 999_999).unwrap();
-
-        let col_array = make_string_array(&[Some("fluss"), Some("rust")]);
-
-        let mut col_row_inner = GenericRow::new(2);
-        col_row_inner.set_field(0, 7_i32);
-        col_row_inner.set_field(1, "lumiere");
-
-        let mut row = GenericRow::new(field_count);
-        row.set_field(0, col_tinyint);
-        row.set_field(1, col_smallint);
-        row.set_field(2, col_int);
-        row.set_field(3, col_bigint);
-        row.set_field(4, col_float);
-        row.set_field(5, col_double);
-        row.set_field(6, col_boolean);
-        row.set_field(7, col_char);
-        row.set_field(8, col_string);
-        row.set_field(9, col_decimal.clone());
-        row.set_field(10, col_date);
-        row.set_field(11, col_time_s);
-        row.set_field(12, col_time_ms);
-        row.set_field(13, col_time_us);
-        row.set_field(14, col_time_ns);
-        row.set_field(15, col_timestamp_s);
-        row.set_field(16, col_timestamp_ms);
-        row.set_field(17, col_timestamp_us);
-        row.set_field(18, col_timestamp_ns);
-        row.set_field(19, col_timestamp_ltz_s);
-        row.set_field(20, col_timestamp_ltz_ms);
-        row.set_field(21, col_timestamp_ltz_us);
-        row.set_field(22, col_timestamp_ltz_ns);
-        row.set_field(23, col_bytes.as_slice());
-        row.set_field(24, col_binary.as_slice());
-        row.set_field(25, col_timestamp_us_neg);
-        row.set_field(26, col_timestamp_ns_neg);
-        row.set_field(27, col_timestamp_ltz_us_neg);
-        row.set_field(28, col_timestamp_ltz_ns_neg);
-        row.set_field(29, col_array);
-        row.set_field(30, Datum::Row(Box::new(col_row_inner)));
-
-        append_writer
-            .append(&row)
-            .expect("Failed to append row with all datatypes");
-
-        // Append a row with null values for all columns
-        let mut row_with_nulls = GenericRow::new(field_count);
-        for i in 0..field_count {
-            row_with_nulls.set_field(i, Datum::Null);
-        }
-
-        append_writer
-            .append(&row_with_nulls)
-            .expect("Failed to append row with nulls");
-
-        append_writer.flush().await.expect("Failed to flush");
-
-        // Scan the records
-        let records = scan_table(&table, |scan| scan).await;
-
-        assert_eq!(records.len(), 2, "Expected 2 records");
-
-        let found_row = records[0].row();
-        assert_eq!(
-            found_row.get_byte(0).unwrap(),
-            col_tinyint,
-            "col_tinyint mismatch"
-        );
-        assert_eq!(
-            found_row.get_short(1).unwrap(),
-            col_smallint,
-            "col_smallint mismatch"
-        );
-        assert_eq!(found_row.get_int(2).unwrap(), col_int, "col_int mismatch");
-        assert_eq!(
-            found_row.get_long(3).unwrap(),
-            col_bigint,
-            "col_bigint mismatch"
-        );
-        assert!(
-            (found_row.get_float(4).unwrap() - col_float).abs() < f32::EPSILON,
-            "col_float mismatch: expected {}, got {}",
-            col_float,
-            found_row.get_float(4).unwrap()
-        );
-        assert!(
-            (found_row.get_double(5).unwrap() - col_double).abs() < f64::EPSILON,
-            "col_double mismatch: expected {}, got {}",
-            col_double,
-            found_row.get_double(5).unwrap()
-        );
-        assert_eq!(
-            found_row.get_boolean(6).unwrap(),
-            col_boolean,
-            "col_boolean mismatch"
-        );
-        assert_eq!(
-            found_row.get_char(7, 10).unwrap(),
-            col_char,
-            "col_char mismatch"
-        );
-        assert_eq!(
-            found_row.get_string(8).unwrap(),
-            col_string,
-            "col_string mismatch"
-        );
-        assert_eq!(
-            found_row.get_decimal(9, 10, 2).unwrap(),
-            col_decimal,
-            "col_decimal mismatch"
-        );
-        assert_eq!(
-            found_row.get_date(10).unwrap().get_inner(),
-            col_date.get_inner(),
-            "col_date mismatch"
-        );
-
-        assert_eq!(
-            found_row.get_time(11).unwrap().get_inner(),
-            col_time_s.get_inner(),
-            "col_time_s mismatch"
-        );
-
-        assert_eq!(
-            found_row.get_time(12).unwrap().get_inner(),
-            col_time_ms.get_inner(),
-            "col_time_ms mismatch"
-        );
-
-        assert_eq!(
-            found_row.get_time(13).unwrap().get_inner(),
-            col_time_us.get_inner(),
-            "col_time_us mismatch"
-        );
-
-        assert_eq!(
-            found_row.get_time(14).unwrap().get_inner(),
-            col_time_ns.get_inner(),
-            "col_time_ns mismatch"
-        );
-
-        assert_eq!(
-            found_row
-                .get_timestamp_ntz(15, 0)
-                .unwrap()
-                .get_millisecond(),
-            col_timestamp_s.get_millisecond(),
-            "col_timestamp_s mismatch"
-        );
-
-        assert_eq!(
-            found_row
-                .get_timestamp_ntz(16, 3)
-                .unwrap()
-                .get_millisecond(),
-            col_timestamp_ms.get_millisecond(),
-            "col_timestamp_ms mismatch"
-        );
-
-        let read_ts_us = found_row.get_timestamp_ntz(17, 6).unwrap();
-        assert_eq!(
-            read_ts_us.get_millisecond(),
-            col_timestamp_us.get_millisecond(),
-            "col_timestamp_us millis mismatch"
-        );
-        assert_eq!(
-            read_ts_us.get_nano_of_millisecond(),
-            col_timestamp_us.get_nano_of_millisecond(),
-            "col_timestamp_us nanos mismatch"
-        );
-
-        let read_ts_ns = found_row.get_timestamp_ntz(18, 9).unwrap();
-        assert_eq!(
-            read_ts_ns.get_millisecond(),
-            col_timestamp_ns.get_millisecond(),
-            "col_timestamp_ns millis mismatch"
-        );
-        assert_eq!(
-            read_ts_ns.get_nano_of_millisecond(),
-            col_timestamp_ns.get_nano_of_millisecond(),
-            "col_timestamp_ns nanos mismatch"
-        );
-
-        assert_eq!(
-            found_row
-                .get_timestamp_ltz(19, 0)
-                .unwrap()
-                .get_epoch_millisecond(),
-            col_timestamp_ltz_s.get_epoch_millisecond(),
-            "col_timestamp_ltz_s mismatch"
-        );
-
-        assert_eq!(
-            found_row
-                .get_timestamp_ltz(20, 3)
-                .unwrap()
-                .get_epoch_millisecond(),
-            col_timestamp_ltz_ms.get_epoch_millisecond(),
-            "col_timestamp_ltz_ms mismatch"
-        );
-
-        let read_ts_ltz_us = found_row.get_timestamp_ltz(21, 6).unwrap();
-        assert_eq!(
-            read_ts_ltz_us.get_epoch_millisecond(),
-            col_timestamp_ltz_us.get_epoch_millisecond(),
-            "col_timestamp_ltz_us millis mismatch"
-        );
-        assert_eq!(
-            read_ts_ltz_us.get_nano_of_millisecond(),
-            col_timestamp_ltz_us.get_nano_of_millisecond(),
-            "col_timestamp_ltz_us nanos mismatch"
-        );
-
-        let read_ts_ltz_ns = found_row.get_timestamp_ltz(22, 9).unwrap();
-        assert_eq!(
-            read_ts_ltz_ns.get_epoch_millisecond(),
-            col_timestamp_ltz_ns.get_epoch_millisecond(),
-            "col_timestamp_ltz_ns millis mismatch"
-        );
-        assert_eq!(
-            read_ts_ltz_ns.get_nano_of_millisecond(),
-            col_timestamp_ltz_ns.get_nano_of_millisecond(),
-            "col_timestamp_ltz_ns nanos mismatch"
-        );
-        assert_eq!(
-            found_row.get_bytes(23).unwrap(),
-            col_bytes,
-            "col_bytes mismatch"
-        );
-        assert_eq!(
-            found_row.get_binary(24, 4).unwrap(),
-            col_binary,
-            "col_binary mismatch"
-        );
-
-        // Verify timestamps before Unix epoch (negative timestamps)
-        let read_ts_us_neg = found_row.get_timestamp_ntz(25, 6).unwrap();
-        assert_eq!(
-            read_ts_us_neg.get_millisecond(),
-            col_timestamp_us_neg.get_millisecond(),
-            "col_timestamp_us_neg millis mismatch"
-        );
-        assert_eq!(
-            read_ts_us_neg.get_nano_of_millisecond(),
-            col_timestamp_us_neg.get_nano_of_millisecond(),
-            "col_timestamp_us_neg nanos mismatch"
-        );
-
-        let read_ts_ns_neg = found_row.get_timestamp_ntz(26, 9).unwrap();
-        assert_eq!(
-            read_ts_ns_neg.get_millisecond(),
-            col_timestamp_ns_neg.get_millisecond(),
-            "col_timestamp_ns_neg millis mismatch"
-        );
-        assert_eq!(
-            read_ts_ns_neg.get_nano_of_millisecond(),
-            col_timestamp_ns_neg.get_nano_of_millisecond(),
-            "col_timestamp_ns_neg nanos mismatch"
-        );
-
-        let read_ts_ltz_us_neg = found_row.get_timestamp_ltz(27, 6).unwrap();
-        assert_eq!(
-            read_ts_ltz_us_neg.get_epoch_millisecond(),
-            col_timestamp_ltz_us_neg.get_epoch_millisecond(),
-            "col_timestamp_ltz_us_neg millis mismatch"
-        );
-        assert_eq!(
-            read_ts_ltz_us_neg.get_nano_of_millisecond(),
-            col_timestamp_ltz_us_neg.get_nano_of_millisecond(),
-            "col_timestamp_ltz_us_neg nanos mismatch"
-        );
-
-        let read_ts_ltz_ns_neg = found_row.get_timestamp_ltz(28, 9).unwrap();
-        assert_eq!(
-            read_ts_ltz_ns_neg.get_epoch_millisecond(),
-            col_timestamp_ltz_ns_neg.get_epoch_millisecond(),
-            "col_timestamp_ltz_ns_neg millis mismatch"
-        );
-        assert_eq!(
-            read_ts_ltz_ns_neg.get_nano_of_millisecond(),
-            col_timestamp_ltz_ns_neg.get_nano_of_millisecond(),
-            "col_timestamp_ltz_ns_neg nanos mismatch"
-        );
-
-        let arr = found_row.get_array(29).unwrap();
-        assert_eq!(arr.size(), 2, "col_array size mismatch");
-        assert_eq!(arr.get_string(0).unwrap(), "fluss", "col_array[0] mismatch");
-        assert_eq!(arr.get_string(1).unwrap(), "rust", "col_array[1] mismatch");
-
-        let nested = found_row.get_row(30).unwrap();
-        assert_eq!(nested.get_int(0).unwrap(), 7, "col_row.seq mismatch");
-        assert_eq!(
-            nested.get_string(1).unwrap(),
-            "lumiere",
-            "col_row.label mismatch"
-        );
-
-        // Verify row with all nulls (record index 1)
-        let found_row_nulls = records[1].row();
-        for i in 0..field_count {
-            assert!(
-                found_row_nulls.is_null_at(i).unwrap(),
-                "column {} should be null",
-                i
-            );
-        }
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    #[tokio::test]
-    async fn test_map_datatype_roundtrip() {
-        use fluss::row::binary_map::FlussMapWriter;
-        use fluss::row::{Datum, GenericRow};
-
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_map_datatype_roundtrip");
-
-        let key_type = DataTypes::string();
-        let value_type = DataTypes::int();
-        let map_type = DataTypes::map(key_type.clone(), value_type.clone());
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(
-                Schema::builder()
-                    .column("id", DataTypes::int())
-                    .column("map_col", map_type.clone())
-                    .build()
-                    .expect("Failed to build schema"),
-            )
-            .build()
-            .expect("Failed to build table");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        // 1. Construct FlussMap
-        let mut map_writer = FlussMapWriter::new(3, &key_type, &value_type);
-        map_writer.write_entry("k1".into(), 10.into()).unwrap();
-        map_writer.write_entry("k2".into(), 20.into()).unwrap();
-        map_writer.write_entry("k3".into(), 30.into()).unwrap();
-        let fluss_map = map_writer.complete().unwrap();
-
-        // 2. Insert Row
-        let mut row = GenericRow::new(2);
-        row.set_field(0, 1i32);
-        row.set_field(1, Datum::Map(fluss_map));
-
-        let append_writer = table
-            .new_append()
-            .expect("Failed to create append")
-            .create_writer()
-            .expect("Failed to create writer");
-
-        append_writer.append(&row).expect("Failed to append row");
-        append_writer.flush().await.expect("Failed to flush");
-
-        // 3. Fetch Row
-        let records = scan_table(&table, |scan| scan).await;
-        assert_eq!(records.len(), 1, "Expected 1 record");
-
-        let found_row = records[0].row();
-        assert_eq!(found_row.get_int(0).unwrap(), 1);
-
-        // 4. Assert Map
-        let decoded_map = found_row.get_map(1).expect("Failed to get map");
-        assert_eq!(decoded_map.size(), 3);
-
-        let decoded_keys = decoded_map.key_array();
-        let decoded_values = decoded_map.value_array();
-
-        assert_eq!(decoded_keys.get_string(0).unwrap(), "k1");
-        assert_eq!(decoded_keys.get_string(1).unwrap(), "k2");
-        assert_eq!(decoded_keys.get_string(2).unwrap(), "k3");
-
-        assert_eq!(decoded_values.get_int(0).unwrap(), 10);
-        assert_eq!(decoded_values.get_int(1).unwrap(), 20);
-        assert_eq!(decoded_values.get_int(2).unwrap(), 30);
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
     #[tokio::test]
     async fn partitioned_table_append_scan() {
         let cluster = get_shared_cluster();
@@ -1175,7 +635,7 @@ mod table_test {
         ];
 
         for (id, region, value) in &test_data {
-            let mut row = fluss::row::GenericRow::new(3);
+            let mut row = GenericRow::new(3);
             row.set_field(0, *id);
             row.set_field(1, *region);
             row.set_field(2, *value);
@@ -1418,650 +878,104 @@ mod table_test {
             .expect("Failed to drop table");
     }
 
+    /// Projection over a log table containing every compound type.
     #[tokio::test]
-    async fn undersized_row_returns_error() {
+    async fn projection_with_compound_types() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss", "test_log_undersized_row");
+        let table_path = TablePath::new("fluss", "test_log_projection_compound");
 
-        let table_descriptor = TableDescriptor::builder()
-            .schema(
-                Schema::builder()
-                    .column("col_bool", DataTypes::boolean())
-                    .column("col_int", DataTypes::int())
-                    .column("col_string", DataTypes::string())
-                    .column("col_bigint", DataTypes::bigint())
-                    .build()
-                    .expect("Failed to build schema"),
+        let row_type = DataTypes::row(vec![
+            DataField::new("seq", DataTypes::int(), None),
+            DataField::new("label", DataTypes::string(), None),
+        ]);
+
+        let schema = Schema::builder()
+            .column("id", DataTypes::int())
+            .column("nested", row_type)
+            .column(
+                "attrs",
+                DataTypes::map(DataTypes::string(), DataTypes::int()),
             )
+            .column("tags", DataTypes::array(DataTypes::string()))
+            .column("extra", DataTypes::string())
             .build()
-            .expect("Failed to build table");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
+            .expect("schema");
 
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
+        create_table(
+            &admin,
+            &table_path,
+            &TableDescriptor::builder()
+                .schema(schema)
+                .build()
+                .expect("table descriptor"),
+        )
+        .await;
 
-        let append_writer = table
+        let table = connection.get_table(&table_path).await.expect("table");
+        let writer = table
             .new_append()
-            .expect("Failed to create table append")
+            .expect("append")
             .create_writer()
-            .expect("Failed to create writer");
+            .expect("writer");
 
-        // Scenario 1b: GenericRow with only 2 fields for a 4-column table
-        let mut row = fluss::row::GenericRow::new(2);
-        row.set_field(0, true);
-        row.set_field(1, 42_i32);
+        let mut nested = GenericRow::new(2);
+        nested.set_field(0, 42_i32);
+        nested.set_field(1, "hello");
+        let attrs = {
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::int());
+            w.write_entry("x".into(), 1.into()).unwrap();
+            w.write_entry("y".into(), 2.into()).unwrap();
+            w.complete().expect("attrs")
+        };
+        let tags = make_string_array(&[Some("alpha"), Some("beta")]);
 
-        let result = append_writer.append(&row);
-        assert!(result.is_err(), "Undersized row should be rejected");
-        let err_msg = result.unwrap_err().to_string();
-        assert!(
-            err_msg.contains("Expected: 4") && err_msg.contains("Actual: 2"),
-            "Error should mention field count mismatch, got: {err_msg}"
-        );
+        let mut row = GenericRow::new(5);
+        row.set_field(0, 7_i32);
+        row.set_field(1, Datum::Row(Box::new(nested)));
+        row.set_field(2, Datum::Map(attrs));
+        row.set_field(3, tags);
+        row.set_field(4, "ignore-me");
+        writer.append(&row).expect("append");
+        writer.flush().await.expect("flush");
 
-        // Correct column count but wrong types:
-        // Schema is (Boolean, Int, String, BigInt) but we put Int64 where String is expected.
-        // This should return an error, not panic.
-        let row_wrong_types = fluss::row::GenericRow::from_data(vec![
-            fluss::row::Datum::Bool(true),
-            fluss::row::Datum::Int32(42),
-            fluss::row::Datum::Int64(999), // wrong: String column
-            fluss::row::Datum::Int64(100),
-        ]);
+        // Project columns in reordered form, dropping `extra`.
+        let records = scan_table(&table, |scan| {
+            scan.project_by_name(&["nested", "attrs", "tags", "id"])
+                .expect("project failed")
+        })
+        .await;
+        assert_eq!(records.len(), 1);
+        let r = records[0].row();
 
-        let result = append_writer.append(&row_wrong_types);
-        assert!(
-            result.is_err(),
-            "Row with mismatched types should be rejected, not panic"
-        );
+        // === Projection: ROW ===
+        let projected_nested = r.get_row(0).expect("get_row over projection");
+        assert_eq!(projected_nested.get_int(0).unwrap(), 42);
+        assert_eq!(projected_nested.get_string(1).unwrap(), "hello");
 
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
+        // === Projection: MAP ===
+        let m = r.get_map(1).expect("get_map over projection");
+        assert_eq!(m.size(), 2);
+        assert_eq!(m.get(&Datum::from("x")).unwrap(), Some(Datum::from(1_i32)));
+        assert_eq!(m.get(&Datum::from("y")).unwrap(), Some(Datum::from(2_i32)));
 
-    #[tokio::test]
-    async fn append_and_scan_with_array() {
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_log_arrays");
-        let inner_array_type = DataTypes::array(DataTypes::int());
-
-        let schema = Schema::builder()
-            .column("id", DataTypes::int())
-            .column("tags", DataTypes::array(DataTypes::string()))
-            .column("scores", DataTypes::array(DataTypes::int()))
-            .column("matrix", DataTypes::array(inner_array_type.clone()))
-            .build()
-            .expect("Failed to build schema");
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(schema)
-            .build()
-            .expect("Failed to build table descriptor");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let append_writer = table
-            .new_append()
-            .expect("Failed to create append")
-            .create_writer()
-            .expect("Failed to create writer");
-
-        let mut row1 = GenericRow::new(4);
-        row1.set_field(0, 1_i32);
-        row1.set_field(1, make_string_array(&[Some("hello"), Some("world")]));
-        row1.set_field(2, make_int_array(&[Some(10), Some(20), Some(30)]));
-        let m1 = {
-            let mut w = FlussArrayWriter::new(2, &inner_array_type);
-            w.write_array(0, &make_int_array(&[Some(1), Some(2)]));
-            w.write_array(1, &make_int_array(&[Some(3), Some(4)]));
-            w.complete().expect("matrix1")
-        };
-        row1.set_field(3, m1);
-
-        let mut row2 = GenericRow::new(4);
-        row2.set_field(0, 2_i32);
-        row2.set_field(1, make_string_array(&[None]));
-        row2.set_field(2, make_int_array(&[]));
-        let m2 = {
-            let mut w = FlussArrayWriter::new(3, &inner_array_type);
-            w.write_array(0, &make_int_array(&[Some(5)]));
-            w.set_null_at(1);
-            w.write_array(2, &make_int_array(&[]));
-            w.complete().expect("matrix2")
-        };
-        row2.set_field(3, m2);
-
-        let mut row3 = GenericRow::new(4);
-        row3.set_field(0, 3_i32);
-        row3.set_field(1, Datum::Null);
-        row3.set_field(2, make_int_array(&[Some(42)]));
-        row3.set_field(3, Datum::Null);
-
-        append_writer.append(&row1).expect("append row1");
-        append_writer.append(&row2).expect("append row2");
-        append_writer.append(&row3).expect("append row3");
-        append_writer.flush().await.expect("Failed to flush");
-
-        let records = scan_table(&table, |scan| scan).await;
-        assert_eq!(records.len(), 3, "expected three log records");
-
-        let r0 = records[0].row();
-        assert_eq!(r0.get_int(0).unwrap(), 1);
-        let tags_r0 = r0.get_array(1).unwrap();
-        assert_eq!(tags_r0.size(), 2);
-        assert_eq!(tags_r0.get_string(0).unwrap(), "hello");
-        assert_eq!(tags_r0.get_string(1).unwrap(), "world");
-        let scores_r0 = r0.get_array(2).unwrap();
-        assert_eq!(scores_r0.size(), 3);
-        assert_eq!(scores_r0.get_int(0).unwrap(), 10);
-        assert_eq!(scores_r0.get_int(1).unwrap(), 20);
-        assert_eq!(scores_r0.get_int(2).unwrap(), 30);
-        let matrix_r0: FlussArray = r0.get_array(3).unwrap();
-        assert_eq!(matrix_r0.size(), 2);
-        let mr0_0 = matrix_r0.get_array(0).unwrap();
-        assert_eq!(mr0_0.size(), 2);
-        assert_eq!(mr0_0.get_int(0).unwrap(), 1);
-        assert_eq!(mr0_0.get_int(1).unwrap(), 2);
-        let mr0_1 = matrix_r0.get_array(1).unwrap();
-        assert_eq!(mr0_1.size(), 2);
-        assert_eq!(mr0_1.get_int(0).unwrap(), 3);
-        assert_eq!(mr0_1.get_int(1).unwrap(), 4);
-
-        let r1 = records[1].row();
-        assert_eq!(r1.get_int(0).unwrap(), 2);
-        let tags_r1 = r1.get_array(1).unwrap();
-        assert_eq!(tags_r1.size(), 1);
-        assert!(tags_r1.is_null_at(0));
-        let scores_r1 = r1.get_array(2).unwrap();
-        assert_eq!(scores_r1.size(), 0);
-        let matrix_r1 = r1.get_array(3).unwrap();
-        assert_eq!(matrix_r1.size(), 3);
-        let mr1_0 = matrix_r1.get_array(0).unwrap();
-        assert_eq!(mr1_0.size(), 1);
-        assert_eq!(mr1_0.get_int(0).unwrap(), 5);
-        assert!(matrix_r1.is_null_at(1));
-        let mr1_2 = matrix_r1.get_array(2).unwrap();
-        assert_eq!(mr1_2.size(), 0);
-
-        let r2 = records[2].row();
-        assert_eq!(r2.get_int(0).unwrap(), 3);
-        assert!(r2.is_null_at(1).unwrap());
-        let scores_r2 = r2.get_array(2).unwrap();
-        assert_eq!(scores_r2.size(), 1);
-        assert_eq!(scores_r2.get_int(0).unwrap(), 42);
-        assert!(r2.is_null_at(3).unwrap());
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    #[tokio::test]
-    async fn append_and_scan_with_array_of_row() {
-        use fluss::metadata::{DataField, DataType};
-
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_log_array_of_row");
-
-        let event_row_type_owned = DataTypes::row(vec![
-            DataField::new("seq", DataTypes::int(), None),
-            DataField::new("label", DataTypes::string(), None),
-        ]);
-        let array_of_row_type = DataTypes::array(event_row_type_owned.clone());
-
-        let event_row_type = match &event_row_type_owned {
-            DataType::Row(rt) => rt.clone(),
-            _ => unreachable!(),
-        };
-
-        let schema = Schema::builder()
-            .column("id", DataTypes::int())
-            .column("events", array_of_row_type)
-            .build()
-            .expect("Failed to build schema");
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(schema)
-            .build()
-            .expect("Failed to build table descriptor");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let append_writer = table
-            .new_append()
-            .expect("Failed to create append")
-            .create_writer()
-            .expect("Failed to create writer");
-
-        let mut events1 = FlussArrayWriter::new(2, &event_row_type_owned);
-        let mut e0 = GenericRow::new(2);
-        e0.set_field(0, 1_i32);
-        e0.set_field(1, "open");
-        events1.write_row(0, &e0).expect("write e0");
-        let mut e1 = GenericRow::new(2);
-        e1.set_field(0, 2_i32);
-        e1.set_field(1, "close");
-        events1.write_row(1, &e1).expect("write e1");
-        let events1 = events1.complete().expect("events1");
-
-        let mut row1 = GenericRow::new(2);
-        row1.set_field(0, 1_i32);
-        row1.set_field(1, events1);
-
-        let mut events2 = FlussArrayWriter::new(3, &event_row_type_owned);
-        let mut e2 = GenericRow::new(2);
-        e2.set_field(0, 7_i32);
-        e2.set_field(1, "x");
-        events2.write_row(0, &e2).expect("write e2");
-        events2.set_null_at(1);
-        let mut e3 = GenericRow::new(2);
-        e3.set_field(0, 8_i32);
-        e3.set_field(1, "y");
-        events2.write_row(2, &e3).expect("write e3");
-        let events2 = events2.complete().expect("events2");
-
-        let mut row2 = GenericRow::new(2);
-        row2.set_field(0, 2_i32);
-        row2.set_field(1, events2);
-
-        let mut row3 = GenericRow::new(2);
-        row3.set_field(0, 3_i32);
-        row3.set_field(1, Datum::Null);
-
-        append_writer.append(&row1).expect("append row1");
-        append_writer.append(&row2).expect("append row2");
-        append_writer.append(&row3).expect("append row3");
-        append_writer.flush().await.expect("Failed to flush");
-
-        let records = scan_table(&table, |scan| scan).await;
-        assert_eq!(records.len(), 3, "expected three log records");
-
-        let r0 = records[0].row();
-        assert_eq!(r0.get_int(0).unwrap(), 1);
-        let events_r0 = r0.get_array(1).unwrap();
-        assert_eq!(events_r0.size(), 2);
-        let e0_r0 = events_r0.get_row(0, &event_row_type).unwrap();
-        assert_eq!(e0_r0.get_int(0).unwrap(), 1);
-        assert_eq!(e0_r0.get_string(1).unwrap(), "open");
-        let e1_r0 = events_r0.get_row(1, &event_row_type).unwrap();
-        assert_eq!(e1_r0.get_int(0).unwrap(), 2);
-        assert_eq!(e1_r0.get_string(1).unwrap(), "close");
-
-        let r1 = records[1].row();
-        let events_r1 = r1.get_array(1).unwrap();
-        assert_eq!(events_r1.size(), 3);
-        let e0_r1 = events_r1.get_row(0, &event_row_type).unwrap();
-        assert_eq!(e0_r1.get_int(0).unwrap(), 7);
-        assert_eq!(e0_r1.get_string(1).unwrap(), "x");
-        assert!(events_r1.is_null_at(1));
-        let e2_r1 = events_r1.get_row(2, &event_row_type).unwrap();
-        assert_eq!(e2_r1.get_int(0).unwrap(), 8);
-        assert_eq!(e2_r1.get_string(1).unwrap(), "y");
-
-        let r2 = records[2].row();
-        assert_eq!(r2.get_int(0).unwrap(), 3);
-        assert!(r2.is_null_at(1).unwrap());
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    #[tokio::test]
-    async fn append_and_scan_with_row() {
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_log_rows");
-        let nested_row_type = DataTypes::row(vec![
-            DataField::new("x", DataTypes::int(), None),
-            DataField::new("label", DataTypes::string(), None),
-        ]);
-        let deep_inner_row_type = DataTypes::row(vec![DataField::new("n", DataTypes::int(), None)]);
-        let deep_row_type =
-            DataTypes::row(vec![DataField::new("inner", deep_inner_row_type, None)]);
-
-        let schema = Schema::builder()
-            .column("id", DataTypes::int())
-            .column("nested", nested_row_type)
-            .column("deep", deep_row_type)
-            .build()
-            .expect("Failed to build schema");
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(schema)
-            .build()
-            .expect("Failed to build table descriptor");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-
-        let append_writer = table
-            .new_append()
-            .expect("Failed to create append")
-            .create_writer()
-            .expect("Failed to create writer");
-
-        let mut nested1 = GenericRow::new(2);
-        nested1.set_field(0, 42_i32);
-        nested1.set_field(1, "hello");
-        let mut deep_inner1 = GenericRow::new(1);
-        deep_inner1.set_field(0, 99_i32);
-        let mut deep1 = GenericRow::new(1);
-        deep1.set_field(0, Datum::Row(Box::new(deep_inner1)));
-
-        let mut row1 = GenericRow::new(3);
-        row1.set_field(0, 1_i32);
-        row1.set_field(1, Datum::Row(Box::new(nested1)));
-        row1.set_field(2, Datum::Row(Box::new(deep1)));
-
-        let mut nested2 = GenericRow::new(2);
-        nested2.set_field(0, 7_i32);
-        nested2.set_field(1, Datum::Null);
-
-        let mut row2 = GenericRow::new(3);
-        row2.set_field(0, 2_i32);
-        row2.set_field(1, Datum::Row(Box::new(nested2)));
-        row2.set_field(2, Datum::Null);
-
-        let mut deep_inner3 = GenericRow::new(1);
-        deep_inner3.set_field(0, -1_i32);
-        let mut deep3 = GenericRow::new(1);
-        deep3.set_field(0, Datum::Row(Box::new(deep_inner3)));
-
-        let mut row3 = GenericRow::new(3);
-        row3.set_field(0, 3_i32);
-        row3.set_field(1, Datum::Null);
-        row3.set_field(2, Datum::Row(Box::new(deep3)));
-
-        append_writer.append(&row1).expect("append row1");
-        append_writer.append(&row2).expect("append row2");
-        append_writer.append(&row3).expect("append row3");
-        append_writer.flush().await.expect("Failed to flush");
-
-        let records = scan_table(&table, |scan| scan).await;
-        assert_eq!(records.len(), 3, "expected three log records");
-
-        let r0 = records[0].row();
-        assert_eq!(r0.get_int(0).unwrap(), 1);
-        let nested_r0 = r0.get_row(1).unwrap();
-        assert_eq!(nested_r0.get_int(0).unwrap(), 42);
-        assert_eq!(nested_r0.get_string(1).unwrap(), "hello");
-        let deep_r0 = r0.get_row(2).unwrap();
-        let deep_inner_r0 = deep_r0.get_row(0).unwrap();
-        assert_eq!(deep_inner_r0.get_int(0).unwrap(), 99);
-
-        let r1 = records[1].row();
-        assert_eq!(r1.get_int(0).unwrap(), 2);
-        let nested_r1 = r1.get_row(1).unwrap();
-        assert_eq!(nested_r1.get_int(0).unwrap(), 7);
-        assert!(nested_r1.is_null_at(1).unwrap());
-        assert!(r1.is_null_at(2).unwrap());
-
-        let r2 = records[2].row();
-        assert_eq!(r2.get_int(0).unwrap(), 3);
-        assert!(r2.is_null_at(1).unwrap());
-        let deep_r2 = r2.get_row(2).unwrap();
-        let deep_inner_r2 = deep_r2.get_row(0).unwrap();
-        assert_eq!(deep_inner_r2.get_int(0).unwrap(), -1);
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    /// Partitioned log table with a ROW column. Confirms partition routing
-    /// + ROW column encoding compose correctly across partitions.
-    /// ROW column with all rich element types (decimal, date, time, timestamps,
-    /// bytes, binary, float NaN/Inf, long strings) round-tripped through the
-    /// log path. Confirms the wire-level encoding of `ROW<rich types>` matches
-    /// what the server expects — the unit-level `test_row_all_primitives_round_trip`
-    /// proves Rust↔Rust round-trip; this test proves Rust→server→Rust.
-    #[tokio::test]
-    async fn append_and_scan_with_row_rich_types() {
-        fn assert_f32_special(actual: f32, expected: f32) {
-            if expected.is_nan() {
-                assert!(actual.is_nan(), "expected NaN");
-            } else if expected.is_infinite() {
-                assert!(actual.is_infinite());
-                assert_eq!(actual.signum(), expected.signum());
-            } else {
-                assert!((actual - expected).abs() < f32::EPSILON);
-            }
-        }
-
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_log_row_rich_types");
-
-        let row_type_owned = DataTypes::row(vec![
-            DataField::new("f_bool", DataTypes::boolean(), None),
-            DataField::new("f_int", DataTypes::int(), None),
-            DataField::new("f_long", DataTypes::bigint(), None),
-            DataField::new("f_float", DataTypes::float(), None),
-            DataField::new("f_double", DataTypes::double(), None),
-            DataField::new("f_str", DataTypes::string(), None),
-            DataField::new("f_bytes", DataTypes::bytes(), None),
-            DataField::new("f_decimal", DataTypes::decimal(10, 2), None),
-            DataField::new("f_date", DataTypes::date(), None),
-            DataField::new("f_time", DataTypes::time_with_precision(3), None),
-            DataField::new("f_ts_ntz", DataTypes::timestamp_with_precision(6), None),
-            DataField::new("f_ts_ltz", DataTypes::timestamp_ltz_with_precision(6), None),
-            DataField::new("f_binary_fixed", DataTypes::binary(4), None),
-            DataField::new("f_array_int", DataTypes::array(DataTypes::int()), None),
-        ]);
-
-        let schema = Schema::builder()
-            .column("id", DataTypes::int())
-            .column("nested", row_type_owned)
-            .build()
-            .expect("Failed to build schema");
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(schema)
-            .build()
-            .expect("Failed to build table descriptor");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-        let append_writer = table
-            .new_append()
-            .expect("Failed to create append")
-            .create_writer()
-            .expect("Failed to create writer");
-
-        let mut nested1 = GenericRow::new(14);
-        nested1.set_field(0, true);
-        nested1.set_field(1, 100_000_i32);
-        nested1.set_field(2, 9_876_543_210_i64);
-        nested1.set_field(3, f32::INFINITY);
-        nested1.set_field(4, f64::NAN);
-        nested1.set_field(5, "hello world");
-        nested1.set_field(6, b"binary".as_slice());
-        nested1.set_field(7, Decimal::from_unscaled_long(12345, 10, 2).unwrap());
-        nested1.set_field(8, Datum::Date(Date::new(20476)));
-        nested1.set_field(9, Datum::Time(Time::new(36_827_123)));
-        nested1.set_field(
-            10,
-            Datum::TimestampNtz(TimestampNtz::new(1_769_163_227_123)),
-        );
-        nested1.set_field(
-            11,
-            Datum::TimestampLtz(TimestampLtz::new(1_769_163_227_456)),
-        );
-        nested1.set_field(12, b"\x01\x02\x03\x04".as_slice());
-        nested1.set_field(13, make_int_array(&[Some(7), None, Some(11)]));
-
-        let mut row1 = GenericRow::new(2);
-        row1.set_field(0, 1_i32);
-        row1.set_field(1, Datum::Row(Box::new(nested1)));
-
-        let mut row2 = GenericRow::new(2);
-        row2.set_field(0, 2_i32);
-        row2.set_field(1, Datum::Null);
-
-        append_writer.append(&row1).expect("append row1");
-        append_writer.append(&row2).expect("append row2");
-        append_writer.flush().await.expect("Failed to flush");
-
-        let records = scan_table(&table, |scan| scan).await;
-        assert_eq!(records.len(), 2);
-
-        let r0 = records[0].row();
-        assert_eq!(r0.get_int(0).unwrap(), 1);
-        let nested = r0.get_row(1).unwrap();
-        assert!(nested.get_boolean(0).unwrap());
-        assert_eq!(nested.get_int(1).unwrap(), 100_000);
-        assert_eq!(nested.get_long(2).unwrap(), 9_876_543_210);
-        assert_f32_special(nested.get_float(3).unwrap(), f32::INFINITY);
-        assert!(nested.get_double(4).unwrap().is_nan());
-        assert_eq!(nested.get_string(5).unwrap(), "hello world");
-        assert_eq!(nested.get_bytes(6).unwrap(), b"binary");
-        assert_eq!(
-            nested.get_decimal(7, 10, 2).unwrap(),
-            Decimal::from_unscaled_long(12345, 10, 2).unwrap(),
-        );
-        assert_eq!(nested.get_date(8).unwrap().get_inner(), 20476);
-        assert_eq!(nested.get_time(9).unwrap().get_inner(), 36_827_123);
-        assert_eq!(
-            nested.get_timestamp_ntz(10, 6).unwrap().get_millisecond(),
-            1_769_163_227_123,
-        );
-        assert_eq!(
-            nested
-                .get_timestamp_ltz(11, 6)
-                .unwrap()
-                .get_epoch_millisecond(),
-            1_769_163_227_456,
-        );
-        assert_eq!(nested.get_binary(12, 4).unwrap(), b"\x01\x02\x03\x04");
-        let arr = nested.get_array(13).unwrap();
-        assert_eq!(arr.size(), 3);
-        assert_eq!(arr.get_int(0).unwrap(), 7);
-        assert!(arr.is_null_at(1));
-        assert_eq!(arr.get_int(2).unwrap(), 11);
-
-        let r1 = records[1].row();
-        assert_eq!(r1.get_int(0).unwrap(), 2);
-        assert!(r1.is_null_at(1).unwrap());
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
-    }
-
-    /// Projection over a log table with ROW columns. Specifically tests that
-    /// `ProjectedRow::get_row` (added by this PR) works end-to-end against the
-    /// server — without this, the projection code path for ROW would have zero
-    /// integration coverage.
-    #[tokio::test]
-    async fn append_and_scan_with_row_projection() {
-        let cluster = get_shared_cluster();
-        let connection = cluster.get_fluss_connection().await;
-        let admin = connection.get_admin().expect("Failed to get admin");
-
-        let table_path = TablePath::new("fluss", "test_log_row_projection");
-
-        let row_type = DataTypes::row(vec![
-            DataField::new("seq", DataTypes::int(), None),
-            DataField::new("label", DataTypes::string(), None),
-        ]);
-
-        let schema = Schema::builder()
-            .column("id", DataTypes::int())
-            .column("nested", row_type)
-            .column("extra", DataTypes::string())
-            .build()
-            .expect("Failed to build schema");
+        // === Projection: ARRAY ===
+        let a = r.get_array(2).expect("get_array over projection");
+        assert_eq!(a.size(), 2);
+        assert_eq!(a.get_string(0).unwrap(), "alpha");
+        assert_eq!(a.get_string(1).unwrap(), "beta");
 
-        let table_descriptor = TableDescriptor::builder()
-            .schema(schema)
-            .build()
-            .expect("Failed to build table descriptor");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
-
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
-        let append_writer = table
-            .new_append()
-            .expect("Failed to create append")
-            .create_writer()
-            .expect("Failed to create writer");
+        // === Projection: scalar reordered to position 3 ===
+        assert_eq!(r.get_int(3).unwrap(), 7);
 
-        let mut nested = GenericRow::new(2);
-        nested.set_field(0, 42_i32);
-        nested.set_field(1, "hello");
-
-        let mut row = GenericRow::new(3);
-        row.set_field(0, 7_i32);
-        row.set_field(1, Datum::Row(Box::new(nested)));
-        row.set_field(2, "ignore-me");
-        append_writer.append(&row).expect("append");
-        append_writer.flush().await.expect("Failed to flush");
-
-        let records = scan_table(&table, |scan| {
-            scan.project_by_name(&["nested", "id"])
-                .expect("project failed")
-        })
-        .await;
-        assert_eq!(records.len(), 1);
-
-        let r0 = records[0].row();
-        let projected_nested = r0.get_row(0).expect("get_row over projection");
-        assert_eq!(projected_nested.get_int(0).unwrap(), 42);
-        assert_eq!(projected_nested.get_string(1).unwrap(), "hello");
-        assert_eq!(r0.get_int(1).unwrap(), 7);
-
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
+        admin.drop_table(&table_path, false).await.expect("drop");
     }
 
+    /// Log append + scan against a schema covering every supported data type.
     #[tokio::test]
-    async fn append_and_scan_with_array_rich_types() {
+    async fn all_supported_datatypes() {
         fn assert_f32_special(actual: f32, expected: f32) {
             if expected.is_nan() {
                 assert!(actual.is_nan(), "expected NaN");
@@ -2072,7 +986,6 @@ mod table_test {
                 assert!((actual - expected).abs() < f32::EPSILON);
             }
         }
-
         fn assert_f64_special(actual: f64, expected: f64) {
             if expected.is_nan() {
                 assert!(actual.is_nan(), "expected NaN");
@@ -2088,263 +1001,967 @@ mod table_test {
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().expect("Failed to get admin");
 
-        let table_path = TablePath::new("fluss", "test_log_arrays_rich_types");
-
-        // Compact types: DECIMAL(10,2) precision<=18, TIMESTAMP(6) precision<=3 for millis
-        let dec_compact = Decimal::from_unscaled_long(12345, 10, 2).unwrap();
-        let ts_compact = TimestampNtz::from_millis_nanos(1769163227123, 456000).unwrap();
-
-        // Non-compact types: DECIMAL(22,5) precision>18, TIMESTAMP(9) precision>3
-        let dec_big = Decimal::from_unscaled_bytes(&[66, 237, 18, 59, 11, 216, 31, 4, 244], 22, 5)
-            .expect("big decimal");
-        let ts_nano = TimestampNtz::from_millis_nanos(1769163227123, 999_999).unwrap();
-
-        let d = Date::new(20476);
-        let t = Time::new(36827123);
-        let elem_bytes = &[0_u8, 1, 2, 255];
-        let fixed_a: Vec<u8> = vec![0xDE, 0xAD, 0xBE, 0xEF];
-        let fixed_b: Vec<u8> = vec![0x01, 0x02, 0x03, 0x04];
-
-        let schema = Schema::builder()
-            .column("id", DataTypes::int())
-            .column("arr_bytes", DataTypes::array(DataTypes::bytes()))
-            .column("arr_date", DataTypes::array(DataTypes::date()))
-            .column(
+        let table_path = TablePath::new("fluss", "test_log_complex_types");
+
+        let row_seq_label_owned = dt_row_seq_label();
+        let row_seq_label = as_row_type(&row_seq_label_owned);
+        let inner_array_int = dt_array_int();
+        let inner_map_string_int = dt_map_string_int();
+
+        let plan = ColumnPlan::new()
+            .add("id", DataTypes::int())
+            .start_section("array_basics")
+            .extend(array_dt_basics_columns())
+            .start_section("row_basics")
+            .extend(row_dt_basics_columns())
+            .start_section("map_basics")
+            .extend(map_dt_basics_columns())
+            // ARRAY rich types
+            .start_section("array_rich")
+            .add("arr_bytes", DataTypes::array(DataTypes::bytes()))
+            .add("arr_date", DataTypes::array(DataTypes::date()))
+            .add(
                 "arr_time",
                 DataTypes::array(DataTypes::time_with_precision(3)),
             )
-            .column(
-                "arr_ts_compact",
+            .add(
+                "arr_ts",
                 DataTypes::array(DataTypes::timestamp_with_precision(6)),
             )
-            .column(
-                "arr_ts_nano",
-                DataTypes::array(DataTypes::timestamp_with_precision(9)),
-            )
-            .column(
-                "arr_decimal_compact",
-                DataTypes::array(DataTypes::decimal(10, 2)),
+            .add(
+                "arr_ts_ltz",
+                DataTypes::array(DataTypes::timestamp_ltz_with_precision(3)),
             )
-            .column(
+            .add("arr_decimal", DataTypes::array(DataTypes::decimal(10, 2)))
+            .add(
                 "arr_decimal_big",
                 DataTypes::array(DataTypes::decimal(22, 5)),
             )
-            .column("arr_long_str", DataTypes::array(DataTypes::string()))
-            .column("arr_float", DataTypes::array(DataTypes::float()))
-            .column("arr_double", DataTypes::array(DataTypes::double()))
-            .column("arr_binary", DataTypes::array(DataTypes::binary(4)))
-            .build()
-            .expect("Failed to build schema");
-
-        let table_descriptor = TableDescriptor::builder()
-            .schema(schema)
-            .build()
-            .expect("Failed to build table descriptor");
-
-        create_table(&admin, &table_path, &table_descriptor).await;
+            .add("arr_float", DataTypes::array(DataTypes::float()))
+            .add("arr_double", DataTypes::array(DataTypes::double()))
+            .add("arr_binary", DataTypes::array(DataTypes::binary(4)))
+            // MAP rich types
+            .start_section("map_rich")
+            .add(
+                "map_bytes",
+                DataTypes::map(DataTypes::string(), DataTypes::bytes()),
+            )
+            .add(
+                "map_decimal",
+                DataTypes::map(DataTypes::string(), DataTypes::decimal(10, 2)),
+            )
+            .add(
+                "map_date",
+                DataTypes::map(DataTypes::string(), DataTypes::date()),
+            )
+            .add(
+                "map_time",
+                DataTypes::map(DataTypes::string(), DataTypes::time_with_precision(3)),
+            )
+            .add(
+                "map_ts",
+                DataTypes::map(DataTypes::string(), DataTypes::timestamp_with_precision(6)),
+            )
+            .add(
+                "map_ts_ltz",
+                DataTypes::map(
+                    DataTypes::string(),
+                    DataTypes::timestamp_ltz_with_precision(3),
+                ),
+            )
+            .add(
+                "map_float",
+                DataTypes::map(DataTypes::string(), DataTypes::float()),
+            )
+            .add(
+                "map_double",
+                DataTypes::map(DataTypes::string(), DataTypes::double()),
+            )
+            .add(
+                "map_bool",
+                DataTypes::map(DataTypes::string(), DataTypes::boolean()),
+            )
+            .add(
+                "map_binary",
+                DataTypes::map(DataTypes::string(), DataTypes::binary(4)),
+            )
+            .add(
+                "map_int_key",
+                DataTypes::map(DataTypes::int(), DataTypes::string()),
+            )
+            .start_section("scalars")
+            .extend(scalar_dt_columns());
+        let column_count = plan.len();
 
-        let table = connection
-            .get_table(&table_path)
-            .await
-            .expect("Failed to get table");
+        create_table(
+            &admin,
+            &table_path,
+            &TableDescriptor::builder()
+                .schema(plan.build_schema(None))
+                .build()
+                .expect("table descriptor"),
+        )
+        .await;
 
-        let append_writer = table
+        let table = connection.get_table(&table_path).await.expect("table");
+        let writer = table
             .new_append()
-            .expect("Failed to create append")
+            .expect("append")
             .create_writer()
-            .expect("Failed to create writer");
+            .expect("writer");
 
-        let mut row = GenericRow::new(12);
-        row.set_field(0, 1_i32);
+        // Shared scalar values
+        let dec = Decimal::from_unscaled_long(12345, 10, 2).unwrap();
+        let dec_big = Decimal::from_unscaled_bytes(&[66, 237, 18, 59, 11, 216, 31, 4, 244], 22, 5)
+            .expect("big decimal");
+        let date_v = Date::new(20476);
+        let time_v = Time::new(36_827_123);
+        let ts_v = TimestampNtz::from_millis_nanos(1_769_163_227_123, 456_000).unwrap();
+        let ts_ltz_v = TimestampLtz::new(1_769_163_227_123);
+        let bytes_v = vec![0xDE_u8, 0xAD, 0xBE, 0xEF];
+        let fixed_a = vec![0x01_u8, 0x02, 0x03, 0x04];
+        let fixed_b = vec![0xAA_u8, 0xBB, 0xCC, 0xDD];
+
+        // Row 0 — every column populated.
+        let mut row0 = GenericRow::new(column_count);
+        row0.set_field(0, 1_i32);
+
+        // ARRAY basics
+        row0.set_field(1, make_int_array(&[Some(10), Some(20), Some(30)]));
+        row0.set_field(2, make_string_array(&[Some("hello"), Some("world")]));
+        let arr_of_arr_0 = {
+            let mut w = FlussArrayWriter::new(2, &inner_array_int);
+            w.write_array(0, &make_int_array(&[Some(1), Some(2)]));
+            w.write_array(1, &make_int_array(&[Some(3), Some(4)]));
+            w.complete().expect("arr_of_arr_0")
+        };
+        row0.set_field(3, arr_of_arr_0);
+        let arr_of_row_0 = {
+            let mut w = FlussArrayWriter::new(2, &row_seq_label_owned);
+            let mut e0 = GenericRow::new(2);
+            e0.set_field(0, 1_i32);
+            e0.set_field(1, "open");
+            w.write_row(0, &e0).expect("e0");
+            let mut e1 = GenericRow::new(2);
+            e1.set_field(0, 2_i32);
+            e1.set_field(1, "close");
+            w.write_row(1, &e1).expect("e1");
+            w.complete().expect("arr_of_row_0")
+        };
+        row0.set_field(4, arr_of_row_0);
+
+        // ROW basics
+        let mut row_basic_0 = GenericRow::new(2);
+        row_basic_0.set_field(0, 42_i32);
+        row_basic_0.set_field(1, "hello");
+        row0.set_field(5, Datum::Row(Box::new(row_basic_0)));
+
+        let mut row_deep_inner_0 = GenericRow::new(1);
+        row_deep_inner_0.set_field(0, 99_i32);
+        let mut row_deep_0 = GenericRow::new(1);
+        row_deep_0.set_field(0, Datum::Row(Box::new(row_deep_inner_0)));
+        row0.set_field(6, Datum::Row(Box::new(row_deep_0)));
+
+        let mut row_rich_0 = GenericRow::new(14);
+        row_rich_0.set_field(0, true);
+        row_rich_0.set_field(1, 100_000_i32);
+        row_rich_0.set_field(2, 9_876_543_210_i64);
+        row_rich_0.set_field(3, f32::INFINITY);
+        row_rich_0.set_field(4, f64::NAN);
+        row_rich_0.set_field(5, "hello world");
+        row_rich_0.set_field(6, b"binary".as_slice());
+        row_rich_0.set_field(7, dec.clone());
+        row_rich_0.set_field(8, Datum::Date(Date::new(20476)));
+        row_rich_0.set_field(9, Datum::Time(Time::new(36_827_123)));
+        row_rich_0.set_field(
+            10,
+            Datum::TimestampNtz(TimestampNtz::new(1_769_163_227_123)),
+        );
+        row_rich_0.set_field(
+            11,
+            Datum::TimestampLtz(TimestampLtz::new(1_769_163_227_456)),
+        );
+        row_rich_0.set_field(12, b"\x01\x02\x03\x04".as_slice());
+        row_rich_0.set_field(13, make_int_array(&[Some(7), None, Some(11)]));
+        row0.set_field(7, Datum::Row(Box::new(row_rich_0)));
+
+        // MAP basics
+        let map_string_int_0 = {
+            let mut w = FlussMapWriter::new(3, &DataTypes::string(), &DataTypes::int());
+            w.write_entry("a".into(), 1.into()).unwrap();
+            w.write_entry("b".into(), Datum::Null).unwrap();
+            w.write_entry("c".into(), 3.into()).unwrap();
+            w.complete().expect("map_string_int_0")
+        };
+        row0.set_field(8, Datum::Map(map_string_int_0));
+
+        let map_of_row_0 = {
+            let mut e0 = GenericRow::new(2);
+            e0.set_field(0, 1_i32);
+            e0.set_field(1, "open");
+            let mut e1 = GenericRow::new(2);
+            e1.set_field(0, 2_i32);
+            e1.set_field(1, "close");
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &row_seq_label_owned);
+            w.write_entry("e0".into(), Datum::Row(Box::new(e0)))
+                .unwrap();
+            w.write_entry("e1".into(), Datum::Row(Box::new(e1)))
+                .unwrap();
+            w.complete().expect("map_of_row_0")
+        };
+        row0.set_field(9, Datum::Map(map_of_row_0));
+
+        let map_of_map_0 = {
+            let g1 = {
+                let mut w = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::int());
+                w.write_entry("a".into(), 1.into()).unwrap();
+                w.write_entry("b".into(), 2.into()).unwrap();
+                w.complete().expect("g1")
+            };
+            let g2 = {
+                let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::int());
+                w.write_entry("c".into(), 3.into()).unwrap();
+                w.complete().expect("g2")
+            };
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &inner_map_string_int);
+            w.write_entry("g1".into(), Datum::Map(g1)).unwrap();
+            w.write_entry("g2".into(), Datum::Map(g2)).unwrap();
+            w.complete().expect("map_of_map_0")
+        };
+        row0.set_field(10, Datum::Map(map_of_map_0));
+
+        let map_of_array_0 = {
+            let primes = make_int_array(&[Some(2), Some(3), Some(5)]);
+            let squares = make_int_array(&[Some(1), Some(4)]);
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &inner_array_int);
+            w.write_entry("primes".into(), Datum::Array(primes))
+                .unwrap();
+            w.write_entry("squares".into(), Datum::Array(squares))
+                .unwrap();
+            w.complete().expect("map_of_array_0")
+        };
+        row0.set_field(11, Datum::Map(map_of_array_0));
+
+        let array_of_map_0 = {
+            let m0 = {
+                let mut w = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::int());
+                w.write_entry("x".into(), 1.into()).unwrap();
+                w.write_entry("y".into(), 2.into()).unwrap();
+                w.complete().expect("m0")
+            };
+            let m1 = {
+                let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::int());
+                w.write_entry("z".into(), 9.into()).unwrap();
+                w.complete().expect("m1")
+            };
+            let mut w = FlussArrayWriter::new(2, &inner_map_string_int);
+            w.write_map(0, &m0);
+            w.write_map(1, &m1);
+            w.complete().expect("array_of_map_0")
+        };
+        row0.set_field(12, array_of_map_0);
 
-        // col 1: arr_bytes — binary with null element
-        let arr_bytes = {
+        // ARRAY rich types
+        let arr_bytes_0 = {
             let mut w = FlussArrayWriter::new(2, &DataTypes::bytes());
-            w.write_binary_bytes(0, elem_bytes);
+            w.write_binary_bytes(0, &bytes_v);
             w.set_null_at(1);
-            w.complete().expect("arr_bytes")
+            w.complete().expect("arr_bytes_0")
         };
-        row.set_field(1, arr_bytes);
-
-        // col 2: arr_date
-        let arr_date = {
+        row0.set_field(13, arr_bytes_0);
+        let arr_date_0 = {
             let mut w = FlussArrayWriter::new(2, &DataTypes::date());
-            w.write_date(0, d);
+            w.write_date(0, date_v);
             w.set_null_at(1);
-            w.complete().expect("arr_date")
+            w.complete().expect("arr_date_0")
         };
-        row.set_field(2, arr_date);
-
-        // col 3: arr_time
-        let arr_time = {
+        row0.set_field(14, arr_date_0);
+        let arr_time_0 = {
             let mut w = FlussArrayWriter::new(2, &DataTypes::time_with_precision(3));
-            w.write_time(0, t);
+            w.write_time(0, time_v);
             w.set_null_at(1);
-            w.complete().expect("arr_time")
+            w.complete().expect("arr_time_0")
         };
-        row.set_field(3, arr_time);
-
-        // col 4: arr_ts_compact — compact timestamp (precision 6, millis+nanos)
-        let arr_ts_compact = {
+        row0.set_field(15, arr_time_0);
+        let arr_ts_0 = {
             let mut w = FlussArrayWriter::new(2, &DataTypes::timestamp_with_precision(6));
-            w.write_timestamp_ntz(0, &ts_compact, 6);
+            w.write_timestamp_ntz(0, &ts_v, 6);
             w.set_null_at(1);
-            w.complete().expect("arr_ts_compact")
+            w.complete().expect("arr_ts_0")
         };
-        row.set_field(4, arr_ts_compact);
-
-        // col 5: arr_ts_nano — non-compact timestamp (precision 9)
-        let arr_ts_nano = {
-            let mut w = FlussArrayWriter::new(1, &DataTypes::timestamp_with_precision(9));
-            w.write_timestamp_ntz(0, &ts_nano, 9);
-            w.complete().expect("arr_ts_nano")
+        row0.set_field(16, arr_ts_0);
+        let arr_ts_ltz_0 = {
+            let mut w = FlussArrayWriter::new(2, &DataTypes::timestamp_ltz_with_precision(3));
+            w.write_timestamp_ltz(0, &ts_ltz_v, 3);
+            w.set_null_at(1);
+            w.complete().expect("arr_ts_ltz_0")
         };
-        row.set_field(5, arr_ts_nano);
-
-        // col 6: arr_decimal_compact — compact decimal (precision 10)
-        let arr_decimal_compact = {
+        row0.set_field(17, arr_ts_ltz_0);
+        let arr_decimal_0 = {
             let mut w = FlussArrayWriter::new(2, &DataTypes::decimal(10, 2));
-            w.write_decimal(0, &dec_compact, 10);
+            w.write_decimal(0, &dec, 10);
             w.set_null_at(1);
-            w.complete().expect("arr_decimal_compact")
+            w.complete().expect("arr_decimal_0")
         };
-        row.set_field(6, arr_decimal_compact);
-
-        // col 7: arr_decimal_big — non-compact decimal (precision 22)
-        let arr_decimal_big = {
+        row0.set_field(18, arr_decimal_0);
+        let arr_decimal_big_0 = {
             let mut w = FlussArrayWriter::new(1, &DataTypes::decimal(22, 5));
             w.write_decimal(0, &dec_big, 22);
-            w.complete().expect("arr_decimal_big")
-        };
-        row.set_field(7, arr_decimal_big);
-
-        // col 8: arr_long_str — heap-backed strings (>= 8 bytes)
-        let arr_long_str = {
-            let mut w = FlussArrayWriter::new(2, &DataTypes::string());
-            w.write_string(0, "abcdefghi");
-            w.write_string(1, "longstring_here");
-            w.complete().expect("arr_long_str")
+            w.complete().expect("arr_decimal_big_0")
         };
-        row.set_field(8, arr_long_str);
-
-        // col 9: arr_float — IEEE 754 specials
-        let arr_float = {
+        row0.set_field(19, arr_decimal_big_0);
+        let arr_float_0 = {
             let mut w = FlussArrayWriter::new(3, &DataTypes::float());
             w.write_float(0, f32::NAN);
             w.write_float(1, f32::INFINITY);
             w.write_float(2, f32::NEG_INFINITY);
-            w.complete().expect("arr_float")
+            w.complete().expect("arr_float_0")
         };
-        row.set_field(9, arr_float);
-
-        // col 10: arr_double — IEEE 754 specials
-        let arr_double = {
+        row0.set_field(20, arr_float_0);
+        let arr_double_0 = {
             let mut w = FlussArrayWriter::new(3, &DataTypes::double());
             w.write_double(0, f64::NAN);
             w.write_double(1, f64::INFINITY);
             w.write_double(2, f64::NEG_INFINITY);
-            w.complete().expect("arr_double")
+            w.complete().expect("arr_double_0")
         };
-        row.set_field(10, arr_double);
-
-        // col 11: arr_binary — fixed-size binary(4)
-        let arr_binary = {
+        row0.set_field(21, arr_double_0);
+        let arr_binary_0 = {
             let mut w = FlussArrayWriter::new(2, &DataTypes::binary(4));
             w.write_binary_bytes(0, &fixed_a);
             w.write_binary_bytes(1, &fixed_b);
-            w.complete().expect("arr_binary")
+            w.complete().expect("arr_binary_0")
+        };
+        row0.set_field(22, arr_binary_0);
+
+        // MAP rich types
+        let map_bytes_0 = {
+            let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::bytes());
+            w.write_entry("blob".into(), bytes_v.as_slice().into())
+                .unwrap();
+            w.complete().expect("map_bytes_0")
+        };
+        row0.set_field(23, Datum::Map(map_bytes_0));
+        let map_decimal_0 = {
+            let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::decimal(10, 2));
+            w.write_entry("price".into(), Datum::Decimal(dec.clone()))
+                .unwrap();
+            w.complete().expect("map_decimal_0")
+        };
+        row0.set_field(24, Datum::Map(map_decimal_0));
+        let map_date_0 = {
+            let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::date());
+            w.write_entry("d".into(), Datum::Date(date_v)).unwrap();
+            w.complete().expect("map_date_0")
+        };
+        row0.set_field(25, Datum::Map(map_date_0));
+        let map_time_0 = {
+            let mut w =
+                FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::time_with_precision(3));
+            w.write_entry("t".into(), Datum::Time(time_v)).unwrap();
+            w.complete().expect("map_time_0")
+        };
+        row0.set_field(26, Datum::Map(map_time_0));
+        let map_ts_0 = {
+            let mut w = FlussMapWriter::new(
+                1,
+                &DataTypes::string(),
+                &DataTypes::timestamp_with_precision(6),
+            );
+            w.write_entry("ts".into(), Datum::TimestampNtz(ts_v))
+                .unwrap();
+            w.complete().expect("map_ts_0")
+        };
+        row0.set_field(27, Datum::Map(map_ts_0));
+        let map_ts_ltz_0 = {
+            let mut w = FlussMapWriter::new(
+                1,
+                &DataTypes::string(),
+                &DataTypes::timestamp_ltz_with_precision(3),
+            );
+            w.write_entry("ts".into(), Datum::TimestampLtz(ts_ltz_v))
+                .unwrap();
+            w.complete().expect("map_ts_ltz_0")
+        };
+        row0.set_field(28, Datum::Map(map_ts_ltz_0));
+        let map_float_0 = {
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::float());
+            w.write_entry("nan".into(), f32::NAN.into()).unwrap();
+            w.write_entry("inf".into(), f32::INFINITY.into()).unwrap();
+            w.complete().expect("map_float_0")
+        };
+        row0.set_field(29, Datum::Map(map_float_0));
+        let map_double_0 = {
+            let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::double());
+            w.write_entry("pi".into(), std::f64::consts::PI.into())
+                .unwrap();
+            w.complete().expect("map_double_0")
+        };
+        row0.set_field(30, Datum::Map(map_double_0));
+        let map_bool_0 = {
+            let mut w = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::boolean());
+            w.write_entry("t".into(), true.into()).unwrap();
+            w.write_entry("f".into(), false.into()).unwrap();
+            w.complete().expect("map_bool_0")
+        };
+        row0.set_field(31, Datum::Map(map_bool_0));
+        let map_binary_0 = {
+            let mut w = FlussMapWriter::new(1, &DataTypes::string(), &DataTypes::binary(4));
+            w.write_entry("k".into(), fixed_a.as_slice().into())
+                .unwrap();
+            w.complete().expect("map_binary_0")
         };
-        row.set_field(11, arr_binary);
+        row0.set_field(32, Datum::Map(map_binary_0));
+        let map_int_key_0 = {
+            let mut w = FlussMapWriter::new(2, &DataTypes::int(), &DataTypes::string());
+            w.write_entry(1.into(), "one".into()).unwrap();
+            w.write_entry(2.into(), "two".into()).unwrap();
+            w.complete().expect("map_int_key_0")
+        };
+        row0.set_field(33, Datum::Map(map_int_key_0));
+
+        // Scalar values
+        let scalar_tinyint = 127_i8;
+        let scalar_smallint = 32_767_i16;
+        let scalar_bigint = 9_223_372_036_854_775_807_i64;
+        let scalar_float = std::f32::consts::PI;
+        let scalar_double = std::f64::consts::E;
+        let scalar_char = "hello";
+        let scalar_string = "world of fluss rust client";
+        let scalar_time_s = Time::new(36_827_000);
+        let scalar_time_ms = Time::new(36_827_123);
+        let scalar_time_us = Time::new(86_399_999);
+        let scalar_time_ns = Time::new(1);
+        let scalar_ts_s = TimestampNtz::new(1_769_163_227_000);
+        let scalar_ts_ms = TimestampNtz::new(1_769_163_227_123);
+        let scalar_ts_us = TimestampNtz::from_millis_nanos(1_769_163_227_123, 456_000).unwrap();
+        let scalar_ts_ns = TimestampNtz::from_millis_nanos(1_769_163_227_123, 999_999).unwrap();
+        let scalar_ts_ltz_s = TimestampLtz::new(1_769_163_227_000);
+        let scalar_ts_ltz_ms = TimestampLtz::new(1_769_163_227_123);
+        let scalar_ts_ltz_us = TimestampLtz::from_millis_nanos(1_769_163_227_123, 456_000).unwrap();
+        let scalar_ts_ltz_ns = TimestampLtz::from_millis_nanos(1_769_163_227_123, 999_999).unwrap();
+        let scalar_bytes_top: Vec<u8> = b"binary data".to_vec();
+        let scalar_binary_top: Vec<u8> = vec![0xDE, 0xAD, 0xBE, 0xEF];
+        let scalar_ts_us_neg = TimestampNtz::from_millis_nanos(-301_234_154_877, 456_000).unwrap();
+        let scalar_ts_ns_neg = TimestampNtz::from_millis_nanos(-301_234_154_877, 999_999).unwrap();
+        let scalar_ts_ltz_us_neg =
+            TimestampLtz::from_millis_nanos(-301_234_154_877, 456_000).unwrap();
+        let scalar_ts_ltz_ns_neg =
+            TimestampLtz::from_millis_nanos(-301_234_154_877, 999_999).unwrap();
+
+        row0.set_field(34, scalar_tinyint);
+        row0.set_field(35, scalar_smallint);
+        row0.set_field(36, scalar_bigint);
+        row0.set_field(37, scalar_float);
+        row0.set_field(38, scalar_double);
+        row0.set_field(39, true);
+        row0.set_field(40, scalar_char);
+        row0.set_field(41, scalar_string);
+        row0.set_field(42, dec.clone());
+        row0.set_field(43, Datum::Date(date_v));
+        row0.set_field(44, scalar_time_s);
+        row0.set_field(45, scalar_time_ms);
+        row0.set_field(46, scalar_time_us);
+        row0.set_field(47, scalar_time_ns);
+        row0.set_field(48, scalar_ts_s);
+        row0.set_field(49, scalar_ts_ms);
+        row0.set_field(50, scalar_ts_us);
+        row0.set_field(51, scalar_ts_ns);
+        row0.set_field(52, scalar_ts_ltz_s);
+        row0.set_field(53, scalar_ts_ltz_ms);
+        row0.set_field(54, scalar_ts_ltz_us);
+        row0.set_field(55, scalar_ts_ltz_ns);
+        row0.set_field(56, scalar_bytes_top.as_slice());
+        row0.set_field(57, scalar_binary_top.as_slice());
+        row0.set_field(58, scalar_ts_us_neg);
+        row0.set_field(59, scalar_ts_ns_neg);
+        row0.set_field(60, scalar_ts_ltz_us_neg);
+        row0.set_field(61, scalar_ts_ltz_ns_neg);
+
+        // Row 1 — ARRAY/MAP basic-shape edge cases (empty, null elements).
+        let mut row1 = GenericRow::new(column_count);
+        row1.set_field(0, 2_i32);
+        row1.set_field(1, make_int_array(&[]));
+        row1.set_field(2, make_string_array(&[None]));
+        let arr_of_arr_1 = {
+            let mut w = FlussArrayWriter::new(3, &inner_array_int);
+            w.write_array(0, &make_int_array(&[Some(5)]));
+            w.set_null_at(1);
+            w.write_array(2, &make_int_array(&[]));
+            w.complete().expect("arr_of_arr_1")
+        };
+        row1.set_field(3, arr_of_arr_1);
+        let arr_of_row_1 = {
+            let mut w = FlussArrayWriter::new(3, &row_seq_label_owned);
+            let mut e0 = GenericRow::new(2);
+            e0.set_field(0, 7_i32);
+            e0.set_field(1, "x");
+            w.write_row(0, &e0).expect("e0");
+            w.set_null_at(1);
+            let mut e2 = GenericRow::new(2);
+            e2.set_field(0, 8_i32);
+            e2.set_field(1, "y");
+            w.write_row(2, &e2).expect("e2");
+            w.complete().expect("arr_of_row_1")
+        };
+        row1.set_field(4, arr_of_row_1);
+        for i in plan.section_range("row_basics") {
+            row1.set_field(i, Datum::Null);
+        }
+        // Empty MAP
+        let empty_map = FlussMapWriter::new(0, &DataTypes::string(), &DataTypes::int())
+            .complete()
+            .expect("empty_map");
+        row1.set_field(8, Datum::Map(empty_map));
+        for i in (plan.idx("map_string_int") + 1)..plan.len() {
+            row1.set_field(i, Datum::Null);
+        }
 
-        append_writer.append(&row).expect("append");
-        append_writer.flush().await.expect("Failed to flush");
+        // Row 2 — every column NULL.
+        let mut row2 = GenericRow::new(column_count);
+        row2.set_field(0, 3_i32);
+        for i in 1..column_count {
+            row2.set_field(i, Datum::Null);
+        }
 
-        let records = scan_table(&table, |scan| scan).await;
-        assert_eq!(records.len(), 1);
-        let r = records[0].row();
+        writer.append(&row0).expect("append row0");
+        writer.append(&row1).expect("append row1");
+        writer.append(&row2).expect("append row2");
+        writer.flush().await.expect("flush");
 
-        // Verify arr_bytes
-        let ab = r.get_array(1).unwrap();
-        assert_eq!(ab.size(), 2);
-        assert_eq!(ab.get_binary(0).unwrap(), elem_bytes);
-        assert!(ab.is_null_at(1));
+        let records = scan_table(&table, |scan| scan).await;
+        assert_eq!(records.len(), 3);
+        let r0 = records[0].row();
+        let r1 = records[1].row();
+        let r2 = records[2].row();
 
-        // Verify arr_date
-        let ad = r.get_array(2).unwrap();
-        assert_eq!(ad.size(), 2);
-        assert_eq!(ad.get_date(0).unwrap().get_inner(), d.get_inner());
-        assert!(ad.is_null_at(1));
+        assert_eq!(r0.get_int(0).unwrap(), 1);
+        assert_eq!(r1.get_int(0).unwrap(), 2);
+        assert_eq!(r2.get_int(0).unwrap(), 3);
 
-        // Verify arr_time
-        let at = r.get_array(3).unwrap();
-        assert_eq!(at.size(), 2);
-        assert_eq!(at.get_time(0).unwrap().get_inner(), t.get_inner());
-        assert!(at.is_null_at(1));
+        // === ARRAY: basic shapes ===
+        let arr_int = r0.get_array(1).unwrap();
+        assert_eq!(arr_int.size(), 3);
+        assert_eq!(arr_int.get_int(0).unwrap(), 10);
+        assert_eq!(arr_int.get_int(2).unwrap(), 30);
+        let arr_string = r0.get_array(2).unwrap();
+        assert_eq!(arr_string.size(), 2);
+        assert_eq!(arr_string.get_string(0).unwrap(), "hello");
+        assert_eq!(arr_string.get_string(1).unwrap(), "world");
+        let arr_of_arr = r0.get_array(3).unwrap();
+        assert_eq!(arr_of_arr.size(), 2);
+        let inner = arr_of_arr.get_array(0).unwrap();
+        assert_eq!(inner.size(), 2);
+        assert_eq!(inner.get_int(0).unwrap(), 1);
+        assert_eq!(inner.get_int(1).unwrap(), 2);
+        let inner = arr_of_arr.get_array(1).unwrap();
+        assert_eq!(inner.get_int(0).unwrap(), 3);
+        assert_eq!(inner.get_int(1).unwrap(), 4);
+
+        // === ARRAY: edge cases on row 1 (empty + null elements + null inner) ===
+        assert_eq!(r1.get_array(1).unwrap().size(), 0);
+        let arr_string_r1 = r1.get_array(2).unwrap();
+        assert_eq!(arr_string_r1.size(), 1);
+        assert!(arr_string_r1.is_null_at(0));
+        let arr_of_arr_r1 = r1.get_array(3).unwrap();
+        assert_eq!(arr_of_arr_r1.size(), 3);
+        let aa0 = arr_of_arr_r1.get_array(0).unwrap();
+        assert_eq!(aa0.size(), 1);
+        assert_eq!(aa0.get_int(0).unwrap(), 5);
+        assert!(arr_of_arr_r1.is_null_at(1));
+        assert_eq!(arr_of_arr_r1.get_array(2).unwrap().size(), 0);
+
+        // === ARRAY: null whole column on row 2 ===
+        assert!(r2.is_null_at(1).unwrap());
+        assert!(r2.is_null_at(2).unwrap());
+        assert!(r2.is_null_at(3).unwrap());
 
-        // Verify arr_ts_compact
-        let ats = r.get_array(4).unwrap();
-        assert_eq!(ats.size(), 2);
-        let read_ts_compact = ats.get_timestamp_ntz(0, 6).unwrap();
+        // === ARRAY<ROW>: row 0 + row 1 with null element + row 2 null whole ===
+        let aor0 = r0.get_array(4).unwrap();
+        assert_eq!(aor0.size(), 2);
+        let e0 = aor0.get_row(0, &row_seq_label).unwrap();
+        assert_eq!(e0.get_int(0).unwrap(), 1);
+        assert_eq!(e0.get_string(1).unwrap(), "open");
+        let e1 = aor0.get_row(1, &row_seq_label).unwrap();
+        assert_eq!(e1.get_int(0).unwrap(), 2);
+        assert_eq!(e1.get_string(1).unwrap(), "close");
+        let aor1 = r1.get_array(4).unwrap();
+        assert_eq!(aor1.size(), 3);
+        let e0 = aor1.get_row(0, &row_seq_label).unwrap();
+        assert_eq!(e0.get_int(0).unwrap(), 7);
+        assert!(aor1.is_null_at(1));
+        let e2 = aor1.get_row(2, &row_seq_label).unwrap();
+        assert_eq!(e2.get_int(0).unwrap(), 8);
+        assert!(r2.is_null_at(4).unwrap());
+
+        // === ROW: basic + deep + rich types on row 0; row 2 null ===
+        let rb = r0.get_row(5).unwrap();
+        assert_eq!(rb.get_int(0).unwrap(), 42);
+        assert_eq!(rb.get_string(1).unwrap(), "hello");
+        let rd = r0.get_row(6).unwrap();
+        let rd_inner = rd.get_row(0).unwrap();
+        assert_eq!(rd_inner.get_int(0).unwrap(), 99);
+        let rr = r0.get_row(7).unwrap();
+        assert!(rr.get_boolean(0).unwrap());
+        assert_eq!(rr.get_int(1).unwrap(), 100_000);
+        assert_eq!(rr.get_long(2).unwrap(), 9_876_543_210);
+        assert_f32_special(rr.get_float(3).unwrap(), f32::INFINITY);
+        assert!(rr.get_double(4).unwrap().is_nan());
+        assert_eq!(rr.get_string(5).unwrap(), "hello world");
+        assert_eq!(rr.get_bytes(6).unwrap(), b"binary");
+        assert_eq!(rr.get_decimal(7, 10, 2).unwrap(), dec);
+        assert_eq!(rr.get_date(8).unwrap().get_inner(), 20476);
+        assert_eq!(rr.get_time(9).unwrap().get_inner(), 36_827_123);
+        assert_eq!(
+            rr.get_timestamp_ntz(10, 6).unwrap().get_millisecond(),
+            1_769_163_227_123
+        );
+        assert_eq!(
+            rr.get_timestamp_ltz(11, 6).unwrap().get_epoch_millisecond(),
+            1_769_163_227_456
+        );
+        assert_eq!(rr.get_binary(12, 4).unwrap(), b"\x01\x02\x03\x04");
+        let f_arr = rr.get_array(13).unwrap();
+        assert_eq!(f_arr.size(), 3);
+        assert_eq!(f_arr.get_int(0).unwrap(), 7);
+        assert!(f_arr.is_null_at(1));
+        assert!(r2.is_null_at(5).unwrap());
+        assert!(r2.is_null_at(6).unwrap());
+        assert!(r2.is_null_at(7).unwrap());
+
+        // === MAP: basic (with null value) + empty (row 1) + null (row 2) ===
+        let m = r0.get_map(8).unwrap();
+        assert_eq!(m.size(), 3);
+        assert_eq!(m.get(&Datum::from("a")).unwrap(), Some(Datum::from(1_i32)));
+        assert_eq!(m.get(&Datum::from("b")).unwrap(), Some(Datum::Null));
+        assert_eq!(m.get(&Datum::from("c")).unwrap(), Some(Datum::from(3_i32)));
+        assert_eq!(r1.get_map(8).unwrap().size(), 0);
+        assert!(r2.is_null_at(8).unwrap());
+
+        // === MAP<K, ROW> ===
+        let m = r0.get_map(9).unwrap();
+        assert_eq!(m.size(), 2);
+        let keys = m.key_array();
+        let values = m.value_array();
+        assert_eq!(keys.get_string(0).unwrap(), "e0");
+        let v0 = values.get_row(0, &row_seq_label).unwrap();
+        assert_eq!(v0.get_int(0).unwrap(), 1);
+        assert_eq!(v0.get_string(1).unwrap(), "open");
+        assert_eq!(keys.get_string(1).unwrap(), "e1");
+        let v1 = values.get_row(1, &row_seq_label).unwrap();
+        assert_eq!(v1.get_int(0).unwrap(), 2);
+        assert_eq!(v1.get_string(1).unwrap(), "close");
+
+        // === MAP<K, MAP> ===
+        let m = r0.get_map(10).unwrap();
+        assert_eq!(m.size(), 2);
+        let g1 = m
+            .value_array()
+            .get_map(0, &DataTypes::string(), &DataTypes::int())
+            .unwrap();
+        assert_eq!(g1.size(), 2);
+        assert_eq!(g1.get(&Datum::from("a")).unwrap(), Some(Datum::from(1_i32)));
+        let g2 = m
+            .value_array()
+            .get_map(1, &DataTypes::string(), &DataTypes::int())
+            .unwrap();
+        assert_eq!(g2.size(), 1);
+        assert_eq!(g2.get(&Datum::from("c")).unwrap(), Some(Datum::from(3_i32)));
+
+        // === MAP<K, ARRAY> + ARRAY<MAP> ===
+        let m = r0.get_map(11).unwrap();
+        assert_eq!(m.size(), 2);
+        let primes = m.value_array().get_array(0).unwrap();
+        assert_eq!(primes.size(), 3);
+        assert_eq!(primes.get_int(2).unwrap(), 5);
+        let am = r0.get_array(12).unwrap();
+        assert_eq!(am.size(), 2);
+        let am0 = am
+            .get_map(0, &DataTypes::string(), &DataTypes::int())
+            .unwrap();
+        assert_eq!(am0.size(), 2);
+        let am1 = am
+            .get_map(1, &DataTypes::string(), &DataTypes::int())
+            .unwrap();
+        assert_eq!(am1.size(), 1);
         assert_eq!(
-            read_ts_compact.get_millisecond(),
-            ts_compact.get_millisecond()
+            am1.get(&Datum::from("z")).unwrap(),
+            Some(Datum::from(9_i32))
         );
+
+        // === ARRAY rich types ===
+        let ab = r0.get_array(13).unwrap();
+        assert_eq!(ab.size(), 2);
+        assert_eq!(ab.get_bytes(0).unwrap(), bytes_v.as_slice());
+        assert!(ab.is_null_at(1));
+        let ad = r0.get_array(14).unwrap();
+        assert_eq!(ad.get_date(0).unwrap().get_inner(), date_v.get_inner());
+        assert!(ad.is_null_at(1));
+        let at = r0.get_array(15).unwrap();
+        assert_eq!(at.get_time(0).unwrap().get_inner(), time_v.get_inner());
+        assert!(at.is_null_at(1));
+        let ats = r0.get_array(16).unwrap();
+        let read_ts = ats.get_timestamp_ntz(0, 6).unwrap();
+        assert_eq!(read_ts.get_millisecond(), ts_v.get_millisecond());
         assert_eq!(
-            read_ts_compact.get_nano_of_millisecond(),
-            ts_compact.get_nano_of_millisecond()
+            read_ts.get_nano_of_millisecond(),
+            ts_v.get_nano_of_millisecond()
         );
         assert!(ats.is_null_at(1));
-
-        // Verify arr_ts_nano
-        let ats_nano = r.get_array(5).unwrap();
-        assert_eq!(ats_nano.size(), 1);
-        let read_ts_nano = ats_nano.get_timestamp_ntz(0, 9).unwrap();
-        assert_eq!(read_ts_nano.get_millisecond(), ts_nano.get_millisecond());
+        let atl = r0.get_array(17).unwrap();
         assert_eq!(
-            read_ts_nano.get_nano_of_millisecond(),
-            ts_nano.get_nano_of_millisecond()
+            atl.get_timestamp_ltz(0, 3).unwrap().get_epoch_millisecond(),
+            ts_ltz_v.get_epoch_millisecond()
         );
-
-        // Verify arr_decimal_compact
-        let adc = r.get_array(6).unwrap();
-        assert_eq!(adc.size(), 2);
-        assert_eq!(adc.get_decimal(0, 10, 2).unwrap(), dec_compact);
+        assert!(atl.is_null_at(1));
+        let adc = r0.get_array(18).unwrap();
+        assert_eq!(adc.get_decimal(0, 10, 2).unwrap(), dec);
         assert!(adc.is_null_at(1));
-
-        // Verify arr_decimal_big
-        let adb = r.get_array(7).unwrap();
-        assert_eq!(adb.size(), 1);
+        let adb = r0.get_array(19).unwrap();
         assert_eq!(adb.get_decimal(0, 22, 5).unwrap(), dec_big);
-
-        // Verify arr_long_str
-        let als = r.get_array(8).unwrap();
-        assert_eq!(als.size(), 2);
-        assert_eq!(als.get_string(0).unwrap(), "abcdefghi");
-        assert_eq!(als.get_string(1).unwrap(), "longstring_here");
-
-        // Verify arr_float — IEEE 754 specials
-        let af = r.get_array(9).unwrap();
+        let af = r0.get_array(20).unwrap();
         assert_eq!(af.size(), 3);
         assert_f32_special(af.get_float(0).unwrap(), f32::NAN);
         assert_f32_special(af.get_float(1).unwrap(), f32::INFINITY);
         assert_f32_special(af.get_float(2).unwrap(), f32::NEG_INFINITY);
-
-        // Verify arr_double — IEEE 754 specials
-        let adbl = r.get_array(10).unwrap();
-        assert_eq!(adbl.size(), 3);
+        let adbl = r0.get_array(21).unwrap();
         assert_f64_special(adbl.get_double(0).unwrap(), f64::NAN);
         assert_f64_special(adbl.get_double(1).unwrap(), f64::INFINITY);
         assert_f64_special(adbl.get_double(2).unwrap(), f64::NEG_INFINITY);
-
-        // Verify arr_binary — fixed-size binary(4)
-        let fb: FlussArray = r.get_array(11).unwrap();
-        assert_eq!(fb.size(), 2);
+        let fb: FlussArray = r0.get_array(22).unwrap();
         assert_eq!(fb.get_binary(0).unwrap(), fixed_a.as_slice());
         assert_eq!(fb.get_binary(1).unwrap(), fixed_b.as_slice());
 
-        admin
-            .drop_table(&table_path, false)
-            .await
-            .expect("Failed to drop table");
+        // === MAP rich types ===
+        let m = r0.get_map(23).unwrap();
+        assert_eq!(m.value_array().get_bytes(0).unwrap(), bytes_v.as_slice());
+        let m = r0.get_map(24).unwrap();
+        assert_eq!(m.value_array().get_decimal(0, 10, 2).unwrap(), dec);
+        let m = r0.get_map(25).unwrap();
+        assert_eq!(
+            m.value_array().get_date(0).unwrap().get_inner(),
+            date_v.get_inner()
+        );
+        let m = r0.get_map(26).unwrap();
+        assert_eq!(
+            m.value_array().get_time(0).unwrap().get_inner(),
+            time_v.get_inner()
+        );
+        let m = r0.get_map(27).unwrap();
+        let read_ts = m.value_array().get_timestamp_ntz(0, 6).unwrap();
+        assert_eq!(read_ts.get_millisecond(), ts_v.get_millisecond());
+        let m = r0.get_map(28).unwrap();
+        let read_ltz = m.value_array().get_timestamp_ltz(0, 3).unwrap();
+        assert_eq!(
+            read_ltz.get_epoch_millisecond(),
+            ts_ltz_v.get_epoch_millisecond()
+        );
+        let m = r0.get_map(29).unwrap();
+        assert!(m.value_array().get_float(0).unwrap().is_nan());
+        assert!(m.value_array().get_float(1).unwrap().is_infinite());
+        let m = r0.get_map(30).unwrap();
+        assert!(
+            (m.value_array().get_double(0).unwrap() - std::f64::consts::PI).abs() < f64::EPSILON
+        );
+        let m = r0.get_map(31).unwrap();
+        assert!(m.value_array().get_boolean(0).unwrap());
+        assert!(!m.value_array().get_boolean(1).unwrap());
+        let m = r0.get_map(32).unwrap();
+        assert_eq!(m.value_array().get_binary(0).unwrap(), fixed_a.as_slice());
+        let m = r0.get_map(33).unwrap();
+        assert_eq!(m.size(), 2);
+        assert_eq!(m.key_array().get_int(0).unwrap(), 1);
+        assert_eq!(m.value_array().get_string(0).unwrap(), "one");
+
+        // === Convenience API: entries / get / key_type / value_type ===
+        // (exercised on row 0's map_string_int at index 8)
+        let m = r0.get_map(8).unwrap();
+        assert_eq!(m.key_type(), &DataTypes::string().as_non_nullable());
+        assert_eq!(m.value_type(), &DataTypes::int());
+        let mut got: HashMap<String, Option<i32>> = HashMap::with_capacity(m.size());
+        for entry in m.entries() {
+            let (k, v) = entry.expect("decode entry");
+            let key = match k {
+                Datum::String(s) => s.into_owned(),
+                other => panic!("unexpected key variant: {other:?}"),
+            };
+            let value = match v {
+                Datum::Int32(i) => Some(i),
+                Datum::Null => None,
+                other => panic!("unexpected value variant: {other:?}"),
+            };
+            got.insert(key, value);
+        }
+        let expected: HashMap<String, Option<i32>> = HashMap::from([
+            ("a".to_string(), Some(1)),
+            ("b".to_string(), None),
+            ("c".to_string(), Some(3)),
+        ]);
+        assert_eq!(got, expected);
+        assert_eq!(m.get(&Datum::from("a")).unwrap(), Some(Datum::from(1_i32)));
+        assert!(m.get(&Datum::from("missing")).unwrap().is_none());
+
+        // === Bulk write via FlussMapWriter::extend (covered with a fresh map) ===
+        let src: HashMap<&str, i32> = HashMap::from([("a", 1), ("b", 2), ("c", 3)]);
+        let extend_built = {
+            let mut w = FlussMapWriter::new(src.len(), &DataTypes::string(), &DataTypes::int());
+            w.extend(src.clone()).expect("extend");
+            w.complete().expect("extend-complete")
+        };
+        assert_eq!(extend_built.size(), src.len());
+        let extend_b = extend_built.get(&Datum::from("b")).unwrap();
+        assert_eq!(extend_b, Some(Datum::from(2_i32)));
+
+        // === Scalars: integer family ===
+        assert_eq!(r0.get_byte(34).unwrap(), scalar_tinyint);
+        assert_eq!(r0.get_short(35).unwrap(), scalar_smallint);
+        assert_eq!(r0.get_long(36).unwrap(), scalar_bigint);
+
+        // === Scalars: floating point ===
+        assert!((r0.get_float(37).unwrap() - scalar_float).abs() < f32::EPSILON);
+        assert!((r0.get_double(38).unwrap() - scalar_double).abs() < f64::EPSILON);
+
+        // === Scalars: boolean / char / string ===
+        assert!(r0.get_boolean(39).unwrap());
+        assert_eq!(r0.get_char(40, 10).unwrap(), scalar_char);
+        assert_eq!(r0.get_string(41).unwrap(), scalar_string);
+
+        // === Scalars: decimal / date ===
+        assert_eq!(r0.get_decimal(42, 10, 2).unwrap(), dec);
+        assert_eq!(r0.get_date(43).unwrap().get_inner(), date_v.get_inner());
+
+        // === Scalars: time across all four precisions ===
+        assert_eq!(
+            r0.get_time(44).unwrap().get_inner(),
+            scalar_time_s.get_inner()
+        );
+        assert_eq!(
+            r0.get_time(45).unwrap().get_inner(),
+            scalar_time_ms.get_inner()
+        );
+        assert_eq!(
+            r0.get_time(46).unwrap().get_inner(),
+            scalar_time_us.get_inner()
+        );
+        assert_eq!(
+            r0.get_time(47).unwrap().get_inner(),
+            scalar_time_ns.get_inner()
+        );
+
+        // === Scalars: timestamp across all four precisions ===
+        assert_eq!(
+            r0.get_timestamp_ntz(48, 0).unwrap().get_millisecond(),
+            scalar_ts_s.get_millisecond()
+        );
+        assert_eq!(
+            r0.get_timestamp_ntz(49, 3).unwrap().get_millisecond(),
+            scalar_ts_ms.get_millisecond()
+        );
+        let read_us = r0.get_timestamp_ntz(50, 6).unwrap();
+        assert_eq!(read_us.get_millisecond(), scalar_ts_us.get_millisecond());
+        assert_eq!(
+            read_us.get_nano_of_millisecond(),
+            scalar_ts_us.get_nano_of_millisecond()
+        );
+        let read_ns = r0.get_timestamp_ntz(51, 9).unwrap();
+        assert_eq!(read_ns.get_millisecond(), scalar_ts_ns.get_millisecond());
+        assert_eq!(
+            read_ns.get_nano_of_millisecond(),
+            scalar_ts_ns.get_nano_of_millisecond()
+        );
+
+        // === Scalars: timestamp_ltz across all four precisions ===
+        assert_eq!(
+            r0.get_timestamp_ltz(52, 0).unwrap().get_epoch_millisecond(),
+            scalar_ts_ltz_s.get_epoch_millisecond()
+        );
+        assert_eq!(
+            r0.get_timestamp_ltz(53, 3).unwrap().get_epoch_millisecond(),
+            scalar_ts_ltz_ms.get_epoch_millisecond()
+        );
+        let read_ltz_us = r0.get_timestamp_ltz(54, 6).unwrap();
+        assert_eq!(
+            read_ltz_us.get_epoch_millisecond(),
+            scalar_ts_ltz_us.get_epoch_millisecond()
+        );
+        assert_eq!(
+            read_ltz_us.get_nano_of_millisecond(),
+            scalar_ts_ltz_us.get_nano_of_millisecond()
+        );
+        let read_ltz_ns = r0.get_timestamp_ltz(55, 9).unwrap();
+        assert_eq!(
+            read_ltz_ns.get_epoch_millisecond(),
+            scalar_ts_ltz_ns.get_epoch_millisecond()
+        );
+        assert_eq!(
+            read_ltz_ns.get_nano_of_millisecond(),
+            scalar_ts_ltz_ns.get_nano_of_millisecond()
+        );
+
+        // === Scalars: bytes + fixed binary ===
+        assert_eq!(r0.get_bytes(56).unwrap(), scalar_bytes_top.as_slice());
+        assert_eq!(r0.get_binary(57, 4).unwrap(), scalar_binary_top.as_slice());
+
+        // === Scalars: negative-epoch timestamps (pre-1970) ===
+        let read_neg_us = r0.get_timestamp_ntz(58, 6).unwrap();
+        assert_eq!(
+            read_neg_us.get_millisecond(),
+            scalar_ts_us_neg.get_millisecond()
+        );
+        assert_eq!(
+            read_neg_us.get_nano_of_millisecond(),
+            scalar_ts_us_neg.get_nano_of_millisecond()
+        );
+        let read_neg_ns = r0.get_timestamp_ntz(59, 9).unwrap();
+        assert_eq!(
+            read_neg_ns.get_millisecond(),
+            scalar_ts_ns_neg.get_millisecond()
+        );
+        assert_eq!(
+            read_neg_ns.get_nano_of_millisecond(),
+            scalar_ts_ns_neg.get_nano_of_millisecond()
+        );
+        let read_neg_ltz_us = r0.get_timestamp_ltz(60, 6).unwrap();
+        assert_eq!(
+            read_neg_ltz_us.get_epoch_millisecond(),
+            scalar_ts_ltz_us_neg.get_epoch_millisecond()
+        );
+        let read_neg_ltz_ns = r0.get_timestamp_ltz(61, 9).unwrap();
+        assert_eq!(
+            read_neg_ltz_ns.get_epoch_millisecond(),
+            scalar_ts_ltz_ns_neg.get_epoch_millisecond()
+        );
+
+        // === Scalars: every column NULL on row 2 ===
+        for i in plan.section_range("scalars") {
+            assert!(
+                r2.is_null_at(i).unwrap(),
+                "scalar column {i} should be null"
+            );
+        }
+
+        // === Append-side validation: malformed rows are rejected client-side ===
+        // Field count mismatch — far fewer fields than the schema demands.
+        let mut undersized = GenericRow::new(2);
+        undersized.set_field(0, true);
+        let err = writer.append(&undersized).unwrap_err().to_string();
+        assert!(
+            err.contains(&format!("Expected: {column_count}")) && err.contains("Actual: 2"),
+            "expected field-count error, got: {err}"
+        );
+
+        // Type mismatch — correct field count but every cell is Bool, which
+        // satisfies none of the column types except col_boolean.
+        let wrong_types = GenericRow::from_data(
+            (0..column_count)
+                .map(|_| Datum::Bool(true))
+                .collect::<Vec<_>>(),
+        );
+        assert!(
+            writer.append(&wrong_types).is_err(),
+            "row with wrong types should be rejected, not panic"
+        );
+
+        admin.drop_table(&table_path, false).await.expect("drop");
     }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index 81a7c0b107..58c77f035b 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -17,7 +17,9 @@
  */
 use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
 use fluss::client::FlussAdmin;
-use fluss::metadata::{DataTypes, PartitionSpec, TableDescriptor, TablePath};
+use fluss::metadata::{
+    DataField, DataType, DataTypes, PartitionSpec, RowType, Schema, TableDescriptor, TablePath,
+};
 use fluss::row::FlussArray;
 use fluss::row::binary_array::FlussArrayWriter;
 use std::collections::HashMap;
@@ -176,3 +178,242 @@ pub async fn create_partitions(
             .expect("Failed to create partition");
     }
 }
+
+/// `ARRAY<INT>` data type; the building block for the nested array columns below.
+pub fn dt_array_int() -> DataType {
+    DataTypes::array(DataTypes::int())
+}
+
+/// `MAP<STRING, INT>` data type; the building block for the nested map columns below.
+pub fn dt_map_string_int() -> DataType {
+    DataTypes::map(DataTypes::string(), DataTypes::int())
+}
+
+/// `ROW<seq INT, label STRING>` data type.
+pub fn dt_row_seq_label() -> DataType {
+    DataTypes::row(vec![
+        DataField::new("seq", DataTypes::int(), None),
+        DataField::new("label", DataTypes::string(), None),
+    ])
+}
+
+/// Returns a clone of the `RowType` wrapped by a `DataType::Row`.
+///
+/// # Panics
+/// Panics if `dt` is any variant other than `DataType::Row`.
+pub fn as_row_type(dt: &DataType) -> RowType {
+    match dt {
+        DataType::Row(rt) => rt.clone(),
+        other => panic!("expected DataType::Row, got {other:?}"),
+    }
+}
+
+/// `ROW<inner ROW<n INT>>` data type: a row nested inside another row.
+pub fn dt_row_deep() -> DataType {
+    let inner = DataTypes::row(vec![DataField::new("n", DataTypes::int(), None)]);
+    DataTypes::row(vec![DataField::new("inner", inner, None)])
+}
+
+/// Row type with one field per kind: boolean, int, bigint, float, double, string, bytes,
+/// decimal(10, 2), date, time(3), timestamp(6), timestamp_ltz(6), binary(4) and `ARRAY<INT>`.
+pub fn dt_row_rich() -> DataType {
+    DataTypes::row(vec![
+        DataField::new("f_bool", DataTypes::boolean(), None),
+        DataField::new("f_int", DataTypes::int(), None),
+        DataField::new("f_long", DataTypes::bigint(), None),
+        DataField::new("f_float", DataTypes::float(), None),
+        DataField::new("f_double", DataTypes::double(), None),
+        DataField::new("f_str", DataTypes::string(), None),
+        DataField::new("f_bytes", DataTypes::bytes(), None),
+        DataField::new("f_decimal", DataTypes::decimal(10, 2), None),
+        DataField::new("f_date", DataTypes::date(), None),
+        DataField::new("f_time", DataTypes::time_with_precision(3), None),
+        DataField::new("f_ts_ntz", DataTypes::timestamp_with_precision(6), None),
+        DataField::new("f_ts_ltz", DataTypes::timestamp_ltz_with_precision(6), None),
+        DataField::new("f_binary_fixed", DataTypes::binary(4), None),
+        DataField::new("f_array_int", dt_array_int(), None),
+    ])
+}
+
+/// Named ARRAY columns: flat int and string arrays, an array of arrays and an array of rows.
+pub fn array_dt_basics_columns() -> Vec<(&'static str, DataType)> {
+    vec![
+        ("arr_int", dt_array_int()),
+        ("arr_string", DataTypes::array(DataTypes::string())),
+        ("arr_of_arr", DataTypes::array(dt_array_int())),
+        ("arr_of_row", DataTypes::array(dt_row_seq_label())),
+    ]
+}
+
+/// Named ROW columns: the two-field, nested and rich row types defined above.
+pub fn row_dt_basics_columns() -> Vec<(&'static str, DataType)> {
+    vec![
+        ("row_basic", dt_row_seq_label()),
+        ("row_deep", dt_row_deep()),
+        ("row_rich", dt_row_rich()),
+    ]
+}
+
+/// Named MAP columns (int, row, map and array values) plus one array-of-map column.
+pub fn map_dt_basics_columns() -> Vec<(&'static str, DataType)> {
+    vec![
+        ("map_string_int", dt_map_string_int()),
+        (
+            "map_of_row",
+            DataTypes::map(DataTypes::string(), dt_row_seq_label()),
+        ),
+        (
+            "map_of_map",
+            DataTypes::map(DataTypes::string(), dt_map_string_int()),
+        ),
+        (
+            "map_of_array",
+            DataTypes::map(DataTypes::string(), dt_array_int()),
+        ),
+        ("array_of_map", DataTypes::array(dt_map_string_int())),
+    ]
+}
+
+/// Top-level scalar columns: integers, floats, boolean, char, string, decimal, date, bytes,
+/// fixed binary, and time / timestamp / timestamp_ltz at precisions 0, 3, 6 and 9.
+pub fn scalar_dt_columns() -> Vec<(&'static str, DataType)> {
+    vec![
+        ("col_tinyint", DataTypes::tinyint()),
+        ("col_smallint", DataTypes::smallint()),
+        ("col_bigint", DataTypes::bigint()),
+        ("col_float", DataTypes::float()),
+        ("col_double", DataTypes::double()),
+        ("col_boolean", DataTypes::boolean()),
+        ("col_char", DataTypes::char(10)),
+        ("col_string", DataTypes::string()),
+        ("col_decimal", DataTypes::decimal(10, 2)),
+        ("col_date", DataTypes::date()),
+        ("col_time_s", DataTypes::time_with_precision(0)),
+        ("col_time_ms", DataTypes::time_with_precision(3)),
+        ("col_time_us", DataTypes::time_with_precision(6)),
+        ("col_time_ns", DataTypes::time_with_precision(9)),
+        ("col_ts_s", DataTypes::timestamp_with_precision(0)),
+        ("col_ts_ms", DataTypes::timestamp_with_precision(3)),
+        ("col_ts_us", DataTypes::timestamp_with_precision(6)),
+        ("col_ts_ns", DataTypes::timestamp_with_precision(9)),
+        ("col_ts_ltz_s", DataTypes::timestamp_ltz_with_precision(0)),
+        ("col_ts_ltz_ms", DataTypes::timestamp_ltz_with_precision(3)),
+        ("col_ts_ltz_us", DataTypes::timestamp_ltz_with_precision(6)),
+        ("col_ts_ltz_ns", DataTypes::timestamp_ltz_with_precision(9)),
+        ("col_bytes_top", DataTypes::bytes()),
+        ("col_binary_top", DataTypes::binary(4)),
+        ("col_ts_us_neg", DataTypes::timestamp_with_precision(6)),
+        ("col_ts_ns_neg", DataTypes::timestamp_with_precision(9)),
+        (
+            "col_ts_ltz_us_neg",
+            DataTypes::timestamp_ltz_with_precision(6),
+        ),
+        (
+            "col_ts_ltz_ns_neg",
+            DataTypes::timestamp_ltz_with_precision(9),
+        ),
+    ]
+}
+
+/// Chainable, ordered list of named and typed columns, optionally grouped into named
+/// sections, from which a `Schema` can be built and column positions looked up by name.
+#[derive(Default)]
+pub struct ColumnPlan {
+    /// Columns in insertion order.
+    cols: Vec<(&'static str, DataType)>,
+    /// Column name -> position in `cols`.
+    index: HashMap<&'static str, usize>,
+    /// `(section name, position of its first column)` in the order sections were started.
+    sections: Vec<(&'static str, usize)>,
+}
+
+impl ColumnPlan {
+    /// Creates an empty plan with no columns and no sections.
+    pub fn new() -> Self {
+        Self::default()
+    }
+
+    /// Appends a column and returns the plan for chaining.
+    ///
+    /// # Panics
+    /// Panics if a column named `name` was already added.
+    pub fn add(mut self, name: &'static str, dt: DataType) -> Self {
+        let prev = self.index.insert(name, self.cols.len());
+        assert!(prev.is_none(), "duplicate column in plan: {name}");
+        self.cols.push((name, dt));
+        self
+    }
+
+    /// Appends every `(name, type)` pair from `it`, in iteration order, by calling `add`.
+    pub fn extend<I: IntoIterator<Item = (&'static str, DataType)>>(mut self, it: I) -> Self {
+        for (n, dt) in it {
+            self = self.add(n, dt);
+        }
+        self
+    }
+
+    /// Marks the next column added as the start of a named section. Each call
+    /// closes the previous section; the last section runs to the end of the plan.
+    ///
+    /// # Panics
+    /// Panics if a section named `name` was already started.
+    pub fn start_section(mut self, name: &'static str) -> Self {
+        assert!(
+            !self.sections.iter().any(|(n, _)| *n == name),
+            "duplicate section: {name}"
+        );
+        self.sections.push((name, self.cols.len()));
+        self
+    }
+
+    /// Builds a `Schema` containing the columns in plan order; when `pk` is `Some`,
+    /// the listed column names are passed to the schema builder as the primary key.
+    ///
+    /// # Panics
+    /// Panics if the schema builder returns an error.
+    pub fn build_schema(&self, pk: Option<&[&str]>) -> Schema {
+        let mut sb = Schema::builder();
+        for (n, dt) in &self.cols {
+            sb = sb.column(*n, dt.clone());
+        }
+        if let Some(keys) = pk {
+            sb = sb.primary_key(keys.iter().copied());
+        }
+        sb.build().expect("schema build")
+    }
+
+    /// Returns the zero-based position of column `name`.
+    ///
+    /// # Panics
+    /// Panics if no column with that name is in the plan.
+    pub fn idx(&self, name: &str) -> usize {
+        *self
+            .index
+            .get(name)
+            .unwrap_or_else(|| panic!("unknown column in plan: {name}"))
+    }
+
+    /// Number of columns in the plan.
+    pub fn len(&self) -> usize {
+        self.cols.len()
+    }
+
+    /// Half-open range of the named section: `[its start, next section's start or plan end)`.
+    ///
+    /// # Panics
+    /// Panics if no section named `name` was started.
+    pub fn section_range(&self, name: &str) -> std::ops::Range<usize> {
+        let pos = self
+            .sections
+            .iter()
+            .position(|(n, _)| *n == name)
+            .unwrap_or_else(|| panic!("unknown section: {name}"));
+        let start = self.sections[pos].1;
+        let end = self
+            .sections
+            .get(pos + 1)
+            .map(|(_, s)| *s)
+            .unwrap_or(self.cols.len());
+        start..end
+    }
+}

From 5ef93a8ba0f17173b3e5872f8cf9b13dd24d1abf Mon Sep 17 00:00:00 2001
From: slfan1989 <55643692+slfan1989@users.noreply.github.com>
Date: Tue, 26 May 2026 01:14:25 +0800
Subject: [PATCH 277/287] [test] Add Rust integration coverage for
 RecordBatchLogReader bounded reads. (#559)

---
 .../crates/fluss/src/client/table/reader.rs   |   8 +-
 .../fluss/tests/integration/log_table.rs      |  32 +-
 .../integration/record_batch_log_reader.rs    | 528 ++++++++++++++++++
 .../crates/fluss/tests/integration/utils.rs   |  19 +
 fluss-rust/crates/fluss/tests/test_fluss.rs   |   1 +
 5 files changed, 560 insertions(+), 28 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs

diff --git a/fluss-rust/crates/fluss/src/client/table/reader.rs b/fluss-rust/crates/fluss/src/client/table/reader.rs
index 0a08803d9e..518c68a222 100644
--- a/fluss-rust/crates/fluss/src/client/table/reader.rs
+++ b/fluss-rust/crates/fluss/src/client/table/reader.rs
@@ -488,10 +488,10 @@ fn filter_batches(
     completed
 }
 
-// TODO: Add Rust-level end-to-end tests with `FlussTestingCluster` (feature
-// `integration_tests`) covering `new_until_latest`, partitioned tables,
-// and `new_until_offsets` stopping semantics. Drop cleanup and the
-// reader-active guard are covered by the Python integration test
+// Rust-level end-to-end coverage for `new_until_latest`, partitioned tables,
+// and `new_until_offsets` stopping semantics lives in
+// `crates/fluss/tests/integration/record_batch_log_reader.rs`. Drop cleanup and the
+// reader-active guard remain covered by the Python integration test
 // `test_to_arrow_batch_reader_drop_and_guard`.
 #[cfg(test)]
 mod tests {
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 5e61ab0724..8bad7398f1 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -20,13 +20,14 @@
 mod table_test {
     use crate::integration::utils::{
         ColumnPlan, array_dt_basics_columns, as_row_type, create_partitions, create_table,
-        dt_array_int, dt_map_string_int, dt_row_seq_label, get_shared_cluster, make_int_array,
-        make_string_array, map_dt_basics_columns, row_dt_basics_columns, scalar_dt_columns,
+        dt_array_int, dt_map_string_int, dt_row_seq_label, extract_ids_from_batches,
+        get_shared_cluster, make_int_array, make_string_array, map_dt_basics_columns,
+        row_dt_basics_columns, scalar_dt_columns,
     };
-    use arrow::array::{Int32Array, record_batch};
+    use arrow::array::record_batch;
     use fluss::client::{EARLIEST_OFFSET, FlussTable, TableScan};
     use fluss::metadata::{DataField, DataTypes, Schema, TableDescriptor, TablePath};
-    use fluss::record::{ScanBatch, ScanRecord};
+    use fluss::record::ScanRecord;
     use fluss::row::binary_array::FlussArrayWriter;
     use fluss::row::binary_map::FlussMapWriter;
     use fluss::row::{
@@ -507,30 +508,13 @@ mod table_test {
             .unwrap();
         writer.flush().await.unwrap();
 
-        fn extract_ids(batches: &[ScanBatch]) -> Vec<i32> {
-            batches
-                .iter()
-                .flat_map(|b| {
-                    let batch = b.batch();
-                    (0..batch.num_rows()).map(move |i| {
-                        batch
-                            .column(0)
-                            .as_any()
-                            .downcast_ref::<Int32Array>()
-                            .unwrap()
-                            .value(i)
-                    })
-                })
-                .collect()
-        }
-
         // poll may return partial results if not all batches are available yet,
         // so we accumulate across multiple polls until we have the expected count.
         let mut all_ids = Vec::new();
         let deadline = tokio::time::Instant::now() + Duration::from_secs(10);
         while all_ids.len() < 6 && tokio::time::Instant::now() < deadline {
             let batches = scanner.poll(Duration::from_secs(5)).await.unwrap();
-            all_ids.extend(extract_ids(&batches));
+            all_ids.extend(extract_ids_from_batches(&batches));
         }
 
         // Test 2: Order should be preserved across multiple batches
@@ -547,7 +531,7 @@ mod table_test {
         let deadline = tokio::time::Instant::now() + Duration::from_secs(10);
         while new_ids.len() < 2 && tokio::time::Instant::now() < deadline {
             let more = scanner.poll(Duration::from_secs(5)).await.unwrap();
-            new_ids.extend(extract_ids(&more));
+            new_ids.extend(extract_ids_from_batches(&more));
         }
 
         // Test 3: Subsequent polls should not return duplicate data (offset continuation)
@@ -561,7 +545,7 @@ mod table_test {
         let deadline = tokio::time::Instant::now() + Duration::from_secs(10);
         while trunc_ids.len() < 5 && tokio::time::Instant::now() < deadline {
             let trunc_batches = trunc_scanner.poll(Duration::from_secs(5)).await.unwrap();
-            trunc_ids.extend(extract_ids(&trunc_batches));
+            trunc_ids.extend(extract_ids_from_batches(&trunc_batches));
         }
 
         // Subscribing from offset 3 should return [4,5,6,7,8], not [1,2,3,4,5,6,7,8]
diff --git a/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs b/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs
new file mode 100644
index 0000000000..1383645316
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs
@@ -0,0 +1,528 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+#[cfg(test)]
+mod reader_test {
+    use crate::integration::utils::{
+        create_partitions, create_table, extract_ids_from_batches, get_shared_cluster,
+    };
+    use arrow::array::record_batch;
+    use fluss::client::{EARLIEST_OFFSET, FlussConnection, RecordBatchLogReader};
+    use fluss::config::{Config, NoKeyAssigner};
+    use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
+    use fluss::rpc::message::OffsetSpec;
+    use std::collections::HashMap;
+    use std::time::Duration;
+
+    #[tokio::test]
+    async fn until_offsets_stops_at_explicit_offset() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+        // Scenario: a reader bounded by an explicit stop offset ends on its own.
+        let table_path = TablePath::new("fluss", "test_reader_until_offsets");
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+        create_table(&admin, &table_path, &table_descriptor).await;
+        tokio::time::sleep(Duration::from_secs(1)).await;
+        // Write six rows in one batch; the assertion below expects id N at offset N - 1.
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+        writer
+            .append_arrow_batch(
+                record_batch!(
+                    ("id", Int32, [1, 2, 3, 4, 5, 6]),
+                    ("name", Utf8, ["a", "b", "c", "d", "e", "f"])
+                )
+                .unwrap(),
+            )
+            .expect("Failed to append batch");
+        writer.flush().await.expect("Failed to flush");
+        // Start bucket 0 at offset 1, i.e. skip the first row.
+        let scanner = table
+            .new_scan()
+            .create_record_batch_log_scanner()
+            .expect("Failed to create record batch scanner");
+        scanner
+            .subscribe(0, 1)
+            .await
+            .expect("Failed to subscribe from offset 1");
+        // Stop offset 4 is exclusive, so the reader should cover offsets [1, 4).
+        let table_id = table.get_table_info().table_id;
+        let mut reader = RecordBatchLogReader::new_until_offsets(
+            scanner,
+            HashMap::from([(TableBucket::new(table_id, 0), 4)]),
+        )
+        .expect("Failed to create record batch reader");
+        // The timeout converts a reader that never terminates into a test failure.
+        let batches = tokio::time::timeout(Duration::from_secs(10), reader.collect_all_batches())
+            .await
+            .expect("Timed out collecting bounded reader batches")
+            .expect("Failed to collect bounded reader batches");
+
+        assert_eq!(
+            extract_ids_from_batches(&batches),
+            vec![2, 3, 4],
+            "reader should include offsets [1, 4) and stop before offset 4"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn until_offsets_with_empty_range() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+        // Scenario: start offset == stop offset, so the reader has nothing to read.
+        let table_path = TablePath::new("fluss", "test_reader_until_offsets_empty_range");
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+        create_table(&admin, &table_path, &table_descriptor).await;
+        tokio::time::sleep(Duration::from_secs(1)).await;
+        // Three rows are written, so an empty result cannot come from an empty log.
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+        writer
+            .append_arrow_batch(
+                record_batch!(("id", Int32, [1, 2, 3]), ("name", Utf8, ["a", "b", "c"])).unwrap(),
+            )
+            .expect("Failed to append batch");
+        writer.flush().await.expect("Failed to flush");
+        // Subscribe bucket 0 at offset 1 ...
+        let scanner = table
+            .new_scan()
+            .create_record_batch_log_scanner()
+            .expect("Failed to create record batch scanner");
+        scanner
+            .subscribe(0, 1)
+            .await
+            .expect("Failed to subscribe from offset 1");
+        // ... and use that same offset 1 as the stop offset.
+        let table_id = table.get_table_info().table_id;
+        let mut reader = RecordBatchLogReader::new_until_offsets(
+            scanner,
+            HashMap::from([(TableBucket::new(table_id, 0), 1)]),
+        )
+        .expect("Failed to create record batch reader");
+        // The reader must terminate by itself; the timeout catches a hang.
+        let batches = tokio::time::timeout(Duration::from_secs(10), reader.collect_all_batches())
+            .await
+            .expect("Timed out collecting empty-range reader batches")
+            .expect("Failed to collect empty-range reader batches");
+
+        assert!(
+            batches.is_empty(),
+            "reader should return no batches when start and stop offsets are equal"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn until_offsets_past_end_of_log() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+        // Scenario: the stop offset lies beyond the current end of the log.
+        let table_path = TablePath::new("fluss", "test_reader_until_offsets_past_end");
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+        create_table(&admin, &table_path, &table_descriptor).await;
+        tokio::time::sleep(Duration::from_secs(1)).await;
+        // Only three rows are written up front.
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+        writer
+            .append_arrow_batch(
+                record_batch!(("id", Int32, [1, 2, 3]), ("name", Utf8, ["a", "b", "c"])).unwrap(),
+            )
+            .expect("Failed to append initial batch");
+        writer.flush().await.expect("Failed to flush initial batch");
+        // Read bucket 0 from the earliest offset.
+        let scanner = table
+            .new_scan()
+            .create_record_batch_log_scanner()
+            .expect("Failed to create record batch scanner");
+        scanner
+            .subscribe(0, EARLIEST_OFFSET)
+            .await
+            .expect("Failed to subscribe bucket");
+        // Stop offset 6 is more than the three rows written so far can satisfy.
+        let table_id = table.get_table_info().table_id;
+        let mut reader = RecordBatchLogReader::new_until_offsets(
+            scanner,
+            HashMap::from([(TableBucket::new(table_id, 0), 6)]),
+        )
+        .expect("Failed to create record batch reader");
+        // Collect on a spawned task so this test can append more rows while it runs.
+        let collect_task = tokio::spawn(async move { reader.collect_all_batches().await });
+        tokio::time::sleep(Duration::from_millis(750)).await;
+        assert!(
+            !collect_task.is_finished(),
+            "reader should wait when the stopping offset is beyond the current log end"
+        );
+        // Three more rows give six in total, which should let the reader reach offset 6.
+        writer
+            .append_arrow_batch(
+                record_batch!(("id", Int32, [4, 5, 6]), ("name", Utf8, ["d", "e", "f"])).unwrap(),
+            )
+            .expect("Failed to append follow-up batch");
+        writer
+            .flush()
+            .await
+            .expect("Failed to flush follow-up batch");
+
+        let batches = tokio::time::timeout(Duration::from_secs(10), collect_task)
+            .await
+            .expect("Timed out collecting reader batches after appending past stop offset")
+            .expect("Reader task panicked")
+            .expect("Failed to collect reader batches");
+
+        assert_eq!(
+            extract_ids_from_batches(&batches),
+            vec![1, 2, 3, 4, 5, 6],
+            "reader should resume after future records arrive and stop at the requested offset"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn until_offsets_multi_bucket() {
+        let cluster = get_shared_cluster();
+        let connection = FlussConnection::new(Config {
+            writer_acks: "all".to_string(),
+            bootstrap_servers: cluster.plaintext_bootstrap_servers().to_string(),
+            writer_bucket_no_key_assigner: NoKeyAssigner::RoundRobin,
+            ..Default::default()
+        })
+        .await
+        .expect("Failed to connect with round-robin bucket assignment");
+        let admin = connection.get_admin().expect("Failed to get admin");
+        // Scenario: per-bucket stop offsets on a table with two buckets.
+        let table_path = TablePath::new("fluss", "test_reader_until_offsets_multi_bucket");
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .distributed_by(Some(2), vec!["id".to_string()])
+            .build()
+            .expect("Failed to build table");
+        create_table(&admin, &table_path, &table_descriptor).await;
+        tokio::time::sleep(Duration::from_secs(1)).await;
+        // Two appended batches; the round-robin assigner is expected to use both buckets.
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+        writer
+            .append_arrow_batch(
+                record_batch!(
+                    ("id", Int32, [1, 2, 3, 4]),
+                    ("name", Utf8, ["a", "b", "c", "d"])
+                )
+                .unwrap(),
+            )
+            .expect("Failed to append first batch");
+        writer
+            .append_arrow_batch(
+                record_batch!(
+                    ("id", Int32, [5, 6, 7, 8]),
+                    ("name", Utf8, ["e", "f", "g", "h"])
+                )
+                .unwrap(),
+            )
+            .expect("Failed to append second batch");
+        writer.flush().await.expect("Failed to flush");
+        // Precondition: both buckets received records (latest offset > 0).
+        let latest_offsets = admin
+            .list_offsets(&table_path, &[0, 1], OffsetSpec::Latest)
+            .await
+            .expect("Failed to list latest offsets");
+        assert!(
+            latest_offsets.values().all(|offset| *offset > 0),
+            "test records should be distributed across both buckets: {latest_offsets:?}"
+        );
+        // Read both buckets from offset 0.
+        let scanner = table
+            .new_scan()
+            .create_record_batch_log_scanner()
+            .expect("Failed to create record batch scanner");
+        scanner
+            .subscribe_buckets(&HashMap::from([(0, 0), (1, 0)]))
+            .await
+            .expect("Failed to subscribe to multiple buckets");
+        // Use each bucket's latest offset as its stop offset.
+        let table_id = table.get_table_info().table_id;
+        let stopping_offsets: HashMap<TableBucket, i64> = latest_offsets
+            .into_iter()
+            .map(|(bucket, offset)| (TableBucket::new(table_id, bucket), offset))
+            .collect();
+        assert_eq!(
+            stopping_offsets.len(),
+            2,
+            "reader should track two stopping offsets"
+        );
+
+        let mut reader = RecordBatchLogReader::new_until_offsets(scanner, stopping_offsets)
+            .expect("Failed to create record batch reader");
+        let batches = tokio::time::timeout(Duration::from_secs(10), reader.collect_all_batches())
+            .await
+            .expect("Timed out collecting multi-bucket reader batches")
+            .expect("Failed to collect multi-bucket reader batches");
+        // Arrival order across buckets is not asserted, hence the sort.
+        let mut ids = extract_ids_from_batches(&batches);
+        ids.sort();
+        assert_eq!(ids, vec![1, 2, 3, 4, 5, 6, 7, 8]);
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn until_latest_reads_non_partitioned_table() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+        // Scenario: `new_until_latest` bounds the reader without explicit stop offsets.
+        let table_path = TablePath::new("fluss", "test_reader_non_partitioned_latest");
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+        tokio::time::sleep(Duration::from_secs(1)).await;
+        // Write four rows in one batch and flush before the reader is created.
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+        writer
+            .append_arrow_batch(
+                record_batch!(
+                    ("id", Int32, [1, 2, 3, 4]),
+                    ("name", Utf8, ["a", "b", "c", "d"])
+                )
+                .unwrap(),
+            )
+            .expect("Failed to append batch");
+        writer.flush().await.expect("Failed to flush");
+        // Read bucket 0 from the earliest offset.
+        let scanner = table
+            .new_scan()
+            .create_record_batch_log_scanner()
+            .expect("Failed to create record batch scanner");
+        scanner
+            .subscribe(0, EARLIEST_OFFSET)
+            .await
+            .expect("Failed to subscribe bucket");
+        // The reader is given the admin client instead of a stop-offset map.
+        let mut reader = RecordBatchLogReader::new_until_latest(scanner, &admin)
+            .await
+            .expect("Failed to create latest-offset reader");
+        let batches = tokio::time::timeout(Duration::from_secs(10), reader.collect_all_batches())
+            .await
+            .expect("Timed out collecting non-partitioned reader batches")
+            .expect("Failed to collect non-partitioned reader batches");
+
+        assert_eq!(
+            extract_ids_from_batches(&batches),
+            vec![1, 2, 3, 4],
+            "latest-offset reader should read all records present in the non-partitioned table"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+
+    #[tokio::test]
+    async fn until_latest_reads_partitioned_table() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("Failed to get admin");
+        // Scenario: `new_until_latest` on a table partitioned by `region`.
+        let table_path = TablePath::new("fluss", "test_reader_partitioned_latest");
+        let table_descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("region", DataTypes::string())
+                    .column("value", DataTypes::bigint())
+                    .build()
+                    .expect("Failed to build schema"),
+            )
+            .partitioned_by(vec!["region"])
+            .build()
+            .expect("Failed to build table");
+
+        create_table(&admin, &table_path, &table_descriptor).await;
+        create_partitions(&admin, &table_path, "region", &["US", "EU"]).await;
+        tokio::time::sleep(Duration::from_secs(2)).await;
+        // One writer appends a two-row batch for each of the two regions.
+        let table = connection
+            .get_table(&table_path)
+            .await
+            .expect("Failed to get table");
+        let writer = table
+            .new_append()
+            .expect("Failed to create append")
+            .create_writer()
+            .expect("Failed to create writer");
+
+        let us_batch = record_batch!(
+            ("id", Int32, [1, 2]),
+            ("region", Utf8, ["US", "US"]),
+            ("value", Int64, [100, 200])
+        )
+        .unwrap();
+        writer
+            .append_arrow_batch(us_batch)
+            .expect("Failed to append US batch");
+
+        let eu_batch = record_batch!(
+            ("id", Int32, [3, 4]),
+            ("region", Utf8, ["EU", "EU"]),
+            ("value", Int64, [300, 400])
+        )
+        .unwrap();
+        writer
+            .append_arrow_batch(eu_batch)
+            .expect("Failed to append EU batch");
+        writer.flush().await.expect("Failed to flush");
+        // Subscribe bucket 0 of every listed partition from the earliest offset.
+        let scanner = table
+            .new_scan()
+            .create_record_batch_log_scanner()
+            .expect("Failed to create record batch scanner");
+        for partition in admin
+            .list_partition_infos(&table_path)
+            .await
+            .expect("Failed to list partition infos")
+        {
+            // The table uses the default single-bucket layout, so bucket 0 is
+            // the only bucket in each partition. If this test switches to a
+            // multi-bucket table, subscribe all buckets for each partition.
+            scanner
+                .subscribe_partition(partition.get_partition_id(), 0, EARLIEST_OFFSET)
+                .await
+                .expect("Failed to subscribe partition bucket");
+        }
+
+        let mut reader = RecordBatchLogReader::new_until_latest(scanner, &admin)
+            .await
+            .expect("Failed to create latest-offset reader");
+        let batches = tokio::time::timeout(Duration::from_secs(10), reader.collect_all_batches())
+            .await
+            .expect("Timed out collecting partitioned reader batches")
+            .expect("Failed to collect partitioned reader batches");
+        // Arrival order across partitions is not asserted, hence the sort.
+        let mut ids = extract_ids_from_batches(&batches);
+        ids.sort();
+        assert_eq!(
+            ids,
+            vec![1, 2, 3, 4],
+            "latest-offset reader should read all records present in subscribed partitions"
+        );
+
+        admin
+            .drop_table(&table_path, false)
+            .await
+            .expect("Failed to drop table");
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index 58c77f035b..934b66264e 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -16,10 +16,12 @@
  * limitations under the License.
  */
 use crate::integration::fluss_cluster::{FlussTestingCluster, FlussTestingClusterBuilder};
+use arrow::array::Int32Array;
 use fluss::client::FlussAdmin;
 use fluss::metadata::{
     DataField, DataType, DataTypes, PartitionSpec, RowType, Schema, TableDescriptor, TablePath,
 };
+use fluss::record::ScanBatch;
 use fluss::row::FlussArray;
 use fluss::row::binary_array::FlussArrayWriter;
 use std::collections::HashMap;
@@ -120,6 +122,23 @@ pub fn make_int_array(values: &[Option<i32>]) -> FlussArray {
     writer.complete().expect("Failed to build int array")
 }
 
+/// Returns the `Int32` values of column 0 of every batch, in batch and row
+/// order. Panics if a batch's first column is not an `Int32Array`.
+pub fn extract_ids_from_batches(batches: &[ScanBatch]) -> Vec<i32> {
+    let mut ids = Vec::new();
+    for scan_batch in batches {
+        let batch = scan_batch.batch();
+        // Downcast once per batch instead of once per row.
+        let id_column = batch
+            .column(0)
+            .as_any()
+            .downcast_ref::<Int32Array>()
+            .expect("id column should be Int32");
+        ids.extend((0..batch.num_rows()).map(|row| id_column.value(row)));
+    }
+    ids
+}
+
 /// Similar to wait_for_cluster_ready but connects with SASL credentials.
 pub async fn wait_for_cluster_ready_with_sasl(cluster: &FlussTestingCluster) {
     let timeout = Duration::from_secs(30);
diff --git a/fluss-rust/crates/fluss/tests/test_fluss.rs b/fluss-rust/crates/fluss/tests/test_fluss.rs
index 967564693e..792b68f00e 100644
--- a/fluss-rust/crates/fluss/tests/test_fluss.rs
+++ b/fluss-rust/crates/fluss/tests/test_fluss.rs
@@ -24,6 +24,7 @@ mod integration {
     mod fluss_cluster;
     mod kv_table;
     mod log_table;
+    mod record_batch_log_reader;
     mod sasl_auth;
 
     mod utils;

From 88f56487a4145821b4839119791eda32bb7a8bb9 Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Tue, 26 May 2026 16:42:56 +0200
Subject: [PATCH 278/287] [metrics] Add scanner poll-timing metrics (#555)

* Add scanner poll timing metrics

* cargo fmt

* improve overlapping polls scenario

* address feedback
---
 .../crates/fluss/src/client/table/scanner.rs  | 287 ++++++++++++++++++
 fluss-rust/crates/fluss/src/metrics.rs        |  48 +++
 .../docs/user-guide/rust/api-reference.md     |   4 +-
 3 files changed, 338 insertions(+), 1 deletion(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 0167af02e2..5fa8bb9220 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -29,6 +29,7 @@ use crate::error::{ApiError, Error, FlussError, Result};
 use crate::metadata::{LogFormat, PhysicalTablePath, RowType, TableBucket, TableInfo, TablePath};
 use crate::metrics::{
     SCANNER_BYTES_PER_REQUEST, SCANNER_FETCH_LATENCY_MS, SCANNER_FETCH_REQUESTS_TOTAL,
+    SCANNER_POLL_IDLE_RATIO, SCANNER_TIME_BETWEEN_POLL_MS,
 };
 use crate::proto::{
     ErrorResponse, FetchLogRequest, FetchLogResponse, PbFetchLogReqForBucket, PbFetchLogReqForTable,
@@ -281,6 +282,64 @@ struct LogScannerInner {
     /// Guards against subscription changes while a
     /// [`crate::client::RecordBatchLogReader`] is iterating.
     reader_active: std::sync::atomic::AtomicBool,
+    /// Holds the snapshot fields used by [`PollGuard`] to derive the
+    /// scanner poll-timing metrics. The mutex makes the state updates
+    /// in `record_poll_start` / `record_poll_end` atomic; metric
+    /// emission and `log::warn!` calls happen after the lock is
+    /// released. The start↔end pairing depends on the single-consumer
+    /// contract documented on [`LogScanner::poll`] and
+    /// [`RecordBatchLogScanner::poll`] (mirrors Java's
+    /// `LogScannerImpl.acquire()`). Overlapping polls on the same
+    /// scanner trip a `debug_assert!` in `record_poll_start` (debug
+    /// builds) or emit a `log::warn!` (release builds).
+    poll_state: Mutex<PollState>,
+}
+
+/// Bookkeeping from which the scanner poll-timing metrics are derived.
+///
+/// `LogScannerInner` keeps this behind a mutex so that each state update
+/// in `record_poll_start` / `record_poll_end` is atomic; metric
+/// emission (`metrics::gauge!(...).set(...)`) and `log::warn!` calls
+/// happen after the lock is released so a user-installed recorder or
+/// logger cannot stall the critical section. The mutex does **not** by
+/// itself preserve start↔end pairing across overlapping `poll()` calls
+/// — that invariant relies on the single-consumer contract that
+/// mirrors Java's `LogScannerImpl.acquire()`. Concurrent polls on the
+/// same scanner are detected by a `debug_assert!` in
+/// `record_poll_start` (panics in debug / tests) and a `log::warn!` on
+/// both anomalous paths (`record_poll_start` sees a stale `Some`;
+/// `record_poll_end` sees `None`) for release-build observability.
+#[derive(Default, Debug)]
+struct PollState {
+    /// Instant captured at the most recent `record_poll_start()`. `None`
+    /// before the first poll.
+    last_poll_at: Option<Instant>,
+    /// Start of the in-flight poll. `None` while no poll is in flight:
+    /// `record_poll_end()` takes the value out again.
+    poll_start_at: Option<Instant>,
+    /// Cached ms between the two most recent poll starts (`0.0` until a
+    /// second poll starts); feeds `poll_idle_ratio` in `record_poll_end`.
+    time_between_poll_ms: f64,
+}
+
+/// RAII pairing of `record_poll_start` with `record_poll_end`: created at
+/// the top of `poll_records` / `poll_batches`, it runs `record_poll_end` on
+/// drop, including the cancellation path (caller drops the future).
+struct PollGuard<'a> {
+    inner: &'a LogScannerInner,
+}
+
+impl<'a> PollGuard<'a> {
+    fn new(inner: &'a LogScannerInner) -> Self {
+        inner.record_poll_start(); // runs before the guard exists: a panic here skips `drop`
+        Self { inner }
+    }
+}
+
+impl Drop for PollGuard<'_> {
+    fn drop(&mut self) {
+        self.inner.record_poll_end(); // also reached when the polling future is dropped
+    }
 }
 
 impl LogScannerInner {
@@ -322,6 +381,7 @@ impl LogScannerInner {
             )?,
             arrow_schema,
             reader_active: std::sync::atomic::AtomicBool::new(false),
+            poll_state: Mutex::new(PollState::default()),
         })
     }
 
@@ -340,6 +400,10 @@ impl LogScannerInner {
     }
 
     async fn poll_records(&self, timeout: Duration) -> Result<ScanRecords> {
+        // Pairs record_poll_start (now) with record_poll_end
+        // (drop). Runs on every exit, including the cancellation path
+        // where the caller drops this future.
+        let _poll_guard = PollGuard::new(self);
         let start = Instant::now();
         let deadline = start + timeout;
 
@@ -378,6 +442,90 @@ impl LogScannerInner {
         }
     }
 
+    /// Marks the beginning of a `poll()` call and publishes
+    /// `SCANNER_TIME_BETWEEN_POLL_MS`: the milliseconds elapsed since the
+    /// previous poll started, or `0.0` for the very first poll. This matches
+    /// Java's `ScannerMetricGroup.recordPollStart`
+    /// (`timeMsBetweenPoll = lastPollMs != 0L ? pollStartMs - lastPollMs : 0L`).
+    ///
+    /// A scanner has a single consumer, so the previous poll must have ended
+    /// before this one starts (Java enforces this in
+    /// `LogScannerImpl.acquire()` with `ConcurrentModificationException`).
+    /// When a previous start is still in flight:
+    /// - debug builds: the `debug_assert!` panics before any state changes,
+    /// - release builds: a `log::warn!` is emitted and the in-flight start is
+    ///   overwritten, so `time_between_poll_ms` / `poll_idle_ratio` are not
+    ///   meaningful until the overlap clears.
+    fn record_poll_start(&self) {
+        let started_at = Instant::now();
+        // Only the state update happens under the lock; the warning and the
+        // gauge are emitted afterwards so a slow logger/recorder cannot hold it.
+        let (overlapping, gap_ms) = {
+            let mut poll_state = self.poll_state.lock();
+            let overlapping = poll_state.poll_start_at.is_some();
+            debug_assert!(
+                !overlapping,
+                "concurrent poll() detected on the same scanner; \
+                 LogScanner / RecordBatchLogScanner are single-consumer \
+                 (see LogScannerImpl.acquire() for Java parity)"
+            );
+            // `replace` stores the new start and hands back the previous one.
+            let previous_start = poll_state.last_poll_at.replace(started_at);
+            let gap_ms = previous_start.map_or(0.0, |previous| {
+                started_at.duration_since(previous).as_secs_f64() * 1000.0
+            });
+            poll_state.time_between_poll_ms = gap_ms;
+            poll_state.poll_start_at = Some(started_at);
+            (overlapping, gap_ms)
+        };
+        if overlapping {
+            warn!(
+                "concurrent poll() detected on scanner; single-consumer \
+                 contract violated, poll-timing metrics will be inaccurate \
+                 until the overlap clears"
+            );
+        }
+        metrics::gauge!(SCANNER_TIME_BETWEEN_POLL_MS).set(gap_ms);
+    }
+
+    /// Marks the end of a `poll()` call and publishes
+    /// `poll_idle_ratio = poll_time / (poll_time + between_time)`.
+    /// On the first poll `between_time` is 0, so the ratio is 1.0; when
+    /// both durations are 0 the gauge is left untouched.
+    ///
+    /// Orphan call: if no matching `record_poll_start` is in flight
+    /// (possible in release builds, where the start-side `debug_assert!`
+    /// is compiled out), a `log::warn!` is emitted and the metric update
+    /// is skipped.
+    fn record_poll_end(&self) {
+        let finished_at = Instant::now();
+        // Under the lock: take the in-flight start and read the cached gap.
+        // The warning and the gauge are emitted after the lock is released
+        // so neither the logger nor the recorder can stall the next poll.
+        let in_flight = {
+            let mut poll_state = self.poll_state.lock();
+            let started_at = poll_state.poll_start_at.take();
+            started_at.map(|start| (start, poll_state.time_between_poll_ms))
+        };
+        let (started_at, gap_ms) = match in_flight {
+            Some(pair) => pair,
+            None => {
+                warn!(
+                    "record_poll_end called without a matching record_poll_start; \
+                     single-consumer contract may have been violated, idle ratio \
+                     for this poll is not emitted"
+                );
+                return;
+            }
+        };
+        let poll_ms = finished_at.duration_since(started_at).as_secs_f64() * 1000.0;
+        let total_ms = poll_ms + gap_ms;
+        // A zero denominator would produce NaN, so the gauge is only set otherwise.
+        if total_ms > 0.0 {
+            metrics::gauge!(SCANNER_POLL_IDLE_RATIO).set(poll_ms / total_ms);
+        }
+    }
+
     async fn subscribe(&self, bucket: i32, offset: i64) -> Result<()> {
         self.check_no_active_reader()?;
         if self.is_partitioned_table {
@@ -520,6 +668,7 @@ impl LogScannerInner {
     }
 
     async fn poll_batches(&self, timeout: Duration) -> Result<Vec<ScanBatch>> {
+        let _poll_guard = PollGuard::new(self);
         let start = Instant::now();
         let deadline = start + timeout;
 
@@ -2232,6 +2381,144 @@ mod tests {
         Ok(())
     }
 
+    /// Builds a self-contained `LogScannerInner` for poll-timing tests
+    /// inside a `current_thread` runtime so callers can drive `PollGuard`
+    /// lifecycles synchronously.
+    fn with_test_log_scanner_inner<F: FnOnce(&LogScannerInner)>(body: F) {
+        let rt = tokio::runtime::Builder::new_current_thread()
+            .enable_all()
+            .build()
+            .expect("build current_thread runtime");
+        rt.block_on(async {
+            let table_path = TablePath::new("db".to_string(), "tbl".to_string());
+            let table_info = build_table_info(table_path.clone(), 1, 1);
+            let cluster = build_cluster_arc(&table_path, 1, 1);
+            let metadata = Arc::new(Metadata::new_for_test(cluster));
+            let inner = LogScannerInner::new(
+                &table_info,
+                metadata,
+                Arc::new(RpcClient::new()),
+                &Config::default(),
+                None,
+            )
+            .expect("build LogScannerInner");
+            body(&inner);
+        });
+    }
+
+    fn snapshot_gauge(
+        snapshotter: &metrics_util::debugging::Snapshotter,
+        name: &str,
+    ) -> Option<f64> {
+        use metrics_util::debugging::DebugValue;
+        snapshotter
+            .snapshot()
+            .into_vec()
+            .into_iter()
+            .find_map(|(key, _, _, val)| {
+                if key.key().name() == name {
+                    if let DebugValue::Gauge(g) = val {
+                        return Some(g.into_inner());
+                    }
+                }
+                None
+            })
+    }
+
+    /// Exercises the `PollGuard` lifecycle across two consecutive
+    /// `record_poll_start` calls. Asserts both poll-timing gauges are
+    /// emitted at the right moments and `record_poll_end` runs on guard
+    /// drop (also the cancellation-safety path, since dropping the
+    /// `poll()` future drops the guard).
+    #[test]
+    fn poll_guard_emits_time_between_poll_and_idle_ratio() {
+        use crate::metrics::{SCANNER_POLL_IDLE_RATIO, SCANNER_TIME_BETWEEN_POLL_MS};
+        use metrics_util::debugging::DebuggingRecorder;
+
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            with_test_log_scanner_inner(|inner| {
+                // First poll: emits time_between_poll_ms=0 (Java parity:
+                // ScannerMetricGroup.recordPollStart emits 0 when there is
+                // no previous poll). Idle ratio is also emitted as 1.0
+                // on drop (poll_time / (poll_time + 0) = 1.0).
+                {
+                    let _g = PollGuard::new(inner);
+                    std::thread::sleep(std::time::Duration::from_millis(5));
+                }
+
+                // Brief gap so time_between_poll_ms is observably > 0.
+                std::thread::sleep(std::time::Duration::from_millis(5));
+
+                // Second poll: refreshes both time_between_poll_ms (>0)
+                // and a fresh idle ratio.
+                {
+                    let _g = PollGuard::new(inner);
+                    std::thread::sleep(std::time::Duration::from_millis(5));
+                }
+            });
+        });
+
+        let between = snapshot_gauge(&snapshotter, SCANNER_TIME_BETWEEN_POLL_MS)
+            .expect("time_between_poll_ms must be emitted on every poll");
+        assert!(
+            between > 0.0,
+            "second-poll time_between_poll_ms must be positive, got {between}"
+        );
+
+        let ratio = snapshot_gauge(&snapshotter, SCANNER_POLL_IDLE_RATIO)
+            .expect("poll_idle_ratio must be emitted on poll end");
+        assert!(
+            (0.0..=1.0).contains(&ratio),
+            "poll_idle_ratio must be in [0, 1], got {ratio}"
+        );
+    }
+
+    /// Java parity: `ScannerMetricGroup.recordPollStart` emits
+    /// `timeMsBetweenPoll = 0` on the very first poll. The Rust gauge
+    /// must do the same so dashboards see the metric series from poll #1.
+    #[test]
+    fn time_between_poll_ms_emits_zero_on_first_poll() {
+        use crate::metrics::SCANNER_TIME_BETWEEN_POLL_MS;
+        use metrics_util::debugging::DebuggingRecorder;
+
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            with_test_log_scanner_inner(|inner| {
+                let _g = PollGuard::new(inner);
+                // Drop at end of scope completes the poll; the value of
+                // SCANNER_TIME_BETWEEN_POLL_MS was emitted at start, not end.
+            });
+        });
+
+        let between = snapshot_gauge(&snapshotter, SCANNER_TIME_BETWEEN_POLL_MS)
+            .expect("time_between_poll_ms must be emitted on the first poll");
+        assert_eq!(
+            between, 0.0,
+            "first-poll time_between_poll_ms must be 0.0 (Java parity), got {between}"
+        );
+    }
+
+    /// Pins the single-consumer contract: overlapping `PollGuard`s on the
+    /// same scanner trip the `debug_assert!` in `record_poll_start`.
+    /// Release builds skip the check, so the test is gated on
+    /// `debug_assertions`.
+    #[cfg(debug_assertions)]
+    #[test]
+    #[should_panic(expected = "concurrent poll() detected")]
+    fn overlapping_polls_panic_in_debug_builds() {
+        with_test_log_scanner_inner(|inner| {
+            let _g1 = PollGuard::new(inner);
+            // _g1 has not been dropped → poll_start_at is still Some,
+            // so the second start must panic.
+            let _g2 = PollGuard::new(inner);
+        });
+    }
+
     /// Drives `handle_fetch_response` against a local metrics recorder and
     /// asserts that latency + bytes-per-request histograms are emitted with
     /// values that mirror what Java would record. This complements the unit
diff --git a/fluss-rust/crates/fluss/src/metrics.rs b/fluss-rust/crates/fluss/src/metrics.rs
index a533abd535..540e991f4e 100644
--- a/fluss-rust/crates/fluss/src/metrics.rs
+++ b/fluss-rust/crates/fluss/src/metrics.rs
@@ -49,6 +49,34 @@ pub const CLIENT_BYTES_RECEIVED_TOTAL: &str = "fluss.client.bytes_received.total
 pub const CLIENT_REQUEST_LATENCY_MS: &str = "fluss.client.request_latency_ms";
 pub const CLIENT_REQUESTS_IN_FLIGHT: &str = "fluss.client.requests_in_flight";
 
+// ---------------------------------------------------------------------------
+// Scanner poll-timing metrics
+//
+// Java reference: ScannerMetricGroup.java, LogScannerImpl.java
+//
+// These track consumer liveness and processing efficiency at the `poll()`
+// boundary. Java records via `volatile long` fields read by gauge suppliers;
+// Rust snapshots the values at poll start/end.
+//
+// Java's `lastPollSecondsAgo` gauge is intentionally NOT ported. Java
+// implements it as a gauge supplier evaluated at scrape time, which the
+// `metrics` crate facade has no equivalent for. A snapshot-at-poll-start
+// port would just duplicate `time_between_poll_ms / 1000` and would not
+// advance while a consumer is hung — defeating the metric's purpose
+// (detecting a stuck consumer). Revisit if the `metrics` crate gains a
+// supplier abstraction or we add a background liveness task.
+// ---------------------------------------------------------------------------
+
+/// Gauge: milliseconds between the start of consecutive `poll()` calls. A
+/// large value usually means the consumer's downstream processing is slow.
+pub const SCANNER_TIME_BETWEEN_POLL_MS: &str = "fluss.client.scanner.time_between_poll_ms";
+
+/// Gauge: fraction of wall-clock time spent inside `poll()` —
+/// `poll_time_ms / (poll_time_ms + time_between_poll_ms)`. A value near 1.0
+/// means the scanner is starved for data; a low value means the consumer is
+/// the bottleneck.
+pub const SCANNER_POLL_IDLE_RATIO: &str = "fluss.client.scanner.poll_idle_ratio";
+
 // ---------------------------------------------------------------------------
 // Scanner fetch + remote download metrics
 //
@@ -305,6 +333,26 @@ mod tests {
         assert_eq!(counter_by_api_key.get("fetch_log"), Some(&3));
     }
 
+    #[test]
+    fn scanner_poll_timing_metrics_emit_correctly() {
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            metrics::gauge!(SCANNER_TIME_BETWEEN_POLL_MS).set(200.0);
+            metrics::gauge!(SCANNER_POLL_IDLE_RATIO).set(0.8);
+        });
+
+        let snapshot = snapshotter.snapshot();
+        let entries: Vec<_> = snapshot.into_vec();
+
+        assert_eq!(
+            find_gauge!(entries, SCANNER_TIME_BETWEEN_POLL_MS),
+            Some(200.0)
+        );
+        assert_eq!(find_gauge!(entries, SCANNER_POLL_IDLE_RATIO), Some(0.8));
+    }
+
     #[test]
     fn scanner_fetch_metrics_emit_correctly() {
         let recorder = DebuggingRecorder::new();
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 52999e8cda..3f94841e4a 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -139,6 +139,8 @@ Complete API reference for the Fluss Rust client.
 
 ## `LogScanner`
 
+Single-consumer: do not call `poll` concurrently on the same scanner (e.g. from `tokio::join!` or two tasks sharing an `Arc`). Mirrors Java's `LogScannerImpl.acquire()` guard. Debug builds surface overlapping calls via a `debug_assert!`; release builds skip the check for performance and produce skewed poll-timing metrics (`fluss.client.scanner.time_between_poll_ms`, `fluss.client.scanner.poll_idle_ratio`) if the contract is violated.
+
 | Method                                                                                                    | Description                                              |
 |-----------------------------------------------------------------------------------------------------------|----------------------------------------------------------|
 | `async fn subscribe(&self, bucket_id: i32, start_offset: i64) -> Result<()>`                              | Subscribe to a bucket                                    |
@@ -151,7 +153,7 @@ Complete API reference for the Fluss Rust client.
 
 ## `RecordBatchLogScanner`
 
-Overlapping `poll` calls on clones that share state, or `poll` concurrent with `RecordBatchLogReader::next_batch`, are not supported. Use one active polling/consumption call at a time per underlying scanner state.
+Single-consumer: overlapping `poll` calls on handles that share state, or `poll` concurrent with `RecordBatchLogReader::next_batch`, are not supported — use one active polling/consumption call at a time per underlying scanner state. Mirrors Java's `LogScannerImpl.acquire()` guard. Debug builds surface overlapping calls via a `debug_assert!`; release builds skip the check for performance and produce skewed poll-timing metrics (`fluss.client.scanner.time_between_poll_ms`, `fluss.client.scanner.poll_idle_ratio`) if the contract is violated.
 
 | Method                                                                                                    | Description                                              |
 |-----------------------------------------------------------------------------------------------------------|----------------------------------------------------------|

From 5a472b24c17eb982a27bc71fd6ce98cb2e98ec87 Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Tue, 26 May 2026 23:11:17 +0200
Subject: [PATCH 279/287] feat: [metrics] Add database and table labels for
 scanner metrics (#565)

* add database and table label to scanner metrics

* revert dropped comments

* revert dropped comments

* refactor to avoid repeated clones

* optimize tests
---
 .../fluss/src/client/table/remote_log.rs      |  50 ++--
 .../crates/fluss/src/client/table/scanner.rs  |  58 ++++-
 fluss-rust/crates/fluss/src/metrics.rs        | 228 +++++++++++++++++-
 fluss-rust/crates/fluss/src/test_utils.rs     |  57 +++++
 .../docs/user-guide/rust/api-reference.md     |   2 +
 5 files changed, 359 insertions(+), 36 deletions(-)

diff --git a/fluss-rust/crates/fluss/src/client/table/remote_log.rs b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
index 8957aced14..c48bdccabf 100644
--- a/fluss-rust/crates/fluss/src/client/table/remote_log.rs
+++ b/fluss-rust/crates/fluss/src/client/table/remote_log.rs
@@ -18,10 +18,7 @@ use crate::client::credentials::CredentialsReceiver;
 use crate::error::{Error, Result};
 use crate::io::{FileIO, Storage};
 use crate::metadata::TableBucket;
-use crate::metrics::{
-    SCANNER_REMOTE_FETCH_BYTES_TOTAL, SCANNER_REMOTE_FETCH_ERRORS_TOTAL,
-    SCANNER_REMOTE_FETCH_REQUESTS_TOTAL,
-};
+use crate::metrics::ScannerMetrics;
 use crate::proto::{PbRemoteLogFetchInfo, PbRemoteLogSegment};
 use futures::TryStreamExt;
 use parking_lot::Mutex;
@@ -394,6 +391,10 @@ struct DownloadCoordinator {
     max_concurrent_downloads: usize,
     recycle_notify: Arc<Notify>,
     fetcher: Arc<dyn RemoteLogFetcher>,
+    /// Per-table scanner metric handles cloned by every spawned download
+    /// task to attribute remote-fetch metrics to the owning scanner's
+    /// `(database, table)`.
+    metrics: Arc<ScannerMetrics>,
 }
 
 impl DownloadCoordinator {
@@ -462,10 +463,11 @@ impl DownloadCoordinator {
             // Clone data for the spawned task
             let fetcher = self.fetcher.clone();
             let recycle_notify = self.recycle_notify.clone();
+            let metrics = Arc::clone(&self.metrics);
 
             // Spawn download task
             self.active_downloads.spawn(async move {
-                spawn_download_task(request, permit, fetcher, recycle_notify).await
+                spawn_download_task(request, permit, fetcher, recycle_notify, metrics).await
             });
             self.in_flight += 1;
         }
@@ -491,6 +493,7 @@ async fn spawn_download_task(
     permit: tokio::sync::OwnedSemaphorePermit,
     fetcher: Arc<dyn RemoteLogFetcher>,
     recycle_notify: Arc<Notify>,
+    metrics: Arc<ScannerMetrics>,
 ) -> DownloadResult {
     // Check if receiver still alive (early cancellation check)
     if request.result_sender.is_closed() {
@@ -501,7 +504,7 @@ async fn spawn_download_task(
     // Java reference: RemoteLogDownloader.java increments `remoteFetchRequestCount`
     // immediately before initiating the download. Each retry of the same segment
     // counts as a separate request (matches Java behavior).
-    metrics::counter!(SCANNER_REMOTE_FETCH_REQUESTS_TOTAL).increment(1);
+    metrics.record_remote_fetch_request();
 
     // Try download ONCE
     let download_result = fetcher.fetch(&request).await;
@@ -509,8 +512,7 @@ async fn spawn_download_task(
     match download_result {
         Ok(fetch_result) => {
             // Success - permit will be released on drop (FileSource handles file deletion)
-            metrics::counter!(SCANNER_REMOTE_FETCH_BYTES_TOTAL)
-                .increment(fetch_result.file_size as u64);
+            metrics.record_remote_fetch_bytes(fetch_result.file_size as u64);
             DownloadResult::Success {
                 result: RemoteLogFile {
                     file_path: fetch_result.file_path,
@@ -528,7 +530,7 @@ async fn spawn_download_task(
         Err(e) => {
             // Download failed - check if we should retry or give up
             // Counted per attempt, so retries each contribute one error.
-            metrics::counter!(SCANNER_REMOTE_FETCH_ERRORS_TOTAL).increment(1);
+            metrics.record_remote_fetch_error();
             let retry_count = request.retry_count + 1;
 
             if retry_count > MAX_RETRY_COUNT {
@@ -781,12 +783,13 @@ pub struct RemoteLogDownloader {
 }
 
 impl RemoteLogDownloader {
-    pub fn new(
+    pub(crate) fn new(
         local_log_dir: TempDir,
         max_prefetch_segments: usize,
         max_concurrent_downloads: usize,
         remote_log_read_concurrency: usize,
         credentials_rx: CredentialsReceiver,
+        metrics: Arc<ScannerMetrics>,
     ) -> Result<Self> {
         let fetcher = Arc::new(ProductionFetcher {
             credentials_rx,
@@ -794,14 +797,20 @@ impl RemoteLogDownloader {
             remote_log_read_concurrency,
         });
 
-        Self::new_with_fetcher(fetcher, max_prefetch_segments, max_concurrent_downloads)
+        Self::new_with_fetcher(
+            fetcher,
+            max_prefetch_segments,
+            max_concurrent_downloads,
+            metrics,
+        )
     }
 
     /// Create a RemoteLogDownloader with a custom fetcher (for testing).
-    pub fn new_with_fetcher(
+    pub(crate) fn new_with_fetcher(
         fetcher: Arc<dyn RemoteLogFetcher>,
         max_prefetch_segments: usize,
         max_concurrent_downloads: usize,
+        metrics: Arc<ScannerMetrics>,
     ) -> Result<Self> {
         let (request_sender, request_receiver) = mpsc::unbounded_channel();
 
@@ -813,6 +822,7 @@ impl RemoteLogDownloader {
             max_concurrent_downloads,
             recycle_notify: Arc::new(Notify::new()),
             fetcher,
+            metrics,
         };
 
         // Spawn coordinator task - it will exit when request_sender is dropped
@@ -976,6 +986,8 @@ impl RemoteLogDownloader {
 #[cfg(test)]
 mod tests {
     use super::*;
+    use crate::metadata::TablePath;
+    use crate::test_utils::test_scanner_metrics;
     use std::sync::atomic::{AtomicUsize, Ordering};
 
     /// Helper function to create a TableBucket for testing
@@ -983,6 +995,14 @@ mod tests {
         TableBucket::new(table_id, bucket_id)
     }
 
+    /// `ScannerMetrics` instance shared across the local test fixtures. The
+    /// labels are arbitrary because none of the tests in this module install
+    /// a metrics recorder; the metrics just need to exist for the API
+    /// surface.
+    fn metrics() -> Arc<ScannerMetrics> {
+        test_scanner_metrics(&TablePath::new("db", "tbl"))
+    }
+
     /// Simplified fake fetcher for testing
     struct FakeFetcher {
         completion_gate: Arc<Notify>,
@@ -1172,6 +1192,7 @@ mod tests {
             fake_fetcher.clone(),
             10, // High prefetch limit
             2,  // Max concurrent downloads = 2
+            metrics(),
         )
         .unwrap();
 
@@ -1219,6 +1240,7 @@ mod tests {
             fake_fetcher,
             2,  // Max prefetch = 2
             10, // High concurrent limit
+            metrics(),
         )
         .unwrap();
 
@@ -1278,7 +1300,7 @@ mod tests {
         let fake_fetcher = Arc::new(FakeFetcher::new(2, true)); // Fail twice, succeed third time
 
         let downloader =
-            RemoteLogDownloader::new_with_fetcher(fake_fetcher.clone(), 10, 1).unwrap();
+            RemoteLogDownloader::new_with_fetcher(fake_fetcher.clone(), 10, 1, metrics()).unwrap();
 
         let bucket = create_table_bucket(1, 0);
         let seg = create_segment("seg1", 0, 1000, bucket);
@@ -1303,7 +1325,7 @@ mod tests {
         let seg2 = create_segment("seg2", 100, 1000, create_table_bucket(1, 0));
         let fake_fetcher2 = Arc::new(FakeFetcher::new(100, true)); // Fail forever
         let downloader2 =
-            RemoteLogDownloader::new_with_fetcher(fake_fetcher2.clone(), 10, 1).unwrap();
+            RemoteLogDownloader::new_with_fetcher(fake_fetcher2.clone(), 10, 1, metrics()).unwrap();
 
         let future2 = downloader2.request_remote_log("dir", &seg2);
         tokio::time::sleep(Duration::from_millis(50)).await;
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 5fa8bb9220..d7e2dd2c71 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -27,10 +27,7 @@ use crate::config::Config;
 use crate::error::Error::UnsupportedOperation;
 use crate::error::{ApiError, Error, FlussError, Result};
 use crate::metadata::{LogFormat, PhysicalTablePath, RowType, TableBucket, TableInfo, TablePath};
-use crate::metrics::{
-    SCANNER_BYTES_PER_REQUEST, SCANNER_FETCH_LATENCY_MS, SCANNER_FETCH_REQUESTS_TOTAL,
-    SCANNER_POLL_IDLE_RATIO, SCANNER_TIME_BETWEEN_POLL_MS,
-};
+use crate::metrics::ScannerMetrics;
 use crate::proto::{
     ErrorResponse, FetchLogRequest, FetchLogResponse, PbFetchLogReqForBucket, PbFetchLogReqForTable,
 };
@@ -293,6 +290,9 @@ struct LogScannerInner {
     /// scanner trip a `debug_assert!` in `record_poll_start` (debug
     /// builds) or emit a `log::warn!` (release builds).
     poll_state: Mutex<PollState>,
+    /// Per-table scanner metric handles, pre-bound with `database`/`table`
+    /// labels.
+    metrics: Arc<ScannerMetrics>,
 }
 
 /// Snapshot state used to derive the scanner poll-timing metrics.
@@ -365,6 +365,7 @@ impl LogScannerInner {
             None => to_arrow_schema(full_row_type)?,
         };
 
+        let metrics = Arc::new(ScannerMetrics::new(&table_info.table_path));
         Ok(Self {
             table_path: table_info.table_path.clone(),
             table_id: table_info.table_id,
@@ -378,10 +379,12 @@ impl LogScannerInner {
                 log_scanner_status.clone(),
                 config,
                 projected_fields,
+                Arc::clone(&metrics),
             )?,
             arrow_schema,
             reader_active: std::sync::atomic::AtomicBool::new(false),
             poll_state: Mutex::new(PollState::default()),
+            metrics,
         })
     }
 
@@ -485,7 +488,7 @@ impl LogScannerInner {
                  until the overlap clears"
             );
         }
-        metrics::gauge!(SCANNER_TIME_BETWEEN_POLL_MS).set(between_ms);
+        self.metrics.record_time_between_poll_ms(between_ms);
     }
 
     /// Computes `poll_idle_ratio = poll_time / (poll_time + between_time)`.
@@ -522,7 +525,7 @@ impl LogScannerInner {
             return;
         }
         if let Some(r) = ratio {
-            metrics::gauge!(SCANNER_POLL_IDLE_RATIO).set(r);
+            self.metrics.record_poll_idle_ratio(r);
         }
     }
 
@@ -918,6 +921,9 @@ struct LogFetcher {
     security_token_manager: Arc<SecurityTokenManager>,
     log_fetch_buffer: Arc<LogFetchBuffer>,
     nodes_with_pending_fetch_requests: Arc<Mutex<HashSet<i32>>>,
+    /// Per-table scanner metric handles shared with the owning
+    /// `LogScannerInner` and `RemoteLogDownloader`.
+    metrics: Arc<ScannerMetrics>,
     max_poll_records: usize,
     fetch_max_bytes: i32,
     fetch_min_bytes: i32,
@@ -932,6 +938,8 @@ struct FetchResponseContext {
     read_context: ReadContext,
     remote_read_context: ReadContext,
     remote_log_downloader: Arc<RemoteLogDownloader>,
+    /// Per-table scanner metric handles for `scanner.fetch_*` recording.
+    metrics: Arc<ScannerMetrics>,
     /// `Instant` captured immediately before the FetchLog RPC; used to compute
     /// `scanner.fetch_latency_ms` on a successful response.
     request_start_time: Instant,
@@ -945,6 +953,7 @@ impl LogFetcher {
         log_scanner_status: Arc<LogScannerStatus>,
         config: &Config,
         projected_fields: Option<Vec<usize>>,
+        metrics: Arc<ScannerMetrics>,
     ) -> Result<Self> {
         let full_row_type = table_info.get_row_type();
         let full_arrow_schema = to_arrow_schema(full_row_type)?;
@@ -988,6 +997,7 @@ impl LogFetcher {
             config.remote_file_download_thread_num,
             config.scanner_remote_log_read_concurrency,
             credentials_rx,
+            Arc::clone(&metrics),
         )?);
 
         // Start the background token refresh task
@@ -1005,6 +1015,7 @@ impl LogFetcher {
             security_token_manager,
             log_fetch_buffer,
             nodes_with_pending_fetch_requests: Arc::new(Mutex::new(HashSet::new())),
+            metrics,
             max_poll_records: config.scanner_log_max_poll_records,
             fetch_max_bytes: config.scanner_log_fetch_max_bytes,
             fetch_min_bytes: config.scanner_log_fetch_min_bytes,
@@ -1177,6 +1188,7 @@ impl LogFetcher {
             let remote_log_downloader = Arc::clone(&self.remote_log_downloader);
             let nodes_with_pending = self.nodes_with_pending_fetch_requests.clone();
             let metadata = self.metadata.clone();
+            let metrics = Arc::clone(&self.metrics);
             // Spawn async task to handle the fetch request
             // Note: These tasks are not explicitly tracked or cancelled when LogFetcher is dropped.
             // This is acceptable because:
@@ -1211,7 +1223,7 @@ impl LogFetcher {
                 // Java increment the fetch counter and capture `requestStartTime` immediately
                 // before the RPC. Failed connection acquisition above is not counted.
                 let request_start_time = Instant::now();
-                metrics::counter!(SCANNER_FETCH_REQUESTS_TOTAL).increment(1);
+                metrics.record_fetch_request();
 
                 let fetch_response = match con
                     .request(message::FetchLogRequest::new(fetch_request.clone()))
@@ -1237,6 +1249,7 @@ impl LogFetcher {
                     read_context,
                     remote_read_context,
                     remote_log_downloader,
+                    metrics,
                     request_start_time,
                 };
                 Self::handle_fetch_response(fetch_response, response_context).await;
@@ -1267,6 +1280,7 @@ impl LogFetcher {
             read_context,
             remote_read_context,
             remote_log_downloader,
+            metrics,
             request_start_time,
         } = context;
 
@@ -1274,9 +1288,8 @@ impl LogFetcher {
         // both report the serialized API message body size, excluding protocol
         // headers and framing. Recorded unconditionally (including zero-record
         // responses) to match Java's histogram semantics.
-        metrics::histogram!(SCANNER_FETCH_LATENCY_MS)
-            .record(request_start_time.elapsed().as_secs_f64() * 1000.0);
-        metrics::histogram!(SCANNER_BYTES_PER_REQUEST).record(fetch_response.encoded_len() as f64);
+        metrics.record_fetch_latency_ms(request_start_time.elapsed().as_secs_f64() * 1000.0);
+        metrics.record_bytes_per_request(fetch_response.encoded_len() as f64);
 
         for pb_fetch_log_resp in fetch_response.tables_resp {
             let table_id = pb_fetch_log_resp.table_id;
@@ -2046,7 +2059,9 @@ mod tests {
     use crate::record::MemoryLogRecordsArrowBuilder;
     use crate::row::{Datum, GenericRow};
     use crate::rpc::FlussError;
-    use crate::test_utils::{build_cluster_arc, build_table_info};
+    use crate::test_utils::{
+        assert_scanner_entries_labeled, build_cluster_arc, build_table_info, test_scanner_metrics,
+    };
 
     fn build_records(table_info: &TableInfo, table_path: Arc<TablePath>) -> Result<Vec<u8>> {
         let mut builder = MemoryLogRecordsArrowBuilder::new(
@@ -2084,6 +2099,7 @@ mod tests {
             status.clone(),
             &Config::default(),
             None,
+            test_scanner_metrics(&table_path),
         )?;
 
         let bucket = TableBucket::new(1, 0);
@@ -2117,6 +2133,7 @@ mod tests {
             status,
             &Config::default(),
             None,
+            test_scanner_metrics(&table_path),
         )?;
 
         let bucket = TableBucket::new(1, 0);
@@ -2154,6 +2171,7 @@ mod tests {
             status,
             &Config::default(),
             None,
+            test_scanner_metrics(&table_path),
         )?;
 
         fetcher.nodes_with_pending_fetch_requests.lock().insert(1);
@@ -2178,6 +2196,7 @@ mod tests {
             status.clone(),
             &Config::default(),
             None,
+            test_scanner_metrics(&table_path),
         )?;
 
         let response = FetchLogResponse {
@@ -2203,6 +2222,7 @@ mod tests {
             read_context: fetcher.read_context.clone(),
             remote_read_context: fetcher.remote_read_context.clone(),
             remote_log_downloader: fetcher.remote_log_downloader.clone(),
+            metrics: Arc::clone(&fetcher.metrics),
             request_start_time: Instant::now(),
         };
 
@@ -2229,6 +2249,7 @@ mod tests {
             status.clone(),
             &Config::default(),
             None,
+            test_scanner_metrics(&table_path),
         )?;
 
         let bucket = TableBucket::new(1, 0);
@@ -2257,6 +2278,7 @@ mod tests {
             read_context: fetcher.read_context.clone(),
             remote_read_context: fetcher.remote_read_context.clone(),
             remote_log_downloader: fetcher.remote_log_downloader.clone(),
+            metrics: Arc::clone(&fetcher.metrics),
             request_start_time: Instant::now(),
         };
 
@@ -2361,6 +2383,7 @@ mod tests {
             status,
             &config,
             None,
+            test_scanner_metrics(&table_path),
         )?;
 
         let requests = fetcher.prepare_fetch_log_requests().await;
@@ -2474,6 +2497,10 @@ mod tests {
             (0.0..=1.0).contains(&ratio),
             "poll_idle_ratio must be in [0, 1], got {ratio}"
         );
+
+        // Both gauges must carry `database=db` / `table=tbl` (the fixture
+        // values from `with_test_log_scanner_inner`).
+        assert_scanner_entries_labeled(&snapshotter.snapshot().into_vec(), "db", "tbl");
     }
 
     /// Java parity: `ScannerMetricGroup.recordPollStart` emits
@@ -2501,6 +2528,7 @@ mod tests {
             between, 0.0,
             "first-poll time_between_poll_ms must be 0.0 (Java parity), got {between}"
         );
+        assert_scanner_entries_labeled(&snapshotter.snapshot().into_vec(), "db", "tbl");
     }
 
     /// Pins the single-consumer contract: overlapping `PollGuard`s on the
@@ -2560,6 +2588,7 @@ mod tests {
                     status,
                     &Config::default(),
                     None,
+                    test_scanner_metrics(&table_path),
                 )
                 .expect("build LogFetcher");
 
@@ -2586,6 +2615,7 @@ mod tests {
                     read_context: fetcher.read_context.clone(),
                     remote_read_context: fetcher.remote_read_context.clone(),
                     remote_log_downloader: fetcher.remote_log_downloader.clone(),
+                    metrics: Arc::clone(&fetcher.metrics),
                     request_start_time: Instant::now(),
                 };
 
@@ -2623,5 +2653,11 @@ mod tests {
             vec![expected_bytes],
             "bytes histogram must record encoded_len() for parity with Java fetchLogResponse.totalSize()",
         );
+
+        // Every emitted scanner metric must carry both `database` and `table`
+        // labels — that's the whole point of `ScannerMetrics`. If a future
+        // contributor adds a new `metrics::*!` macro inline (bypassing
+        // `ScannerMetrics`), this assertion catches it.
+        assert_scanner_entries_labeled(&entries, "db", "tbl");
     }
 }
diff --git a/fluss-rust/crates/fluss/src/metrics.rs b/fluss-rust/crates/fluss/src/metrics.rs
index 540e991f4e..7c62738c4e 100644
--- a/fluss-rust/crates/fluss/src/metrics.rs
+++ b/fluss-rust/crates/fluss/src/metrics.rs
@@ -22,6 +22,7 @@
 //! recorder (e.g. `metrics-exporter-prometheus`) to collect them. When no
 //! recorder is installed, all metric calls are no-ops with zero overhead.
 
+use crate::metadata::TablePath;
 use crate::rpc::ApiKey;
 
 // ---------------------------------------------------------------------------
@@ -30,6 +31,10 @@ use crate::rpc::ApiKey;
 
 pub const LABEL_API_KEY: &str = "api_key";
 
+/// Identifies the database and table for per-table scanner metrics.
+pub const LABEL_DATABASE: &str = "database";
+pub const LABEL_TABLE: &str = "table";
+
 // ---------------------------------------------------------------------------
 // Connection / RPC metrics
 //
@@ -89,9 +94,9 @@ pub const SCANNER_POLL_IDLE_RATIO: &str = "fluss.client.scanner.poll_idle_ratio"
 // and counters for throughput; the recorder/exporter handles rate
 // computation (e.g. Prometheus `rate()`).
 //
-// Java emits one `ScannerMetricGroup` per (database, table). Rust currently
-// emits without per-table labels — adding `database`/`table` labels is
-// tracked separately and intentionally deferred to keep this PR minimal.
+// Java emits one `ScannerMetricGroup` per (database, table); Rust matches
+// that by attaching `database` + `table` labels to every scanner metric
+// (see `ScannerMetrics` below).
 // ---------------------------------------------------------------------------
 
 /// Histogram: elapsed ms for each successful FetchLog RPC.
@@ -114,6 +119,130 @@ pub const SCANNER_REMOTE_FETCH_BYTES_TOTAL: &str = "fluss.client.scanner.remote_
 pub const SCANNER_REMOTE_FETCH_ERRORS_TOTAL: &str =
     "fluss.client.scanner.remote_fetch_errors.total";
 
+// ---------------------------------------------------------------------------
+// Per-table scanner metric handles
+// ---------------------------------------------------------------------------
+
+/// Cached `(database, table)`-labeled scanner metric handles.
+///
+/// Adding a new scanner metric: declare the constant above, add one
+/// field plus an initializer line in [`Self::new`] using the matching
+/// `scanner_{gauge,counter,histogram}` helper, and a `record_*` method.
+/// The helpers are the single source of truth for the label set, so a
+/// future label addition (e.g. `cluster_id`) is a one-line change.
+///
+/// # Recorder binding
+///
+/// `metrics::counter!(...)` / `gauge!(...)` / `histogram!(...)` resolve
+/// the recorder at the macro callsite. Because this struct caches the
+/// returned handles, every cached handle is bound to whichever recorder
+/// is installed when [`Self::new`] runs. Construct the scanner *after*
+/// installing the production recorder; in tests, construct it inside
+/// the `metrics::with_local_recorder(...)` closure. With no recorder
+/// installed, all `record_*` calls are zero-overhead no-ops.
+pub(crate) struct ScannerMetrics {
+    time_between_poll_ms: metrics::Gauge,
+    poll_idle_ratio: metrics::Gauge,
+    fetch_requests_total: metrics::Counter,
+    fetch_latency_ms: metrics::Histogram,
+    bytes_per_request: metrics::Histogram,
+    remote_fetch_requests_total: metrics::Counter,
+    remote_fetch_bytes_total: metrics::Counter,
+    remote_fetch_errors_total: metrics::Counter,
+}
+
+impl ScannerMetrics {
+    /// Build a fresh handle cache for `table_path`. Resolves the
+    /// currently installed recorder once per metric.
+    pub(crate) fn new(table_path: &TablePath) -> Self {
+        let database = table_path.database();
+        let table = table_path.table();
+        Self {
+            time_between_poll_ms: scanner_gauge(SCANNER_TIME_BETWEEN_POLL_MS, database, table),
+            poll_idle_ratio: scanner_gauge(SCANNER_POLL_IDLE_RATIO, database, table),
+            fetch_requests_total: scanner_counter(SCANNER_FETCH_REQUESTS_TOTAL, database, table),
+            fetch_latency_ms: scanner_histogram(SCANNER_FETCH_LATENCY_MS, database, table),
+            bytes_per_request: scanner_histogram(SCANNER_BYTES_PER_REQUEST, database, table),
+            remote_fetch_requests_total: scanner_counter(
+                SCANNER_REMOTE_FETCH_REQUESTS_TOTAL,
+                database,
+                table,
+            ),
+            remote_fetch_bytes_total: scanner_counter(
+                SCANNER_REMOTE_FETCH_BYTES_TOTAL,
+                database,
+                table,
+            ),
+            remote_fetch_errors_total: scanner_counter(
+                SCANNER_REMOTE_FETCH_ERRORS_TOTAL,
+                database,
+                table,
+            ),
+        }
+    }
+
+    pub(crate) fn record_time_between_poll_ms(&self, value: f64) {
+        self.time_between_poll_ms.set(value);
+    }
+
+    pub(crate) fn record_poll_idle_ratio(&self, value: f64) {
+        self.poll_idle_ratio.set(value);
+    }
+
+    pub(crate) fn record_fetch_request(&self) {
+        self.fetch_requests_total.increment(1);
+    }
+
+    pub(crate) fn record_fetch_latency_ms(&self, value: f64) {
+        self.fetch_latency_ms.record(value);
+    }
+
+    pub(crate) fn record_bytes_per_request(&self, value: f64) {
+        self.bytes_per_request.record(value);
+    }
+
+    pub(crate) fn record_remote_fetch_request(&self) {
+        self.remote_fetch_requests_total.increment(1);
+    }
+
+    pub(crate) fn record_remote_fetch_bytes(&self, bytes: u64) {
+        self.remote_fetch_bytes_total.increment(bytes);
+    }
+
+    pub(crate) fn record_remote_fetch_error(&self) {
+        self.remote_fetch_errors_total.increment(1);
+    }
+}
+
+// Per-table scanner handle factories. These centralize the
+// `(database, table)` label set so a future schema change (renaming a
+// label, adding `cluster_id`, etc.) is a one-line edit instead of
+// touching every callsite in `ScannerMetrics::new`.
+
+fn scanner_gauge(name: &'static str, database: &str, table: &str) -> metrics::Gauge {
+    metrics::gauge!(
+        name,
+        LABEL_DATABASE => database.to_string(),
+        LABEL_TABLE => table.to_string(),
+    )
+}
+
+fn scanner_counter(name: &'static str, database: &str, table: &str) -> metrics::Counter {
+    metrics::counter!(
+        name,
+        LABEL_DATABASE => database.to_string(),
+        LABEL_TABLE => table.to_string(),
+    )
+}
+
+fn scanner_histogram(name: &'static str, database: &str, table: &str) -> metrics::Histogram {
+    metrics::histogram!(
+        name,
+        LABEL_DATABASE => database.to_string(),
+        LABEL_TABLE => table.to_string(),
+    )
+}
+
 /// Returns a label value for reportable API keys, matching Java's
 /// `ConnectionMetrics.REPORT_API_KEYS` filter (`ProduceLog`, `FetchLog`,
 /// `PutKv`, `Lookup`). Returns `None` for admin/metadata/auth calls to
@@ -131,6 +260,7 @@ pub(crate) fn api_key_label(api_key: ApiKey) -> Option<&'static str> {
 #[cfg(test)]
 mod tests {
     use super::*;
+    use crate::test_utils::assert_scanner_entries_labeled;
     use metrics_util::debugging::DebuggingRecorder;
 
     macro_rules! find_counter {
@@ -339,8 +469,10 @@ mod tests {
         let snapshotter = recorder.snapshotter();
 
         metrics::with_local_recorder(&recorder, || {
-            metrics::gauge!(SCANNER_TIME_BETWEEN_POLL_MS).set(200.0);
-            metrics::gauge!(SCANNER_POLL_IDLE_RATIO).set(0.8);
+            let table_path = TablePath::new("db", "tbl");
+            let m = ScannerMetrics::new(&table_path);
+            m.record_time_between_poll_ms(200.0);
+            m.record_poll_idle_ratio(0.8);
         });
 
         let snapshot = snapshotter.snapshot();
@@ -351,6 +483,7 @@ mod tests {
             Some(200.0)
         );
         assert_eq!(find_gauge!(entries, SCANNER_POLL_IDLE_RATIO), Some(0.8));
+        assert_scanner_entries_labeled(&entries, "db", "tbl");
     }
 
     #[test]
@@ -359,9 +492,11 @@ mod tests {
         let snapshotter = recorder.snapshotter();
 
         metrics::with_local_recorder(&recorder, || {
-            metrics::counter!(SCANNER_FETCH_REQUESTS_TOTAL).increment(1);
-            metrics::histogram!(SCANNER_FETCH_LATENCY_MS).record(15.5);
-            metrics::histogram!(SCANNER_BYTES_PER_REQUEST).record(4096.0);
+            let table_path = TablePath::new("db", "tbl");
+            let m = ScannerMetrics::new(&table_path);
+            m.record_fetch_request();
+            m.record_fetch_latency_ms(15.5);
+            m.record_bytes_per_request(4096.0);
         });
 
         let snapshot = snapshotter.snapshot();
@@ -379,6 +514,7 @@ mod tests {
             find_histogram!(entries, SCANNER_BYTES_PER_REQUEST),
             Some(vec![4096.0])
         );
+        assert_scanner_entries_labeled(&entries, "db", "tbl");
     }
 
     #[test]
@@ -387,9 +523,13 @@ mod tests {
         let snapshotter = recorder.snapshotter();
 
         metrics::with_local_recorder(&recorder, || {
-            metrics::counter!(SCANNER_REMOTE_FETCH_REQUESTS_TOTAL).increment(3);
-            metrics::counter!(SCANNER_REMOTE_FETCH_BYTES_TOTAL).increment(1024);
-            metrics::counter!(SCANNER_REMOTE_FETCH_ERRORS_TOTAL).increment(1);
+            let table_path = TablePath::new("db", "tbl");
+            let m = ScannerMetrics::new(&table_path);
+            m.record_remote_fetch_request();
+            m.record_remote_fetch_request();
+            m.record_remote_fetch_request();
+            m.record_remote_fetch_bytes(1024);
+            m.record_remote_fetch_error();
         });
 
         let snapshot = snapshotter.snapshot();
@@ -407,5 +547,71 @@ mod tests {
             find_counter!(entries, SCANNER_REMOTE_FETCH_ERRORS_TOTAL),
             Some(1)
         );
+        assert_scanner_entries_labeled(&entries, "db", "tbl");
+    }
+
+    /// Two scanners on different tables must produce independent metric
+    /// series.
+    #[test]
+    fn different_table_paths_produce_separate_metric_series() {
+        use std::collections::HashMap;
+
+        let recorder = DebuggingRecorder::new();
+        let snapshotter = recorder.snapshotter();
+
+        metrics::with_local_recorder(&recorder, || {
+            let m1 = ScannerMetrics::new(&TablePath::new("db1", "t1"));
+            let m2 = ScannerMetrics::new(&TablePath::new("db2", "t2"));
+
+            for _ in 0..5 {
+                m1.record_fetch_request();
+            }
+            for _ in 0..3 {
+                m2.record_fetch_request();
+            }
+        });
+
+        let snapshot = snapshotter.snapshot();
+        let entries: Vec<_> = snapshot.into_vec();
+
+        let request_entries: Vec<_> = entries
+            .iter()
+            .filter(|(key, _, _, _)| key.key().name() == SCANNER_FETCH_REQUESTS_TOTAL)
+            .collect();
+
+        assert_eq!(
+            request_entries.len(),
+            2,
+            "(db1,t1) and (db2,t2) must be separate metric series"
+        );
+
+        let mut counter_by_table: HashMap<(String, String), u64> = HashMap::new();
+        for (key, _, _, val) in request_entries {
+            let mut database = None;
+            let mut table = None;
+            for label in key.key().labels() {
+                if label.key() == LABEL_DATABASE {
+                    database = Some(label.value().to_string());
+                } else if label.key() == LABEL_TABLE {
+                    table = Some(label.value().to_string());
+                }
+            }
+            let database = database.expect("scanner metric must include database label");
+            let table = table.expect("scanner metric must include table label");
+            let counter_value = match val {
+                metrics_util::debugging::DebugValue::Counter(v) => *v,
+                other => panic!("expected Counter, got {other:?}"),
+            };
+            counter_by_table.insert((database, table), counter_value);
+        }
+
+        assert_eq!(
+            counter_by_table.get(&("db1".to_string(), "t1".to_string())),
+            Some(&5),
+        );
+        assert_eq!(
+            counter_by_table.get(&("db2".to_string(), "t2".to_string())),
+            Some(&3),
+        );
     }
 }
diff --git a/fluss-rust/crates/fluss/src/test_utils.rs b/fluss-rust/crates/fluss/src/test_utils.rs
index 47bb2ea81e..f1e17e5f58 100644
--- a/fluss-rust/crates/fluss/src/test_utils.rs
+++ b/fluss-rust/crates/fluss/src/test_utils.rs
@@ -20,6 +20,7 @@ use crate::metadata::{
     DataField, DataTypes, PhysicalTablePath, Schema, TableBucket, TableDescriptor, TableInfo,
     TablePath,
 };
+use crate::metrics::{LABEL_DATABASE, LABEL_TABLE, ScannerMetrics};
 use std::collections::HashMap;
 use std::sync::Arc;
 
@@ -87,3 +88,59 @@ pub(crate) fn build_cluster_arc(
 ) -> Arc<Cluster> {
     Arc::new(build_cluster(table_path, table_id, buckets))
 }
+
+/// Build an `Arc<ScannerMetrics>` for tests. Most callers don't install
+/// a recorder, so the cached handles are no-ops; tests that *do* install
+/// `metrics::with_local_recorder(...)` must call this *inside* the
+/// recorder closure for the cached handles to bind to that recorder.
+pub(crate) fn test_scanner_metrics(table_path: &TablePath) -> Arc<ScannerMetrics> {
+    Arc::new(ScannerMetrics::new(table_path))
+}
+
+/// Asserts that every entry whose name starts with `fluss.client.scanner.`
+/// carries both the `database` and `table` labels matching the expected
+/// values. Use after a `Snapshotter::snapshot().into_vec()` to verify all
+/// emitted scanner metrics in one shot — protects against future scanner
+/// metrics that bypass [`ScannerMetrics`].
+pub(crate) fn assert_scanner_entries_labeled(
+    entries: &[(
+        metrics_util::CompositeKey,
+        Option<metrics::Unit>,
+        Option<metrics::SharedString>,
+        metrics_util::debugging::DebugValue,
+    )],
+    expected_database: &str,
+    expected_table: &str,
+) {
+    for (key, _, _, _) in entries {
+        let name = key.key().name();
+        if !name.starts_with("fluss.client.scanner.") {
+            continue;
+        }
+        let labels: Vec<_> = key
+            .key()
+            .labels()
+            .map(|l| (l.key().to_string(), l.value().to_string()))
+            .collect();
+        let database = labels
+            .iter()
+            .find(|(k, _)| k == LABEL_DATABASE)
+            .unwrap_or_else(|| {
+                panic!("scanner metric `{name}` is missing the database label; labels={labels:?}")
+            });
+        let table = labels
+            .iter()
+            .find(|(k, _)| k == LABEL_TABLE)
+            .unwrap_or_else(|| {
+                panic!("scanner metric `{name}` is missing the table label; labels={labels:?}")
+            });
+        assert_eq!(
+            database.1, expected_database,
+            "scanner metric `{name}` has unexpected database label"
+        );
+        assert_eq!(
+            table.1, expected_table,
+            "scanner metric `{name}` has unexpected table label"
+        );
+    }
+}
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 3f94841e4a..5d98303083 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -141,6 +141,8 @@ Complete API reference for the Fluss Rust client.
 
 Single-consumer: do not call `poll` concurrently on the same scanner (e.g. from `tokio::join!` or two tasks sharing an `Arc`). Mirrors Java's `LogScannerImpl.acquire()` guard. Debug builds surface overlapping calls via a `debug_assert!`; release builds skip the check for performance and produce skewed poll-timing metrics (`fluss.client.scanner.time_between_poll_ms`, `fluss.client.scanner.poll_idle_ratio`) if the contract is violated.
 
+All `fluss.client.scanner.*` metrics carry `database` and `table` labels (matching Java's per-`TablePath` `ScannerMetricGroup`), so multi-table consumers get one time series per scanned table.
+
 | Method                                                                                                    | Description                                              |
 |-----------------------------------------------------------------------------------------------------------|----------------------------------------------------------|
 | `async fn subscribe(&self, bucket_id: i32, start_offset: i64) -> Result<()>`                              | Subscribe to a bucket                                    |

From b38859efa8041681056c6e62c290dcca1f881ceb Mon Sep 17 00:00:00 2001
From: Nicoleta Lazar <nicolazar91@gmail.com>
Date: Wed, 27 May 2026 09:03:36 +0100
Subject: [PATCH 280/287]  [elixir] feat: Extend Fluss.Config with writer
 tuning options (#566)

* feat(elixir): Extend NifConfig with writer tuning fields

This commit adds eight new fields to NifConfig covering writer tuning:
acks, retries, request max size, idempotence, buffer memory size, buffer
wait timeout, max in-flight requests per bucket, and the bucket-assigner
enum (:sticky or :round_robin atoms, decoded via NifUnitEnum).

* feat(elixir): Expose writer tuning options on Fluss.Config

This commit adds eight writer-tuning fields to Fluss.Config and exposes
the corresponding setters: acks, retries, request max size, idempotence,
buffer memory size, buffer wait timeout, max in-flight requests per
bucket, and the bucket-assigner enum.
---
 .../bindings/elixir/lib/fluss/config.ex       |  55 ++++++++-
 .../elixir/native/fluss_nif/src/config.rs     |  47 +++++++-
 .../bindings/elixir/test/config_test.exs      | 108 ++++++++++++++++++
 3 files changed, 206 insertions(+), 4 deletions(-)
 create mode 100644 fluss-rust/bindings/elixir/test/config_test.exs

diff --git a/fluss-rust/bindings/elixir/lib/fluss/config.ex b/fluss-rust/bindings/elixir/lib/fluss/config.ex
index f12f61e426..d02a428ff3 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/config.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/config.ex
@@ -33,17 +33,33 @@ defmodule Fluss.Config do
 
   @enforce_keys [:bootstrap_servers]
   defstruct bootstrap_servers: nil,
+            writer_acks: nil,
             writer_batch_size: nil,
             writer_batch_timeout_ms: nil,
+            writer_bucket_no_key_assigner: nil,
+            writer_buffer_memory_size: nil,
+            writer_buffer_wait_timeout_ms: nil,
             writer_dynamic_batch_size_enabled: nil,
-            writer_dynamic_batch_size_min: nil
+            writer_dynamic_batch_size_min: nil,
+            writer_enable_idempotence: nil,
+            writer_max_inflight_requests_per_bucket: nil,
+            writer_request_max_size: nil,
+            writer_retries: nil
 
   @type t :: %__MODULE__{
           bootstrap_servers: String.t(),
+          writer_acks: String.t() | nil,
           writer_batch_size: non_neg_integer() | nil,
           writer_batch_timeout_ms: non_neg_integer() | nil,
+          writer_bucket_no_key_assigner: :sticky | :round_robin | nil,
+          writer_buffer_memory_size: non_neg_integer() | nil,
+          writer_buffer_wait_timeout_ms: non_neg_integer() | nil,
           writer_dynamic_batch_size_enabled: boolean() | nil,
-          writer_dynamic_batch_size_min: non_neg_integer() | nil
+          writer_dynamic_batch_size_min: non_neg_integer() | nil,
+          writer_enable_idempotence: boolean() | nil,
+          writer_max_inflight_requests_per_bucket: non_neg_integer() | nil,
+          writer_request_max_size: non_neg_integer() | nil,
+          writer_retries: non_neg_integer() | nil
         }
 
   @spec new(String.t()) :: t()
@@ -58,6 +74,10 @@ defmodule Fluss.Config do
   def set_bootstrap_servers(%__MODULE__{} = config, servers) when is_binary(servers),
     do: %{config | bootstrap_servers: servers}
 
+  @spec set_writer_acks(t(), String.t()) :: t()
+  def set_writer_acks(%__MODULE__{} = config, acks) when is_binary(acks),
+    do: %{config | writer_acks: acks}
+
   @spec set_writer_batch_size(t(), non_neg_integer()) :: t()
   def set_writer_batch_size(%__MODULE__{} = config, size) when is_integer(size),
     do: %{config | writer_batch_size: size}
@@ -66,6 +86,19 @@ defmodule Fluss.Config do
   def set_writer_batch_timeout_ms(%__MODULE__{} = config, ms) when is_integer(ms),
     do: %{config | writer_batch_timeout_ms: ms}
 
+  @spec set_writer_bucket_no_key_assigner(t(), :sticky | :round_robin) :: t()
+  def set_writer_bucket_no_key_assigner(%__MODULE__{} = config, assigner)
+      when assigner in [:sticky, :round_robin],
+      do: %{config | writer_bucket_no_key_assigner: assigner}
+
+  @spec set_writer_buffer_memory_size(t(), non_neg_integer()) :: t()
+  def set_writer_buffer_memory_size(%__MODULE__{} = config, size) when is_integer(size),
+    do: %{config | writer_buffer_memory_size: size}
+
+  @spec set_writer_buffer_wait_timeout_ms(t(), non_neg_integer()) :: t()
+  def set_writer_buffer_wait_timeout_ms(%__MODULE__{} = config, ms) when is_integer(ms),
+    do: %{config | writer_buffer_wait_timeout_ms: ms}
+
   @spec set_writer_dynamic_batch_size_enabled(t(), boolean()) :: t()
   def set_writer_dynamic_batch_size_enabled(%__MODULE__{} = config, enabled)
       when is_boolean(enabled),
@@ -75,6 +108,24 @@ defmodule Fluss.Config do
   def set_writer_dynamic_batch_size_min(%__MODULE__{} = config, size) when is_integer(size),
     do: %{config | writer_dynamic_batch_size_min: size}
 
+  @spec set_writer_enable_idempotence(t(), boolean()) :: t()
+  def set_writer_enable_idempotence(%__MODULE__{} = config, enabled)
+      when is_boolean(enabled),
+      do: %{config | writer_enable_idempotence: enabled}
+
+  @spec set_writer_max_inflight_requests_per_bucket(t(), non_neg_integer()) :: t()
+  def set_writer_max_inflight_requests_per_bucket(%__MODULE__{} = config, n)
+      when is_integer(n),
+      do: %{config | writer_max_inflight_requests_per_bucket: n}
+
+  @spec set_writer_request_max_size(t(), non_neg_integer()) :: t()
+  def set_writer_request_max_size(%__MODULE__{} = config, size) when is_integer(size),
+    do: %{config | writer_request_max_size: size}
+
+  @spec set_writer_retries(t(), non_neg_integer()) :: t()
+  def set_writer_retries(%__MODULE__{} = config, n) when is_integer(n),
+    do: %{config | writer_retries: n}
+
   @spec get_bootstrap_servers(t()) :: String.t()
   def get_bootstrap_servers(%__MODULE__{bootstrap_servers: servers}), do: servers
 end
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
index 8bbdfad993..60034d9bc8 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
@@ -15,18 +15,34 @@
 // specific language governing permissions and limitations
 // under the License.
 
-use fluss::config::Config;
-use rustler::NifStruct;
+use fluss::config::{Config, NoKeyAssigner};
+use rustler::{NifStruct, NifUnitEnum};
+
+/// Bucket-assigner strategy for tables without bucket keys.
+/// Maps to fluss::config::NoKeyAssigner.
+#[derive(NifUnitEnum)]
+pub enum NifNoKeyAssigner {
+    Sticky,
+    RoundRobin,
+}
 
 /// Decoded from `%Fluss.Config{}` Elixir struct.
 #[derive(NifStruct)]
 #[module = "Fluss.Config"]
 pub struct NifConfig {
     pub bootstrap_servers: String,
+    pub writer_acks: Option<String>,
     pub writer_batch_size: Option<i32>,
     pub writer_batch_timeout_ms: Option<i64>,
+    pub writer_bucket_no_key_assigner: Option<NifNoKeyAssigner>,
+    pub writer_buffer_memory_size: Option<u64>,
+    pub writer_buffer_wait_timeout_ms: Option<u64>,
     pub writer_dynamic_batch_size_enabled: Option<bool>,
     pub writer_dynamic_batch_size_min: Option<i32>,
+    pub writer_enable_idempotence: Option<bool>,
+    pub writer_max_inflight_requests_per_bucket: Option<u64>,
+    pub writer_request_max_size: Option<i32>,
+    pub writer_retries: Option<i32>,
 }
 
 impl NifConfig {
@@ -47,6 +63,33 @@ impl NifConfig {
         if let Some(size) = self.writer_dynamic_batch_size_min {
             config.writer_dynamic_batch_size_min = size;
         }
+        if let Some(acks) = self.writer_acks {
+            config.writer_acks = acks;
+        }
+        if let Some(assigner) = self.writer_bucket_no_key_assigner {
+            config.writer_bucket_no_key_assigner = match assigner {
+                NifNoKeyAssigner::Sticky => NoKeyAssigner::Sticky,
+                NifNoKeyAssigner::RoundRobin => NoKeyAssigner::RoundRobin,
+            };
+        }
+        if let Some(memory_size) = self.writer_buffer_memory_size {
+            config.writer_buffer_memory_size = memory_size as usize;
+        }
+        if let Some(timeout_ms) = self.writer_buffer_wait_timeout_ms {
+            config.writer_buffer_wait_timeout_ms = timeout_ms;
+        }
+        if let Some(enabled) = self.writer_enable_idempotence {
+            config.writer_enable_idempotence = enabled;
+        }
+        if let Some(requests_limit) = self.writer_max_inflight_requests_per_bucket {
+            config.writer_max_inflight_requests_per_bucket = requests_limit as usize;
+        }
+        if let Some(max_size) = self.writer_request_max_size {
+            config.writer_request_max_size = max_size;
+        }
+        if let Some(retries) = self.writer_retries {
+            config.writer_retries = retries;
+        }
         config
     }
 }
diff --git a/fluss-rust/bindings/elixir/test/config_test.exs b/fluss-rust/bindings/elixir/test/config_test.exs
new file mode 100644
index 0000000000..344c647892
--- /dev/null
+++ b/fluss-rust/bindings/elixir/test/config_test.exs
@@ -0,0 +1,108 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+defmodule Fluss.ConfigTest do
+  use ExUnit.Case, async: true
+
+  test "new/1 creates config with bootstrap_servers; all other fields default to nil" do
+    config = Fluss.Config.new("localhost:9123")
+    assert config == %Fluss.Config{bootstrap_servers: "localhost:9123"}
+  end
+
+  test "set_writer_acks/2 sets the acks value" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_acks("all")
+
+    assert config.writer_acks == "all"
+  end
+
+  test "set_writer_bucket_no_key_assigner/2 sets a valid assigner" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_bucket_no_key_assigner(:sticky)
+
+    assert config.writer_bucket_no_key_assigner == :sticky
+  end
+
+  test "set_writer_bucket_no_key_assigner/2 only accepts :sticky or :round_robin" do
+    assert_raise FunctionClauseError, fn ->
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_bucket_no_key_assigner(:custom)
+    end
+  end
+
+  test "set_writer_buffer_memory_size/2 sets the buffer memory size" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_buffer_memory_size(67_108_864)
+
+    assert config.writer_buffer_memory_size == 67_108_864
+  end
+
+  test "set_writer_buffer_wait_timeout_ms/2 sets the wait timeout" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_buffer_wait_timeout_ms(5_000)
+
+    assert config.writer_buffer_wait_timeout_ms == 5_000
+  end
+
+  test "set_writer_enable_idempotence/2 sets the idempotence flag" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_enable_idempotence(false)
+
+    assert config.writer_enable_idempotence == false
+  end
+
+  test "set_writer_max_inflight_requests_per_bucket/2 sets the inflight limit" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_max_inflight_requests_per_bucket(3)
+
+    assert config.writer_max_inflight_requests_per_bucket == 3
+  end
+
+  test "set_writer_request_max_size/2 sets the request max size" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_request_max_size(2_097_152)
+
+    assert config.writer_request_max_size == 2_097_152
+  end
+
+  test "set_writer_retries/2 sets the retry count" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_retries(5)
+
+    assert config.writer_retries == 5
+  end
+
+  test "setters chain correctly" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_writer_acks("all")
+      |> Fluss.Config.set_writer_retries(3)
+      |> Fluss.Config.set_writer_bucket_no_key_assigner(:round_robin)
+
+    assert config.writer_acks == "all"
+    assert config.writer_retries == 3
+    assert config.writer_bucket_no_key_assigner == :round_robin
+  end
+end

From 087bc9904134a7f08b9bf4d5efba11116af77f9b Mon Sep 17 00:00:00 2001
From: slfan1989 <55643692+slfan1989@users.noreply.github.com>
Date: Thu, 28 May 2026 15:54:53 +0800
Subject: [PATCH 281/287] [tests] replace fixed tokio::time::sleep workarounds
 with wait_for_table_ready helper. (#564)

* [tests] replace fixed tokio::time::sleep workarounds with wait_for_table_ready helper.

* [tests] replace fixed tokio::time::sleep workarounds with wait_for_table_ready helper.

* [tests] replace fixed tokio::time::sleep workarounds with wait_for_table_ready helper.
---
 .../fluss/tests/integration/log_table.rs      |  11 +-
 .../integration/record_batch_log_reader.rs    |  13 +-
 .../crates/fluss/tests/integration/utils.rs   | 157 +++++++++++++++---
 3 files changed, 142 insertions(+), 39 deletions(-)

diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index 8bad7398f1..e2377e1ddc 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -22,7 +22,7 @@ mod table_test {
         ColumnPlan, array_dt_basics_columns, as_row_type, create_partitions, create_table,
         dt_array_int, dt_map_string_int, dt_row_seq_label, extract_ids_from_batches,
         get_shared_cluster, make_int_array, make_string_array, map_dt_basics_columns,
-        row_dt_basics_columns, scalar_dt_columns,
+        row_dt_basics_columns, scalar_dt_columns, wait_for_partitions_ready, wait_for_table_ready,
     };
     use arrow::array::record_batch;
     use fluss::client::{EARLIEST_OFFSET, FlussTable, TableScan};
@@ -169,8 +169,7 @@ mod table_test {
 
         create_table(&admin, &table_path, &table_descriptor).await;
 
-        // Wait for table to be fully initialized
-        tokio::time::sleep(tokio::time::Duration::from_secs(2)).await;
+        wait_for_table_ready(&admin, &table_path).await;
 
         // Test earliest offset (should be 0 for empty table)
         let earliest_offsets = admin
@@ -475,7 +474,7 @@ mod table_test {
             &TableDescriptor::builder().schema(schema).build().unwrap(),
         )
         .await;
-        tokio::time::sleep(Duration::from_secs(1)).await;
+        wait_for_table_ready(&admin, &table_path).await;
 
         let table = connection.get_table(&table_path).await.unwrap();
         let scanner = table.new_scan().create_record_batch_log_scanner().unwrap();
@@ -595,8 +594,8 @@ mod table_test {
         // Create partitions
         create_partitions(&admin, &table_path, "region", &["US", "EU"]).await;
 
-        // Wait for partitions to be available
-        tokio::time::sleep(Duration::from_secs(2)).await;
+        // Wait for partition bucket leaders to be available.
+        wait_for_partitions_ready(&admin, &table_path, &["US", "EU"]).await;
 
         let table = connection
             .get_table(&table_path)
diff --git a/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs b/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs
index 1383645316..cf89c065b9 100644
--- a/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs
+++ b/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs
@@ -21,6 +21,7 @@
 mod reader_test {
     use crate::integration::utils::{
         create_partitions, create_table, extract_ids_from_batches, get_shared_cluster,
+        wait_for_partitions_ready, wait_for_table_buckets_ready, wait_for_table_ready,
     };
     use arrow::array::record_batch;
     use fluss::client::{EARLIEST_OFFSET, FlussConnection, RecordBatchLogReader};
@@ -48,7 +49,7 @@ mod reader_test {
             .build()
             .expect("Failed to build table");
         create_table(&admin, &table_path, &table_descriptor).await;
-        tokio::time::sleep(Duration::from_secs(1)).await;
+        wait_for_table_ready(&admin, &table_path).await;
 
         let table = connection
             .get_table(&table_path)
@@ -121,7 +122,7 @@ mod reader_test {
             .build()
             .expect("Failed to build table");
         create_table(&admin, &table_path, &table_descriptor).await;
-        tokio::time::sleep(Duration::from_secs(1)).await;
+        wait_for_table_ready(&admin, &table_path).await;
 
         let table = connection
             .get_table(&table_path)
@@ -189,7 +190,7 @@ mod reader_test {
             .build()
             .expect("Failed to build table");
         create_table(&admin, &table_path, &table_descriptor).await;
-        tokio::time::sleep(Duration::from_secs(1)).await;
+        wait_for_table_ready(&admin, &table_path).await;
 
         let table = connection
             .get_table(&table_path)
@@ -284,7 +285,7 @@ mod reader_test {
             .build()
             .expect("Failed to build table");
         create_table(&admin, &table_path, &table_descriptor).await;
-        tokio::time::sleep(Duration::from_secs(1)).await;
+        wait_for_table_buckets_ready(&admin, &table_path, &[0, 1]).await;
 
         let table = connection
             .get_table(&table_path)
@@ -380,7 +381,7 @@ mod reader_test {
             .expect("Failed to build table");
 
         create_table(&admin, &table_path, &table_descriptor).await;
-        tokio::time::sleep(Duration::from_secs(1)).await;
+        wait_for_table_ready(&admin, &table_path).await;
 
         let table = connection
             .get_table(&table_path)
@@ -453,7 +454,7 @@ mod reader_test {
 
         create_table(&admin, &table_path, &table_descriptor).await;
         create_partitions(&admin, &table_path, "region", &["US", "EU"]).await;
-        tokio::time::sleep(Duration::from_secs(2)).await;
+        wait_for_partitions_ready(&admin, &table_path, &["US", "EU"]).await;
 
         let table = connection
             .get_table(&table_path)
diff --git a/fluss-rust/crates/fluss/tests/integration/utils.rs b/fluss-rust/crates/fluss/tests/integration/utils.rs
index 934b66264e..2ebe31d963 100644
--- a/fluss-rust/crates/fluss/tests/integration/utils.rs
+++ b/fluss-rust/crates/fluss/tests/integration/utils.rs
@@ -24,7 +24,9 @@ use fluss::metadata::{
 use fluss::record::ScanBatch;
 use fluss::row::FlussArray;
 use fluss::row::binary_array::FlussArrayWriter;
+use fluss::rpc::message::OffsetSpec;
 use std::collections::HashMap;
+use std::future::Future;
 use std::sync::Arc;
 use std::sync::LazyLock;
 use std::time::Duration;
@@ -100,6 +102,110 @@ pub async fn create_table(
         .expect("Failed to create table");
 }
 
+const READINESS_TIMEOUT: Duration = Duration::from_secs(30);
+const READINESS_POLL_INTERVAL: Duration = Duration::from_millis(200);
+
+/// Awaits `probe` repeatedly until it yields `Ok(())`, sleeping `interval` between attempts.
+///
+/// Panics with `timeout_message` and the last probe error if a probe fails after `timeout`.
+async fn poll_until<F, Fut>(
+    timeout: Duration,
+    interval: Duration,
+    timeout_message: String,
+    mut probe: F,
+) where
+    F: FnMut() -> Fut,
+    Fut: Future<Output = Result<(), String>>,
+{
+    let started_at = std::time::Instant::now();
+    loop {
+        let Err(err) = probe().await else {
+            return;
+        };
+        if started_at.elapsed() >= timeout {
+            panic!(
+                "{timeout_message} after {} seconds. Last error: {err}",
+                timeout.as_secs()
+            );
+        }
+
+        tokio::time::sleep(interval).await;
+    }
+}
+
+/// Waits until the default bucket of a non-partitioned table can serve offset requests.
+///
+/// Newly-created tables may not have bucket leaders immediately. Polling list offsets avoids
+/// fixed sleeps that are either flaky on slow CI or waste time when the cluster is ready sooner.
+pub async fn wait_for_table_ready(admin: &FlussAdmin, table_path: &TablePath) {
+    wait_for_table_buckets_ready(admin, table_path, &[0]).await;
+}
+
+/// Waits until the specified buckets of a non-partitioned table can serve offset requests.
+pub async fn wait_for_table_buckets_ready(
+    admin: &FlussAdmin,
+    table_path: &TablePath,
+    buckets: &[i32],
+) {
+    poll_until(
+        READINESS_TIMEOUT,
+        READINESS_POLL_INTERVAL,
+        format!("Timed out waiting for table '{table_path}' buckets {buckets:?} to become ready"),
+        || async {
+            admin
+                .list_offsets(table_path, buckets, OffsetSpec::Latest)
+                .await
+                .map(|_| ())
+                .map_err(|err| format!("{err:?}"))
+        },
+    )
+    .await;
+}
+
+/// Waits until all listed partition values can serve offset requests for the default bucket.
+pub async fn wait_for_partitions_ready(
+    admin: &FlussAdmin,
+    table_path: &TablePath,
+    partition_values: &[&str],
+) {
+    for partition_value in partition_values {
+        wait_for_partition_ready(admin, table_path, partition_value).await;
+    }
+}
+
+/// Waits until one partition value can serve offset requests for the default bucket.
+pub async fn wait_for_partition_ready(
+    admin: &FlussAdmin,
+    table_path: &TablePath,
+    partition_value: &str,
+) {
+    wait_for_partition_buckets_ready(admin, table_path, partition_value, &[0]).await;
+}
+
+/// Waits until the specified buckets of a partition can serve offset requests.
+pub async fn wait_for_partition_buckets_ready(
+    admin: &FlussAdmin,
+    table_path: &TablePath,
+    partition_value: &str,
+    buckets: &[i32],
+) {
+    poll_until(
+        READINESS_TIMEOUT,
+        READINESS_POLL_INTERVAL,
+        format!(
+            "Timed out waiting for table '{table_path}' partition '{partition_value}' buckets {buckets:?} to become ready"
+        ),
+        || async {
+            admin
+                .list_partition_offsets(table_path, partition_value, buckets, OffsetSpec::Latest)
+                .await
+                .map(|_| ())
+                .map_err(|err| format!("{err:?}"))
+        },
+    )
+    .await;
+}
+
 pub fn make_string_array(values: &[Option<&str>]) -> FlussArray {
     let mut writer = FlussArrayWriter::new(values.len(), &DataTypes::string());
     for (idx, value) in values.iter().enumerate() {
@@ -141,38 +247,35 @@ pub fn extract_ids_from_batches(batches: &[ScanBatch]) -> Vec<i32> {
 
 /// Similar to wait_for_cluster_ready but connects with SASL credentials.
 pub async fn wait_for_cluster_ready_with_sasl(cluster: &FlussTestingCluster) {
-    let timeout = Duration::from_secs(30);
-    let poll_interval = Duration::from_millis(500);
-    let start = std::time::Instant::now();
-
     let (username, password) = cluster
         .sasl_users()
         .first()
         .expect("SASL cluster must have at least one user");
 
-    loop {
-        let connection = cluster
-            .get_fluss_connection_with_sasl(username, password)
-            .await;
-        if connection
-            .get_metadata()
-            .get_cluster()
-            .get_one_available_server()
-            .is_some()
-        {
-            return;
-        }
-
-        if start.elapsed() >= timeout {
-            panic!(
-                "SASL server readiness check timed out after {} seconds. \
-                 CoordinatorEventProcessor may not be initialized or TabletServer may not be available.",
-                timeout.as_secs()
-            );
-        }
-
-        tokio::time::sleep(poll_interval).await;
-    }
+    poll_until(
+        Duration::from_secs(30),
+        Duration::from_millis(500),
+        "SASL server readiness check timed out".to_string(),
+        || async {
+            let connection = cluster
+                .get_fluss_connection_with_sasl(username, password)
+                .await;
+            if connection
+                .get_metadata()
+                .get_cluster()
+                .get_one_available_server()
+                .is_some()
+            {
+                Ok(())
+            } else {
+                Err(
+                    "CoordinatorEventProcessor may not be initialized or TabletServer may not be available"
+                        .to_string(),
+                )
+            }
+        },
+    )
+    .await;
 }
 
 /// Creates partitions for a partitioned table.

From 634c603e24c1106f720c20a5986a6640739e8940 Mon Sep 17 00:00:00 2001
From: Arnav-Panjla <arnavpanjla@gmail.com>
Date: Wed, 27 May 2026 00:35:26 +0100
Subject: [PATCH 282/287] [client] Implement BatchScanner with limit-based scan

Implements a one-shot bounded BatchScanner backed by a single
LimitScanRequest RPC (fixes #316):
- adds TableScan::limit and create_batch_scanner
- eager RPC with leader resolution (mirrors Lookuper)
- Arrow IPC (log) and KV -> RecordBatch (PK) decoding
- projection support

Squashed from PR #515.
---
 .../fluss/src/client/table/batch_scanner.rs   | 435 ++++++++++++++++++
 .../crates/fluss/src/client/table/mod.rs      |   2 +
 .../crates/fluss/src/client/table/scanner.rs  |  51 ++
 .../fluss/tests/integration/batch_scanner.rs  | 162 +++++++
 fluss-rust/crates/fluss/tests/test_fluss.rs   |   1 +
 5 files changed, 651 insertions(+)
 create mode 100644 fluss-rust/crates/fluss/src/client/table/batch_scanner.rs
 create mode 100644 fluss-rust/crates/fluss/tests/integration/batch_scanner.rs

diff --git a/fluss-rust/crates/fluss/src/client/table/batch_scanner.rs b/fluss-rust/crates/fluss/src/client/table/batch_scanner.rs
new file mode 100644
index 0000000000..f0319859fc
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/client/table/batch_scanner.rs
@@ -0,0 +1,435 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! One-shot bounded scanner backed by a single `LimitScanRequest` RPC.
+//!
+//! Unlike [`crate::client::table::LogScanner`], a `BatchScanner` does not
+//! subscribe to bucket offsets or stream from the server. It performs a single
+//! eager request for up to `limit` rows from one `TableBucket` and exposes the
+//! result as a single Arrow [`RecordBatch`] on the first call to
+//! [`BatchScanner::poll_batch`]; subsequent calls return `None`.
+
+use crate::client::metadata::Metadata;
+use crate::error::{ApiError, Error, FlussError, Result};
+use crate::metadata::{TableBucket, TableInfo};
+use crate::proto::ErrorResponse;
+use crate::record::kv::{KvRecordBatch, KvRecordReadContext, ReadContext as KvReadContext, SchemaGetter};
+use crate::record::{LogRecordsBatches, ReadContext as ArrowReadContext, ScanBatch, RowAppendRecordBatchBuilder, to_arrow_schema};
+use crate::rpc::RpcClient;
+use crate::rpc::message::LimitScanRequest;
+use arrow::array::RecordBatch;
+use arrow_schema::SchemaRef;
+use bytes::Bytes;
+use std::sync::Arc;
+
+/// Adapter over a [`TableInfo`] that satisfies [`SchemaGetter`] for a single
+/// table. The requested schema id is ignored and the embedded schema is always
+/// returned, which assumes every scanned KV record was written with that schema.
+struct TableInfoSchemaGetter {
+    schema: Arc<crate::metadata::Schema>,
+}
+
+impl SchemaGetter for TableInfoSchemaGetter {
+    fn get_schema(&self, _schema_id: i16) -> Result<Arc<crate::metadata::Schema>> {
+        Ok(Arc::clone(&self.schema))
+    }
+}
+
+/// One-shot bounded scanner.
+///
+/// The scanner sends a single `LimitScanRequest` on construction and caches
+/// the resulting Arrow `RecordBatch`. The first `poll_batch()` returns the
+/// batch (wrapped in a [`ScanBatch`]); the second returns `None`.
+pub struct BatchScanner {
+    bucket: TableBucket,
+    /// Pre-fetched batch, taken out on the first `poll_batch` call.
+    batch: Option<RecordBatch>,
+    /// Base log offset of the pre-fetched batch. For log tables, this is the
+    /// `base_log_offset` of the first underlying `LogRecordBatch`. For KV
+    /// tables (limit scan on a primary-key table) there is no log offset, so
+    /// this is `0`.
+    base_offset: i64,
+}
+
+impl BatchScanner {
+    pub(super) async fn new(
+        rpc_client: Arc<RpcClient>,
+        metadata: Arc<Metadata>,
+        table_info: TableInfo,
+        projected_fields: Option<Vec<usize>>,
+        bucket: TableBucket,
+        limit: i32,
+    ) -> Result<Self> {
+        // Resolve leader for the target bucket (mirrors Lookuper's pattern).
+        let leader = metadata
+            .leader_for(&table_info.table_path, &bucket)
+            .await?
+            .ok_or_else(|| {
+                Error::leader_not_available(format!(
+                    "No leader found for table bucket: {bucket}"
+                ))
+            })?;
+        let connection = rpc_client.get_connection(&leader).await?;
+
+        // Fire the single LimitScanRequest RPC.
+        let request = LimitScanRequest::new(
+            table_info.table_id,
+            bucket.partition_id(),
+            bucket.bucket_id(),
+            limit,
+        );
+        let response = connection.request(request).await?;
+
+        // Surface server-side errors using the same shape as Lookuper.
+        if let Some(error_code) = response.error_code
+            && error_code != FlussError::None.code()
+        {
+            let err: ApiError = ErrorResponse {
+                error_code,
+                error_message: response.error_message.clone(),
+            }
+            .into();
+            return Err(Error::FlussAPIError { api_error: err });
+        }
+
+        let is_log_table = response.is_log_table.unwrap_or(false);
+        let raw = response.records.unwrap_or_default();
+
+        let (batch, base_offset) = if is_log_table {
+            decode_log_batch(&table_info, projected_fields.as_deref(), raw)?
+        } else {
+            (decode_kv_batch(&table_info, projected_fields.as_deref(), raw)?, 0)
+        };
+
+        Ok(Self {
+            bucket,
+            batch: Some(batch),
+            base_offset,
+        })
+    }
+
+    /// Returns the pre-fetched batch on the first call, then `None`.
+    pub async fn poll_batch(&mut self) -> Result<Option<ScanBatch>> {
+        let base_offset = self.base_offset;
+        Ok(self
+            .batch
+            .take()
+            .map(|b| ScanBatch::new(self.bucket.clone(), b, base_offset)))
+    }
+
+    /// The bucket scanned by this `BatchScanner`.
+    pub fn bucket(&self) -> &TableBucket {
+        &self.bucket
+    }
+}
+
+/// Decodes an Arrow-IPC `LogRecordBatch` payload into one Arrow `RecordBatch`
+/// (inner batches are concatenated) plus the base log offset of the first inner
+/// batch, or `0` when the payload holds no batch.
+fn decode_log_batch(
+    table_info: &TableInfo,
+    projected_fields: Option<&[usize]>,
+    raw: Vec<u8>,
+) -> Result<(RecordBatch, i64)> {
+    let row_type = Arc::new(table_info.get_row_type().clone());
+    let full_schema = to_arrow_schema(table_info.get_row_type())?;
+    let read_context = match projected_fields {
+        None => ArrowReadContext::new(full_schema.clone(), row_type.clone(), false),
+        Some(fields) => ArrowReadContext::with_projection_pushdown(
+            full_schema.clone(),
+            row_type.clone(),
+            fields.to_vec(),
+            false,
+        )?,
+    };
+
+    let target_schema: SchemaRef = match projected_fields {
+        None => full_schema,
+        // Reuse the schema converted above rather than converting the row type a
+        // second time; this matches how `decode_kv_batch` projects its schema.
+        // (`full_schema` was only cloned so far, so it can be moved in both arms.)
+        Some(fields) => ArrowReadContext::project_schema(full_schema, fields)?,
+    };
+
+    if raw.is_empty() {
+        return Ok((RecordBatch::new_empty(target_schema), 0));
+    }
+
+    let mut batches: Vec<RecordBatch> = Vec::new();
+    let mut base_offset: Option<i64> = None;
+    for log_batch in LogRecordsBatches::new(raw) {
+        let log_batch = log_batch?;
+        if base_offset.is_none() {
+            base_offset = Some(log_batch.base_log_offset());
+        }
+        let rb = log_batch.record_batch(&read_context)?;
+        batches.push(rb);
+    }
+
+    let base_offset = base_offset.unwrap_or(0);
+    if batches.is_empty() {
+        return Ok((RecordBatch::new_empty(target_schema), base_offset));
+    }
+    if batches.len() == 1 {
+        return Ok((batches.into_iter().next().unwrap(), base_offset));
+    }
+    let merged = arrow::compute::concat_batches(&target_schema, batches.iter()).map_err(|e| {
+        Error::UnexpectedError {
+            message: format!("Failed to concatenate log record batches: {e}"),
+            source: None,
+        }
+    })?;
+    Ok((merged, base_offset))
+}
+
+/// Decode a KV-format payload into a single Arrow `RecordBatch`. Each decoded
+/// row is appended through [`RowAppendRecordBatchBuilder`]; records without a
+/// row (deletions) are skipped, so tombstones never appear in the result. Any
+/// projection is applied after the full-width batch has been built.
+fn decode_kv_batch(
+    table_info: &TableInfo,
+    projected_fields: Option<&[usize]>,
+    raw: Vec<u8>,
+) -> Result<RecordBatch> {
+    let row_type = table_info.get_row_type();
+    let full_arrow_schema = to_arrow_schema(row_type)?;
+
+    if raw.is_empty() {
+        let schema: SchemaRef = match projected_fields {
+            None => full_arrow_schema,
+            Some(fields) => ArrowReadContext::project_schema(full_arrow_schema, fields)?,
+        };
+        return Ok(RecordBatch::new_empty(schema));
+    }
+
+    let kv_format = table_info.table_config.get_kv_format()?;
+    let schema_getter = Arc::new(TableInfoSchemaGetter {
+        schema: Arc::new(table_info.get_schema().clone()),
+    });
+    let read_context = KvRecordReadContext::new(kv_format, schema_getter);
+
+    // The KV records payload may be a single batch or a sequence of batches.
+    // The server-side `LimitScanResponse` returns one batch in practice, but
+    // we walk the buffer defensively.
+    let bytes = Bytes::from(raw);
+    let mut builder = RowAppendRecordBatchBuilder::new(row_type)?;
+    let mut position = 0usize;
+
+    while position < bytes.len() {
+        let kv_batch = KvRecordBatch::new(bytes.clone(), position);
+        let size = kv_batch.size_in_bytes().map_err(|e| Error::UnexpectedError {
+            message: format!("Invalid KvRecordBatch length: {e}"),
+            source: None,
+        })?;
+
+        let records = kv_batch.records_unchecked(&read_context as &dyn KvReadContext)?;
+        let decoder = records.decoder_arc();
+        for record in records {
+            let record = record.map_err(|e| Error::UnexpectedError {
+                message: format!("Failed to read KV record: {e}"),
+                source: None,
+            })?;
+            if let Some(row) = record.row(&*decoder) {
+                builder.append(&row)?;
+            }
+        }
+
+        position = position.checked_add(size).ok_or_else(|| Error::UnexpectedError {
+            message: "KvRecordBatch position overflow".to_string(),
+            source: None,
+        })?;
+    }
+
+    let full_batch = Arc::unwrap_or_clone(builder.build_arrow_record_batch()?);
+
+    match projected_fields {
+        None => Ok(full_batch),
+        Some(fields) => {
+            let projected_schema =
+                ArrowReadContext::project_schema(full_arrow_schema, fields)?;
+            let columns: Vec<_> = fields
+                .iter()
+                .map(|&idx| full_batch.column(idx).clone())
+                .collect();
+            Ok(RecordBatch::try_new(projected_schema, columns)?)
+        }
+    }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::client::WriteRecord;
+    use crate::compression::{
+        ArrowCompressionInfo, ArrowCompressionRatioEstimator, ArrowCompressionType,
+        DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+    };
+    use crate::metadata::{
+        DataField, DataTypes, PhysicalTablePath, Schema, TableDescriptor, TableInfo,
+        TablePath,
+    };
+    use crate::record::MemoryLogRecordsArrowBuilder;
+    use crate::row::GenericRow;
+
+    fn build_two_col_table_info() -> TableInfo {
+        let row_type = DataTypes::row(vec![
+            DataField::new("id", DataTypes::int(), None),
+            DataField::new("name", DataTypes::string(), None),
+        ]);
+        let schema = Schema::builder()
+            .with_row_type(&row_type)
+            .build()
+            .expect("schema build");
+        let descriptor = TableDescriptor::builder()
+            .schema(schema)
+            .distributed_by(Some(1), vec![])
+            .build()
+            .expect("descriptor build");
+        TableInfo::of(
+            TablePath::new("db".to_string(), "tbl".to_string()),
+            42,
+            1,
+            descriptor,
+            0,
+            0,
+        )
+    }
+
+    fn build_log_records(table_info: &TableInfo, base_offset: i64, rows: &[(i32, &str)]) -> Vec<u8> {
+        let row_type = table_info.get_row_type();
+        let table_path = table_info.table_path.clone();
+        let table_info_arc = Arc::new(table_info.clone());
+        let physical = Arc::new(PhysicalTablePath::of(Arc::new(table_path)));
+        let mut builder = MemoryLogRecordsArrowBuilder::new(
+            1,
+            row_type,
+            false,
+            ArrowCompressionInfo {
+                compression_type: ArrowCompressionType::None,
+                compression_level: DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
+            },
+            usize::MAX,
+            Arc::new(ArrowCompressionRatioEstimator::default()),
+        )
+        .expect("builder");
+
+        for (i, (id, name)) in rows.iter().enumerate() {
+            let mut row = GenericRow::new(2);
+            row.set_field(0, *id);
+            row.set_field(1, *name);
+            let record = WriteRecord::for_append(
+                Arc::clone(&table_info_arc),
+                physical.clone(),
+                (i + 1) as i32,
+                &row,
+            );
+            builder.append(&record).expect("append");
+        }
+        let mut data = builder.build().expect("build log batch");
+        // Builder always writes base_log_offset=0; patch it so tests can verify
+        // BatchScanner faithfully propagates whatever offset the server returned.
+        let bytes = base_offset.to_le_bytes();
+        data[..bytes.len()].copy_from_slice(&bytes);
+        data
+    }
+
+    #[test]
+    fn decode_log_batch_empty_returns_empty_record_batch() {
+        let table_info = build_two_col_table_info();
+        let (batch, base_offset) =
+            decode_log_batch(&table_info, None, Vec::new()).expect("decode empty");
+        assert_eq!(batch.num_rows(), 0);
+        assert_eq!(batch.num_columns(), 2);
+        assert_eq!(base_offset, 0);
+    }
+
+    #[test]
+    fn decode_log_batch_empty_with_projection() {
+        let table_info = build_two_col_table_info();
+        let (batch, base_offset) =
+            decode_log_batch(&table_info, Some(&[1usize]), Vec::new()).expect("decode empty");
+        assert_eq!(batch.num_rows(), 0);
+        assert_eq!(batch.num_columns(), 1);
+        assert_eq!(batch.schema().field(0).name(), "name");
+        assert_eq!(base_offset, 0);
+    }
+
+    #[test]
+    fn decode_log_batch_extracts_base_offset_and_rows() {
+        let table_info = build_two_col_table_info();
+        let raw = build_log_records(&table_info, 17, &[(1, "alice"), (2, "bob"), (3, "carol")]);
+
+        let (batch, base_offset) =
+            decode_log_batch(&table_info, None, raw).expect("decode populated");
+        assert_eq!(batch.num_rows(), 3);
+        assert_eq!(batch.num_columns(), 2);
+        assert_eq!(base_offset, 17);
+    }
+
+    #[test]
+    fn decode_log_batch_projection_keeps_requested_columns() {
+        let table_info = build_two_col_table_info();
+        let raw = build_log_records(&table_info, 0, &[(7, "x"), (8, "y")]);
+
+        let (batch, _) =
+            decode_log_batch(&table_info, Some(&[0usize]), raw).expect("decode projected");
+        assert_eq!(batch.num_rows(), 2);
+        assert_eq!(batch.num_columns(), 1);
+        assert_eq!(batch.schema().field(0).name(), "id");
+    }
+
+    #[test]
+    fn decode_kv_batch_empty_returns_empty_record_batch() {
+        let table_info = build_two_col_table_info();
+        let batch = decode_kv_batch(&table_info, None, Vec::new()).expect("decode empty kv");
+        assert_eq!(batch.num_rows(), 0);
+        assert_eq!(batch.num_columns(), 2);
+    }
+
+    #[test]
+    fn decode_kv_batch_empty_with_projection() {
+        let table_info = build_two_col_table_info();
+        let batch = decode_kv_batch(&table_info, Some(&[0usize]), Vec::new())
+            .expect("decode projected empty kv");
+        assert_eq!(batch.num_rows(), 0);
+        assert_eq!(batch.num_columns(), 1);
+        assert_eq!(batch.schema().field(0).name(), "id");
+    }
+
+    #[tokio::test]
+    async fn poll_batch_returns_batch_then_none() {
+        let table_info = build_two_col_table_info();
+        let raw = build_log_records(&table_info, 5, &[(1, "alice"), (2, "bob")]);
+        let (batch, base_offset) = decode_log_batch(&table_info, None, raw).expect("decode");
+
+        let bucket = TableBucket::new(table_info.table_id, 0);
+        let mut scanner = BatchScanner {
+            bucket: bucket.clone(),
+            batch: Some(batch),
+            base_offset,
+        };
+
+        let first = scanner.poll_batch().await.expect("poll").expect("some");
+        assert_eq!(first.bucket(), &bucket);
+        assert_eq!(first.num_records(), 2);
+        assert_eq!(first.base_offset(), 5);
+        assert_eq!(first.last_offset(), 6);
+
+        let second = scanner.poll_batch().await.expect("poll");
+        assert!(second.is_none());
+    }
+}
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index e116bbb42d..5ef5d1793c 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -25,6 +25,7 @@ use std::sync::Arc;
 pub const EARLIEST_OFFSET: i64 = -2;
 
 mod append;
+mod batch_scanner;
 mod lookup;
 
 mod log_fetch_buffer;
@@ -35,6 +36,7 @@ mod scanner;
 mod upsert;
 
 pub use append::{AppendWriter, TableAppend};
+pub use batch_scanner::BatchScanner;
 pub use lookup::{LookupResult, Lookuper, PrefixKeyLookuper, TableLookup, TablePrefixLookup};
 pub use reader::{RecordBatchLogReader, SyncRecordBatchLogReader};
 pub use remote_log::{
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index d7e2dd2c71..031975b3e6 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -16,6 +16,7 @@
 // under the License.
 
 use crate::client::connection::FlussConnection;
+use crate::client::table::batch_scanner::BatchScanner;
 use crate::client::credentials::SecurityTokenManager;
 use crate::client::metadata::Metadata;
 use crate::client::table::log_fetch_buffer::{
@@ -55,6 +56,8 @@ pub struct TableScan<'a> {
     metadata: Arc<Metadata>,
     /// Column indices to project. None means all columns, Some(vec) means only the specified columns (non-empty).
     projected_fields: Option<Vec<usize>>,
+    /// Optional row limit. When set, callers may construct a [`BatchScanner`] for a one-shot bounded scan.
+    limit: Option<i32>,
 }
 
 impl<'a> TableScan<'a> {
@@ -64,9 +67,57 @@ impl<'a> TableScan<'a> {
             table_info,
             metadata,
             projected_fields: None,
+            limit: None,
         }
     }
 
+    /// Configures the maximum number of rows for a one-shot bounded scan.
+    ///
+    /// `n` must be strictly positive; otherwise `Error::IllegalArgument` is returned.
+    /// A configured limit is a prerequisite for [`Self::create_batch_scanner`].
+    pub fn limit(mut self, n: i32) -> Result<Self> {
+        if n > 0 {
+            self.limit = Some(n);
+            return Ok(self);
+        }
+        Err(Error::IllegalArgument {
+            message: format!("Scan limit must be positive, got {n}"),
+        })
+    }
+
+    /// Creates a `BatchScanner` that performs a single bounded scan of `table_bucket`.
+    ///
+    /// Requires a previously-configured limit via [`Self::limit`]. The scanner sends
+    /// a `LimitScanRequest` eagerly and exposes the resulting batch through
+    /// [`BatchScanner::poll_batch`].
+    pub async fn create_batch_scanner(
+        self,
+        table_bucket: TableBucket,
+    ) -> Result<BatchScanner> {
+        let limit = self.limit.ok_or_else(|| Error::IllegalArgument {
+            message: "create_batch_scanner requires a limit configured via .limit(n)"
+                .to_string(),
+        })?;
+        if table_bucket.table_id() != self.table_info.table_id {
+            return Err(Error::IllegalArgument {
+                message: format!(
+                    "Bucket table_id {} does not match scan table_id {}",
+                    table_bucket.table_id(),
+                    self.table_info.table_id
+                ),
+            });
+        }
+        BatchScanner::new(
+            self.conn.get_connections(),
+            self.metadata.clone(),
+            self.table_info,
+            self.projected_fields,
+            table_bucket,
+            limit,
+        )
+        .await
+    }
+
     /// Projects the scan to only include specified columns by their indices.
     ///
     /// # Arguments
diff --git a/fluss-rust/crates/fluss/tests/integration/batch_scanner.rs b/fluss-rust/crates/fluss/tests/integration/batch_scanner.rs
new file mode 100644
index 0000000000..2623528176
--- /dev/null
+++ b/fluss-rust/crates/fluss/tests/integration/batch_scanner.rs
@@ -0,0 +1,162 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#[cfg(test)]
+mod batch_scanner_test {
+    use crate::integration::utils::{create_table, get_shared_cluster};
+    use arrow::array::record_batch;
+    use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
+    use std::time::Duration;
+
+    /// End-to-end check that BatchScanner returns the appended rows on first
+    /// poll and `None` on the next, honoring the configured limit.
+    #[tokio::test]
+    async fn batch_scanner_returns_appended_rows_then_none() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("admin");
+
+        let table_path = TablePath::new("fluss", "test_batch_scanner_log");
+        let descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("c1", DataTypes::int())
+                    .column("c2", DataTypes::string())
+                    .build()
+                    .expect("schema"),
+            )
+            // Single bucket so a single BatchScanner sees every row.
+            .distributed_by(Some(1), vec!["c1".to_string()])
+            .build()
+            .expect("descriptor");
+        create_table(&admin, &table_path, &descriptor).await;
+
+        let table = connection.get_table(&table_path).await.expect("table");
+        let writer = table
+            .new_append()
+            .expect("append")
+            .create_writer()
+            .expect("writer");
+
+        let batch = record_batch!(
+            ("c1", Int32, [1, 2, 3, 4, 5]),
+            ("c2", Utf8, ["a", "b", "c", "d", "e"])
+        )
+        .unwrap();
+        writer.append_arrow_batch(batch).expect("append batch");
+        writer.flush().await.expect("flush");
+
+        // Give the server a moment to commit and make the records readable.
+        tokio::time::sleep(Duration::from_secs(1)).await;
+
+        let table_info = table.get_table_info();
+        let bucket = TableBucket::new(table_info.table_id, 0);
+
+        let mut batch_scanner = table
+            .new_scan()
+            .limit(3)
+            .expect("limit")
+            .create_batch_scanner(bucket.clone())
+            .await
+            .expect("create batch scanner");
+
+        let first = batch_scanner
+            .poll_batch()
+            .await
+            .expect("poll")
+            .expect("first batch should be Some");
+
+        assert_eq!(first.bucket(), &bucket);
+        // The server may return fewer rows than the limit on the first call,
+        // but must never exceed it.
+        assert!(
+            first.num_records() > 0 && first.num_records() <= 3,
+            "expected 1..=3 records, got {}",
+            first.num_records()
+        );
+
+        let second = batch_scanner
+            .poll_batch()
+            .await
+            .expect("second poll succeeds");
+        assert!(second.is_none(), "second poll must return None");
+    }
+
+    /// A bucket whose table id differs from the scanned table's must be
+    /// rejected by `create_batch_scanner` before any RPC is made.
+    #[tokio::test]
+    async fn batch_scanner_requires_matching_table_id() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("admin");
+
+        let table_path = TablePath::new("fluss", "test_batch_scanner_table_id");
+        let descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("c1", DataTypes::int())
+                    .build()
+                    .expect("schema"),
+            )
+            .distributed_by(Some(1), vec!["c1".to_string()])
+            .build()
+            .expect("descriptor");
+        create_table(&admin, &table_path, &descriptor).await;
+
+        let table = connection.get_table(&table_path).await.expect("table");
+
+        // Bucket with a wrong table_id — must fail without hitting the server.
+        let bogus_bucket = TableBucket::new(table.get_table_info().table_id + 9999, 0);
+
+        let result = table
+            .new_scan()
+            .limit(1)
+            .expect("limit")
+            .create_batch_scanner(bogus_bucket)
+            .await;
+        assert!(
+            result.is_err(),
+            "batch scanner must reject mismatched table_id"
+        );
+    }
+
+    /// `.limit(n)` must reject non-positive values before any scanner is built.
+    #[tokio::test]
+    async fn batch_scanner_rejects_non_positive_limit() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("admin");
+
+        let table_path = TablePath::new("fluss", "test_batch_scanner_bad_limit");
+        let descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("c1", DataTypes::int())
+                    .build()
+                    .expect("schema"),
+            )
+            .distributed_by(Some(1), vec!["c1".to_string()])
+            .build()
+            .expect("descriptor");
+        create_table(&admin, &table_path, &descriptor).await;
+
+        let table = connection.get_table(&table_path).await.expect("table");
+        assert!(table.new_scan().limit(0).is_err());
+        assert!(table.new_scan().limit(-5).is_err());
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/test_fluss.rs b/fluss-rust/crates/fluss/tests/test_fluss.rs
index 792b68f00e..2d2bd152ec 100644
--- a/fluss-rust/crates/fluss/tests/test_fluss.rs
+++ b/fluss-rust/crates/fluss/tests/test_fluss.rs
@@ -21,6 +21,7 @@ extern crate fluss;
 #[cfg(feature = "integration_tests")]
 mod integration {
     mod admin;
+    mod batch_scanner;
     mod fluss_cluster;
     mod kv_table;
     mod log_table;

From 35a6ec6f4e384fe7da30302d9e20cf28148bbba3 Mon Sep 17 00:00:00 2001
From: Anton Borisov <anton.borisov@fresha.com>
Date: Wed, 27 May 2026 01:31:55 +0100
Subject: [PATCH 283/287] [client] Fix KV limit-scan decode + enforce limit,
 support schema evolution

---
 .../fluss/src/client/table/batch_scanner.rs   | 710 +++++++++++++-----
 .../crates/fluss/src/client/table/mod.rs      |   2 +-
 .../crates/fluss/src/client/table/scanner.rs  |  74 +-
 fluss-rust/crates/fluss/src/record/kv/mod.rs  |   2 +
 .../fluss/src/record/kv/value_record_batch.rs | 188 +++++
 .../fluss/tests/integration/batch_scanner.rs  | 236 +++++-
 .../fluss/tests/integration/log_table.rs      |   2 -
 .../integration/record_batch_log_reader.rs    |   7 +-
 .../docs/user-guide/rust/api-reference.md     |  15 +
 .../user-guide/rust/example/log-tables.md     |  17 +
 .../rust/example/primary-key-tables.md        |  15 +
 11 files changed, 1025 insertions(+), 243 deletions(-)
 create mode 100644 fluss-rust/crates/fluss/src/record/kv/value_record_batch.rs

diff --git a/fluss-rust/crates/fluss/src/client/table/batch_scanner.rs b/fluss-rust/crates/fluss/src/client/table/batch_scanner.rs
index f0319859fc..cc0585f30e 100644
--- a/fluss-rust/crates/fluss/src/client/table/batch_scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/batch_scanner.rs
@@ -15,135 +15,165 @@
 // specific language governing permissions and limitations
 // under the License.
 
-//! One-shot bounded scanner backed by a single `LimitScanRequest` RPC.
+//! Bounded batch scanner backed by a single `LimitScanRequest`, polled with
+//! `next_batch` until it returns `None` (like `RecordBatchLogReader`).
 //!
-//! Unlike [`crate::client::table::LogScanner`], a `BatchScanner` does not
-//! subscribe to bucket offsets or stream from the server. It performs a single
-//! eager request for up to `limit` rows from one `TableBucket` and exposes the
-//! result as a single Arrow [`RecordBatch`] on the first call to
-//! [`BatchScanner::poll_batch`]; subsequent calls return `None`.
+//! The KV branch decodes a [`ValueRecordBatch`], decoding each record against
+//! its own schema id via [`FixedSchemaDecoder`] so older records are projected
+//! onto the current schema (the same path as lookup).
 
+use crate::client::ClientSchemaGetter;
 use crate::client::metadata::Metadata;
 use crate::error::{ApiError, Error, FlussError, Result};
-use crate::metadata::{TableBucket, TableInfo};
+use crate::metadata::{KvFormat, RowType, Schema, TableBucket, TableInfo};
 use crate::proto::ErrorResponse;
-use crate::record::kv::{KvRecordBatch, KvRecordReadContext, ReadContext as KvReadContext, SchemaGetter};
-use crate::record::{LogRecordsBatches, ReadContext as ArrowReadContext, ScanBatch, RowAppendRecordBatchBuilder, to_arrow_schema};
+use crate::record::kv::{SCHEMA_ID_LENGTH, ValueRecordBatch};
+use crate::record::{
+    LogRecordsBatches, ReadContext as ArrowReadContext, RowAppendRecordBatchBuilder, ScanBatch,
+    to_arrow_schema,
+};
+use crate::row::FixedSchemaDecoder;
 use crate::rpc::RpcClient;
 use crate::rpc::message::LimitScanRequest;
 use arrow::array::RecordBatch;
+use arrow::compute::concat_batches;
 use arrow_schema::SchemaRef;
+use byteorder::{ByteOrder, LittleEndian};
 use bytes::Bytes;
+use std::collections::HashMap;
+use std::ops::Range;
 use std::sync::Arc;
 
-/// Adapter over a [`TableInfo`] that satisfies [`SchemaGetter`] for a single
-/// table. KV lookups always carry the same schema id, so we just hand back
-/// the embedded schema.
-struct TableInfoSchemaGetter {
-    schema: Arc<crate::metadata::Schema>,
+/// One-shot bounded scanner: a single `LimitScanRequest` yielded as one
+/// [`ScanBatch`]. Creation is cheap; the request runs on the first
+/// [`next_batch`](Self::next_batch), which returns the batch once, then `None`.
+pub struct LimitBatchScanner {
+    bucket: TableBucket,
+    /// Taken on the first `next_batch` to run the scan; `None` afterward.
+    pending: Option<PendingScan>,
 }
 
-impl SchemaGetter for TableInfoSchemaGetter {
-    fn get_schema(&self, _schema_id: i16) -> Result<Arc<crate::metadata::Schema>> {
-        Ok(Arc::clone(&self.schema))
-    }
+/// Request inputs captured at creation, consumed by the first `next_batch`.
+struct PendingScan {
+    rpc_client: Arc<RpcClient>,
+    metadata: Arc<Metadata>,
+    table_info: TableInfo,
+    schema_getter: Arc<ClientSchemaGetter>,
+    projected_fields: Option<Vec<usize>>,
+    limit: i32,
 }
 
-/// One-shot bounded scanner.
-///
-/// The scanner sends a single `LimitScanRequest` on construction and caches
-/// the resulting Arrow `RecordBatch`. The first `poll_batch()` returns the
-/// batch (wrapped in a [`ScanBatch`]); the second returns `None`.
-pub struct BatchScanner {
-    bucket: TableBucket,
-    /// Pre-fetched batch, taken out on the first `poll_batch` call.
-    batch: Option<RecordBatch>,
-    /// Base log offset of the pre-fetched batch. For log tables, this is the
-    /// `base_log_offset` of the first underlying `LogRecordBatch`. For KV
-    /// tables (limit scan on a primary-key table) there is no log offset, so
-    /// this is `0`.
-    base_offset: i64,
-}
-
-impl BatchScanner {
-    pub(super) async fn new(
+impl LimitBatchScanner {
+    pub(super) fn new(
         rpc_client: Arc<RpcClient>,
         metadata: Arc<Metadata>,
         table_info: TableInfo,
+        schema_getter: Arc<ClientSchemaGetter>,
         projected_fields: Option<Vec<usize>>,
         bucket: TableBucket,
         limit: i32,
-    ) -> Result<Self> {
-        // Resolve leader for the target bucket (mirrors Lookuper's pattern).
-        let leader = metadata
-            .leader_for(&table_info.table_path, &bucket)
-            .await?
-            .ok_or_else(|| {
-                Error::leader_not_available(format!(
-                    "No leader found for table bucket: {bucket}"
-                ))
-            })?;
-        let connection = rpc_client.get_connection(&leader).await?;
-
-        // Fire the single LimitScanRequest RPC.
-        let request = LimitScanRequest::new(
-            table_info.table_id,
-            bucket.partition_id(),
-            bucket.bucket_id(),
-            limit,
-        );
-        let response = connection.request(request).await?;
-
-        // Surface server-side errors using the same shape as Lookuper.
-        if let Some(error_code) = response.error_code
-            && error_code != FlussError::None.code()
-        {
-            let err: ApiError = ErrorResponse {
-                error_code,
-                error_message: response.error_message.clone(),
-            }
-            .into();
-            return Err(Error::FlussAPIError { api_error: err });
+    ) -> Self {
+        Self {
+            bucket,
+            pending: Some(PendingScan {
+                rpc_client,
+                metadata,
+                table_info,
+                schema_getter,
+                projected_fields,
+                limit,
+            }),
         }
+    }
 
-        let is_log_table = response.is_log_table.unwrap_or(false);
-        let raw = response.records.unwrap_or_default();
-
-        let (batch, base_offset) = if is_log_table {
-            decode_log_batch(&table_info, projected_fields.as_deref(), raw)?
-        } else {
-            (decode_kv_batch(&table_info, projected_fields.as_deref(), raw)?, 0)
+    /// Runs the scan on the first call and returns its batch, then `None`. Not
+    /// retried — an error leaves the scanner spent; create a new one to retry.
+    pub async fn next_batch(&mut self) -> Result<Option<ScanBatch>> {
+        let Some(pending) = self.pending.take() else {
+            return Ok(None);
         };
-
-        Ok(Self {
-            bucket,
-            batch: Some(batch),
-            base_offset,
-        })
+        run_limit_scan(&pending, &self.bucket).await.map(Some)
     }
 
-    /// Returns the pre-fetched batch on the first call, then `None`.
-    pub async fn poll_batch(&mut self) -> Result<Option<ScanBatch>> {
-        let base_offset = self.base_offset;
-        Ok(self
-            .batch
-            .take()
-            .map(|b| ScanBatch::new(self.bucket.clone(), b, base_offset)))
+    /// Drains the scanner into all of its batches.
+    pub async fn collect_all_batches(&mut self) -> Result<Vec<ScanBatch>> {
+        let mut batches = Vec::new();
+        while let Some(batch) = self.next_batch().await? {
+            batches.push(batch);
+        }
+        Ok(batches)
     }
 
-    /// The bucket scanned by this `BatchScanner`.
+    /// The bucket scanned by this `LimitBatchScanner`.
     pub fn bucket(&self) -> &TableBucket {
         &self.bucket
     }
 }
 
-/// Decode an Arrow-IPC encoded `LogRecordBatch` payload into a single Arrow
-/// `RecordBatch`. Multiple inner batches (rare for a `LimitScanRequest`) are
-/// concatenated.
+/// Resolves the leader, sends the `LimitScanRequest`, and decodes the response
+/// into one [`ScanBatch`].
+async fn run_limit_scan(pending: &PendingScan, bucket: &TableBucket) -> Result<ScanBatch> {
+    let leader = pending
+        .metadata
+        .leader_for(&pending.table_info.table_path, bucket)
+        .await?
+        .ok_or_else(|| {
+            Error::leader_not_available(format!("No leader found for table bucket: {bucket}"))
+        })?;
+    let connection = pending.rpc_client.get_connection(&leader).await?;
+
+    let request = LimitScanRequest::new(
+        pending.table_info.table_id,
+        bucket.partition_id(),
+        bucket.bucket_id(),
+        pending.limit,
+    );
+    let response = connection.request(request).await?;
+
+    if let Some(error_code) = response.error_code
+        && error_code != FlussError::None.code()
+    {
+        let err: ApiError = ErrorResponse {
+            error_code,
+            error_message: response.error_message.clone(),
+        }
+        .into();
+        return Err(Error::FlussAPIError { api_error: err });
+    }
+
+    let raw = response.records.unwrap_or_default();
+    // `limit` is validated positive by `TableScan::limit`.
+    let limit = pending.limit.max(0) as usize;
+    let projected = pending.projected_fields.as_deref();
+
+    // Choose the payload format from table metadata, not the response's advisory
+    // `is_log_table` flag.
+    let (batch, base_offset) = if !pending.table_info.has_primary_key() {
+        decode_log_batch(&pending.table_info, projected, raw, limit)?
+    } else {
+        // KV (primary-key) limit scan: no log offset, so base_offset is 0.
+        let batch = decode_kv_batch(
+            &pending.table_info,
+            &pending.schema_getter,
+            projected,
+            raw,
+            limit,
+        )
+        .await?;
+        (batch, 0)
+    };
+
+    Ok(ScanBatch::new(bucket.clone(), batch, base_offset))
+}
+
+/// Decode the log payload into a single Arrow `RecordBatch`, concatenating any
+/// inner batches. If more than `limit` rows are returned, the last `limit` are
+/// kept and `base_offset` is advanced by the number dropped.
 fn decode_log_batch(
     table_info: &TableInfo,
     projected_fields: Option<&[usize]>,
     raw: Vec<u8>,
+    limit: usize,
 ) -> Result<(RecordBatch, i64)> {
     let row_type = Arc::new(table_info.get_row_type().clone());
     let full_schema = to_arrow_schema(table_info.get_row_type())?;
@@ -159,10 +189,9 @@ fn decode_log_batch(
 
     let target_schema: SchemaRef = match projected_fields {
         None => full_schema,
-        Some(fields) => ArrowReadContext::project_schema(
-            to_arrow_schema(table_info.get_row_type())?,
-            fields,
-        )?,
+        Some(fields) => {
+            ArrowReadContext::project_schema(to_arrow_schema(table_info.get_row_type())?, fields)?
+        }
     };
 
     if raw.is_empty() {
@@ -181,89 +210,189 @@ fn decode_log_batch(
     }
 
     let base_offset = base_offset.unwrap_or(0);
-    if batches.is_empty() {
-        return Ok((RecordBatch::new_empty(target_schema), base_offset));
-    }
-    if batches.len() == 1 {
-        return Ok((batches.into_iter().next().unwrap(), base_offset));
-    }
-    let merged = arrow::compute::concat_batches(&target_schema, batches.iter()).map_err(|e| {
-        Error::UnexpectedError {
+    let merged = if batches.is_empty() {
+        RecordBatch::new_empty(target_schema)
+    } else if batches.len() == 1 {
+        batches.into_iter().next().unwrap()
+    } else {
+        concat_batches(&target_schema, batches.iter()).map_err(|e| Error::UnexpectedError {
             message: format!("Failed to concatenate log record batches: {e}"),
             source: None,
-        }
-    })?;
-    Ok((merged, base_offset))
+        })?
+    };
+
+    Ok(take_last_rows(merged, base_offset, limit))
 }
 
-/// Decode a KV-format payload into a single Arrow `RecordBatch`. Each
-/// `CompactedRow` is appended through [`RowAppendRecordBatchBuilder`]; deletion
-/// records (no value) are skipped because primary key tables don't return
-/// tombstones from a limit scan.
-fn decode_kv_batch(
+/// Decode a KV limit-scan [`ValueRecordBatch`] into a single Arrow
+/// `RecordBatch`, decoding each record by its own schema id and projecting onto
+/// the current schema.
+async fn decode_kv_batch(
     table_info: &TableInfo,
+    schema_getter: &ClientSchemaGetter,
     projected_fields: Option<&[usize]>,
     raw: Vec<u8>,
+    limit: usize,
 ) -> Result<RecordBatch> {
-    let row_type = table_info.get_row_type();
-    let full_arrow_schema = to_arrow_schema(row_type)?;
-
+    // No records: return an empty (projected) batch.
     if raw.is_empty() {
-        let schema: SchemaRef = match projected_fields {
-            None => full_arrow_schema,
-            Some(fields) => ArrowReadContext::project_schema(full_arrow_schema, fields)?,
-        };
-        return Ok(RecordBatch::new_empty(schema));
+        return empty_record_batch(table_info.get_row_type(), projected_fields);
     }
 
     let kv_format = table_info.table_config.get_kv_format()?;
-    let schema_getter = Arc::new(TableInfoSchemaGetter {
-        schema: Arc::new(table_info.get_schema().clone()),
-    });
-    let read_context = KvRecordReadContext::new(kv_format, schema_getter);
-
-    // The KV records payload may be a single batch or a sequence of batches.
-    // The server-side `LimitScanResponse` returns one batch in practice, but
-    // we walk the buffer defensively.
-    let bytes = Bytes::from(raw);
-    let mut builder = RowAppendRecordBatchBuilder::new(row_type)?;
-    let mut position = 0usize;
-
-    while position < bytes.len() {
-        let kv_batch = KvRecordBatch::new(bytes.clone(), position);
-        let size = kv_batch.size_in_bytes().map_err(|e| Error::UnexpectedError {
-            message: format!("Invalid KvRecordBatch length: {e}"),
+    let target_schema = table_info.get_schema();
+    let target_schema_id =
+        i16::try_from(table_info.get_schema_id()).map_err(|_| Error::UnexpectedError {
+            message: format!(
+                "Schema id {} does not fit in 16 bits — wire format violated",
+                table_info.get_schema_id()
+            ),
             source: None,
         })?;
 
-        let records = kv_batch.records_unchecked(&read_context as &dyn KvReadContext)?;
-        let decoder = records.decoder_arc();
-        for record in records {
-            let record = record.map_err(|e| Error::UnexpectedError {
-                message: format!("Failed to read KV record: {e}"),
+    let batch = ValueRecordBatch::new(Bytes::from(raw));
+    let ranges = batch.value_ranges()?;
+
+    // Collect the distinct schema ids present, then build one decoder per id
+    // (fetching older schemas via the coordinator as needed).
+    let mut schema_ids: Vec<i16> = Vec::new();
+    for range in &ranges {
+        let id = read_schema_id(&batch.data()[range.clone()])?;
+        if !schema_ids.contains(&id) {
+            schema_ids.push(id);
+        }
+    }
+    let decoders = build_kv_decoders(
+        schema_getter,
+        target_schema,
+        target_schema_id,
+        kv_format,
+        &schema_ids,
+    )
+    .await?;
+
+    value_records_to_record_batch(
+        &batch,
+        &ranges,
+        &decoders,
+        table_info.get_row_type(),
+        projected_fields,
+        limit,
+    )
+}
+
+/// Build one [`FixedSchemaDecoder`] per distinct schema id. The current schema
+/// decodes without projection; any other schema id is fetched through
+/// `schema_getter` and projected onto the current schema.
+async fn build_kv_decoders(
+    schema_getter: &ClientSchemaGetter,
+    target_schema: &Schema,
+    target_schema_id: i16,
+    kv_format: KvFormat,
+    schema_ids: &[i16],
+) -> Result<HashMap<i16, FixedSchemaDecoder>> {
+    let mut decoders = HashMap::with_capacity(schema_ids.len());
+    for &id in schema_ids {
+        if decoders.contains_key(&id) {
+            continue;
+        }
+        let decoder = if id == target_schema_id {
+            FixedSchemaDecoder::new_no_projection(kv_format, target_schema)?
+        } else {
+            let source = schema_getter.get_schema(id as i32).await?;
+            FixedSchemaDecoder::new(kv_format, source.as_ref(), target_schema)?
+        };
+        decoders.insert(id, decoder);
+    }
+    Ok(decoders)
+}
+
+/// Decode every value record into a row shaped by `target_row_type`, build a
+/// single Arrow batch, keep the last `limit` rows, then apply column projection.
+fn value_records_to_record_batch(
+    batch: &ValueRecordBatch,
+    ranges: &[Range<usize>],
+    decoders: &HashMap<i16, FixedSchemaDecoder>,
+    target_row_type: &RowType,
+    projected_fields: Option<&[usize]>,
+    limit: usize,
+) -> Result<RecordBatch> {
+    let mut builder = RowAppendRecordBatchBuilder::new(target_row_type)?;
+    for range in ranges {
+        let payload = &batch.data()[range.clone()];
+        let schema_id = read_schema_id(payload)?;
+        let decoder = decoders
+            .get(&schema_id)
+            .ok_or_else(|| Error::UnexpectedError {
+                message: format!("No decoder built for schema id {schema_id}"),
                 source: None,
             })?;
-            if let Some(row) = record.row(&*decoder) {
-                builder.append(&row)?;
-            }
-        }
+        let row = decoder.decode(payload)?;
+        builder.append(&row)?;
+    }
+
+    let full = Arc::unwrap_or_clone(builder.build_arrow_record_batch()?);
+    let (full, _) = take_last_rows(full, 0, limit);
+    project_batch(full, target_row_type, projected_fields)
+}
 
-        position = position.checked_add(size).ok_or_else(|| Error::UnexpectedError {
-            message: "KvRecordBatch position overflow".to_string(),
+/// Read the leading little-endian schema id from a `[schema_id | row]` payload.
+fn read_schema_id(payload: &[u8]) -> Result<i16> {
+    if payload.len() < SCHEMA_ID_LENGTH {
+        return Err(Error::UnexpectedError {
+            message: format!(
+                "Value record payload too short: {} bytes, need {} for schema id",
+                payload.len(),
+                SCHEMA_ID_LENGTH
+            ),
             source: None,
-        })?;
+        });
+    }
+    let schema_id = LittleEndian::read_i16(&payload[..SCHEMA_ID_LENGTH]);
+    if schema_id < 0 {
+        return Err(Error::UnexpectedError {
+            message: format!("Invalid negative schema id {schema_id}; payload is corrupt"),
+            source: None,
+        });
     }
+    Ok(schema_id)
+}
 
-    let full_batch = Arc::unwrap_or_clone(builder.build_arrow_record_batch()?);
+/// Keep the last `limit` rows of `batch`, advancing `base_offset` by the number
+/// of dropped leading rows. A `batch` at or under the limit is returned as-is.
+fn take_last_rows(batch: RecordBatch, base_offset: i64, limit: usize) -> (RecordBatch, i64) {
+    let rows = batch.num_rows();
+    if rows > limit {
+        let dropped = rows - limit;
+        (batch.slice(dropped, limit), base_offset + dropped as i64)
+    } else {
+        (batch, base_offset)
+    }
+}
+
+/// An empty `RecordBatch` with the (optionally projected) target schema.
+fn empty_record_batch(
+    target_row_type: &RowType,
+    projected_fields: Option<&[usize]>,
+) -> Result<RecordBatch> {
+    let empty = RecordBatch::new_empty(to_arrow_schema(target_row_type)?);
+    project_batch(empty, target_row_type, projected_fields)
+}
 
+/// Project `batch` (shaped by `target_row_type`) onto the requested columns.
+fn project_batch(
+    batch: RecordBatch,
+    target_row_type: &RowType,
+    projected_fields: Option<&[usize]>,
+) -> Result<RecordBatch> {
     match projected_fields {
-        None => Ok(full_batch),
+        None => Ok(batch),
         Some(fields) => {
             let projected_schema =
-                ArrowReadContext::project_schema(full_arrow_schema, fields)?;
+                ArrowReadContext::project_schema(to_arrow_schema(target_row_type)?, fields)?;
             let columns: Vec<_> = fields
                 .iter()
-                .map(|&idx| full_batch.column(idx).clone())
+                .map(|&idx| batch.column(idx).clone())
                 .collect();
             Ok(RecordBatch::try_new(projected_schema, columns)?)
         }
@@ -279,11 +408,14 @@ mod tests {
         DEFAULT_NON_ZSTD_COMPRESSION_LEVEL,
     };
     use crate::metadata::{
-        DataField, DataTypes, PhysicalTablePath, Schema, TableDescriptor, TableInfo,
-        TablePath,
+        Column, DataField, DataType, DataTypes, PhysicalTablePath, Schema, TableDescriptor,
+        TableInfo, TablePath,
     };
     use crate::record::MemoryLogRecordsArrowBuilder;
     use crate::row::GenericRow;
+    use crate::row::binary::BinaryWriter;
+    use crate::row::compacted::CompactedRowWriter;
+    use arrow::array::{Array, Int32Array, Int64Array};
 
     fn build_two_col_table_info() -> TableInfo {
         let row_type = DataTypes::row(vec![
@@ -309,7 +441,11 @@ mod tests {
         )
     }
 
-    fn build_log_records(table_info: &TableInfo, base_offset: i64, rows: &[(i32, &str)]) -> Vec<u8> {
+    fn build_log_records(
+        table_info: &TableInfo,
+        base_offset: i64,
+        rows: &[(i32, &str)],
+    ) -> Vec<u8> {
         let row_type = table_info.get_row_type();
         let table_path = table_info.table_path.clone();
         let table_info_arc = Arc::new(table_info.clone());
@@ -347,11 +483,13 @@ mod tests {
         data
     }
 
+    // ---- log path ----------------------------------------------------------
+
     #[test]
     fn decode_log_batch_empty_returns_empty_record_batch() {
         let table_info = build_two_col_table_info();
         let (batch, base_offset) =
-            decode_log_batch(&table_info, None, Vec::new()).expect("decode empty");
+            decode_log_batch(&table_info, None, Vec::new(), usize::MAX).expect("decode empty");
         assert_eq!(batch.num_rows(), 0);
         assert_eq!(batch.num_columns(), 2);
         assert_eq!(base_offset, 0);
@@ -361,7 +499,8 @@ mod tests {
     fn decode_log_batch_empty_with_projection() {
         let table_info = build_two_col_table_info();
         let (batch, base_offset) =
-            decode_log_batch(&table_info, Some(&[1usize]), Vec::new()).expect("decode empty");
+            decode_log_batch(&table_info, Some(&[1usize]), Vec::new(), usize::MAX)
+                .expect("decode empty");
         assert_eq!(batch.num_rows(), 0);
         assert_eq!(batch.num_columns(), 1);
         assert_eq!(batch.schema().field(0).name(), "name");
@@ -374,7 +513,7 @@ mod tests {
         let raw = build_log_records(&table_info, 17, &[(1, "alice"), (2, "bob"), (3, "carol")]);
 
         let (batch, base_offset) =
-            decode_log_batch(&table_info, None, raw).expect("decode populated");
+            decode_log_batch(&table_info, None, raw, usize::MAX).expect("decode populated");
         assert_eq!(batch.num_rows(), 3);
         assert_eq!(batch.num_columns(), 2);
         assert_eq!(base_offset, 17);
@@ -385,51 +524,244 @@ mod tests {
         let table_info = build_two_col_table_info();
         let raw = build_log_records(&table_info, 0, &[(7, "x"), (8, "y")]);
 
-        let (batch, _) =
-            decode_log_batch(&table_info, Some(&[0usize]), raw).expect("decode projected");
+        let (batch, _) = decode_log_batch(&table_info, Some(&[0usize]), raw, usize::MAX)
+            .expect("decode projected");
         assert_eq!(batch.num_rows(), 2);
         assert_eq!(batch.num_columns(), 1);
         assert_eq!(batch.schema().field(0).name(), "id");
     }
 
     #[test]
-    fn decode_kv_batch_empty_returns_empty_record_batch() {
+    fn decode_log_batch_truncates_to_last_limit_rows() {
         let table_info = build_two_col_table_info();
-        let batch = decode_kv_batch(&table_info, None, Vec::new()).expect("decode empty kv");
-        assert_eq!(batch.num_rows(), 0);
-        assert_eq!(batch.num_columns(), 2);
+        // Server returned 4 rows starting at offset 100, but limit is 2.
+        let raw = build_log_records(&table_info, 100, &[(1, "a"), (2, "b"), (3, "c"), (4, "d")]);
+
+        let (batch, base_offset) = decode_log_batch(&table_info, None, raw, 2).expect("decode");
+        assert_eq!(batch.num_rows(), 2);
+        // The last two rows are kept, so the base offset advances by 2.
+        assert_eq!(base_offset, 102);
+        let ids = batch
+            .column(0)
+            .as_any()
+            .downcast_ref::<Int32Array>()
+            .unwrap();
+        assert_eq!(ids.value(0), 3);
+        assert_eq!(ids.value(1), 4);
+    }
+
+    // ---- KV path -----------------------------------------------------------
+
+    fn schema_with_ids(columns: &[(i32, &str, DataType)]) -> Schema {
+        let cols: Vec<Column> = columns
+            .iter()
+            .map(|(id, name, dt)| Column::new(*name, dt.clone()).with_id(*id))
+            .collect();
+        Schema::builder().with_columns(cols).build().unwrap()
+    }
+
+    /// Encode a value-record batch from `(schema_id, compacted-row-bytes)`
+    /// pairs, matching the Java `DefaultValueRecordBatch` wire layout.
+    fn value_batch(records: &[(i16, Vec<u8>)]) -> ValueRecordBatch {
+        let mut body = Vec::new();
+        for (schema_id, row) in records {
+            let rec_len = (SCHEMA_ID_LENGTH + row.len()) as i32;
+            body.extend_from_slice(&rec_len.to_le_bytes());
+            body.extend_from_slice(&schema_id.to_le_bytes());
+            body.extend_from_slice(row);
+        }
+        let mut out = Vec::new();
+        out.extend_from_slice(&((1 + 4 + body.len()) as i32).to_le_bytes()); // Length
+        out.push(0); // Magic
+        out.extend_from_slice(&(records.len() as i32).to_le_bytes()); // RecordCount
+        out.extend_from_slice(&body);
+        ValueRecordBatch::new(Bytes::from(out))
+    }
+
+    fn compacted(field_count: usize, write: impl FnOnce(&mut CompactedRowWriter)) -> Vec<u8> {
+        let mut w = CompactedRowWriter::new(field_count);
+        write(&mut w);
+        w.to_bytes().as_ref().to_vec()
+    }
+
+    fn id_name_schema() -> Schema {
+        schema_with_ids(&[
+            (0, "id", DataTypes::int()),
+            (1, "name", DataTypes::string()),
+        ])
     }
 
     #[test]
-    fn decode_kv_batch_empty_with_projection() {
-        let table_info = build_two_col_table_info();
-        let batch = decode_kv_batch(&table_info, Some(&[0usize]), Vec::new())
-            .expect("decode projected empty kv");
-        assert_eq!(batch.num_rows(), 0);
-        assert_eq!(batch.num_columns(), 1);
-        assert_eq!(batch.schema().field(0).name(), "id");
+    fn value_records_empty_returns_empty_batch() {
+        let schema = id_name_schema();
+        let batch = value_batch(&[]);
+        let ranges = batch.value_ranges().unwrap();
+        let rb = value_records_to_record_batch(
+            &batch,
+            &ranges,
+            &HashMap::new(),
+            schema.row_type(),
+            None,
+            usize::MAX,
+        )
+        .expect("decode empty kv");
+        assert_eq!(rb.num_rows(), 0);
+        assert_eq!(rb.num_columns(), 2);
     }
 
-    #[tokio::test]
-    async fn poll_batch_returns_batch_then_none() {
-        let table_info = build_two_col_table_info();
-        let raw = build_log_records(&table_info, 5, &[(1, "alice"), (2, "bob")]);
-        let (batch, base_offset) = decode_log_batch(&table_info, None, raw).expect("decode");
-
-        let bucket = TableBucket::new(table_info.table_id, 0);
-        let mut scanner = BatchScanner {
-            bucket: bucket.clone(),
-            batch: Some(batch),
-            base_offset,
-        };
+    #[test]
+    fn empty_kv_payload_returns_empty_batch() {
+        let schema = id_name_schema();
+        // Full schema.
+        let rb = empty_record_batch(schema.row_type(), None).expect("empty");
+        assert_eq!(rb.num_rows(), 0);
+        assert_eq!(rb.num_columns(), 2);
+        // Projected.
+        let rb = empty_record_batch(schema.row_type(), Some(&[1usize])).expect("empty projected");
+        assert_eq!(rb.num_rows(), 0);
+        assert_eq!(rb.num_columns(), 1);
+        assert_eq!(rb.schema().field(0).name(), "name");
+    }
 
-        let first = scanner.poll_batch().await.expect("poll").expect("some");
-        assert_eq!(first.bucket(), &bucket);
-        assert_eq!(first.num_records(), 2);
-        assert_eq!(first.base_offset(), 5);
-        assert_eq!(first.last_offset(), 6);
+    #[test]
+    fn value_records_decode_rows() {
+        let schema = id_name_schema();
+        let decoder = FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &schema).unwrap();
+        let mut decoders = HashMap::new();
+        decoders.insert(0i16, decoder);
+
+        let r0 = compacted(2, |w| {
+            w.write_int(1);
+            w.write_string("alice");
+        });
+        let r1 = compacted(2, |w| {
+            w.write_int(2);
+            w.write_string("bob");
+        });
+        let batch = value_batch(&[(0, r0), (0, r1)]);
+        let ranges = batch.value_ranges().unwrap();
+
+        let rb = value_records_to_record_batch(
+            &batch,
+            &ranges,
+            &decoders,
+            schema.row_type(),
+            None,
+            usize::MAX,
+        )
+        .expect("decode kv rows");
+        assert_eq!(rb.num_rows(), 2);
+        let ids = rb.column(0).as_any().downcast_ref::<Int32Array>().unwrap();
+        assert_eq!(ids.value(0), 1);
+        assert_eq!(ids.value(1), 2);
+    }
+
+    #[test]
+    fn value_records_limit_keeps_last_rows() {
+        let schema = id_name_schema();
+        let decoder = FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &schema).unwrap();
+        let mut decoders = HashMap::new();
+        decoders.insert(0i16, decoder);
+
+        let records: Vec<(i16, Vec<u8>)> = (1..=5)
+            .map(|i| {
+                (
+                    0i16,
+                    compacted(2, |w| {
+                        w.write_int(i);
+                        w.write_string("x");
+                    }),
+                )
+            })
+            .collect();
+        let batch = value_batch(&records);
+        let ranges = batch.value_ranges().unwrap();
+
+        let rb =
+            value_records_to_record_batch(&batch, &ranges, &decoders, schema.row_type(), None, 3)
+                .expect("decode kv rows");
+        assert_eq!(rb.num_rows(), 3);
+        let ids = rb.column(0).as_any().downcast_ref::<Int32Array>().unwrap();
+        // Last 3 of [1,2,3,4,5].
+        assert_eq!(ids.values(), &[3, 4, 5]);
+    }
 
-        let second = scanner.poll_batch().await.expect("poll");
-        assert!(second.is_none());
+    #[test]
+    fn value_records_projection_keeps_requested_columns() {
+        let schema = id_name_schema();
+        let decoder = FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &schema).unwrap();
+        let mut decoders = HashMap::new();
+        decoders.insert(0i16, decoder);
+
+        let r0 = compacted(2, |w| {
+            w.write_int(9);
+            w.write_string("nine");
+        });
+        let batch = value_batch(&[(0, r0)]);
+        let ranges = batch.value_ranges().unwrap();
+
+        let rb = value_records_to_record_batch(
+            &batch,
+            &ranges,
+            &decoders,
+            schema.row_type(),
+            Some(&[1usize]),
+            usize::MAX,
+        )
+        .expect("decode projected kv");
+        assert_eq!(rb.num_columns(), 1);
+        assert_eq!(rb.schema().field(0).name(), "name");
+    }
+
+    #[test]
+    fn value_records_decode_across_schema_evolution() {
+        // Source schema (older): [id, name]. Target (current): added `age`.
+        let source = id_name_schema();
+        let target = schema_with_ids(&[
+            (0, "id", DataTypes::int()),
+            (1, "name", DataTypes::string()),
+            (2, "age", DataTypes::bigint()),
+        ]);
+
+        let mut decoders = HashMap::new();
+        // Records with schema id 0 were written under the old schema.
+        decoders.insert(
+            0i16,
+            FixedSchemaDecoder::new(KvFormat::COMPACTED, &source, &target).unwrap(),
+        );
+        // Records with schema id 1 carry the current schema.
+        decoders.insert(
+            1i16,
+            FixedSchemaDecoder::new_no_projection(KvFormat::COMPACTED, &target).unwrap(),
+        );
+
+        let old_row = compacted(2, |w| {
+            w.write_int(1);
+            w.write_string("alice");
+        });
+        let new_row = compacted(3, |w| {
+            w.write_int(2);
+            w.write_string("bob");
+            w.write_long(30);
+        });
+        let batch = value_batch(&[(0, old_row), (1, new_row)]);
+        let ranges = batch.value_ranges().unwrap();
+
+        let rb = value_records_to_record_batch(
+            &batch,
+            &ranges,
+            &decoders,
+            target.row_type(),
+            None,
+            usize::MAX,
+        )
+        .expect("decode mixed-schema kv");
+
+        assert_eq!(rb.num_rows(), 2);
+        assert_eq!(rb.num_columns(), 3);
+        let age = rb.column(2).as_any().downcast_ref::<Int64Array>().unwrap();
+        // Old record has no `age` column -> null; new record carries 30.
+        assert!(age.is_null(0), "old-schema record must read age as null");
+        assert_eq!(age.value(1), 30);
     }
 }
diff --git a/fluss-rust/crates/fluss/src/client/table/mod.rs b/fluss-rust/crates/fluss/src/client/table/mod.rs
index 5ef5d1793c..657a44bfe8 100644
--- a/fluss-rust/crates/fluss/src/client/table/mod.rs
+++ b/fluss-rust/crates/fluss/src/client/table/mod.rs
@@ -36,7 +36,7 @@ mod scanner;
 mod upsert;
 
 pub use append::{AppendWriter, TableAppend};
-pub use batch_scanner::BatchScanner;
+pub use batch_scanner::LimitBatchScanner;
 pub use lookup::{LookupResult, Lookuper, PrefixKeyLookuper, TableLookup, TablePrefixLookup};
 pub use reader::{RecordBatchLogReader, SyncRecordBatchLogReader};
 pub use remote_log::{
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 031975b3e6..35cc52e309 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -15,10 +15,11 @@
 // specific language governing permissions and limitations
 // under the License.
 
+use crate::client::ClientSchemaGetter;
 use crate::client::connection::FlussConnection;
-use crate::client::table::batch_scanner::BatchScanner;
 use crate::client::credentials::SecurityTokenManager;
 use crate::client::metadata::Metadata;
+use crate::client::table::batch_scanner::LimitBatchScanner;
 use crate::client::table::log_fetch_buffer::{
     CompletedFetch, DefaultCompletedFetch, FetchErrorAction, FetchErrorContext, FetchErrorLogLevel,
     LogFetchBuffer, RemotePendingFetch,
@@ -27,7 +28,9 @@ use crate::client::table::remote_log::{RemoteLogDownloader, RemoteLogFetchInfo};
 use crate::config::Config;
 use crate::error::Error::UnsupportedOperation;
 use crate::error::{ApiError, Error, FlussError, Result};
-use crate::metadata::{LogFormat, PhysicalTablePath, RowType, TableBucket, TableInfo, TablePath};
+use crate::metadata::{
+    LogFormat, PhysicalTablePath, RowType, SchemaInfo, TableBucket, TableInfo, TablePath,
+};
 use crate::metrics::ScannerMetrics;
 use crate::proto::{
     ErrorResponse, FetchLogRequest, FetchLogResponse, PbFetchLogReqForBucket, PbFetchLogReqForTable,
@@ -71,10 +74,10 @@ impl<'a> TableScan<'a> {
         }
     }
 
-    /// Sets a row limit for the scan, enabling [`Self::create_batch_scanner`].
+    /// Sets a row limit for the scan, enabling [`Self::create_bucket_batch_scanner`].
     ///
-    /// The limit must be positive. Callers configure a limit prior to
-    /// constructing a `BatchScanner` for a one-shot bounded read.
+    /// The limit must be positive. A limit is incompatible with the log
+    /// scanners, which reject it.
     pub fn limit(mut self, n: i32) -> Result<Self> {
         if n <= 0 {
             return Err(Error::IllegalArgument {
@@ -85,17 +88,31 @@ impl<'a> TableScan<'a> {
         Ok(self)
     }
 
-    /// Creates a `BatchScanner` that performs a single bounded scan of `table_bucket`.
+    /// Guard for the log scanners, which cannot push a row limit down to the
+    /// server: a configured limit is an error rather than being dropped quietly.
+    fn reject_limit(&self, scanner: &str) -> Result<()> {
+        match self.limit {
+            None => Ok(()),
+            Some(limit) => Err(Error::UnsupportedOperation {
+                message: format!(
+                    "{scanner} doesn't support limit pushdown. Table: {}, requested limit: {limit}",
+                    self.table_info.table_path
+                ),
+            }),
+        }
+    }
+
+    /// Creates a one-shot bounded scan of `table_bucket`.
     ///
-    /// Requires a previously-configured limit via [`Self::limit`]. The scanner sends
-    /// a `LimitScanRequest` eagerly and exposes the resulting batch through
-    /// [`BatchScanner::poll_batch`].
-    pub async fn create_batch_scanner(
+    /// Requires a previously-configured limit via [`Self::limit`]. Creation is
+    /// cheap; the `LimitScanRequest` runs on the first
+    /// [`LimitBatchScanner::next_batch`].
+    pub fn create_bucket_batch_scanner(
         self,
         table_bucket: TableBucket,
-    ) -> Result<BatchScanner> {
+    ) -> Result<LimitBatchScanner> {
         let limit = self.limit.ok_or_else(|| Error::IllegalArgument {
-            message: "create_batch_scanner requires a limit configured via .limit(n)"
+            message: "create_bucket_batch_scanner requires a limit configured via .limit(n)"
                 .to_string(),
         })?;
         if table_bucket.table_id() != self.table_info.table_id {
@@ -107,15 +124,40 @@ impl<'a> TableScan<'a> {
                 ),
             });
         }
-        BatchScanner::new(
+        let num_buckets = self.table_info.get_num_buckets();
+        if table_bucket.bucket_id() < 0 || table_bucket.bucket_id() >= num_buckets {
+            return Err(Error::IllegalArgument {
+                message: format!(
+                    "Bucket id {} out of range for table with {num_buckets} buckets",
+                    table_bucket.bucket_id()
+                ),
+            });
+        }
+        // Log tables decode as Arrow IPC, so only ARROW format is supported (KV
+        // tables use the value-record path and are exempt).
+        if !self.table_info.has_primary_key() {
+            validate_scan_support(&self.table_info.table_path, &self.table_info)?;
+        }
+        // Pre-seed the current schema; older versions are fetched lazily during
+        // KV decode. Mirrors `Table::new_lookup`.
+        let latest = SchemaInfo::new(
+            self.table_info.get_schema().clone(),
+            self.table_info.get_schema_id(),
+        );
+        let schema_getter = Arc::new(ClientSchemaGetter::new(
+            self.table_info.table_path.clone(),
+            self.conn.get_admin()?,
+            latest,
+        ));
+        Ok(LimitBatchScanner::new(
             self.conn.get_connections(),
             self.metadata.clone(),
             self.table_info,
+            schema_getter,
             self.projected_fields,
             table_bucket,
             limit,
-        )
-        .await
+        ))
     }
 
     /// Projects the scan to only include specified columns by their indices.
@@ -270,6 +312,7 @@ impl<'a> TableScan<'a> {
     }
 
     pub fn create_log_scanner(self) -> Result<LogScanner> {
+        self.reject_limit("LogScanner")?;
         validate_scan_support(&self.table_info.table_path, &self.table_info)?;
         let inner = LogScannerInner::new(
             &self.table_info,
@@ -284,6 +327,7 @@ impl<'a> TableScan<'a> {
     }
 
     pub fn create_record_batch_log_scanner(self) -> Result<RecordBatchLogScanner> {
+        self.reject_limit("RecordBatchLogScanner")?;
         validate_scan_support(&self.table_info.table_path, &self.table_info)?;
         let inner = LogScannerInner::new(
             &self.table_info,
diff --git a/fluss-rust/crates/fluss/src/record/kv/mod.rs b/fluss-rust/crates/fluss/src/record/kv/mod.rs
index 857c5e5fc9..8f7750a80a 100644
--- a/fluss-rust/crates/fluss/src/record/kv/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/mod.rs
@@ -22,6 +22,7 @@ mod kv_record_batch;
 mod kv_record_batch_builder;
 mod kv_record_read_context;
 mod read_context;
+mod value_record_batch;
 
 #[cfg(test)]
 mod test_util;
@@ -31,6 +32,7 @@ pub use kv_record_batch::*;
 pub use kv_record_batch_builder::*;
 pub use kv_record_read_context::{KvRecordReadContext, SchemaGetter};
 pub use read_context::ReadContext;
+pub use value_record_batch::ValueRecordBatch;
 
 /// Current KV magic value
 pub const CURRENT_KV_MAGIC_VALUE: u8 = 0;
diff --git a/fluss-rust/crates/fluss/src/record/kv/value_record_batch.rs b/fluss-rust/crates/fluss/src/record/kv/value_record_batch.rs
new file mode 100644
index 0000000000..cfcb4a6d61
--- /dev/null
+++ b/fluss-rust/crates/fluss/src/record/kv/value_record_batch.rs
@@ -0,0 +1,188 @@
+// Licensed to the Apache Software Foundation (ASF) under one
+// or more contributor license agreements.  See the NOTICE file
+// distributed with this work for additional information
+// regarding copyright ownership.  The ASF licenses this file
+// to you under the Apache License, Version 2.0 (the
+// "License"); you may not use this file except in compliance
+// with the License.  You may obtain a copy of the License at
+//
+//   http://www.apache.org/licenses/LICENSE-2.0
+//
+// Unless required by applicable law or agreed to in writing,
+// software distributed under the License is distributed on an
+// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+// KIND, either express or implied.  See the License for the
+// specific language governing permissions and limitations
+// under the License.
+
+//! Reader for the value-record batch returned by a KV (primary-key) limit
+//! scan. This is a distinct wire format from [`super::KvRecordBatch`]: it
+//! carries value-only records (no keys, no CRC/writer-id header) and a schema
+//! id *per record* rather than per batch.
+//!
+//! Batch layout (little-endian):
+//! - Length      => Int32  (size of everything after this field)
+//! - Magic       => Int8
+//! - RecordCount => Int32
+//! - Records     => [ValueRecord]
+//!
+//! Each `ValueRecord`:
+//! - Length   => Int32  (size after this field: SchemaId + Value)
+//! - SchemaId => Int16
+//! - Value    => row bytes
+//!
+//! Reference: `org.apache.fluss.record.DefaultValueRecordBatch` and
+//! `org.apache.fluss.record.DefaultValueRecord`.
+
+use crate::error::{Error, Result};
+use byteorder::{ByteOrder, LittleEndian};
+use bytes::Bytes;
+use std::ops::Range;
+
+const LENGTH_LENGTH: usize = 4;
+const MAGIC_LENGTH: usize = 1;
+const RECORD_COUNT_LENGTH: usize = 4;
+/// Offset of the record count within the batch header.
+const RECORD_COUNT_OFFSET: usize = LENGTH_LENGTH + MAGIC_LENGTH;
+/// Size of the batch header (`Length + Magic + RecordCount`).
+const RECORD_BATCH_HEADER_SIZE: usize = LENGTH_LENGTH + MAGIC_LENGTH + RECORD_COUNT_LENGTH;
+/// Size of a `ValueRecord`'s leading length field.
+const RECORD_LENGTH_LENGTH: usize = 4;
+
+/// Read-only view over a serialized value-record batch.
+pub struct ValueRecordBatch {
+    data: Bytes,
+}
+
+impl ValueRecordBatch {
+    /// Wraps raw batch bytes (expected to start at offset 0); nothing is validated here.
+    pub fn new(data: Bytes) -> Self {
+        Self { data }
+    }
+
+    /// Number of records declared in the batch header; errors if the header is incomplete.
+    pub fn record_count(&self) -> Result<i32> {
+        if self.data.len() < RECORD_BATCH_HEADER_SIZE {
+            return Err(corrupt(format!(
+                "value-record batch too short: {} bytes, need {} for header",
+                self.data.len(),
+                RECORD_BATCH_HEADER_SIZE
+            )));
+        }
+        Ok(LittleEndian::read_i32(
+            &self.data[RECORD_COUNT_OFFSET..RECORD_COUNT_OFFSET + RECORD_COUNT_LENGTH],
+        ))
+    }
+
+    /// Byte range of each record's `[SchemaId | Value]` payload (what
+    /// [`crate::row::FixedSchemaDecoder::decode`] takes); slice [`Self::data`] with
+    /// one to read it without copying. Errors if the batch is truncated or malformed.
+    pub fn value_ranges(&self) -> Result<Vec<Range<usize>>> {
+        let declared = self.record_count()?;
+        let count = usize::try_from(declared)
+            .map_err(|_| corrupt(format!("invalid record count {declared}")))?;
+        // `count` is untrusted wire data: never pre-allocate more than the bytes can hold.
+        let mut ranges = Vec::with_capacity(count.min(self.data.len() / RECORD_LENGTH_LENGTH));
+        let mut pos = RECORD_BATCH_HEADER_SIZE;
+        for i in 0..count {
+            if pos + RECORD_LENGTH_LENGTH > self.data.len() {
+                return Err(corrupt(format!(
+                    "truncated value-record batch: record {i} length field runs past end"
+                )));
+            }
+            let rec_len = LittleEndian::read_i32(&self.data[pos..pos + RECORD_LENGTH_LENGTH]);
+            if rec_len < 0 {
+                return Err(corrupt(format!("record {i} has negative length {rec_len}")));
+            }
+            let start = pos + RECORD_LENGTH_LENGTH;
+            let end = start + rec_len as usize;
+            if end > self.data.len() {
+                return Err(corrupt(format!(
+                    "truncated value-record batch: record {i} payload runs past end"
+                )));
+            }
+            ranges.push(start..end);
+            pos = end;
+        }
+        Ok(ranges)
+    }
+
+    /// The underlying batch bytes, header included.
+    pub fn data(&self) -> &Bytes {
+        &self.data
+    }
+}
+
+/// Builds the error reported for a malformed or truncated value-record batch.
+fn corrupt(message: String) -> Error {
+    // No underlying cause is attached; only the message is carried.
+    let source = None;
+    Error::UnexpectedError { message, source }
+}
+
+#[cfg(test)]
+mod tests {
+    use super::*;
+    use crate::record::kv::SCHEMA_ID_LENGTH;
+
+    /// Build a value-record batch from `(schema_id, row_bytes)` pairs, mirroring
+    /// the Java `DefaultValueRecordBatch.Builder` wire layout.
+    fn build_batch(records: &[(i16, &[u8])]) -> Vec<u8> {
+        let mut body = Vec::new();
+        for (schema_id, row) in records {
+            let rec_len = (SCHEMA_ID_LENGTH + row.len()) as i32;
+            body.extend_from_slice(&rec_len.to_le_bytes());
+            body.extend_from_slice(&schema_id.to_le_bytes());
+            body.extend_from_slice(row);
+        }
+        let mut out = Vec::new();
+        // Length covers Magic + RecordCount + body.
+        let length = (MAGIC_LENGTH + RECORD_COUNT_LENGTH + body.len()) as i32;
+        out.extend_from_slice(&length.to_le_bytes());
+        out.push(0); // magic
+        out.extend_from_slice(&(records.len() as i32).to_le_bytes());
+        out.extend_from_slice(&body);
+        out
+    }
+
+    #[test]
+    fn parses_record_count_and_ranges() {
+        let raw = build_batch(&[(7, &[1, 2, 3]), (7, &[4, 5])]);
+        let batch = ValueRecordBatch::new(Bytes::from(raw));
+        assert_eq!(batch.record_count().unwrap(), 2);
+
+        let ranges = batch.value_ranges().unwrap();
+        assert_eq!(ranges.len(), 2);
+        // First record payload = [schema_id(2) | row(3)] = 5 bytes.
+        let r0 = &batch.data()[ranges[0].clone()];
+        assert_eq!(r0.len(), 5);
+        assert_eq!(LittleEndian::read_i16(&r0[..2]), 7);
+        assert_eq!(&r0[2..], &[1, 2, 3]);
+        // Second record payload = [schema_id(2) | row(2)] = 4 bytes.
+        let r1 = &batch.data()[ranges[1].clone()];
+        assert_eq!(r1.len(), 4);
+        assert_eq!(&r1[2..], &[4, 5]);
+    }
+
+    #[test]
+    fn empty_batch_has_no_ranges() {
+        let raw = build_batch(&[]);
+        let batch = ValueRecordBatch::new(Bytes::from(raw));
+        assert_eq!(batch.record_count().unwrap(), 0);
+        assert!(batch.value_ranges().unwrap().is_empty());
+    }
+
+    #[test]
+    fn truncated_payload_errors() {
+        let mut raw = build_batch(&[(7, &[1, 2, 3])]);
+        raw.truncate(raw.len() - 2); // chop into the row payload
+        let batch = ValueRecordBatch::new(Bytes::from(raw));
+        assert!(batch.value_ranges().is_err());
+    }
+
+    #[test]
+    fn short_header_errors() {
+        let batch = ValueRecordBatch::new(Bytes::from(vec![0u8, 1, 2]));
+        assert!(batch.record_count().is_err());
+    }
+}
diff --git a/fluss-rust/crates/fluss/tests/integration/batch_scanner.rs b/fluss-rust/crates/fluss/tests/integration/batch_scanner.rs
index 2623528176..0b484a8c66 100644
--- a/fluss-rust/crates/fluss/tests/integration/batch_scanner.rs
+++ b/fluss-rust/crates/fluss/tests/integration/batch_scanner.rs
@@ -19,12 +19,13 @@
 #[cfg(test)]
 mod batch_scanner_test {
     use crate::integration::utils::{create_table, get_shared_cluster};
-    use arrow::array::record_batch;
-    use fluss::metadata::{DataTypes, Schema, TableBucket, TableDescriptor, TablePath};
-    use std::time::Duration;
+    use arrow::array::{Int32Array, StringArray, record_batch};
+    use fluss::metadata::{DataTypes, LogFormat, Schema, TableBucket, TableDescriptor, TablePath};
+    use fluss::row::GenericRow;
+    use std::collections::HashMap;
 
-    /// End-to-end check that BatchScanner returns the appended rows on first
-    /// poll and `None` on the next, honoring the configured limit.
+    /// End-to-end check that the scanner yields the appended rows once and then
+    /// `None`, honoring the configured limit.
     #[tokio::test]
     async fn batch_scanner_returns_appended_rows_then_none() {
         let cluster = get_shared_cluster();
@@ -61,22 +62,18 @@ mod batch_scanner_test {
         writer.append_arrow_batch(batch).expect("append batch");
         writer.flush().await.expect("flush");
 
-        // Give the server a moment to commit and make the records readable.
-        tokio::time::sleep(Duration::from_secs(1)).await;
-
         let table_info = table.get_table_info();
         let bucket = TableBucket::new(table_info.table_id, 0);
 
-        let mut batch_scanner = table
+        let mut scanner = table
             .new_scan()
             .limit(3)
             .expect("limit")
-            .create_batch_scanner(bucket.clone())
-            .await
+            .create_bucket_batch_scanner(bucket.clone())
             .expect("create batch scanner");
 
-        let first = batch_scanner
-            .poll_batch()
+        let first = scanner
+            .next_batch()
             .await
             .expect("poll")
             .expect("first batch should be Some");
@@ -90,17 +87,109 @@ mod batch_scanner_test {
             first.num_records()
         );
 
-        let second = batch_scanner
-            .poll_batch()
+        assert!(
+            scanner.next_batch().await.expect("poll").is_none(),
+            "scanner must end after one batch"
+        );
+    }
+
+    /// Limit scan on a primary-key table: decodes the value-record batch and
+    /// honors the limit. Exercises the KV wire path (distinct from the log one).
+    #[tokio::test]
+    async fn batch_scanner_reads_primary_key_table() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("admin");
+
+        let table_path = TablePath::new("fluss", "test_batch_scanner_pk");
+        let descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("id", DataTypes::int())
+                    .column("name", DataTypes::string())
+                    .primary_key(vec!["id"])
+                    .build()
+                    .expect("schema"),
+            )
+            // Single bucket so one LimitBatchScanner sees every row.
+            .distributed_by(Some(1), vec!["id".to_string()])
+            .build()
+            .expect("descriptor");
+        create_table(&admin, &table_path, &descriptor).await;
+
+        let table = connection.get_table(&table_path).await.expect("table");
+        let writer = table
+            .new_upsert()
+            .expect("upsert")
+            .create_writer()
+            .expect("writer");
+
+        let expected: HashMap<i32, &str> =
+            [(1, "a"), (2, "b"), (3, "c"), (4, "d"), (5, "e")].into();
+        for (id, name) in &expected {
+            let mut row = GenericRow::new(2);
+            row.set_field(0, *id);
+            row.set_field(1, *name);
+            writer.upsert(&row).expect("upsert row");
+        }
+        writer.flush().await.expect("flush");
+
+        let table_info = table.get_table_info();
+        let bucket = TableBucket::new(table_info.table_id, 0);
+
+        let mut scanner = table
+            .new_scan()
+            .limit(3)
+            .expect("limit")
+            .create_bucket_batch_scanner(bucket.clone())
+            .expect("create batch scanner");
+
+        let first = scanner
+            .next_batch()
             .await
-            .expect("second poll succeeds");
-        assert!(second.is_none(), "second poll must return None");
+            .expect("poll")
+            .expect("first batch should be Some");
+
+        assert_eq!(first.bucket(), &bucket);
+        let rows = first.batch();
+        assert_eq!(rows.num_columns(), 2, "id + name");
+        assert!(
+            rows.num_rows() > 0 && rows.num_rows() <= 3,
+            "expected 1..=3 records, got {}",
+            rows.num_rows()
+        );
+
+        // Every returned (id, name) must match what we upserted.
+        let ids = rows
+            .column(0)
+            .as_any()
+            .downcast_ref::<Int32Array>()
+            .expect("id column Int32");
+        let names = rows
+            .column(1)
+            .as_any()
+            .downcast_ref::<StringArray>()
+            .expect("name column Utf8");
+        for i in 0..rows.num_rows() {
+            let id = ids.value(i);
+            let name = names.value(i);
+            assert_eq!(
+                expected.get(&id),
+                Some(&name),
+                "decoded row ({id}, {name}) does not match upserted data"
+            );
+        }
+
+        assert!(
+            scanner.next_batch().await.expect("poll").is_none(),
+            "scanner must end after one batch"
+        );
     }
 
-    /// A bucket id outside the table's bucket range should be rejected by the
-    /// scanner before any RPC is made.
+    /// A bucket with the wrong table_id or an out-of-range bucket_id must be
+    /// rejected before any RPC is made.
     #[tokio::test]
-    async fn batch_scanner_requires_matching_table_id() {
+    async fn batch_scanner_rejects_invalid_bucket() {
         let cluster = get_shared_cluster();
         let connection = cluster.get_fluss_connection().await;
         let admin = connection.get_admin().expect("admin");
@@ -119,19 +208,64 @@ mod batch_scanner_test {
         create_table(&admin, &table_path, &descriptor).await;
 
         let table = connection.get_table(&table_path).await.expect("table");
+        let table_id = table.get_table_info().table_id;
+
+        // Wrong table_id.
+        assert!(
+            table
+                .new_scan()
+                .limit(1)
+                .expect("limit")
+                .create_bucket_batch_scanner(TableBucket::new(table_id + 9999, 0))
+                .is_err(),
+            "must reject mismatched table_id"
+        );
 
-        // Bucket with a wrong table_id — must fail without hitting the server.
-        let bogus_bucket = TableBucket::new(table.get_table_info().table_id + 9999, 0);
+        // Bucket id past the single bucket of this table.
+        assert!(
+            table
+                .new_scan()
+                .limit(1)
+                .expect("limit")
+                .create_bucket_batch_scanner(TableBucket::new(table_id, 99))
+                .is_err(),
+            "must reject out-of-range bucket_id"
+        );
+    }
+
+    /// A limit scan over a non-ARROW log table must be rejected (the log path
+    /// decodes Arrow IPC).
+    #[tokio::test]
+    async fn batch_scanner_rejects_non_arrow_log_format() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("admin");
+
+        let table_path = TablePath::new("fluss", "test_batch_scanner_indexed");
+        let descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("c1", DataTypes::int())
+                    .build()
+                    .expect("schema"),
+            )
+            .log_format(LogFormat::INDEXED)
+            .distributed_by(Some(1), vec!["c1".to_string()])
+            .build()
+            .expect("descriptor");
+        create_table(&admin, &table_path, &descriptor).await;
+
+        let table = connection.get_table(&table_path).await.expect("table");
+        let bucket = TableBucket::new(table.get_table_info().table_id, 0);
 
-        let result = table
-            .new_scan()
-            .limit(1)
-            .expect("limit")
-            .create_batch_scanner(bogus_bucket)
-            .await;
         assert!(
-            result.is_err(),
-            "batch scanner must reject mismatched table_id"
+            table
+                .new_scan()
+                .limit(1)
+                .expect("limit")
+                .create_bucket_batch_scanner(bucket)
+                .is_err(),
+            "must reject INDEXED log format"
         );
     }
 
@@ -159,4 +293,46 @@ mod batch_scanner_test {
         assert!(table.new_scan().limit(0).is_err());
         assert!(table.new_scan().limit(-5).is_err());
     }
+
+    /// A configured limit must be rejected by the log scanners rather than
+    /// silently ignored.
+    #[tokio::test]
+    async fn limit_is_rejected_by_log_scanners() {
+        let cluster = get_shared_cluster();
+        let connection = cluster.get_fluss_connection().await;
+        let admin = connection.get_admin().expect("admin");
+
+        let table_path = TablePath::new("fluss", "test_batch_scanner_limit_logscan");
+        let descriptor = TableDescriptor::builder()
+            .schema(
+                Schema::builder()
+                    .column("c1", DataTypes::int())
+                    .build()
+                    .expect("schema"),
+            )
+            .distributed_by(Some(1), vec!["c1".to_string()])
+            .build()
+            .expect("descriptor");
+        create_table(&admin, &table_path, &descriptor).await;
+
+        let table = connection.get_table(&table_path).await.expect("table");
+        assert!(
+            table
+                .new_scan()
+                .limit(5)
+                .expect("limit")
+                .create_log_scanner()
+                .is_err(),
+            "create_log_scanner must reject a configured limit"
+        );
+        assert!(
+            table
+                .new_scan()
+                .limit(5)
+                .expect("limit")
+                .create_record_batch_log_scanner()
+                .is_err(),
+            "create_record_batch_log_scanner must reject a configured limit"
+        );
+    }
 }
diff --git a/fluss-rust/crates/fluss/tests/integration/log_table.rs b/fluss-rust/crates/fluss/tests/integration/log_table.rs
index e2377e1ddc..f8323df7c2 100644
--- a/fluss-rust/crates/fluss/tests/integration/log_table.rs
+++ b/fluss-rust/crates/fluss/tests/integration/log_table.rs
@@ -217,8 +217,6 @@ mod table_test {
         // Flush to ensure all writes are acknowledged
         append_writer.flush().await.expect("Failed to flush");
 
-        tokio::time::sleep(tokio::time::Duration::from_secs(1)).await;
-
         // Test latest offset after appending (should be 3)
         let latest_offsets_after = admin
             .list_offsets(&table_path, &[0], OffsetSpec::Latest)
diff --git a/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs b/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs
index cf89c065b9..6c8d5392c1 100644
--- a/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs
+++ b/fluss-rust/crates/fluss/tests/integration/record_batch_log_reader.rs
@@ -21,7 +21,7 @@
 mod reader_test {
     use crate::integration::utils::{
         create_partitions, create_table, extract_ids_from_batches, get_shared_cluster,
-        wait_for_partitions_ready, wait_for_table_buckets_ready, wait_for_table_ready,
+        wait_for_partitions_ready,
     };
     use arrow::array::record_batch;
     use fluss::client::{EARLIEST_OFFSET, FlussConnection, RecordBatchLogReader};
@@ -49,7 +49,6 @@ mod reader_test {
             .build()
             .expect("Failed to build table");
         create_table(&admin, &table_path, &table_descriptor).await;
-        wait_for_table_ready(&admin, &table_path).await;
 
         let table = connection
             .get_table(&table_path)
@@ -122,7 +121,6 @@ mod reader_test {
             .build()
             .expect("Failed to build table");
         create_table(&admin, &table_path, &table_descriptor).await;
-        wait_for_table_ready(&admin, &table_path).await;
 
         let table = connection
             .get_table(&table_path)
@@ -190,7 +188,6 @@ mod reader_test {
             .build()
             .expect("Failed to build table");
         create_table(&admin, &table_path, &table_descriptor).await;
-        wait_for_table_ready(&admin, &table_path).await;
 
         let table = connection
             .get_table(&table_path)
@@ -285,7 +282,6 @@ mod reader_test {
             .build()
             .expect("Failed to build table");
         create_table(&admin, &table_path, &table_descriptor).await;
-        wait_for_table_buckets_ready(&admin, &table_path, &[0, 1]).await;
 
         let table = connection
             .get_table(&table_path)
@@ -381,7 +377,6 @@ mod reader_test {
             .expect("Failed to build table");
 
         create_table(&admin, &table_path, &table_descriptor).await;
-        wait_for_table_ready(&admin, &table_path).await;
 
         let table = connection
             .get_table(&table_path)
diff --git a/fluss-rust/website/docs/user-guide/rust/api-reference.md b/fluss-rust/website/docs/user-guide/rust/api-reference.md
index 5d98303083..bb2ec3e8f1 100644
--- a/fluss-rust/website/docs/user-guide/rust/api-reference.md
+++ b/fluss-rust/website/docs/user-guide/rust/api-reference.md
@@ -134,8 +134,10 @@ Complete API reference for the Fluss Rust client.
 |-----------------------------------------------------------------------------|-----------------------------------------|
 | `fn project(self, indices: &[usize]) -> Result<Self>`                       | Project columns by index                |
 | `fn project_by_name(self, names: &[&str]) -> Result<Self>`                  | Project columns by name                 |
+| `fn limit(self, n: i32) -> Result<Self>`                                    | Set a row limit (enables `create_bucket_batch_scanner`; rejected by log scanners) |
 | `fn create_log_scanner(self) -> Result<LogScanner>`                         | Create a record-based log scanner       |
 | `fn create_record_batch_log_scanner(self) -> Result<RecordBatchLogScanner>` | Create an Arrow batch-based log scanner |
+| `fn create_bucket_batch_scanner(self, bucket: TableBucket) -> Result<LimitBatchScanner>` | Bounded scan of one bucket (requires `limit`; runs on first `next_batch`) |
 
 ## `LogScanner`
 
@@ -211,6 +213,19 @@ bucket identity per batch, use `next_batch` instead.
 | `fn next(&mut self) -> Option<Result<RecordBatch, ArrowError>>` | Iterator: next batch, or `None` when caught up   |
 | `fn schema(&self) -> SchemaRef`                                 | Arrow schema for produced batches                |
 
+## `LimitBatchScanner`
+
+One-shot bounded scanner from `TableScan::limit(n).create_bucket_batch_scanner(bucket)`.
+Poll it with `next_batch` until it returns `None` (mirrors `RecordBatchLogReader`).
+Supports both log and primary-key tables (the latter returns the current,
+server-deduplicated state); yields a single batch of at most `n` rows.
+
+| Method                                                        | Description                          |
+|---------------------------------------------------------------|--------------------------------------|
+| `async fn next_batch(&mut self) -> Result<Option<ScanBatch>>` | Rows on the first call, `None` after |
+| `async fn collect_all_batches(&mut self) -> Result<Vec<ScanBatch>>` | Drain the scanner and return all batches as a `Vec` |
+| `fn bucket(&self) -> &TableBucket`                            | The scanned bucket                   |
+
 ## `ScanRecord`
 
 | Method                                 | Description                            |
diff --git a/fluss-rust/website/docs/user-guide/rust/example/log-tables.md b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
index 0485779699..e77c8c6c43 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/log-tables.md
@@ -153,3 +153,20 @@ let scanner = table.new_scan()
     .project_by_name(&["event_id", "timestamp"])?
     .create_log_scanner()?;
 ```
+
+## Limit Scan
+
+For a bounded read of up to `n` rows from a single bucket, use a batch scanner
+instead of subscribing. It issues one request; poll it with `next_batch` until
+it returns `None`.
+
+```rust
+let bucket = TableBucket::new(table.get_table_info().table_id, 0);
+let mut scanner = table.new_scan().limit(10)?.create_bucket_batch_scanner(bucket)?;
+
+while let Some(batch) = scanner.next_batch().await? {
+    println!("rows: {}", batch.batch().num_rows());
+}
+```
+
+Limit applies per bucket; scan each bucket to cover a multi-bucket table.
diff --git a/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
index 82a07c4cba..01836e29e4 100644
--- a/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
+++ b/fluss-rust/website/docs/user-guide/rust/example/primary-key-tables.md
@@ -124,3 +124,18 @@ println!("Rows: {}", batch.num_rows());
 ## Prefix Lookup
 
 To fetch all rows sharing a common primary-key prefix (by choosing a bucket key that's a strict prefix of the primary key), see [Prefix Lookup](./prefix-lookup.md).
+
+## Limit Scan
+
+To read up to `n` rows of a bucket's current state without supplying keys, use a batch scanner. The server returns the deduplicated current rows as Arrow batches, which is convenient for previews or DataFusion sources.
+
+```rust
+let bucket = TableBucket::new(table.get_table_info().table_id, 0);
+let mut scanner = table.new_scan().limit(10)?.create_bucket_batch_scanner(bucket)?;
+
+while let Some(batch) = scanner.next_batch().await? {
+    println!("rows: {}", batch.batch().num_rows());
+}
+```
+
+Limit applies per bucket; scan each bucket to cover a multi-bucket table.

From 52ac57ab76a186b5742e5c72b2208f41a8125cdb Mon Sep 17 00:00:00 2001
From: Nicoleta Lazar <nicoleta.lazar@fresha.com>
Date: Thu, 28 May 2026 17:38:56 +0100
Subject: [PATCH 284/287] [elixir] feat: Extend Fluss.Config with scanner
 tuning options (#574)

* feat(elixir): Extend NifConfig with scanner tuning fields

This commit adds 8 more scanner-tuning fields to NifConfig, covering the
remote log prefetch, download concurrency, max poll records and fetch
size/time limits.

* feat(elixir): Expose scanner tuning options on Fluss.Config

This commit adds 8 scanner-tuning fields to Fluss.Config with
corresponding set_* setters: remote prefetch count, remote log read
concurrency, file download thread count, max poll records and fetch
size/time bounds.
---
 .../bindings/elixir/lib/fluss/config.ex       | 54 ++++++++++++++++
 .../elixir/native/fluss_nif/src/config.rs     | 32 ++++++++++
 .../bindings/elixir/test/config_test.exs      | 64 +++++++++++++++++++
 3 files changed, 150 insertions(+)

diff --git a/fluss-rust/bindings/elixir/lib/fluss/config.ex b/fluss-rust/bindings/elixir/lib/fluss/config.ex
index d02a428ff3..07324df091 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/config.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/config.ex
@@ -33,6 +33,14 @@ defmodule Fluss.Config do
 
   @enforce_keys [:bootstrap_servers]
   defstruct bootstrap_servers: nil,
+            remote_file_download_thread_num: nil,
+            scanner_log_fetch_max_bytes: nil,
+            scanner_log_fetch_max_bytes_for_bucket: nil,
+            scanner_log_fetch_min_bytes: nil,
+            scanner_log_fetch_wait_max_time_ms: nil,
+            scanner_log_max_poll_records: nil,
+            scanner_remote_log_prefetch_num: nil,
+            scanner_remote_log_read_concurrency: nil,
             writer_acks: nil,
             writer_batch_size: nil,
             writer_batch_timeout_ms: nil,
@@ -48,6 +56,14 @@ defmodule Fluss.Config do
 
   @type t :: %__MODULE__{
           bootstrap_servers: String.t(),
+          remote_file_download_thread_num: non_neg_integer() | nil,
+          scanner_log_fetch_max_bytes: non_neg_integer() | nil,
+          scanner_log_fetch_max_bytes_for_bucket: non_neg_integer() | nil,
+          scanner_log_fetch_min_bytes: non_neg_integer() | nil,
+          scanner_log_fetch_wait_max_time_ms: non_neg_integer() | nil,
+          scanner_log_max_poll_records: non_neg_integer() | nil,
+          scanner_remote_log_prefetch_num: non_neg_integer() | nil,
+          scanner_remote_log_read_concurrency: non_neg_integer() | nil,
           writer_acks: String.t() | nil,
           writer_batch_size: non_neg_integer() | nil,
           writer_batch_timeout_ms: non_neg_integer() | nil,
@@ -74,6 +90,44 @@ defmodule Fluss.Config do
   def set_bootstrap_servers(%__MODULE__{} = config, servers) when is_binary(servers),
     do: %{config | bootstrap_servers: servers}
 
+  @spec set_remote_file_download_thread_num(t(), non_neg_integer()) :: t()
+  def set_remote_file_download_thread_num(%__MODULE__{} = config, threads)
+      when is_integer(threads),
+      do: %{config | remote_file_download_thread_num: threads}
+
+  @spec set_scanner_log_fetch_max_bytes(t(), non_neg_integer()) :: t()
+  def set_scanner_log_fetch_max_bytes(%__MODULE__{} = config, max_bytes)
+      when is_integer(max_bytes),
+      do: %{config | scanner_log_fetch_max_bytes: max_bytes}
+
+  @spec set_scanner_log_fetch_max_bytes_for_bucket(t(), non_neg_integer()) :: t()
+  def set_scanner_log_fetch_max_bytes_for_bucket(%__MODULE__{} = config, max_bytes)
+      when is_integer(max_bytes),
+      do: %{config | scanner_log_fetch_max_bytes_for_bucket: max_bytes}
+
+  @spec set_scanner_log_fetch_min_bytes(t(), non_neg_integer()) :: t()
+  def set_scanner_log_fetch_min_bytes(%__MODULE__{} = config, min_bytes)
+      when is_integer(min_bytes),
+      do: %{config | scanner_log_fetch_min_bytes: min_bytes}
+
+  @spec set_scanner_log_fetch_wait_max_time_ms(t(), non_neg_integer()) :: t()
+  def set_scanner_log_fetch_wait_max_time_ms(%__MODULE__{} = config, wait_ms)
+      when is_integer(wait_ms),
+      do: %{config | scanner_log_fetch_wait_max_time_ms: wait_ms}
+
+  @spec set_scanner_log_max_poll_records(t(), non_neg_integer()) :: t()
+  def set_scanner_log_max_poll_records(%__MODULE__{} = config, num) when is_integer(num),
+    do: %{config | scanner_log_max_poll_records: num}
+
+  @spec set_scanner_remote_log_prefetch_num(t(), non_neg_integer()) :: t()
+  def set_scanner_remote_log_prefetch_num(%__MODULE__{} = config, num) when is_integer(num),
+    do: %{config | scanner_remote_log_prefetch_num: num}
+
+  @spec set_scanner_remote_log_read_concurrency(t(), non_neg_integer()) :: t()
+  def set_scanner_remote_log_read_concurrency(%__MODULE__{} = config, concurrency)
+      when is_integer(concurrency),
+      do: %{config | scanner_remote_log_read_concurrency: concurrency}
+
   @spec set_writer_acks(t(), String.t()) :: t()
   def set_writer_acks(%__MODULE__{} = config, acks) when is_binary(acks),
     do: %{config | writer_acks: acks}
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
index 60034d9bc8..79aabcd7c0 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
@@ -31,6 +31,14 @@ pub enum NifNoKeyAssigner {
 #[module = "Fluss.Config"]
 pub struct NifConfig {
     pub bootstrap_servers: String,
+    pub remote_file_download_thread_num: Option<u64>,
+    pub scanner_log_fetch_max_bytes: Option<i32>,
+    pub scanner_log_fetch_max_bytes_for_bucket: Option<i32>,
+    pub scanner_log_fetch_min_bytes: Option<i32>,
+    pub scanner_log_fetch_wait_max_time_ms: Option<i32>,
+    pub scanner_log_max_poll_records: Option<u64>,
+    pub scanner_remote_log_prefetch_num: Option<u64>,
+    pub scanner_remote_log_read_concurrency: Option<u64>,
     pub writer_acks: Option<String>,
     pub writer_batch_size: Option<i32>,
     pub writer_batch_timeout_ms: Option<i64>,
@@ -51,6 +59,30 @@ impl NifConfig {
             bootstrap_servers: self.bootstrap_servers,
             ..Config::default()
         };
+        if let Some(n) = self.remote_file_download_thread_num {
+            config.remote_file_download_thread_num = n as usize;
+        }
+        if let Some(size) = self.scanner_log_fetch_max_bytes {
+            config.scanner_log_fetch_max_bytes = size;
+        }
+        if let Some(size) = self.scanner_log_fetch_max_bytes_for_bucket {
+            config.scanner_log_fetch_max_bytes_for_bucket = size;
+        }
+        if let Some(size) = self.scanner_log_fetch_min_bytes {
+            config.scanner_log_fetch_min_bytes = size;
+        }
+        if let Some(ms) = self.scanner_log_fetch_wait_max_time_ms {
+            config.scanner_log_fetch_wait_max_time_ms = ms;
+        }
+        if let Some(n) = self.scanner_log_max_poll_records {
+            config.scanner_log_max_poll_records = n as usize;
+        }
+        if let Some(n) = self.scanner_remote_log_prefetch_num {
+            config.scanner_remote_log_prefetch_num = n as usize;
+        }
+        if let Some(n) = self.scanner_remote_log_read_concurrency {
+            config.scanner_remote_log_read_concurrency = n as usize;
+        }
         if let Some(size) = self.writer_batch_size {
             config.writer_batch_size = size;
         }
diff --git a/fluss-rust/bindings/elixir/test/config_test.exs b/fluss-rust/bindings/elixir/test/config_test.exs
index 344c647892..2550a7e82e 100644
--- a/fluss-rust/bindings/elixir/test/config_test.exs
+++ b/fluss-rust/bindings/elixir/test/config_test.exs
@@ -23,6 +23,70 @@ defmodule Fluss.ConfigTest do
     assert config == %Fluss.Config{bootstrap_servers: "localhost:9123"}
   end
 
+  test "set_remote_file_download_thread_num/2 sets the download thread num" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_remote_file_download_thread_num(4)
+
+    assert config.remote_file_download_thread_num == 4
+  end
+
+  test "set_scanner_log_fetch_max_bytes/2 sets the fetch max bytes" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_scanner_log_fetch_max_bytes(16_777_216)
+
+    assert config.scanner_log_fetch_max_bytes == 16_777_216
+  end
+
+  test "set_scanner_log_fetch_max_bytes_for_bucket/2 sets the per-bucket fetch limit" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_scanner_log_fetch_max_bytes_for_bucket(1_048_576)
+
+    assert config.scanner_log_fetch_max_bytes_for_bucket == 1_048_576
+  end
+
+  test "set_scanner_log_fetch_min_bytes/2 sets the fetch min bytes" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_scanner_log_fetch_min_bytes(1)
+
+    assert config.scanner_log_fetch_min_bytes == 1
+  end
+
+  test "set_scanner_log_fetch_wait_max_time_ms/2 sets the max wait time" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_scanner_log_fetch_wait_max_time_ms(500)
+
+    assert config.scanner_log_fetch_wait_max_time_ms == 500
+  end
+
+  test "set_scanner_log_max_poll_records/2 sets the max poll records" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_scanner_log_max_poll_records(1000)
+
+    assert config.scanner_log_max_poll_records == 1000
+  end
+
+  test "set_scanner_remote_log_prefetch_num/2 sets the prefetch num" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_scanner_remote_log_prefetch_num(2)
+
+    assert config.scanner_remote_log_prefetch_num == 2
+  end
+
+  test "set_scanner_remote_log_read_concurrency/2 sets the read concurrency" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_scanner_remote_log_read_concurrency(4)
+
+    assert config.scanner_remote_log_read_concurrency == 4
+  end
+
   test "set_writer_acks/2 sets the acks value" do
     config =
       Fluss.Config.new("localhost:9123")

From 53da6a8cb234795057812678579ece523b4eeaad Mon Sep 17 00:00:00 2001
From: Kaiqi Dong <kaiqi.dong@bitvavo.com>
Date: Thu, 28 May 2026 22:51:31 +0200
Subject: [PATCH 285/287] chore: [ci] Fix rustdoc warning and promote warning
 to error in CI (#576)

* fix rustdoc and promote warning to error in ci

* address comments
---
 .../.github/workflows/check_license_and_formatting.yml |  6 ++++++
 fluss-rust/crates/fluss/src/record/kv/mod.rs           |  2 +-
 .../crates/fluss/src/record/kv/value_record_batch.rs   | 10 +++++-----
 .../fluss/src/row/binary/iceberg_binary_row_writer.rs  |  3 +--
 4 files changed, 13 insertions(+), 8 deletions(-)

diff --git a/fluss-rust/.github/workflows/check_license_and_formatting.yml b/fluss-rust/.github/workflows/check_license_and_formatting.yml
index 784e778e51..881af9f927 100644
--- a/fluss-rust/.github/workflows/check_license_and_formatting.yml
+++ b/fluss-rust/.github/workflows/check_license_and_formatting.yml
@@ -66,3 +66,9 @@ jobs:
 
       - name: Clippy
         run: cargo clippy --all-targets --workspace -- -D warnings
+
+      - name: Rustdoc
+        # fluss_python is excluded: its [lib] name = "fluss" collides with fluss-rs
+        run: cargo doc --workspace --no-deps --exclude fluss_python
+        env:
+          RUSTDOCFLAGS: -D warnings
diff --git a/fluss-rust/crates/fluss/src/record/kv/mod.rs b/fluss-rust/crates/fluss/src/record/kv/mod.rs
index 8f7750a80a..4d0f894638 100644
--- a/fluss-rust/crates/fluss/src/record/kv/mod.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/mod.rs
@@ -32,7 +32,7 @@ pub use kv_record_batch::*;
 pub use kv_record_batch_builder::*;
 pub use kv_record_read_context::{KvRecordReadContext, SchemaGetter};
 pub use read_context::ReadContext;
-pub use value_record_batch::ValueRecordBatch;
+pub(crate) use value_record_batch::ValueRecordBatch;
 
 /// Current KV magic value
 pub const CURRENT_KV_MAGIC_VALUE: u8 = 0;
diff --git a/fluss-rust/crates/fluss/src/record/kv/value_record_batch.rs b/fluss-rust/crates/fluss/src/record/kv/value_record_batch.rs
index cfcb4a6d61..fdd6b0702c 100644
--- a/fluss-rust/crates/fluss/src/record/kv/value_record_batch.rs
+++ b/fluss-rust/crates/fluss/src/record/kv/value_record_batch.rs
@@ -50,18 +50,18 @@ const RECORD_BATCH_HEADER_SIZE: usize = LENGTH_LENGTH + MAGIC_LENGTH + RECORD_CO
 const RECORD_LENGTH_LENGTH: usize = 4;
 
 /// Read-only view over a serialized value-record batch.
-pub struct ValueRecordBatch {
+pub(crate) struct ValueRecordBatch {
     data: Bytes,
 }
 
 impl ValueRecordBatch {
     /// Wraps raw batch bytes. The batch is expected to start at offset 0.
-    pub fn new(data: Bytes) -> Self {
+    pub(crate) fn new(data: Bytes) -> Self {
         Self { data }
     }
 
     /// Number of records declared in the batch header.
-    pub fn record_count(&self) -> Result<i32> {
+    pub(crate) fn record_count(&self) -> Result<i32> {
         if self.data.len() < RECORD_BATCH_HEADER_SIZE {
             return Err(corrupt(format!(
                 "value-record batch too short: {} bytes, need {} for header",
@@ -77,7 +77,7 @@ impl ValueRecordBatch {
     /// Returns one byte range per record, each spanning `[SchemaId | Value]`:
     /// the payload [`crate::row::FixedSchemaDecoder::decode`] expects. Index
     /// [`Self::data`] with a returned range to get it without copying.
-    pub fn value_ranges(&self) -> Result<Vec<Range<usize>>> {
+    pub(crate) fn value_ranges(&self) -> Result<Vec<Range<usize>>> {
         let count = self.record_count()?;
         if count < 0 {
             return Err(corrupt(format!("invalid record count {count}")));
@@ -108,7 +108,7 @@ impl ValueRecordBatch {
     }
 
     /// The underlying batch bytes.
-    pub fn data(&self) -> &Bytes {
+    pub(crate) fn data(&self) -> &Bytes {
         &self.data
     }
 }
diff --git a/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs b/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
index 4320a62285..82a61928ae 100644
--- a/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
+++ b/fluss-rust/crates/fluss/src/row/binary/iceberg_binary_row_writer.rs
@@ -37,11 +37,10 @@ const MICROS_PER_MILLI: i64 = 1_000;
 /// - Variable-length types (string, binary) are written without length prefixes
 /// - Decimals are written as unscaled big-endian bytes without length prefixes
 ///
-/// The encoded bytes feed directly into [`IcebergBucketingFunction`]'s MurmurHash
+/// The encoded bytes feed directly into `IcebergBucketingFunction`'s MurmurHash
 /// for bucket assignment and must match the Java Fluss server's encoding exactly.
 ///
 /// [`CompactedRowWriter`]: crate::row::compacted::CompactedRowWriter
-/// [`IcebergBucketingFunction`]: crate::bucketing::IcebergBucketingFunction
 pub struct IcebergBinaryRowWriter {
     position: usize,
     buffer: BytesMut,

From 2b0c742f7dc05346cec255f9ebecf909a917cf1c Mon Sep 17 00:00:00 2001
From: Nicoleta Lazar <nicoleta.lazar@fresha.com>
Date: Fri, 29 May 2026 00:36:13 +0100
Subject: [PATCH 286/287] [elixir] feat: Extend Fluss.Config with security,
 SASL and connect timeout options (#577)

* feat(elixir): Extend NifConfig with security & connect timeout fields

This commit adds 5 fields to NifConfig: connect timeout ms and
security_* settings (protocol, sasl mechanism, username and password)

* feat(elixir): Expose security opts and connect timeout in Fluss.Config

This commit adds 5 fields to Fluss.Config with the corresponding
setters: connect timeout, security protocol, sasl mechanism, username
and password.

To ensure that the password is redacted, we add a custom Inspect impl,
essentially mirroring the upstream rust debug redaction.
---
 .../bindings/elixir/lib/fluss/config.ex       | 54 ++++++++++++++++++
 .../elixir/native/fluss_nif/src/config.rs     | 20 +++++++
 .../bindings/elixir/test/config_test.exs      | 56 +++++++++++++++++++
 3 files changed, 130 insertions(+)

diff --git a/fluss-rust/bindings/elixir/lib/fluss/config.ex b/fluss-rust/bindings/elixir/lib/fluss/config.ex
index 07324df091..8aaacf7993 100644
--- a/fluss-rust/bindings/elixir/lib/fluss/config.ex
+++ b/fluss-rust/bindings/elixir/lib/fluss/config.ex
@@ -33,6 +33,7 @@ defmodule Fluss.Config do
 
   @enforce_keys [:bootstrap_servers]
   defstruct bootstrap_servers: nil,
+            connect_timeout_ms: nil,
             remote_file_download_thread_num: nil,
             scanner_log_fetch_max_bytes: nil,
             scanner_log_fetch_max_bytes_for_bucket: nil,
@@ -41,6 +42,10 @@ defmodule Fluss.Config do
             scanner_log_max_poll_records: nil,
             scanner_remote_log_prefetch_num: nil,
             scanner_remote_log_read_concurrency: nil,
+            security_protocol: nil,
+            security_sasl_mechanism: nil,
+            security_sasl_password: nil,
+            security_sasl_username: nil,
             writer_acks: nil,
             writer_batch_size: nil,
             writer_batch_timeout_ms: nil,
@@ -56,6 +61,7 @@ defmodule Fluss.Config do
 
   @type t :: %__MODULE__{
           bootstrap_servers: String.t(),
+          connect_timeout_ms: non_neg_integer() | nil,
           remote_file_download_thread_num: non_neg_integer() | nil,
           scanner_log_fetch_max_bytes: non_neg_integer() | nil,
           scanner_log_fetch_max_bytes_for_bucket: non_neg_integer() | nil,
@@ -64,6 +70,10 @@ defmodule Fluss.Config do
           scanner_log_max_poll_records: non_neg_integer() | nil,
           scanner_remote_log_prefetch_num: non_neg_integer() | nil,
           scanner_remote_log_read_concurrency: non_neg_integer() | nil,
+          security_protocol: String.t() | nil,
+          security_sasl_mechanism: String.t() | nil,
+          security_sasl_password: String.t() | nil,
+          security_sasl_username: String.t() | nil,
           writer_acks: String.t() | nil,
           writer_batch_size: non_neg_integer() | nil,
           writer_batch_timeout_ms: non_neg_integer() | nil,
@@ -90,6 +100,10 @@ defmodule Fluss.Config do
   def set_bootstrap_servers(%__MODULE__{} = config, servers) when is_binary(servers),
     do: %{config | bootstrap_servers: servers}
 
+  @spec set_connect_timeout_ms(t(), non_neg_integer()) :: t()
+  def set_connect_timeout_ms(%__MODULE__{} = config, ms) when is_integer(ms),
+    do: %{config | connect_timeout_ms: ms}
+
   @spec set_remote_file_download_thread_num(t(), non_neg_integer()) :: t()
   def set_remote_file_download_thread_num(%__MODULE__{} = config, threads)
       when is_integer(threads),
@@ -128,6 +142,22 @@ defmodule Fluss.Config do
       when is_integer(concurrency),
       do: %{config | scanner_remote_log_read_concurrency: concurrency}
 
+  @spec set_security_protocol(t(), String.t()) :: t()
+  def set_security_protocol(%__MODULE__{} = config, protocol) when is_binary(protocol),
+    do: %{config | security_protocol: protocol}
+
+  @spec set_security_sasl_mechanism(t(), String.t()) :: t()
+  def set_security_sasl_mechanism(%__MODULE__{} = config, mechanism) when is_binary(mechanism),
+    do: %{config | security_sasl_mechanism: mechanism}
+
+  @spec set_security_sasl_password(t(), String.t()) :: t()
+  def set_security_sasl_password(%__MODULE__{} = config, pass) when is_binary(pass),
+    do: %{config | security_sasl_password: pass}
+
+  @spec set_security_sasl_username(t(), String.t()) :: t()
+  def set_security_sasl_username(%__MODULE__{} = config, username) when is_binary(username),
+    do: %{config | security_sasl_username: username}
+
   @spec set_writer_acks(t(), String.t()) :: t()
   def set_writer_acks(%__MODULE__{} = config, acks) when is_binary(acks),
     do: %{config | writer_acks: acks}
@@ -183,3 +213,27 @@ defmodule Fluss.Config do
   @spec get_bootstrap_servers(t()) :: String.t()
   def get_bootstrap_servers(%__MODULE__{bootstrap_servers: servers}), do: servers
 end
+
+defimpl Inspect, for: Fluss.Config do
+  import Inspect.Algebra
+
+  # Renders the struct field by field, but swaps a set SASL password for a
+  # placeholder so the secret is not printed when the config is inspected.
+  def inspect(%Fluss.Config{security_sasl_password: password} = config, opts) do
+    pairs =
+      config
+      |> Map.from_struct()
+      |> Map.put(:security_sasl_password, mask(password))
+      |> Map.to_list()
+
+    render = fn {name, value}, inner_opts ->
+      concat([Atom.to_string(name), ": ", to_doc(value, inner_opts)])
+    end
+
+    container_doc("%Fluss.Config{", pairs, "}", opts, render, separator: ",")
+  end
+
+  # An unset (nil) password is shown as nil; anything else is masked.
+  defp mask(nil), do: nil
+  defp mask(_set), do: "[REDACTED]"
+end
diff --git a/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
index 79aabcd7c0..8c1bab51eb 100644
--- a/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
+++ b/fluss-rust/bindings/elixir/native/fluss_nif/src/config.rs
@@ -31,6 +31,7 @@ pub enum NifNoKeyAssigner {
 #[module = "Fluss.Config"]
 pub struct NifConfig {
     pub bootstrap_servers: String,
+    pub connect_timeout_ms: Option<u64>,
     pub remote_file_download_thread_num: Option<u64>,
     pub scanner_log_fetch_max_bytes: Option<i32>,
     pub scanner_log_fetch_max_bytes_for_bucket: Option<i32>,
@@ -39,6 +40,10 @@ pub struct NifConfig {
     pub scanner_log_max_poll_records: Option<u64>,
     pub scanner_remote_log_prefetch_num: Option<u64>,
     pub scanner_remote_log_read_concurrency: Option<u64>,
+    pub security_protocol: Option<String>,
+    pub security_sasl_mechanism: Option<String>,
+    pub security_sasl_password: Option<String>,
+    pub security_sasl_username: Option<String>,
     pub writer_acks: Option<String>,
     pub writer_batch_size: Option<i32>,
     pub writer_batch_timeout_ms: Option<i64>,
@@ -59,6 +64,9 @@ impl NifConfig {
             bootstrap_servers: self.bootstrap_servers,
             ..Config::default()
         };
+        if let Some(timeout) = self.connect_timeout_ms {
+            config.connect_timeout_ms = timeout;
+        }
         if let Some(n) = self.remote_file_download_thread_num {
             config.remote_file_download_thread_num = n as usize;
         }
@@ -83,6 +91,18 @@ impl NifConfig {
         if let Some(n) = self.scanner_remote_log_read_concurrency {
             config.scanner_remote_log_read_concurrency = n as usize;
         }
+        if let Some(protocol) = self.security_protocol {
+            config.security_protocol = protocol;
+        }
+        if let Some(mechanism) = self.security_sasl_mechanism {
+            config.security_sasl_mechanism = mechanism;
+        }
+        if let Some(password) = self.security_sasl_password {
+            config.security_sasl_password = password;
+        }
+        if let Some(username) = self.security_sasl_username {
+            config.security_sasl_username = username;
+        }
         if let Some(size) = self.writer_batch_size {
             config.writer_batch_size = size;
         }
diff --git a/fluss-rust/bindings/elixir/test/config_test.exs b/fluss-rust/bindings/elixir/test/config_test.exs
index 2550a7e82e..f4b8a11ca1 100644
--- a/fluss-rust/bindings/elixir/test/config_test.exs
+++ b/fluss-rust/bindings/elixir/test/config_test.exs
@@ -23,6 +23,14 @@ defmodule Fluss.ConfigTest do
     assert config == %Fluss.Config{bootstrap_servers: "localhost:9123"}
   end
 
+  test "set_connect_timeout_ms/2 sets the connect timeout" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_connect_timeout_ms(30_000)
+
+    assert config.connect_timeout_ms == 30_000
+  end
+
   test "set_remote_file_download_thread_num/2 sets the download thread num" do
     config =
       Fluss.Config.new("localhost:9123")
@@ -87,6 +95,54 @@ defmodule Fluss.ConfigTest do
     assert config.scanner_remote_log_read_concurrency == 4
   end
 
+  test "set_security_protocol/2 sets the security protocol" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_security_protocol("sasl")
+
+    assert config.security_protocol == "sasl"
+  end
+
+  test "set_security_sasl_mechanism/2 sets the SASL mechanism" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_security_sasl_mechanism("PLAIN")
+
+    assert config.security_sasl_mechanism == "PLAIN"
+  end
+
+  test "set_security_sasl_username/2 sets the SASL username" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_security_sasl_username("admin")
+
+    assert config.security_sasl_username == "admin"
+  end
+
+  test "set_security_sasl_password/2 sets the SASL password" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_security_sasl_password("secret")
+
+    assert config.security_sasl_password == "secret"
+  end
+
+  test "inspect/1 redacts security_sasl_password when set" do
+    config =
+      Fluss.Config.new("localhost:9123")
+      |> Fluss.Config.set_security_sasl_password("supersecret")
+
+    output = inspect(config)
+    refute output =~ "supersecret"
+    assert output =~ "[REDACTED]"
+  end
+
+  test "inspect/1 leaves nil security_sasl_password as nil" do
+    config = Fluss.Config.new("localhost:9123")
+    output = inspect(config)
+    assert output =~ "security_sasl_password: nil"
+  end
+
   test "set_writer_acks/2 sets the acks value" do
     config =
       Fluss.Config.new("localhost:9123")

From c232100b5c8c338bc69d835a1812697060d6183d Mon Sep 17 00:00:00 2001
From: Anton Borisov <anton.borisov@fresha.com>
Date: Fri, 29 May 2026 08:56:28 +0100
Subject: [PATCH 287/287] [FIP-40] Adapt imported fluss-rust to the monorepo
 (proto, CI, docs, release)

---
 .../actions/verify-tag-version/action.yml     |   0
 .../.github => .github}/dependabot.yml        |   8 +-
 {fluss-rust/.github => .github}/release.yml   |   0
 .github/workflows/ci.yaml                     |   2 +
 .github/workflows/client-integration.yml      | 366 +++++++++
 .github/workflows/license-check.yml           |  12 +-
 .../workflows/python-release.yml              |  25 +-
 .../workflows/rust-build-and-test.yml         |  52 +-
 .../workflows/rust-docs-check.yml             |  12 +-
 .../workflows/rust-license-and-format.yml     |  38 +-
 .../workflows/rust-release.yml                |  13 +-
 fluss-rust/.asf.yaml                          |  47 --
 fluss-rust/.github/ISSUE_TEMPLATE/bug.yml     |  58 --
 fluss-rust/.github/ISSUE_TEMPLATE/config.yml  |  19 -
 fluss-rust/.github/ISSUE_TEMPLATE/feature.yml |  58 --
 fluss-rust/.github/ISSUE_TEMPLATE/task.yml    |  51 --
 fluss-rust/.github/PULL_REQUEST_TEMPLATE.md   |  41 -
 .../.github/workflows/build_and_test_cpp.yml  |  90 ---
 .../workflows/build_and_test_elixir.yml       | 103 ---
 .../workflows/build_and_test_python.yml       | 100 ---
 .../workflows/deploy_documentation.yml        |  81 --
 fluss-rust/.licenserc.yaml                    |  14 +-
 fluss-rust/Cargo.lock                         |  12 +-
 fluss-rust/Cargo.toml                         |   4 +-
 fluss-rust/DISCLAIMER                         |  10 -
 fluss-rust/LICENSE                            | 201 -----
 fluss-rust/NOTICE                             |   5 -
 fluss-rust/bindings/elixir/mix.exs            |   2 +-
 .../crates/fluss-test-cluster/src/lib.rs      |   5 +-
 fluss-rust/crates/fluss/build.rs              |  21 +-
 fluss-rust/crates/fluss/src/client/admin.rs   |   1 +
 .../crates/fluss/src/client/table/scanner.rs  |   5 +
 fluss-rust/crates/fluss/src/lib.rs            |   4 +-
 .../crates/fluss/src/metadata/partition.rs    |   1 +
 .../crates/fluss/src/proto/fluss_api.proto    | 503 ------------
 fluss-rust/crates/fluss/src/rpc/convert.rs    |   2 +
 .../fluss/src/rpc/message/create_partition.rs |   3 +-
 .../rpc/message/get_latest_lake_snapshot.rs   |  10 +-
 .../fluss/src/rpc/message/list_databases.rs   |   4 +-
 .../crates/fluss/src/rpc/message/lookup.rs    |   5 +-
 fluss-rust/scripts/vendor-proto.sh            |  46 ++
 pom.xml                                       |   2 +
 website/community/dev/building.md             |  38 +-
 website/community/dev/ide-setup.md            |   9 +
 .../how-to-contribute/contribute-code.md      |   3 +-
 .../creating-a-fluss-release.mdx              |  25 +
 .../how-to-release/pre-rc-checklist.md        |  38 +
 .../release-manager-preparation.md            |  22 +
 .../verifying-a-fluss-release.md              |  32 +
 website/docs/apis/client-support-matrix.md    |  16 +-
 website/docs/apis/cpp-client.md               |  70 --
 website/docs/apis/cpp/_category_.json         |   4 +
 website/docs/apis/cpp/api-reference.md        | 731 ++++++++++++++++++
 website/docs/apis/cpp/data-types.md           | 250 ++++++
 website/docs/apis/cpp/error-handling.md       | 238 ++++++
 website/docs/apis/cpp/example/_category_.json |   4 +
 .../docs/apis/cpp/example/admin-operations.md | 158 ++++
 .../docs/apis/cpp/example/configuration.md    |  42 +
 website/docs/apis/cpp/example/index.md        |  63 ++
 website/docs/apis/cpp/example/log-tables.md   | 161 ++++
 .../apis/cpp/example/partitioned-tables.md    | 179 +++++
 .../apis/cpp/example/primary-key-tables.md    | 132 ++++
 website/docs/apis/cpp/installation.md         | 107 +++
 website/docs/apis/index.md                    |  42 +
 website/docs/apis/java/_category_.json        |   4 +
 .../apis/{java-client.md => java/index.md}    |   0
 website/docs/apis/python-client.md            |  45 --
 website/docs/apis/python/_category_.json      |   4 +
 website/docs/apis/python/api-reference.md     | 389 ++++++++++
 website/docs/apis/python/data-types.md        |  95 +++
 website/docs/apis/python/error-handling.md    | 168 ++++
 .../docs/apis/python/example/_category_.json  |   4 +
 .../apis/python/example/admin-operations.md   |  81 ++
 .../docs/apis/python/example/configuration.md |  49 ++
 website/docs/apis/python/example/index.md     |  46 ++
 .../docs/apis/python/example/log-tables.md    | 129 ++++
 .../apis/python/example/partitioned-tables.md | 104 +++
 .../apis/python/example/primary-key-tables.md |  61 ++
 website/docs/apis/python/installation.md      |  41 +
 website/docs/apis/rust-client.md              |  53 --
 website/docs/apis/rust/_category_.json        |   4 +
 website/docs/apis/rust/api-reference.md       | 597 ++++++++++++++
 website/docs/apis/rust/data-types.md          | 179 +++++
 website/docs/apis/rust/error-handling.md      | 241 ++++++
 .../docs/apis/rust/example/_category_.json    |   4 +
 .../apis/rust/example/admin-operations.md     | 122 +++
 .../docs/apis/rust/example/configuration.md   |  35 +
 website/docs/apis/rust/example/index.md       |  56 ++
 website/docs/apis/rust/example/log-tables.md  | 172 +++++
 .../apis/rust/example/partitioned-tables.md   | 219 ++++++
 .../docs/apis/rust/example/prefix-lookup.md   | 110 +++
 .../apis/rust/example/primary-key-tables.md   | 141 ++++
 website/docs/apis/rust/installation.md        |  76 ++
 .../table-design/merge-engines/aggregation.md |   2 +-
 website/docusaurus.config.ts                  |   2 +-
 95 files changed, 5998 insertions(+), 1635 deletions(-)
 rename {fluss-rust/.github => .github}/actions/verify-tag-version/action.yml (100%)
 rename {fluss-rust/.github => .github}/dependabot.yml (87%)
 rename {fluss-rust/.github => .github}/release.yml (100%)
 create mode 100644 .github/workflows/client-integration.yml
 rename fluss-rust/.github/workflows/release_python.yml => .github/workflows/python-release.yml (88%)
 rename fluss-rust/.github/workflows/build_and_test_rust.yml => .github/workflows/rust-build-and-test.yml (70%)
 rename fluss-rust/.github/workflows/check_documentation.yml => .github/workflows/rust-docs-check.yml (82%)
 rename fluss-rust/.github/workflows/check_license_and_formatting.yml => .github/workflows/rust-license-and-format.yml (69%)
 rename fluss-rust/.github/workflows/release_rust.yml => .github/workflows/rust-release.yml (80%)
 delete mode 100644 fluss-rust/.asf.yaml
 delete mode 100644 fluss-rust/.github/ISSUE_TEMPLATE/bug.yml
 delete mode 100644 fluss-rust/.github/ISSUE_TEMPLATE/config.yml
 delete mode 100644 fluss-rust/.github/ISSUE_TEMPLATE/feature.yml
 delete mode 100644 fluss-rust/.github/ISSUE_TEMPLATE/task.yml
 delete mode 100644 fluss-rust/.github/PULL_REQUEST_TEMPLATE.md
 delete mode 100644 fluss-rust/.github/workflows/build_and_test_cpp.yml
 delete mode 100644 fluss-rust/.github/workflows/build_and_test_elixir.yml
 delete mode 100644 fluss-rust/.github/workflows/build_and_test_python.yml
 delete mode 100644 fluss-rust/.github/workflows/deploy_documentation.yml
 delete mode 100644 fluss-rust/DISCLAIMER
 delete mode 100644 fluss-rust/LICENSE
 delete mode 100644 fluss-rust/NOTICE
 delete mode 100644 fluss-rust/crates/fluss/src/proto/fluss_api.proto
 create mode 100755 fluss-rust/scripts/vendor-proto.sh
 create mode 100644 website/community/how-to-release/pre-rc-checklist.md
 delete mode 100644 website/docs/apis/cpp-client.md
 create mode 100644 website/docs/apis/cpp/_category_.json
 create mode 100644 website/docs/apis/cpp/api-reference.md
 create mode 100644 website/docs/apis/cpp/data-types.md
 create mode 100644 website/docs/apis/cpp/error-handling.md
 create mode 100644 website/docs/apis/cpp/example/_category_.json
 create mode 100644 website/docs/apis/cpp/example/admin-operations.md
 create mode 100644 website/docs/apis/cpp/example/configuration.md
 create mode 100644 website/docs/apis/cpp/example/index.md
 create mode 100644 website/docs/apis/cpp/example/log-tables.md
 create mode 100644 website/docs/apis/cpp/example/partitioned-tables.md
 create mode 100644 website/docs/apis/cpp/example/primary-key-tables.md
 create mode 100644 website/docs/apis/cpp/installation.md
 create mode 100644 website/docs/apis/index.md
 create mode 100644 website/docs/apis/java/_category_.json
 rename website/docs/apis/{java-client.md => java/index.md} (100%)
 delete mode 100644 website/docs/apis/python-client.md
 create mode 100644 website/docs/apis/python/_category_.json
 create mode 100644 website/docs/apis/python/api-reference.md
 create mode 100644 website/docs/apis/python/data-types.md
 create mode 100644 website/docs/apis/python/error-handling.md
 create mode 100644 website/docs/apis/python/example/_category_.json
 create mode 100644 website/docs/apis/python/example/admin-operations.md
 create mode 100644 website/docs/apis/python/example/configuration.md
 create mode 100644 website/docs/apis/python/example/index.md
 create mode 100644 website/docs/apis/python/example/log-tables.md
 create mode 100644 website/docs/apis/python/example/partitioned-tables.md
 create mode 100644 website/docs/apis/python/example/primary-key-tables.md
 create mode 100644 website/docs/apis/python/installation.md
 delete mode 100644 website/docs/apis/rust-client.md
 create mode 100644 website/docs/apis/rust/_category_.json
 create mode 100644 website/docs/apis/rust/api-reference.md
 create mode 100644 website/docs/apis/rust/data-types.md
 create mode 100644 website/docs/apis/rust/error-handling.md
 create mode 100644 website/docs/apis/rust/example/_category_.json
 create mode 100644 website/docs/apis/rust/example/admin-operations.md
 create mode 100644 website/docs/apis/rust/example/configuration.md
 create mode 100644 website/docs/apis/rust/example/index.md
 create mode 100644 website/docs/apis/rust/example/log-tables.md
 create mode 100644 website/docs/apis/rust/example/partitioned-tables.md
 create mode 100644 website/docs/apis/rust/example/prefix-lookup.md
 create mode 100644 website/docs/apis/rust/example/primary-key-tables.md
 create mode 100644 website/docs/apis/rust/installation.md

diff --git a/fluss-rust/.github/actions/verify-tag-version/action.yml b/.github/actions/verify-tag-version/action.yml
similarity index 100%
rename from fluss-rust/.github/actions/verify-tag-version/action.yml
rename to .github/actions/verify-tag-version/action.yml
diff --git a/fluss-rust/.github/dependabot.yml b/.github/dependabot.yml
similarity index 87%
rename from fluss-rust/.github/dependabot.yml
rename to .github/dependabot.yml
index 7c12d72c0c..714e644bd5 100644
--- a/fluss-rust/.github/dependabot.yml
+++ b/.github/dependabot.yml
@@ -17,14 +17,14 @@
 
 version: 2
 updates:
-  # Maintain dependencies for GitHub Actions
+  # GitHub Actions used by the repository's workflows
   - package-ecosystem: "github-actions"
     directory: "/"
     schedule:
       interval: "monthly"
 
-  # Maintain dependencies for rust
+  # Rust client workspace
   - package-ecosystem: "cargo"
-    directory: "/"
+    directory: "/fluss-rust"
     schedule:
-      interval: "monthly"
\ No newline at end of file
+      interval: "monthly"
diff --git a/fluss-rust/.github/release.yml b/.github/release.yml
similarity index 100%
rename from fluss-rust/.github/release.yml
rename to .github/release.yml
diff --git a/.github/workflows/ci.yaml b/.github/workflows/ci.yaml
index 4ef7d372de..ee4a269d73 100644
--- a/.github/workflows/ci.yaml
+++ b/.github/workflows/ci.yaml
@@ -25,11 +25,13 @@ on:
     paths-ignore:
       - 'website/**'
       - 'helm/**'
+      - 'fluss-rust/**'
       - '**/*.md'
   pull_request:
     paths-ignore:
       - 'website/**'
       - 'helm/**'
+      - 'fluss-rust/**'
       - '**/*.md'
 
 concurrency:
diff --git a/.github/workflows/client-integration.yml b/.github/workflows/client-integration.yml
new file mode 100644
index 0000000000..6d77be877f
--- /dev/null
+++ b/.github/workflows/client-integration.yml
@@ -0,0 +1,366 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements.  See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership.  The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied.  See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+# Client integration tests against a SAME-REVISION server (FIP-40 §3.2).
+# Builds the Fluss server image from this source tree ONCE, caches + saves it,
+# then fans out the Rust / Python / C++ / Elixir integration suites against that
+# fluss:dev image (build-once-fan-out, à la Temporal/PyFlink). The image build is
+# cached on server/proto hashes, so client-only PRs reuse it instead of rebuilding.
+
+name: Client Integration
+
+on:
+  push:
+    branches:
+      - main
+    paths:
+      - 'fluss-rpc/src/main/proto/**'
+      - 'fluss-server/**'
+      - 'fluss-common/**'
+      - 'fluss-dist/**'
+      - 'docker/fluss/**'
+      - 'fluss-rust/crates/**'
+      - 'fluss-rust/bindings/**'
+      - 'fluss-rust/Cargo.toml'
+      - 'fluss-rust/Cargo.lock'
+      - '.github/workflows/client-integration.yml'
+  pull_request:
+    branches:
+      - main
+    paths:
+      - 'fluss-rpc/src/main/proto/**'
+      - 'fluss-server/**'
+      - 'fluss-common/**'
+      - 'fluss-dist/**'
+      - 'docker/fluss/**'
+      - 'fluss-rust/crates/**'
+      - 'fluss-rust/bindings/**'
+      - 'fluss-rust/Cargo.toml'
+      - 'fluss-rust/Cargo.lock'
+      - '.github/workflows/client-integration.yml'
+  workflow_dispatch:
+
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
+  cancel-in-progress: true
+
+jobs:
+  # Decide which client suites to run, mirroring the per-binding scoping the
+  # standalone fluss-rust repo had: a binding suite runs only when its own
+  # binding, the core fluss-rs crate, the server/proto, or this workflow file
+  # changed. On non-PR events (push to main, manual) everything runs.
+  detect-changes:
+    runs-on: ubuntu-latest
+    outputs:
+      rust: ${{ steps.filter.outputs.rust }}
+      python: ${{ steps.filter.outputs.python }}
+      cpp: ${{ steps.filter.outputs.cpp }}
+      elixir: ${{ steps.filter.outputs.elixir }}
+    steps:
+      - uses: actions/checkout@v6
+        with:
+          fetch-depth: 0
+      - id: filter
+        run: |
+          if [ "${{ github.event_name }}" != "pull_request" ]; then
+            all=true; changed=""
+          else
+            all=false
+            changed=$(git diff --name-only "${{ github.event.pull_request.base.sha }}...HEAD")
+          fi
+          echo "Changed files:"; echo "$changed"
+          has() { echo "$changed" | grep -qE "$1"; }
+          protocol=false; core=false; py=false; cpp=false; ex=false
+          has '^(fluss-rpc/src/main/proto/|fluss-server/|fluss-common/|fluss-dist/|docker/fluss/|\.github/workflows/client-integration\.yml$)' && protocol=true || true
+          has '^(fluss-rust/crates/|fluss-rust/Cargo\.)' && core=true || true
+          has '^fluss-rust/bindings/python/' && py=true || true
+          has '^fluss-rust/bindings/cpp/' && cpp=true || true
+          has '^fluss-rust/bindings/elixir/' && ex=true || true
+          # a suite runs if: non-PR (all) OR core crate OR server/proto/this workflow OR its own binding changed
+          gate() { if [ "$all" = true ] || [ "$core" = true ] || [ "$protocol" = true ] || [ "$1" = true ]; then echo true; else echo false; fi; }
+          {
+            echo "rust=$(gate false)"
+            echo "python=$(gate $py)"
+            echo "cpp=$(gate $cpp)"
+            echo "elixir=$(gate $ex)"
+          } >> "$GITHUB_OUTPUT"
+
+  # Build the server image from THIS source tree once; cache it on server/proto
+  # hashes so client-only PRs restore it instead of rebuilding. The saved image
+  # is uploaded as an artifact and loaded by every client integration job.
+  build-server-image:
+    needs: detect-changes
+    if: needs.detect-changes.outputs.rust == 'true' || needs.detect-changes.outputs.python == 'true' || needs.detect-changes.outputs.cpp == 'true' || needs.detect-changes.outputs.elixir == 'true'
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v6
+
+      - name: Cache server image
+        id: image-cache
+        uses: actions/cache@v4
+        with:
+          path: /tmp/fluss-dev.tar
+          key: fluss-dev-image-${{ hashFiles('fluss-server/**', 'fluss-common/**', 'fluss-rpc/**', 'fluss-dist/**', 'docker/fluss/**', 'pom.xml') }}
+
+      - name: Set up JDK 17
+        if: steps.image-cache.outputs.cache-hit != 'true'
+        uses: actions/setup-java@v5
+        with:
+          java-version: '17'
+          distribution: 'temurin'
+          cache: maven
+
+      - name: Build server image (fluss:dev) from source
+        if: steps.image-cache.outputs.cache-hit != 'true'
+        run: |
+          ./mvnw -B --no-transfer-progress clean package -pl fluss-dist -am -DskipTests
+          rm -rf docker/fluss/build-target
+          mkdir -p docker/fluss/build-target
+          cp -r build-target/* docker/fluss/build-target/
+          docker build -t fluss:dev docker/fluss
+          docker save fluss:dev -o /tmp/fluss-dev.tar
+
+      - name: Upload server image
+        uses: actions/upload-artifact@v4
+        with:
+          name: fluss-dev-image
+          path: /tmp/fluss-dev.tar
+          retention-days: 1
+
+  rust-integration:
+    needs: [detect-changes, build-server-image]
+    if: needs.detect-changes.outputs.rust == 'true'
+    timeout-minutes: 60
+    runs-on: ubuntu-latest
+    defaults:
+      run:
+        working-directory: fluss-rust
+    env:
+      FLUSS_IMAGE: fluss
+      FLUSS_VERSION: dev
+    steps:
+      - uses: actions/checkout@v6
+      - uses: actions/download-artifact@v4
+        with:
+          name: fluss-dev-image
+          path: /tmp
+      - name: Load server image
+        run: docker load -i /tmp/fluss-dev.tar
+      - name: Install protoc
+        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
+        with:
+          repo-token: ${{ secrets.GITHUB_TOKEN }}
+      - name: Rust Cache
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
+        with:
+          workspaces: fluss-rust
+      - name: Integration tests
+        run: cargo test --features integration_tests --test test_fluss -p fluss-rs
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
+
+  python-integration:
+    needs: [detect-changes, build-server-image]
+    if: needs.detect-changes.outputs.python == 'true'
+    timeout-minutes: 60
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python: ["3.9", "3.10", "3.11", "3.12"]
+    defaults:
+      run:
+        working-directory: fluss-rust
+    env:
+      FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/fluss-rust/target/debug/fluss-test-cluster
+      FLUSS_IMAGE: fluss
+      FLUSS_VERSION: dev
+    steps:
+      - uses: actions/checkout@v6
+      - uses: actions/download-artifact@v4
+        with:
+          name: fluss-dev-image
+          path: /tmp
+      - name: Load server image
+        run: docker load -i /tmp/fluss-dev.tar
+      - name: Set up Python
+        uses: actions/setup-python@v6
+        with:
+          python-version: ${{ matrix.python }}
+      - name: Install uv
+        uses: astral-sh/setup-uv@37802adc94f370d6bfd71619e3f0bf239e1f3b78
+      - name: Install protoc
+        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
+        with:
+          repo-token: ${{ secrets.GITHUB_TOKEN }}
+      - name: Rust Cache
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
+        with:
+          workspaces: fluss-rust
+      - name: Build fluss-test-cluster binary
+        run: cargo build -p fluss-test-cluster
+      - name: Build Python bindings
+        working-directory: fluss-rust/bindings/python
+        run: |
+          uv sync --extra dev --no-install-project
+          uv run --no-sync maturin develop --uv
+      - name: Run tests (parallel)
+        working-directory: fluss-rust/bindings/python
+        run: uv run --no-sync pytest test/ -v -n 2 --dist=loadfile
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
+          FLUSS_SKIP_CLUSTER_TEARDOWN: "1"
+      - name: Dump fluss cluster container logs
+        if: always()
+        run: |
+          mkdir -p cluster-logs
+          for c in $(docker ps -a --filter "name=shared-test" --format '{{.Names}}'); do
+            docker logs "$c" > "cluster-logs/$c.log" 2>&1 || true
+          done
+      - uses: actions/upload-artifact@v4
+        if: always()
+        with:
+          name: cluster-logs-${{ matrix.python }}
+          path: fluss-rust/cluster-logs/
+          if-no-files-found: ignore
+          retention-days: 3
+
+  cpp-integration:
+    needs: [detect-changes, build-server-image]
+    if: needs.detect-changes.outputs.cpp == 'true'
+    timeout-minutes: 60
+    runs-on: ubuntu-latest
+    defaults:
+      run:
+        working-directory: fluss-rust
+    env:
+      FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/fluss-rust/target/debug/fluss-test-cluster
+      FLUSS_IMAGE: fluss
+      FLUSS_VERSION: dev
+    steps:
+      - uses: actions/checkout@v6
+      - uses: actions/download-artifact@v4
+        with:
+          name: fluss-dev-image
+          path: /tmp
+      - name: Load server image
+        run: docker load -i /tmp/fluss-dev.tar
+      - name: Install protoc
+        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
+        with:
+          repo-token: ${{ secrets.GITHUB_TOKEN }}
+      - name: Install Apache Arrow C++
+        run: |
+          sudo apt-get update && sudo apt-get install -y -V ca-certificates lsb-release wget
+          wget https://apache.jfrog.io/artifactory/arrow/$(lsb_release --id --short | tr 'A-Z' 'a-z')/apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
+          sudo apt-get install -y -V ./apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
+          sudo apt-get update
+          sudo apt-get install -y -V libarrow-dev
+      - name: Rust Cache
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
+        with:
+          workspaces: fluss-rust
+      - name: Setup sccache
+        uses: mozilla-actions/sccache-action@7d986dd989559c6ecdb630a3fd2557667be217ad # v0.0.9
+      - name: Build fluss-test-cluster binary
+        run: cargo build -p fluss-test-cluster
+      - name: Build C++ bindings and tests
+        working-directory: fluss-rust/bindings/cpp
+        env:
+          SCCACHE_GHA_ENABLED: "true"
+        run: |
+          cmake -B build \
+            -DFLUSS_ENABLE_TESTING=ON \
+            -DCMAKE_BUILD_TYPE=Debug \
+            -DCMAKE_C_COMPILER_LAUNCHER=sccache \
+            -DCMAKE_CXX_COMPILER_LAUNCHER=sccache
+          cmake --build build --parallel
+          sccache --show-stats
+      - name: Run C++ integration tests (parallel)
+        working-directory: fluss-rust/bindings/cpp
+        run: cd build && ctest -j$(nproc) --output-on-failure --timeout 300
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
+
+  elixir-integration:
+    needs: [detect-changes, build-server-image]
+    if: needs.detect-changes.outputs.elixir == 'true'
+    timeout-minutes: 60
+    runs-on: ubuntu-latest
+    defaults:
+      run:
+        working-directory: fluss-rust
+    env:
+      OTP_VERSION: "28.0.2"
+      ELIXIR_VERSION: "1.19.5"
+      FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/fluss-rust/target/debug/fluss-test-cluster
+      MIX_ENV: test
+      FLUSS_IMAGE: fluss
+      FLUSS_VERSION: dev
+    steps:
+      - uses: actions/checkout@v6
+      - uses: actions/download-artifact@v4
+        with:
+          name: fluss-dev-image
+          path: /tmp
+      - name: Load server image
+        run: docker load -i /tmp/fluss-dev.tar
+      - name: Set up BEAM
+        uses: erlef/setup-beam@fc68ffb90438ef2936bbb3251622353b3dcb2f93 # v1.24.0
+        with:
+          otp-version: ${{ env.OTP_VERSION }}
+          elixir-version: ${{ env.ELIXIR_VERSION }}
+      - name: Install protoc
+        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
+      - name: Rust Cache
+        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
+        with:
+          workspaces: fluss-rust
+      - name: Cache Mix deps and build
+        uses: actions/cache@v4
+        with:
+          path: |
+            fluss-rust/bindings/elixir/deps
+            fluss-rust/bindings/elixir/_build
+          key: ${{ runner.os }}-mix-otp${{ env.OTP_VERSION }}-elixir${{ env.ELIXIR_VERSION }}-${{ hashFiles('fluss-rust/bindings/elixir/mix.lock') }}
+          restore-keys: |
+            ${{ runner.os }}-mix-otp${{ env.OTP_VERSION }}-elixir${{ env.ELIXIR_VERSION }}-
+      - name: Build fluss-test-cluster binary
+        run: cargo build -p fluss-test-cluster
+      - name: Fetch Elixir deps
+        working-directory: fluss-rust/bindings/elixir
+        run: mix deps.get
+      - name: Check formatting
+        working-directory: fluss-rust/bindings/elixir
+        run: mix format --check-formatted
+      - name: Compile (warnings as errors)
+        working-directory: fluss-rust/bindings/elixir
+        run: mix compile --warnings-as-errors
+      - name: Credo
+        working-directory: fluss-rust/bindings/elixir
+        run: mix credo
+      - name: Run unit tests
+        working-directory: fluss-rust/bindings/elixir
+        run: mix test
+      - name: Run integration tests
+        working-directory: fluss-rust/bindings/elixir
+        run: mix test --include integration --only integration
+        env:
+          RUST_LOG: DEBUG
+          RUST_BACKTRACE: full
diff --git a/.github/workflows/license-check.yml b/.github/workflows/license-check.yml
index 5f52ffa3d9..aa69703eec 100644
--- a/.github/workflows/license-check.yml
+++ b/.github/workflows/license-check.yml
@@ -17,7 +17,17 @@ name: Check License
 permissions:
   contents: read
 
-on: [push, pull_request]
+on:
+  push:
+    paths-ignore:
+      - 'fluss-rust/**'
+      - 'website/**'
+      - '**/*.md'
+  pull_request:
+    paths-ignore:
+      - 'fluss-rust/**'
+      - 'website/**'
+      - '**/*.md'
 
 concurrency:
   group: ${{ github.workflow }}-${{ github.event_name }}-${{ github.event.number || github.run_id }}
diff --git a/fluss-rust/.github/workflows/release_python.yml b/.github/workflows/python-release.yml
similarity index 88%
rename from fluss-rust/.github/workflows/release_python.yml
rename to .github/workflows/python-release.yml
index c2fed15556..ddbc4f0cf9 100644
--- a/fluss-rust/.github/workflows/release_python.yml
+++ b/.github/workflows/python-release.yml
@@ -51,9 +51,14 @@ jobs:
       - name: Install protoc
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
 
+      # Vendor the canonical proto so the sdist builds standalone from source.
+      - name: Vendor canonical proto into the crate
+        working-directory: fluss-rust
+        run: scripts/vendor-proto.sh
+
       - uses: PyO3/maturin-action@v1
         with:
-          working-directory: bindings/python
+          working-directory: fluss-rust/bindings/python
           command: sdist
           args: -o dist
 
@@ -61,7 +66,7 @@ jobs:
         uses: actions/upload-artifact@v7
         with:
           name: wheels-sdist
-          path: bindings/python/dist
+          path: fluss-rust/bindings/python/dist
 
   wheels:
     runs-on: ${{ matrix.os }}
@@ -93,7 +98,7 @@ jobs:
       # Install protoc in manylinux container (x86_64/aarch64); script shared via YAML anchor
       - uses: PyO3/maturin-action@v1
         with:
-          working-directory: bindings/python
+          working-directory: fluss-rust/bindings/python
           target: ${{ matrix.target }}
           command: build
           args: --release -o dist -i python3.9
@@ -114,7 +119,7 @@ jobs:
             export PROTOC=/tmp/protoc_install/bin/protoc
       - uses: PyO3/maturin-action@v1
         with:
-          working-directory: bindings/python
+          working-directory: fluss-rust/bindings/python
           target: ${{ matrix.target }}
           command: build
           args: --release -o dist -i python3.10
@@ -122,7 +127,7 @@ jobs:
           before-script-linux: *protoc-install
       - uses: PyO3/maturin-action@v1
         with:
-          working-directory: bindings/python
+          working-directory: fluss-rust/bindings/python
           target: ${{ matrix.target }}
           command: build
           args: --release -o dist -i python3.11
@@ -130,7 +135,7 @@ jobs:
           before-script-linux: *protoc-install
       - uses: PyO3/maturin-action@v1
         with:
-          working-directory: bindings/python
+          working-directory: fluss-rust/bindings/python
           target: ${{ matrix.target }}
           command: build
           args: --release -o dist -i python3.12
@@ -141,7 +146,7 @@ jobs:
         uses: actions/upload-artifact@v7
         with:
           name: wheels-${{ matrix.os }}-${{ matrix.target || 'native' }}
-          path: bindings/python/dist
+          path: fluss-rust/bindings/python/dist
 
   release:
     name: Publish to PyPI
@@ -155,7 +160,7 @@ jobs:
         with:
           pattern: wheels-*
           merge-multiple: true
-          path: bindings/python/dist
+          path: fluss-rust/bindings/python/dist
 
       - name: Publish to TestPyPI
         if: contains(github.ref, '-')
@@ -163,7 +168,7 @@ jobs:
         with:
           repository-url: https://test.pypi.org/legacy/
           skip-existing: true
-          packages-dir: bindings/python/dist
+          packages-dir: fluss-rust/bindings/python/dist
           password: ${{ secrets.TEST_PYPI_API_TOKEN }}
 
       - name: Publish to PyPI
@@ -171,5 +176,5 @@ jobs:
         uses: pypa/gh-action-pypi-publish@ed0c53931b1dc9bd32cbe73a98c7f6766f8a527e
         with:
           skip-existing: true
-          packages-dir: bindings/python/dist
+          packages-dir: fluss-rust/bindings/python/dist
           password: ${{ secrets.PYPI_API_TOKEN }}
diff --git a/fluss-rust/.github/workflows/build_and_test_rust.yml b/.github/workflows/rust-build-and-test.yml
similarity index 70%
rename from fluss-rust/.github/workflows/build_and_test_rust.yml
rename to .github/workflows/rust-build-and-test.yml
index 9e60bd0c52..d59fadce59 100644
--- a/fluss-rust/.github/workflows/build_and_test_rust.yml
+++ b/.github/workflows/rust-build-and-test.yml
@@ -21,24 +21,35 @@ on:
   push:
     branches:
       - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
+    paths:
+      - 'fluss-rust/crates/**'
+      - 'fluss-rust/Cargo.toml'
+      - 'fluss-rust/Cargo.lock'
+      - 'fluss-rust/rust-toolchain.toml'
+      - 'fluss-rust/.cargo/**'
+      - 'fluss-rpc/src/main/proto/**'
+      - '.github/workflows/rust-build-and-test.yml'
   pull_request:
     branches:
       - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
-      - 'bindings/python/**'
-      - 'bindings/cpp/**'
-      - 'bindings/elixir/**'
+    paths:
+      - 'fluss-rust/crates/**'
+      - 'fluss-rust/Cargo.toml'
+      - 'fluss-rust/Cargo.lock'
+      - 'fluss-rust/rust-toolchain.toml'
+      - 'fluss-rust/.cargo/**'
+      - 'fluss-rpc/src/main/proto/**'
+      - '.github/workflows/rust-build-and-test.yml'
   workflow_dispatch:
 
 concurrency:
   group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
   cancel-in-progress: true
 
+defaults:
+  run:
+    working-directory: fluss-rust
+
 jobs:
   build-and-unit-test:
     timeout-minutes: 60
@@ -58,6 +69,8 @@ jobs:
 
       - name: Rust Cache
         uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
+        with:
+          workspaces: fluss-rust
 
       - name: Build
         run: cargo build --workspace --all-targets --exclude fluss_python --exclude fluss-cpp --exclude fluss_nif
@@ -67,24 +80,3 @@ jobs:
         env:
           RUST_LOG: DEBUG
           RUST_BACKTRACE: full
-
-  integration-test:
-    needs: build-and-unit-test
-    timeout-minutes: 60
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v6
-
-      - name: Install protoc
-        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
-        with:
-          repo-token: ${{ secrets.GITHUB_TOKEN }}
-
-      - name: Rust Cache
-        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
-
-      - name: Integration Test
-        run: cargo test --features integration_tests --test test_fluss -p fluss-rs
-        env:
-          RUST_LOG: DEBUG
-          RUST_BACKTRACE: full
diff --git a/fluss-rust/.github/workflows/check_documentation.yml b/.github/workflows/rust-docs-check.yml
similarity index 82%
rename from fluss-rust/.github/workflows/check_documentation.yml
rename to .github/workflows/rust-docs-check.yml
index 70e6a438d2..e2e6e72059 100644
--- a/fluss-rust/.github/workflows/check_documentation.yml
+++ b/.github/workflows/rust-docs-check.yml
@@ -16,26 +16,28 @@
 # limitations under the License.
 ################################################################################
 
-# This workflow is meant for checking broken links in the documentation.
-name: Documentation Check
+# Checks for broken links in the fluss-rust client documentation.
+name: Rust Documentation Check
 permissions:
   contents: read
 on:
   pull_request:
     branches: [main]
     paths:
-      - 'website/**'
+      - 'fluss-rust/website/**'
+      - '.github/workflows/rust-docs-check.yml'
   push:
     branches: [main]
     paths:
-      - 'website/**'
+      - 'fluss-rust/website/**'
+      - '.github/workflows/rust-docs-check.yml'
 
 jobs:
   check-documentation:
     runs-on: ubuntu-latest
     defaults:
       run:
-        working-directory: ./website
+        working-directory: fluss-rust/website
     steps:
       - uses: actions/checkout@v6
         with:
diff --git a/fluss-rust/.github/workflows/check_license_and_formatting.yml b/.github/workflows/rust-license-and-format.yml
similarity index 69%
rename from fluss-rust/.github/workflows/check_license_and_formatting.yml
rename to .github/workflows/rust-license-and-format.yml
index 881af9f927..2c2d4f6b41 100644
--- a/fluss-rust/.github/workflows/check_license_and_formatting.yml
+++ b/.github/workflows/rust-license-and-format.yml
@@ -15,27 +15,47 @@
 # specific language governing permissions and limitations
 # under the License.
 
-name: License and Formatting Check
+name: Rust License and Formatting Check
 
 on:
   push:
     branches:
       - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
+    paths:
+      - 'fluss-rust/crates/**'
+      - 'fluss-rust/bindings/**'
+      - 'fluss-rust/Cargo.toml'
+      - 'fluss-rust/Cargo.lock'
+      - 'fluss-rust/deny.toml'
+      - 'fluss-rust/.licenserc.yaml'
+      - 'fluss-rust/rustfmt.toml'
+      - 'fluss-rust/rust-toolchain.toml'
+      - 'fluss-rpc/src/main/proto/**'
+      - '.github/workflows/rust-license-and-format.yml'
   pull_request:
     branches:
       - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
+    paths:
+      - 'fluss-rust/crates/**'
+      - 'fluss-rust/bindings/**'
+      - 'fluss-rust/Cargo.toml'
+      - 'fluss-rust/Cargo.lock'
+      - 'fluss-rust/deny.toml'
+      - 'fluss-rust/.licenserc.yaml'
+      - 'fluss-rust/rustfmt.toml'
+      - 'fluss-rust/rust-toolchain.toml'
+      - 'fluss-rpc/src/main/proto/**'
+      - '.github/workflows/rust-license-and-format.yml'
   workflow_dispatch:
 
 concurrency:
   group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
   cancel-in-progress: true
 
+defaults:
+  run:
+    working-directory: fluss-rust
+
 jobs:
   check-license-and-formatting:
     runs-on: ubuntu-latest
@@ -44,6 +64,8 @@ jobs:
 
       - name: Check License Header
         uses: apache/skywalking-eyes/header@61275cc80d0798a405cb070f7d3a8aaf7cf2c2c1 # v0.8.0
+        with:
+          config: fluss-rust/.licenserc.yaml
 
       - name: Install cargo-deny
         uses: taiki-e/install-action@v2
@@ -60,6 +82,8 @@ jobs:
 
       - name: Rust Cache
         uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
+        with:
+          workspaces: fluss-rust
 
       - name: Format
         run: cargo fmt --all -- --check
diff --git a/fluss-rust/.github/workflows/release_rust.yml b/.github/workflows/rust-release.yml
similarity index 80%
rename from fluss-rust/.github/workflows/release_rust.yml
rename to .github/workflows/rust-release.yml
index 946b2b26a8..d2f8901400 100644
--- a/fluss-rust/.github/workflows/release_rust.yml
+++ b/.github/workflows/rust-release.yml
@@ -28,6 +28,10 @@ on:
     tags:
       - "v*"  # Only version-like tags (e.g. v0.1.0, v0.1.0-rc1); avoids running on arbitrary tags
 
+defaults:
+  run:
+    working-directory: fluss-rust
+
 jobs:
   publish:
     runs-on: ubuntu-latest
@@ -41,11 +45,16 @@ jobs:
       - name: Install protoc
         run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
 
+      # build.rs reads the canonical proto from the in-repo fluss-rpc, which is
+      # outside the published crate; vendor it so the crate publishes standalone.
+      - name: Vendor canonical proto into the crate
+        run: scripts/vendor-proto.sh
+
       - name: Dry run (crates/fluss)
-        run: cargo publish -p fluss-rs --dry-run
+        run: cargo publish -p fluss-rs --dry-run --allow-dirty
 
       - name: Publish fluss-rs to crates.io
         if: startsWith(github.ref, 'refs/tags/') && !contains(github.ref, '-')
-        run: cargo publish -p fluss-rs
+        run: cargo publish -p fluss-rs --allow-dirty
         env:
           CARGO_REGISTRY_TOKEN: ${{ secrets.CARGO_REGISTRY_TOKEN }}
diff --git a/fluss-rust/.asf.yaml b/fluss-rust/.asf.yaml
deleted file mode 100644
index fae1722d2f..0000000000
--- a/fluss-rust/.asf.yaml
+++ /dev/null
@@ -1,47 +0,0 @@
-#  Licensed to the Apache Software Foundation (ASF) under one
-#  or more contributor license agreements.  See the NOTICE file
-#  distributed with this work for additional information
-#  regarding copyright ownership.  The ASF licenses this file
-#  to you under the Apache License, Version 2.0 (the
-#  "License"); you may not use this file except in compliance
-#  with the License.  You may obtain a copy of the License at
-#
-#    http://www.apache.org/licenses/LICENSE-2.0
-#
-#  Unless required by applicable law or agreed to in writing,
-#  software distributed under the License is distributed on an
-#  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-#  KIND, either express or implied.  See the License for the
-#  specific language governing permissions and limitations
-#  under the License.
-
-# See: https://cwiki.apache.org/confluence/display/INFRA/git+-+.asf.yaml+features
-
-github:
-  description: "Rust Client for Apache Fluss (Incubating)"
-  homepage: https://clients.fluss.apache.org/
-  ghp_branch: gh-pages
-  ghp_path: /
-  features:
-    issues: true
-    projects: false
-    discussions: false
-    wiki: false
-  labels:
-    - fluss
-    - streaming
-    - real-time-analytics
-    - lakehouse
-    - rust
-    - python
-  enabled_merge_buttons:
-    squash:  true
-    merge:   false
-    rebase:  true
-notifications:
-  commits:      commits@fluss.apache.org
-  issues:       issues@fluss.apache.org
-  pullrequests: issues@fluss.apache.org
-  jobs:         builds@fluss.apache.org
-  discussions:  issues@fluss.apache.org
-
diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml b/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml
deleted file mode 100644
index aadd86da4e..0000000000
--- a/fluss-rust/.github/ISSUE_TEMPLATE/bug.yml
+++ /dev/null
@@ -1,58 +0,0 @@
-################################################################################
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-################################################################################
-
-name: Bug report 🐞
-description: Problems, bugs and issues with Fluss
-type: "bug"
-body:
-  - type: markdown
-    attributes:
-      value: |
-        Thank you very much for your feedback!
-  - type: checkboxes
-    attributes:
-      label: Search before asking
-      description: >
-        Please search [issues](https://github.com/apache/fluss-rust/issues) to check if your issue has already been reported.
-      options:
-        - label: >
-            I searched in the [issues](https://github.com/apache/fluss-rust/issues) and found nothing similar.
-          required: true
-  - type: textarea
-    attributes:
-      label: Please describe the bug 🐞
-      description: >
-        Please describe the problem, what to expect, and how to reproduce.
-        Feel free to include stacktraces and the Fluss server/client configuration.
-        You can include files by dragging and dropping them here.
-    validations:
-      required: true
-  - type: textarea
-    attributes:
-      label: Solution
-      description: Describe the proposed solution about how to fix it if any.
-  - type: checkboxes
-    attributes:
-      label: Are you willing to submit a PR?
-      description: >
-        We look forward to the community of developers or users helping solve Fluss problems together. If you are willing to submit a PR to fix this problem, please check the box.
-      options:
-        - label: I'm willing to submit a PR!
-  - type: markdown
-    attributes:
-      value: "Thanks for completing our form!"
diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/config.yml b/fluss-rust/.github/ISSUE_TEMPLATE/config.yml
deleted file mode 100644
index c2520da489..0000000000
--- a/fluss-rust/.github/ISSUE_TEMPLATE/config.yml
+++ /dev/null
@@ -1,19 +0,0 @@
-################################################################################
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-################################################################################
-
-blank_issues_enabled: false
diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml b/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml
deleted file mode 100644
index 9f08a60008..0000000000
--- a/fluss-rust/.github/ISSUE_TEMPLATE/feature.yml
+++ /dev/null
@@ -1,58 +0,0 @@
-################################################################################
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-################################################################################
-
-name: Feature Request 🚀
-description: User-facing functionality or improvement you’d like to see added
-type: "feature"
-body:
-  - type: markdown
-    attributes:
-      value: |
-        Thank you very much for your feature proposal!
-  - type: checkboxes
-    attributes:
-      label: Search before asking
-      description: >
-        Please search [issues](https://github.com/apache/fluss-rust/issues) to check if your issue has already been reported.
-      options:
-        - label: >
-            I searched in the [issues](https://github.com/apache/fluss-rust/issues) and found nothing similar.
-          required: true
-  - type: textarea
-    attributes:
-      label: Motivation
-      description: Please describe the feature and elaborate on the use case and motivation behind it
-    validations:
-      required: true
-  - type: textarea
-    attributes:
-      label: Solution
-      description: Describe the proposed solution and add related materials like links if any.
-  - type: textarea
-    attributes:
-      label: Anything else?
-  - type: checkboxes
-    attributes:
-      label: Willingness to contribute
-      description: >
-        We look forward to the community of developers or users helping develop Fluss features together. If you are willing to submit a PR to implement the feature, please check the box.
-      options:
-        - label: I'm willing to submit a PR!
-  - type: markdown
-    attributes:
-      value: "Thanks for completing our form!"
diff --git a/fluss-rust/.github/ISSUE_TEMPLATE/task.yml b/fluss-rust/.github/ISSUE_TEMPLATE/task.yml
deleted file mode 100644
index dddc621f28..0000000000
--- a/fluss-rust/.github/ISSUE_TEMPLATE/task.yml
+++ /dev/null
@@ -1,51 +0,0 @@
-################################################################################
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#      http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-################################################################################
-
-name: Task 📌
-description: Specific work item - either part of a larger feature or independent project maintenance
-type: "task"
-body:
-  - type: markdown
-    attributes:
-      value: |
-        Thank you very much for your work!
-  - type: checkboxes
-    attributes:
-      label: Search before asking
-      description: >
-        Please search [issues](https://github.com/apache/fluss-rust/issues) to check if your issue has already been reported.
-      options:
-        - label: >
-            I searched in the [issues](https://github.com/apache/fluss-rust/issues) and found nothing similar.
-          required: true
-  - type: textarea
-    attributes:
-      label: Description
-      description: Please describe the task and the purpose of the work.
-    validations:
-      required: true
-  - type: checkboxes
-    attributes:
-      label: Willingness to contribute
-      description: >
-        We look forward to the community of developers or users helping develop Fluss together. If you are willing to submit a PR to implement the task, please check the box.
-      options:
-        - label: I'm willing to submit a PR!
-  - type: markdown
-    attributes:
-      value: "Thanks for completing our form!"
diff --git a/fluss-rust/.github/PULL_REQUEST_TEMPLATE.md b/fluss-rust/.github/PULL_REQUEST_TEMPLATE.md
deleted file mode 100644
index 5e03d8df9c..0000000000
--- a/fluss-rust/.github/PULL_REQUEST_TEMPLATE.md
+++ /dev/null
@@ -1,41 +0,0 @@
-<!--
-*Thank you very much for contributing to Fluss - we are happy that you want to help us improve Fluss. To help the community review your contribution in the best possible way, please go through the checklist below, which will get the contribution into a shape in which it can be best reviewed.*
-
-## Contribution Checklist
-
-  - Make sure that the pull request corresponds to a [GitHub issue](https://github.com/apache/fluss-rust/issues). Exceptions are made for typos in JavaDoc or documentation files, which need no issue.
-
-  - Name the pull request in the format "[component] Title of the pull request", where *[component]* should be replaced by the name of the component being changed. Typically, this corresponds to the component label assigned to the issue (e.g., [kv], [log], [client], [flink]). Skip *[component]* if you are unsure about which is the best component.
-
-  - Fill out the template below to describe the changes contributed by the pull request. That will give reviewers the context they need to do the review.
-
-  - Make sure that the change passes the automated tests, i.e., `mvn clean verify` passes.
-
-  - Each pull request should address only one issue, not mix up code from multiple issues.
-
-
-**(The sections below can be removed for hotfixes or typos)**
--->
-
-### Purpose
-
-<!-- Linking this pull request to the issue -->
-Linked issue: close #xxx
-
-<!-- What is the purpose of the change -->
-
-### Brief change log
-
-<!-- Please describe the changes made in this pull request and explain how they address the issue -->
-
-### Tests
-
-<!-- List UT and IT cases to verify this change -->
-
-### API and Format
-
-<!-- Does this change affect API or storage format -->
-
-### Documentation
-
-<!-- Does this change introduce a new feature -->
diff --git a/fluss-rust/.github/workflows/build_and_test_cpp.yml b/fluss-rust/.github/workflows/build_and_test_cpp.yml
deleted file mode 100644
index 9ede0c3e3c..0000000000
--- a/fluss-rust/.github/workflows/build_and_test_cpp.yml
+++ /dev/null
@@ -1,90 +0,0 @@
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#   http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an
-# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied.  See the License for the
-# specific language governing permissions and limitations
-# under the License.
-
-name: C++ Build and Tests
-
-on:
-  push:
-    branches:
-      - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
-  pull_request:
-    branches:
-      - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
-      - 'bindings/python/**'
-      - 'bindings/elixir/**'
-  workflow_dispatch:
-
-concurrency:
-  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
-  cancel-in-progress: true
-
-jobs:
-  build-and-test:
-    timeout-minutes: 60
-    runs-on: ubuntu-latest
-    env:
-      FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/target/debug/fluss-test-cluster
-    steps:
-      - uses: actions/checkout@v6
-
-      - name: Install protoc
-        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
-        with:
-          repo-token: ${{ secrets.GITHUB_TOKEN }}
-
-      - name: Install Apache Arrow C++
-        run: |
-          sudo apt-get install -y -V ca-certificates lsb-release wget
-          wget https://apache.jfrog.io/artifactory/arrow/$(lsb_release --id --short | tr 'A-Z' 'a-z')/apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
-          sudo apt-get install -y -V ./apache-arrow-apt-source-latest-$(lsb_release --codename --short).deb
-          sudo apt-get update
-          sudo apt-get install -y -V libarrow-dev
-
-      - name: Rust Cache
-        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
-
-      - name: Setup sccache
-        uses: mozilla-actions/sccache-action@7d986dd989559c6ecdb630a3fd2557667be217ad # v0.0.9
-
-      - name: Build fluss-test-cluster binary
-        run: cargo build -p fluss-test-cluster
-
-      - name: Build C++ bindings and tests
-        working-directory: bindings/cpp
-        env:
-          SCCACHE_GHA_ENABLED: "true"
-        run: |
-          cmake -B build \
-            -DFLUSS_ENABLE_TESTING=ON \
-            -DCMAKE_BUILD_TYPE=Debug \
-            -DCMAKE_C_COMPILER_LAUNCHER=sccache \
-            -DCMAKE_CXX_COMPILER_LAUNCHER=sccache
-          cmake --build build --parallel
-          sccache --show-stats
-
-      - name: Run C++ integration tests (parallel)
-        working-directory: bindings/cpp
-        run: cd build && ctest -j$(nproc) --output-on-failure --timeout 300
-        env:
-          RUST_LOG: DEBUG
-          RUST_BACKTRACE: full
diff --git a/fluss-rust/.github/workflows/build_and_test_elixir.yml b/fluss-rust/.github/workflows/build_and_test_elixir.yml
deleted file mode 100644
index 03f3329e0f..0000000000
--- a/fluss-rust/.github/workflows/build_and_test_elixir.yml
+++ /dev/null
@@ -1,103 +0,0 @@
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#   http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an
-# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied.  See the License for the
-# specific language governing permissions and limitations
-# under the License.
-
-name: Elixir Build and Tests
-
-on:
-  push:
-    branches:
-      - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
-  pull_request:
-    branches:
-      - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
-      - 'bindings/cpp/**'
-      - 'bindings/python/**'
-  workflow_dispatch:
-
-concurrency:
-  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
-  cancel-in-progress: true
-
-jobs:
-  build-and-test:
-    timeout-minutes: 60
-    runs-on: ubuntu-latest
-    env:
-      OTP_VERSION: "28.0.2"
-      ELIXIR_VERSION: "1.19.5"
-      FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/target/debug/fluss-test-cluster
-      MIX_ENV: test
-    steps:
-      - uses: actions/checkout@v6
-
-      - name: Set up BEAM
-        uses: erlef/setup-beam@fc68ffb90438ef2936bbb3251622353b3dcb2f93 # v1.24.0
-        with:
-          otp-version: ${{ env.OTP_VERSION }}
-          elixir-version: ${{ env.ELIXIR_VERSION }}
-
-      - name: Install protoc
-        run: sudo apt-get update && sudo apt-get install -y protobuf-compiler
-
-      - name: Rust Cache
-        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
-
-      - name: Cache Mix deps and build
-        uses: actions/cache@v4
-        with:
-          path: |
-            bindings/elixir/deps
-            bindings/elixir/_build
-          key: ${{ runner.os }}-mix-otp${{ env.OTP_VERSION }}-elixir${{ env.ELIXIR_VERSION }}-${{ hashFiles('bindings/elixir/mix.lock') }}
-          restore-keys: |
-            ${{ runner.os }}-mix-otp${{ env.OTP_VERSION }}-elixir${{ env.ELIXIR_VERSION }}-
-
-      - name: Build fluss-test-cluster binary
-        run: cargo build -p fluss-test-cluster
-
-      - name: Fetch Elixir deps
-        working-directory: bindings/elixir
-        run: mix deps.get
-
-      - name: Check formatting
-        working-directory: bindings/elixir
-        run: mix format --check-formatted
-
-      - name: Compile (warnings as errors)
-        working-directory: bindings/elixir
-        run: mix compile --warnings-as-errors
-
-      - name: Credo
-        working-directory: bindings/elixir
-        run: mix credo
-
-      - name: Run unit tests
-        working-directory: bindings/elixir
-        run: mix test
-
-      - name: Run integration tests
-        working-directory: bindings/elixir
-        run: mix test --include integration --only integration
-        env:
-          RUST_LOG: DEBUG
-          RUST_BACKTRACE: full
diff --git a/fluss-rust/.github/workflows/build_and_test_python.yml b/fluss-rust/.github/workflows/build_and_test_python.yml
deleted file mode 100644
index a8d3f05b47..0000000000
--- a/fluss-rust/.github/workflows/build_and_test_python.yml
+++ /dev/null
@@ -1,100 +0,0 @@
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#   http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an
-# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied.  See the License for the
-# specific language governing permissions and limitations
-# under the License.
-
-name: Python Build and Tests
-
-on:
-  push:
-    branches:
-      - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
-  pull_request:
-    branches:
-      - main
-    paths-ignore:
-      - 'website/**'
-      - '**/*.md'
-      - 'bindings/cpp/**'
-      - 'bindings/elixir/**'
-  workflow_dispatch:
-
-concurrency:
-  group: ${{ github.workflow }}-${{ github.ref }}-${{ github.event_name }}
-  cancel-in-progress: true
-
-jobs:
-  build-and-test:
-    timeout-minutes: 60
-    runs-on: ubuntu-latest
-    strategy:
-      matrix:
-        python: ["3.9", "3.10", "3.11", "3.12"]
-    env:
-      FLUSS_TEST_CLUSTER_BIN: ${{ github.workspace }}/target/debug/fluss-test-cluster
-    steps:
-      - uses: actions/checkout@v6
-
-      - name: Set up Python
-        uses: actions/setup-python@v6
-        with:
-          python-version: ${{ matrix.python }}
-
-      - name: Install uv
-        uses: astral-sh/setup-uv@37802adc94f370d6bfd71619e3f0bf239e1f3b78
-
-      - name: Install protoc
-        uses: arduino/setup-protoc@c65c819552d16ad3c9b72d9dfd5ba5237b9c906b # v3.0.0
-        with:
-          repo-token: ${{ secrets.GITHUB_TOKEN }}
-
-      - name: Rust Cache
-        uses: Swatinem/rust-cache@c19371144df3bb44fab255c43d04cbc2ab54d1c4 # v2.9.1
-
-      - name: Build fluss-test-cluster binary
-        run: cargo build -p fluss-test-cluster
-
-      - name: Build Python bindings
-        working-directory: bindings/python
-        run: |
-          uv sync --extra dev --no-install-project
-          uv run --no-sync maturin develop --uv
-
-      - name: Run tests (parallel)
-        working-directory: bindings/python
-        run: uv run --no-sync pytest test/ -v -n 2 --dist=loadfile
-        env:
-          RUST_LOG: DEBUG
-          RUST_BACKTRACE: full
-          FLUSS_SKIP_CLUSTER_TEARDOWN: "1"
-
-      - name: Dump fluss cluster container logs
-        if: always()
-        run: |
-          mkdir -p cluster-logs
-          for c in $(docker ps -a --filter "name=shared-test" --format '{{.Names}}'); do
-            docker logs "$c" > "cluster-logs/$c.log" 2>&1 || true
-          done
-
-      - uses: actions/upload-artifact@v4
-        if: always()
-        with:
-          name: cluster-logs-${{ matrix.python }}
-          path: cluster-logs/
-          if-no-files-found: ignore
-          retention-days: 3
diff --git a/fluss-rust/.github/workflows/deploy_documentation.yml b/fluss-rust/.github/workflows/deploy_documentation.yml
deleted file mode 100644
index 05d8f1c1b8..0000000000
--- a/fluss-rust/.github/workflows/deploy_documentation.yml
+++ /dev/null
@@ -1,81 +0,0 @@
-# Licensed to the Apache Software Foundation (ASF) under one
-# or more contributor license agreements.  See the NOTICE file
-# distributed with this work for additional information
-# regarding copyright ownership.  The ASF licenses this file
-# to you under the Apache License, Version 2.0 (the
-# "License"); you may not use this file except in compliance
-# with the License.  You may obtain a copy of the License at
-#
-#   http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing,
-# software distributed under the License is distributed on an
-# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
-# KIND, either express or implied.  See the License for the
-# specific language governing permissions and limitations
-# under the License.
-
-name: Deploy Documentation
-
-on:
-  workflow_dispatch:
-
-permissions:
-  contents: write
-
-jobs:
-  deploy:
-    runs-on: ubuntu-latest
-    defaults:
-      run:
-        working-directory: ./website
-    steps:
-      - uses: actions/checkout@v6
-        with:
-          fetch-depth: 0
-
-      - uses: actions/setup-node@v6
-        with:
-          node-version: 24
-
-      - name: Install dependencies
-        run: npm install
-
-      - name: Build website
-        run: npm run build
-
-      - name: Deploy to gh-pages branch
-        working-directory: .
-        env:
-          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
-        run: |
-          git config user.name "github-actions[bot]"
-          git config user.email "github-actions[bot]@users.noreply.github.com"
-
-          # Create a temporary directory with the built site
-          TMPDIR=$(mktemp -d)
-          cp -r website/build/* "$TMPDIR"
-
-          # Switch to the gh-pages branch (create orphan if it doesn't exist)
-          if git ls-remote --exit-code origin gh-pages; then
-            git fetch origin gh-pages
-            git checkout gh-pages
-          else
-            git checkout --orphan gh-pages
-            git rm -rf .
-          fi
-
-          # Replace contents with the new build
-          git rm -rf . || true
-          git clean -fdx
-          cp -r "$TMPDIR"/* .
-          rm -rf "$TMPDIR"
-
-          # Commit and push
-          git add -A
-          if git diff --cached --quiet; then
-            echo "No changes to deploy."
-          else
-            git commit -m "Deploy website from ${GITHUB_SHA::8}"
-            git push origin gh-pages
-          fi
diff --git a/fluss-rust/.licenserc.yaml b/fluss-rust/.licenserc.yaml
index 5fcd99829a..a3647d7f27 100644
--- a/fluss-rust/.licenserc.yaml
+++ b/fluss-rust/.licenserc.yaml
@@ -20,16 +20,20 @@ header:
     spdx-id: Apache-2.0
     copyright-owner: Apache Software Foundation
 
+  paths:
+    - 'fluss-rust/**'
+
   paths-ignore:
+    # bare (gitignore-style) patterns match the basename at any depth
     - '.gitignore'
     - 'Cargo.lock'
     - 'LICENSE'
     - 'NOTICE'
     - 'DISCLAIMER'
-    - 'bindings/python/fluss/py.typed'
-    - '**/mix.lock'
-    - 'website/**'
+    - 'fluss-rust/bindings/python/fluss/py.typed'
+    - 'fluss-rust/**/mix.lock'
+    - 'fluss-rust/website/**'
     - '**/*.md'
-    - '**/DEPENDENCIES.*.tsv'
-    - '**/*.env'
+    - 'fluss-rust/**/DEPENDENCIES.*.tsv'
+    - 'fluss-rust/**/*.env'
   comment: on-failure
diff --git a/fluss-rust/Cargo.lock b/fluss-rust/Cargo.lock
index f409723ed2..4570d4d81c 100644
--- a/fluss-rust/Cargo.lock
+++ b/fluss-rust/Cargo.lock
@@ -1079,7 +1079,7 @@ dependencies = [
 
 [[package]]
 name = "fluss-cpp"
-version = "0.2.0"
+version = "1.0.0"
 dependencies = [
  "anyhow",
  "arrow",
@@ -1092,7 +1092,7 @@ dependencies = [
 
 [[package]]
 name = "fluss-examples"
-version = "0.2.0"
+version = "1.0.0"
 dependencies = [
  "clap",
  "fluss-rs",
@@ -1102,7 +1102,7 @@ dependencies = [
 
 [[package]]
 name = "fluss-rs"
-version = "0.2.0"
+version = "1.0.0"
 dependencies = [
  "arrow",
  "arrow-schema",
@@ -1143,7 +1143,7 @@ dependencies = [
 
 [[package]]
 name = "fluss-test-cluster"
-version = "0.2.0"
+version = "1.0.0"
 dependencies = [
  "clap",
  "fluss-rs",
@@ -1155,7 +1155,7 @@ dependencies = [
 
 [[package]]
 name = "fluss_nif"
-version = "0.2.0"
+version = "1.0.0"
 dependencies = [
  "bigdecimal",
  "fluss-rs",
@@ -1165,7 +1165,7 @@ dependencies = [
 
 [[package]]
 name = "fluss_python"
-version = "0.2.0"
+version = "1.0.0"
 dependencies = [
  "arrow",
  "arrow-array",
diff --git a/fluss-rust/Cargo.toml b/fluss-rust/Cargo.toml
index 8f811c82ce..a555a9198a 100644
--- a/fluss-rust/Cargo.toml
+++ b/fluss-rust/Cargo.toml
@@ -23,7 +23,7 @@ homepage = "https://clients.fluss.apache.org/"
 license = "Apache-2.0"
 repository = "https://github.com/apache/fluss-rust"
 rust-version = "1.85"
-version = "0.2.0"
+version = "1.0.0"
 keywords = ["fluss", "streaming-storage", "datalake"]
 
 [workspace]
@@ -31,7 +31,7 @@ resolver = "2"
 members = ["crates/fluss", "crates/fluss-test-cluster", "crates/examples", "bindings/python", "bindings/cpp", "bindings/elixir/native/fluss_nif"]
 
 [workspace.dependencies]
-fluss = { package = "fluss-rs", version = "0.2.0", path = "crates/fluss", features = ["storage-all"] }
+fluss = { package = "fluss-rs", version = "1.0.0", path = "crates/fluss", features = ["storage-all"] }
 tokio = { version = "1.44.2", features = ["full"] }
 clap = { version = "4.5.37", features = ["derive"] }
 arrow = { version = "57.0.0", features = ["ipc_compression", "ffi"] }
diff --git a/fluss-rust/DISCLAIMER b/fluss-rust/DISCLAIMER
deleted file mode 100644
index ddc4f01632..0000000000
--- a/fluss-rust/DISCLAIMER
+++ /dev/null
@@ -1,10 +0,0 @@
-Apache Fluss (incubating) is an effort undergoing incubation at The Apache
-Software Foundation (ASF), sponsored by the Apache Incubator PMC.
-
-Incubation is required of all newly accepted projects until a further review
-indicates that the infrastructure, communications, and decision making process
-have stabilized in a manner consistent with other successful ASF projects.
-
-While incubation status is not necessarily a reflection of the completeness
-or stability of the code, it does indicate that the project has yet to be
-fully endorsed by the ASF.
\ No newline at end of file
diff --git a/fluss-rust/LICENSE b/fluss-rust/LICENSE
deleted file mode 100644
index 261eeb9e9f..0000000000
--- a/fluss-rust/LICENSE
+++ /dev/null
@@ -1,201 +0,0 @@
-                                 Apache License
-                           Version 2.0, January 2004
-                        http://www.apache.org/licenses/
-
-   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-   1. Definitions.
-
-      "License" shall mean the terms and conditions for use, reproduction,
-      and distribution as defined by Sections 1 through 9 of this document.
-
-      "Licensor" shall mean the copyright owner or entity authorized by
-      the copyright owner that is granting the License.
-
-      "Legal Entity" shall mean the union of the acting entity and all
-      other entities that control, are controlled by, or are under common
-      control with that entity. For the purposes of this definition,
-      "control" means (i) the power, direct or indirect, to cause the
-      direction or management of such entity, whether by contract or
-      otherwise, or (ii) ownership of fifty percent (50%) or more of the
-      outstanding shares, or (iii) beneficial ownership of such entity.
-
-      "You" (or "Your") shall mean an individual or Legal Entity
-      exercising permissions granted by this License.
-
-      "Source" form shall mean the preferred form for making modifications,
-      including but not limited to software source code, documentation
-      source, and configuration files.
-
-      "Object" form shall mean any form resulting from mechanical
-      transformation or translation of a Source form, including but
-      not limited to compiled object code, generated documentation,
-      and conversions to other media types.
-
-      "Work" shall mean the work of authorship, whether in Source or
-      Object form, made available under the License, as indicated by a
-      copyright notice that is included in or attached to the work
-      (an example is provided in the Appendix below).
-
-      "Derivative Works" shall mean any work, whether in Source or Object
-      form, that is based on (or derived from) the Work and for which the
-      editorial revisions, annotations, elaborations, or other modifications
-      represent, as a whole, an original work of authorship. For the purposes
-      of this License, Derivative Works shall not include works that remain
-      separable from, or merely link (or bind by name) to the interfaces of,
-      the Work and Derivative Works thereof.
-
-      "Contribution" shall mean any work of authorship, including
-      the original version of the Work and any modifications or additions
-      to that Work or Derivative Works thereof, that is intentionally
-      submitted to Licensor for inclusion in the Work by the copyright owner
-      or by an individual or Legal Entity authorized to submit on behalf of
-      the copyright owner. For the purposes of this definition, "submitted"
-      means any form of electronic, verbal, or written communication sent
-      to the Licensor or its representatives, including but not limited to
-      communication on electronic mailing lists, source code control systems,
-      and issue tracking systems that are managed by, or on behalf of, the
-      Licensor for the purpose of discussing and improving the Work, but
-      excluding communication that is conspicuously marked or otherwise
-      designated in writing by the copyright owner as "Not a Contribution."
-
-      "Contributor" shall mean Licensor and any individual or Legal Entity
-      on behalf of whom a Contribution has been received by Licensor and
-      subsequently incorporated within the Work.
-
-   2. Grant of Copyright License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      copyright license to reproduce, prepare Derivative Works of,
-      publicly display, publicly perform, sublicense, and distribute the
-      Work and such Derivative Works in Source or Object form.
-
-   3. Grant of Patent License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      (except as stated in this section) patent license to make, have made,
-      use, offer to sell, sell, import, and otherwise transfer the Work,
-      where such license applies only to those patent claims licensable
-      by such Contributor that are necessarily infringed by their
-      Contribution(s) alone or by combination of their Contribution(s)
-      with the Work to which such Contribution(s) was submitted. If You
-      institute patent litigation against any entity (including a
-      cross-claim or counterclaim in a lawsuit) alleging that the Work
-      or a Contribution incorporated within the Work constitutes direct
-      or contributory patent infringement, then any patent licenses
-      granted to You under this License for that Work shall terminate
-      as of the date such litigation is filed.
-
-   4. Redistribution. You may reproduce and distribute copies of the
-      Work or Derivative Works thereof in any medium, with or without
-      modifications, and in Source or Object form, provided that You
-      meet the following conditions:
-
-      (a) You must give any other recipients of the Work or
-          Derivative Works a copy of this License; and
-
-      (b) You must cause any modified files to carry prominent notices
-          stating that You changed the files; and
-
-      (c) You must retain, in the Source form of any Derivative Works
-          that You distribute, all copyright, patent, trademark, and
-          attribution notices from the Source form of the Work,
-          excluding those notices that do not pertain to any part of
-          the Derivative Works; and
-
-      (d) If the Work includes a "NOTICE" text file as part of its
-          distribution, then any Derivative Works that You distribute must
-          include a readable copy of the attribution notices contained
-          within such NOTICE file, excluding those notices that do not
-          pertain to any part of the Derivative Works, in at least one
-          of the following places: within a NOTICE text file distributed
-          as part of the Derivative Works; within the Source form or
-          documentation, if provided along with the Derivative Works; or,
-          within a display generated by the Derivative Works, if and
-          wherever such third-party notices normally appear. The contents
-          of the NOTICE file are for informational purposes only and
-          do not modify the License. You may add Your own attribution
-          notices within Derivative Works that You distribute, alongside
-          or as an addendum to the NOTICE text from the Work, provided
-          that such additional attribution notices cannot be construed
-          as modifying the License.
-
-      You may add Your own copyright statement to Your modifications and
-      may provide additional or different license terms and conditions
-      for use, reproduction, or distribution of Your modifications, or
-      for any such Derivative Works as a whole, provided Your use,
-      reproduction, and distribution of the Work otherwise complies with
-      the conditions stated in this License.
-
-   5. Submission of Contributions. Unless You explicitly state otherwise,
-      any Contribution intentionally submitted for inclusion in the Work
-      by You to the Licensor shall be under the terms and conditions of
-      this License, without any additional terms or conditions.
-      Notwithstanding the above, nothing herein shall supersede or modify
-      the terms of any separate license agreement you may have executed
-      with Licensor regarding such Contributions.
-
-   6. Trademarks. This License does not grant permission to use the trade
-      names, trademarks, service marks, or product names of the Licensor,
-      except as required for reasonable and customary use in describing the
-      origin of the Work and reproducing the content of the NOTICE file.
-
-   7. Disclaimer of Warranty. Unless required by applicable law or
-      agreed to in writing, Licensor provides the Work (and each
-      Contributor provides its Contributions) on an "AS IS" BASIS,
-      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-      implied, including, without limitation, any warranties or conditions
-      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-      PARTICULAR PURPOSE. You are solely responsible for determining the
-      appropriateness of using or redistributing the Work and assume any
-      risks associated with Your exercise of permissions under this License.
-
-   8. Limitation of Liability. In no event and under no legal theory,
-      whether in tort (including negligence), contract, or otherwise,
-      unless required by applicable law (such as deliberate and grossly
-      negligent acts) or agreed to in writing, shall any Contributor be
-      liable to You for damages, including any direct, indirect, special,
-      incidental, or consequential damages of any character arising as a
-      result of this License or out of the use or inability to use the
-      Work (including but not limited to damages for loss of goodwill,
-      work stoppage, computer failure or malfunction, or any and all
-      other commercial damages or losses), even if such Contributor
-      has been advised of the possibility of such damages.
-
-   9. Accepting Warranty or Additional Liability. While redistributing
-      the Work or Derivative Works thereof, You may choose to offer,
-      and charge a fee for, acceptance of support, warranty, indemnity,
-      or other liability obligations and/or rights consistent with this
-      License. However, in accepting such obligations, You may act only
-      on Your own behalf and on Your sole responsibility, not on behalf
-      of any other Contributor, and only if You agree to indemnify,
-      defend, and hold each Contributor harmless for any liability
-      incurred by, or claims asserted against, such Contributor by reason
-      of your accepting any such warranty or additional liability.
-
-   END OF TERMS AND CONDITIONS
-
-   APPENDIX: How to apply the Apache License to your work.
-
-      To apply the Apache License to your work, attach the following
-      boilerplate notice, with the fields enclosed by brackets "[]"
-      replaced with your own identifying information. (Don't include
-      the brackets!)  The text should be enclosed in the appropriate
-      comment syntax for the file format. We also recommend that a
-      file or class name and description of purpose be included on the
-      same "printed page" as the copyright notice for easier
-      identification within third-party archives.
-
-   Copyright [yyyy] [name of copyright owner]
-
-   Licensed under the Apache License, Version 2.0 (the "License");
-   you may not use this file except in compliance with the License.
-   You may obtain a copy of the License at
-
-       http://www.apache.org/licenses/LICENSE-2.0
-
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License.
diff --git a/fluss-rust/NOTICE b/fluss-rust/NOTICE
deleted file mode 100644
index 1ec5da05df..0000000000
--- a/fluss-rust/NOTICE
+++ /dev/null
@@ -1,5 +0,0 @@
-Apache Fluss Rust (incubating)
-Copyright 2025 The Apache Software Foundation
-
-This product includes software developed at
-The Apache Software Foundation (http://www.apache.org/).
\ No newline at end of file
diff --git a/fluss-rust/bindings/elixir/mix.exs b/fluss-rust/bindings/elixir/mix.exs
index f5d416d807..b83e9f94b9 100644
--- a/fluss-rust/bindings/elixir/mix.exs
+++ b/fluss-rust/bindings/elixir/mix.exs
@@ -18,7 +18,7 @@
 defmodule Fluss.MixProject do
   use Mix.Project
 
-  @version "0.1.0"
+  @version "1.0.0"
 
   def project do
     [
diff --git a/fluss-rust/crates/fluss-test-cluster/src/lib.rs b/fluss-rust/crates/fluss-test-cluster/src/lib.rs
index 041c21b06c..76199f7ed7 100644
--- a/fluss-rust/crates/fluss-test-cluster/src/lib.rs
+++ b/fluss-rust/crates/fluss-test-cluster/src/lib.rs
@@ -101,8 +101,9 @@ impl FlussTestingClusterBuilder {
             sasl_users: Vec::new(),
             coordinator_host_port: 9123,
             plain_client_port: None,
-            image: FLUSS_IMAGE.to_string(),
-            image_tag: FLUSS_VERSION.to_string(),
+            // runtime env overrides the compile-time default (server-compat CI lane)
+            image: std::env::var("FLUSS_IMAGE").unwrap_or_else(|_| FLUSS_IMAGE.to_string()),
+            image_tag: std::env::var("FLUSS_VERSION").unwrap_or_else(|_| FLUSS_VERSION.to_string()),
         }
     }
 
diff --git a/fluss-rust/crates/fluss/build.rs b/fluss-rust/crates/fluss/build.rs
index 040ee52179..65d58e3592 100644
--- a/fluss-rust/crates/fluss/build.rs
+++ b/fluss-rust/crates/fluss/build.rs
@@ -16,15 +16,27 @@
 // under the License.
 
 use std::io::Result;
+use std::path::Path;
 
 fn main() -> Result<()> {
     let mut config = prost_build::Config::new();
+    // Emit `Bytes` for these payload fields; each path is `.<package>.<Message>.<field>`.
     config.bytes([
-        ".proto.PbProduceLogReqForBucket.records",
-        ".proto.PbPutKvReqForBucket.records",
-        ".proto.PbLookupReqForBucket.key",
-        ".proto.PbPrefixLookupReqForBucket.keys",
+        ".fluss.PbProduceLogReqForBucket.records",
+        ".fluss.PbPutKvReqForBucket.records",
+        ".fluss.PbLookupReqForBucket.key",
+        ".fluss.PbPrefixLookupReqForBucket.keys",
     ]);
-    config.compile_protos(&["src/proto/fluss_api.proto"], &["src/proto"])?;
+    // Published crates vendor the proto under proto/ (scripts/vendor-proto.sh);
+    // monorepo builds read the canonical proto directly from fluss-rpc.
+    let (proto, include_dir) = if Path::new("proto/FlussApi.proto").exists() {
+        ("proto/FlussApi.proto", "proto")
+    } else {
+        (
+            "../../../fluss-rpc/src/main/proto/FlussApi.proto",
+            "../../../fluss-rpc/src/main/proto",
+        )
+    };
+    config.compile_protos(&[proto], &[include_dir])?;
     Ok(())
 }
diff --git a/fluss-rust/crates/fluss/src/client/admin.rs b/fluss-rust/crates/fluss/src/client/admin.rs
index 0828b83bfe..1eb2f80bb0 100644
--- a/fluss-rust/crates/fluss/src/client/admin.rs
+++ b/fluss-rust/crates/fluss/src/client/admin.rs
@@ -150,6 +150,7 @@ impl FlussAdmin {
             table_json,
             created_time,
             modified_time,
+            remote_data_dir: _,
         } = response;
         let v: &[u8] = &table_json[..];
         let table_descriptor =
diff --git a/fluss-rust/crates/fluss/src/client/table/scanner.rs b/fluss-rust/crates/fluss/src/client/table/scanner.rs
index 35cc52e309..f0cb320171 100644
--- a/fluss-rust/crates/fluss/src/client/table/scanner.rs
+++ b/fluss-rust/crates/fluss/src/client/table/scanner.rs
@@ -1956,6 +1956,8 @@ impl LogFetcher {
                         projection_pushdown_enabled: projection_enabled,
                         projected_fields: projected_fields.clone(),
                         buckets_req: feq_for_buckets,
+                        filter_predicate: None,
+                        filter_schema_id: None,
                     };
 
                     let fetch_log_request = FetchLogRequest {
@@ -2306,6 +2308,7 @@ mod tests {
                     log_start_offset: None,
                     remote_log_fetch_info: None,
                     records: None,
+                    filtered_end_offset: None,
                 }],
             }],
         };
@@ -2362,6 +2365,7 @@ mod tests {
                     log_start_offset: None,
                     remote_log_fetch_info: None,
                     records: None,
+                    filtered_end_offset: None,
                 }],
             }],
         };
@@ -2699,6 +2703,7 @@ mod tests {
                             log_start_offset: Some(0),
                             remote_log_fetch_info: None,
                             records: None,
+                            filtered_end_offset: None,
                         }],
                     }],
                 };
diff --git a/fluss-rust/crates/fluss/src/lib.rs b/fluss-rust/crates/fluss/src/lib.rs
index 0266e0de6e..027465235c 100644
--- a/fluss-rust/crates/fluss/src/lib.rs
+++ b/fluss-rust/crates/fluss/src/lib.rs
@@ -147,5 +147,7 @@ pub type PartitionId = i64;
 pub type BucketId = i32;
 
 pub mod proto {
-    include!(concat!(env!("OUT_DIR"), "/proto.rs"));
+    // generated from the canonical proto; its doc comments aren't clippy-clean
+    #![allow(clippy::doc_lazy_continuation)]
+    include!(concat!(env!("OUT_DIR"), "/fluss.rs"));
 }
diff --git a/fluss-rust/crates/fluss/src/metadata/partition.rs b/fluss-rust/crates/fluss/src/metadata/partition.rs
index 18402354a5..c63fe296c5 100644
--- a/fluss-rust/crates/fluss/src/metadata/partition.rs
+++ b/fluss-rust/crates/fluss/src/metadata/partition.rs
@@ -300,6 +300,7 @@ impl PartitionInfo {
         PbPartitionInfo {
             partition_id: self.partition_id,
             partition_spec: self.partition_spec.to_pb(),
+            remote_data_dir: None,
         }
     }
 
diff --git a/fluss-rust/crates/fluss/src/proto/fluss_api.proto b/fluss-rust/crates/fluss/src/proto/fluss_api.proto
deleted file mode 100644
index 2add80d7f9..0000000000
--- a/fluss-rust/crates/fluss/src/proto/fluss_api.proto
+++ /dev/null
@@ -1,503 +0,0 @@
-/*
- * Licensed to the Apache Software Foundation (ASF) under one or more
- * contributor license agreements.  See the NOTICE file distributed with
- * this work for additional information regarding copyright ownership.
- * The ASF licenses this file to You under the Apache License, Version 2.0
- * (the "License"); you may not use this file except in compliance with
- * the License.  You may obtain a copy of the License at
- *
- *    http://www.apache.org/licenses/LICENSE-2.0
- *
- * Unless required by applicable law or agreed to in writing, software
- * distributed under the License is distributed on an "AS IS" BASIS,
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- * See the License for the specific language governing permissions and
- * limitations under the License.
- */
-
-syntax = "proto2";
-
-package proto;
-
-message ErrorResponse {
-  required int32 error_code = 1;
-  optional string error_message = 2;
-}
-
-// api versions request and response
-message ApiVersionsRequest {
-  required string client_software_name = 1;
-  required string client_software_version = 2;
-}
-
-message ApiVersionsResponse {
-  repeated PbApiVersion api_versions = 1;
-  optional int32 server_type = 2;
-}
-
-message PbApiVersion {
-  required int32 api_key = 1;
-  required int32 min_version = 2;
-  required int32 max_version = 3;
-}
-
-// metadata request and response, request send from client to each server.
-message MetadataRequest {
-  repeated PbTablePath table_path = 1;
-  repeated PbPhysicalTablePath partitions_path = 2;
-
-  // note: currently, we assume the partition ids must belong to the table_paths in the
-  // metadata request
-  // todo: we won't need the assumption after we introduce metadata cache in server
-  repeated int64 partitions_id = 3 [packed = true];
-}
-
-message MetadataResponse {
-  optional PbServerNode coordinator_server = 1;
-  repeated PbServerNode tablet_servers = 2;
-  repeated PbTableMetadata table_metadata = 3;
-  repeated PbPartitionMetadata partition_metadata = 4;
-}
-
-// produce log request and response
-message ProduceLogRequest {
-  required int32 acks = 1;
-  required int64 table_id = 2;
-  required int32 timeout_ms = 3;
-  repeated PbProduceLogReqForBucket buckets_req = 4;
-}
-
-
-message ProduceLogResponse {
-  repeated PbProduceLogRespForBucket buckets_resp = 1;
-}
-
-
-// --------------- Inner classes ----------------
-message PbTablePath {
-  required string database_name = 1;
-  required string table_name = 2;
-}
-
-message PbPhysicalTablePath {
-  required string database_name = 1;
-  required string table_name = 2;
-  optional string partition_name = 3;
-}
-
-// For MetadataResponse, host and port are still used for all versions.
-// For UpdateMetadataRequest,
-//   * versions <= 0.6: host and port are used.
-//   * versions >= 0.7: listeners is used to replace host and port.
-message PbServerNode {
-  required int32 node_id = 1;
-  required string host = 2;
-  required int32 port = 3;
-  optional string listeners = 4;
-}
-
-message PbTableMetadata {
-  required PbTablePath table_path = 1;
-  required int64 table_id = 2;
-  required int32 schema_id = 3;
-  required bytes table_json = 4;
-  repeated PbBucketMetadata bucket_metadata = 5;
-  required int64 created_time = 6;
-  required int64 modified_time = 7;
-}
-
-message PbPartitionMetadata {
-  required int64 table_id = 1;
-  // the partition name and id for the partition
-  required string partition_name = 2;
-  required int64 partition_id = 3;
-  repeated PbBucketMetadata bucket_metadata = 4;
-}
-
-message PbBucketMetadata {
-  required int32 bucket_id = 1;
-  // optional as some time the leader may not elected yet
-  optional int32 leader_id = 2;
-  repeated int32 replica_id = 3 [packed = true];
-  // TODO: Add isr here.
-}
-
-message PbProduceLogReqForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  required bytes records = 3;
-}
-
-message PbProduceLogRespForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  optional int32 error_code = 3;
-  optional string error_message = 4;
-  optional int64 base_offset = 5;
-}
-
-// put kv request and response
-message PutKvRequest {
-  required int32 acks = 1;
-  required int64 table_id = 2;
-  required int32 timeout_ms = 3;
-  // the indexes for the columns to write,
-  // if empty, means write all columns
-  repeated int32 target_columns = 4 [packed = true];
-  repeated PbPutKvReqForBucket buckets_req = 5;
-}
-
-message PutKvResponse {
-  repeated PbPutKvRespForBucket buckets_resp = 1;
-}
-
-message PbPutKvReqForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  required bytes records = 3;
-}
-
-message PbPutKvRespForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  optional int32 error_code = 3;
-  optional string error_message = 4;
-}
-
-message CreateTableRequest {
-  required PbTablePath table_path = 1;
-  required bytes table_json = 2;
-  required bool ignore_if_exists = 3;
-}
-
-message CreateTableResponse {
-}
-
-message DropTableRequest {
-  required PbTablePath table_path = 1;
-  required bool ignore_if_not_exists = 2;
-}
-
-message DropTableResponse {
-}
-
-message TableExistsRequest {
-  required PbTablePath table_path = 1;
-}
-
-message TableExistsResponse {
-  required bool exists = 1;
-}
-
-message GetTableInfoRequest {
-  required PbTablePath table_path = 1;
-}
-
-message GetTableInfoResponse {
-  required int64 table_id = 1;
-  required int32 schema_id = 2;
-  required bytes table_json = 3;
-  required int64 created_time = 4;
-  required int64 modified_time = 5;
-}
-
-// get table schema request and response. Mirrors the Java RPC at api key 1011.
-// Omitting `schema_id` requests the latest schema.
-message GetTableSchemaRequest {
-  required PbTablePath table_path = 1;
-  optional int32 schema_id = 2;
-}
-
-message GetTableSchemaResponse {
-  required int32 schema_id = 1;
-  required bytes schema_json = 2;
-}
-
-message ListTablesRequest {
-  required string database_name = 1;
-}
-
-message ListTablesResponse {
-  repeated string table_name = 1;
-}
-
-message CreateDatabaseRequest {
-  required string database_name = 1;
-  required bool ignore_if_exists = 2;
-  optional bytes database_json = 3;
-}
-
-message CreateDatabaseResponse {
-}
-
-message GetDatabaseInfoRequest {
-  required string database_name = 1;
-}
-
-message GetDatabaseInfoResponse {
-  required bytes database_json = 3;
-  required int64 created_time = 4;
-  required int64 modified_time = 5;
-}
-
-message DropDatabaseRequest {
-  required string database_name = 1;
-  required bool ignore_if_not_exists = 2;
-  required bool cascade = 3;
-}
-
-message DropDatabaseResponse {
-}
-
-message DatabaseExistsRequest {
-  required string database_name = 1;
-}
-
-message DatabaseExistsResponse {
-  required bool exists = 1;
-}
-
-message ListDatabasesRequest {
-}
-
-message ListDatabasesResponse {
-  repeated string database_name = 1;
-}
-
-// list offsets request and response
-message ListOffsetsRequest {
-  required int32 follower_server_id = 1;  // value -1 indicate the request from client.
-  required int32 offset_type = 2; // value can be 0,1,2 (see ListOffsetsParam for more details)
-  required int64 table_id = 3;
-  optional int64 partition_id = 4;
-  repeated int32 bucket_id = 5 [packed = true]; // it is recommended to use packed for repeated numerics to get more efficient encoding
-  optional int64 startTimestamp = 6;
-}
-message ListOffsetsResponse {
-  repeated PbListOffsetsRespForBucket buckets_resp = 1;
-}
-
-
-// fetch log request and response
-message FetchLogRequest {
-  required int32 follower_server_id = 1;  // value -1 indicate the request from client.
-  required int32 max_bytes = 2;
-  repeated PbFetchLogReqForTable tables_req = 3;
-  optional int32 max_wait_ms = 4;
-  optional int32 min_bytes = 5;
-}
-
-message FetchLogResponse {
-  repeated PbFetchLogRespForTable tables_resp = 1;
-}
-
-message PbFetchLogReqForTable {
-  required int64 table_id = 1;
-  required bool projection_pushdown_enabled = 2;
-  repeated int32 projected_fields = 3 [packed = true];
-  repeated PbFetchLogReqForBucket buckets_req = 4;
-}
-
-
-message PbFetchLogReqForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  // TODO leader epoch
-  required int64 fetch_offset = 3;
-  required int32 max_fetch_bytes = 4;
-}
-
-
-message PbFetchLogRespForTable {
-  required int64 table_id = 1;
-  repeated PbFetchLogRespForBucket buckets_resp = 2;
-}
-message PbFetchLogRespForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  optional int32 error_code = 3;
-  optional string error_message = 4;
-  optional int64 high_watermark = 5;
-  optional int64 log_start_offset = 6; // TODO now we don't introduce log start offset, but remain it in protobuf
-  optional PbRemoteLogFetchInfo remote_log_fetch_info = 7;
-  optional bytes records = 8;
-}
-
-message PbRemoteLogFetchInfo {
-  required string remote_log_tablet_dir = 1;
-  optional string partition_name = 2;
-  repeated PbRemoteLogSegment remote_log_segments = 3;
-  optional int32 first_start_pos = 4;
-}
-
-message PbRemoteLogSegment {
-  required string remote_log_segment_id = 1;
-  required int64 remote_log_start_offset = 2;
-  required int64 remote_log_end_offset = 3;
-  required int32 segment_size_in_bytes = 4;
-  optional int64 max_timestamp = 5;
-}
-
-message PbListOffsetsRespForBucket {
-  required int32 bucket_id = 1;
-  optional int32 error_code = 2;
-  optional string error_message = 3;
-  optional int64 offset = 4;
-}
-
-// fetch latest lake snapshot
-message GetLatestLakeSnapshotRequest {
-  required PbTablePath table_path = 1;
-}
-
-message GetLatestLakeSnapshotResponse {
-  required int64 table_id = 1;
-  required int64 snapshotId = 2;
-  repeated PbLakeSnapshotForBucket bucket_snapshots = 3;
-}
-
-message PbLakeSnapshotForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  optional int64 log_offset = 3;
-}
-
-message PbKeyValue {
-  required string key = 1;
-  required string value = 2;
-}
-
-message GetFileSystemSecurityTokenRequest {
-}
-
-message GetFileSystemSecurityTokenResponse {
-  required string schema = 1;
-  required bytes token = 2;
-  optional int64 expiration_time = 3;
-  repeated PbKeyValue addition_info = 4;
-}
-
-// lookup request and response
-message LookupRequest {
-  required int64 table_id = 1;
-  repeated PbLookupReqForBucket buckets_req = 2;
-}
-
-message LookupResponse {
-  repeated PbLookupRespForBucket buckets_resp = 1;
-}
-
-message PbLookupReqForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  repeated bytes key = 3;
-}
-
-message PbLookupRespForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  optional int32 error_code = 3;
-  optional string error_message = 4;
-  repeated PbValue values = 5;
-}
-
-message PbValue {
-  optional bytes values = 1;
-}
-
-// prefix lookup request and response
-message PrefixLookupRequest {
-  required int64 table_id = 1;
-  repeated PbPrefixLookupReqForBucket buckets_req = 2;
-}
-
-message PrefixLookupResponse {
-  repeated PbPrefixLookupRespForBucket buckets_resp = 1;
-}
-
-message PbPrefixLookupReqForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  repeated bytes keys = 3;
-}
-
-message PbPrefixLookupRespForBucket {
-  optional int64 partition_id = 1;
-  required int32 bucket_id = 2;
-  optional int32 error_code = 3;
-  optional string error_message = 4;
-  repeated PbValueList value_lists = 5;
-}
-
-message PbValueList {
-  repeated bytes values = 1;
-}
-
-message PbPartitionSpec {
-  repeated PbKeyValue partition_key_values = 1;
-}
-
-message PbPartitionInfo {
-  required int64 partition_id = 1;
-  required PbPartitionSpec partition_spec = 2;
-}
-
-message ListPartitionInfosRequest {
-  required PbTablePath table_path = 1;
-  optional PbPartitionSpec partial_partition_spec = 2;
-}
-
-message ListPartitionInfosResponse {
-  repeated PbPartitionInfo partitions_info = 1;
-}
-
-message CreatePartitionRequest {
-  required PbTablePath table_path = 1;
-  required PbPartitionSpec partition_spec = 2;
-  required bool ignore_if_exists = 3;
-}
-
-message CreatePartitionResponse {}
-
-message DropPartitionRequest {
-  required PbTablePath table_path = 1;
-  required PbPartitionSpec partition_spec = 2;
-  required bool ignore_if_not_exists = 3;
-}
-
-message DropPartitionResponse {}
-
-message AuthenticateRequest {
-  required string protocol = 1;
-  required bytes token = 2;
-}
-
-message AuthenticateResponse {
-  optional bytes challenge = 1;
-}
-
-// limit scan request and response
-message LimitScanRequest {
-  required int64 table_id = 2;
-  optional int64 partition_id = 3;
-  required int32 bucket_id = 4;
-  required int32 limit = 5;
-}
-
-message LimitScanResponse{
-  optional int32 error_code = 1;
-  optional string error_message = 2;
-  // flag to indicate the table type
-  optional bool is_log_table = 3;
-  // LogRecordBatch if is_log_table is true, otherwise KvRecordBatch
-  optional bytes records = 4;
-}
-
-// init writer request and response
-message InitWriterRequest {
-  repeated PbTablePath table_path = 1;
-}
-
-message InitWriterResponse {
-  required int64 writer_id = 1;
-}
diff --git a/fluss-rust/crates/fluss/src/rpc/convert.rs b/fluss-rust/crates/fluss/src/rpc/convert.rs
index 1862589bc5..441645c2e6 100644
--- a/fluss-rust/crates/fluss/src/rpc/convert.rs
+++ b/fluss-rust/crates/fluss/src/rpc/convert.rs
@@ -73,6 +73,7 @@ mod tests {
             host: "127.0.0.1".to_string(),
             port: 9092,
             listeners: None,
+            rack: None,
         };
         let node = from_pb_server_node(pb, ServerType::TabletServer);
         assert_eq!(node.id(), 7);
@@ -84,6 +85,7 @@ mod tests {
             host: "localhost".to_string(),
             port: 8123,
             listeners: None,
+            rack: None,
         };
         let node = from_pb_server_node(pb, ServerType::CoordinatorServer);
         assert_eq!(node.uid(), "cs-3");
diff --git a/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs b/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs
index ad633655c0..68595cfc5c 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/create_partition.rs
@@ -40,7 +40,8 @@ impl CreatePartitionRequest {
             inner_request: proto::CreatePartitionRequest {
                 table_path: to_table_path(table_path),
                 partition_spec: partition_spec.to_pb(),
-                ignore_if_exists,
+                // canonical proto field is misnamed; it carries the "ignore if exists" flag
+                ignore_if_not_exists: ignore_if_exists,
             },
         }
     }
diff --git a/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs b/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
index 0b59384dfd..5138fe7298 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/get_latest_lake_snapshot.rs
@@ -30,16 +30,18 @@ use prost::Message;
 
 #[derive(Debug)]
 pub struct GetLatestLakeSnapshotRequest {
-    pub inner_request: proto::GetLatestLakeSnapshotRequest,
+    pub inner_request: proto::GetLakeSnapshotRequest,
 }
 
 impl GetLatestLakeSnapshotRequest {
     pub fn new(table_path: &TablePath) -> Self {
-        let inner_request = proto::GetLatestLakeSnapshotRequest {
+        let inner_request = proto::GetLakeSnapshotRequest {
             table_path: PbTablePath {
                 database_name: table_path.database().to_string(),
                 table_name: table_path.table().to_string(),
             },
+            snapshot_id: None,
+            readable: None,
         };
 
         Self { inner_request }
@@ -47,9 +49,9 @@ impl GetLatestLakeSnapshotRequest {
 }
 
 impl RequestBody for GetLatestLakeSnapshotRequest {
-    type ResponseBody = proto::GetLatestLakeSnapshotResponse;
+    type ResponseBody = proto::GetLakeSnapshotResponse;
     const API_KEY: ApiKey = ApiKey::GetLatestLakeSnapshot;
 }
 
 impl_write_type!(GetLatestLakeSnapshotRequest);
-impl_read_type!(proto::GetLatestLakeSnapshotResponse);
+impl_read_type!(proto::GetLakeSnapshotResponse);
diff --git a/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs b/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
index 21e1640000..74ca494464 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/list_databases.rs
@@ -32,7 +32,9 @@ pub struct ListDatabasesRequest {
 impl ListDatabasesRequest {
     pub fn new() -> Self {
         ListDatabasesRequest {
-            inner_request: proto::ListDatabasesRequest {},
+            inner_request: proto::ListDatabasesRequest {
+                include_summary: None,
+            },
         }
     }
 }
diff --git a/fluss-rust/crates/fluss/src/rpc/message/lookup.rs b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
index 200d4bc8c0..e205fa6b67 100644
--- a/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
+++ b/fluss-rust/crates/fluss/src/rpc/message/lookup.rs
@@ -42,7 +42,7 @@ impl LookupRequest {
                 |(bucket_id, partition_id, keys)| proto::PbLookupReqForBucket {
                     partition_id,
                     bucket_id,
-                    key: keys,
+                    keys,
                 },
             )
             .collect();
@@ -50,6 +50,9 @@ impl LookupRequest {
         let request = proto::LookupRequest {
             table_id,
             buckets_req,
+            insert_if_not_exists: None,
+            acks: None,
+            timeout_ms: None,
         };
 
         Self {
diff --git a/fluss-rust/scripts/vendor-proto.sh b/fluss-rust/scripts/vendor-proto.sh
new file mode 100755
index 0000000000..64b328c894
--- /dev/null
+++ b/fluss-rust/scripts/vendor-proto.sh
@@ -0,0 +1,46 @@
+#!/usr/bin/env bash
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements.  See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to you under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+# Vendor the canonical FlussApi.proto into the fluss-rs crate so `cargo publish`
+# produces a self-contained crate. build.rs prefers crates/fluss/proto/FlussApi.proto
+# when present, otherwise reads it from ../../../fluss-rpc in the monorepo.
+#
+# Usage:
+#   scripts/vendor-proto.sh           # copy canonical proto into the crate
+#   scripts/vendor-proto.sh --clean   # remove the vendored copy
+
+set -euo pipefail
+
+REPO_ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
+CANONICAL="${REPO_ROOT}/../fluss-rpc/src/main/proto/FlussApi.proto"
+DEST_DIR="${REPO_ROOT}/crates/fluss/proto"
+DEST="${DEST_DIR}/FlussApi.proto"
+
+if [ "${1:-}" = "--clean" ]; then
+  rm -rf "$DEST_DIR"
+  echo "Removed vendored proto: ${DEST_DIR}"
+  exit 0
+fi
+
+if [ ! -f "$CANONICAL" ]; then
+  echo "Canonical proto not found: ${CANONICAL}" >&2
+  echo "Run from the consolidated repo (fluss-rpc must be a sibling of fluss-rust)." >&2
+  exit 1
+fi
+
+mkdir -p "$DEST_DIR"
+cp "$CANONICAL" "$DEST"
+echo "Vendored ${CANONICAL} -> ${DEST}"
diff --git a/pom.xml b/pom.xml
index d39a91d9b3..0c5c4dcc63 100644
--- a/pom.xml
+++ b/pom.xml
@@ -691,6 +691,8 @@
                         <exclude>website/static/**</exclude>
                         <exclude>website/build/**</exclude>
                         <exclude>website/node_modules/**</exclude>
+                        <!-- Rust client: own license enforcement (skywalking-eyes + cargo-deny) -->
+                        <exclude>fluss-rust/**</exclude>
                     </excludes>
                 </configuration>
             </plugin>
diff --git a/website/community/dev/building.md b/website/community/dev/building.md
index 963ac39917..a891c84b6b 100644
--- a/website/community/dev/building.md
+++ b/website/community/dev/building.md
@@ -52,4 +52,40 @@ mvn clean install -DskipTests -T 1C
 
 **NOTE**:
 - For local testing, it's recommend to use directory `${project}/build-target` in project.
-- For deploying distributed cluster, it's recommend to use binary file named `fluss-xxx-bin.tgz`, the file is in directory `${project}/fluss-dist/target`.
\ No newline at end of file
+- For deploying a distributed cluster, it's recommended to use the binary file named `fluss-xxx-bin.tgz`, which is in directory `${project}/fluss-dist/target`.
+
+## Building the Rust client (fluss-rust)
+
+The Rust client, language bindings, and examples live under `fluss-rust/` and build with Cargo. You need **Rust** (the toolchain pinned in `fluss-rust/rust-toolchain.toml`, currently 1.85+) and **protoc**, the Protobuf compiler — `build.rs` compiles the canonical `fluss-rpc/src/main/proto/FlussApi.proto`.
+
+```bash
+# protoc (pick one)
+brew install protobuf                    # macOS
+sudo apt-get install protobuf-compiler   # Debian/Ubuntu
+
+cd fluss-rust
+cargo build --workspace --all-targets    # build everything
+cargo test --workspace                    # unit tests
+```
+
+Integration tests start a Fluss cluster via Docker:
+
+```bash
+RUST_TEST_THREADS=1 cargo test --features integration_tests --workspace
+```
+
+The Python and C++ bindings build on top of the Rust crate:
+
+```bash
+cd fluss-rust/bindings/python && uv sync --extra dev && uv run maturin develop   # Python
+cd fluss-rust/bindings/cpp && cmake -B build && cmake --build build              # C++
+```
+
+Before pushing, run the same checks CI does:
+
+```bash
+cd fluss-rust
+cargo fmt --all -- --check
+cargo clippy --all-targets --workspace -- -D warnings
+cargo deny check licenses
+```
\ No newline at end of file
diff --git a/website/community/dev/ide-setup.md b/website/community/dev/ide-setup.md
index 3d157a5c50..2914dd8467 100644
--- a/website/community/dev/ide-setup.md
+++ b/website/community/dev/ide-setup.md
@@ -221,3 +221,12 @@ Go to "Settings" → "Build, Execution, Deployment" → "Compiler" → "Java Com
 This happens if Fluss dependencies are set to "provided", resulting in them not being available
 on the classpath. You can either check "Include dependencies with 'Provided' scope" in your
 run configuration, or create a test that calls the `main()` method of the example.
+
+## RustRover
+
+For the Rust client under `fluss-rust/`, we recommend [RustRover](https://www.jetbrains.com/rust/).
+
+1. Open RustRover, choose **Open**, and select the `fluss-rust/` directory as the project root so Cargo resolves the workspace.
+2. RustRover uses the toolchain pinned in `fluss-rust/rust-toolchain.toml` (install it with `rustup` if prompted). You also need **protoc** on your `PATH` — see [Building the Rust client](/community/dev/building).
+3. Enable **Rustfmt** and **Clippy** under Settings → Rust so local formatting and lints match CI (`cargo fmt --all -- --check`, `cargo clippy --all-targets -- -D warnings`).
+4. Apply the Apache license header to new files — the boilerplate is in `fluss-rust/copyright.txt`; configure it under Settings → Editor → Copyright.
diff --git a/website/community/how-to-contribute/contribute-code.md b/website/community/how-to-contribute/contribute-code.md
index affadb37d5..31ac2418f3 100644
--- a/website/community/how-to-contribute/contribute-code.md
+++ b/website/community/how-to-contribute/contribute-code.md
@@ -32,6 +32,7 @@ Implement the change according to the Code Style and Quality (refer to the [Flin
 
 1. Only start working on the implementation if there is consensus on the approach (e.g. you are assigned to the ticket)
 2. If you are newer, can refer to [ide setup](/community/dev/ide-setup) to setup a Fluss dev environment.
+3. For Rust client changes (under `fluss-rust/`), see [Building the Rust client](/community/dev/building) and the [RustRover IDE setup](/community/dev/ide-setup).
 
 ### Review
 Create the pull request and work with the reviewer. 
@@ -53,7 +54,7 @@ Considerations before opening a pull request:
 
 - Fill out the pull request template to describe the changes contributed by the pull request. Please describe it such that the reviewer understands the problem and solution from the description, not only from the code. That will give reviewers the context they need to do the review.
 
-- Make sure that the change passes the automated tests, i.e., `mvn clean verify` passes.
+- Make sure that the change passes the automated tests, i.e., `mvn clean verify` passes. For Rust client changes under `fluss-rust/`, make sure `cargo build`, `cargo test`, `cargo fmt --all -- --check`, and `cargo clippy --all-targets -- -D warnings` pass (see [Building the Rust client](/community/dev/building)).
 
 - Each pull request should address only one issue, not mix up code from multiple issues.
 
diff --git a/website/community/how-to-release/creating-a-fluss-release.mdx b/website/community/how-to-release/creating-a-fluss-release.mdx
index e66e3a46b5..3eb15b4b26 100644
--- a/website/community/how-to-release/creating-a-fluss-release.mdx
+++ b/website/community/how-to-release/creating-a-fluss-release.mdx
@@ -503,6 +503,28 @@ This ensures that the **Quickstart guide** in the documentation references the c
 git push origin $TAG
 ```
 
+### 9. Publish client RC artifacts (crates.io / PyPI)
+
+The Rust, Python, and C++ clients live in `fluss-rust/` and release from this repository under the **same version and tag** — there is no separate client release.
+
+Before tagging, make sure the client versions match `${RELEASE_VERSION}`:
+
+```bash
+# Rust workspace version (also drives the python/cpp/elixir-NIF crates via version.workspace)
+fluss-rust/scripts/bump-version.sh <previous_version> ${RELEASE_VERSION}
+# The Elixir binding has its own version attribute — set @version "${RELEASE_VERSION}" in
+#   fluss-rust/bindings/elixir/mix.exs
+# Regenerate the Rust dependency/license audit (cargo-deny):
+(cd fluss-rust && python3 scripts/dependencies.py)
+```
+
+Pushing the **RC tag** (`v${RELEASE_VERSION}-rc${RC_NUM}`) triggers the client workflows:
+
+- `python-release.yml` builds the wheels + sdist and publishes them to **TestPyPI**.
+- `rust-release.yml` runs `cargo publish --dry-run` to validate the crate. The canonical proto is vendored into the crate automatically (`fluss-rust/scripts/vendor-proto.sh`), because `build.rs` otherwise falls back to reading it from the in-repo `fluss-rpc` module, which is not part of the packaged crate.
+
+The final publish to **crates.io** and **PyPI** happens when the release tag is pushed (see the **Git tag** step under [Finalize the release](#finalize-the-release)). Publishing uses the CI secrets `CARGO_REGISTRY_TOKEN`, `PYPI_API_TOKEN`, and `TEST_PYPI_API_TOKEN`.
+
 -------------
 
 **Checklist to proceed to the next step**
@@ -512,6 +534,7 @@ git push origin $TAG
 - RC Docker images pushed to DockerHub ([apache/fluss](https://hub.docker.com/r/apache/fluss/tags), [apache/fluss-quickstart-flink](https://hub.docker.com/r/apache/fluss-quickstart-flink/tags))
 - RC tag pushed to the [official repository](https://github.com/apache/fluss/tags)
 - Updated `dockerVersion` in `fluss-versions.json` on `main` branch
+- Client RC artifacts published to TestPyPI, and `cargo publish --dry-run` for `fluss-rs` is green
 
 
 ## Vote on the release candidate
@@ -774,6 +797,8 @@ git tag -s "v${RELEASE_VERSION}" refs/tags/${TAG}^{} -m "Release Fluss ${RELEASE
 git push origin refs/tags/v${RELEASE_VERSION}
 ```
 
+Pushing the `v${RELEASE_VERSION}` tag also triggers the client release workflows: `rust-release.yml` publishes `fluss-rs` to **crates.io**, and `python-release.yml` publishes the wheels + sdist to **PyPI**.
+
 ### 5. Publish Docker Images
 
 :::note
diff --git a/website/community/how-to-release/pre-rc-checklist.md b/website/community/how-to-release/pre-rc-checklist.md
new file mode 100644
index 0000000000..658bc4a778
--- /dev/null
+++ b/website/community/how-to-release/pre-rc-checklist.md
@@ -0,0 +1,38 @@
+---
+title: Pre-RC Checklist
+sidebar_position: 1.5
+---
+
+# Pre-RC Checklist
+
+Run through this before cutting a release candidate. It catches the problems that are expensive to discover mid-vote, now that a single tag releases Java, Rust, Python, and C++ together.
+
+## Access and secrets
+
+- [ ] Maven Central (Apache Nexus) access for `org.apache.fluss` — see [Release Manager Preparation](release-manager-preparation.md)
+- [ ] `CARGO_REGISTRY_TOKEN`, `PYPI_API_TOKEN`, and `TEST_PYPI_API_TOKEN` configured as repository secrets
+- [ ] crates.io owner of `fluss-rs`; PyPI maintainer of `pyfluss`
+- [ ] GPG key published to the Apache KEYS file
+
+## Build and publish dry-runs
+
+- [ ] `cargo publish -p fluss-rs --dry-run` succeeds (run after `fluss-rust/scripts/vendor-proto.sh` so the proto is vendored)
+- [ ] Python wheels + sdist install from **TestPyPI** (the RC tag publishes there):
+
+  ```bash
+  pip install -i https://test.pypi.org/simple/ pyfluss==${RELEASE_VERSION}
+  ```
+
+- [ ] `fluss-cpp` Bazel build smoke test passes:
+
+  ```bash
+  cd fluss-rust/bindings/cpp && bazel build //...
+  ```
+
+## Audits
+
+- [ ] `cargo deny check licenses` passes; the Rust dependency list is regenerated and committed
+- [ ] Java + Rust + binding CI is green on the release branch
+- [ ] `LICENSE` / `NOTICE` cover any third-party content bundled in the source release (including under `fluss-rust/`)
+
+Once these pass, proceed to [Creating a Fluss Release](creating-a-fluss-release.mdx).
diff --git a/website/community/how-to-release/release-manager-preparation.md b/website/community/how-to-release/release-manager-preparation.md
index 700b3bf45e..85123029d4 100644
--- a/website/community/how-to-release/release-manager-preparation.md
+++ b/website/community/how-to-release/release-manager-preparation.md
@@ -210,6 +210,28 @@ which tar
 ```
 
 
+## Rust, Python, and C++ client publishing
+
+A unified release also publishes the Rust, Python, and C++ clients (under `fluss-rust/`). As release manager, make sure the following access and CI secrets are in place.
+
+### Registry access
+
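+- **crates.io** (`fluss-rs`): your account must be an owner of the crate. Check ownership with `cargo owner --list fluss-rs`, then authenticate with `cargo login` and confirm the crate packages cleanly with `cargo publish -p fluss-rs --dry-run` (the dry run validates packaging only, not ownership).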
+- **PyPI / TestPyPI** (`pyfluss`): confirm you are a maintainer at https://pypi.org/project/pyfluss/, and generate API tokens on both PyPI and TestPyPI.
+- **Hex.pm** (Elixir `fluss`): post-1.0 only — not published yet.
+
+### GitHub Actions secrets
+
+Publishing is automated by the `rust-release.yml` and `python-release.yml` workflows when a version tag is pushed. Configure these repository secrets:
+
+- `CARGO_REGISTRY_TOKEN` — crates.io API token
+- `PYPI_API_TOKEN` — PyPI token (final release)
+- `TEST_PYPI_API_TOKEN` — TestPyPI token (release candidates)
+
+### Toolchain for the dependency audit
+
+Regenerating the Rust dependency/license list (an ASF requirement) needs the toolchain in `fluss-rust/rust-toolchain.toml`, [cargo-deny](https://embarkstudios.github.io/cargo-deny/), and Python 3.11+ (for `fluss-rust/scripts/dependencies.py`).
+
 ## Further reading
 
 It's recommended but not mandatory to read following documents before making a release to know more details about apache release:
diff --git a/website/community/how-to-release/verifying-a-fluss-release.md b/website/community/how-to-release/verifying-a-fluss-release.md
index a1649c17c7..c7b4dc7863 100644
--- a/website/community/how-to-release/verifying-a-fluss-release.md
+++ b/website/community/how-to-release/verifying-a-fluss-release.md
@@ -73,6 +73,38 @@ Unzip the source release archive, and verify that:
 5. The LICENSE and NOTICE files in the root directory refer to dependencies in the source release, i.e., files in the git repository (such as fonts, css, JavaScript, images)
 
 
+## Verifying the clients (Rust / Python / C++)
+
+The Rust, Python, and C++ clients ship in the same source release under `fluss-rust/`. Build them from the extracted source archive — you need **Rust** (see `fluss-rust/rust-toolchain.toml` for the expected version), plus **protobuf** and, for the Python binding, **Python 3.9+**:
+
+```bash
+cd fluss-rust
+cargo build --workspace --release
+```
+
+Per-language verification:
+
+- **Rust:** build from the source release (above), or depend on the RC tag in a throwaway project (`fluss-rs = { git = "https://github.com/apache/fluss", tag = "v${RELEASE_VERSION}-rc${RC_NUM}" }`), then write a few test cases (connect, create table, read/write). Installation: https://fluss.apache.org/docs/apis/rust/installation/
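+- **Python:** for an RC, install from **TestPyPI** (`pip install -i https://test.pypi.org/simple/ --extra-index-url https://pypi.org/simple/ pyfluss==${RELEASE_VERSION}`; the extra index lets pip resolve dependencies that are only hosted on PyPI) and write test cases. Installation: https://fluss.apache.org/docs/apis/python/installation/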
+- **C++:** build and link the C++ client from `fluss-rust/bindings/cpp/`, then verify. Installation: https://fluss.apache.org/docs/apis/cpp/installation/
+
+The Rust workspace's dependency licenses are checked with [cargo-deny](https://embarkstudios.github.io/cargo-deny/); the release manager regenerates the dependency audit before the release.
+
+## Release artifacts and publish targets
+
+A release publishes to several registries; confirm each one carries the release version:
+
+| Component | Target | Identifier |
+|-----------|--------|------------|
+| Java / Scala | Maven Central (via Apache Nexus staging) | `org.apache.fluss:fluss-*` |
+| Rust | [crates.io](https://crates.io/crates/fluss-rs) | `fluss-rs` |
+| Python | [PyPI](https://pypi.org/project/pyfluss/) (RC → [TestPyPI](https://test.pypi.org/project/pyfluss/)) | `pyfluss` |
+| C++ | source archive only (no registry) | — |
+| Elixir | Hex.pm (post-1.0; not yet published) | `fluss` |
+| Docker | Docker Hub | `apache/fluss`, `apache/fluss-quickstart-flink` |
+
+Source archives, signatures, and checksums are on [dist.apache.org](https://dist.apache.org/repos/dist/dev/incubator/fluss/) (dev) and, after the vote, on [downloads.apache.org](https://downloads.apache.org/incubator/fluss/).
+
 ## Testing Against Staged Maven Artifacts
 
 Update the root `pom.xml` of the maven project (like the apache/fluss project) to include the staged repository in the `<repositories>` section. You can do this by adding a new repository entry like this:
diff --git a/website/docs/apis/client-support-matrix.md b/website/docs/apis/client-support-matrix.md
index cb932f2d42..f4d31733c5 100644
--- a/website/docs/apis/client-support-matrix.md
+++ b/website/docs/apis/client-support-matrix.md
@@ -1,6 +1,6 @@
 ---
 title: "Client Support Matrix"
-sidebar_position: 5
+sidebar_position: 6
 ---
 
 # Client Feature Support Matrix
@@ -11,7 +11,7 @@ Fluss has a rich set of features and native data types available to users. The f
 
 These data operations are available under TableAppend, TableScan, TableUpsert and TableLookup interfaces.
 
-| Table Type   | Operations                 | [Java Client](/apis/java-client.md) | Rust Client | Python Client | C++ Client |
+| Table Type   | Operations                 | [Java Client](./java/index.md) | Rust Client | Python Client | C++ Client |
 |--------------|----------------------------|-------------------------------------|-------------|---------------|------------|
 | Log          | Append                     | ✔️                                  | ✔️          | ✔️            | ✔️         |
 | Log          | Typed Append               | ✔️                                  |             |               |            |
@@ -30,14 +30,14 @@ These data operations are available under TableAppend, TableScan, TableUpsert an
 | Primary Key  | Batch Scan (Snapshot)      | ✔️                                  |             |               |            |
 
 :::tip
-For more details, see [Table Overview](/table-design/overview.md).
+For more details, see [Table Overview](../table-design/overview.md).
 :::
 
 ## Data Types
 
 Client support for Fluss data types are as follows:
 
-| DataType                                                        | [Java Client](/apis/java-client.md) | Rust Client | Python Client | C++ Client |
+| DataType                                                        | [Java Client](./java/index.md) | Rust Client | Python Client | C++ Client |
 |-----------------------------------------------------------------|-------------------------------------|-------------|---------------|------------|
 | BOOLEAN                                                         | ✔️                                  | ✔️          | ✔️            | ✔️         |
 | TINYINT                                                         | ✔️                                  | ✔️          | ✔️            | ✔️         |
@@ -63,14 +63,14 @@ Client support for Fluss data types are as follows:
 | ROW\<n0 t0, n1 t1, ...\><br/>ROW\<n0 t0 'd0', n1 t1 'd1', ...\> | ✔️                                  |             |               |            |
 
 :::tip
-For more details, see [Data Types](table-design/data-types.md).
+For more details, see [Data Types](../table-design/data-types.md).
 :::
 
 ## Admin Operations
 
 Admin operations are available under FlussAdmin interface.
 
-| Entity    | Operations             | [Java Client](/apis/java-client.md) | Rust Client | Python Client | C++ Client |
+| Entity    | Operations             | [Java Client](./java/index.md) | Rust Client | Python Client | C++ Client |
 |-----------|------------------------|-------------------------------------|-------------|---------------|------------|
 | Database  | CreateDatabase         | ✔️                                  | ✔️          |               |            |
 | Database  | DropDatabase           | ✔️                                  | ✔️          |               |            |
@@ -103,12 +103,12 @@ Admin operations are available under FlussAdmin interface.
 
 ## Data Lake Formats
 
-| Format  | [Java Client](/apis/java-client.md) | Rust Client | Python Client | C++ Client |
+| Format  | [Java Client](./java/index.md) | Rust Client | Python Client | C++ Client |
 |---------|-------------------------------------|-------------|---------------|------------|
 | Iceberg | ✔️                                  |             |               |            |
 | Lance   | ✔️                                  | ✔️          |               |            |
 | Paimon  | ✔️                                  |             |               |            |
 
 :::tip
-For more details, see [Streaming Lakehouse](/streaming-lakehouse/overview.md).
+For more details, see [Streaming Lakehouse](../streaming-lakehouse/overview.md).
 :::
\ No newline at end of file
diff --git a/website/docs/apis/cpp-client.md b/website/docs/apis/cpp-client.md
deleted file mode 100644
index 420ea6f099..0000000000
--- a/website/docs/apis/cpp-client.md
+++ /dev/null
@@ -1,70 +0,0 @@
----
-title: "C++ Client"
-sidebar_position: 4
----
-
-# Fluss C++ Client
-
-The Fluss C++ Client provides a high-performance, synchronous interface for
-interacting with Fluss clusters. It manages an internal Tokio runtime and
-supports Apache Arrow for efficient data interchange.
-
-The client provides two main APIs:
-
-- **[Admin API](https://clients.fluss.apache.org/user-guide/cpp/api-reference#admin)**: For managing databases, tables, and partitions.
-- **[Table API](https://clients.fluss.apache.org/user-guide/cpp/api-reference#table)**: For reading and writing to Log and Primary Key tables.
-
-## Installation
-
-The C++ client is not yet published as a package and must be built from source.
-
-**Prerequisites:** CMake 3.22+, C++17 compiler, Rust 1.85+, Apache Arrow C++ library
-
-Install dependencies:
-```bash
-# macOS
-brew install cmake arrow
-
-# Ubuntu/Debian
-sudo apt-get install cmake libarrow-dev
-```
-```bash
-git clone https://github.com/apache/fluss-rust.git
-cd fluss-rust/bindings/cpp
-mkdir -p build && cd build
-cmake -DCMAKE_BUILD_TYPE=Release ..
-cmake --build .
-```
-
-For full build options including CMake integration into your own project, see the
-[C++ client installation guide](https://clients.fluss.apache.org/user-guide/cpp/installation).
-
-## Quick Example
-```cpp
-#include "fluss.hpp"
-
-int main() {
-    fluss::Configuration config;
-    config.bootstrap_servers = "127.0.0.1:9123";
-
-    fluss::Connection conn;
-    fluss::Result result = fluss::Connection::Create(config, conn);
-    if (!result.Ok()) {
-        std::cerr << "Connection failed: " << result.error_message << std::endl;
-        return 1;
-    }
-
-    fluss::Admin admin;
-    conn.GetAdmin(admin);
-
-    return 0;
-}
-```
-
-For more examples, see the [Fluss C++ Client documentation](https://clients.fluss.apache.org/user-guide/cpp/example/).
-
-## Full Documentation
-
-For the complete C++ client reference including all configuration options,
-API methods, data types, error handling, and worked examples — see the
-**[Fluss C++ Client documentation](https://clients.fluss.apache.org/user-guide/cpp/installation)**.
\ No newline at end of file
diff --git a/website/docs/apis/cpp/_category_.json b/website/docs/apis/cpp/_category_.json
new file mode 100644
index 0000000000..d32653e102
--- /dev/null
+++ b/website/docs/apis/cpp/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "C++",
+  "position": 5
+}
diff --git a/website/docs/apis/cpp/api-reference.md b/website/docs/apis/cpp/api-reference.md
new file mode 100644
index 0000000000..e9b94c9d9e
--- /dev/null
+++ b/website/docs/apis/cpp/api-reference.md
@@ -0,0 +1,731 @@
+---
+sidebar_position: 2
+---
+# API Reference
+
+Complete API reference for the Fluss C++ client.
+
+## `Result`
+
+| Field / Method  | Type          | Description                                                    |
+|-----------------|---------------|----------------------------------------------------------------|
+| `error_code`    | `int32_t`     | 0 for success, non-zero for errors                             |
+| `error_message` | `std::string` | Human-readable error description                               |
+| `Ok()`          | `bool`        | Returns `true` if operation succeeded (`error_code == 0`)      |
+
+## `Configuration`
+
+| Field                                 | Type          | Default              | Description                                                                              |
+|---------------------------------------|---------------|----------------------|------------------------------------------------------------------------------------------|
+| `bootstrap_servers`                   | `std::string` | `"127.0.0.1:9123"`   | Coordinator server address                                                               |
+| `writer_request_max_size`             | `int32_t`     | `10485760` (10 MB)   | Maximum request size in bytes                                                            |
+| `writer_acks`                         | `std::string` | `"all"`              | Acknowledgment setting (`"all"`, `"0"`, `"1"`, or `"-1"`)                                |
+| `writer_retries`                      | `int32_t`     | `INT32_MAX`          | Number of retries on failure                                                             |
+| `writer_batch_size`                   | `int32_t`     | `2097152` (2 MB)     | Batch size for writes in bytes. Upper bound when dynamic sizing is on; fixed batch size when off |
+| `writer_dynamic_batch_size_enabled`   | `bool`        | `true`               | Enable per-table dynamic batch sizing: the target batch size grows by 10% when batches are more than 80% full and shrinks by 5% when they are less than 50% full |
+| `writer_dynamic_batch_size_min`       | `int32_t`     | `262144` (256 KB)    | Lower bound for the dynamic batch size estimator (ignored when disabled)                 |
+| `writer_batch_timeout_ms`             | `int64_t`     | `100`                | Maximum time in ms to wait for a writer batch to fill up before sending                  |
+| `writer_bucket_no_key_assigner`       | `std::string` | `"sticky"`           | Bucket assignment strategy for tables without bucket keys: `"sticky"` or `"round_robin"` |
+| `scanner_remote_log_prefetch_num`     | `size_t`      | `4`                  | Number of remote log segments to prefetch                                                |
+| `remote_file_download_thread_num`     | `size_t`      | `3`                  | Number of threads for remote log downloads                                               |
+| `scanner_remote_log_read_concurrency` | `size_t`      | `4`                  | Streaming read concurrency within a remote log file                                      |
+| `scanner_log_max_poll_records`        | `size_t`      | `500`                | Maximum number of records returned in a single Poll()                                    |
+| `scanner_log_fetch_max_bytes`         | `int32_t`     | `16777216` (16 MB)   | Maximum bytes per fetch response for LogScanner                                          |
+| `scanner_log_fetch_min_bytes`         | `int32_t`     | `1`                  | Minimum bytes the server must accumulate before returning a fetch response               |
+| `scanner_log_fetch_wait_max_time_ms`  | `int32_t`     | `500`                | Maximum time (ms) the server may wait to satisfy min-bytes                               |
+| `scanner_log_fetch_max_bytes_for_bucket`| `int32_t`   | `1048576` (1 MB)     | Maximum bytes per fetch response per bucket for LogScanner                               |
+| `connect_timeout_ms`                  | `uint64_t`    | `120000`             | TCP connect timeout in milliseconds                                                      |
+| `security_protocol`                   | `std::string` | `"PLAINTEXT"`        | `"PLAINTEXT"` (default) or `"sasl"` for SASL auth                                        |
+| `security_sasl_mechanism`             | `std::string` | `"PLAIN"`            | SASL mechanism (only `"PLAIN"` is supported)                                             |
+| `security_sasl_username`              | `std::string` | (empty)              | SASL username (required when protocol is `"sasl"`)                                       |
+| `security_sasl_password`              | `std::string` | (empty)              | SASL password (required when protocol is `"sasl"`)                                       |
+
+## `Connection`
+
+| Method                                                                  | Description                                       |
+|-------------------------------------------------------------------------|---------------------------------------------------|
+| `static Create(const Configuration& config, Connection& out) -> Result` | Create a connection to a Fluss cluster            |
+| `GetAdmin(Admin& out) -> Result`                                        | Get the admin interface                           |
+| `GetTable(const TablePath& table_path, Table& out) -> Result`           | Get a table for read/write operations             |
+| `Available() -> bool`                                                   | Check if the connection is valid and initialized  |
+
+## `Admin`
+
+### Database Operations
+
+| Method                                                                                                                    | Description              |
+|---------------------------------------------------------------------------------------------------------------------------|--------------------------|
+| `CreateDatabase(const std::string& database_name, const DatabaseDescriptor& descriptor, bool ignore_if_exists) -> Result` | Create a database        |
+| `DropDatabase(const std::string& name, bool ignore_if_not_exists, bool cascade) -> Result`                                | Drop a database          |
+| `ListDatabases(std::vector<std::string>& out) -> Result`                                                                  | List all databases       |
+| `DatabaseExists(const std::string& name, bool& out) -> Result`                                                            | Check if a database exists |
+| `GetDatabaseInfo(const std::string& name, DatabaseInfo& out) -> Result`                                                   | Get database metadata    |
+
+### Table Operations
+
+| Method                                                                                                     | Description                 |
+|------------------------------------------------------------------------------------------------------------|-----------------------------|
+| `CreateTable(const TablePath& path, const TableDescriptor& descriptor, bool ignore_if_exists) -> Result`   | Create a table              |
+| `DropTable(const TablePath& path, bool ignore_if_not_exists) -> Result`                                    | Drop a table                |
+| `GetTableInfo(const TablePath& path, TableInfo& out) -> Result`                                            | Get table metadata          |
+| `ListTables(const std::string& database_name, std::vector<std::string>& out) -> Result`                    | List tables in a database   |
+| `TableExists(const TablePath& path, bool& out) -> Result`                                                  | Check if a table exists     |
+
+### Partition Operations
+
+| Method                                                                                                                                          | Description              |
+|-------------------------------------------------------------------------------------------------------------------------------------------------|--------------------------|
+| `CreatePartition(const TablePath& path, const std::unordered_map<std::string, std::string>& partition_spec, bool ignore_if_exists) -> Result`   | Create a partition       |
+| `DropPartition(const TablePath& path, const std::unordered_map<std::string, std::string>& partition_spec, bool ignore_if_not_exists) -> Result` | Drop a partition         |
+| `ListPartitionInfos(const TablePath& path, std::vector<PartitionInfo>& out) -> Result`                                                          | List partition metadata  |
+
+### Offset Operations
+
+| Method                                                                                                                                                                                                  | Description                             |
+|---------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|-----------------------------------------|
+| `ListOffsets(const TablePath& path, const std::vector<int32_t>& bucket_ids, const OffsetSpec& query, std::unordered_map<int32_t, int64_t>& out) -> Result`                                             | Get offsets for buckets                 |
+| `ListPartitionOffsets(const TablePath& path, const std::string& partition_name, const std::vector<int32_t>& bucket_ids, const OffsetSpec& query, std::unordered_map<int32_t, int64_t>& out) -> Result` | Get offsets for a partition's buckets   |
+
+### Lake Operations
+
+| Method                                                                      | Description                  |
+|-----------------------------------------------------------------------------|------------------------------|
+| `GetLatestLakeSnapshot(const TablePath& path, LakeSnapshot& out) -> Result` | Get the latest lake snapshot |
+
+### Cluster Operations
+
+| Method                                                    | Description                                        |
+|-----------------------------------------------------------|----------------------------------------------------|
+| `GetServerNodes(std::vector<ServerNode>& out) -> Result`  | Get all alive server nodes (coordinator + tablets) |
+
+## `ServerNode`
+
+| Field         | Type          | Description                                              |
+|---------------|---------------|----------------------------------------------------------|
+| `id`          | `int32_t`     | Server node ID                                           |
+| `host`        | `std::string` | Hostname of the server                                   |
+| `port`        | `uint32_t`    | Port number                                              |
+| `server_type` | `std::string` | Server type (`"CoordinatorServer"` or `"TabletServer"`)  |
+| `uid`         | `std::string` | Unique identifier (e.g. `"cs-0"`, `"ts-1"`)             |
+
+## `Table`
+
+| Method                        | Description                              |
+|-------------------------------|------------------------------------------|
+| `NewRow() -> GenericRow`      | Create a schema-aware row for this table |
+| `NewAppend() -> TableAppend`  | Create an append builder for log tables  |
+| `NewUpsert() -> TableUpsert`  | Create an upsert builder for PK tables   |
+| `NewLookup() -> TableLookup`  | Create a lookup builder for PK tables    |
+| `NewScan() -> TableScan`      | Create a scan builder                    |
+| `GetTableInfo() -> TableInfo` | Get table metadata                       |
+| `GetTablePath() -> TablePath` | Get the table path                       |
+| `HasPrimaryKey() -> bool`     | Check if the table has a primary key     |
+
+## `TableAppend`
+
+| Method                                       | Description             |
+|----------------------------------------------|-------------------------|
+| `CreateWriter(AppendWriter& out) -> Result`  | Create an append writer |
+
+## `TableUpsert`
+
+| Method                                                                       | Description                                |
+|------------------------------------------------------------------------------|--------------------------------------------|
+| `PartialUpdateByIndex(std::vector<size_t> column_indices) -> TableUpsert&`   | Configure partial update by column indices |
+| `PartialUpdateByName(std::vector<std::string> column_names) -> TableUpsert&` | Configure partial update by column names   |
+| `CreateWriter(UpsertWriter& out) -> Result`                                  | Create an upsert writer                    |
+
+## `TableLookup`
+
+| Method                                    | Description                         |
+|-------------------------------------------|-------------------------------------|
+| `CreateLookuper(Lookuper& out) -> Result` | Create a lookuper for point lookups |
+
+## `TableScan`
+
+| Method                                                               | Description                                   |
+|----------------------------------------------------------------------|-----------------------------------------------|
+| `ProjectByIndex(std::vector<size_t> column_indices) -> TableScan&`   | Project columns by index                      |
+| `ProjectByName(std::vector<std::string> column_names) -> TableScan&` | Project columns by name                       |
+| `CreateLogScanner(LogScanner& out) -> Result`                        | Create a record-based log scanner             |
+| `CreateRecordBatchLogScanner(LogScanner& out) -> Result`             | Create an Arrow RecordBatch-based log scanner |
+
+## `AppendWriter`
+
+| Method                                                      | Description                            |
+|-------------------------------------------------------------|----------------------------------------|
+| `Append(const GenericRow& row) -> Result`                   | Append a row (fire-and-forget)         |
+| `Append(const GenericRow& row, WriteResult& out) -> Result` | Append a row with write acknowledgment |
+| `Flush() -> Result`                                         | Flush all pending writes               |
+
+## `UpsertWriter`
+
+| Method                                                      | Description                                   |
+|-------------------------------------------------------------|-----------------------------------------------|
+| `Upsert(const GenericRow& row) -> Result`                   | Upsert a row (fire-and-forget)                |
+| `Upsert(const GenericRow& row, WriteResult& out) -> Result` | Upsert a row with write acknowledgment        |
+| `Delete(const GenericRow& row) -> Result`                   | Delete a row by primary key (fire-and-forget) |
+| `Delete(const GenericRow& row, WriteResult& out) -> Result` | Delete a row with write acknowledgment        |
+| `Flush() -> Result`                                         | Flush all pending operations                  |
+
+## `WriteResult`
+
+| Method             | Description                                 |
+|--------------------|---------------------------------------------|
+| `Wait() -> Result` | Wait for server acknowledgment of the write |
+
+## `Lookuper`
+
+| Method                                                          | Description                  |
+|-----------------------------------------------------------------|------------------------------|
+| `Lookup(const GenericRow& pk_row, LookupResult& out) -> Result` | Look up a row by primary key |
+
+## `LogScanner`
+
+| Method                                                                                               |  Description                              |
+|------------------------------------------------------------------------------------------------------|-------------------------------------------|
+| `Subscribe(int32_t bucket_id, int64_t offset) -> Result`                                             | Subscribe to a single bucket at an offset |
+| `Subscribe(const std::vector<BucketSubscription>& bucket_offsets) -> Result`                         | Subscribe to multiple buckets             |
+| `SubscribePartitionBuckets(int64_t partition_id, int32_t bucket_id, int64_t start_offset) -> Result` | Subscribe to a single partition bucket    |
+| `SubscribePartitionBuckets(const std::vector<PartitionBucketSubscription>& subscriptions) -> Result` | Subscribe to multiple partition buckets   |
+| `Unsubscribe(int32_t bucket_id) -> Result`                                                           | Unsubscribe from a non-partitioned bucket |
+| `UnsubscribePartition(int64_t partition_id, int32_t bucket_id) -> Result`                            | Unsubscribe from a partition bucket       |
+| `Poll(int64_t timeout_ms, ScanRecords& out) -> Result`                                               | Poll individual records                   |
+| `PollRecordBatch(int64_t timeout_ms, ArrowRecordBatches& out) -> Result`                             | Poll Arrow RecordBatches                  |
+
+## `GenericRow`
+
+`GenericRow` is a **write-only** row used for append, upsert, delete, and lookup key construction. For reading field values from scan or lookup results, see [`RowView`](#rowview) and [`LookupResult`](#lookupresult).
+
+### Index-Based Setters
+
+| Method                                                    |  Description                   |
+|-----------------------------------------------------------|--------------------------------|
+| `SetNull(size_t idx)`                                     | Set field to null              |
+| `SetBool(size_t idx, bool value)`                         | Set boolean value              |
+| `SetInt32(size_t idx, int32_t value)`                     | Set 32-bit integer             |
+| `SetInt64(size_t idx, int64_t value)`                     | Set 64-bit integer             |
+| `SetFloat32(size_t idx, float value)`                     | Set 32-bit float               |
+| `SetFloat64(size_t idx, double value)`                    | Set 64-bit float               |
+| `SetString(size_t idx, const std::string& value)`         | Set string value               |
+| `SetBytes(size_t idx, const std::vector<uint8_t>& value)` | Set binary data                |
+| `SetDate(size_t idx, const Date& value)`                  | Set date value                 |
+| `SetTime(size_t idx, const Time& value)`                  | Set time value                 |
+| `SetTimestampNtz(size_t idx, const Timestamp& value)`     | Set timestamp without timezone |
+| `SetTimestampLtz(size_t idx, const Timestamp& value)`     | Set timestamp with local time zone |
+| `SetDecimal(size_t idx, const std::string& value)`        | Set decimal from string        |
+| `SetArray(size_t idx, ArrayWriter&& writer)`              | Set array value (consumes the writer) |
+
+### Name-Based Setters
+
+When using `table.NewRow()`, the `Set()` method auto-routes to the correct type based on the schema:
+
+| Method                                                   | Description                       |
+|----------------------------------------------------------|-----------------------------------|
+| `Set(const std::string& name, std::nullptr_t)`           | Set field to null by column name  |
+| `Set(const std::string& name, bool value)`               | Set boolean by column name        |
+| `Set(const std::string& name, int32_t value)`            | Set integer by column name        |
+| `Set(const std::string& name, int64_t value)`            | Set big integer by column name    |
+| `Set(const std::string& name, float value)`              | Set float by column name          |
+| `Set(const std::string& name, double value)`             | Set double by column name         |
+| `Set(const std::string& name, const std::string& value)` | Set string/decimal by column name |
+| `Set(const std::string& name, const Date& value)`        | Set date by column name           |
+| `Set(const std::string& name, const Time& value)`        | Set time by column name           |
+| `Set(const std::string& name, const Timestamp& value)`   | Set timestamp by column name      |
+
+## `RowView`
+
+Read-only row view for scan results. Provides zero-copy access to string and bytes data. `RowView` shares ownership of the underlying scan data via reference counting, so it can safely outlive the `ScanRecords` that produced it.
+
+:::note string_view Lifetime
+`GetString()` returns `std::string_view` that borrows from the underlying data. The `string_view` is valid as long as any `RowView` (or `ScanRecord`) referencing the same poll result is alive. Copy to `std::string` if you need the value after all references are gone.
+:::
+
+### Index-Based Getters
+
+| Method                                                     |  Description                   |
+|------------------------------------------------------------|--------------------------------|
+| `FieldCount() -> size_t`                                   | Get the number of fields       |
+| `GetType(size_t idx) -> TypeId`                            | Get the type at index          |
+| `IsNull(size_t idx) -> bool`                               | Check if field is null         |
+| `GetBool(size_t idx) -> bool`                              | Get boolean value at index     |
+| `GetInt32(size_t idx) -> int32_t`                          | Get 32-bit integer at index    |
+| `GetInt64(size_t idx) -> int64_t`                          | Get 64-bit integer at index    |
+| `GetFloat32(size_t idx) -> float`                          | Get 32-bit float at index      |
+| `GetFloat64(size_t idx) -> double`                         | Get 64-bit float at index      |
+| `GetString(size_t idx) -> std::string_view`                | Get string at index (zero-copy)|
+| `GetBytes(size_t idx) -> std::pair<const uint8_t*, size_t>`| Get binary data at index (zero-copy)|
+| `GetDate(size_t idx) -> Date`                              | Get date at index              |
+| `GetTime(size_t idx) -> Time`                              | Get time at index              |
+| `GetTimestamp(size_t idx) -> Timestamp`                    | Get timestamp at index         |
+| `IsDecimal(size_t idx) -> bool`                            | Check if field is a decimal type|
+| `GetDecimalString(size_t idx) -> std::string`              | Get decimal as string at index |
+
+### Array Getters (Index-Based)
+
+| Method                                                             |  Description                              |
+|--------------------------------------------------------------------|-------------------------------------------|
+| `GetArraySize(size_t idx) -> size_t`                               | Get element count of array at index       |
+| `GetArrayElementType(size_t idx) -> TypeId`                        | Get element type of array at index        |
+| `IsArrayElementNull(size_t idx, size_t element) -> bool`           | Check if array element is null            |
+| `GetArrayBool(size_t idx, size_t element) -> bool`                 | Get boolean array element                 |
+| `GetArrayInt32(size_t idx, size_t element) -> int32_t`             | Get 32-bit integer array element          |
+| `GetArrayInt64(size_t idx, size_t element) -> int64_t`             | Get 64-bit integer array element          |
+| `GetArrayFloat32(size_t idx, size_t element) -> float`             | Get 32-bit float array element            |
+| `GetArrayFloat64(size_t idx, size_t element) -> double`            | Get 64-bit float array element            |
+| `GetArrayString(size_t idx, size_t element) -> std::string`        | Get string array element                  |
+| `GetArrayBytes(size_t idx, size_t element) -> std::vector<uint8_t>`| Get binary array element                  |
+| `GetArrayDate(size_t idx, size_t element) -> Date`                 | Get date array element                    |
+| `GetArrayTime(size_t idx, size_t element) -> Time`                 | Get time array element                    |
+| `GetArrayTimestamp(size_t idx, size_t element) -> Timestamp`       | Get timestamp array element               |
+| `GetArrayDecimalString(size_t idx, size_t element) -> std::string` | Get decimal array element as string       |
+| `GetArrayView(size_t idx) -> ArrayView`                            | Get owning ArrayView for nested access    |
+
+All array getters are also available by column name (e.g., `GetArraySize("col")`, `GetArrayView("col")`).
+
+### Name-Based Getters
+
+| Method                                                  |  Description                       |
+|---------------------------------------------------------|------------------------------------|
+| `IsNull(const std::string& name) -> bool`               | Check if field is null by name     |
+| `GetBool(const std::string& name) -> bool`              | Get boolean by column name         |
+| `GetInt32(const std::string& name) -> int32_t`          | Get 32-bit integer by column name  |
+| `GetInt64(const std::string& name) -> int64_t`          | Get 64-bit integer by column name  |
+| `GetFloat32(const std::string& name) -> float`          | Get 32-bit float by column name    |
+| `GetFloat64(const std::string& name) -> double`         | Get 64-bit float by column name    |
+| `GetString(const std::string& name) -> std::string_view`| Get string by column name          |
+| `GetBytes(const std::string& name) -> std::pair<const uint8_t*, size_t>` | Get binary data by column name |
+| `GetDate(const std::string& name) -> Date`              | Get date by column name            |
+| `GetTime(const std::string& name) -> Time`              | Get time by column name            |
+| `GetTimestamp(const std::string& name) -> Timestamp`    | Get timestamp by column name       |
+| `GetDecimalString(const std::string& name) -> std::string` | Get decimal as string by column name |
+
+## `ScanRecord`
+
+`ScanRecord` is a value type that can be freely copied, stored, and accumulated across multiple `Poll()` calls. It shares ownership of the underlying scan data via reference counting.
+
+| Field         | Type         |  Description                                                        |
+|---------------|--------------|---------------------------------------------------------------------|
+| `offset`      | `int64_t`    | Record offset in the log                                            |
+| `timestamp`   | `int64_t`    | Record timestamp                                                    |
+| `change_type` | `ChangeType` | Change type (AppendOnly, Insert, UpdateBefore, UpdateAfter, Delete) |
+| `row`         | `RowView`    | Row data (value type, shares ownership via reference counting)      |
+
+## `ScanRecords`
+
+### Flat Access
+
+| Method                                  |  Description                               |
+|-----------------------------------------|--------------------------------------------|
+| `Count() -> size_t`                     | Total number of records across all buckets |
+| `IsEmpty() -> bool`                     | Check if empty                             |
+| `begin() / end()`                       | Iterator support for range-based for loops |
+
+Flat iteration over all records (regardless of bucket):
+
+```cpp
+for (const auto& rec : records) {
+    std::cout << "offset=" << rec.offset << std::endl;
+}
+```
+
+### Per-Bucket Access
+
+| Method                                                          |  Description                                                          |
+|-----------------------------------------------------------------|-----------------------------------------------------------------------|
+| `BucketCount() -> size_t`                                       | Number of distinct buckets                                            |
+| `Buckets() -> std::vector<TableBucket>`                         | List of distinct buckets                                              |
+| `Records(const TableBucket& bucket) -> BucketRecords`              | Records for a specific bucket (empty if bucket not present)           |
+| `BucketAt(size_t idx) -> BucketRecords`                            | Records by bucket index (0-based, O(1))                               |
+
+## `BucketRecords`
+
+A bundle of scan records belonging to a single bucket. Obtained from `ScanRecords::Records()` or `ScanRecords::BucketAt()`. `BucketRecords` is a value type — it shares ownership of the underlying scan data via reference counting, so it can safely outlive the `ScanRecords` that produced it.
+
+| Method                                         |  Description                               |
+|------------------------------------------------|--------------------------------------------|
+| `Size() -> size_t`                         | Number of records in this bucket           |
+| `Empty() -> bool`                          | Check if empty                             |
+| `Bucket() -> const TableBucket&`           | Get the bucket                             |
+| `operator[](size_t idx) -> ScanRecord`     | Access record by index within this bucket  |
+| `begin() / end()`                          | Iterator support for range-based for loops |
+
+## `TableBucket`
+
+| Field / Method                        |  Description                                    |
+|---------------------------------------|-------------------------------------------------|
+| `table_id -> int64_t`                    | Table ID                                        |
+| `bucket_id -> int32_t`                   | Bucket ID                                       |
+| `partition_id -> std::optional<int64_t>` | Partition ID (empty if non-partitioned)         |
+| `operator==(const TableBucket&) -> bool` | Equality comparison                             |
+
+## `LookupResult`
+
+Read-only result for lookup operations. Provides zero-copy access to field values.
+
+### Metadata
+
+| Method                      |  Description                   |
+|-----------------------------|--------------------------------|
+| `Found() -> bool`           | Whether a matching row was found |
+| `FieldCount() -> size_t`    | Get the number of fields       |
+
+### Index-Based Getters
+
+| Method                                                     |  Description                   |
+|------------------------------------------------------------|--------------------------------|
+| `GetType(size_t idx) -> TypeId`                            | Get the type at index          |
+| `IsNull(size_t idx) -> bool`                               | Check if field is null         |
+| `GetBool(size_t idx) -> bool`                              | Get boolean value at index     |
+| `GetInt32(size_t idx) -> int32_t`                          | Get 32-bit integer at index    |
+| `GetInt64(size_t idx) -> int64_t`                          | Get 64-bit integer at index    |
+| `GetFloat32(size_t idx) -> float`                          | Get 32-bit float at index      |
+| `GetFloat64(size_t idx) -> double`                         | Get 64-bit float at index      |
+| `GetString(size_t idx) -> std::string_view`                | Get string at index (zero-copy)|
+| `GetBytes(size_t idx) -> std::pair<const uint8_t*, size_t>`| Get binary data at index (zero-copy)|
+| `GetDate(size_t idx) -> Date`                              | Get date at index              |
+| `GetTime(size_t idx) -> Time`                              | Get time at index              |
+| `GetTimestamp(size_t idx) -> Timestamp`                    | Get timestamp at index         |
+| `IsDecimal(size_t idx) -> bool`                            | Check if field is a decimal type|
+| `GetDecimalString(size_t idx) -> std::string`              | Get decimal as string at index |
+
+### Array Getters (Index-Based)
+
+Same array getters as [`RowView`](#array-getters-index-based) — `GetArraySize`, `GetArrayInt32`, `GetArrayView`, etc. Also available by column name.
+
+### Name-Based Getters
+
+| Method                                                  |  Description                       |
+|---------------------------------------------------------|------------------------------------|
+| `IsNull(const std::string& name) -> bool`               | Check if field is null by name     |
+| `GetBool(const std::string& name) -> bool`              | Get boolean by column name         |
+| `GetInt32(const std::string& name) -> int32_t`          | Get 32-bit integer by column name  |
+| `GetInt64(const std::string& name) -> int64_t`          | Get 64-bit integer by column name  |
+| `GetFloat32(const std::string& name) -> float`          | Get 32-bit float by column name    |
+| `GetFloat64(const std::string& name) -> double`         | Get 64-bit float by column name    |
+| `GetString(const std::string& name) -> std::string_view`| Get string by column name          |
+| `GetBytes(const std::string& name) -> std::pair<const uint8_t*, size_t>` | Get binary data by column name |
+| `GetDate(const std::string& name) -> Date`              | Get date by column name            |
+| `GetTime(const std::string& name) -> Time`              | Get time by column name            |
+| `GetTimestamp(const std::string& name) -> Timestamp`    | Get timestamp by column name       |
+| `GetDecimalString(const std::string& name) -> std::string` | Get decimal as string by column name |
+
+## `ArrowRecordBatch`
+
+| Method                                                         | Description                          |
+|----------------------------------------------------------------|--------------------------------------|
+| `GetArrowRecordBatch() -> std::shared_ptr<arrow::RecordBatch>` | Get the underlying Arrow RecordBatch |
+| `Available() -> bool`                                          | Check if the batch is valid          |
+| `NumRows() -> int64_t`                                         | Number of rows in the batch          |
+| `GetTableId() -> int64_t`                                      | Table ID                             |
+| `GetPartitionId() -> int64_t`                                  | Partition ID                         |
+| `GetBucketId() -> int32_t`                                     | Bucket ID                            |
+| `GetBaseOffset() -> int64_t`                                   | First record offset                  |
+| `GetLastOffset() -> int64_t`                                   | Last record offset                   |
+
+## `ArrowRecordBatches`
+
+| Method                   |  Description                               |
+|--------------------------|--------------------------------------------|
+| `Size() -> size_t`       | Number of batches                          |
+| `Empty() -> bool`        | Check if empty                             |
+| `operator[](size_t idx)` | Access batch by index                      |
+| `begin() / end()`        | Iterator support for range-based for loops |
+
+## `Schema`
+
+| Method                            |  Description                |
+|-----------------------------------|-----------------------------|
+| `NewBuilder() -> Schema::Builder` | Create a new schema builder |
+
+## `Schema::Builder`
+
+| Method                                                                 |  Description            |
+|------------------------------------------------------------------------|-------------------------|
+| `AddColumn(const std::string& name, const DataType& type) -> Builder&` | Add a column            |
+| `SetPrimaryKeys(const std::vector<std::string>& keys) -> Builder&`     | Set primary key columns |
+| `Build() -> Schema`                                                    | Build the schema        |
+
+## `TableDescriptor`
+
+| Method                                     |  Description                          |
+|--------------------------------------------|---------------------------------------|
+| `NewBuilder() -> TableDescriptor::Builder` | Create a new table descriptor builder |
+
+## `TableDescriptor::Builder`
+
+| Method                                                                            | Description                |
+|-----------------------------------------------------------------------------------|----------------------------|
+| `SetSchema(const Schema& schema) -> Builder&`                                     | Set the table schema       |
+| `SetPartitionKeys(const std::vector<std::string>& keys) -> Builder&`              | Set partition key columns  |
+| `SetBucketCount(int32_t count) -> Builder&`                                       | Set the number of buckets  |
+| `SetBucketKeys(const std::vector<std::string>& keys) -> Builder&`                 | Set bucket key columns     |
+| `SetProperty(const std::string& key, const std::string& value) -> Builder&`       | Set a table property       |
+| `SetCustomProperty(const std::string& key, const std::string& value) -> Builder&` | Set a custom property      |
+| `SetComment(const std::string& comment) -> Builder&`                              | Set a table comment        |
+| `Build() -> TableDescriptor`                                                      | Build the table descriptor |
+
+## `DataType`
+
+### Factory Methods
+
+| Method                                        |  Description                       |
+|-----------------------------------------------|------------------------------------|
+| `DataType::Boolean()`                         | Boolean type                       |
+| `DataType::TinyInt()`                         | 8-bit signed integer               |
+| `DataType::SmallInt()`                        | 16-bit signed integer              |
+| `DataType::Int()`                             | 32-bit signed integer              |
+| `DataType::BigInt()`                          | 64-bit signed integer              |
+| `DataType::Float()`                           | 32-bit floating point              |
+| `DataType::Double()`                          | 64-bit floating point              |
+| `DataType::String()`                          | UTF-8 string                       |
+| `DataType::Bytes()`                           | Binary data                        |
+| `DataType::Date()`                            | Date (days since epoch)            |
+| `DataType::Time()`                            | Time (milliseconds since midnight) |
+| `DataType::Timestamp(int precision)`          | Timestamp without timezone         |
+| `DataType::TimestampLtz(int precision)`       | Timestamp with local timezone      |
+| `DataType::Decimal(int precision, int scale)` | Decimal with precision and scale   |
+| `DataType::Array(DataType element)`           | Array of the given element type    |
+
+### Accessors
+
+| Method                              |  Description                                |
+|-------------------------------------|---------------------------------------------|
+| `id() -> TypeId`                    | Get the type ID                             |
+| `precision() -> int`               | Get precision (for Decimal/Timestamp types) |
+| `scale() -> int`                   | Get scale (for Decimal type)                |
+| `nullable() -> bool`               | Returns `true` if this type is nullable (default), `false` if `NOT NULL` |
+| `element_type() -> const DataType*` | Get element type (for Array type, nullptr otherwise) |
+| `NotNull() -> DataType`            | Returns a copy of this type with nullable set to `false` |
+
+## `ArrayWriter`
+
+Write-only builder for array column values. Constructed with a fixed size and element type, then populated element-by-element. Move-only — consumed by `GenericRow::SetArray()` or `ArrayWriter::SetArray()` for nested arrays.
+
+| Method                                                    |  Description                              |
+|-----------------------------------------------------------|-------------------------------------------|
+| `ArrayWriter(size_t size, DataType element_type)`         | Create an array writer                    |
+| `SetNull(size_t idx)`                                     | Set element to null                       |
+| `SetBool(size_t idx, bool value)`                         | Set boolean element                       |
+| `SetInt32(size_t idx, int32_t value)`                     | Set 32-bit integer element                |
+| `SetInt64(size_t idx, int64_t value)`                     | Set 64-bit integer element                |
+| `SetFloat32(size_t idx, float value)`                     | Set 32-bit float element                  |
+| `SetFloat64(size_t idx, double value)`                    | Set 64-bit float element                  |
+| `SetString(size_t idx, const std::string& value)`         | Set string element                        |
+| `SetBytes(size_t idx, const std::vector<uint8_t>& value)` | Set binary element                        |
+| `SetDate(size_t idx, const Date& value)`                  | Set date element                          |
+| `SetTime(size_t idx, const Time& value)`                  | Set time element                          |
+| `SetTimestampNtz(size_t idx, const Timestamp& value)`     | Set timestamp without timezone element    |
+| `SetTimestampLtz(size_t idx, const Timestamp& value)`     | Set timestamp with timezone element       |
+| `SetDecimal(size_t idx, const std::string& value)`        | Set decimal element from string           |
+| `SetArray(size_t idx, ArrayWriter&& nested)`              | Set nested array element (consumes nested)|
+
+## `ArrayView`
+
+Read-only view over an array column value. Obtained from `RowView::GetArrayView()` or `LookupResult::GetArrayView()`, and recursively from `ArrayView::GetArray()` for nested `ARRAY<ARRAY<...>>` columns. Move-only.
+
+| Method                                                  |  Description                              |
+|---------------------------------------------------------|-------------------------------------------|
+| `Size() -> size_t`                                      | Get element count                         |
+| `ElementType() -> TypeId`                               | Get element type                          |
+| `IsNull(size_t element) -> bool`                        | Check if element is null                  |
+| `GetBool(size_t element) -> bool`                       | Get boolean element                       |
+| `GetInt32(size_t element) -> int32_t`                   | Get 32-bit integer element                |
+| `GetInt64(size_t element) -> int64_t`                   | Get 64-bit integer element                |
+| `GetFloat32(size_t element) -> float`                   | Get 32-bit float element                  |
+| `GetFloat64(size_t element) -> double`                  | Get 64-bit float element                  |
+| `GetString(size_t element) -> std::string`              | Get string element                        |
+| `GetBytes(size_t element) -> std::vector<uint8_t>`      | Get binary element                        |
+| `GetDate(size_t element) -> Date`                       | Get date element                          |
+| `GetTime(size_t element) -> Time`                       | Get time element                          |
+| `GetTimestamp(size_t element) -> Timestamp`              | Get timestamp element                     |
+| `GetTimestampLtz(size_t element) -> Timestamp`          | Get timestamp with timezone element       |
+| `GetDecimalString(size_t element) -> std::string`       | Get decimal element as string             |
+| `GetArray(size_t element) -> ArrayView`                 | Get nested array as child ArrayView       |
+
+## `TablePath`
+
+| Method / Field                                                     |  Description          |
+|--------------------------------------------------------------------|-----------------------|
+| `TablePath(const std::string& database, const std::string& table)` | Create a table path   |
+| `database_name -> std::string`                                     | Database name         |
+| `table_name -> std::string`                                        | Table name            |
+| `ToString() -> std::string`                                        | String representation |
+
+## `TableInfo`
+
+| Field               | Type                                           | Description                         |
+|---------------------|------------------------------------------------|-------------------------------------|
+| `table_id`          | `int64_t`                                      | Table ID                            |
+| `schema_id`         | `int32_t`                                      | Schema ID                           |
+| `table_path`        | `TablePath`                                    | Table path                          |
+| `created_time`      | `int64_t`                                      | Creation timestamp                  |
+| `modified_time`     | `int64_t`                                      | Last modification timestamp         |
+| `primary_keys`      | `std::vector<std::string>`                     | Primary key columns                 |
+| `bucket_keys`       | `std::vector<std::string>`                     | Bucket key columns                  |
+| `partition_keys`    | `std::vector<std::string>`                     | Partition key columns               |
+| `num_buckets`       | `int32_t`                                      | Number of buckets                   |
+| `has_primary_key`   | `bool`                                         | Whether the table has a primary key |
+| `is_partitioned`    | `bool`                                         | Whether the table is partitioned    |
+| `properties`        | `std::unordered_map<std::string, std::string>` | Table properties                    |
+| `custom_properties` | `std::unordered_map<std::string, std::string>` | Custom properties                   |
+| `comment`           | `std::string`                                  | Table comment                       |
+| `schema`            | `Schema`                                       | Table schema                        |
+
+## Temporal Types
+
+### `Date`
+
+| Method                                        |  Description                 |
+|-----------------------------------------------|------------------------------|
+| `Date::FromDays(int32_t days)`                | Create from days since epoch |
+| `Date::FromYMD(int year, int month, int day)` | Create from year, month, day |
+| `Year() -> int`                               | Get year                     |
+| `Month() -> int`                              | Get month                    |
+| `Day() -> int`                                | Get day                      |
+
+### `Time`
+
+| Method                                            |  Description                                 |
+|---------------------------------------------------|----------------------------------------------|
+| `Time::FromMillis(int32_t millis)`                | Create from milliseconds since midnight      |
+| `Time::FromHMS(int hour, int minute, int second)` | Create from hour, minute, second             |
+| `Hour() -> int`                                   | Get hour                                     |
+| `Minute() -> int`                                 | Get minute                                   |
+| `Second() -> int`                                 | Get second                                   |
+| `Millis() -> int64_t`                             | Get sub-second millisecond component (0-999) |
+
+### `Timestamp`
+
+| Method                                                               |  Description                             |
+|----------------------------------------------------------------------|------------------------------------------|
+| `Timestamp::FromMillis(int64_t millis)`                              | Create from milliseconds since epoch     |
+| `Timestamp::FromMillisNanos(int64_t millis, int32_t nanos)`          | Create from milliseconds and nanoseconds |
+| `Timestamp::FromTimePoint(std::chrono::system_clock::time_point tp)` | Create from a time point                 |
+
+## `PartitionInfo`
+
+| Field            | Type          |  Description   |
+|------------------|---------------|----------------|
+| `partition_id`   | `int64_t`     | Partition ID   |
+| `partition_name` | `std::string` | Partition name |
+
+## `DatabaseDescriptor`
+
+| Field        | Type                                           | Description       |
+|--------------|------------------------------------------------|-------------------|
+| `comment`    | `std::string`                                  | Database comment  |
+| `properties` | `std::unordered_map<std::string, std::string>` | Custom properties |
+
+## `DatabaseInfo`
+
+| Field           | Type                                           |  Description                |
+|-----------------|------------------------------------------------|-----------------------------|
+| `database_name` | `std::string`                                  | Database name               |
+| `comment`       | `std::string`                                  | Database comment            |
+| `properties`    | `std::unordered_map<std::string, std::string>` | Custom properties           |
+| `created_time`  | `int64_t`                                      | Creation timestamp          |
+| `modified_time` | `int64_t`                                      | Last modification timestamp |
+
+## `LakeSnapshot`
+
+| Field            | Type                        |  Description       |
+|------------------|-----------------------------|--------------------|
+| `snapshot_id`    | `int64_t`                   | Snapshot ID        |
+| `bucket_offsets` | `std::vector<BucketOffset>` | All bucket offsets |
+
+## `BucketOffset`
+
+| Field          | Type      | Description  |
+|----------------|-----------|--------------|
+| `table_id`     | `int64_t` | Table ID     |
+| `partition_id` | `int64_t` | Partition ID |
+| `bucket_id`    | `int32_t` | Bucket ID    |
+| `offset`       | `int64_t` | Offset value |
+
+## `OffsetSpec`
+
+| Method                                             | Description                             |
+|----------------------------------------------------|-----------------------------------------|
+| `OffsetSpec::Earliest()`                          | Query for the earliest available offset |
+| `OffsetSpec::Latest()`                            | Query for the latest offset             |
+| `OffsetSpec::Timestamp(int64_t timestamp_ms)`     | Query offset at a specific timestamp    |
+
+## Constants
+
+| Constant                 |  Value |  Description                                            |
+|--------------------------|--------|---------------------------------------------------------|
+| `fluss::EARLIEST_OFFSET` | `-2`   | Start reading from the earliest available offset        |
+
+To start reading from the latest offset (only new records), resolve the current offset via `ListOffsets` before subscribing:
+
+```cpp
+std::unordered_map<int32_t, int64_t> offsets;
+admin.ListOffsets(table_path, {0}, fluss::OffsetSpec::Latest(), offsets);
+scanner.Subscribe(0, offsets[0]);
+```
+
+## Enums
+
+### `ChangeType`
+
+| Value          | Short String | Description                      |
+|----------------|--------------|----------------------------------|
+| `AppendOnly`   | `+A`         | Append-only record               |
+| `Insert`       | `+I`         | Inserted row                     |
+| `UpdateBefore` | `-U`         | Previous value of an updated row |
+| `UpdateAfter`  | `+U`         | New value of an updated row      |
+| `Delete`       | `-D`         | Deleted row                      |
+
+The following helper converts a `ChangeType` value to its short string representation (include `<stdexcept>` for `std::invalid_argument`):
+
+```cpp
+inline const char* ChangeTypeShortString(ChangeType ct) {
+    switch (ct) {
+        case ChangeType::AppendOnly: return "+A";
+        case ChangeType::Insert: return "+I";
+        case ChangeType::UpdateBefore: return "-U";
+        case ChangeType::UpdateAfter: return "+U";
+        case ChangeType::Delete: return "-D";
+    }
+    throw std::invalid_argument("Unknown ChangeType");
+}
+```
+
+### `TypeId`
+
+| Value          |  Description               |
+|----------------|----------------------------|
+| `Boolean`      | Boolean type               |
+| `TinyInt`      | 8-bit signed integer       |
+| `SmallInt`     | 16-bit signed integer      |
+| `Int`          | 32-bit signed integer      |
+| `BigInt`       | 64-bit signed integer      |
+| `Float`        | 32-bit floating point      |
+| `Double`       | 64-bit floating point      |
+| `String`       | UTF-8 string               |
+| `Bytes`        | Binary data                |
+| `Date`         | Date                       |
+| `Time`         | Time                       |
+| `Timestamp`    | Timestamp without timezone |
+| `TimestampLtz` | Timestamp with local timezone |
+| `Decimal`      | Decimal                    |
+| `Array`        | Array of elements          |
+
+### `ChangeType` by Table Type
+
+| Value          |  Description                                |
+|----------------|---------------------------------------------|
+| `AppendOnly`   | Append-only record (log tables)             |
+| `Insert`       | Inserted row (PK tables)                    |
+| `UpdateBefore` | Row value before an update (PK tables)      |
+| `UpdateAfter`  | Row value after an update (PK tables)       |
+| `Delete`       | Deleted row (PK tables)                     |
+
+### `OffsetSpec`
+
+| Value       |  Description                   |
+|-------------|--------------------------------|
+| `Earliest`  | Earliest available offset      |
+| `Latest`    | Latest offset                  |
+| `Timestamp` | Offset at a specific timestamp |
diff --git a/website/docs/apis/cpp/data-types.md b/website/docs/apis/cpp/data-types.md
new file mode 100644
index 0000000000..cce40cefa1
--- /dev/null
+++ b/website/docs/apis/cpp/data-types.md
@@ -0,0 +1,250 @@
+---
+sidebar_position: 3
+---
+# Data Types
+
+## Schema DataTypes
+
+| DataType                   | Description                                                    |
+|----------------------------|----------------------------------------------------------------|
+| `DataType::Boolean()`      | Boolean value                                                  |
+| `DataType::TinyInt()`      | 8-bit signed integer                                           |
+| `DataType::SmallInt()`     | 16-bit signed integer                                          |
+| `DataType::Int()`          | 32-bit signed integer                                          |
+| `DataType::BigInt()`       | 64-bit signed integer                                          |
+| `DataType::Float()`        | 32-bit floating point                                          |
+| `DataType::Double()`       | 64-bit floating point                                          |
+| `DataType::String()`       | UTF-8 string                                                   |
+| `DataType::Bytes()`        | Binary data                                                    |
+| `DataType::Date()`         | Date (days since epoch)                                        |
+| `DataType::Time()`         | Time (milliseconds since midnight)                             |
+| `DataType::Timestamp()`    | Timestamp without timezone (default precision 6, microseconds) |
+| `DataType::TimestampLtz()` | Timestamp with timezone (default precision 6, microseconds)    |
+| `DataType::Decimal(p, s)`  | Decimal with precision and scale                               |
+| `DataType::Array(element)` | Array of the given element type (supports nesting)             |
+
+## Nullability
+
+All DataTypes are nullable by default. Use `.NotNull()` to create a `NOT NULL` type:
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("id", fluss::DataType::Int().NotNull())
+    .AddColumn("name", fluss::DataType::String())          // nullable by default
+    .Build();
+```
+
+Primary key columns are automatically forced `NOT NULL` regardless of the `DataType` setting.
+
+For nested types, nullability is preserved at each array level and at the leaf element:
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("tags", fluss::DataType::Array(fluss::DataType::String().NotNull()))
+    .AddColumn("ids", fluss::DataType::Array(fluss::DataType::Int()).NotNull())
+    .AddColumn("nested", fluss::DataType::Array(
+        fluss::DataType::Array(fluss::DataType::Int()).NotNull()))
+    .Build();
+// "tags":   ARRAY<STRING NOT NULL>         (outer nullable, elements NOT NULL)
+// "ids":    ARRAY<INT> NOT NULL            (outer NOT NULL, elements nullable)
+// "nested": ARRAY<ARRAY<INT> NOT NULL>     (outer nullable, inner array NOT NULL)
+```
+
+You can query nullability at runtime:
+
+```cpp
+auto info = table.GetTableInfo();
+bool is_nullable = info.schema.columns[0].data_type.nullable();
+```
+
+## GenericRow Setters
+
+`SetInt32` is used for `TinyInt`, `SmallInt`, and `Int` columns. For `TinyInt` and `SmallInt`, the value is validated at write time — an error is returned if it overflows the column's range (e.g., \[-128, 127\] for `TinyInt`, \[-32768, 32767\] for `SmallInt`).
+
+```cpp
+fluss::GenericRow row;
+row.SetNull(0);
+row.SetBool(1, true);
+row.SetInt32(2, 42);
+row.SetInt64(3, 1234567890L);
+row.SetFloat32(4, 3.14f);
+row.SetFloat64(5, 2.71828);
+row.SetString(6, "hello");
+row.SetBytes(7, {0x01, 0x02, 0x03});
+```
+
+### Array Columns
+
+Array values are built element-by-element using `ArrayWriter`, then attached to the row via `SetArray`:
+
+```cpp
+fluss::ArrayWriter aw(3, fluss::DataType::Int());
+aw.SetInt32(0, 10);
+aw.SetInt32(1, 20);
+aw.SetNull(2);
+row.SetArray(8, std::move(aw));
+```
+
+For nested arrays (e.g., `ARRAY<ARRAY<INT>>`), build inner arrays first:
+
+```cpp
+fluss::ArrayWriter inner(2, fluss::DataType::Int());
+inner.SetInt32(0, 1);
+inner.SetInt32(1, 2);
+
+fluss::ArrayWriter outer(1, fluss::DataType::Array(fluss::DataType::Int()));
+outer.SetArray(0, std::move(inner));
+row.SetArray(9, std::move(outer));
+```
+
+## Name-Based Setters
+
+When using `table.NewRow()`, you can set fields by column name. The setter automatically routes to the correct type based on the schema:
+
+```cpp
+auto row = table.NewRow();
+row.Set("user_id", 1);
+row.Set("name", "Alice");
+row.Set("score", 95.5f);
+row.Set("balance", "1234.56");   // decimal as string
+row.Set("birth_date", fluss::Date::FromYMD(1990, 3, 15));
+row.Set("login_time", fluss::Time::FromHMS(9, 30, 0));
+row.Set("created_at", fluss::Timestamp::FromMillis(1700000000000));
+row.Set("nickname", nullptr);    // set to null
+```
+
+## Reading Field Values
+
+Field values are read through `RowView` (from scan results) and `LookupResult` (from lookups), not through `GenericRow`. Both provide the same getter interface with zero-copy access to string and bytes data.
+
+`ScanRecord` is a value type — it can be freely copied, stored, and accumulated across multiple `Poll()` calls via reference counting.
+
+:::note string_view Lifetime
+`GetString()` returns `std::string_view` that borrows from the underlying data. The `string_view` is valid as long as any `ScanRecord` referencing the same poll result is alive. Copy to `std::string` if you need the value after all records are gone.
+:::
+
+```cpp
+// ScanRecord is a value type — safe to store and accumulate:
+std::vector<fluss::ScanRecord> all_records;
+fluss::ScanRecords records;
+scanner.Poll(5000, records);
+for (const auto& rec : records) {
+    all_records.push_back(rec);                    // safe! ref-counted
+    auto name = rec.row.GetString(0);              // zero-copy string_view
+    auto owned = std::string(rec.row.GetString(0)); // explicit copy when needed
+}
+
+// DON'T — string_view dangles after all records referencing the data are destroyed:
+std::string_view dangling;
+{
+    fluss::ScanRecords records;
+    scanner.Poll(5000, records);
+    dangling = records[0].row.GetString(0);
+}
+// dangling is undefined behavior here — no ScanRecord keeps the data alive!
+```
+
+### From Scan Results (RowView)
+
+```cpp
+for (const auto& rec : records) {
+    auto name = rec.row.GetString(1);          // zero-copy string_view
+    float score = rec.row.GetFloat32(3);
+    auto balance = rec.row.GetDecimalString(4); // std::string (already owned)
+    fluss::Date date = rec.row.GetDate(5);
+    fluss::Time time = rec.row.GetTime(6);
+    fluss::Timestamp ts = rec.row.GetTimestamp(7);
+}
+```
+
+### From Lookup Results (LookupResult)
+
+```cpp
+fluss::LookupResult result;
+lookuper.Lookup(pk_row, result);
+if (result.Found()) {
+    auto name = result.GetString(1);  // zero-copy string_view
+    int64_t age = result.GetInt64(2);
+}
+```
+
+### Reading Array Columns
+
+Array columns can be read element-by-element using index-based getters, or via an `ArrayView` for recursive access:
+
+```cpp
+// Element-by-element access (flat arrays)
+size_t len = rec.row.GetArraySize(8);
+for (size_t i = 0; i < len; i++) {
+    if (!rec.row.IsArrayElementNull(8, i)) {
+        int32_t val = rec.row.GetArrayInt32(8, i);
+    }
+}
+
+// ArrayView for nested arrays or when you need a standalone handle
+fluss::ArrayView av = rec.row.GetArrayView(8);
+for (size_t i = 0; i < av.Size(); i++) {
+    if (!av.IsNull(i)) {
+        int32_t val = av.GetInt32(i);
+    }
+}
+
+// Nested arrays: ArrayView::GetArray() returns a child ArrayView
+fluss::ArrayView outer = rec.row.GetArrayView(9);
+for (size_t i = 0; i < outer.Size(); i++) {
+    fluss::ArrayView inner = outer.GetArray(i);
+    for (size_t j = 0; j < inner.Size(); j++) {
+        int32_t val = inner.GetInt32(j);
+    }
+}
+```
+
+## TypeId Enum
+
+`TinyInt` and `SmallInt` values are widened to `int32_t` on read.
+
+| TypeId          | C++ Type                                    | Getter                    |
+|-----------------|---------------------------------------------|---------------------------|
+| `Boolean`       | `bool`                                      | `GetBool(idx)`            |
+| `TinyInt`       | `int32_t`                                   | `GetInt32(idx)`           |
+| `SmallInt`      | `int32_t`                                   | `GetInt32(idx)`           |
+| `Int`           | `int32_t`                                   | `GetInt32(idx)`           |
+| `BigInt`        | `int64_t`                                   | `GetInt64(idx)`           |
+| `Float`         | `float`                                     | `GetFloat32(idx)`         |
+| `Double`        | `double`                                    | `GetFloat64(idx)`         |
+| `String`        | `std::string_view`                          | `GetString(idx)`          |
+| `Bytes`         | `std::pair<const uint8_t*, size_t>`         | `GetBytes(idx)`           |
+| `Date`          | `Date`                                      | `GetDate(idx)`            |
+| `Time`          | `Time`                                      | `GetTime(idx)`            |
+| `Timestamp`     | `Timestamp`                                 | `GetTimestamp(idx)`       |
+| `TimestampLtz`  | `Timestamp`                                 | `GetTimestamp(idx)`       |
+| `Decimal`       | `std::string`                               | `GetDecimalString(idx)`   |
+| `Array`         | `ArrayView`                                 | `GetArrayView(idx)`       |
+
+## Type Checking
+
+```cpp
+if (rec.row.GetType(0) == fluss::TypeId::Int) {
+    int32_t value = rec.row.GetInt32(0);
+}
+if (rec.row.IsNull(1)) {
+    // field is null
+}
+if (rec.row.IsDecimal(2)) {
+    std::string decimal_str = rec.row.GetDecimalString(2);
+}
+```
+
+## Constants
+
+```cpp
+constexpr int64_t fluss::EARLIEST_OFFSET = -2;  // Start from earliest
+```
+
+To start reading from the latest offset, resolve the current offset via `ListOffsets` before subscribing:
+
+```cpp
+std::unordered_map<int32_t, int64_t> offsets;
+admin.ListOffsets(table_path, {0}, fluss::OffsetSpec::Latest(), offsets);
+scanner.Subscribe(0, offsets[0]);
+```
diff --git a/website/docs/apis/cpp/error-handling.md b/website/docs/apis/cpp/error-handling.md
new file mode 100644
index 0000000000..7447a264c7
--- /dev/null
+++ b/website/docs/apis/cpp/error-handling.md
@@ -0,0 +1,238 @@
+---
+sidebar_position: 4
+---
+# Error Handling
+
+All C++ client operations return a `fluss::Result` struct instead of throwing exceptions. This gives you explicit control over error handling.
+
+## The `Result` Struct
+
+```cpp
+#include "fluss.hpp"
+
+// All operations return fluss::Result
+fluss::Result result = admin.CreateTable(path, descriptor);
+if (!result.Ok()) {
+    std::cerr << "Error code: " << result.error_code << std::endl;
+    std::cerr << "Error message: " << result.error_message << std::endl;
+}
+```
+
+| Field / Method   | Type          | Description                               |
+|------------------|---------------|-------------------------------------------|
+| `error_code`     | `int32_t`     | 0 for success, non-zero for errors        |
+| `error_message`  | `std::string` | Human-readable error description          |
+| `Ok()`           | `bool`        | Returns `true` if the operation succeeded |
+
+## Handling Errors
+
+Check the `Result` after each operation and decide how to respond, e.g. log and continue, retry, or abort:
+
+```cpp
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
+if (!result.Ok()) {
+    // Log, retry, or propagate the error as appropriate
+    std::cerr << "Connection failed (code " << result.error_code
+              << "): " << result.error_message << std::endl;
+    return 1;
+}
+```
+
+## Connection State Checking
+
+Use `Available()` to verify that a connection or object is valid before using it:
+
+```cpp
+fluss::Connection conn;
+if (!conn.Available()) {
+    // Connection not initialized or already moved
+}
+
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+fluss::Result result = fluss::Connection::Create(config, conn);
+if (result.Ok() && conn.Available()) {
+    // Connection is ready to use
+}
+```
+
+## Error Codes
+
+Server-side errors carry a specific error code (>0 or -1). Client-side errors (connection failures, type mismatches, etc.) use `ErrorCode::CLIENT_ERROR` (-2). Use `fluss::ErrorCode` to match on specific codes:
+
+```cpp
+fluss::Result result = admin.DropTable(table_path);
+if (!result.Ok()) {
+    if (result.error_code == fluss::ErrorCode::TABLE_NOT_EXIST) {
+        std::cerr << "Table does not exist" << std::endl;
+    } else if (result.error_code == fluss::ErrorCode::PARTITION_NOT_EXISTS) {
+        std::cerr << "Partition does not exist" << std::endl;
+    } else if (result.error_code == fluss::ErrorCode::CLIENT_ERROR) {
+        std::cerr << "Client-side error: " << result.error_message << std::endl;
+    } else {
+        std::cerr << "Server error (code " << result.error_code
+                  << "): " << result.error_message << std::endl;
+    }
+}
+```
+
+### Common Error Codes
+
+| Constant                                      | Code | Description                         |
+|-----------------------------------------------|------|-------------------------------------|
+| `ErrorCode::CLIENT_ERROR`                     | -2   | Client-side error (not from server) |
+| `ErrorCode::UNKNOWN_SERVER_ERROR`             | -1   | Unexpected server error             |
+| `ErrorCode::NETWORK_EXCEPTION`                | 1    | Server disconnected before response |
+| `ErrorCode::DATABASE_NOT_EXIST`               | 4    | Database does not exist             |
+| `ErrorCode::DATABASE_ALREADY_EXIST`           | 6    | Database already exists             |
+| `ErrorCode::TABLE_NOT_EXIST`                  | 7    | Table does not exist                |
+| `ErrorCode::TABLE_ALREADY_EXIST`              | 8    | Table already exists                |
+| `ErrorCode::INVALID_TABLE_EXCEPTION`          | 15   | Invalid table operation             |
+| `ErrorCode::REQUEST_TIME_OUT`                 | 25   | Request timed out                   |
+| `ErrorCode::PARTITION_NOT_EXISTS`             | 36   | Partition does not exist            |
+| `ErrorCode::PARTITION_ALREADY_EXISTS`         | 42   | Partition already exists            |
+| `ErrorCode::PARTITION_SPEC_INVALID_EXCEPTION` | 43   | Invalid partition spec              |
+| `ErrorCode::LEADER_NOT_AVAILABLE_EXCEPTION`   | 44   | No leader available for partition   |
+| `ErrorCode::AUTHENTICATE_EXCEPTION`           | 46   | Authentication failed (bad credentials) |
+
+See `fluss::ErrorCode` in `fluss.hpp` for the full list of named constants.
+
+## Retry Logic
+
+Some errors are transient: the server may be temporarily unavailable, mid-election, or under load. Use `IsRetriable()` to decide whether to retry an operation rather than treating the error as permanent.
+
+`Result::IsRetriable()` is a convenience method available directly on the result; it applies the static helper `ErrorCode::IsRetriable(int32_t code)` to the result's error code:
+
+```cpp
+fluss::Result result = writer.Append(row);
+if (!result.Ok()) {
+    if (result.IsRetriable()) {
+        // Transient failure — safe to retry 
+    } else {
+        // Permanent failure — log and abort
+        std::cerr << "Fatal error (code " << result.error_code
+                  << "): " << result.error_message << std::endl;
+    }
+}
+```
+
+`Result::IsRetriable()` delegates to `ErrorCode::IsRetriable()`, so you can also call it directly on the code:
+
+```cpp
+if (fluss::ErrorCode::IsRetriable(result.error_code)) {
+    // retry
+}
+```
+
+### Retriable Error Codes
+
+| Constant                                                    | Code | Reason                                    |
+|-------------------------------------------------------------|------|-------------------------------------------|
+| `ErrorCode::NETWORK_EXCEPTION`                          | 1    | Server disconnected                       |
+| `ErrorCode::CORRUPT_MESSAGE`                            | 3    | CRC or size error                         |
+| `ErrorCode::SCHEMA_NOT_EXIST`                           | 9    | Schema may not exist                      |
+| `ErrorCode::LOG_STORAGE_EXCEPTION`                      | 10   | Transient log storage error               |
+| `ErrorCode::KV_STORAGE_EXCEPTION`                       | 11   | Transient KV storage error                |
+| `ErrorCode::NOT_LEADER_OR_FOLLOWER`                     | 12   | Leader election in progress               |
+| `ErrorCode::CORRUPT_RECORD_EXCEPTION`                   | 14   | Corrupt record                            |
+| `ErrorCode::UNKNOWN_TABLE_OR_BUCKET_EXCEPTION`          | 21   | Metadata not yet available                |
+| `ErrorCode::REQUEST_TIME_OUT`                           | 25   | Request timed out                         |
+| `ErrorCode::STORAGE_EXCEPTION`                          | 26   | Transient storage error                   |
+| `ErrorCode::NOT_ENOUGH_REPLICAS_AFTER_APPEND_EXCEPTION` | 28   | Wrote to server but with low ISR size     |
+| `ErrorCode::NOT_ENOUGH_REPLICAS_EXCEPTION`              | 29   | Low ISR size at write time                |
+| `ErrorCode::LEADER_NOT_AVAILABLE_EXCEPTION`             | 44   | No leader available for partition         |
+
+Client-side errors (`ErrorCode::CLIENT_ERROR`, code -2) always return `false` from `IsRetriable()`.
+
+## Common Error Scenarios
+
+### Connection Refused
+
+The cluster is not running or the address is incorrect:
+
+```cpp
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
+if (!result.Ok()) {
+    // "Connection refused" or timeout error
+    std::cerr << "Cannot connect to cluster: " << result.error_message << std::endl;
+}
+```
+
+### Table Not Found
+
+Attempting to access a table that does not exist:
+
+```cpp
+fluss::Table table;
+fluss::Result result = conn.GetTable(fluss::TablePath("fluss", "nonexistent"), table);
+if (!result.Ok()) {
+    if (result.error_code == fluss::ErrorCode::TABLE_NOT_EXIST) {
+        std::cerr << "Table not found" << std::endl;
+    }
+}
+```
+
+### Partition Not Found
+
+Writing to a partitioned primary key table before creating partitions:
+
+```cpp
+// This will fail if partitions are not created first
+auto row = table.NewRow();
+row.Set("user_id", 1);
+row.Set("region", "US");
+row.Set("score", static_cast<int64_t>(100));
+fluss::WriteResult wr;
+fluss::Result result = writer.Upsert(row, wr);
+if (!result.Ok()) {
+    if (result.error_code == fluss::ErrorCode::PARTITION_NOT_EXISTS) {
+        std::cerr << "Partition not found, create partitions before writing" << std::endl;
+    }
+}
+```
+
+### Authentication Failed
+
+SASL credentials are incorrect or the user does not exist:
+
+```cpp
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+config.security_protocol = "sasl";
+config.security_sasl_username = "admin";
+config.security_sasl_password = "wrong-password";
+
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
+if (!result.Ok()) {
+    if (result.error_code == fluss::ErrorCode::AUTHENTICATE_EXCEPTION) {
+        std::cerr << "Authentication failed: " << result.error_message << std::endl;
+    }
+}
+```
+
+### Schema Mismatch
+
+Using incorrect types or column indices when writing:
+
+```cpp
+fluss::GenericRow row;
+// Setting wrong type for a column will result in an error
+// when the row is sent to the server
+row.SetString(0, "not_an_integer");  // Column 0 expects Int
+fluss::Result result = writer.Append(row);
+if (!result.Ok()) {
+    std::cerr << "Schema mismatch: " << result.error_message << std::endl;
+}
+```
+
+## Best Practices
+
+1. **Always check `Result`**: Never ignore the return value of operations that return `Result`.
+2. **Handle errors gracefully**: Log errors and retry or fail gracefully rather than crashing.
+3. **Verify connection state**: Use `Available()` to check connection validity before operations.
+4. **Create partitions before writing**: For partitioned primary key tables, always create partitions before attempting upserts.
diff --git a/website/docs/apis/cpp/example/_category_.json b/website/docs/apis/cpp/example/_category_.json
new file mode 100644
index 0000000000..4d81ec12ae
--- /dev/null
+++ b/website/docs/apis/cpp/example/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Examples",
+  "position": 5
+}
diff --git a/website/docs/apis/cpp/example/admin-operations.md b/website/docs/apis/cpp/example/admin-operations.md
new file mode 100644
index 0000000000..0f08549a0e
--- /dev/null
+++ b/website/docs/apis/cpp/example/admin-operations.md
@@ -0,0 +1,158 @@
+---
+sidebar_position: 3
+---
+# Admin Operations
+
+## Get Admin Interface
+
+```cpp
+fluss::Admin admin;
+conn.GetAdmin(admin);
+```
+
+## Database Operations
+
+```cpp
+// Create database
+fluss::DatabaseDescriptor db_descriptor;
+db_descriptor.comment = "My database";
+admin.CreateDatabase("my_database", db_descriptor, true);
+
+// List all databases
+std::vector<std::string> databases;
+admin.ListDatabases(databases);
+for (const auto& db : databases) {
+    std::cout << "Database: " << db << std::endl;
+}
+
+// Check if database exists
+bool exists = false;
+admin.DatabaseExists("my_database", exists);
+
+// Get database information
+fluss::DatabaseInfo db_info;
+admin.GetDatabaseInfo("my_database", db_info);
+std::cout << "Database: " << db_info.database_name << std::endl;
+
+// Drop database
+admin.DropDatabase("my_database", true, false);
+```
+
+## Table Operations
+
+```cpp
+fluss::TablePath table_path("fluss", "my_table");
+
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("id", fluss::DataType::Int())
+    .AddColumn("name", fluss::DataType::String())
+    .AddColumn("score", fluss::DataType::Float())
+    .AddColumn("age", fluss::DataType::Int())
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetBucketCount(3)
+    .SetComment("Example table")
+    .Build();
+
+// Create table
+admin.CreateTable(table_path, descriptor, true);
+
+// Get table information
+fluss::TableInfo table_info;
+admin.GetTableInfo(table_path, table_info);
+std::cout << "Table ID: " << table_info.table_id << std::endl;
+std::cout << "Number of buckets: " << table_info.num_buckets << std::endl;
+std::cout << "Has primary key: " << table_info.has_primary_key << std::endl;
+std::cout << "Is partitioned: " << table_info.is_partitioned << std::endl;
+
+// Drop table
+admin.DropTable(table_path, true);
+```
+
+## Schema Builder Options
+
+```cpp
+// Schema with primary key
+auto pk_schema = fluss::Schema::NewBuilder()
+    .AddColumn("id", fluss::DataType::Int())
+    .AddColumn("name", fluss::DataType::String())
+    .AddColumn("value", fluss::DataType::Double())
+    .SetPrimaryKeys({"id"})
+    .Build();
+
+// Table descriptor with partitioning
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetPartitionKeys({"date"})
+    .SetBucketCount(3)
+    .SetBucketKeys({"user_id"})
+    .SetProperty("retention_days", "7")
+    .SetComment("Sample table")
+    .Build();
+```
+
+## Partition Operations
+
+```cpp
+// Create a partition
+std::unordered_map<std::string, std::string> partition_spec = {{"region", "US"}};
+admin.CreatePartition(table_path, partition_spec, true);
+
+// List all partitions
+std::vector<fluss::PartitionInfo> partitions;
+admin.ListPartitionInfos(table_path, partitions);
+for (const auto& p : partitions) {
+    std::cout << "Partition: id=" << p.partition_id
+              << ", name=" << p.partition_name << std::endl;
+}
+
+// Drop a partition
+admin.DropPartition(table_path, partition_spec, true);
+```
+
+## Offset Operations
+
+```cpp
+std::vector<int32_t> bucket_ids = {0, 1, 2};
+
+// Query earliest offsets
+std::unordered_map<int32_t, int64_t> earliest_offsets;
+admin.ListOffsets(table_path, bucket_ids,
+                  fluss::OffsetSpec::Earliest(), earliest_offsets);
+
+// Query latest offsets
+std::unordered_map<int32_t, int64_t> latest_offsets;
+admin.ListOffsets(table_path, bucket_ids,
+                  fluss::OffsetSpec::Latest(), latest_offsets);
+
+// Query offsets for a specific timestamp
+std::unordered_map<int32_t, int64_t> timestamp_offsets;
+admin.ListOffsets(table_path, bucket_ids,
+                  fluss::OffsetSpec::Timestamp(timestamp_ms),
+                  timestamp_offsets);
+
+// Query partition offsets
+std::unordered_map<int32_t, int64_t> partition_offsets;
+admin.ListPartitionOffsets(table_path, "partition_name",
+                           bucket_ids, fluss::OffsetSpec::Latest(),
+                           partition_offsets);
+```
+
+## Lake Snapshot
+
+:::note
+Lake snapshots require [lake integration](https://fluss.apache.org/docs/maintenance/tiered-storage/overview/) (e.g. Paimon or Iceberg) to be enabled on the server. Without it, `GetLatestLakeSnapshot` will return an error.
+:::
+
+```cpp
+fluss::LakeSnapshot snapshot;
+admin.GetLatestLakeSnapshot(table_path, snapshot);
+std::cout << "Snapshot ID: " << snapshot.snapshot_id << std::endl;
+for (const auto& bucket_offset : snapshot.bucket_offsets) {
+    std::cout << "  Table " << bucket_offset.table_id
+              << ", Bucket " << bucket_offset.bucket_id
+              << ": offset=" << bucket_offset.offset << std::endl;
+}
+```
diff --git a/website/docs/apis/cpp/example/configuration.md b/website/docs/apis/cpp/example/configuration.md
new file mode 100644
index 0000000000..38202618c9
--- /dev/null
+++ b/website/docs/apis/cpp/example/configuration.md
@@ -0,0 +1,42 @@
+---
+sidebar_position: 2
+---
+# Configuration
+
+## Connection Setup
+
+```cpp
+#include "fluss.hpp"
+
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
+
+if (!result.Ok()) {
+    std::cerr << "Connection failed: " << result.error_message << std::endl;
+}
+```
+
+## Connection Configurations
+
+All fields have sensible defaults. Only `bootstrap_servers` typically needs to be set.
+
+See the [`Configuration`](../api-reference.md#configuration) section in the API Reference for the full list of configuration fields, types, and defaults.
+
+## SASL Authentication
+
+To connect to a Fluss cluster with SASL/PLAIN authentication enabled:
+
+```cpp
+fluss::Configuration config;
+config.bootstrap_servers = "127.0.0.1:9123";
+config.security_protocol = "sasl";
+config.security_sasl_mechanism = "PLAIN";
+config.security_sasl_username = "admin";
+config.security_sasl_password = "admin-secret";
+
+fluss::Connection conn;
+fluss::Result result = fluss::Connection::Create(config, conn);
+```
diff --git a/website/docs/apis/cpp/example/index.md b/website/docs/apis/cpp/example/index.md
new file mode 100644
index 0000000000..51f60e4175
--- /dev/null
+++ b/website/docs/apis/cpp/example/index.md
@@ -0,0 +1,63 @@
+---
+sidebar_position: 1
+---
+# Example
+
+Minimal working example: connect to Fluss, create a table, write data, and read it back.
+
+```cpp
+#include <iostream>
+#include "fluss.hpp"
+
+int main() {
+    // Connect
+    fluss::Configuration config;
+    config.bootstrap_servers = "127.0.0.1:9123";
+
+    fluss::Connection conn;
+    fluss::Connection::Create(config, conn);
+
+    fluss::Admin admin;
+    conn.GetAdmin(admin);
+
+    // Create a log table
+    fluss::TablePath table_path("fluss", "quickstart_cpp");
+    auto schema = fluss::Schema::NewBuilder()
+        .AddColumn("id", fluss::DataType::Int())
+        .AddColumn("name", fluss::DataType::String())
+        .Build();
+    auto descriptor = fluss::TableDescriptor::NewBuilder()
+        .SetSchema(schema)
+        .Build();
+    admin.CreateTable(table_path, descriptor, true);
+
+    // Write
+    fluss::Table table;
+    conn.GetTable(table_path, table);
+
+    fluss::AppendWriter writer;
+    table.NewAppend().CreateWriter(writer);
+
+    fluss::GenericRow row;
+    row.SetInt32(0, 1);
+    row.SetString(1, "hello");
+    writer.Append(row);
+    writer.Flush();
+
+    // Read
+    fluss::LogScanner scanner;
+    table.NewScan().CreateLogScanner(scanner);
+    auto info = table.GetTableInfo();
+    for (int b = 0; b < info.num_buckets; ++b) {
+        scanner.Subscribe(b, 0);
+    }
+    fluss::ScanRecords records;
+    scanner.Poll(5000, records);
+    for (const auto& rec : records) {
+        std::cout << "id=" << rec.row.GetInt32(0)
+                  << ", name=" << rec.row.GetString(1) << std::endl;
+    }
+
+    return 0;
+}
+```
diff --git a/website/docs/apis/cpp/example/log-tables.md b/website/docs/apis/cpp/example/log-tables.md
new file mode 100644
index 0000000000..0125a4ce29
--- /dev/null
+++ b/website/docs/apis/cpp/example/log-tables.md
@@ -0,0 +1,161 @@
+---
+sidebar_position: 4
+---
+# Log Tables
+
+Log tables are append-only tables without primary keys, suitable for event streaming.
+
+## Creating a Log Table
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("event_id", fluss::DataType::Int())
+    .AddColumn("event_type", fluss::DataType::String())
+    .AddColumn("timestamp", fluss::DataType::BigInt())
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .Build();
+
+fluss::TablePath table_path("fluss", "events");
+admin.CreateTable(table_path, descriptor, true);
+```
+
+## Writing to Log Tables
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+fluss::AppendWriter writer;
+table.NewAppend().CreateWriter(writer);
+
+fluss::GenericRow row;
+row.SetInt32(0, 1);           // event_id
+row.SetString(1, "user_login");  // event_type
+row.SetInt64(2, 1704067200000L); // timestamp
+writer.Append(row);
+
+writer.Flush();
+```
+
+## Reading from Log Tables
+
+```cpp
+fluss::LogScanner scanner;
+table.NewScan().CreateLogScanner(scanner);
+
+auto info = table.GetTableInfo();
+for (int b = 0; b < info.num_buckets; ++b) {
+    scanner.Subscribe(b, 0);
+}
+
+fluss::ScanRecords records;
+scanner.Poll(5000, records);  // timeout in ms
+
+for (const auto& rec : records) {
+    std::cout << "event_id=" << rec.row.GetInt32(0)
+              << " event_type=" << rec.row.GetString(1)
+              << " timestamp=" << rec.row.GetInt64(2)
+              << " @ offset=" << rec.offset << std::endl;
+}
+
+// Or per-bucket access
+for (const auto& bucket : records.Buckets()) {
+    auto view = records.Records(bucket);
+    std::cout << "Bucket " << bucket.bucket_id << ": "
+              << view.Size() << " records" << std::endl;
+    for (const auto& rec : view) {
+        std::cout << "  event_id=" << rec.row.GetInt32(0)
+                  << " event_type=" << rec.row.GetString(1)
+                  << " @ offset=" << rec.offset << std::endl;
+    }
+}
+```
+
+**Continuous polling:**
+
+```cpp
+while (running) {
+    fluss::ScanRecords records;
+    scanner.Poll(1000, records);
+    for (const auto& rec : records) {
+        process(rec);
+    }
+}
+```
+
+**Accumulating records across polls:**
+
+`ScanRecord` is a value type — it can be freely copied, stored, and accumulated. The underlying data stays alive via reference counting (zero-copy).
+
+```cpp
+std::vector<fluss::ScanRecord> all_records;
+while (all_records.size() < 1000) {
+    fluss::ScanRecords records;
+    scanner.Poll(1000, records);
+    for (const auto& rec : records) {
+        all_records.push_back(rec);  // ref-counted, no data copy
+    }
+}
+// all_records is valid — each record keeps its data alive
+```
+
+**Batch subscribe:**
+
+```cpp
+std::vector<fluss::BucketSubscription> subscriptions;
+subscriptions.push_back({0, 0});    // bucket 0, offset 0
+subscriptions.push_back({1, 100});  // bucket 1, offset 100
+scanner.Subscribe(subscriptions);
+```
+
+**Unsubscribe from a bucket:**
+
+```cpp
+// Stop receiving records from bucket 1
+scanner.Unsubscribe(1);
+```
+
+**Arrow RecordBatch polling (high performance):**
+
+```cpp
+#include <arrow/record_batch.h>
+
+fluss::LogScanner arrow_scanner;
+table.NewScan().CreateRecordBatchLogScanner(arrow_scanner);
+
+for (int b = 0; b < info.num_buckets; ++b) {
+    arrow_scanner.Subscribe(b, 0);
+}
+
+fluss::ArrowRecordBatches batches;
+arrow_scanner.PollRecordBatch(5000, batches);
+
+for (size_t i = 0; i < batches.Size(); ++i) {
+    const auto& batch = batches[i];
+    if (batch->Available()) {
+        auto arrow_batch = batch->GetArrowRecordBatch();
+        std::cout << "Batch " << i << ": " << arrow_batch->num_rows() << " rows"
+                  << ", partition_id=" << batch->GetPartitionId()
+                  << ", bucket_id=" << batch->GetBucketId() << std::endl;
+    }
+}
+```
+
+## Column Projection
+
+```cpp
+// Project by column index
+fluss::LogScanner projected_scanner;
+table.NewScan().ProjectByIndex({0, 2}).CreateLogScanner(projected_scanner);
+
+// Project by column name
+fluss::LogScanner name_projected_scanner;
+table.NewScan().ProjectByName({"event_id", "timestamp"}).CreateLogScanner(name_projected_scanner);
+
+// Arrow RecordBatch with projection
+fluss::LogScanner projected_arrow_scanner;
+table.NewScan().ProjectByIndex({0, 2}).CreateRecordBatchLogScanner(projected_arrow_scanner);
+```
diff --git a/website/docs/apis/cpp/example/partitioned-tables.md b/website/docs/apis/cpp/example/partitioned-tables.md
new file mode 100644
index 0000000000..17c1c2057d
--- /dev/null
+++ b/website/docs/apis/cpp/example/partitioned-tables.md
@@ -0,0 +1,179 @@
+---
+sidebar_position: 6
+---
+# Partitioned Tables
+
+Partitioned tables distribute data across partitions based on partition column values, enabling efficient data organization and querying. Both log tables and primary key tables support partitioning.
+
+## Partitioned Log Tables
+
+### Creating a Partitioned Log Table
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("event_id", fluss::DataType::Int())
+    .AddColumn("event_type", fluss::DataType::String())
+    .AddColumn("dt", fluss::DataType::String())
+    .AddColumn("region", fluss::DataType::String())
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetPartitionKeys({"dt", "region"})
+    .SetBucketCount(3)
+    .Build();
+
+fluss::TablePath table_path("fluss", "partitioned_events");
+admin.CreateTable(table_path, descriptor, true);
+```
+
+### Writing to Partitioned Log Tables
+
+**Partitions must exist before writing data; otherwise, the client will by default retry indefinitely.** Include partition column values in each row; the client routes records to the correct partition automatically.
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+fluss::AppendWriter writer;
+table.NewAppend().CreateWriter(writer);
+
+fluss::GenericRow row;
+row.SetInt32(0, 1);
+row.SetString(1, "user_login");
+row.SetString(2, "2024-01-15");
+row.SetString(3, "US");
+writer.Append(row);
+writer.Flush();
+```
+
+### Reading from Partitioned Log Tables
+
+For partitioned tables, use partition-aware subscribe methods.
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+fluss::LogScanner scanner;
+table.NewScan().CreateLogScanner(scanner);
+
+// Subscribe to individual partitions (partition_infos comes from admin.ListPartitionInfos; see "Managing Partitions" below)
+for (const auto& pi : partition_infos) {
+    scanner.SubscribePartitionBuckets(pi.partition_id, 0, 0);
+}
+
+fluss::ScanRecords records;
+scanner.Poll(5000, records);
+
+for (const auto& rec : records) {
+    std::cout << "bucket_id=" << rec.bucket_id
+              << " offset=" << rec.offset << std::endl;
+}
+
+// Or batch-subscribe to all partitions at once
+fluss::LogScanner batch_scanner;
+table.NewScan().CreateLogScanner(batch_scanner);
+
+std::vector<fluss::PartitionBucketSubscription> subs;
+for (const auto& pi : partition_infos) {
+    subs.push_back({pi.partition_id, 0, 0});
+}
+batch_scanner.SubscribePartitionBuckets(subs);
+```
+
+**Unsubscribe from a partition bucket:**
+
+```cpp
+// Stop receiving records from a specific partition bucket
+scanner.UnsubscribePartition(partition_infos[0].partition_id, 0);
+```
+
+### Managing Partitions
+
+```cpp
+// Create a partition
+admin.CreatePartition(table_path, {{"dt", "2024-01-15"}, {"region", "US"}}, true);
+
+// List partitions
+std::vector<fluss::PartitionInfo> partition_infos;
+admin.ListPartitionInfos(table_path, partition_infos);
+
+// Query partition offsets
+std::vector<int32_t> bucket_ids = {0, 1, 2};
+std::unordered_map<int32_t, int64_t> offsets;
+admin.ListPartitionOffsets(table_path, "2024-01-15$US",
+                           bucket_ids, fluss::OffsetSpec::Latest(), offsets);
+```
+
+## Partitioned Primary Key Tables
+
+Partitioned KV tables combine partitioning with primary key operations. Partition columns must be part of the primary key.
+
+### Creating a Partitioned Primary Key Table
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("user_id", fluss::DataType::Int())
+    .AddColumn("region", fluss::DataType::String())
+    .AddColumn("zone", fluss::DataType::BigInt())
+    .AddColumn("score", fluss::DataType::BigInt())
+    .SetPrimaryKeys({"user_id", "region", "zone"})
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetPartitionKeys({"region", "zone"})
+    .SetBucketCount(3)
+    .Build();
+
+fluss::TablePath table_path("fluss", "partitioned_users");
+admin.CreateTable(table_path, descriptor, true);
+```
+
+### Writing to Partitioned Primary Key Tables
+
+**Partitions must exist before upserting data; otherwise, the client will by default retry indefinitely.**
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+// Create partitions first
+admin.CreatePartition(table_path, {{"region", "APAC"}, {"zone", "1"}}, true);
+admin.CreatePartition(table_path, {{"region", "EMEA"}, {"zone", "2"}}, true);
+admin.CreatePartition(table_path, {{"region", "US"}, {"zone", "3"}}, true);
+
+fluss::UpsertWriter writer;
+table.NewUpsert().CreateWriter(writer);
+
+auto row = table.NewRow();
+row.Set("user_id", 1001);
+row.Set("region", "APAC");
+row.Set("zone", static_cast<int64_t>(1));
+row.Set("score", static_cast<int64_t>(1234));
+writer.Upsert(row);
+writer.Flush();
+```
+
+### Looking Up Records in Partitioned Tables
+
+Lookup requires all primary key columns including partition columns.
+
+> **Note:** Scanning partitioned primary key tables is not supported. Use lookup operations instead.
+
+```cpp
+fluss::Lookuper lookuper;
+table.NewLookup().CreateLookuper(lookuper);
+
+auto pk = table.NewRow();
+pk.Set("user_id", 1001);
+pk.Set("region", "APAC");
+pk.Set("zone", static_cast<int64_t>(1));
+
+fluss::LookupResult result;
+lookuper.Lookup(pk, result);
+if (result.Found()) {
+    std::cout << "score=" << result.GetInt64(3) << std::endl;
+}
+```
diff --git a/website/docs/apis/cpp/example/primary-key-tables.md b/website/docs/apis/cpp/example/primary-key-tables.md
new file mode 100644
index 0000000000..f26b5477a7
--- /dev/null
+++ b/website/docs/apis/cpp/example/primary-key-tables.md
@@ -0,0 +1,132 @@
+---
+sidebar_position: 5
+---
+# Primary Key Tables
+
+Primary key tables (KV tables) support upsert, delete, and lookup operations.
+
+## Creating a Primary Key Table
+
+```cpp
+auto schema = fluss::Schema::NewBuilder()
+    .AddColumn("id", fluss::DataType::Int())
+    .AddColumn("name", fluss::DataType::String())
+    .AddColumn("age", fluss::DataType::BigInt())
+    .SetPrimaryKeys({"id"})
+    .Build();
+
+auto descriptor = fluss::TableDescriptor::NewBuilder()
+    .SetSchema(schema)
+    .SetBucketCount(3)
+    .Build();
+
+fluss::TablePath table_path("fluss", "users");
+admin.CreateTable(table_path, descriptor, true);
+```
+
+## Upserting Records
+
+```cpp
+fluss::Table table;
+conn.GetTable(table_path, table);
+
+fluss::UpsertWriter upsert_writer;
+table.NewUpsert().CreateWriter(upsert_writer);
+
+// Fire-and-forget upserts
+{
+    auto row = table.NewRow();
+    row.Set("id", 1);
+    row.Set("name", "Alice");
+    row.Set("age", static_cast<int64_t>(25));
+    upsert_writer.Upsert(row);
+}
+{
+    auto row = table.NewRow();
+    row.Set("id", 2);
+    row.Set("name", "Bob");
+    row.Set("age", static_cast<int64_t>(30));
+    upsert_writer.Upsert(row);
+}
+upsert_writer.Flush();
+
+// Per-record acknowledgment
+{
+    auto row = table.NewRow();
+    row.Set("id", 3);
+    row.Set("name", "Charlie");
+    row.Set("age", static_cast<int64_t>(35));
+    fluss::WriteResult wr;
+    upsert_writer.Upsert(row, wr);
+    wr.Wait();
+}
+```
+
+## Updating Records
+
+Upsert with the same primary key to update an existing record.
+
+```cpp
+auto row = table.NewRow();
+row.Set("id", 1);
+row.Set("name", "Alice Updated");
+row.Set("age", static_cast<int64_t>(26));
+fluss::WriteResult wr;
+upsert_writer.Upsert(row, wr);
+wr.Wait();
+```
+
+## Deleting Records
+
+```cpp
+auto pk_row = table.NewRow();
+pk_row.Set("id", 2);
+fluss::WriteResult wr;
+upsert_writer.Delete(pk_row, wr);
+wr.Wait();
+```
+
+## Partial Updates
+
+Update only specific columns while preserving others.
+
+```cpp
+// By column names
+fluss::UpsertWriter partial_writer;
+table.NewUpsert()
+    .PartialUpdateByName({"id", "age"})
+    .CreateWriter(partial_writer);
+
+auto row = table.NewRow();
+row.Set("id", 1);
+row.Set("age", static_cast<int64_t>(27));
+fluss::WriteResult wr;
+partial_writer.Upsert(row, wr);
+wr.Wait();
+
+// By column indices
+fluss::UpsertWriter partial_writer_idx;
+table.NewUpsert()
+    .PartialUpdateByIndex({0, 2})
+    .CreateWriter(partial_writer_idx);
+```
+
+## Looking Up Records
+
+```cpp
+fluss::Lookuper lookuper;
+table.NewLookup().CreateLookuper(lookuper);
+
+auto pk_row = table.NewRow();
+pk_row.Set("id", 1);
+
+fluss::LookupResult result;
+lookuper.Lookup(pk_row, result);
+
+if (result.Found()) {
+    std::cout << "Found: name=" << result.GetString(1)
+              << ", age=" << result.GetInt64(2) << std::endl;
+} else {
+    std::cout << "Not found" << std::endl;
+}
+```
diff --git a/website/docs/apis/cpp/installation.md b/website/docs/apis/cpp/installation.md
new file mode 100644
index 0000000000..6360da4369
--- /dev/null
+++ b/website/docs/apis/cpp/installation.md
@@ -0,0 +1,107 @@
+---
+sidebar_position: 1
+---
+# Installation
+
+The C++ bindings are not yet published as a package. You need to build from source.
+
+**Prerequisites:** CMake 3.22+, C++17 compiler, Rust 1.85+, Apache Arrow C++ library
+
+```bash
+git clone https://github.com/apache/fluss-rust.git
+cd fluss-rust
+```
+
+Install dependencies:
+
+```bash
+# macOS
+brew install cmake arrow
+
+# Ubuntu/Debian
+sudo apt-get install cmake libarrow-dev
+```
+
+If Arrow is not available via package manager, build from source:
+
+```bash
+git clone https://github.com/apache/arrow.git
+cd arrow/cpp
+cmake -B build -DARROW_BUILD_SHARED=ON
+cmake --build build
+sudo cmake --install build
+```
+
+Build the C++ bindings:
+
+```bash
+cd bindings/cpp
+mkdir -p build && cd build
+
+# Debug mode
+cmake ..
+
+# Or Release mode
+cmake -DCMAKE_BUILD_TYPE=Release ..
+
+# Build
+cmake --build .
+```
+
+This produces:
+- `libfluss_cpp.a` (Static library)
+- `fluss_cpp_example` (Example executable)
+- Header files in `include/`
+
+## Integrating into Your Project
+
+**Option 1: CMake FetchContent**
+
+```cmake
+include(FetchContent)
+FetchContent_Declare(
+    fluss-cpp
+    GIT_REPOSITORY https://github.com/apache/fluss-rust.git
+    SOURCE_SUBDIR bindings/cpp
+)
+FetchContent_MakeAvailable(fluss-cpp)
+
+target_link_libraries(your_target PRIVATE fluss_cpp)
+```
+
+**Option 2: Manual Integration**
+
+Copy the build artifacts and configure CMake:
+
+```cmake
+find_package(Arrow REQUIRED)
+find_package(Threads REQUIRED)
+add_library(fluss_cpp STATIC IMPORTED)
+set_target_properties(fluss_cpp PROPERTIES
+    IMPORTED_LOCATION ${CMAKE_SOURCE_DIR}/lib/libfluss_cpp.a
+    INTERFACE_INCLUDE_DIRECTORIES ${CMAKE_SOURCE_DIR}/include
+)
+
+target_link_libraries(your_target
+    PRIVATE
+    fluss_cpp
+    Arrow::arrow_shared
+    ${CMAKE_DL_LIBS}
+    Threads::Threads
+)
+
+# On macOS, also link these frameworks
+if(APPLE)
+    target_link_libraries(your_target PRIVATE
+        "-framework CoreFoundation"
+        "-framework Security"
+    )
+endif()
+```
+
+**Option 3: Subdirectory**
+
+```cmake
+add_subdirectory(vendor/fluss-rust/bindings/cpp)
+target_link_libraries(your_target PRIVATE fluss_cpp)
+```
diff --git a/website/docs/apis/index.md b/website/docs/apis/index.md
new file mode 100644
index 0000000000..342782883c
--- /dev/null
+++ b/website/docs/apis/index.md
@@ -0,0 +1,42 @@
+---
+sidebar_position: 1
+title: Introduction
+---
+
+# Introduction
+
+[Apache Fluss](https://fluss.apache.org/) (incubating) is a streaming storage system built for real-time analytics, serving as the real-time data layer for Lakehouse architectures.
+
+This documentation covers the **Fluss client libraries** for [Java](./java/index.md), Rust, Python, and C++, which are developed in the [Apache Fluss](https://github.com/apache/fluss) repository. These clients allow you to:
+
+- **Create and manage** databases, tables, and partitions
+- **Write** data to log tables (append-only) and primary key tables (upsert/delete)
+- **Read** data via log scanning and key lookups
+- **Integrate** with the broader Fluss ecosystem including lakehouse snapshots
+
+## Prerequisites
+
+You need a running Fluss cluster to use any of the client libraries. See the [Deploying a Local Cluster](https://fluss.apache.org/docs/install-deploy/deploying-local-cluster/) guide to get started.
+
+## Key Concepts
+
+- **Log table** — an append-only table (no primary key). Records are immutable once written. Use for event streams, logs, and audit trails.
+  - **Offset** — the position of a record within a log table's bucket. Used to track reading progress. Start from `EARLIEST_OFFSET` to read all data, or resolve the current latest offset via `list_offsets` to only read new records.
+- **Primary key (PK) table** — a table with a primary key. Supports upsert, delete, and point lookups.
+- **Bucket** — the unit of parallelism within a table (similar to Kafka partitions). Each table has one or more buckets. Readers subscribe to individual buckets.
+- **Partition** — a way to organize data by column values (e.g. by date or region). Each partition contains its own set of buckets. Partitions must be created explicitly before writing.
+
+## Client Overview
+
+|                        | Rust                                                       | Python                   | C++                                            |
+|------------------------|------------------------------------------------------------|--------------------------|------------------------------------------------|
+| **Package**            | [fluss-rs](https://crates.io/crates/fluss-rs) on crates.io | Build from source (PyO3) | Build from source (CMake)                      |
+| **Async runtime**      | Tokio                                                      | asyncio                  | Synchronous (Tokio runtime managed internally) |
+| **Data format**        | Arrow RecordBatch / GenericRow                             | PyArrow / Pandas / dict  | Arrow RecordBatch / GenericRow                 |
+| **Log tables**         | Read + Write                                               | Read + Write             | Read + Write                                   |
+| **Primary key tables** | Upsert + Delete + Lookup                                   | Upsert + Delete + Lookup | Upsert + Delete + Lookup                       |
+| **Partitioned tables** | Read + Write                                               | Read + Write             | Read + Write                                   |
+
+## How This Guide Is Organised
+
+These guides walk through installation, configuration, and working with each table type. Code examples for Rust, Python, and C++ are shown side by side; the Java client has its own comprehensive guide.
diff --git a/website/docs/apis/java/_category_.json b/website/docs/apis/java/_category_.json
new file mode 100644
index 0000000000..5d19ed2ea3
--- /dev/null
+++ b/website/docs/apis/java/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Java",
+  "position": 2
+}
diff --git a/website/docs/apis/java-client.md b/website/docs/apis/java/index.md
similarity index 100%
rename from website/docs/apis/java-client.md
rename to website/docs/apis/java/index.md
diff --git a/website/docs/apis/python-client.md b/website/docs/apis/python-client.md
deleted file mode 100644
index 4f81ab833d..0000000000
--- a/website/docs/apis/python-client.md
+++ /dev/null
@@ -1,45 +0,0 @@
----
-title: "Python Client"
-sidebar_position: 2
----
-
-# Fluss Python Client
-
-The Fluss Python Client provides a high-performance, asynchronous interface for
-interacting with Fluss clusters. Built on top of the Rust core via
-[PyO3](https://pyo3.rs/), it leverages PyArrow for efficient data interchange
-and supports idiomatic integration with Pandas.
-
-The client provides two main APIs:
-
-- **[Admin API](https://clients.fluss.apache.org/user-guide/python/api-reference#flussadmin)**: For managing databases, tables, and partitions.
-- **[Table API](https://clients.fluss.apache.org/user-guide/python/api-reference#flusstable)**: For reading and writing to Log and Primary Key tables
-
-## Installation
-```bash
-pip install pyfluss
-```
-
-## Quick Example
-```python
-import asyncio
-import fluss
-
-async def main():
-    config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
-    conn = await fluss.FlussConnection.create(config)
-    async with conn:
-        admin = await conn.get_admin()
-        databases = await admin.list_databases()
-        print(f"Available databases: {databases}")
-
-if __name__ == "__main__":
-    asyncio.run(main())
-```
-For more examples, see [Fluss Python Client documentation](https://clients.fluss.apache.org/user-guide/python/example/).
-
-## Full Documentation
-
-For the complete Python client reference including all configuration options,
-API methods, data types, error handling, and worked examples — see the
-**[Fluss Python Client documentation](https://clients.fluss.apache.org/user-guide/python/installation)**.
\ No newline at end of file
diff --git a/website/docs/apis/python/_category_.json b/website/docs/apis/python/_category_.json
new file mode 100644
index 0000000000..5775bfc99b
--- /dev/null
+++ b/website/docs/apis/python/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Python",
+  "position": 4
+}
diff --git a/website/docs/apis/python/api-reference.md b/website/docs/apis/python/api-reference.md
new file mode 100644
index 0000000000..9bf0b6902f
--- /dev/null
+++ b/website/docs/apis/python/api-reference.md
@@ -0,0 +1,389 @@
+---
+sidebar_position: 2
+---
+# API Reference
+
+Complete API reference for the Fluss Python client.
+
+## `Config`
+
+| Method / Property                     | Config Key                            | Description                                                                             |
+|---------------------------------------|---------------------------------------|-----------------------------------------------------------------------------------------|
+| `Config(properties: dict = None)`     |                                       | Create config from a dict of key-value pairs                                            |
+| `bootstrap_servers`                   | `bootstrap.servers`                   | Get/set coordinator server address                                                      |
+| `writer_request_max_size`             | `writer.request-max-size`             | Get/set max request size in bytes                                                       |
+| `writer_acks`                         | `writer.acks`                         | Get/set acknowledgment setting (`"all"` for all replicas)                               |
+| `writer_retries`                      | `writer.retries`                      | Get/set number of retries on failure                                                    |
+| `writer_batch_size`                   | `writer.batch-size`                   | Get/set write batch size in bytes. Upper bound when dynamic sizing is on; fixed batch size when off |
+| `writer_dynamic_batch_size_enabled`   | `writer.dynamic-batch-size.enabled`   | Get/set whether the per-table dynamic batch size estimator is enabled (default `true`)  |
+| `writer_dynamic_batch_size_min`       | `writer.dynamic-batch-size-min`       | Get/set the lower bound for the dynamic batch size estimator (default 256 KB; ignored when disabled) |
+| `writer_batch_timeout_ms`             | `writer.batch-timeout-ms`             | Get/set max time in ms to wait for a writer batch to fill up before sending             |
+| `writer_bucket_no_key_assigner`       | `writer.bucket.no-key-assigner`       | Get/set bucket assignment strategy (`"sticky"` or `"round_robin"`)                      |
+| `scanner_remote_log_prefetch_num`     | `scanner.remote-log.prefetch-num`     | Get/set number of remote log segments to prefetch                                       |
+| `remote_file_download_thread_num`     | `remote-file.download-thread-num`     | Get/set number of threads for remote log downloads                                      |
+| `scanner_remote_log_read_concurrency` | `scanner.remote-log.read-concurrency` | Get/set streaming read concurrency within a remote log file                             |
+| `scanner_log_max_poll_records`        | `scanner.log.max-poll-records`        | Get/set max number of records returned in a single poll()                               |
+| `scanner_log_fetch_max_bytes`         | `scanner.log.fetch.max-bytes`         | Get/set maximum bytes per fetch response for LogScanner                                 |
+| `scanner_log_fetch_min_bytes`         | `scanner.log.fetch.min-bytes`         | Get/set minimum bytes the server must accumulate before returning a fetch response      |
+| `scanner_log_fetch_wait_max_time_ms`  | `scanner.log.fetch.wait-max-time-ms`  | Get/set maximum time (ms) the server may wait to satisfy min-bytes                      |
+| `scanner_log_fetch_max_bytes_for_bucket` | `scanner.log.fetch.max-bytes-for-bucket` | Get/set maximum bytes per fetch response per bucket for LogScanner                |
+| `connect_timeout_ms`                  | `connect-timeout`                     | Get/set TCP connect timeout in milliseconds                                             |
+| `security_protocol`                   | `security.protocol`                   | Get/set security protocol (`"PLAINTEXT"` or `"sasl"`)                                   |
+| `security_sasl_mechanism`             | `security.sasl.mechanism`             | Get/set SASL mechanism (only `"PLAIN"` is supported)                                    |
+| `security_sasl_username`              | `security.sasl.username`              | Get/set SASL username (required when protocol is `"sasl"`)                              |
+| `security_sasl_password`              | `security.sasl.password`              | Get/set SASL password (required when protocol is `"sasl"`)                              |
+
+## `FlussConnection`
+
+| Method                                                    |  Description                          |
+|-----------------------------------------------------------|---------------------------------------|
+| `await FlussConnection.create(config) -> FlussConnection` | Connect to a Fluss cluster            |
+| `conn.get_admin() -> FlussAdmin`                        | Get admin interface                   |
+| `await conn.get_table(table_path) -> FlussTable`          | Get a table for read/write operations |
+| `await conn.close()`                                      | Close the connection                  |
+
+Supports `async with` statement (async context manager).
+
+## `FlussAdmin`
+
+| Method                                                                                                                |  Description                          |
+|-----------------------------------------------------------------------------------------------------------------------|---------------------------------------|
+| `await create_database(name, database_descriptor=None, ignore_if_exists=False)`                                       | Create a database                     |
+| `await drop_database(name, ignore_if_not_exists=False, cascade=True)`                                                 | Drop a database                       |
+| `await list_databases() -> list[str]`                                                                                 | List all databases                    |
+| `await database_exists(name) -> bool`                                                                                 | Check if a database exists            |
+| `await get_database_info(name) -> DatabaseInfo`                                                                       | Get database metadata                 |
+| `await create_table(table_path, table_descriptor, ignore_if_exists=False)`                                            | Create a table                        |
+| `await drop_table(table_path, ignore_if_not_exists=False)`                                                            | Drop a table                          |
+| `await get_table_info(table_path) -> TableInfo`                                                                       | Get table metadata                    |
+| `await list_tables(database_name) -> list[str]`                                                                       | List tables in a database             |
+| `await table_exists(table_path) -> bool`                                                                              | Check if a table exists               |
+| `await list_offsets(table_path, bucket_ids, offset_spec) -> dict[int, int]`                           | Get offsets for buckets               |
+| `await list_partition_offsets(table_path, partition_name, bucket_ids, offset_spec) -> dict[int, int]` | Get offsets for a partition's buckets |
+| `await create_partition(table_path, partition_spec, ignore_if_exists=False)`                                          | Create a partition                    |
+| `await drop_partition(table_path, partition_spec, ignore_if_not_exists=False)`                                        | Drop a partition                      |
+| `await list_partition_infos(table_path) -> list[PartitionInfo]`                                                       | List partitions                       |
+| `await get_latest_lake_snapshot(table_path) -> LakeSnapshot`                                                          | Get latest lake snapshot              |
+| `await get_server_nodes() -> list[ServerNode]`                                                                        | Get all alive server nodes            |
+
+## `ServerNode`
+
+| Property                 | Description                                                |
+|--------------------------|------------------------------------------------------------|
+| `.id -> int`             | Server node ID                                             |
+| `.host -> str`           | Hostname of the server                                     |
+| `.port -> int`           | Port number                                                |
+| `.server_type -> str`    | Server type (`"CoordinatorServer"` or `"TabletServer"`)    |
+| `.uid -> str`            | Unique identifier (e.g. `"cs-0"`, `"ts-1"`)               |
+
+## `FlussTable`
+
+| Method                          |  Description                            |
+|---------------------------------|-----------------------------------------|
+| `new_scan() -> TableScan`       | Create a scan builder                   |
+| `new_append() -> TableAppend`   | Create an append builder for log tables |
+| `new_upsert() -> TableUpsert`   | Create an upsert builder for PK tables  |
+| `new_lookup() -> TableLookup`   | Create a lookup builder for PK tables   |
+| `get_table_info() -> TableInfo` | Get table metadata                      |
+| `get_table_path() -> TablePath` | Get table path                          |
+| `has_primary_key() -> bool`     | Check if table has a primary key        |
+
+## `TableScan`
+
+| Method                                                   |  Description                                                        |
+|----------------------------------------------------------|---------------------------------------------------------------------|
+| `.project(indices) -> TableScan`                         | Project columns by index                                            |
+| `.project_by_name(names) -> TableScan`                   | Project columns by name                                             |
+| `await .create_log_scanner() -> LogScanner`              | Create record-based scanner (for `poll()`)                          |
+| `await .create_record_batch_log_scanner() -> LogScanner` | Create batch-based scanner (for `poll_arrow()`, `to_arrow()`, etc.) |
+
+## `TableAppend`
+
+Builder for creating an `AppendWriter`. Obtain via `FlussTable.new_append()`.
+
+| Method                             |  Description             |
+|------------------------------------|--------------------------|
+| `.create_writer() -> AppendWriter` | Create the append writer |
+
+## `TableUpsert`
+
+Builder for creating an `UpsertWriter`. Obtain via `FlussTable.new_upsert()`.
+
+| Method                                             |  Description                               |
+|----------------------------------------------------|--------------------------------------------|
+| `.partial_update_by_name(columns) -> TableUpsert`  | Configure partial update by column names   |
+| `.partial_update_by_index(indices) -> TableUpsert` | Configure partial update by column indices |
+| `.create_writer() -> UpsertWriter`                 | Create the upsert writer                   |
+
+## `TableLookup`
+
+Builder for creating a `Lookuper` or `PrefixLookuper`. Obtain via `FlussTable.new_lookup()`.
+
+| Method                                              |  Description                              |
+|-----------------------------------------------------|-------------------------------------------|
+| `.create_lookuper() -> Lookuper`                    | Create a primary key lookuper             |
+| `.lookup_by(column_names) -> TablePrefixLookup`     | Switch to prefix-scan mode for the given columns (partition keys + bucket keys) |
+
+## `TablePrefixLookup`
+
+Builder for creating a `PrefixLookuper`. Obtain via `TableLookup.lookup_by(columns)`.
+
+| Method                                     |  Description              |
+|--------------------------------------------|---------------------------|
+| `.create_lookuper() -> PrefixLookuper`     | Create the prefix lookuper |
+
+## `AppendWriter`
+
+| Method                                           |  Description                        |
+|--------------------------------------------------|-------------------------------------|
+| `.append(row) -> WriteResultHandle`              | Append a row (dict, list, or tuple) |
+| `.write_arrow(table)`                            | Write a PyArrow Table               |
+| `.write_arrow_batch(batch) -> WriteResultHandle` | Write a PyArrow RecordBatch         |
+| `.write_pandas(df)`                              | Write a Pandas DataFrame            |
+| `await .flush()`                                 | Flush all pending writes            |
+
+## `UpsertWriter`
+
+| Method                              |  Description                          |
+|-------------------------------------|---------------------------------------|
+| `.upsert(row) -> WriteResultHandle` | Upsert a row (insert or update by PK) |
+| `.delete(pk) -> WriteResultHandle`  | Delete a row by primary key           |
+| `await .flush()`                    | Flush all pending operations          |
+
+## `WriteResultHandle`
+
+| Method          |  Description                                 |
+|-----------------|----------------------------------------------|
+| `await .wait()` | Wait for server acknowledgment of this write |
+
+## `Lookuper`
+
+| Method                              |  Description                |
+|-------------------------------------|-----------------------------|
+| `await .lookup(pk) -> dict \| None` | Lookup a row by primary key |
+
+## `PrefixLookuper`
+
+| Method                                        |  Description                                |
+|-----------------------------------------------|---------------------------------------------|
+| `await .lookup(prefix) -> list[dict]`         | Lookup all rows matching a prefix key       |
+
+## `LogScanner`
+
+| Method                                                        |  Description                                                                     |
+|---------------------------------------------------------------|----------------------------------------------------------------------------------|
+| `.subscribe(bucket_id, start_offset)`                         | Subscribe to a bucket                                                            |
+| `.subscribe_buckets(bucket_offsets)`                          | Subscribe to multiple buckets (`{bucket_id: offset}`)                            |
+| `.subscribe_partition(partition_id, bucket_id, start_offset)` | Subscribe to a partition bucket                                                  |
+| `.subscribe_partition_buckets(partition_bucket_offsets)`      | Subscribe to multiple partition+bucket combos (`{(part_id, bucket_id): offset}`) |
+| `.unsubscribe(bucket_id)`                                     | Unsubscribe from a bucket (non-partitioned tables)                               |
+| `.unsubscribe_partition(partition_id, bucket_id)`             | Unsubscribe from a partition bucket                                              |
+| `await .poll(timeout_ms) -> ScanRecords`                      | Poll individual records (record scanner only)                                    |
+| `await .poll_arrow(timeout_ms) -> pa.Table`                   | Poll as Arrow Table (batch scanner only)                                         |
+| `await .poll_record_batch(timeout_ms) -> list[RecordBatch]`   | Poll batches with metadata (batch scanner only)                                  |
+| `.to_arrow_batch_reader() -> pa.RecordBatchReader`            | Lazy Arrow RecordBatchReader reading until latest offsets (batch scanner only)    |
+| `await .to_arrow() -> pa.Table`                               | Read all subscribed data as Arrow Table (batch scanner only)                     |
+| `await .to_pandas() -> pd.DataFrame`                          | Read all subscribed data as DataFrame (batch scanner only)                       |
+
+> **Note:** Overlapping `poll_*` / `to_arrow*` / `to_arrow_batch_reader` calls on the same underlying scanner are not supported. Use only one active polling/consumption path at a time.
+
+## `ScanRecords`
+
+Returned by `LogScanner.poll()`. Records are grouped by bucket.
+
+> **Note:** Flat iteration and integer indexing traverse buckets in an arbitrary order that is consistent within a single `ScanRecords` instance but may differ between `poll()` calls. Use per-bucket access (`.items()`, `.records(bucket)`) when bucket ordering matters.
+
+```python
+scan_records = await scanner.poll(timeout_ms=5000)
+
+# Sequence access
+scan_records[0]                              # first record
+scan_records[-1]                             # last record
+scan_records[:5]                             # first 5 records
+
+# Per-bucket access
+for bucket, records in scan_records.items():
+    for record in records:
+        print(f"bucket={bucket.bucket_id}, offset={record.offset}, row={record.row}")
+
+# Flat iteration
+for record in scan_records:
+    print(record.row)
+```
+
+### Methods
+
+| Method                                 |  Description                                                     |
+|----------------------------------------|------------------------------------------------------------------|
+| `.buckets() -> list[TableBucket]`      | List of distinct buckets                                         |
+| `.records(bucket) -> list[ScanRecord]` | Records for a specific bucket (empty list if bucket not present) |
+| `.count() -> int`                      | Total record count across all buckets                            |
+| `.is_empty() -> bool`                  | Check if empty                                                   |
+
+### Indexing
+
+| Expression                   | Returns              | Description                       |
+|------------------------------|----------------------|-----------------------------------|
+| `scan_records[0]`           | `ScanRecord`         | Record by flat index              |
+| `scan_records[-1]`          | `ScanRecord`         | Negative indexing                  |
+| `scan_records[1:5]`         | `list[ScanRecord]`   | Slice                             |
+| `scan_records[bucket]`      | `list[ScanRecord]`   | Records for a bucket              |
+
+### Mapping Protocol
+
+| Method / Protocol              | Description                                     |
+|--------------------------------|-------------------------------------------------|
+| `.keys()`                      | Same as `.buckets()`                            |
+| `.values()`                    | Lazy iterator over record lists, one per bucket |
+| `.items()`                     | Lazy iterator over `(bucket, records)` pairs    |
+| `len(scan_records)`           | Same as `.count()`                              |
+| `bucket in scan_records`      | Membership test                                 |
+| `for record in scan_records`  | Flat iteration over all records                 |
+
+## `ScanRecord`
+
+| Property                     |  Description                                                        |
+|------------------------------|---------------------------------------------------------------------|
+| `.offset -> int`             | Record offset in the log                                            |
+| `.timestamp -> int`          | Record timestamp                                                    |
+| `.change_type -> ChangeType` | Change type (AppendOnly, Insert, UpdateBefore, UpdateAfter, Delete) |
+| `.row -> dict`               | Row data as `{column_name: value}`                                  |
+
+## `RecordBatch`
+
+| Property                   | Description                  |
+|----------------------------|------------------------------|
+| `.batch -> pa.RecordBatch` | Arrow RecordBatch data       |
+| `.bucket -> TableBucket`   | Bucket this batch belongs to |
+| `.base_offset -> int`      | First record offset          |
+| `.last_offset -> int`      | Last record offset           |
+
+## `Schema`
+
+| Method                                         |  Description               |
+|------------------------------------------------|----------------------------|
+| `Schema(schema: pa.Schema, primary_keys=None)` | Create from PyArrow schema. Field nullability (`pa.field(..., nullable=False)`) is preserved. |
+| `.get_column_names() -> list[str]`             | Get column names           |
+| `.get_column_types() -> list[str]`             | Get column type names. Non-nullable types include a `" NOT NULL"` suffix (e.g., `"int NOT NULL"`). |
+| `.get_columns() -> list[tuple[str, str]]`      | Get `(name, type)` pairs. Type strings follow the same nullability formatting as `.get_column_types()`. |
+| `.get_primary_keys() -> list[str]`             | Get primary key columns    |
+
+## `TableDescriptor`
+
+| Method                                                                                                                                                                         | Description             |
+|--------------------------------------------------------------------------------------------------------------------------------------------------------------------------------|-------------------------|
+| `TableDescriptor(schema, *, partition_keys=None, bucket_count=None, bucket_keys=None, comment=None, log_format=None, kv_format=None, properties=None, custom_properties=None)` | Create table descriptor |
+| `.get_schema() -> Schema`                                                                                                                                                      | Get the schema          |
+
+## `TablePath`
+
+| Method / Property            | Description         |
+|------------------------------|---------------------|
+| `TablePath(database, table)` | Create a table path |
+| `.database_name -> str`      | Database name       |
+| `.table_name -> str`         | Table name          |
+
+## `TableInfo`
+
+| Property / Method                    |  Description                |
+|--------------------------------------|-----------------------------|
+| `.table_id -> int`                   | Table ID                    |
+| `.table_path -> TablePath`           | Table path                  |
+| `.num_buckets -> int`                | Number of buckets           |
+| `.schema_id -> int`                  | Schema ID                   |
+| `.comment -> str \| None`            | Table comment               |
+| `.created_time -> int`               | Creation timestamp          |
+| `.modified_time -> int`              | Last modification timestamp |
+| `.get_primary_keys() -> list[str]`   | Primary key columns         |
+| `.get_partition_keys() -> list[str]` | Partition columns           |
+| `.get_bucket_keys() -> list[str]`    | Bucket key columns          |
+| `.has_primary_key() -> bool`         | Has primary key?            |
+| `.is_partitioned() -> bool`          | Is partitioned?             |
+| `.get_schema() -> Schema`            | Get table schema            |
+| `.get_column_names() -> list[str]`   | Column names                |
+| `.get_column_count() -> int`         | Number of columns           |
+| `.get_properties() -> dict`          | All table properties        |
+| `.get_custom_properties() -> dict`   | Custom properties only      |
+
+## `PartitionInfo`
+
+| Property                 |  Description   |
+|--------------------------|----------------|
+| `.partition_id -> int`   | Partition ID   |
+| `.partition_name -> str` | Partition name |
+
+## `DatabaseDescriptor`
+
+| Method / Property                                          | Description       |
+|------------------------------------------------------------|-------------------|
+| `DatabaseDescriptor(comment=None, custom_properties=None)` | Create descriptor |
+| `.comment -> str \| None`                                  | Database comment  |
+| `.get_custom_properties() -> dict`                         | Custom properties |
+
+## `DatabaseInfo`
+
+| Property / Method                                  | Description                 |
+|----------------------------------------------------|-----------------------------|
+| `.database_name -> str`                            | Database name               |
+| `.created_time -> int`                             | Creation timestamp          |
+| `.modified_time -> int`                            | Last modification timestamp |
+| `.get_database_descriptor() -> DatabaseDescriptor` | Get descriptor              |
+
+## `LakeSnapshot`
+
+| Property / Method                                 | Description             |
+|---------------------------------------------------|-------------------------|
+| `.snapshot_id -> int`                             | Snapshot ID             |
+| `.table_buckets_offset -> dict[TableBucket, int]` | All bucket offsets      |
+| `.get_bucket_offset(bucket) -> int \| None`       | Get offset for a bucket |
+| `.get_table_buckets() -> list[TableBucket]`       | Get all buckets         |
+
+## `TableBucket`
+
+| Method / Property                                            | Description                            |
+|--------------------------------------------------------------|----------------------------------------|
+| `TableBucket(table_id, bucket)`                              | Create non-partitioned bucket          |
+| `TableBucket.with_partition(table_id, partition_id, bucket)` | Create partitioned bucket              |
+| `.table_id -> int`                                           | Table ID                               |
+| `.bucket_id -> int`                                          | Bucket ID                              |
+| `.partition_id -> int \| None`                               | Partition ID (None if non-partitioned) |
+
+## `FlussError`
+
+| Property             | Description                                                                         |
+|----------------------|-------------------------------------------------------------------------------------|
+| `.message -> str`    | Error message                                                                       |
+| `.error_code -> int` | Error code (`ErrorCode.CLIENT_ERROR` for client-side errors, server code otherwise) |
+
+Raised for all Fluss-specific errors (connection failures, table not found, schema mismatches, etc.). Inherits from `Exception`. See [Error Handling](./error-handling.md) for details on matching specific error codes.
+
+## Constants
+
+| Constant                     | Value         | Description                                         |
+|------------------------------|---------------|-----------------------------------------------------|
+| `fluss.EARLIEST_OFFSET`      | `-2`          | Start reading from earliest available offset        |
+
+## `OffsetSpec`
+
+| Method                      | Description                                      |
+|-----------------------------|--------------------------------------------------|
+| `OffsetSpec.earliest()`     | Earliest available offset                        |
+| `OffsetSpec.latest()`       | Latest offset                                    |
+| `OffsetSpec.timestamp(ts)`  | Offset at or after the given timestamp (millis)  |
+
+To start reading from the latest offset (only new records), resolve the current offset via `list_offsets` before subscribing:
+
+```python
+offsets = await admin.list_offsets(table_path, [0], fluss.OffsetSpec.latest())
+scanner.subscribe(bucket_id=0, start_offset=offsets[0])
+```
+
+## `ChangeType`
+
+| Value                         | Short String | Description                   |
+|-------------------------------|--------------|-------------------------------|
+| `ChangeType.AppendOnly` (0)   | `+A`         | Append-only                   |
+| `ChangeType.Insert` (1)       | `+I`         | Insert                        |
+| `ChangeType.UpdateBefore` (2) | `-U`         | Previous value of updated row |
+| `ChangeType.UpdateAfter` (3)  | `+U`         | New value of updated row      |
+| `ChangeType.Delete` (4)       | `-D`         | Delete                        |
diff --git a/website/docs/apis/python/data-types.md b/website/docs/apis/python/data-types.md
new file mode 100644
index 0000000000..8e4371e216
--- /dev/null
+++ b/website/docs/apis/python/data-types.md
@@ -0,0 +1,95 @@
+---
+sidebar_position: 3
+---
+# Data Types
+
+The Python client uses PyArrow types for schema definitions:
+
+| PyArrow Type                                    | Fluss Type                        | Python Type         |
+|-------------------------------------------------|-----------------------------------|---------------------|
+| `pa.bool_()`                                    | Boolean                           | `bool`              |
+| `pa.int8()` / `int16()` / `int32()` / `int64()` | TinyInt / SmallInt / Int / BigInt | `int`               |
+| `pa.float32()` / `float64()`                    | Float / Double                    | `float`             |
+| `pa.string()`                                   | String                            | `str`               |
+| `pa.binary()`                                   | Bytes                             | `bytes`             |
+| `pa.binary(n)`                                  | Binary(n)                         | `bytes`             |
+| `pa.date32()`                                   | Date                              | `datetime.date`     |
+| `pa.time32("ms")`                               | Time                              | `datetime.time`     |
+| `pa.timestamp("us")`                            | Timestamp (NTZ)                   | `datetime.datetime` |
+| `pa.timestamp("us", tz="UTC")`                  | TimestampLTZ                      | `datetime.datetime` |
+| `pa.decimal128(precision, scale)`               | Decimal                           | `decimal.Decimal`   |
+| `pa.list_(type)`                                  | Array                             | `list`              |
+
+All Python native types (`date`, `time`, `datetime`, `Decimal`) work when appending rows via dicts.
+
+## Nullability
+
+PyArrow field nullability is preserved when constructing Fluss schemas. By default, fields are nullable. Use `nullable=False` on `pa.field()` to create a `NOT NULL` column:
+
+```python
+schema = pa.schema([
+    pa.field("id", pa.int32(), nullable=False),
+    pa.field("name", pa.string()),          # nullable by default
+])
+fluss_schema = fluss.Schema(schema)
+fluss_schema.get_column_types()  # ["int NOT NULL", "string"]
+```
+
+Primary key columns are automatically forced `NOT NULL` regardless of the PyArrow field setting.
+
+For nested types, element nullability is also preserved:
+
+```python
+schema = pa.schema([
+    pa.field("tags", pa.list_(pa.field("item", pa.string(), nullable=False))),
+])
+fluss_schema = fluss.Schema(schema)
+fluss_schema.get_column_types()  # ["array<string NOT NULL>"]
+```
+
+## Writing Data
+
+Rows can be dicts, lists, or tuples:
+
+```python
+from datetime import date, time, datetime
+from decimal import Decimal
+
+row = {
+    "user_id": 1,
+    "name": "Alice",
+    "active": True,
+    "score": 95.5,
+    "balance": Decimal("1234.56"),
+    "birth_date": date(1990, 3, 15),
+    "login_time": time(9, 30, 0),
+    "created_at": datetime(2024, 1, 1, 0, 0, 0),
+    "nickname": None,  # null value
+    "tags": ["active", "premium"],  # Array of strings
+    "scores": [10, None, 30],       # Array with null values
+}
+handle = writer.append(row)
+```
+
+Lists and tuples must have values in column order:
+
+```python
+row = [1, "Alice", True, 95.5, Decimal("1234.56"), date(1990, 3, 15), time(9, 30, 0), datetime(2024, 1, 1), None, ["active", "premium"], [10, None, 30]]
+handle = writer.append(row)
+```
+
+## Reading Data
+
+```python
+records = await scanner.poll(timeout_ms=1000)
+for record in records:
+    row = record.row  # dict[str, Any]
+    print(row["user_id"])     # int
+    print(row["name"])        # str
+    print(row["balance"])     # decimal.Decimal
+    print(row["birth_date"])  # datetime.date
+    print(row["created_at"])  # datetime.datetime
+
+    if row["nickname"] is None:
+        print("nickname is null")
+```
diff --git a/website/docs/apis/python/error-handling.md b/website/docs/apis/python/error-handling.md
new file mode 100644
index 0000000000..5bef366516
--- /dev/null
+++ b/website/docs/apis/python/error-handling.md
@@ -0,0 +1,168 @@
+---
+sidebar_position: 4
+---
+# Error Handling
+
+The client raises `fluss.FlussError` for all Fluss-specific errors. Each error carries a `message` and an `error_code`.
+
+## Basic Usage
+
+```python
+import fluss
+
+try:
+    await admin.create_table(table_path, table_descriptor)
+except fluss.FlussError as e:
+    print(f"Error (code {e.error_code}): {e.message}")
+```
+
+## Error Codes
+
+Server-side errors carry a specific error code (>0 or -1). Client-side errors (connection failures, type mismatches, etc.) use `ErrorCode.CLIENT_ERROR` (-2). Use `fluss.ErrorCode` to match on specific codes:
+
+```python
+import fluss
+
+try:
+    await admin.drop_table(table_path)
+except fluss.FlussError as e:
+    if e.error_code == fluss.ErrorCode.TABLE_NOT_EXIST:
+        print("Table does not exist")
+    elif e.error_code == fluss.ErrorCode.PARTITION_NOT_EXISTS:
+        print("Partition does not exist")
+    elif e.error_code == fluss.ErrorCode.CLIENT_ERROR:
+        print(f"Client-side error: {e.message}")
+    else:
+        print(f"Server error (code {e.error_code}): {e.message}")
+```
+
+### Common Error Codes
+
+| Constant                                     | Code | Description                         |
+|----------------------------------------------|------|-------------------------------------|
+| `ErrorCode.CLIENT_ERROR`                     | -2   | Client-side error (not from server) |
+| `ErrorCode.UNKNOWN_SERVER_ERROR`             | -1   | Unexpected server error             |
+| `ErrorCode.NETWORK_EXCEPTION`                | 1    | Server disconnected before response |
+| `ErrorCode.DATABASE_NOT_EXIST`               | 4    | Database does not exist             |
+| `ErrorCode.DATABASE_ALREADY_EXIST`           | 6    | Database already exists             |
+| `ErrorCode.TABLE_NOT_EXIST`                  | 7    | Table does not exist                |
+| `ErrorCode.TABLE_ALREADY_EXIST`              | 8    | Table already exists                |
+| `ErrorCode.INVALID_TABLE_EXCEPTION`          | 15   | Invalid table operation             |
+| `ErrorCode.REQUEST_TIME_OUT`                 | 25   | Request timed out                   |
+| `ErrorCode.PARTITION_NOT_EXISTS`             | 36   | Partition does not exist            |
+| `ErrorCode.PARTITION_ALREADY_EXISTS`         | 42   | Partition already exists            |
+| `ErrorCode.PARTITION_SPEC_INVALID_EXCEPTION` | 43   | Invalid partition spec              |
+| `ErrorCode.LEADER_NOT_AVAILABLE_EXCEPTION`   | 44   | No leader available for partition   |
+| `ErrorCode.AUTHENTICATE_EXCEPTION`           | 46   | Authentication failed (bad credentials) |
+
+See `fluss.ErrorCode` for the full list of named constants.
+
+## Retry Logic
+
+Some errors are transient: the server may be temporarily unavailable, in the middle of a leader election, or under heavy load. Use `is_retriable` to decide whether to retry an operation instead of treating the error as permanent.
+
+`FlussError.is_retriable` is a property available directly on the exception:
+
+```python
+import fluss
+
+try:
+    await writer.append(row).wait()
+except fluss.FlussError as e:
+    if e.is_retriable:
+        # Transient failure — safe to retry
+        pass
+    else:
+        # Permanent failure — log and abort
+        print(f"Fatal error (code {e.error_code}): {e.message}")
+```
+
+### Retriable Error Codes
+
+| Constant                                                     | Code | Reason                                    |
+|--------------------------------------------------------------|------|-------------------------------------------|
+| `ErrorCode.NETWORK_EXCEPTION`                               | 1    | Server disconnected                       |
+| `ErrorCode.CORRUPT_MESSAGE`                                 | 3    | CRC or size error                         |
+| `ErrorCode.SCHEMA_NOT_EXIST`                                | 9    | Schema may not exist                      |
+| `ErrorCode.LOG_STORAGE_EXCEPTION`                           | 10   | Transient log storage error               |
+| `ErrorCode.KV_STORAGE_EXCEPTION`                            | 11   | Transient KV storage error                |
+| `ErrorCode.NOT_LEADER_OR_FOLLOWER`                          | 12   | Leader election in progress               |
+| `ErrorCode.CORRUPT_RECORD_EXCEPTION`                        | 14   | Corrupt record                            |
+| `ErrorCode.UNKNOWN_TABLE_OR_BUCKET_EXCEPTION`               | 21   | Metadata not yet available                |
+| `ErrorCode.REQUEST_TIME_OUT`                                | 25   | Request timed out                         |
+| `ErrorCode.STORAGE_EXCEPTION`                               | 26   | Transient storage error                   |
+| `ErrorCode.NOT_ENOUGH_REPLICAS_AFTER_APPEND_EXCEPTION`      | 28   | Wrote to server but with low ISR size     |
+| `ErrorCode.NOT_ENOUGH_REPLICAS_EXCEPTION`                   | 29   | Low ISR size at write time                |
+| `ErrorCode.LEADER_NOT_AVAILABLE_EXCEPTION`                  | 44   | No leader available for partition         |
+
+For client-side errors (`ErrorCode.CLIENT_ERROR`, code -2), `is_retriable` is always `False`.
+
+## Common Error Scenarios
+
+### Connection Refused
+
+The Fluss cluster is not running or the address is incorrect.
+
+```python
+try:
+    config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
+    conn = await fluss.FlussConnection.create(config)
+except fluss.FlussError as e:
+    # error_code == ErrorCode.CLIENT_ERROR for connection failures
+    print(f"Cannot connect to cluster: {e.message}")
+```
+
+### Table Not Found
+
+The table does not exist or has been dropped.
+
+```python
+try:
+    await admin.drop_table(table_path)
+except fluss.FlussError as e:
+    if e.error_code == fluss.ErrorCode.TABLE_NOT_EXIST:
+        print("Table not found")
+```
+
+### Partition Not Found
+
+The target partition has not been created yet, e.g. writing to or dropping a partition of a partitioned table before creating it.
+
+```python
+try:
+    await admin.drop_partition(table_path, {"region": "US"})
+except fluss.FlussError as e:
+    if e.error_code == fluss.ErrorCode.PARTITION_NOT_EXISTS:
+        print("Partition does not exist, create it first")
+```
+
+### Authentication Failed
+
+SASL credentials are incorrect or the user does not exist.
+
+```python
+try:
+    config = fluss.Config({
+        "bootstrap.servers": "127.0.0.1:9123",
+        "security.protocol": "sasl",
+        "security.sasl.username": "admin",
+        "security.sasl.password": "wrong-password",
+    })
+    conn = await fluss.FlussConnection.create(config)
+except fluss.FlussError as e:
+    if e.error_code == fluss.ErrorCode.AUTHENTICATE_EXCEPTION:
+        print(f"Authentication failed: {e.message}")
+```
+
+### Schema Mismatch
+
+Row data doesn't match the table schema.
+
+```python
+try:
+    writer.append({"wrong_column": "value"})
+    await writer.flush()
+except fluss.FlussError as e:
+    # error_code == ErrorCode.CLIENT_ERROR for type/schema mismatches
+    print(f"Schema mismatch: {e.message}")
+```
diff --git a/website/docs/apis/python/example/_category_.json b/website/docs/apis/python/example/_category_.json
new file mode 100644
index 0000000000..4d81ec12ae
--- /dev/null
+++ b/website/docs/apis/python/example/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Examples",
+  "position": 5
+}
diff --git a/website/docs/apis/python/example/admin-operations.md b/website/docs/apis/python/example/admin-operations.md
new file mode 100644
index 0000000000..2cda6c4abf
--- /dev/null
+++ b/website/docs/apis/python/example/admin-operations.md
@@ -0,0 +1,81 @@
+---
+sidebar_position: 3
+---
+# Admin Operations
+
+```python
+admin = conn.get_admin()
+```
+
+## Databases
+
+```python
+await admin.create_database("my_database", ignore_if_exists=True)
+databases = await admin.list_databases()
+exists = await admin.database_exists("my_database")
+await admin.drop_database("my_database", ignore_if_not_exists=True, cascade=True)
+```
+
+## Tables
+
+Schemas are defined using PyArrow and wrapped in `fluss.Schema`:
+
+```python
+import pyarrow as pa
+
+schema = fluss.Schema(pa.schema([
+    pa.field("id", pa.int32()),
+    pa.field("name", pa.string()),
+    pa.field("amount", pa.int64()),
+]))
+
+table_path = fluss.TablePath("my_database", "my_table")
+await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
+
+table_info = await admin.get_table_info(table_path)
+tables = await admin.list_tables("my_database")
+await admin.drop_table(table_path, ignore_if_not_exists=True)
+```
+
+### TableDescriptor Options
+
+`TableDescriptor` accepts these optional parameters:
+
+| Parameter           | Description                                                                         |
+|---------------------|-------------------------------------------------------------------------------------|
+| `partition_keys`    | Column names to partition by (e.g. `["region"]`)                                    |
+| `bucket_count`      | Number of buckets (parallelism units) for the table                                 |
+| `bucket_keys`       | Columns used to determine bucket assignment                                         |
+| `comment`           | Table comment / description                                                         |
+| `log_format`        | Log storage format: `"ARROW"` or `"INDEXED"`                                        |
+| `kv_format`         | KV storage format for primary key tables: `"INDEXED"` or `"COMPACTED"`              |
+| `properties`        | Table configuration properties as a dict (e.g. `{"table.replication.factor": "1"}`) |
+| `custom_properties` | User-defined properties as a dict                                                   |
+
+## Offsets
+
+```python
+# Latest offsets for buckets
+offsets = await admin.list_offsets(table_path, bucket_ids=[0, 1], offset_spec=fluss.OffsetSpec.latest())
+
+# By timestamp
+offsets = await admin.list_offsets(table_path, bucket_ids=[0], offset_spec=fluss.OffsetSpec.timestamp(1704067200000))
+
+# Per-partition offsets
+offsets = await admin.list_partition_offsets(table_path, partition_name="US", bucket_ids=[0], offset_spec=fluss.OffsetSpec.latest())
+```
+
+## Lake Snapshot
+
+:::note
+Lake snapshots require [lake integration](https://fluss.apache.org/docs/maintenance/tiered-storage/overview/) (e.g. Paimon or Iceberg) to be enabled on the server. Without it, `get_latest_lake_snapshot` will raise an error.
+:::
+
+```python
+snapshot = await admin.get_latest_lake_snapshot(table_path)
+print(f"Snapshot ID: {snapshot.snapshot_id}")
+print(f"Table buckets: {snapshot.get_table_buckets()}")
+
+bucket = fluss.TableBucket(table_id=1, bucket=0)
+offset = snapshot.get_bucket_offset(bucket)
+```
diff --git a/website/docs/apis/python/example/configuration.md b/website/docs/apis/python/example/configuration.md
new file mode 100644
index 0000000000..448ae029ac
--- /dev/null
+++ b/website/docs/apis/python/example/configuration.md
@@ -0,0 +1,49 @@
+---
+sidebar_position: 2
+---
+# Configuration
+
+## Connection Setup
+
+```python
+import fluss
+
+config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
+conn = await fluss.FlussConnection.create(config)
+```
+
+The connection can also be used as an async context manager:
+
+```python
+async with await fluss.FlussConnection.create(config) as conn:
+    ...
+```
+
+## Connection Configurations
+
+Configuration options can be set either via dict keys in the `Config()` constructor, or via Python property setters.
+
+See the [`Config`](../api-reference.md#config) section in the API Reference for the full list of options, their config keys, and descriptions.
+
+## SASL Authentication
+
+To connect to a Fluss cluster with SASL/PLAIN authentication enabled:
+
+```python
+config = fluss.Config({
+    "bootstrap.servers": "127.0.0.1:9123",
+    "security.protocol": "sasl",
+    "security.sasl.mechanism": "PLAIN",
+    "security.sasl.username": "admin",
+    "security.sasl.password": "admin-secret",
+})
+conn = await fluss.FlussConnection.create(config)
+```
+
+## Connection Lifecycle
+
+Remember to close the connection when done:
+
+```python
+await conn.close()
+```
diff --git a/website/docs/apis/python/example/index.md b/website/docs/apis/python/example/index.md
new file mode 100644
index 0000000000..ecbdc84685
--- /dev/null
+++ b/website/docs/apis/python/example/index.md
@@ -0,0 +1,46 @@
+---
+sidebar_position: 1
+---
+# Example
+
+Minimal working example: connect to Fluss, create a table, write data, and read it back.
+
+```python
+import asyncio
+import pyarrow as pa
+import fluss
+
+async def main():
+    # Connect
+    config = fluss.Config({"bootstrap.servers": "127.0.0.1:9123"})
+    conn = await fluss.FlussConnection.create(config)
+    admin = conn.get_admin()
+
+    # Create a log table
+    schema = fluss.Schema(pa.schema([
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("score", pa.float32()),
+    ]))
+    table_path = fluss.TablePath("fluss", "quick_start")
+    await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
+
+    # Write
+    table = await conn.get_table(table_path)
+    writer = table.new_append().create_writer()
+    writer.append({"id": 1, "name": "Alice", "score": 95.5})
+    writer.append({"id": 2, "name": "Bob", "score": 87.0})
+    await writer.flush()
+
+    # Read
+    num_buckets = (await admin.get_table_info(table_path)).num_buckets
+    scanner = await table.new_scan().create_record_batch_log_scanner()
+    scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+    print(await scanner.to_pandas())
+
+    # Cleanup
+    await admin.drop_table(table_path, ignore_if_not_exists=True)
+    await conn.close()
+
+asyncio.run(main())
+```
diff --git a/website/docs/apis/python/example/log-tables.md b/website/docs/apis/python/example/log-tables.md
new file mode 100644
index 0000000000..4dbe256781
--- /dev/null
+++ b/website/docs/apis/python/example/log-tables.md
@@ -0,0 +1,129 @@
+---
+sidebar_position: 4
+---
+# Log Tables
+
+Log tables are append-only tables without primary keys, suitable for event streaming.
+
+## Creating a Log Table
+
+```python
+import pyarrow as pa
+
+schema = fluss.Schema(pa.schema([
+    pa.field("id", pa.int32()),
+    pa.field("name", pa.string()),
+    pa.field("score", pa.float32()),
+]))
+
+table_path = fluss.TablePath("fluss", "events")
+await admin.create_table(table_path, fluss.TableDescriptor(schema), ignore_if_exists=True)
+```
+
+## Writing
+
+Rows can be appended as dicts, lists, or tuples. For bulk writes, use `write_arrow()`, `write_arrow_batch()`, or `write_pandas()`.
+
+Write methods like `append()` and `write_arrow_batch()` return a `WriteResultHandle`. You can ignore it for fire-and-forget semantics (flush at the end), or `await handle.wait()` to block until the server acknowledges that specific write.
+
+```python
+table = await conn.get_table(table_path)
+writer = table.new_append().create_writer()
+
+# Fire-and-forget: queue writes, flush at the end
+writer.append({"id": 1, "name": "Alice", "score": 95.5})
+writer.append([2, "Bob", 87.0])
+await writer.flush()
+
+# Per-record acknowledgment
+handle = writer.append({"id": 3, "name": "Charlie", "score": 91.0})
+await handle.wait()
+
+# Bulk writes
+writer.write_arrow(pa_table)          # PyArrow Table
+writer.write_arrow_batch(record_batch) # PyArrow RecordBatch
+writer.write_pandas(df)                # Pandas DataFrame
+await writer.flush()
+```
+
+## Reading
+
+There are two scanner types:
+- **Batch scanner** (`create_record_batch_log_scanner()`): returns Arrow Tables or DataFrames, best for analytics
+- **Record scanner** (`create_log_scanner()`): returns individual records with metadata (offset, timestamp, change type), best for streaming
+
+And two reading modes:
+- **`to_arrow()` / `to_pandas()`**: reads all data from subscribed buckets up to the current latest offset, then returns. Best for one-shot batch reads.
+- **`poll_arrow()` / `poll()` / `poll_record_batch()`**: returns whatever data becomes available within the timeout (possibly nothing). Call in a loop for continuous streaming.
+
+### Batch Read (One-Shot)
+
+```python
+num_buckets = (await admin.get_table_info(table_path)).num_buckets
+
+scanner = await table.new_scan().create_record_batch_log_scanner()
+scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+# Reads everything up to current latest offset, then returns
+arrow_table = await scanner.to_arrow()
+df = await scanner.to_pandas()
+```
+
+### Continuous Polling
+
+Use `poll_arrow()` or `poll()` in a loop for streaming consumption:
+
+```python
+# Batch scanner: poll as Arrow Tables
+scanner = await table.new_scan().create_record_batch_log_scanner()
+scanner.subscribe(bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
+
+while True:
+    result = await scanner.poll_arrow(timeout_ms=5000)
+    if result.num_rows > 0:
+        print(result.to_pandas())
+
+# Record scanner (alternative to the loop above): poll individual records
+scanner = await table.new_scan().create_log_scanner()
+scanner.subscribe_buckets({i: fluss.EARLIEST_OFFSET for i in range(num_buckets)})
+
+while True:
+    scan_records = await scanner.poll(timeout_ms=5000)
+
+    for record in scan_records:
+        print(f"offset={record.offset}, change={record.change_type.short_string()}, row={record.row}")
+
+    # Or per-bucket access (dict-like)
+    for bucket, records in scan_records.items():
+        for record in records:
+            print(f"bucket={bucket.bucket_id}, offset={record.offset}, row={record.row}")
+```
+
+### Unsubscribing
+
+To stop consuming from a bucket, use `unsubscribe()`:
+
+```python
+scanner.unsubscribe(bucket_id=0)
+```
+
+### Subscribe from Latest Offset
+
+To only consume new records (skip existing data), first resolve the current latest offset via `list_offsets`, then subscribe at that offset:
+
+```python
+admin = conn.get_admin()
+offsets = await admin.list_offsets(table_path, [0], fluss.OffsetSpec.latest())
+latest = offsets[0]
+
+scanner = await table.new_scan().create_record_batch_log_scanner()
+scanner.subscribe(bucket_id=0, start_offset=latest)
+```
+
+## Column Projection
+
+```python
+scanner = await table.new_scan().project([0, 2]).create_record_batch_log_scanner()
+# or by name
+scanner = await table.new_scan().project_by_name(["id", "score"]).create_record_batch_log_scanner()
+```
diff --git a/website/docs/apis/python/example/partitioned-tables.md b/website/docs/apis/python/example/partitioned-tables.md
new file mode 100644
index 0000000000..894bb519db
--- /dev/null
+++ b/website/docs/apis/python/example/partitioned-tables.md
@@ -0,0 +1,104 @@
+---
+sidebar_position: 6
+---
+# Partitioned Tables
+
+Partitioned tables distribute data across partitions based on column values. Partitions must exist before writing data, otherwise the client will by default retry indefinitely.
+
+## Creating and Managing Partitions
+
+```python
+import pyarrow as pa
+
+schema = fluss.Schema(pa.schema([
+    pa.field("id", pa.int32()),
+    pa.field("region", pa.string()),
+    pa.field("value", pa.int64()),
+]))
+
+table_path = fluss.TablePath("fluss", "partitioned_events")
+await admin.create_table(
+    table_path,
+    fluss.TableDescriptor(schema, partition_keys=["region"], bucket_count=1),
+    ignore_if_exists=True,
+)
+
+# Create partitions
+await admin.create_partition(table_path, {"region": "US"}, ignore_if_exists=True)
+await admin.create_partition(table_path, {"region": "EU"}, ignore_if_exists=True)
+
+# List partitions
+partition_infos = await admin.list_partition_infos(table_path)
+```
+
+## Writing
+
+Writing works the same as for non-partitioned tables: include the partition column values in each row. **Partitions must exist before writing data, otherwise the client will by default retry indefinitely.**
+
+```python
+table = await conn.get_table(table_path)
+writer = table.new_append().create_writer()
+writer.append({"id": 1, "region": "US", "value": 100})
+writer.append({"id": 2, "region": "EU", "value": 200})
+await writer.flush()
+```
+
+## Reading
+
+Use `subscribe_partition()` or `subscribe_partition_buckets()` instead of `subscribe()`:
+
+```python
+scanner = await table.new_scan().create_record_batch_log_scanner()
+
+# Subscribe to individual partitions
+for p in partition_infos:
+    scanner.subscribe_partition(partition_id=p.partition_id, bucket_id=0, start_offset=fluss.EARLIEST_OFFSET)
+
+# Or batch-subscribe
+scanner.subscribe_partition_buckets({
+    (p.partition_id, 0): fluss.EARLIEST_OFFSET for p in partition_infos
+})
+
+print(await scanner.to_pandas())
+```
+
+### Unsubscribing
+
+To stop consuming from a specific partition bucket, use `unsubscribe_partition()`:
+
+```python
+scanner.unsubscribe_partition(partition_id=partition_infos[0].partition_id, bucket_id=0)
+```
+
+## Partitioned Primary Key Tables
+
+Partition columns must be part of the primary key. Partitions must exist before upserting data, otherwise the client will by default retry indefinitely.
+
+```python
+schema = fluss.Schema(
+    pa.schema([
+        pa.field("user_id", pa.int32()),
+        pa.field("region", pa.string()),
+        pa.field("score", pa.int64()),
+    ]),
+    primary_keys=["user_id", "region"],
+)
+
+table_path = fluss.TablePath("fluss", "partitioned_users")
+await admin.create_table(
+    table_path,
+    fluss.TableDescriptor(schema, partition_keys=["region"]),
+    ignore_if_exists=True,
+)
+
+await admin.create_partition(table_path, {"region": "US"}, ignore_if_exists=True)
+
+table = await conn.get_table(table_path)
+writer = table.new_upsert().create_writer()
+writer.upsert({"user_id": 1, "region": "US", "score": 1234})
+await writer.flush()
+
+# Lookup includes partition columns
+lookuper = table.new_lookup().create_lookuper()
+result = await lookuper.lookup({"user_id": 1, "region": "US"})
+```
diff --git a/website/docs/apis/python/example/primary-key-tables.md b/website/docs/apis/python/example/primary-key-tables.md
new file mode 100644
index 0000000000..cd61e5084c
--- /dev/null
+++ b/website/docs/apis/python/example/primary-key-tables.md
@@ -0,0 +1,61 @@
+---
+sidebar_position: 5
+---
+# Primary Key Tables
+
+Primary key tables support upsert, delete, and point lookup operations.
+
+## Creating a Primary Key Table
+
+Pass `primary_keys` to `fluss.Schema`:
+
+```python
+import pyarrow as pa
+
+schema = fluss.Schema(
+    pa.schema([
+        pa.field("id", pa.int32()),
+        pa.field("name", pa.string()),
+        pa.field("age", pa.int64()),
+    ]),
+    primary_keys=["id"],
+)
+table_path = fluss.TablePath("fluss", "users")
+await admin.create_table(table_path, fluss.TableDescriptor(schema, bucket_count=3), ignore_if_exists=True)
+```
+
+## Upsert, Delete, Lookup
+
+```python
+table = await conn.get_table(table_path)
+
+# Upsert (fire-and-forget, flush at the end)
+writer = table.new_upsert().create_writer()
+writer.upsert({"id": 1, "name": "Alice", "age": 25})
+writer.upsert({"id": 2, "name": "Bob", "age": 30})
+await writer.flush()
+
+# Per-record acknowledgment (for read-after-write)
+handle = writer.upsert({"id": 3, "name": "Charlie", "age": 35})
+await handle.wait()
+
+# Delete by primary key
+handle = writer.delete({"id": 2})
+await handle.wait()
+
+# Lookup
+lookuper = table.new_lookup().create_lookuper()
+result = await lookuper.lookup({"id": 1})
+if result:
+    print(f"Found: name={result['name']}, age={result['age']}")
+```
+
+## Partial Updates
+
+Update specific columns while preserving others:
+
+```python
+partial_writer = table.new_upsert().partial_update_by_name(["id", "age"]).create_writer()
+partial_writer.upsert({"id": 1, "age": 27})  # only updates age
+await partial_writer.flush()
+```
diff --git a/website/docs/apis/python/installation.md b/website/docs/apis/python/installation.md
new file mode 100644
index 0000000000..4182dbb431
--- /dev/null
+++ b/website/docs/apis/python/installation.md
@@ -0,0 +1,41 @@
+---
+sidebar_position: 1
+---
+# Installation
+
+```bash
+pip install pyfluss
+```
+
+## Building From Source (Optional)
+
+**Prerequisites:** Python 3.9+, Rust 1.85+
+
+```bash
+git clone https://github.com/apache/fluss-rust.git
+cd fluss-rust/bindings/python
+```
+
+Install [maturin](https://github.com/PyO3/maturin):
+
+```bash
+pip install maturin
+```
+
+Build and install:
+
+```bash
+# Development mode (editable)
+maturin develop
+
+# Or build a wheel
+maturin build --release
+pip install target/wheels/fluss-*.whl
+```
+
+Verify:
+
+```python
+import fluss
+print("Fluss Python bindings installed successfully!")
+```
diff --git a/website/docs/apis/rust-client.md b/website/docs/apis/rust-client.md
deleted file mode 100644
index 8b71936315..0000000000
--- a/website/docs/apis/rust-client.md
+++ /dev/null
@@ -1,53 +0,0 @@
----
-title: "Rust Client"
-sidebar_position: 3
----
-
-# Fluss Rust Client
-
-The Fluss Rust Client is a high-performance, asynchronous library powered by the
-[Tokio](https://tokio.rs/) runtime. It provides a native interface for interacting
-with Fluss clusters with minimal overhead.
-
-The client provides two main APIs:
-
-- **[Admin API](https://clients.fluss.apache.org/user-guide/rust/api-reference#flussadmin)**: For managing databases, tables, and partitions.
-- **[Table API](https://clients.fluss.apache.org/user-guide/rust/api-reference/#flusstablea)**: For reading and writing to Log and Primary Key tables
-
-## Installation
-
-The Fluss Rust client is published to [crates.io](https://crates.io/crates/fluss-rs)
-as `fluss-rs`. The crate's library name is `fluss`, so you import it with `use fluss::...`.
-
-Add the following to your `Cargo.toml`:
-```toml
-[dependencies]
-fluss-rs = "0.1"
-tokio = { version = "1", features = ["full"] }
-```
-
-## Quick Example
-```rust
-use fluss::client::FlussConnection;
-use fluss::config::Config;
-use fluss::error::Result;
-
-#[tokio::main]
-async fn main() -> Result<()> {
-    let mut config = Config::default();
-    config.bootstrap_servers = "127.0.0.1:9123".to_string();
-
-    let conn = FlussConnection::new(config).await?;
-    let admin = conn.get_admin().await?;
-
-    Ok(())
-}
-```
-
-For more examples, see [Fluss Rust Client documentation](https://clients.fluss.apache.org/user-guide/rust/example/).
-
-## Full Documentation
-
-For the complete Rust client reference including all configuration options,
-API methods, data types, error handling, and worked examples — see the
-**[Fluss Rust Client documentation](https://clients.fluss.apache.org/user-guide/rust/installation)**.
\ No newline at end of file
diff --git a/website/docs/apis/rust/_category_.json b/website/docs/apis/rust/_category_.json
new file mode 100644
index 0000000000..d2279a0af3
--- /dev/null
+++ b/website/docs/apis/rust/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Rust",
+  "position": 3
+}
diff --git a/website/docs/apis/rust/api-reference.md b/website/docs/apis/rust/api-reference.md
new file mode 100644
index 0000000000..bb2ec3e8f1
--- /dev/null
+++ b/website/docs/apis/rust/api-reference.md
@@ -0,0 +1,597 @@
+---
+sidebar_position: 2
+---
+# API Reference
+
+Complete API reference for the Fluss Rust client.
+
+## `Config`
+
+| Field                                 | Type            | Default            | Description                                                                          |
+|---------------------------------------|-----------------|--------------------|--------------------------------------------------------------------------------------|
+| `bootstrap_servers`                   | `String`        | `"127.0.0.1:9123"` | Coordinator server address                                                           |
+| `writer_request_max_size`             | `i32`           | `10485760` (10 MB) | Maximum request size in bytes                                                        |
+| `writer_acks`                         | `String`        | `"all"`            | Acknowledgment setting (`"all"` waits for all replicas)                              |
+| `writer_retries`                      | `i32`           | `i32::MAX`         | Number of retries on failure                                                         |
+| `writer_batch_size`                   | `i32`           | `2097152` (2 MB)   | Batch size for writes in bytes. Upper bound when dynamic sizing is on; fixed batch size when off. |
+| `writer_dynamic_batch_size_enabled`   | `bool`          | `true`             | Enable per-table dynamic batch sizing: target grows 10% above 80% fill, shrinks 5% below 50%, clamped to `[writer_dynamic_batch_size_min, writer_batch_size]` |
+| `writer_dynamic_batch_size_min`       | `i32`           | `262144` (256 KB)  | Lower bound for the dynamic batch size estimator (ignored when `writer_dynamic_batch_size_enabled` is `false`) |
+| `writer_batch_timeout_ms`             | `i64`           | `100`              | Maximum time in ms to wait for a writer batch to fill up before sending              |
+| `writer_bucket_no_key_assigner`       | `NoKeyAssigner` | `sticky`           | Bucket assignment strategy for tables without bucket keys: `sticky` or `round_robin` |
+| `scanner_remote_log_prefetch_num`     | `usize`         | `4`                | Number of remote log segments to prefetch                                            |
+| `remote_file_download_thread_num`     | `usize`         | `3`                | Number of threads for remote log downloads                                           |
+| `scanner_remote_log_read_concurrency` | `usize`         | `4`                | Streaming read concurrency within a remote log file                                  |
+| `scanner_log_max_poll_records`        | `usize`         | `500`              | Maximum number of records returned in a single poll()                                |
+| `scanner_log_fetch_max_bytes`         | `i32`           | `16777216` (16 MB) | Maximum bytes per fetch response for LogScanner                                      |
+| `scanner_log_fetch_min_bytes`         | `i32`           | `1`                | Minimum bytes the server must accumulate before returning a fetch response           |
+| `scanner_log_fetch_wait_max_time_ms`  | `i32`           | `500`              | Maximum time (ms) the server may wait to satisfy min-bytes                           |
+| `scanner_log_fetch_max_bytes_for_bucket`| `i32`         | `1048576` (1 MB)   | Maximum bytes per fetch response per bucket for LogScanner                           |
+| `connect_timeout_ms`                  | `u64`           | `120000`           | TCP connect timeout in milliseconds                                                  |
+| `security_protocol`                   | `String`        | `"PLAINTEXT"`      | `PLAINTEXT` (default) or `sasl` for SASL auth                                        |
+| `security_sasl_mechanism`             | `String`        | `"PLAIN"`          | SASL mechanism (only `PLAIN` is supported)                                           |
+| `security_sasl_username`              | `String`        | (empty)            | SASL username (required when protocol is `sasl`)                                     |
+| `security_sasl_password`              | `String`        | (empty)            | SASL password (required when protocol is `sasl`)                                     |
+
+## `FlussConnection`
+
+| Method                                                                        | Description                                    |
+|-------------------------------------------------------------------------------|------------------------------------------------|
+| `async fn new(config: Config) -> Result<Self>`                                | Create a new connection to a Fluss cluster     |
+| `fn get_admin(&self) -> Result<Arc<FlussAdmin>>`                              | Get the admin interface for cluster management |
+| `async fn get_table(&self, table_path: &TablePath) -> Result<FlussTable<'_>>` | Get a table for read/write operations          |
+| `fn config(&self) -> &Config`                                                 | Get a reference to the connection config       |
+
+## `FlussAdmin`
+
+### Database Operations
+
+| Method                                                                                                                       | Description                |
+|------------------------------------------------------------------------------------------------------------------------------|----------------------------|
+| `async fn create_database(&self, name: &str, descriptor: Option<&DatabaseDescriptor>, ignore_if_exists: bool) -> Result<()>` | Create a database          |
+| `async fn drop_database(&self, name: &str, ignore_if_not_exists: bool, cascade: bool) -> Result<()>`                         | Drop a database            |
+| `async fn list_databases(&self) -> Result<Vec<String>>`                                                                      | List all databases         |
+| `async fn database_exists(&self, name: &str) -> Result<bool>`                                                                | Check if a database exists |
+| `async fn get_database_info(&self, name: &str) -> Result<DatabaseInfo>`                                                      | Get database metadata      |
+
+### Table Operations
+
+| Method                                                                                                                     | Description                                                                 |
+|----------------------------------------------------------------------------------------------------------------------------|-----------------------------------------------------------------------------|
+| `async fn create_table(&self, table_path: &TablePath, descriptor: &TableDescriptor, ignore_if_exists: bool) -> Result<()>` | Create a table                                                              |
+| `async fn drop_table(&self, table_path: &TablePath, ignore_if_not_exists: bool) -> Result<()>`                             | Drop a table                                                                |
+| `async fn get_table_info(&self, table_path: &TablePath) -> Result<TableInfo>`                                              | Get table metadata                                                          |
+| `async fn get_table_schema(&self, table_path: &TablePath, schema_id: Option<i32>) -> Result<SchemaInfo>`                   | Get a table's schema by id, or the latest schema when `schema_id` is `None` |
+| `async fn list_tables(&self, database_name: &str) -> Result<Vec<String>>`                                                  | List tables in a database                                                   |
+| `async fn table_exists(&self, table_path: &TablePath) -> Result<bool>`                                                     | Check if a table exists                                                     |
+
+### Partition Operations
+
+| Method                                                                                                                               | Description                     |
+|--------------------------------------------------------------------------------------------------------------------------------------|---------------------------------|
+| `async fn list_partition_infos(&self, table_path: &TablePath) -> Result<Vec<PartitionInfo>>`                                         | List all partitions             |
+| `async fn list_partition_infos_with_spec(&self, table_path: &TablePath, spec: Option<&PartitionSpec>) -> Result<Vec<PartitionInfo>>` | List partitions matching a spec |
+| `async fn create_partition(&self, table_path: &TablePath, spec: &PartitionSpec, ignore_if_exists: bool) -> Result<()>`               | Create a partition              |
+| `async fn drop_partition(&self, table_path: &TablePath, spec: &PartitionSpec, ignore_if_not_exists: bool) -> Result<()>`             | Drop a partition                |
+
+### Offset Operations
+
+| Method                                                                                                                                                           |  Description                          |
+|------------------------------------------------------------------------------------------------------------------------------------------------------------------|---------------------------------------|
+| `async fn list_offsets(&self, table_path: &TablePath, bucket_ids: &[i32], offset_spec: OffsetSpec) -> Result<HashMap<i32, i64>>`                                 | Get offsets for buckets               |
+| `async fn list_partition_offsets(&self, table_path: &TablePath, partition_name: &str, bucket_ids: &[i32], offset_spec: OffsetSpec) -> Result<HashMap<i32, i64>>` | Get offsets for a partition's buckets |
+
+### Lake Operations
+
+| Method                                                                                     |  Description                 |
+|--------------------------------------------------------------------------------------------|------------------------------|
+| `async fn get_latest_lake_snapshot(&self, table_path: &TablePath) -> Result<LakeSnapshot>` | Get the latest lake snapshot |
+
+### Cluster Operations
+
+| Method                                                        | Description                                         |
+|---------------------------------------------------------------|-----------------------------------------------------|
+| `async fn get_server_nodes(&self) -> Result<Vec<ServerNode>>` | Get all alive server nodes (coordinator + tablet servers) |
+
+## `ServerNode`
+
+| Method                            | Description                                          |
+|-----------------------------------|------------------------------------------------------|
+| `fn id(&self) -> i32`            | Server node ID                                       |
+| `fn host(&self) -> &str`         | Hostname of the server                               |
+| `fn port(&self) -> u32`          | Port number                                          |
+| `fn server_type(&self) -> &ServerType` | Server type (`CoordinatorServer` or `TabletServer`) |
+| `fn uid(&self) -> &str`          | Unique identifier (e.g. `"cs-0"`, `"ts-1"`)         |
+
+## `FlussTable<'a>`
+
+| Method                                        | Description                             |
+|-----------------------------------------------|-----------------------------------------|
+| `fn get_table_info(&self) -> &TableInfo`      | Get table metadata                      |
+| `fn new_append(&self) -> Result<TableAppend>` | Create an append builder for log tables |
+| `fn new_scan(&self) -> TableScan<'_>`         | Create a scan builder                   |
+| `fn new_lookup(&self) -> Result<TableLookup>` | Create a lookup builder for PK tables   |
+| `fn new_upsert(&self) -> Result<TableUpsert>` | Create an upsert builder for PK tables  |
+| `fn has_primary_key(&self) -> bool`           | Check if the table has a primary key    |
+| `fn table_path(&self) -> &TablePath`          | Get the table path                      |
+
+## `TableAppend`
+
+| Method                                            | Description             |
+|---------------------------------------------------|-------------------------|
+| `fn create_writer(&self) -> Result<AppendWriter>` | Create an append writer |
+
+## `AppendWriter`
+
+| Method                                                                          | Description                                       |
+|---------------------------------------------------------------------------------|---------------------------------------------------|
+| `fn append(&self, row: &impl InternalRow) -> Result<WriteResultFuture>`         | Append a row; returns a future for acknowledgment |
+| `fn append_arrow_batch(&self, batch: RecordBatch) -> Result<WriteResultFuture>` | Append an Arrow RecordBatch                       |
+| `async fn flush(&self) -> Result<()>`                                           | Flush all pending writes to the server            |
+
+## `TableScan<'a>`
+
+| Method                                                                      | Description                             |
+|-----------------------------------------------------------------------------|-----------------------------------------|
+| `fn project(self, indices: &[usize]) -> Result<Self>`                       | Project columns by index                |
+| `fn project_by_name(self, names: &[&str]) -> Result<Self>`                  | Project columns by name                 |
+| `fn limit(self, n: i32) -> Result<Self>`                                    | Set a row limit (enables `create_bucket_batch_scanner`; rejected by log scanners) |
+| `fn create_log_scanner(self) -> Result<LogScanner>`                         | Create a record-based log scanner       |
+| `fn create_record_batch_log_scanner(self) -> Result<RecordBatchLogScanner>` | Create an Arrow batch-based log scanner |
+| `fn create_bucket_batch_scanner(self, bucket: TableBucket) -> Result<LimitBatchScanner>` | Bounded scan of one bucket (requires `limit`; runs on first `next_batch`) |
+
+## `LogScanner`
+
+Single-consumer: do not call `poll` concurrently on the same scanner (e.g. from `tokio::join!` or two tasks sharing an `Arc`). Mirrors Java's `LogScannerImpl.acquire()` guard. Debug builds surface overlapping calls via a `debug_assert!`; release builds skip the check for performance and produce skewed poll-timing metrics (`fluss.client.scanner.time_between_poll_ms`, `fluss.client.scanner.poll_idle_ratio`) if the contract is violated.
+
+All `fluss.client.scanner.*` metrics carry `database` and `table` labels (matching Java's per-`TablePath` `ScannerMetricGroup`), so multi-table consumers get one time series per scanned table.
+
+| Method                                                                                                    | Description                                              |
+|-----------------------------------------------------------------------------------------------------------|----------------------------------------------------------|
+| `async fn subscribe(&self, bucket_id: i32, start_offset: i64) -> Result<()>`                              | Subscribe to a bucket                                    |
+| `async fn subscribe_buckets(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()>`                     | Subscribe to multiple buckets                            |
+| `async fn subscribe_partition(&self, partition_id: i64, bucket_id: i32, start_offset: i64) -> Result<()>` | Subscribe to a partition bucket                          |
+| `async fn subscribe_partition_buckets(&self, offsets: &HashMap<(i64, i32), i64>) -> Result<()>`           | Subscribe to multiple partition-bucket pairs             |
+| `async fn unsubscribe(&self, bucket_id: i32) -> Result<()>`                                               | Unsubscribe from a bucket (non-partitioned tables)       |
+| `async fn unsubscribe_partition(&self, partition_id: i64, bucket_id: i32) -> Result<()>`                  | Unsubscribe from a partition bucket (partitioned tables) |
+| `async fn poll(&self, timeout: Duration) -> Result<ScanRecords>`                                          | Poll for records                                         |
+
+## `RecordBatchLogScanner`
+
+Single-consumer: overlapping `poll` calls on handles that share state, or `poll` concurrent with `RecordBatchLogReader::next_batch`, are not supported — use one active polling/consumption call at a time per underlying scanner state. Mirrors Java's `LogScannerImpl.acquire()` guard. Debug builds surface overlapping calls via a `debug_assert!`; release builds skip the check for performance and produce skewed poll-timing metrics (`fluss.client.scanner.time_between_poll_ms`, `fluss.client.scanner.poll_idle_ratio`) if the contract is violated.
+
+| Method                                                                                                    | Description                                              |
+|-----------------------------------------------------------------------------------------------------------|----------------------------------------------------------|
+| `async fn subscribe(&self, bucket_id: i32, start_offset: i64) -> Result<()>`                              | Subscribe to a bucket                                    |
+| `async fn subscribe_buckets(&self, bucket_offsets: &HashMap<i32, i64>) -> Result<()>`                     | Subscribe to multiple buckets                            |
+| `async fn subscribe_partition(&self, partition_id: i64, bucket_id: i32, start_offset: i64) -> Result<()>` | Subscribe to a partition bucket                          |
+| `async fn subscribe_partition_buckets(&self, offsets: &HashMap<(i64, i32), i64>) -> Result<()>`           | Subscribe to multiple partition-bucket pairs             |
+| `async fn unsubscribe(&self, bucket_id: i32) -> Result<()>`                                               | Unsubscribe from a bucket (non-partitioned tables)       |
+| `async fn unsubscribe_partition(&self, partition_id: i64, bucket_id: i32) -> Result<()>`                  | Unsubscribe from a partition bucket (partitioned tables) |
+| `async fn poll(&self, timeout: Duration) -> Result<Vec<ScanBatch>>`                                       | Poll for Arrow record batches                            |
+| `fn is_partitioned(&self) -> bool`                                                                        | Check if the table is partitioned                        |
+| `fn get_subscribed_buckets(&self) -> Vec<(TableBucket, i64)>`                                             | Get all current subscriptions as (bucket, offset) pairs  |
+| `fn schema(&self) -> SchemaRef`                                                                           | Get the Arrow schema for batches produced by this scanner|
+| `fn table_path(&self) -> &TablePath`                                                                      | Get the table path                                       |
+| `fn table_id(&self) -> TableId`                                                                           | Get the table ID                                         |
+
+## `RecordBatchLogReader`
+
+Bounded log reader that consumes data up to specified stopping offsets, then terminates.
+Unlike `RecordBatchLogScanner`, which polls indefinitely, this reader stops automatically.
+
+| Method                                                                                                      | Description                                              |
+|-------------------------------------------------------------------------------------------------------------|----------------------------------------------------------|
+| `async fn new_until_latest(scanner: RecordBatchLogScanner, admin: &FlussAdmin) -> Result<Self>`              | Read until the latest offsets at time of creation         |
+| `fn new_until_offsets(scanner: RecordBatchLogScanner, stopping_offsets: HashMap<TableBucket, i64>) -> Result<Self>` | Read until custom stopping offsets per bucket             |
+| `async fn next_batch(&mut self) -> Result<Option<ScanBatch>>`                                                | Get the next batch with bucket/offset metadata, or `None` when all buckets have caught up |
+| `async fn collect_all_batches(&mut self) -> Result<Vec<ScanBatch>>`                                          | Drain all batches (with metadata) until stopping offsets are satisfied |
+| `fn schema(&self) -> SchemaRef`                                                                              | Arrow schema for produced batches                        |
+| `fn to_record_batch_reader(self, handle: tokio::runtime::Handle) -> SyncRecordBatchLogReader`                | Sync adapter implementing `arrow::RecordBatchReader` (see below) |
+
+## `SyncRecordBatchLogReader`
+
+Synchronous adapter for `RecordBatchLogReader`. Created via
+`RecordBatchLogReader::to_record_batch_reader(handle)`.
+
+Implements both `Iterator` and `arrow::record_batch::RecordBatchReader`, so it
+plugs into the wider Arrow ecosystem — FFI, PyArrow's
+`pa.RecordBatchReader.from_batches`, the C++ Arrow `RecordBatchReader` interface,
+DataFusion sources, etc.
+
+Each `next()` call drives the underlying async reader via
+`tokio::runtime::Handle::block_on`. **Do not call from inside a Tokio worker
+thread that belongs to the same runtime** — nested `block_on` panics. Prefer
+`RecordBatchLogReader::next_batch` in async Rust code; use this adapter only at
+sync/FFI boundaries.
+
+Bucket and offset metadata carried by `ScanBatch` is **dropped** here, because
+the Arrow trait contract yields plain `RecordBatch`. If you need offsets or
+bucket identity per batch, use `next_batch` instead.
+
+| Method                                                          | Description                                      |
+|-----------------------------------------------------------------|--------------------------------------------------|
+| `fn next(&mut self) -> Option<Result<RecordBatch, ArrowError>>` | Iterator: next batch, or `None` when caught up   |
+| `fn schema(&self) -> SchemaRef`                                 | Arrow schema for produced batches                |
+
+## `LimitBatchScanner`
+
+One-shot bounded scanner from `TableScan::limit(n).create_bucket_batch_scanner(bucket)`.
+Poll it with `next_batch` until it returns `None` (mirrors `RecordBatchLogReader`).
+Supports both log and primary-key tables (the latter returns the current,
+server-deduplicated state); yields a single batch of at most `n` rows.
+
+| Method                                                        | Description                          |
+|---------------------------------------------------------------|--------------------------------------|
+| `async fn next_batch(&mut self) -> Result<Option<ScanBatch>>` | Rows on the first call, `None` after |
+| `async fn collect_all_batches(&mut self) -> Result<Vec<ScanBatch>>` | Drain all remaining batches    |
+| `fn bucket(&self) -> &TableBucket`                            | The scanned bucket                   |
+
+## `ScanRecord`
+
+| Method                                 | Description                            |
+|----------------------------------------|----------------------------------------|
+| `fn row(&self) -> &dyn InternalRow`    | Get the row data                       |
+| `fn offset(&self) -> i64`              | Record offset in the log               |
+| `fn timestamp(&self) -> i64`           | Record timestamp                       |
+| `fn change_type(&self) -> &ChangeType` | Change type (AppendOnly, Insert, etc.) |
+
+## `ScanRecords`
+
+| Method                                                                   | Description                       |
+|--------------------------------------------------------------------------|-----------------------------------|
+| `fn count(&self) -> usize`                                               | Number of records                 |
+| `fn is_empty(&self) -> bool`                                             | Whether the result set is empty   |
+| `fn records(&self, bucket: &TableBucket) -> &[ScanRecord]`               | Get records for a specific bucket |
+| `fn records_by_buckets(&self) -> &HashMap<TableBucket, Vec<ScanRecord>>` | Get all records grouped by bucket |
+
+`ScanRecords` also implements `IntoIterator`, so you can iterate over all records directly:
+
+```rust
+for record in records {
+    println!("offset={}", record.offset());
+}
+```
+
+## `ScanBatch`
+
+| Method                             | Description                    |
+|------------------------------------|--------------------------------|
+| `fn bucket(&self) -> &TableBucket` | Bucket this batch belongs to   |
+| `fn batch(&self) -> &RecordBatch`  | Arrow RecordBatch data         |
+| `fn base_offset(&self) -> i64`     | First record offset            |
+| `fn last_offset(&self) -> i64`     | Last record offset             |
+| `fn num_records(&self) -> usize`   | Number of records in the batch |
+
+## `TableUpsert`
+
+| Method                                                                                | Description                                       |
+|---------------------------------------------------------------------------------------|---------------------------------------------------|
+| `fn create_writer(&self) -> Result<UpsertWriter>`                                     | Create an upsert writer                           |
+| `fn partial_update(&self, column_indices: Option<Vec<usize>>) -> Result<TableUpsert>` | Create a partial update builder by column indices |
+| `fn partial_update_with_column_names(&self, names: &[&str]) -> Result<TableUpsert>`   | Create a partial update builder by column names   |
+
+## `UpsertWriter`
+
+| Method                                                                  | Description                           |
+|-------------------------------------------------------------------------|---------------------------------------|
+| `fn upsert(&self, row: &impl InternalRow) -> Result<WriteResultFuture>` | Upsert a row (insert or update by PK) |
+| `fn delete(&self, row: &impl InternalRow) -> Result<WriteResultFuture>` | Delete a row by primary key           |
+| `async fn flush(&self) -> Result<()>`                                   | Flush all pending operations          |
+
+## `TableLookup`
+
+| Method                                          |  Description                        |
+|-------------------------------------------------|-------------------------------------|
+| `fn create_lookuper(&self) -> Result<Lookuper>` | Create a lookuper for point lookups |
+
+## `Lookuper`
+
+| Method                                                                       |  Description                |
+|------------------------------------------------------------------------------|-----------------------------|
+| `async fn lookup(&mut self, key: &impl InternalRow) -> Result<LookupResult>` | Lookup a row by primary key |
+
+## `LookupResult`
+
+| Method                                                         |  Description                     |
+|----------------------------------------------------------------|----------------------------------|
+| `fn get_single_row(&self) -> Result<Option<impl InternalRow>>` | Get a single row from the result |
+| `fn get_rows(&self) -> Result<Vec<impl InternalRow>>`          | Get all rows from the result     |
+| `fn to_record_batch(&self) -> Result<RecordBatch>`             | Convert all rows to an Arrow `RecordBatch` for DataFusion or other Arrow-based tools    |
+
+## `WriteResultFuture`
+
+| Description                                                                                                                                   |
+|-----------------------------------------------------------------------------------------------------------------------------------------------|
+| Implements `Future<Output = Result<(), Error>>`. Await to wait for server acknowledgment. Returned by `append()`, `upsert()`, and `delete()`. |
+
+Usage:
+
+```rust
+// Fire-and-forget (batched)
+writer.append(&row)?;
+writer.flush().await?;
+
+// Per-record acknowledgment
+writer.append(&row)?.await?;
+```
+
+## `Schema`
+
+| Method                                         |  Description                             |
+|------------------------------------------------|------------------------------------------|
+| `fn builder() -> SchemaBuilder`                | Create a schema builder                  |
+| `fn columns(&self) -> &[Column]`               | Get all columns                          |
+| `fn primary_key(&self) -> Option<&PrimaryKey>` | Get primary key (None if no primary key) |
+| `fn column_names(&self) -> Vec<&str>`          | Get all column names                     |
+| `fn primary_key_indexes(&self) -> Vec<usize>`  | Get primary key column indices           |
+
+## `SchemaBuilder`
+
+| Method                                               |  Description            |
+|------------------------------------------------------|-------------------------|
+| `fn column(name: &str, data_type: DataType) -> Self` | Add a column            |
+| `fn primary_key(keys: Vec<&str>) -> Self`            | Set primary key columns |
+| `fn build() -> Result<Schema>`                       | Build the schema        |
+
+## `SchemaInfo`
+
+A schema together with its server-assigned version id. Returned by [`FlussAdmin::get_table_schema`](#flussadmin).
+
+| Method                                           | Description                              |
+|--------------------------------------------------|------------------------------------------|
+| `fn new(schema: Schema, schema_id: i32) -> Self` | Construct from a schema and id           |
+| `fn schema(&self) -> &Schema`                    | Borrow the schema                        |
+| `fn schema_id(&self) -> i32`                     | Get the server-assigned schema id        |
+| `fn into_parts(self) -> (Schema, i32)`           | Consume and return `(schema, schema_id)` |
+
+## `TableDescriptor`
+
+| Method                                                    | Description                          |
+|-----------------------------------------------------------|--------------------------------------|
+| `fn builder() -> TableDescriptorBuilder`                  | Create a table descriptor builder    |
+| `fn schema(&self) -> &Schema`                             | Get the table schema                 |
+| `fn partition_keys(&self) -> &[String]`                   | Get partition key column names       |
+| `fn has_primary_key(&self) -> bool`                       | Check if the table has a primary key |
+| `fn properties(&self) -> &HashMap<String, String>`        | Get all table properties             |
+| `fn custom_properties(&self) -> &HashMap<String, String>` | Get custom properties                |
+| `fn comment(&self) -> Option<&str>`                       | Get table comment                    |
+
+## `TableDescriptorBuilder`
+
+| Method                                                                                    | Description                                 |
+|-------------------------------------------------------------------------------------------|---------------------------------------------|
+| `fn schema(schema: Schema) -> Self`                                                       | Set the schema                              |
+| `fn log_format(format: LogFormat) -> Self`                                                | Set log format (e.g., `LogFormat::ARROW`)   |
+| `fn kv_format(format: KvFormat) -> Self`                                                  | Set KV format (e.g., `KvFormat::COMPACTED`) |
+| `fn property(key: &str, value: &str) -> Self`                                             | Set a table property                        |
+| `fn custom_property(key: impl Into<String>, value: impl Into<String>) -> Self`            | Set a single custom property                |
+| `fn custom_properties(properties: HashMap<impl Into<String>, impl Into<String>>) -> Self` | Set custom properties                       |
+| `fn partitioned_by(keys: Vec<&str>) -> Self`                                              | Set partition columns                       |
+| `fn distributed_by(bucket_count: Option<i32>, bucket_keys: Vec<String>) -> Self`          | Set bucket distribution                     |
+| `fn comment(comment: &str) -> Self`                                                       | Set table comment                           |
+| `fn build() -> Result<TableDescriptor>`                                                   | Build the table descriptor                  |
+
+## `TablePath`
+
+| Method                                                |  Description        |
+|-------------------------------------------------------|---------------------|
+| `TablePath::new(database: &str, table: &str) -> Self` | Create a table path |
+| `fn database(&self) -> &str`                          | Get database name   |
+| `fn table(&self) -> &str`                             | Get table name      |
+
+## `TableInfo`
+
+| Field / Method       | Description                                         |
+|----------------------|-----------------------------------------------------|
+| `.table_path`        | `TablePath` -- Table path                           |
+| `.table_id`          | `i64` -- Table ID                                   |
+| `.schema_id`         | `i32` -- Schema ID                                  |
+| `.schema`            | `Schema` -- Table schema                            |
+| `.primary_keys`      | `Vec<String>` -- Primary key column names           |
+| `.partition_keys`    | `Vec<String>` -- Partition key column names         |
+| `.num_buckets`       | `i32` -- Number of buckets                          |
+| `.properties`        | `HashMap<String, String>` -- All table properties   |
+| `.custom_properties` | `HashMap<String, String>` -- Custom properties only |
+| `.comment`           | `Option<String>` -- Table comment                   |
+| `.created_time`      | `i64` -- Creation timestamp                         |
+| `.modified_time`     | `i64` -- Last modification timestamp                |
+
+## `TableBucket`
+
+| Method                                                                                              | Description                                |
+|-----------------------------------------------------------------------------------------------------|--------------------------------------------|
+| `TableBucket::new(table_id: i64, bucket_id: i32) -> Self`                                           | Create a non-partitioned bucket            |
+| `TableBucket::new_with_partition(table_id: i64, partition_id: Option<i64>, bucket_id: i32) -> Self` | Create a partitioned bucket                |
+| `fn table_id(&self) -> i64`                                                                         | Get table ID                               |
+| `fn partition_id(&self) -> Option<i64>`                                                             | Get partition ID (None if non-partitioned) |
+| `fn bucket_id(&self) -> i32`                                                                        | Get bucket ID                              |
+
+## `PartitionSpec`
+
+| Method                                                      | Description                                           |
+|-------------------------------------------------------------|-------------------------------------------------------|
+| `PartitionSpec::new(spec_map: HashMap<&str, &str>) -> Self` | Create from a map of partition column names to values |
+| `fn get_spec_map(&self) -> &HashMap<String, String>`        | Get the partition spec map                            |
+
+## `PartitionInfo`
+
+| Method                                   |  Description       |
+|------------------------------------------|--------------------|
+| `fn get_partition_id(&self) -> i64`      | Get partition ID   |
+| `fn get_partition_name(&self) -> String` | Get partition name |
+
+## `DatabaseDescriptor`
+
+| Method                                                    | Description                          |
+|-----------------------------------------------------------|--------------------------------------|
+| `fn builder() -> DatabaseDescriptorBuilder`               | Create a database descriptor builder |
+| `fn comment(&self) -> Option<&str>`                       | Get database comment                 |
+| `fn custom_properties(&self) -> &HashMap<String, String>` | Get custom properties                |
+
+## `DatabaseDescriptorBuilder`
+
+| Method                                                                                    | Description                   |
+|-------------------------------------------------------------------------------------------|-------------------------------|
+| `fn comment(comment: impl Into<String>) -> Self`                                          | Set database comment          |
+| `fn custom_properties(properties: HashMap<impl Into<String>, impl Into<String>>) -> Self` | Set custom properties         |
+| `fn custom_property(key: impl Into<String>, value: impl Into<String>) -> Self`            | Set a single custom property  |
+| `fn build() -> DatabaseDescriptor`                                                        | Build the database descriptor |
+
+## `DatabaseInfo`
+
+| Method                                                 | Description                     |
+|--------------------------------------------------------|---------------------------------|
+| `fn database_name(&self) -> &str`                      | Get database name               |
+| `fn created_time(&self) -> i64`                        | Get creation timestamp          |
+| `fn modified_time(&self) -> i64`                       | Get last modification timestamp |
+| `fn database_descriptor(&self) -> &DatabaseDescriptor` | Get the database descriptor     |
+
+## `LakeSnapshot`
+
+| Field                   | Description                                       |
+|-------------------------|---------------------------------------------------|
+| `.snapshot_id`          | `i64` -- Snapshot ID                              |
+| `.table_buckets_offset` | `HashMap<TableBucket, i64>` -- All bucket offsets |
+
+## `GenericRow<'a>`
+
+| Method                                                             | Description                                      |
+|--------------------------------------------------------------------|--------------------------------------------------|
+| `GenericRow::new(field_count: usize) -> Self`                      | Create a new row with the given number of fields |
+| `fn set_field(&mut self, pos: usize, value: impl Into<Datum<'a>>)` | Set a field value by position                    |
+| `GenericRow::from_data(data: Vec<impl Into<Datum<'a>>>) -> Self`   | Create a row from existing field data            |
+
+Implements the `InternalRow` trait (see below).
+
+## `InternalRow` trait
+
+| Method                                                                                 | Description                             |
+|----------------------------------------------------------------------------------------|-----------------------------------------|
+| `fn is_null_at(&self, idx: usize) -> Result<bool>`                                     | Check if a field is null                |
+| `fn get_boolean(&self, idx: usize) -> Result<bool>`                                    | Get boolean value                       |
+| `fn get_byte(&self, idx: usize) -> Result<i8>`                                         | Get tinyint value                       |
+| `fn get_short(&self, idx: usize) -> Result<i16>`                                       | Get smallint value                      |
+| `fn get_int(&self, idx: usize) -> Result<i32>`                                         | Get int value                           |
+| `fn get_long(&self, idx: usize) -> Result<i64>`                                        | Get bigint value                        |
+| `fn get_float(&self, idx: usize) -> Result<f32>`                                       | Get float value                         |
+| `fn get_double(&self, idx: usize) -> Result<f64>`                                      | Get double value                        |
+| `fn get_string(&self, idx: usize) -> Result<&str>`                                     | Get string value                        |
+| `fn get_decimal(&self, idx: usize, precision: usize, scale: usize) -> Result<Decimal>` | Get decimal value                       |
+| `fn get_date(&self, idx: usize) -> Result<Date>`                                       | Get date value                          |
+| `fn get_time(&self, idx: usize) -> Result<Time>`                                       | Get time value                          |
+| `fn get_timestamp_ntz(&self, idx: usize, precision: u32) -> Result<TimestampNtz>`      | Get timestamp without timezone value    |
+| `fn get_timestamp_ltz(&self, idx: usize, precision: u32) -> Result<TimestampLtz>`      | Get timestamp with local timezone value |
+| `fn get_bytes(&self, idx: usize) -> Result<&[u8]>`                                     | Get bytes value                         |
+| `fn get_binary(&self, idx: usize, length: usize) -> Result<&[u8]>`                     | Get fixed-length binary value           |
+| `fn get_char(&self, idx: usize, length: usize) -> Result<&str>`                        | Get fixed-length char value             |
+| `fn get_array(&self, idx: usize) -> Result<FlussArray>`                                | Get array value                         |
+| `fn get_map(&self, idx: usize) -> Result<FlussMap>`                                    | Get map value                           |
+
+## `FlussArray`
+
+`FlussArray` is the Rust row representation for `ARRAY` values. You usually obtain it from `InternalRow::get_array()`.
+
+| Method | Description |
+|--------|-------------|
+| `fn size(&self) -> usize` | Number of elements in the array |
+| `fn is_null_at(&self, pos: usize) -> bool` | Check whether an element is null |
+| `fn as_bytes(&self) -> &[u8]` | Get encoded bytes of the array |
+
+Element getters mirror `InternalRow` typed getters and return `Result<T>`. For example, use `get_int()`, `get_long()`, and `get_double()` for primitive elements, and `get_string()`, `get_binary()`, `get_decimal()`, `get_timestamp_ntz()`, `get_timestamp_ltz()`, and `get_array()` for variable-length or nested elements.
+
+## `FlussMap`
+
+`FlussMap` is the Rust row representation for `MAP` values. You usually obtain it from `InternalRow::get_map()`.
+
+| Method | Description |
+|--------|-------------|
+| `fn size(&self) -> usize` | Number of entries in the map |
+| `fn as_bytes(&self) -> &[u8]` | Get encoded bytes of the map |
+| `fn key_type(&self) -> &DataType` | Schema-declared type of keys |
+| `fn value_type(&self) -> &DataType` | Schema-declared type of values |
+| `fn entries(&self) -> Entries<'_>` | Iterator yielding `Result<(Datum, Datum)>` pairs |
+| `fn get(&self, key: &Datum) -> Result<Option<Datum>>` | Linear-scan lookup by key (`O(n)`) |
+| `fn key_array(&self) -> &FlussArray` | Parallel keys array (zero-copy view) |
+| `fn value_array(&self) -> &FlussArray` | Parallel values array (zero-copy view) |
+
+Most user code should prefer `entries()` (iteration) and `get()` (lookup). The `key_array()` / `value_array()` views are for serdes and Arrow-adapter code that needs zero-copy access to the underlying parallel-array layout.
+
+## `FlussMapWriter`
+
+`FlussMapWriter` builds a `FlussMap` for write paths.
+
+| Method | Description |
+|--------|-------------|
+| `fn new(capacity: usize, key_type: &DataType, value_type: &DataType) -> Self` | Create a writer sized for `capacity` entries |
+| `fn write_entry(&mut self, key: Datum, value: Datum) -> Result<()>` | Append a single entry; rejects null keys and type mismatches |
+| `fn extend<I, K, V>(&mut self, entries: I) -> Result<()>` | Append every pair from `entries: IntoIterator<Item = (K, V)>` |
+| `fn complete(self) -> Result<FlussMap>` | Finalize the writer and produce the `FlussMap` |
+
+## `ChangeType`
+
+| Value                      | Short String  | Description                      |
+|----------------------------|---------------|----------------------------------|
+| `ChangeType::AppendOnly`   | `+A`          | Append-only record               |
+| `ChangeType::Insert`       | `+I`          | Inserted row                     |
+| `ChangeType::UpdateBefore` | `-U`          | Previous value of an updated row |
+| `ChangeType::UpdateAfter`  | `+U`          | New value of an updated row      |
+| `ChangeType::Delete`       | `-D`          | Deleted row                      |
+
+| Method                           | Description                         |
+|----------------------------------|-------------------------------------|
+| `fn short_string(&self) -> &str` | Get the short string representation |
+
+## `OffsetSpec`
+
+| Variant                      | Description                                     |
+|------------------------------|-------------------------------------------------|
+| `OffsetSpec::Earliest`       | Start from the earliest available offset        |
+| `OffsetSpec::Latest`         | Start from the latest offset (only new records) |
+| `OffsetSpec::Timestamp(i64)` | Start from a specific timestamp in milliseconds |
+
+## Constants
+
+| Constant                         | Value  | Description                                             |
+|----------------------------------|--------|---------------------------------------------------------|
+| `fluss::client::EARLIEST_OFFSET` | `-2`   | Start reading from the earliest available offset        |
+
+To start reading from the latest offset (only new records), resolve the current offset via `list_offsets` before subscribing:
+
+```rust
+use fluss::rpc::message::OffsetSpec;
+
+let offsets = admin.list_offsets(&table_path, &[0], OffsetSpec::Latest).await?;
+let latest = offsets[&0];
+log_scanner.subscribe(0, latest).await?;
+```
+
+## `DataTypes` factory
+
+| Method                                           | Returns    | Description                        |
+|--------------------------------------------------|------------|------------------------------------|
+| `DataTypes::boolean()`                           | `DataType` | Boolean type                       |
+| `DataTypes::tinyint()`                           | `DataType` | 8-bit signed integer               |
+| `DataTypes::smallint()`                          | `DataType` | 16-bit signed integer              |
+| `DataTypes::int()`                               | `DataType` | 32-bit signed integer              |
+| `DataTypes::bigint()`                            | `DataType` | 64-bit signed integer              |
+| `DataTypes::float()`                             | `DataType` | 32-bit floating point              |
+| `DataTypes::double()`                            | `DataType` | 64-bit floating point              |
+| `DataTypes::string()`                            | `DataType` | Variable-length string             |
+| `DataTypes::bytes()`                             | `DataType` | Variable-length byte array         |
+| `DataTypes::date()`                              | `DataType` | Date (days since epoch)            |
+| `DataTypes::time()`                              | `DataType` | Time (milliseconds since midnight) |
+| `DataTypes::timestamp()`                         | `DataType` | Timestamp without timezone         |
+| `DataTypes::timestamp_ltz()`                     | `DataType` | Timestamp with local timezone      |
+| `DataTypes::decimal(precision: u32, scale: u32)` | `DataType` | Fixed-point decimal                |
+| `DataTypes::char(length: u32)`                   | `DataType` | Fixed-length string                |
+| `DataTypes::binary(length: usize)`               | `DataType` | Fixed-length byte array            |
+| `DataTypes::array(element: DataType)`            | `DataType` | Array of elements                  |
+| `DataTypes::map(key: DataType, value: DataType)` | `DataType` | Map of key-value pairs             |
+| `DataTypes::row(fields: Vec<DataField>)`         | `DataType` | Nested row type                    |
+
+## `DataField`
+
+| Method                                                                                                   | Description         |
+|----------------------------------------------------------------------------------------------------------|---------------------|
+| `DataField::new(name: impl Into<String>, data_type: DataType, description: Option<String>) -> DataField` | Create a data field |
+| `fn name(&self) -> &str`                                                                                 | Get the field name  |
diff --git a/website/docs/apis/rust/data-types.md b/website/docs/apis/rust/data-types.md
new file mode 100644
index 0000000000..5418839184
--- /dev/null
+++ b/website/docs/apis/rust/data-types.md
@@ -0,0 +1,179 @@
+---
+sidebar_position: 3
+---
+# Data Types
+
+| Fluss Type      | Rust Type      | Getter                               | Setter                         |
+|-----------------|----------------|--------------------------------------|--------------------------------|
+| `BOOLEAN`       | `bool`         | `get_boolean()`                      | `set_field(idx, bool)`         |
+| `TINYINT`       | `i8`           | `get_byte()`                         | `set_field(idx, i8)`           |
+| `SMALLINT`      | `i16`          | `get_short()`                        | `set_field(idx, i16)`          |
+| `INT`           | `i32`          | `get_int()`                          | `set_field(idx, i32)`          |
+| `BIGINT`        | `i64`          | `get_long()`                         | `set_field(idx, i64)`          |
+| `FLOAT`         | `f32`          | `get_float()`                        | `set_field(idx, f32)`          |
+| `DOUBLE`        | `f64`          | `get_double()`                       | `set_field(idx, f64)`          |
+| `CHAR`          | `&str`         | `get_char(idx, length)`              | `set_field(idx, &str)`         |
+| `STRING`        | `&str`         | `get_string()`                       | `set_field(idx, &str)`         |
+| `DECIMAL`       | `Decimal`      | `get_decimal(idx, precision, scale)` | `set_field(idx, Decimal)`      |
+| `DATE`          | `Date`         | `get_date()`                         | `set_field(idx, Date)`         |
+| `TIME`          | `Time`         | `get_time()`                         | `set_field(idx, Time)`         |
+| `TIMESTAMP`     | `TimestampNtz` | `get_timestamp_ntz(idx, precision)`  | `set_field(idx, TimestampNtz)` |
+| `TIMESTAMP_LTZ` | `TimestampLtz` | `get_timestamp_ltz(idx, precision)`  | `set_field(idx, TimestampLtz)` |
+| `BYTES`         | `&[u8]`        | `get_bytes()`                        | `set_field(idx, &[u8])`        |
+| `BINARY(n)`     | `&[u8]`        | `get_binary(idx, length)`            | `set_field(idx, &[u8])`        |
+| `ARRAY<T>`      | `FlussArray`   | `get_array()`                        | `set_field(idx, FlussArray)`   |
+| `MAP<K, V>`     | `FlussMap`     | `get_map(idx)`                       | `set_field(idx, FlussMap)`     |
+
+## Constructing Special Types
+
+Primitive types (`bool`, `i8`, `i16`, `i32`, `i64`, `f32`, `f64`, `&str`, `&[u8]`) can be passed directly to `set_field`. The following types require explicit construction:
+
+```rust
+use fluss::row::{Date, Time, TimestampNtz, TimestampLtz, Decimal};
+
+// Date: days since Unix epoch
+let date = Date::new(19738);
+
+// Time: milliseconds since midnight
+let time = Time::new(43200000);
+
+// Timestamp without timezone: milliseconds since epoch
+// DataTypes::timestamp() defaults to precision 6 (microseconds).
+// Use DataTypes::timestamp_with_precision(p) for a different precision (0–9).
+let ts = TimestampNtz::new(1704067200000);
+
+// Timestamp with local timezone: milliseconds since epoch
+// DataTypes::timestamp_ltz() also defaults to precision 6.
+let ts_ltz = TimestampLtz::new(1704067200000);
+
+// Decimal: from an unscaled long value with precision and scale
+let decimal = Decimal::from_unscaled_long(12345, 10, 2)?; // represents 123.45
+```
+
+## Creating Rows from Data
+
+`GenericRow::from_data` accepts a `Vec<Datum>`. Because many types implement `From<&str>`, Rust cannot infer the target type from `.into()` alone, so annotate the vector type explicitly:
+
+```rust
+use fluss::row::{Datum, GenericRow};
+
+let data: Vec<Datum> = vec![1i32.into(), "hello".into(), Datum::Null];
+let row = GenericRow::from_data(data);
+```
+
+## Arrays
+
+Use `DataTypes::array(element_type)` in schema definitions. At runtime, read arrays with `row.get_array(idx)?`.
+
+To construct array values for writes, build a `FlussArray` and wrap it with `Datum::Array`:
+
+```rust
+use fluss::metadata::DataTypes;
+use fluss::row::binary_array::FlussArrayWriter;
+use fluss::row::{Datum, GenericRow};
+
+let mut writer = FlussArrayWriter::new(3, &DataTypes::int());
+writer.write_int(0, 10);
+writer.write_int(1, 20);
+writer.set_null_at(2);
+let arr = writer.complete()?;
+
+let mut row = GenericRow::new(1);
+row.set_field(0, Datum::Array(arr));
+```
+
+`ARRAY` is supported for row values and nested row fields. For key encoding, the Rust client matches the Java client's behavior: the compacted key encoder can encode `ARRAY`, but table-level key constraints are validated by the server, which may reject unsupported key types.
+
+## Maps
+
+Use `DataTypes::map(key_type, value_type)` in schema definitions. At runtime, read maps with `row.get_map(idx)?` — the row knows its schema, so no extra type arguments are needed.
+
+### Writing
+
+Build a `FlussMap` entry-by-entry, then wrap it with `Datum::Map`:
+
+```rust
+use fluss::metadata::DataTypes;
+use fluss::row::binary_map::FlussMapWriter;
+use fluss::row::{Datum, GenericRow};
+
+let mut writer = FlussMapWriter::new(2, &DataTypes::string(), &DataTypes::int());
+writer.write_entry("key1".into(), 100.into())?;
+writer.write_entry("key2".into(), Datum::Null)?;
+let map = writer.complete()?;
+
+let mut row = GenericRow::new(1);
+row.set_field(0, Datum::Map(map));
+```
+
+For bulk writes from any iterator of `(key, value)` pairs (including a `HashMap`), use `extend`:
+
+```rust
+use std::collections::HashMap;
+
+let entries: HashMap<&str, i32> = HashMap::from([("a", 1), ("b", 2)]);
+let mut writer = FlussMapWriter::new(entries.len(), &DataTypes::string(), &DataTypes::int());
+writer.extend(entries)?;
+let map = writer.complete()?;
+```
+
+### Reading
+
+The `entries()` iterator yields `(key, value)` pairs as schema-typed `Datum`s. A null value is yielded as `Datum::Null`, so no separate null check is needed:
+
+```rust
+use fluss::row::InternalRow;
+
+let m = row.get_map(0)?;
+for entry in m.entries() {
+    let (k, v) = entry?;
+    println!("{k:?} => {v:?}");          // Datum's Debug handles null
+}
+```
+
+For point lookups, `get(&key)` does a linear scan and returns `Option<Datum>`:
+
+```rust
+use fluss::row::Datum;
+
+if let Some(v) = m.get(&Datum::from("attr_size"))? {
+    println!("size = {v:?}");
+}
+```
+
+Lookup is `O(n)` — the binary MAP layout has no key index. If you need repeated lookups against the same map, collect the entries once:
+
+```rust
+use std::collections::HashMap;
+
+let snapshot: HashMap<String, Datum<'_>> = m
+    .entries()
+    .map(|e| e.map(|(k, v)| (format!("{k:?}"), v)))
+    .collect::<Result<_, _>>()?;
+```
+
+For raw access to the underlying parallel-array representation (zero-copy, used by serdes / Arrow adapters), `m.key_array()` and `m.value_array()` are still available.
+
+### Constraints
+
+`MAP` keys cannot be null. `MAP` is supported for row values and nested row fields. `MAP` cannot be used as a primary key or bucket key column — the Rust client rejects it at the compacted key encoder, and the Fluss server bans `MAP` (along with `ARRAY` and `ROW`) from key columns.
+
+## Reading Row Data
+
+```rust
+use fluss::row::InternalRow;
+
+for record in scan_records {
+    let row = record.row();
+
+    if row.is_null_at(0)? {
+        // field is null
+    }
+    let id: i32 = row.get_int(0)?;
+    let name: &str = row.get_string(1)?;
+    let score: f32 = row.get_float(2)?;
+    let date: Date = row.get_date(3)?;
+    let ts: TimestampNtz = row.get_timestamp_ntz(4, 6)?;
+    let decimal: Decimal = row.get_decimal(5, 10, 2)?;
+}
+```
diff --git a/website/docs/apis/rust/error-handling.md b/website/docs/apis/rust/error-handling.md
new file mode 100644
index 0000000000..4966428997
--- /dev/null
+++ b/website/docs/apis/rust/error-handling.md
@@ -0,0 +1,241 @@
+---
+sidebar_position: 4
+---
+# Error Handling
+
+The Fluss Rust client uses a unified `Error` type and a `Result<T>` alias for all fallible operations.
+
+## Basic Usage
+
+```rust
+use fluss::error::{Error, Result};
+
+// All operations return Result<T>
+let conn = FlussConnection::new(config).await?;
+let admin = conn.get_admin()?;
+let table = conn.get_table(&table_path).await?;
+```
+
+Use the `?` operator to propagate errors, or `match` on specific variants for fine-grained handling.
+
+## Matching Error Variants
+
+```rust
+use fluss::error::Error;
+
+match result {
+    Ok(val) => {
+        // handle success
+    }
+    Err(Error::RpcError { message, .. }) => {
+        eprintln!("RPC failure: {}", message);
+    }
+    Err(Error::UnsupportedOperation { message }) => {
+        eprintln!("Unsupported: {}", message);
+    }
+    Err(Error::FlussAPIError { api_error }) => {
+        eprintln!("Server error: {}", api_error);
+    }
+    Err(e) => {
+        eprintln!("Unexpected error: {}", e);
+    }
+}
+```
+
+## Error Variants
+
+| Variant                        | Description                                                  |
+|--------------------------------|--------------------------------------------------------------|
+| `UnexpectedError`              | General unexpected errors with a message and optional source |
+| `IoUnexpectedError`            | I/O errors (network, file system)                            |
+| `RemoteStorageUnexpectedError` | Remote storage errors (OpenDAL backend failures)             |
+| `RpcError`                     | RPC communication failures (connection refused, timeout)     |
+| `RowConvertError`              | Row conversion failures (type mismatch, invalid data)        |
+| `ArrowError`                   | Arrow data handling errors (schema mismatch, encoding)       |
+| `IllegalArgument`              | Invalid arguments passed to an API method                    |
+| `UnsupportedOperation`         | Operation not supported on the table type                    |
+| `FlussAPIError`                | Server-side API errors returned by the Fluss cluster         |
+
+Server-side errors are represented as `FlussAPIError` with a specific error code. Use the `api_error()` helper to match them ergonomically:
+
+```rust
+use fluss::error::FlussError;
+
+match result {
+    Err(ref e) if e.api_error() == Some(FlussError::InvalidTableException) => {
+        eprintln!("Invalid table: {}", e);
+    }
+    Err(ref e) if e.api_error() == Some(FlussError::PartitionNotExists) => {
+        eprintln!("Partition does not exist: {}", e);
+    }
+    Err(ref e) if e.api_error() == Some(FlussError::LeaderNotAvailableException) => {
+        eprintln!("Leader not available: {}", e);
+    }
+    Err(ref e) if e.api_error() == Some(FlussError::AuthenticateException) => {
+        eprintln!("Authentication failed: {}", e);
+    }
+    _ => {}
+}
+```
+
+## Retry Logic
+
+Some errors are transient: the server may be temporarily unavailable, mid-election, or under load. Use `is_retriable()` to decide whether to retry an operation instead of treating the error as permanent.
+
+`Error::is_retriable()` is available directly on any `Error` value. `RpcError` is always retriable; `FlussAPIError` delegates to the server error code; all other variants return `false`.
+
+```rust
+use fluss::error::Error;
+
+match writer.append(&row) {
+    Ok(_) => {}
+    Err(ref e) if e.is_retriable() => {
+        // Transient failure — safe to retry
+    }
+    Err(e) => {
+        // Permanent failure — log and abort
+        eprintln!("Fatal error: {}", e);
+    }
+}
+```
+
+### Retriable Variants
+
+| Variant / Error                              | Code | Reason                                    |
+|----------------------------------------------|------|-------------------------------------------|
+| `Error::RpcError`                            | —    | Network-level failure, always retriable   |
+| `FlussError::NetworkException`               | 1    | Server disconnected                       |
+| `FlussError::CorruptMessage`                 | 3    | CRC or size error                         |
+| `FlussError::SchemaNotExist`                 | 9    | Schema may not exist                      |
+| `FlussError::LogStorageException`            | 10   | Transient log storage error               |
+| `FlussError::KvStorageException`             | 11   | Transient KV storage error                |
+| `FlussError::NotLeaderOrFollower`            | 12   | Leader election in progress               |
+| `FlussError::CorruptRecordException`         | 14   | Corrupt record                            |
+| `FlussError::UnknownTableOrBucketException`  | 21   | Metadata not yet available                |
+| `FlussError::RequestTimeOut`                 | 25   | Request timed out                         |
+| `FlussError::StorageException`               | 26   | Transient storage error                   |
+| `FlussError::NotEnoughReplicasAfterAppendException` | 28 | Wrote to server but with low ISR size |
+| `FlussError::NotEnoughReplicasException`     | 29   | Low ISR size at write time                |
+| `FlussError::LeaderNotAvailableException`    | 44   | No leader available for partition         |
+
+All other `Error` variants (e.g. `RowConvertError`, `IllegalArgument`, `UnsupportedOperation`) always return `false` from `is_retriable()`.
+
+## Common Error Scenarios
+
+### Connection Refused
+
+The Fluss cluster is not running or the address is incorrect.
+
+```rust
+let result = FlussConnection::new(config).await;
+match result {
+    Err(Error::RpcError { message, .. }) => {
+        eprintln!("Cannot connect to cluster: {}", message);
+    }
+    _ => {}
+}
+```
+
+### Table Not Found
+
+The table does not exist or has been dropped.
+
+```rust
+use fluss::error::{Error, FlussError};
+
+// Admin operations return FlussError::TableNotExist (code 7)
+let result = admin.drop_table(&table_path, false).await;
+match result {
+    Err(ref e) if e.api_error() == Some(FlussError::TableNotExist) => {
+        eprintln!("Table not found: {}", e);
+    }
+    _ => {}
+}
+
+// conn.get_table() wraps the error differently; match on FlussAPIError directly
+let result = conn.get_table(&table_path).await;
+match result {
+    Err(Error::FlussAPIError { ref api_error }) => {
+        eprintln!("Server error (code {}): {}", api_error.code, api_error.message);
+    }
+    _ => {}
+}
+```
+
+### Partition Not Found
+
+The partition does not exist on a partitioned table.
+
+```rust
+use fluss::error::FlussError;
+
+let result = admin.drop_partition(&table_path, &spec, false).await;
+match result {
+    Err(ref e) if e.api_error() == Some(FlussError::PartitionNotExists) => {
+        eprintln!("Partition does not exist: {}", e);
+    }
+    _ => {}
+}
+```
+
+### Authentication Failed
+
+SASL credentials are incorrect or the user does not exist.
+
+```rust
+use fluss::error::{Error, FlussError};
+
+let result = FlussConnection::new(config).await;
+match result {
+    Err(ref e) if e.api_error() == Some(FlussError::AuthenticateException) => {
+        eprintln!("Authentication failed: {}", e);
+    }
+    _ => {}
+}
+```
+
+### Schema Mismatch
+
+Row data does not match the expected table schema.
+
+```rust
+let result = writer.append(&row);
+match result {
+    Err(Error::RowConvertError { .. }) => {
+        eprintln!("Row does not match table schema");
+    }
+    _ => {}
+}
+```
+
+## Using `Result<T>` in Application Code
+
+The `fluss::error::Result<T>` type alias makes it easy to use Fluss errors with the `?` operator in your application functions:
+
+```rust
+use fluss::error::Result;
+
+async fn my_pipeline() -> Result<()> {
+    let conn = FlussConnection::new(config).await?;
+    let admin = conn.get_admin()?;
+    let table = conn.get_table(&table_path).await?;
+    let writer = table.new_append()?.create_writer()?;
+    writer.append(&row)?;
+    writer.flush().await?;
+    Ok(())
+}
+```
+
+For applications that use other error types alongside Fluss errors, you can convert with standard `From` / `Into` traits or use crates like `anyhow`:
+
+```rust
+use anyhow::Result;
+
+#[tokio::main]
+async fn main() -> Result<()> {
+    let conn = FlussConnection::new(config).await?;
+    // fluss::error::Error implements std::error::Error,
+    // so it converts into anyhow::Error automatically
+    Ok(())
+}
+```
diff --git a/website/docs/apis/rust/example/_category_.json b/website/docs/apis/rust/example/_category_.json
new file mode 100644
index 0000000000..4d81ec12ae
--- /dev/null
+++ b/website/docs/apis/rust/example/_category_.json
@@ -0,0 +1,4 @@
+{
+  "label": "Examples",
+  "position": 5
+}
diff --git a/website/docs/apis/rust/example/admin-operations.md b/website/docs/apis/rust/example/admin-operations.md
new file mode 100644
index 0000000000..39752754f1
--- /dev/null
+++ b/website/docs/apis/rust/example/admin-operations.md
@@ -0,0 +1,122 @@
+---
+sidebar_position: 3
+---
+# Admin Operations
+
+## Get Admin Interface
+
+```rust
+let admin = conn.get_admin()?;
+```
+
+## Database Operations
+
+```rust
+// Create database
+admin.create_database("my_database", None, true).await?;
+
+// List all databases
+let databases = admin.list_databases().await?;
+println!("Databases: {:?}", databases);
+
+// Check if database exists
+let exists = admin.database_exists("my_database").await?;
+
+// Get database information
+let db_info = admin.get_database_info("my_database").await?;
+
+// Drop database
+admin.drop_database("my_database", true, false).await?;
+```
+
+## Table Operations
+
+```rust
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .column("amount", DataTypes::bigint())
+            .build()?,
+    )
+    .build()?;
+
+let table_path = TablePath::new("my_database", "my_table");
+
+// Create table
+admin.create_table(&table_path, &table_descriptor, true).await?;
+
+// Get table information
+let table_info = admin.get_table_info(&table_path).await?;
+println!("Table: {}", table_info);
+
+// List tables in database
+let tables = admin.list_tables("my_database").await?;
+
+// Check if table exists
+let exists = admin.table_exists(&table_path).await?;
+
+// Drop table
+admin.drop_table(&table_path, true).await?;
+```
+
+## Partition Operations
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+// List all partitions
+let partitions = admin.list_partition_infos(&table_path).await?;
+
+// List partitions matching a spec
+let mut filter = HashMap::new();
+filter.insert("year", "2024");
+let spec = PartitionSpec::new(filter);
+let partitions = admin.list_partition_infos_with_spec(&table_path, Some(&spec)).await?;
+
+// Create partition
+admin.create_partition(&table_path, &spec, true).await?;
+
+// Drop partition
+admin.drop_partition(&table_path, &spec, true).await?;
+```
+
+## Offset Operations
+
+```rust
+use fluss::rpc::message::OffsetSpec;
+
+let bucket_ids = vec![0, 1, 2];
+
+// Get earliest offsets
+let earliest = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Earliest).await?;
+
+// Get latest offsets
+let latest = admin.list_offsets(&table_path, &bucket_ids, OffsetSpec::Latest).await?;
+
+// Get offsets for a specific timestamp
+let timestamp_ms = 1704067200000; // 2024-01-01 00:00:00 UTC
+let offsets = admin.list_offsets(
+    &table_path, &bucket_ids, OffsetSpec::Timestamp(timestamp_ms),
+).await?;
+
+// Get offsets for a specific partition
+let partition_offsets = admin.list_partition_offsets(
+    &table_path, "partition_name", &bucket_ids, OffsetSpec::Latest,
+).await?;
+```
+
+## Lake Snapshot
+
+:::note
+Lake snapshots require [lake integration](https://fluss.apache.org/docs/maintenance/tiered-storage/overview/) (e.g. Paimon or Iceberg) to be enabled on the server. Without it, `get_latest_lake_snapshot` will return an error.
+:::
+
+```rust
+let snapshot = admin.get_latest_lake_snapshot(&table_path).await?;
+println!("Snapshot ID: {}", snapshot.snapshot_id);
+```
diff --git a/website/docs/apis/rust/example/configuration.md b/website/docs/apis/rust/example/configuration.md
new file mode 100644
index 0000000000..eba38d85f2
--- /dev/null
+++ b/website/docs/apis/rust/example/configuration.md
@@ -0,0 +1,35 @@
+---
+sidebar_position: 2
+---
+# Configuration
+
+## Connection Setup
+
+```rust
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+
+let mut config = Config::default();
+config.bootstrap_servers = "127.0.0.1:9123".to_string();
+
+let conn = FlussConnection::new(config).await?;
+```
+
+## Connection Configurations
+
+See the [`Config`](../api-reference.md#config) section in the API Reference for the full list of configuration options, types, and defaults.
+
+## SASL Authentication
+
+To connect to a Fluss cluster with SASL/PLAIN authentication enabled:
+
+```rust
+let mut config = Config::default();
+config.bootstrap_servers = "127.0.0.1:9123".to_string();
+config.security_protocol = "sasl".to_string();
+config.security_sasl_mechanism = "PLAIN".to_string();
+config.security_sasl_username = "admin".to_string();
+config.security_sasl_password = "admin-secret".to_string();
+
+let conn = FlussConnection::new(config).await?;
+```
diff --git a/website/docs/apis/rust/example/index.md b/website/docs/apis/rust/example/index.md
new file mode 100644
index 0000000000..f1d5a6882d
--- /dev/null
+++ b/website/docs/apis/rust/example/index.md
@@ -0,0 +1,56 @@
+---
+sidebar_position: 1
+---
+# Example
+
+A minimal working example: connect to Fluss, create a table, write data, and read it back.
+
+```rust
+use fluss::client::FlussConnection;
+use fluss::config::Config;
+use fluss::error::Result;
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+use fluss::row::{GenericRow, InternalRow};
+use std::time::Duration;
+
+#[tokio::main]
+async fn main() -> Result<()> {
+    // Connect
+    let mut config = Config::default();
+    config.bootstrap_servers = "127.0.0.1:9123".to_string();
+    let conn = FlussConnection::new(config).await?;
+    let admin = conn.get_admin()?;
+
+    // Create a log table
+    let table_path = TablePath::new("fluss", "quickstart_rust");
+    let descriptor = TableDescriptor::builder()
+        .schema(
+            Schema::builder()
+                .column("id", DataTypes::int())
+                .column("name", DataTypes::string())
+                .build()?,
+        )
+        .build()?;
+    admin.create_table(&table_path, &descriptor, true).await?;
+
+    // Write
+    let table = conn.get_table(&table_path).await?;
+    let writer = table.new_append()?.create_writer()?;
+    let mut row = GenericRow::new(2);
+    row.set_field(0, 1);
+    row.set_field(1, "hello");
+    writer.append(&row)?;
+    writer.flush().await?;
+
+    // Read
+    let scanner = table.new_scan().create_log_scanner()?;
+    scanner.subscribe(0, 0).await?;
+    let records = scanner.poll(Duration::from_secs(5)).await?;
+    for record in records {
+        let row = record.row();
+        println!("id={}, name={}", row.get_int(0)?, row.get_string(1)?);
+    }
+
+    Ok(())
+}
+```
diff --git a/website/docs/apis/rust/example/log-tables.md b/website/docs/apis/rust/example/log-tables.md
new file mode 100644
index 0000000000..e77c8c6c43
--- /dev/null
+++ b/website/docs/apis/rust/example/log-tables.md
@@ -0,0 +1,172 @@
+---
+sidebar_position: 4
+---
+# Log Tables
+
+Log tables are append-only tables without primary keys, suitable for event streaming.
+
+## Creating a Log Table
+
+```rust
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("event_id", DataTypes::int())
+            .column("event_type", DataTypes::string())
+            .column("timestamp", DataTypes::bigint())
+            .build()?,
+    )
+    .build()?;
+
+let table_path = TablePath::new("fluss", "events");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+## Writing to Log Tables
+
+```rust
+use fluss::row::{GenericRow, InternalRow};
+
+let table = conn.get_table(&table_path).await?;
+let append_writer = table.new_append()?.create_writer()?;
+
+let mut row = GenericRow::new(3);
+row.set_field(0, 1);                    // event_id
+row.set_field(1, "user_login");         // event_type
+row.set_field(2, 1704067200000i64);     // timestamp
+
+append_writer.append(&row)?;
+append_writer.flush().await?;
+```
+
+Write operations use a **fire-and-forget** pattern for efficient batching. Each call queues the write and returns a `WriteResultFuture` immediately. Call `flush()` to ensure all queued writes are sent to the server.
+
+For per-record acknowledgment:
+
+```rust
+append_writer.append(&row)?.await?;
+```
+
+## Reading from Log Tables
+
+```rust
+use std::time::Duration;
+
+let table = conn.get_table(&table_path).await?;
+let log_scanner = table.new_scan().create_log_scanner()?;
+
+// Subscribe to bucket 0 starting from offset 0
+log_scanner.subscribe(0, 0).await?;
+
+// Poll for records
+let records = log_scanner.poll(Duration::from_secs(10)).await?;
+
+// Per-bucket access
+for (bucket, bucket_records) in records.records_by_buckets() {
+    println!("Bucket {}: {} records", bucket.bucket_id(), bucket_records.len());
+    for record in bucket_records {
+        let row = record.row();
+        println!(
+            "  event_id={}, event_type={} @ offset={}",
+            row.get_int(0)?,
+            row.get_string(1)?,
+            record.offset()
+        );
+    }
+}
+
+// Or flat iteration (consumes ScanRecords)
+for record in records {
+    let row = record.row();
+    println!(
+        "event_id={}, event_type={}, timestamp={} @ offset={}",
+        row.get_int(0)?,
+        row.get_string(1)?,
+        row.get_long(2)?,
+        record.offset()
+    );
+}
+```
+
+**Subscribe from special offsets:**
+
+```rust
+use fluss::client::EARLIEST_OFFSET;
+
+log_scanner.subscribe(0, EARLIEST_OFFSET).await?;  // from earliest
+log_scanner.subscribe(0, 42).await?;                // from specific offset
+```
+
+**Subscribe from latest offset (only new records):**
+
+To start reading only new records, first resolve the current latest offset via `list_offsets`, then subscribe at that offset:
+
+```rust
+use fluss::rpc::message::OffsetSpec;
+
+let admin = conn.get_admin()?;
+let offsets = admin.list_offsets(&table_path, &[0], OffsetSpec::Latest).await?;
+let latest = offsets[&0];
+log_scanner.subscribe(0, latest).await?;
+```
+
+**Subscribe to all buckets:**
+
+```rust
+let num_buckets = table.get_table_info().get_num_buckets();
+for bucket_id in 0..num_buckets {
+    log_scanner.subscribe(bucket_id, 0).await?;
+}
+```
+
+**Subscribe to multiple buckets at once:**
+
+```rust
+use std::collections::HashMap;
+
+let mut bucket_offsets = HashMap::new();
+bucket_offsets.insert(0, 0i64);
+bucket_offsets.insert(1, 100i64);
+log_scanner.subscribe_buckets(&bucket_offsets).await?;
+```
+
+**Unsubscribe from a bucket:**
+
+```rust
+// Non-partitioned tables
+log_scanner.unsubscribe(bucket_id).await?;
+
+// Partitioned tables
+log_scanner.unsubscribe_partition(partition_id, bucket_id).await?;
+```
+
+## Column Projection
+
+```rust
+// Project by column index
+let scanner = table.new_scan().project(&[0, 2])?.create_log_scanner()?;
+
+// Project by column name
+let scanner = table.new_scan()
+    .project_by_name(&["event_id", "timestamp"])?
+    .create_log_scanner()?;
+```
+
+## Limit Scan
+
+For a bounded read of up to `n` rows from a single bucket, use a batch scanner
+instead of subscribing. It issues one request; poll it with `next_batch` until
+it returns `None`.
+
+```rust
+let bucket = TableBucket::new(table.get_table_info().table_id, 0);
+let mut scanner = table.new_scan().limit(10)?.create_bucket_batch_scanner(bucket)?;
+
+while let Some(batch) = scanner.next_batch().await? {
+    println!("rows: {}", batch.batch().num_rows());
+}
+```
+
+Limit applies per bucket; scan each bucket to cover a multi-bucket table.
diff --git a/website/docs/apis/rust/example/partitioned-tables.md b/website/docs/apis/rust/example/partitioned-tables.md
new file mode 100644
index 0000000000..e583e06ead
--- /dev/null
+++ b/website/docs/apis/rust/example/partitioned-tables.md
@@ -0,0 +1,219 @@
+---
+sidebar_position: 6
+---
+# Partitioned Tables
+
+Partitioned tables distribute data across partitions based on partition column values, enabling efficient data organization and querying. Both log tables and primary key tables support partitioning.
+
+## Partitioned Log Tables
+
+### Creating a Partitioned Log Table
+
+```rust
+use fluss::metadata::{DataTypes, LogFormat, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("event_id", DataTypes::int())
+            .column("event_type", DataTypes::string())
+            .column("dt", DataTypes::string())
+            .column("region", DataTypes::string())
+            .build()?,
+    )
+    .partitioned_by(vec!["dt", "region"])
+    .log_format(LogFormat::ARROW)
+    .build()?;
+
+let table_path = TablePath::new("fluss", "partitioned_events");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+### Writing to Partitioned Log Tables
+
+**Partitions must exist before writing data, otherwise the client will by default retry indefinitely.** Include partition column values in each row; the client routes records to the correct partition automatically.
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+let table = conn.get_table(&table_path).await?;
+
+// Create the partition before writing
+let mut partition_values = HashMap::new();
+partition_values.insert("dt", "2024-01-15");
+partition_values.insert("region", "US");
+admin.create_partition(&table_path, &PartitionSpec::new(partition_values), true).await?;
+
+let append_writer = table.new_append()?.create_writer()?;
+
+let mut row = GenericRow::new(4);
+row.set_field(0, 1);              // event_id
+row.set_field(1, "user_login");   // event_type
+row.set_field(2, "2024-01-15");   // dt (partition column)
+row.set_field(3, "US");           // region (partition column)
+
+append_writer.append(&row)?;
+append_writer.flush().await?;
+```
+
+### Reading from Partitioned Log Tables
+
+For partitioned tables, use partition-aware subscribe methods.
+
+```rust
+use std::time::Duration;
+
+let table = conn.get_table(&table_path).await?;
+let admin = conn.get_admin()?;
+let partitions = admin.list_partition_infos(&table_path).await?;
+
+let log_scanner = table.new_scan().create_log_scanner()?;
+
+// Subscribe to each partition's buckets
+for partition_info in &partitions {
+    let partition_id = partition_info.get_partition_id();
+    let num_buckets = table.get_table_info().get_num_buckets();
+    for bucket_id in 0..num_buckets {
+        log_scanner.subscribe_partition(partition_id, bucket_id, 0).await?;
+    }
+}
+
+let records = log_scanner.poll(Duration::from_secs(10)).await?;
+for record in records {
+    println!("Record: {:?}", record.row());
+}
+```
+
+Subscribe to multiple partition-buckets at once:
+
+```rust
+use std::collections::HashMap;
+
+let mut partition_bucket_offsets = HashMap::new();
+partition_bucket_offsets.insert((partition_id, 0), 0i64);
+partition_bucket_offsets.insert((partition_id, 1), 0i64);
+log_scanner.subscribe_partition_buckets(&partition_bucket_offsets).await?;
+```
+
+### Managing Partitions
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+// Create a partition
+let mut partition_values = HashMap::new();
+partition_values.insert("dt", "2024-01-15");
+partition_values.insert("region", "EMEA");
+let spec = PartitionSpec::new(partition_values);
+admin.create_partition(&table_path, &spec, true).await?;
+
+// List all partitions
+let partitions = admin.list_partition_infos(&table_path).await?;
+for partition in &partitions {
+    println!(
+        "Partition: id={}, name={}",
+        partition.get_partition_id(),
+        partition.get_partition_name()
+    );
+}
+
+// List with filter
+let mut partial_values = HashMap::new();
+partial_values.insert("dt", "2024-01-15");
+let partial_spec = PartitionSpec::new(partial_values);
+let filtered = admin.list_partition_infos_with_spec(
+    &table_path, Some(&partial_spec),
+).await?;
+
+// Drop a partition
+admin.drop_partition(&table_path, &spec, true).await?;
+```
+
+## Partitioned Primary Key Tables
+
+Partitioned KV tables combine partitioning with primary key operations. Partition columns must be part of the primary key.
+
+### Creating a Partitioned Primary Key Table
+
+```rust
+use fluss::metadata::{DataTypes, KvFormat, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("user_id", DataTypes::int())
+            .column("region", DataTypes::string())
+            .column("zone", DataTypes::bigint())
+            .column("score", DataTypes::bigint())
+            .primary_key(vec!["user_id", "region", "zone"])
+            .build()?,
+    )
+    .partitioned_by(vec!["region", "zone"])
+    .kv_format(KvFormat::COMPACTED)
+    .build()?;
+
+let table_path = TablePath::new("fluss", "partitioned_users");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+### Writing to Partitioned Primary Key Tables
+
+**Partitions must exist before upserting data, otherwise the client will by default retry indefinitely.**
+
+```rust
+use fluss::metadata::PartitionSpec;
+use std::collections::HashMap;
+
+let table = conn.get_table(&table_path).await?;
+
+// Create partitions first
+for (region, zone) in [("APAC", "1"), ("EMEA", "2"), ("US", "3")] {
+    let mut values = HashMap::new();
+    values.insert("region", region);
+    values.insert("zone", zone);
+    admin.create_partition(&table_path, &PartitionSpec::new(values), true).await?;
+}
+
+let table_upsert = table.new_upsert()?;
+let upsert_writer = table_upsert.create_writer()?;
+
+for (user_id, region, zone, score) in [
+    (1001, "APAC", 1i64, 1234i64),
+    (1002, "EMEA", 2, 2234),
+    (1003, "US", 3, 3234),
+] {
+    let mut row = GenericRow::new(4);
+    row.set_field(0, user_id);
+    row.set_field(1, region);
+    row.set_field(2, zone);
+    row.set_field(3, score);
+    upsert_writer.upsert(&row)?;
+}
+upsert_writer.flush().await?;
+```
+
+### Looking Up Records in Partitioned Tables
+
+Lookup requires all primary key columns including partition columns.
+
+```rust
+let mut lookuper = table.new_lookup()?.create_lookuper()?;
+
+let mut key = GenericRow::new(3);
+key.set_field(0, 1001);    // user_id
+key.set_field(1, "APAC");  // region (partition column)
+key.set_field(2, 1i64);    // zone (partition column)
+
+let result = lookuper.lookup(&key).await?;
+if let Some(row) = result.get_single_row()? {
+    println!("Found: score={}", row.get_long(3)?);
+}
+```
+
+### Prefix Lookup on Partitioned Tables
+
+See [Prefix Lookup — Partitioned Table](./prefix-lookup.md#partitioned-table) for details and a full runnable example.
+
+> **Note:** Scanning partitioned primary key tables is not supported. Use lookup operations instead.
diff --git a/website/docs/apis/rust/example/prefix-lookup.md b/website/docs/apis/rust/example/prefix-lookup.md
new file mode 100644
index 0000000000..619ba8341d
--- /dev/null
+++ b/website/docs/apis/rust/example/prefix-lookup.md
@@ -0,0 +1,110 @@
+---
+sidebar_position: 7
+---
+# Prefix Lookup
+
+Prefix lookup returns all rows whose primary key starts with a given prefix. It's enabled by choosing a **bucket key that is a strict prefix of the primary key** — rows sharing the same bucket-key prefix land in the same bucket, so one bucket lookup returns them all.
+
+## Table Requirements
+
+- The table must have a primary key.
+- The bucket key must be a strict prefix of the primary key (on partitioned tables, of the *non-partition* portion of the primary key).
+- The bucket key cannot equal the full primary key — that is a normal primary-key lookup; use [`Lookuper`](./primary-key-tables.md#looking-up-records) instead.
+- The `lookup_by` columns passed to the client must equal `partition_keys ++ bucket_key` (in that order, if partitioned).
+
+`create_lookuper()` validates these rules and returns `Err(Error::IllegalArgument { .. })` on mismatch, with a message describing the violation.
+
+## Non-Partitioned Table
+
+Pick a schema where the bucket key is a prefix of the primary key:
+
+```rust
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("user_id", DataTypes::int())
+            .column("session_id", DataTypes::string())
+            .column("event_seq", DataTypes::bigint())
+            .column("event_data", DataTypes::string())
+            .primary_key(vec!["user_id", "session_id", "event_seq"])
+            .build()?,
+    )
+    // Bucket key (user_id, session_id) is a prefix of the primary key.
+    .distributed_by(Some(3), vec!["user_id".to_string(), "session_id".to_string()])
+    .build()?;
+```
+
+Create the lookuper with `lookup_by(columns)` naming the prefix columns, then call `lookup(prefix_row)`:
+
+```rust
+use fluss::row::{GenericRow, InternalRow};
+
+let mut prefix_lookuper = table
+    .new_lookup()?
+    .lookup_by(vec!["user_id".to_string(), "session_id".to_string()])
+    .create_lookuper()?;
+
+let mut prefix = GenericRow::new(2);
+prefix.set_field(0, 1);                // user_id
+prefix.set_field(1, "sess-a");         // session_id
+
+let result = prefix_lookuper.lookup(&prefix).await?;
+for row in result.get_rows()? {
+    println!(
+        "seq={}, data={}",
+        row.get_long(2)?,
+        row.get_string(3)?,
+    );
+}
+```
+
+Unlike primary-key lookup (which uses `get_single_row()`), prefix lookup returns zero or more rows via `get_rows()`.
+
+## Partitioned Table
+
+On a partitioned table, the partition columns are stripped from the primary key before the bucket-prefix rule is evaluated. The lookup key, though, must still carry the partition values so the client can route the request to the right partition — so the `lookup_by` columns are `partition_keys ++ bucket_key`.
+
+```rust
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("region", DataTypes::string())
+            .column("user_id", DataTypes::int())
+            .column("session_id", DataTypes::string())
+            .column("event_seq", DataTypes::bigint())
+            .column("event_data", DataTypes::string())
+            .primary_key(vec!["region", "user_id", "session_id", "event_seq"])
+            .build()?,
+    )
+    .partitioned_by(vec!["region"])
+    // Bucket key (user_id, session_id) is a prefix of the pk minus partition cols.
+    .distributed_by(Some(3), vec!["user_id".to_string(), "session_id".to_string()])
+    .build()?;
+```
+
+```rust
+let mut prefix_lookuper = table
+    .new_lookup()?
+    .lookup_by(vec![
+        "region".to_string(),
+        "user_id".to_string(),
+        "session_id".to_string(),
+    ])
+    .create_lookuper()?;
+
+let mut prefix = GenericRow::new(3);
+prefix.set_field(0, "US");             // region (partition column)
+prefix.set_field(1, 1);                // user_id
+prefix.set_field(2, "sess-a");         // session_id
+
+let result = prefix_lookuper.lookup(&prefix).await?;
+for row in result.get_rows()? {
+    println!(
+        "seq={}, data={}",
+        row.get_long(3)?,
+        row.get_string(4)?,
+    );
+}
+```
diff --git a/website/docs/apis/rust/example/primary-key-tables.md b/website/docs/apis/rust/example/primary-key-tables.md
new file mode 100644
index 0000000000..01836e29e4
--- /dev/null
+++ b/website/docs/apis/rust/example/primary-key-tables.md
@@ -0,0 +1,141 @@
+---
+sidebar_position: 5
+---
+# Primary Key Tables
+
+Primary key tables (KV tables) support upsert, delete, and lookup operations.
+
+## Creating a Primary Key Table
+
+```rust
+use fluss::metadata::{DataTypes, Schema, TableDescriptor, TablePath};
+
+let table_descriptor = TableDescriptor::builder()
+    .schema(
+        Schema::builder()
+            .column("id", DataTypes::int())
+            .column("name", DataTypes::string())
+            .column("age", DataTypes::bigint())
+            .primary_key(vec!["id"])
+            .build()?,
+    )
+    .build()?;
+
+let table_path = TablePath::new("fluss", "users");
+admin.create_table(&table_path, &table_descriptor, true).await?;
+```
+
+## Upserting Records
+
+```rust
+use fluss::row::{GenericRow, InternalRow};
+
+let table = conn.get_table(&table_path).await?;
+let table_upsert = table.new_upsert()?;
+let upsert_writer = table_upsert.create_writer()?;
+
+for (id, name, age) in [(1, "Alice", 25i64), (2, "Bob", 30), (3, "Charlie", 35)] {
+    let mut row = GenericRow::new(3);
+    row.set_field(0, id);
+    row.set_field(1, name);
+    row.set_field(2, age);
+    upsert_writer.upsert(&row)?;
+}
+upsert_writer.flush().await?;
+```
+
+## Updating Records
+
+Upsert with the same primary key to update an existing record.
+
+```rust
+let mut row = GenericRow::new(3);
+row.set_field(0, 1);        // id (primary key)
+row.set_field(1, "Alice");
+row.set_field(2, 26i64);    // updated age
+
+upsert_writer.upsert(&row)?;
+upsert_writer.flush().await?;
+```
+
+## Deleting Records
+
+```rust
+// Only the primary key field needs to be set
+let mut row = GenericRow::new(3);
+row.set_field(0, 2);  // id of record to delete
+
+upsert_writer.delete(&row)?;
+upsert_writer.flush().await?;
+```
+
+## Partial Updates
+
+Update only specific columns while preserving others.
+
+```rust
+// By column indices
+let partial_upsert = table_upsert.partial_update(Some(vec![0, 2]))?;
+let partial_writer = partial_upsert.create_writer()?;
+
+let mut row = GenericRow::new(3);
+row.set_field(0, 1);       // id (primary key, required)
+row.set_field(2, 27i64);   // age (will be updated)
+// name will remain unchanged
+
+partial_writer.upsert(&row)?;
+partial_writer.flush().await?;
+
+// By column names
+let partial_upsert = table_upsert.partial_update_with_column_names(&["id", "age"])?;
+let partial_writer = partial_upsert.create_writer()?;
+```
+
+## Looking Up Records
+
+```rust
+let mut lookuper = table.new_lookup()?.create_lookuper()?;
+
+let mut key = GenericRow::new(1);
+key.set_field(0, 1);  // id to look up
+
+let result = lookuper.lookup(&key).await?;
+
+if let Some(row) = result.get_single_row()? {
+    println!(
+        "Found: id={}, name={}, age={}",
+        row.get_int(0)?,
+        row.get_string(1)?,
+        row.get_long(2)?
+    );
+} else {
+    println!("Record not found");
+}
+```
+## Looking Up Records as Arrow RecordBatch
+
+Use `to_record_batch()` to get lookup results in Arrow format, for example when integrating with DataFusion.
+```rust
+let result = lookuper.lookup(&key).await?;
+let batch = result.to_record_batch()?;
+println!("Rows: {}", batch.num_rows());
+```
+
+## Prefix Lookup
+
+To fetch all rows sharing a common primary-key prefix (by choosing a bucket key that's a strict prefix of the primary key), see [Prefix Lookup](./prefix-lookup.md).
+
+## Limit Scan
+
+To read up to `n` rows of a bucket's current state without supplying keys, use a batch scanner. The server returns the deduplicated current rows as Arrow batches, which is convenient for previews or DataFusion sources.
+
+```rust
+let bucket = TableBucket::new(table.get_table_info().table_id, 0);
+let mut scanner = table.new_scan().limit(10)?.create_bucket_batch_scanner(bucket)?;
+
+while let Some(batch) = scanner.next_batch().await? {
+    println!("rows: {}", batch.batch().num_rows());
+}
+```
+
+The limit applies per bucket; to cover a multi-bucket table, scan each bucket in turn.
diff --git a/website/docs/apis/rust/installation.md b/website/docs/apis/rust/installation.md
new file mode 100644
index 0000000000..540d4a10a0
--- /dev/null
+++ b/website/docs/apis/rust/installation.md
@@ -0,0 +1,76 @@
+---
+sidebar_position: 1
+---
+# Installation
+
+The Fluss Rust client is published to [crates.io](https://crates.io/crates/fluss-rs) as `fluss-rs`. The crate's library name is `fluss`, so you import it with `use fluss::...`.
+
+```toml
+[dependencies]
+fluss-rs = "0.1.0"
+tokio = { version = "1", features = ["full"] }
+```
+
+## Feature Flags
+
+```toml
+[dependencies]
+# Default: memory and filesystem storage
+fluss-rs = "0.1.0"
+
+# With S3 storage support
+fluss-rs = { version = "0.1", features = ["storage-s3"] }
+
+# With OSS storage support
+fluss-rs = { version = "0.1", features = ["storage-oss"] }
+
+# All storage backends
+fluss-rs = { version = "0.1", features = ["storage-all"] }
+```
+
+Available features:
+- `storage-memory`: in-memory storage (enabled by default)
+- `storage-fs`: local filesystem storage (enabled by default)
+- `storage-s3`: Amazon S3 storage
+- `storage-oss`: Alibaba OSS storage
+- `storage-all`: all storage backends
+
+## Git or Path Dependency
+
+For development against unreleased changes:
+
+```toml
+[dependencies]
+# From Git
+fluss = { git = "https://github.com/apache/fluss-rust.git", package = "fluss-rs" }
+
+# From local path
+fluss = { path = "/path/to/fluss-rust/crates/fluss", package = "fluss-rs" }
+```
+
+> **Note:** When using `git` or `path` dependencies, the `package = "fluss-rs"` field is required so that Cargo resolves the correct package while still allowing `use fluss::...` imports.
+
+## Building from Source
+
+**Prerequisites:** Rust 1.85+, Protobuf compiler (`protoc`)
+
+```bash
+git clone https://github.com/apache/fluss-rust.git
+cd fluss-rust
+```
+
+Install `protoc`:
+
+```bash
+# macOS
+brew install protobuf
+
+# Ubuntu/Debian
+sudo apt-get install protobuf-compiler
+```
+
+Build:
+
+```bash
+cargo build --workspace --all-targets
+```
diff --git a/website/docs/table-design/merge-engines/aggregation.md b/website/docs/table-design/merge-engines/aggregation.md
index 4375404af0..71dabb654e 100644
--- a/website/docs/table-design/merge-engines/aggregation.md
+++ b/website/docs/table-design/merge-engines/aggregation.md
@@ -1166,4 +1166,4 @@ For detailed information about Exactly-Once implementation, please refer to: [FI
 - [FirstRow Merge Engine](table-design/merge-engines/first-row.md)
 - [Versioned Merge Engine](table-design/merge-engines/versioned.md)
 - [Primary Key Tables](table-design/table-types/pk-table.md)
-- [Fluss Client API](apis/java-client.md)
+- [Fluss Client API](../../apis/java/index.md)
diff --git a/website/docusaurus.config.ts b/website/docusaurus.config.ts
index 1f6225a759..1e8b4e81ad 100644
--- a/website/docusaurus.config.ts
+++ b/website/docusaurus.config.ts
@@ -325,7 +325,7 @@ const config: Config = {
     prism: {
       theme: lightTheme,
       darkTheme: darkTheme,
-      additionalLanguages: ['java', 'bash', 'scala']
+      additionalLanguages: ['java', 'bash', 'scala', 'rust', 'toml', 'cmake']
     },
     algolia: {
       appId: "X8KSGGLJW1",